comparison sam_header.xml @ 3:d6ec32ce882b draft default tip

Uploaded
author wolma
date Tue, 28 Mar 2017 04:34:04 -0400
parents
children
comparison
equal deleted inserted replaced
2:7f7028112439 3:d6ec32ce882b
1 <tool id="ngs_run_annotation" name="NGS Run Annotation" version="0.1.7.3">
2 <description>Create a SAM format header from run metadata for sample annotation.</description>
3 <macros>
4 <import>toolshed_macros.xml</import>
5 </macros>
6 <expand macro="requirements" />
7 <version_command>mimodd version -q</version_command>
8 <command>
9 mimodd header
10
11 --rg-id "$rg_id"
12 --rg-sm "$rg_sm"
13
14 #if $str($rg_cn):
15 --rg-cn "$rg_cn"
16 #end if
17 #if $str($rg_ds):
18 --rg-ds "$rg_ds"
19 #end if
20 #if $str($rg_date):
21 --rg-dt "$rg_date"
22 #end if
23 #if $str($rg_lb):
24 --rg-lb "$rg_lb"
25 #end if
26 #if $str($rg_pl):
27 --rg-pl "$rg_pl"
28 #end if
29 #if $str($rg_pi):
30 --rg-pi "$rg_pi"
31 #end if
32 #if $str($rg_pu):
33 --rg-pu "$rg_pu"
34 #end if
35
36 --ofile "$outputfile"
37
38 </command>
39
40 <inputs>
41 <param label="read-group ID (required)" name="rg_id" size="80" type="text">
42 <sanitizer invalid_char="">
43 <valid initial="string.printable">
44 <remove value="&quot;" />
45 </valid>
46 <mapping initial="none">
47 <add source="&quot;" target="\&quot;" />
48 </mapping>
49 </sanitizer>
50 </param>
51 <param label="sample name (required)" name="rg_sm" size="80" type="text">
52 <sanitizer invalid_char="">
53 <valid initial="string.printable">
54 <remove value="&quot;" />
55 </valid>
56 <mapping initial="none">
57 <add source="&quot;" target="\&quot;" />
58 </mapping>
59 </sanitizer>
60 </param>
61 <param label="description" name="rg_ds" size="80" type="text">
62 <sanitizer invalid_char="">
63 <valid initial="string.printable">
64 <remove value="&quot;" />
65 </valid>
66 <mapping initial="none">
67 <add source="&quot;" target="\&quot;" />
68 </mapping>
69 </sanitizer>
70 </param>
71 <param label="date (YYYY-MM-DD) the run was produced" name="rg_date" type="text" />
72 <param label="name of sequencing center" name="rg_cn" size="80" type="text">
73 <sanitizer invalid_char="">
74 <valid initial="string.printable">
75 <remove value="&quot;" />
76 </valid>
77 <mapping initial="none">
78 <add source="&quot;" target="\&quot;" />
79 </mapping>
80 </sanitizer>
81 </param>
82 <param label="read-group library" name="rg_lb" size="80" type="text">
83 <sanitizer invalid_char="">
84 <valid initial="string.printable">
85 <remove value="&quot;" />
86 </valid>
87 <mapping initial="none">
88 <add source="&quot;" target="\&quot;" />
89 </mapping>
90 </sanitizer>
91 </param>
92 <param label="platform/technology used to produce the reads" name="rg_pl" type="text" />
93 <param label="predicted median insert size" name="rg_pi" type="text" />
94 <param label="platform unit; unique identifier" name="rg_pu" size="80" type="text">
95 <sanitizer invalid_char="">
96 <valid initial="string.printable">
97 <remove value="&quot;" />
98 </valid>
99 <mapping initial="none">
100 <add source="&quot;" target="\&quot;" />
101 </mapping>
102 </sanitizer>
103 </param>
104 </inputs>
105
106 <outputs>
107 <data format="sam" label="${rg_sm} (${rg_id}) header information from MiModd ${tool.name} on ${on_string}" name="outputfile" />
108 </outputs>
109
110 <help>
111 .. class:: infomark
112
113 **What it does**
114
115 This tool takes the user-provided information about a next-generation sequencing run and constructs a valid header in the SAM file format from it.
116
117 The result file can be used by the tools *Convert* and *Reheader* or in the *SNAP Read Alignment* step to add run metadata to sequenced reads files (or to overwrite pre-existing information).
118
119 **Note:**
120
121 **MiModD requires run metadata for every input file at the Alignment step !**
122
123 **Tip:**
124
125 While you can do Alignments from fastq file format by providing a custom header file directly to the *SNAP Read Alignment* tool, we **recommend** you to first convert all input files to and archive all datasets in SAM/BAM format with appropriate header information prior to any downstream analysis. Although a bit more time-consuming, this practice protects against information loss and ensures that the input datasets will remain useful for others in the future.
126
127 </help>
128 </tool>