annotate sam_header.xml @ 3:d6ec32ce882b draft default tip

Uploaded
author wolma
date Tue, 28 Mar 2017 04:34:04 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
1 <tool id="ngs_run_annotation" name="NGS Run Annotation" version="0.1.7.3">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
2 <description>Create a SAM format header from run metadata for sample annotation.</description>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
3 <macros>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
4 <import>toolshed_macros.xml</import>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
5 </macros>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
6 <expand macro="requirements" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
7 <version_command>mimodd version -q</version_command>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
8 <command>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
9 mimodd header
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
10
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
11 --rg-id "$rg_id"
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
12 --rg-sm "$rg_sm"
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
13
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
14 #if $str($rg_cn):
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
15 --rg-cn "$rg_cn"
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
16 #end if
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
17 #if $str($rg_ds):
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
18 --rg-ds "$rg_ds"
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
19 #end if
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
20 #if $str($rg_date):
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
21 --rg-dt "$rg_date"
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
22 #end if
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
23 #if $str($rg_lb):
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
24 --rg-lb "$rg_lb"
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
25 #end if
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
26 #if $str($rg_pl):
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
27 --rg-pl "$rg_pl"
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
28 #end if
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
29 #if $str($rg_pi):
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
30 --rg-pi "$rg_pi"
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
31 #end if
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
32 #if $str($rg_pu):
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
33 --rg-pu "$rg_pu"
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
34 #end if
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
35
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
36 --ofile "$outputfile"
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
37
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
38 </command>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
39
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
40 <inputs>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
41 <param label="read-group ID (required)" name="rg_id" size="80" type="text">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
42 <sanitizer invalid_char="">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
43 <valid initial="string.printable">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
44 <remove value="&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
45 </valid>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
46 <mapping initial="none">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
47 <add source="&quot;" target="\&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
48 </mapping>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
49 </sanitizer>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
50 </param>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
51 <param label="sample name (required)" name="rg_sm" size="80" type="text">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
52 <sanitizer invalid_char="">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
53 <valid initial="string.printable">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
54 <remove value="&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
55 </valid>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
56 <mapping initial="none">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
57 <add source="&quot;" target="\&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
58 </mapping>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
59 </sanitizer>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
60 </param>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
61 <param label="description" name="rg_ds" size="80" type="text">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
62 <sanitizer invalid_char="">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
63 <valid initial="string.printable">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
64 <remove value="&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
65 </valid>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
66 <mapping initial="none">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
67 <add source="&quot;" target="\&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
68 </mapping>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
69 </sanitizer>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
70 </param>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
71 <param label="date (YYYY-MM-DD) the run was produced" name="rg_date" type="text" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
72 <param label="name of sequencing center" name="rg_cn" size="80" type="text">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
73 <sanitizer invalid_char="">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
74 <valid initial="string.printable">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
75 <remove value="&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
76 </valid>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
77 <mapping initial="none">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
78 <add source="&quot;" target="\&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
79 </mapping>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
80 </sanitizer>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
81 </param>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
82 <param label="read-group library" name="rg_lb" size="80" type="text">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
83 <sanitizer invalid_char="">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
84 <valid initial="string.printable">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
85 <remove value="&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
86 </valid>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
87 <mapping initial="none">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
88 <add source="&quot;" target="\&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
89 </mapping>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
90 </sanitizer>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
91 </param>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
92 <param label="platform/technology used to produce the reads" name="rg_pl" type="text" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
93 <param label="predicted median insert size" name="rg_pi" type="text" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
94 <param label="platform unit; unique identifier" name="rg_pu" size="80" type="text">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
95 <sanitizer invalid_char="">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
96 <valid initial="string.printable">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
97 <remove value="&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
98 </valid>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
99 <mapping initial="none">
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
100 <add source="&quot;" target="\&quot;" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
101 </mapping>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
102 </sanitizer>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
103 </param>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
104 </inputs>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
105
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
106 <outputs>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
107 <data format="sam" label="${rg_sm} (${rg_id}) header information from MiModd ${tool.name} on ${on_string}" name="outputfile" />
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
108 </outputs>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
109
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
110 <help>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
111 .. class:: infomark
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
112
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
113 **What it does**
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
114
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
115 This tool takes the user-provided information about a next-generation sequencing run and constructs a valid header in the SAM file format from it.
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
116
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
117 The result file can be used by the tools *Convert* and *Reheader* or in the *SNAP Read Alignment* step to add run metadata to sequenced reads files (or to overwrite pre-existing information).
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
118
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
119 **Note:**
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
120
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
121 **MiModD requires run metadata for every input file at the Alignment step!**
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
122
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
123 **Tip:**
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
124
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
125 While you can do alignments from the fastq file format by providing a custom header file directly to the *SNAP Read Alignment* tool, we **recommend** that you first convert all input files to SAM/BAM format, and archive all datasets in that format, with appropriate header information prior to any downstream analysis. Although a bit more time-consuming, this practice protects against information loss and ensures that the input datasets will remain useful for others in the future.
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
126
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
127 </help>
d6ec32ce882b Uploaded
wolma
parents:
diff changeset
128 </tool>