comparison tmap_wrapper_0.3.3/tmap_wrapper.xml @ 2:e2640d81157a default tip

* moving to TMAP 0.3.3
author Nils Homer <nilshomer@gmail.com>
date Sun, 26 Feb 2012 20:28:27 -0500
parents tmap_wrapper_0.0.19/tmap_wrapper.xml@de2efe4dda3f
children
comparison
equal deleted inserted replaced
1:d18b5f2ada22 2:e2640d81157a
1 <tool id="tmap_wrapper" name="Map with TMAP" version="0.3.3">
2 <description>for Ion Torrent</description>
3 <parallelism method="basic"></parallelism>
4 <command interpreter="python">
5 tmap_wrapper.py
6
7 ## reference source
8 --fileSource=$genomeSource.refGenomeSource
9 #if $genomeSource.refGenomeSource == "history":
10 ##build index on the fly
11 --ref="${genomeSource.ownFile}"
12 --dbkey=$dbkey
13 #else:
14 ##use precomputed indexes
15 --ref="${ filter( lambda x: str( x[0] ) == str( $genomeSource.indices ), $__app__.tool_data_tables[ 'tmap_indexes' ].get_fields() )[0][-1] }"
16 --do_not_build_index
17 #end if
18
19 ## input SFF/fastq
20 --input=$inputs.input
21 --inputtype=$inputs.inputtype
22
23 ## output file
24 --output=$output
25
26 ## run parameters
27 --params=$params.source_select
28 #if $params.source_select != "pre_set":
29 --algorithm=$params.algorithm
30 --globalOptions=$params.globalOptions
31 --flowspaceOptions=$params.flowspaceOptions
32 --pairingOptions=$params.pairingOptions
33 --algorithmOptions=$params.algorithmOptions
34 --threads=$params.threads
35 #else:
36 --algorithm=''
37 --globalOptions=''
38 --flowspaceOptions=''
39 --pairingOptions=''
40 --algorithmOptions=''
41 --threads="4"
42 #end if
43
44 ## suppress output SAM header
45 --suppressHeader=$suppressHeader
46 </command>
47 <requirements>
48 <requirement type='package'>tmap</requirement>
49 </requirements>
50 <inputs>
51 <conditional name="genomeSource">
52 <param name="refGenomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?">
53 <option value="indexed">Use a built-in index</option>
54 <option value="history">Use one from the history</option>
55 </param>
56 <when value="indexed">
57 <param name="indices" type="select" label="Select a reference genome">
58 <options from_data_table="tmap_indexes">
59 <filter type="sort_by" column="3" />
60 <validator type="no_options" message="No indexes are available for the selected input dataset" />
61 </options>
62 </param>
63 </when>
64 <when value="history">
65 <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select a reference from history" />
66 </when>
67 </conditional>
68 <conditional name="inputs">
69 <param name="source_select" type="select" label="The input type" help="The input type" >
70 <option value="fastq">FASTQ</option>
71 <option value="sff">SFF</option>
72 </param>
73 <when value="fastq">
74 <param name="input" type="data" value="" format="fastqsanger" label="FASTQ file" help="Must have Sanger-scaled quality values with ASCII offset 33" />
75 <param name="inputtype" type="text" value="fastq" label="the input type (do not modify)"/>
76 </when>
77 <when value="sff">
78 <param name="input" type="data" value="" format="sff" label="SFF file" help="Must be a SFF file" />
79 <param name="inputtype" type="text" value="sff" label="the input type (do not modify)"/>
80 </when>
81 </conditional>
82 <conditional name="params">
83 <param name="source_select" type="select" label="TMAP settings to use" help="For most mapping needs use Commonly Used settings. If you want full control use Full Parameter List">
84 <option value="pre_set">Commonly Used</option>
85 <option value="full">Full Parameter List</option>
86 </param>
87 <when value="pre_set" />
88 <when value="full">
89 <param name="algorithm" type="select" label="The main algorithm to use">
90 <option value="mapall" selected="true">mapall</option>
91 <option value="map1" selected="false">map1</option>
92 <option value="map2" selected="false">map2</option>
93 <option value="map3" selected="false">map3</option>
94 <option value="map4" selected="false">map4</option>
95 </param>
96 <param name="threads" type="integer" value="4" label="The number of threads (-n)" />
97 <param name="globalOptions" type="text" value="" label="The global options" />
98 <param name="flowspaceOptions" type="text" value="" label="The flowspace options" />
99 <param name="pairingOptions" type="text" value="" label="The pairing options" />
100 <param name="algorithmOptions" type="text" value="" label="The algorithm options" />
101 </when>
102 </conditional>
103 <param name="suppressHeader" type="boolean" truevalue="true" falsevalue="false" checked="true" label="Suppress the header in the output SAM file" help="TMAP produces SAM with several lines of header information" />
104 </inputs>
105 <outputs>
106 <data format="sam" name="output" label="${tool.name} on ${on_string}: mapped reads">
107 <actions>
108 <conditional name="genomeSource.refGenomeSource">
109 <when value="indexed">
110 <action type="metadata" name="dbkey">
111 <option type="from_data_table" name="tmap_indexes" column="0">
112 <filter type="param_value" ref="genomeSource.indices" column="1"/>
113 </option>
114 </action>
115 </when>
116 </conditional>
117 </actions>
118 </data>
119 </outputs>
120 <help>
121
122 **What it does**
123
124 See the TMAP manual for more information.
125
126 It combines multiple mapping algorithms to give sensitive and accurate alignments quickly. It uses three core algorithms, BWA-short, BWA-long, and a variant of the SSAHA algorithm. These algorithms are described in the following publications:
127 - Li, H. and Durbin, R. (2009). Fast and accurate short read alignment with Burrows-Wheeler transform. Bioinformatics, 25, 1754–1760.
128 - Li, H. and Durbin, R. (2010). Fast and accurate long-read alignment with Burrows-Wheeler
129 - Ning, Z., Cox, A., and Mullikin, J. (2001). SSAHA: a fast search method for large DNA databases. Genome Res., 11, 1725–1729.
130
131 ------
132
133 **Know what you are doing**
134
135 .. class:: warningmark
136
137 There is no such thing (yet) as an automated gearshift in short read mapping. It is all like stick-shift driving in San Francisco. In other words = running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy.
138
139 .. __: http://github.com/iontorrent/TMAP
140
141 ------
142
143 **Input formats**
144
145 TMAP accepts files in Sanger FASTQ format. Use the FASTQ Groomer to prepare your files. TMAP also accepts SFF files.
146
147 ------
148
149 **A Note on Built-in Reference Genomes**
150
151 Some genomes have multiple variants. If only one "type" of genome is listed, it is the Full version, which means that everything that came in the original genome data download (possibly with mitochondrial and plasmid DNA added if it wasn't already included). The Full version is available for every genome. Some genomes also come in the Canonical variant, which contains only the "canonical" (well-defined) chromosomes or segments, such as chr1-chr22, chrX, chrY, and chrM for human. Other variations include gender. These will come in the canonical form only, so the general Canonical variant is actually Canonical Female and the other is Canonical Male (identical to female excluding chrX).
152
153 ------
154
155 **Outputs**
156
157 The output is in SAM format, and has the following columns::
158
159 Column Description
160 -------- --------------------------------------------------------
161 1 QNAME Query (pair) NAME
162 2 FLAG bitwise FLAG
163 3 RNAME Reference sequence NAME
164 4 POS 1-based leftmost POSition/coordinate of clipped sequence
165 5 MAPQ MAPping Quality (Phred-scaled)
166 6 CIGAR extended CIGAR string
167 7 MRNM Mate Reference sequence NaMe ('=' if same as RNAME)
168 8 MPOS 1-based Mate POSition
169 9 ISIZE Inferred insert SIZE
170 10 SEQ query SEQuence on the same strand as the reference
171 11 QUAL query QUALity (ASCII-33 gives the Phred base quality)
172 12 OPT variable OPTional fields in the format TAG:VTYPE:VALU
173
174 The flags are as follows::
175
176 Flag Description
177 ------ -------------------------------------
178 0x0001 the read is paired in sequencing
179 0x0002 the read is mapped in a proper pair
180 0x0004 the query sequence itself is unmapped
181 0x0008 the mate is unmapped
182 0x0010 strand of the query (1 for reverse)
183 0x0020 strand of the mate
184 0x0040 the read is the first read in a pair
185 0x0080 the read is the second read in a pair
186 0x0100 the alignment is not primary
187
188 It looks like this (scroll sideways to see the entire example)::
189
190 QNAME FLAG RNAME POS MAPQ CIAGR MRNM MPOS ISIZE SEQ QUAL OPT
191 HWI-EAS91_1_30788AAXX:1:1:1761:343 4 * 0 0 * * 0 0 AAAAAAANNAAAAAAAAAAAAAAAAAAAAAAAAAAACNNANNGAGTNGNNNNNNNGCTTCCCACAGNNCTGG hhhhhhh;;hhhhhhhhhhh^hOhhhhghhhfhhhgh;;h;;hhhh;h;;;;;;;hhhhhhghhhh;;Phhh
192 HWI-EAS91_1_30788AAXX:1:1:1578:331 4 * 0 0 * * 0 0 GTATAGANNAATAAGAAAAAAAAAAATGAAGACTTTCNNANNTCTGNANNNNNNNTCTTTTTTCAGNNGTAG hhhhhhh;;hhhhhhhhhhhhhhhhhhhhhhhhhhhh;;h;;hhhh;h;;;;;;;hhhhhhhhhhh;;hhVh
193
194 -------
195
196 **TMAP settings**
197
198 All of the options have a default value. You can change most of them. Most of the options in TMAP have been implemented here.
199
200
201 </help>
202 </tool>
203
204