comparison bismark_bowtie_wrapper.xml @ 18:862fb59a9a25 draft

Uploaded
author bgruening
date Mon, 14 Apr 2014 16:42:38 -0400
parents 73508c5b4273
children 30caca800c9b
comparison
equal deleted inserted replaced
17:73508c5b4273 18:862fb59a9a25
1 <tool id="bismark_bowtie" name="Bismark" version="0.7.7.3"> 1 <tool id="bismark_bowtie" name="Bismark" version="0.10.0">
2 <!-- Wrapper compatible with Bismark version 0.7.7 --> 2 <!-- Wrapper compatible with Bismark version 0.10 -->
3 <description>bisulfite mapper (bowtie)</description> 3 <description>bisulfite mapper (bowtie)</description>
4 <!--<version_command>bismark version</version_command>--> 4 <!--<version_command>bismark version</version_command>-->
5 <requirements> 5 <requirements>
6 <requirement type="set_environment">SCRIPT_PATH</requirement> 6 <requirement type="set_environment">SCRIPT_PATH</requirement>
7 <requirement type="package" version="0.1.19">samtools</requirement>
7 <requirement type="package" version="0.12.8">bowtie</requirement> 8 <requirement type="package" version="0.12.8">bowtie</requirement>
8 <requirement type="package" version="2.0.0-beta7">bowtie2</requirement>
9 </requirements> 9 </requirements>
10 <parallelism method="basic"></parallelism> 10 <parallelism method="basic"></parallelism>
11 <command interpreter="python"> 11 <command interpreter="python">
12 bismark_wrapper.py 12 bismark_wrapper.py
13
14 ## Change this to accommodate the number of threads you have available.
15 --num-threads 4
16 13
17 --bismark_path \$SCRIPT_PATH 14 --bismark_path \$SCRIPT_PATH
18 15
19 ## 16 ##
20 ## Bismark Genome Preparation, if desired. 17 ## Bismark Genome Preparation, if desired.
43 --fastq 40 --fastq
44 #elif $singlePaired.input_singles.ext == "fasta": 41 #elif $singlePaired.input_singles.ext == "fasta":
45 --fasta 42 --fasta
46 #end if 43 #end if
47 #else: 44 #else:
48 --mate-paired 45 --mate-paired
49 --mate1 $singlePaired.input_mate1 46 #set $mate1 = list()
50 --mate2 $singlePaired.input_mate2 47 #set $mate2 = list()
51 48 #for $mate_pair in $singlePaired.mate_list
52 #if $singlePaired.input_mate1.ext == "fastqillumina": 49 $mate1.append( str($mate_pair.input_mate1) )
50 $mate2.append( str($mate_pair.input_mate2) )
51 #end for
52
53 --mate1 #echo ','.join($mate1)
54 --mate2 #echo ','.join($mate2)
55
56 #if $singlePaired.mate_list[0].input_mate1.ext == "fastqillumina":
53 --phred64-quals 57 --phred64-quals
54 --fastq 58 --fastq
55 #elif $singlePaired.input_mate1.ext == "fastqsanger": 59 #elif $singlePaired.mate_list[0].input_mate1.ext == "fastqsanger":
56 --fastq 60 --fastq
57 #elif $singlePaired.input_mate1.ext == "fasta": 61 #elif $singlePaired.mate_list[0].input_mate1.ext == "fasta":
58 --fasta 62 --fasta
59 #end if 63 #end if
60 64
61 -I $singlePaired.minInsert 65 -I $singlePaired.minInsert
62 -X $singlePaired.maxInsert 66 -X $singlePaired.maxInsert
83 #end if 87 #end if
84 #if $params.skip_reads != 0: 88 #if $params.skip_reads != 0:
85 --skip-reads $params.skip_reads 89 --skip-reads $params.skip_reads
86 #end if 90 #end if
87 91
88 ###if str($params.isReportOutput) == "yes": 92 #if $params.bismark_stdout:
89 ## --output-report-file $report_file 93 --stdout $output_stdout
90 ###end if 94 #end if
95
96 #if $params.isReportOutput:
97 --output-report-file $report_file
98 #end if
91 99
92 #end if 100 #end if
93 101
94 ## 102 ##
95 ## Output parameters. 103 ## Output parameters.
96 ## 104 ##
97 --output $output 105 --output $output
98 $suppress_header 106 ##$suppress_header
99 107
100 #if str( $singlePaired.sPaired ) == "single" 108 #if str( $singlePaired.sPaired ) == "single"
101 #if $output_unmapped_reads_l 109 #if $output_unmapped_reads_l
102 --output-unmapped-reads $output_unmapped_reads_l 110 --output-unmapped-reads $output_unmapped_reads_l
103 #end if 111 #end if
121 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options"> 129 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options">
122 <option value="indexed">Use a built-in index</option> 130 <option value="indexed">Use a built-in index</option>
123 <option value="history">Use one from the history</option> 131 <option value="history">Use one from the history</option>
124 </param> 132 </param>
125 <when value="indexed"> 133 <when value="indexed">
126 <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact your Galaxy admin"> 134 <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact your Galaxy admin.">
127 <options from_data_table="bowtie_indexes"> 135 <options from_data_table="bowtie_indexes">
128 <filter type="sort_by" column="2"/> 136 <filter type="sort_by" column="2"/>
129 <validator type="no_options" message="No indexes are available for the selected input dataset"/> 137 <validator type="no_options" message="No indexes are available for the selected input dataset"/>
130 </options> 138 </options>
131 </param> 139 </param>
143 </param> 151 </param>
144 <when value="single"> 152 <when value="single">
145 <param name="input_singles" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." /> 153 <param name="input_singles" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
146 </when> 154 </when>
147 <when value="paired"> 155 <when value="paired">
148 <param name="input_mate1" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." /> 156 <repeat name="mate_list" title="Paired End Pairs" min="1">
149 <param name="input_mate2" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." /> 157 <param name="input_mate1" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="Mate pair 1" help="FASTQ or FASTA files." />
158 <param name="input_mate2" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="Mate pair 2" help="FASTQ or FASTA files." />
159 </repeat>
150 <param name="minInsert" type="integer" value="0" label="Minimum insert size for valid paired-end alignments" /> 160 <param name="minInsert" type="integer" value="0" label="Minimum insert size for valid paired-end alignments" />
151 <param name="maxInsert" type="integer" value="250" label="Maximum insert size for valid paired-end alignments" /> 161 <param name="maxInsert" type="integer" value="500" label="Maximum insert size for valid paired-end alignments" />
152 </when> 162 </when>
153 </conditional> 163 </conditional>
154 164
155 165
156 <conditional name="params"> 166 <conditional name="params">
160 </param> 170 </param>
161 <when value="default" /> 171 <when value="default" />
162 <!-- Full/advanced params. --> 172 <!-- Full/advanced params. -->
163 <when value="custom"> 173 <when value="custom">
164 <!-- -n --> 174 <!-- -n -->
165 <param name="seed_mismatches" type="select" label="The maximum number of mismatches permitted in the 'seed'."> 175 <param name="seed_mismatches" type="select" label="The maximum number of mismatches permitted in the 'seed'">
166 <option value="0">0</option> 176 <option value="0">0</option>
167 <option value="1">1</option> 177 <option value="1">1</option>
168 <option value="2" selected="true">2</option> 178 <option value="2" selected="true">2</option>
169 <option value="3">3</option> 179 <option value="3">3</option>
170 </param> 180 </param>
171 <!-- -l --> 181 <!-- -l -->
172 <param name="seed_len" type="integer" value="28" label="The 'seed length'; The number of bases of the high quality end of the read to which the maximum number of mismatches applies." /> 182 <param name="seed_len" type="integer" value="28" label="The 'seed length'; The number of bases of the high quality end of the read to which the maximum number of mismatches applies" />
173 <!-- 183 <!--
174 <param name="maqerr" type="integer" value="70" label="Maximum permitted total of quality values at all mismatched read positions throughout the entire alignment, not just in the 'seed'." /> 184 <param name="maqerr" type="integer" value="70" label="Maximum permitted total of quality values at all mismatched read positions throughout the entire alignment, not just in the 'seed'." />
175 --> 185 -->
176 <param name="qupto" type="integer" value="0" label="Only aligns the first N reads or read pairs from the input" help="Default is 0 and means 'no-limit'." /> 186 <param name="qupto" type="integer" value="0" label="Only aligns the first N reads or read pairs from the input" help="Default is 0 and means 'no-limit'." />
177 <param name="skip_reads" type="integer" value="0" label="Skip (i.e. do not align) the first N reads or read pairs from the input" /> 187 <param name="skip_reads" type="integer" value="0" label="Skip (i.e. do not align) the first N reads or read pairs from the input" />
178 188
179 <param name="suppressed_read_file" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Write ambiguous reads to an extra output file." help="Write all reads which produce more than one valid alignment with the same number of lowest mismatches or other reads that fail to align uniquely." /> 189 <param name="suppressed_read_file" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Write ambiguous reads to an extra output file" help="Write all reads which produce more than one valid alignment with the same number of lowest mismatches or other reads that fail to align uniquely." />
180 <param name="unmapped_read_file" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Write all reads that could not be aligned to a file" /> 190 <param name="unmapped_read_file" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Write all reads that could not be aligned to a file" />
181 <!-- output Options --> 191 <!-- output Options -->
182 <!-- 192 <param name="bismark_stdout" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Write the bismark output and summary information to an extra file" />
183 <param name="isReportOutput" type="select" label="Offer all report files concatenated in one file."> 193 <param name="isReportOutput" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Offer all report files concatenated in one file" />
184 <option value="yes">yes</option>
185 <option value="no">no</option>
186 </param>
187 -->
188 <!--end output options --> 194 <!--end output options -->
189 </when> <!-- full --> 195 </when> <!-- full -->
190 </conditional> <!-- params --> 196 </conditional> <!-- params -->
191 <param name="suppress_header" type="boolean" truevalue="--suppress-header" falsevalue="" checked="False" label="Suppress the header in the output SAM file" help="Bowtie produces SAM with several lines of header information by default" /> 197 <!--
198 <param name="suppress_header" type="boolean" truevalue="..suppress-header" falsevalue="" checked="false" label="Suppress the header in the output SAM file" help="Bowtie produces SAM with several lines of header information by default." />
199 -->
192 </inputs> 200 </inputs>
193 <outputs> 201 <outputs>
194 <!-- that does not work
195 <data format="txt" name="report_file" label="${tool.name} on ${on_string}: Report"> 202 <data format="txt" name="report_file" label="${tool.name} on ${on_string}: Report">
196 <filter>str($params.isReportOutput) == "yes"</filter> 203 <filter>
204 ((
205 params['settingsType'] == "custom" and
206 params['isReportOutput'] is True
207 ))
208 </filter>
197 </data> 209 </data>
198 --> 210 <data format="txt" name="output_stdout" label="${tool.name} on ${on_string}: Summary">
199 <data format="sam" name="output" label="${tool.name} on ${on_string}: mapped reads"> 211 <filter>
212 ((
213 params['settingsType'] == "custom" and
214 params['bismark_stdout'] is True
215 ))
216 </filter>
217 </data>
218
219 <data format="bam" name="output" label="${tool.name} on ${on_string}: mapped reads">
200 <actions> 220 <actions>
201 <conditional name="refGenomeSource.genomeSource"> 221 <conditional name="refGenomeSource.genomeSource">
202 <when value="indexed"> 222 <when value="indexed">
203 <action type="metadata" name="dbkey"> 223 <action type="metadata" name="dbkey">
204 <option type="from_data_table" name="bowtie2_indexes" column="1" offset="0"> 224 <option type="from_data_table" name="bowtie2_indexes" column="1" offset="0">
230 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> 250 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
231 </action> 251 </action>
232 </when> 252 </when>
233 <when value="paired"> 253 <when value="paired">
234 <action type="format"> 254 <action type="format">
235 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" /> 255 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" />
236 </action> 256 </action>
237 </when> 257 </when>
238 </conditional> 258 </conditional>
239 </actions> 259 </actions>
240 </data> 260 </data>
250 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> 270 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
251 </action> 271 </action>
252 </when> 272 </when>
253 <when value="paired"> 273 <when value="paired">
254 <action type="format"> 274 <action type="format">
255 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" /> 275 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" />
256 </action> 276 </action>
257 </when> 277 </when>
258 </conditional> 278 </conditional>
259 </actions> 279 </actions>
260 </data> 280 </data>
274 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> 294 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
275 </action> 295 </action>
276 </when> 296 </when>
277 <when value="paired"> 297 <when value="paired">
278 <action type="format"> 298 <action type="format">
279 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" /> 299 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" />
280 </action> 300 </action>
281 </when> 301 </when>
282 </conditional> 302 </conditional>
283 </actions> 303 </actions>
284 </data> 304 </data>
293 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> 313 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
294 </action> 314 </action>
295 </when> 315 </when>
296 <when value="paired"> 316 <when value="paired">
297 <action type="format"> 317 <action type="format">
298 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" /> 318 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" />
299 </action> 319 </action>
300 </when> 320 </when>
301 </conditional> 321 </conditional>
302 </actions> 322 </actions>
303 </data> 323 </data>
335 .. class:: warningmark 355 .. class:: warningmark
336 356
337 There is no such thing (yet) as an automated gearshift in short read mapping. It is all like stick-shift driving in San Francisco. In other words = running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy. 357 There is no such thing (yet) as an automated gearshift in short read mapping. It is all like stick-shift driving in San Francisco. In other words = running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy.
338 358
339 .. __: http://www.bioinformatics.babraham.ac.uk/projects/bismark/ 359 .. __: http://www.bioinformatics.babraham.ac.uk/projects/bismark/
360
361
362 .. class:: warningmark
363
364 Make sure all your input reads are in the correct and same format. If thats not the case please adjust/convert the filetype with galaxy's build-in converters.
340 365
341 ------ 366 ------
342 367
343 **Input formats** 368 **Input formats**
344 369
398 423
399 ------ 424 ------
400 425
401 **Bismark parameter list** 426 **Bismark parameter list**
402 427
403 This is an exhaustive list of Bismark options: 428 This is an exhaustive list of Bismark options.
404
405 ------
406
407 **OPTIONS**
408
409 429
410 Input:: 430 Input::
411 431
412 --singles A comma- or space-separated list of files containing the reads to be aligned (e.g. 432 --singles A comma- or space-separated list of files containing the reads to be aligned (e.g.
413 lane1.fq,lane2.fq lane3.fq). Reads may be a mix of different lengths. Bismark will 433 lane1.fq,lane2.fq lane3.fq). Reads may be a mix of different lengths. Bismark will
524 544
525 --temp_dir DIR Write temporary files to this directory instead of into the same directory as the input files. If 545 --temp_dir DIR Write temporary files to this directory instead of into the same directory as the input files. If
526 the specified folder does not exist, Bismark will attempt to create it first. The path to the 546 the specified folder does not exist, Bismark will attempt to create it first. The path to the
527 temporary folder can be either relative or absolute. 547 temporary folder can be either relative or absolute.
528 548
529 ------
530
531 Bowtie 2 alignment options::
532
533 -N INT Sets the number of mismatches to allowed in a seed alignment during multiseed alignment.
534 Can be set to 0 or 1. Setting this higher makes alignment slower (often much slower)
535 but increases sensitivity. Default: 0. This option is only available for Bowtie 2 (for
536 Bowtie 1 see -n).
537
538 -L INT Sets the length of the seed substrings to align during multiseed alignment. Smaller values
539 make alignment slower but more senstive. Default: the --sensitive preset of Bowtie 2 is
540 used by default, which sets -L to 20. This option is only available for Bowtie 2 (for
541 Bowtie 1 see -l).
542
543 --ignore-quals When calculating a mismatch penalty, always consider the quality value at the mismatched
544 position to be the highest possible, regardless of the actual value. I.e. input is treated
545 as though all quality values are high. This is also the default behavior when the input
546 doesn't specify quality values (e.g. in -f mode). This option is invariable and on by default.
547
548
549 Bowtie 2 paired-end options::
550
551 --no-mixed This option disables Bowtie 2's behavior to try to find alignments for the individual mates if
552 it cannot find a concordant or discordant alignment for a pair. This option is invariable and
553 and on by default.
554
555 --no-discordant Normally, Bowtie 2 looks for discordant alignments if it cannot find any concordant alignments.
556 A discordant alignment is an alignment where both mates align uniquely, but that does not
557 satisfy the paired-end constraints (--fr/--rf/--ff, -I, -X). This option disables that behavior
558 and it is on by default.
559
560
561 Bowtie 2 effort options::
562
563 -D INT Up to INT consecutive seed extension attempts can "fail" before Bowtie 2 moves on, using
564 the alignments found so far. A seed extension "fails" if it does not yield a new best or a
565 new second-best alignment. Default: 15.
566
567 -R INT INT is the maximum number of times Bowtie 2 will "re-seed" reads with repetitive seeds.
568 When "re-seeding," Bowtie 2 simply chooses a new set of reads (same length, same number of
569 mismatches allowed) at different offsets and searches for more alignments. A read is considered
570 to have repetitive seeds if the total number of seed hits divided by the number of seeds
571 that aligned at least once is greater than 300. Default: 2.
572
573
574 Bowtie 2 Scoring options::
575
576 --score_min "func" Sets a function governing the minimum alignment score needed for an alignment to be considered
577 "valid" (i.e. good enough to report). This is a function of read length. For instance, specifying
578 L,0,-0.2 sets the minimum-score function f to f(x) = 0 + -0.2 * x, where x is the read length.
579 See also: setting function options at http://bowtie-bio.sourceforge.net/bowtie2. The default is
580 L,0,-0.2.
581
582
583 Bowtie 2 Reporting options::
584
585 --most_valid_alignments INT This used to be the Bowtie 2 parameter -M. As of Bowtie 2 version 2.0.0 beta7 the option -M is
586 deprecated. It will be removed in subsequent versions. What used to be called -M mode is still the
587 default mode, but adjusting the -M setting is deprecated. Use the -D and -R options to adjust the
588 effort expended to find valid alignments.
589
590 For reference, this used to be the old (now deprecated) description of -M:
591 Bowtie 2 searches for at most INT+1 distinct, valid alignments for each read. The search terminates when it
592 can't find more distinct valid alignments, or when it finds INT+1 distinct alignments, whichever
593 happens first. Only the best alignment is reported. Information from the other alignments is used to
594 estimate mapping quality and to set SAM optional fields, such as AS:i and XS:i. Increasing -M makes
595 Bowtie 2 slower, but increases the likelihood that it will pick the correct alignment for a read that
596 aligns many places. For reads that have more than INT+1 distinct, valid alignments, Bowtie 2 does not
597 guarantee that the alignment reported is the best possible in terms of alignment score. -M is
598 always used and its default value is set to 10.
599
600 </help> 549 </help>
601 </tool> 550 </tool>