Mercurial > repos > bgruening > bismark
comparison bismark_bowtie_wrapper.xml @ 18:862fb59a9a25 draft
Uploaded
author | bgruening |
---|---|
date | Mon, 14 Apr 2014 16:42:38 -0400 |
parents | 73508c5b4273 |
children | 30caca800c9b |
comparison
equal
deleted
inserted
replaced
17:73508c5b4273 | 18:862fb59a9a25 |
---|---|
1 <tool id="bismark_bowtie" name="Bismark" version="0.7.7.3"> | 1 <tool id="bismark_bowtie" name="Bismark" version="0.10.0"> |
2 <!-- Wrapper compatible with Bismark version 0.7.7 --> | 2 <!-- Wrapper compatible with Bismark version 0.10 --> |
3 <description>bisulfite mapper (bowtie)</description> | 3 <description>bisulfite mapper (bowtie)</description> |
4 <!--<version_command>bismark version</version_command>--> | 4 <!--<version_command>bismark version</version_command>--> |
5 <requirements> | 5 <requirements> |
6 <requirement type="set_environment">SCRIPT_PATH</requirement> | 6 <requirement type="set_environment">SCRIPT_PATH</requirement> |
7 <requirement type="package" version="0.1.19">samtools</requirement> | |
7 <requirement type="package" version="0.12.8">bowtie</requirement> | 8 <requirement type="package" version="0.12.8">bowtie</requirement> |
8 <requirement type="package" version="2.0.0-beta7">bowtie2</requirement> | |
9 </requirements> | 9 </requirements> |
10 <parallelism method="basic"></parallelism> | 10 <parallelism method="basic"></parallelism> |
11 <command interpreter="python"> | 11 <command interpreter="python"> |
12 bismark_wrapper.py | 12 bismark_wrapper.py |
13 | |
14 ## Change this to accommodate the number of threads you have available. | |
15 --num-threads 4 | |
16 | 13 |
17 --bismark_path \$SCRIPT_PATH | 14 --bismark_path \$SCRIPT_PATH |
18 | 15 |
19 ## | 16 ## |
20 ## Bismark Genome Preparation, if desired. | 17 ## Bismark Genome Preparation, if desired. |
43 --fastq | 40 --fastq |
44 #elif $singlePaired.input_singles.ext == "fasta": | 41 #elif $singlePaired.input_singles.ext == "fasta": |
45 --fasta | 42 --fasta |
46 #end if | 43 #end if |
47 #else: | 44 #else: |
48 --mate-paired | 45 --mate-paired |
49 --mate1 $singlePaired.input_mate1 | 46 #set $mate1 = list() |
50 --mate2 $singlePaired.input_mate2 | 47 #set $mate2 = list() |
51 | 48 #for $mate_pair in $singlePaired.mate_list |
52 #if $singlePaired.input_mate1.ext == "fastqillumina": | 49 $mate1.append( str($mate_pair.input_mate1) ) |
50 $mate2.append( str($mate_pair.input_mate2) ) | |
51 #end for | |
52 | |
53 --mate1 #echo ','.join($mate1) | |
54 --mate2 #echo ','.join($mate2) | |
55 | |
56 #if $singlePaired.mate_list[0].input_mate1.ext == "fastqillumina": | |
53 --phred64-quals | 57 --phred64-quals |
54 --fastq | 58 --fastq |
55 #elif $singlePaired.input_mate1.ext == "fastqsanger": | 59 #elif $singlePaired.mate_list[0].input_mate1.ext == "fastqsanger": |
56 --fastq | 60 --fastq |
57 #elif $singlePaired.input_mate1.ext == "fasta": | 61 #elif $singlePaired.mate_list[0].input_mate1.ext == "fasta": |
58 --fasta | 62 --fasta |
59 #end if | 63 #end if |
60 | 64 |
61 -I $singlePaired.minInsert | 65 -I $singlePaired.minInsert |
62 -X $singlePaired.maxInsert | 66 -X $singlePaired.maxInsert |
83 #end if | 87 #end if |
84 #if $params.skip_reads != 0: | 88 #if $params.skip_reads != 0: |
85 --skip-reads $params.skip_reads | 89 --skip-reads $params.skip_reads |
86 #end if | 90 #end if |
87 | 91 |
88 ###if str($params.isReportOutput) == "yes": | 92 #if $params.bismark_stdout: |
89 ## --output-report-file $report_file | 93 --stdout $output_stdout |
90 ###end if | 94 #end if |
95 | |
96 #if $params.isReportOutput: | |
97 --output-report-file $report_file | |
98 #end if | |
91 | 99 |
92 #end if | 100 #end if |
93 | 101 |
94 ## | 102 ## |
95 ## Output parameters. | 103 ## Output parameters. |
96 ## | 104 ## |
97 --output $output | 105 --output $output |
98 $suppress_header | 106 ##$suppress_header |
99 | 107 |
100 #if str( $singlePaired.sPaired ) == "single" | 108 #if str( $singlePaired.sPaired ) == "single" |
101 #if $output_unmapped_reads_l | 109 #if $output_unmapped_reads_l |
102 --output-unmapped-reads $output_unmapped_reads_l | 110 --output-unmapped-reads $output_unmapped_reads_l |
103 #end if | 111 #end if |
121 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options"> | 129 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options"> |
122 <option value="indexed">Use a built-in index</option> | 130 <option value="indexed">Use a built-in index</option> |
123 <option value="history">Use one from the history</option> | 131 <option value="history">Use one from the history</option> |
124 </param> | 132 </param> |
125 <when value="indexed"> | 133 <when value="indexed"> |
126 <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact your Galaxy admin"> | 134 <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact your Galaxy admin."> |
127 <options from_data_table="bowtie_indexes"> | 135 <options from_data_table="bowtie_indexes"> |
128 <filter type="sort_by" column="2"/> | 136 <filter type="sort_by" column="2"/> |
129 <validator type="no_options" message="No indexes are available for the selected input dataset"/> | 137 <validator type="no_options" message="No indexes are available for the selected input dataset"/> |
130 </options> | 138 </options> |
131 </param> | 139 </param> |
143 </param> | 151 </param> |
144 <when value="single"> | 152 <when value="single"> |
145 <param name="input_singles" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." /> | 153 <param name="input_singles" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." /> |
146 </when> | 154 </when> |
147 <when value="paired"> | 155 <when value="paired"> |
148 <param name="input_mate1" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." /> | 156 <repeat name="mate_list" title="Paired End Pairs" min="1"> |
149 <param name="input_mate2" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." /> | 157 <param name="input_mate1" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="Mate pair 1" help="FASTQ or FASTA files." /> |
158 <param name="input_mate2" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="Mate pair 2" help="FASTQ or FASTA files." /> | |
159 </repeat> | |
150 <param name="minInsert" type="integer" value="0" label="Minimum insert size for valid paired-end alignments" /> | 160 <param name="minInsert" type="integer" value="0" label="Minimum insert size for valid paired-end alignments" /> |
151 <param name="maxInsert" type="integer" value="250" label="Maximum insert size for valid paired-end alignments" /> | 161 <param name="maxInsert" type="integer" value="500" label="Maximum insert size for valid paired-end alignments" /> |
152 </when> | 162 </when> |
153 </conditional> | 163 </conditional> |
154 | 164 |
155 | 165 |
156 <conditional name="params"> | 166 <conditional name="params"> |
160 </param> | 170 </param> |
161 <when value="default" /> | 171 <when value="default" /> |
162 <!-- Full/advanced params. --> | 172 <!-- Full/advanced params. --> |
163 <when value="custom"> | 173 <when value="custom"> |
164 <!-- -n --> | 174 <!-- -n --> |
165 <param name="seed_mismatches" type="select" label="The maximum number of mismatches permitted in the 'seed'."> | 175 <param name="seed_mismatches" type="select" label="The maximum number of mismatches permitted in the 'seed'"> |
166 <option value="0">0</option> | 176 <option value="0">0</option> |
167 <option value="1">1</option> | 177 <option value="1">1</option> |
168 <option value="2" selected="true">2</option> | 178 <option value="2" selected="true">2</option> |
169 <option value="3">3</option> | 179 <option value="3">3</option> |
170 </param> | 180 </param> |
171 <!-- -l --> | 181 <!-- -l --> |
172 <param name="seed_len" type="integer" value="28" label="The 'seed length'; The number of bases of the high quality end of the read to which the maximum number of mismatches applies." /> | 182 <param name="seed_len" type="integer" value="28" label="The 'seed length'; The number of bases of the high quality end of the read to which the maximum number of mismatches applies" /> |
173 <!-- | 183 <!-- |
174 <param name="maqerr" type="integer" value="70" label="Maximum permitted total of quality values at all mismatched read positions throughout the entire alignment, not just in the 'seed'." /> | 184 <param name="maqerr" type="integer" value="70" label="Maximum permitted total of quality values at all mismatched read positions throughout the entire alignment, not just in the 'seed'." /> |
175 --> | 185 --> |
176 <param name="qupto" type="integer" value="0" label="Only aligns the first N reads or read pairs from the input" help="Default is 0 and means 'no-limit'." /> | 186 <param name="qupto" type="integer" value="0" label="Only aligns the first N reads or read pairs from the input" help="Default is 0 and means 'no-limit'." /> |
177 <param name="skip_reads" type="integer" value="0" label="Skip (i.e. do not align) the first N reads or read pairs from the input" /> | 187 <param name="skip_reads" type="integer" value="0" label="Skip (i.e. do not align) the first N reads or read pairs from the input" /> |
178 | 188 |
179 <param name="suppressed_read_file" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Write ambiguous reads to an extra output file." help="Write all reads which produce more than one valid alignment with the same number of lowest mismatches or other reads that fail to align uniquely." /> | 189 <param name="suppressed_read_file" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Write ambiguous reads to an extra output file" help="Write all reads which produce more than one valid alignment with the same number of lowest mismatches or other reads that fail to align uniquely." /> |
180 <param name="unmapped_read_file" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Write all reads that could not be aligned to a file" /> | 190 <param name="unmapped_read_file" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Write all reads that could not be aligned to a file" /> |
181 <!-- output Options --> | 191 <!-- output Options --> |
182 <!-- | 192 <param name="bismark_stdout" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Write the bismark output and summary information to an extra file" /> |
183 <param name="isReportOutput" type="select" label="Offer all report files concatenated in one file."> | 193 <param name="isReportOutput" type="boolean" truevalue="true" falsevalue="false" checked="false" label="Offer all report files concatenated in one file" /> |
184 <option value="yes">yes</option> | |
185 <option value="no">no</option> | |
186 </param> | |
187 --> | |
188 <!--end output options --> | 194 <!--end output options --> |
189 </when> <!-- full --> | 195 </when> <!-- full --> |
190 </conditional> <!-- params --> | 196 </conditional> <!-- params --> |
191 <param name="suppress_header" type="boolean" truevalue="--suppress-header" falsevalue="" checked="False" label="Suppress the header in the output SAM file" help="Bowtie produces SAM with several lines of header information by default" /> | 197 <!-- |
198 <param name="suppress_header" type="boolean" truevalue="..suppress-header" falsevalue="" checked="false" label="Suppress the header in the output SAM file" help="Bowtie produces SAM with several lines of header information by default." /> | |
199 --> | |
192 </inputs> | 200 </inputs> |
193 <outputs> | 201 <outputs> |
194 <!-- that does not work | |
195 <data format="txt" name="report_file" label="${tool.name} on ${on_string}: Report"> | 202 <data format="txt" name="report_file" label="${tool.name} on ${on_string}: Report"> |
196 <filter>str($params.isReportOutput) == "yes"</filter> | 203 <filter> |
204 (( | |
205 params['settingsType'] == "custom" and | |
206 params['isReportOutput'] is True | |
207 )) | |
208 </filter> | |
197 </data> | 209 </data> |
198 --> | 210 <data format="txt" name="output_stdout" label="${tool.name} on ${on_string}: Summary"> |
199 <data format="sam" name="output" label="${tool.name} on ${on_string}: mapped reads"> | 211 <filter> |
212 (( | |
213 params['settingsType'] == "custom" and | |
214 params['bismark_stdout'] is True | |
215 )) | |
216 </filter> | |
217 </data> | |
218 | |
219 <data format="bam" name="output" label="${tool.name} on ${on_string}: mapped reads"> | |
200 <actions> | 220 <actions> |
201 <conditional name="refGenomeSource.genomeSource"> | 221 <conditional name="refGenomeSource.genomeSource"> |
202 <when value="indexed"> | 222 <when value="indexed"> |
203 <action type="metadata" name="dbkey"> | 223 <action type="metadata" name="dbkey"> |
204 <option type="from_data_table" name="bowtie2_indexes" column="1" offset="0"> | 224 <option type="from_data_table" name="bowtie2_indexes" column="1" offset="0"> |
230 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> | 250 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> |
231 </action> | 251 </action> |
232 </when> | 252 </when> |
233 <when value="paired"> | 253 <when value="paired"> |
234 <action type="format"> | 254 <action type="format"> |
235 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" /> | 255 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" /> |
236 </action> | 256 </action> |
237 </when> | 257 </when> |
238 </conditional> | 258 </conditional> |
239 </actions> | 259 </actions> |
240 </data> | 260 </data> |
250 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> | 270 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> |
251 </action> | 271 </action> |
252 </when> | 272 </when> |
253 <when value="paired"> | 273 <when value="paired"> |
254 <action type="format"> | 274 <action type="format"> |
255 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" /> | 275 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" /> |
256 </action> | 276 </action> |
257 </when> | 277 </when> |
258 </conditional> | 278 </conditional> |
259 </actions> | 279 </actions> |
260 </data> | 280 </data> |
274 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> | 294 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> |
275 </action> | 295 </action> |
276 </when> | 296 </when> |
277 <when value="paired"> | 297 <when value="paired"> |
278 <action type="format"> | 298 <action type="format"> |
279 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" /> | 299 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" /> |
280 </action> | 300 </action> |
281 </when> | 301 </when> |
282 </conditional> | 302 </conditional> |
283 </actions> | 303 </actions> |
284 </data> | 304 </data> |
293 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> | 313 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" /> |
294 </action> | 314 </action> |
295 </when> | 315 </when> |
296 <when value="paired"> | 316 <when value="paired"> |
297 <action type="format"> | 317 <action type="format"> |
298 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" /> | 318 <option type="from_param" name="singlePaired.mate_list[0].input_mate1" param_attribute="ext" /> |
299 </action> | 319 </action> |
300 </when> | 320 </when> |
301 </conditional> | 321 </conditional> |
302 </actions> | 322 </actions> |
303 </data> | 323 </data> |
335 .. class:: warningmark | 355 .. class:: warningmark |
336 | 356 |
337 There is no such thing (yet) as an automated gearshift in short read mapping. It is all like stick-shift driving in San Francisco. In other words = running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy. | 357 There is no such thing (yet) as an automated gearshift in short read mapping. It is all like stick-shift driving in San Francisco. In other words = running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy. |
338 | 358 |
339 .. __: http://www.bioinformatics.babraham.ac.uk/projects/bismark/ | 359 .. __: http://www.bioinformatics.babraham.ac.uk/projects/bismark/ |
360 | |
361 | |
362 .. class:: warningmark | |
363 | |
364 Make sure all your input reads are in the correct and same format. If thats not the case please adjust/convert the filetype with galaxy's build-in converters. | |
340 | 365 |
341 ------ | 366 ------ |
342 | 367 |
343 **Input formats** | 368 **Input formats** |
344 | 369 |
398 | 423 |
399 ------ | 424 ------ |
400 | 425 |
401 **Bismark parameter list** | 426 **Bismark parameter list** |
402 | 427 |
403 This is an exhaustive list of Bismark options: | 428 This is an exhaustive list of Bismark options. |
404 | |
405 ------ | |
406 | |
407 **OPTIONS** | |
408 | |
409 | 429 |
410 Input:: | 430 Input:: |
411 | 431 |
412 --singles A comma- or space-separated list of files containing the reads to be aligned (e.g. | 432 --singles A comma- or space-separated list of files containing the reads to be aligned (e.g. |
413 lane1.fq,lane2.fq lane3.fq). Reads may be a mix of different lengths. Bismark will | 433 lane1.fq,lane2.fq lane3.fq). Reads may be a mix of different lengths. Bismark will |
524 | 544 |
525 --temp_dir DIR Write temporary files to this directory instead of into the same directory as the input files. If | 545 --temp_dir DIR Write temporary files to this directory instead of into the same directory as the input files. If |
526 the specified folder does not exist, Bismark will attempt to create it first. The path to the | 546 the specified folder does not exist, Bismark will attempt to create it first. The path to the |
527 temporary folder can be either relative or absolute. | 547 temporary folder can be either relative or absolute. |
528 | 548 |
529 ------ | |
530 | |
531 Bowtie 2 alignment options:: | |
532 | |
533 -N INT Sets the number of mismatches to allowed in a seed alignment during multiseed alignment. | |
534 Can be set to 0 or 1. Setting this higher makes alignment slower (often much slower) | |
535 but increases sensitivity. Default: 0. This option is only available for Bowtie 2 (for | |
536 Bowtie 1 see -n). | |
537 | |
538 -L INT Sets the length of the seed substrings to align during multiseed alignment. Smaller values | |
539 make alignment slower but more senstive. Default: the --sensitive preset of Bowtie 2 is | |
540 used by default, which sets -L to 20. This option is only available for Bowtie 2 (for | |
541 Bowtie 1 see -l). | |
542 | |
543 --ignore-quals When calculating a mismatch penalty, always consider the quality value at the mismatched | |
544 position to be the highest possible, regardless of the actual value. I.e. input is treated | |
545 as though all quality values are high. This is also the default behavior when the input | |
546 doesn't specify quality values (e.g. in -f mode). This option is invariable and on by default. | |
547 | |
548 | |
549 Bowtie 2 paired-end options:: | |
550 | |
551 --no-mixed This option disables Bowtie 2's behavior to try to find alignments for the individual mates if | |
552 it cannot find a concordant or discordant alignment for a pair. This option is invariable and | |
553 and on by default. | |
554 | |
555 --no-discordant Normally, Bowtie 2 looks for discordant alignments if it cannot find any concordant alignments. | |
556 A discordant alignment is an alignment where both mates align uniquely, but that does not | |
557 satisfy the paired-end constraints (--fr/--rf/--ff, -I, -X). This option disables that behavior | |
558 and it is on by default. | |
559 | |
560 | |
561 Bowtie 2 effort options:: | |
562 | |
563 -D INT Up to INT consecutive seed extension attempts can "fail" before Bowtie 2 moves on, using | |
564 the alignments found so far. A seed extension "fails" if it does not yield a new best or a | |
565 new second-best alignment. Default: 15. | |
566 | |
567 -R INT INT is the maximum number of times Bowtie 2 will "re-seed" reads with repetitive seeds. | |
568 When "re-seeding," Bowtie 2 simply chooses a new set of reads (same length, same number of | |
569 mismatches allowed) at different offsets and searches for more alignments. A read is considered | |
570 to have repetitive seeds if the total number of seed hits divided by the number of seeds | |
571 that aligned at least once is greater than 300. Default: 2. | |
572 | |
573 | |
574 Bowtie 2 Scoring options:: | |
575 | |
576 --score_min "func" Sets a function governing the minimum alignment score needed for an alignment to be considered | |
577 "valid" (i.e. good enough to report). This is a function of read length. For instance, specifying | |
578 L,0,-0.2 sets the minimum-score function f to f(x) = 0 + -0.2 * x, where x is the read length. | |
579 See also: setting function options at http://bowtie-bio.sourceforge.net/bowtie2. The default is | |
580 L,0,-0.2. | |
581 | |
582 | |
583 Bowtie 2 Reporting options:: | |
584 | |
585 --most_valid_alignments INT This used to be the Bowtie 2 parameter -M. As of Bowtie 2 version 2.0.0 beta7 the option -M is | |
586 deprecated. It will be removed in subsequent versions. What used to be called -M mode is still the | |
587 default mode, but adjusting the -M setting is deprecated. Use the -D and -R options to adjust the | |
588 effort expended to find valid alignments. | |
589 | |
590 For reference, this used to be the old (now deprecated) description of -M: | |
591 Bowtie 2 searches for at most INT+1 distinct, valid alignments for each read. The search terminates when it | |
592 can't find more distinct valid alignments, or when it finds INT+1 distinct alignments, whichever | |
593 happens first. Only the best alignment is reported. Information from the other alignments is used to | |
594 estimate mapping quality and to set SAM optional fields, such as AS:i and XS:i. Increasing -M makes | |
595 Bowtie 2 slower, but increases the likelihood that it will pick the correct alignment for a read that | |
596 aligns many places. For reads that have more than INT+1 distinct, valid alignments, Bowtie 2 does not | |
597 guarantee that the alignment reported is the best possible in terms of alignment score. -M is | |
598 always used and its default value is set to 10. | |
599 | |
600 </help> | 549 </help> |
601 </tool> | 550 </tool> |