comparison gsnap.xml @ 2:f6ba0f12cca2 draft

Untested work-in-progress GMAP wrappers v3.0.0, from JJ back in June 2013
author peterjc
date Wed, 28 Sep 2016 10:43:44 -0400
parents 74391fc6e3f2
children 488e9d642566
comparison
equal deleted inserted replaced
1:74391fc6e3f2 2:f6ba0f12cca2
1 <tool id="gsnap" name="GSNAP" version="2.0.1"> 1 <tool id="gsnap" name="GSNAP" version="3.0.0">
2 <description>Genomic Short-read Nucleotide Alignment Program</description> 2 <description>Genomic Short-read Nucleotide Alignment Program</description>
3 <requirements> 3 <requirements>
4 <requirement type="package" version="2011-11-30">gmap</requirement> 4 <requirement type="package" version="2013-05-09">gmap</requirement>
5 </requirements> 5 </requirements>
6 <version_string>gsnap --version</version_string> 6 <version_string>gsnap --version</version_string>
7 <command> 7 <command>
8 #import os.path, re 8 #import os.path, re
9 gsnap 9 gsnap
10 --nthreads="4" --ordered 10 --nthreads="4" --ordered
11 #if $refGenomeSource.genomeSource == "gmapdb": 11 #if $refGenomeSource.genomeSource == "gmapdb":
12 #set $gmapdb = $os.listdir($refGenomeSource.gmapdb.extra_files_path)[0]
13 --dir=$refGenomeSource.gmapdb.extra_files_path --db=$refGenomeSource.gmapdb.metadata.db_name 12 --dir=$refGenomeSource.gmapdb.extra_files_path --db=$refGenomeSource.gmapdb.metadata.db_name
14 #else: 13 #else:
15 --dir=$os.path.dirname($refGenomeSource.gmapindex.value) --db=$os.path.basename($refGenomeSource.gmapindex.value) 14 --dir=$os.path.dirname($refGenomeSource.gmapindex.value) --db=$os.path.basename($refGenomeSource.gmapindex.value)
16 #end if 15 #end if
17 #if $refGenomeSource.kmer != None and len($refGenomeSource.kmer.__str__) == 2: 16 #if $refGenomeSource.kmer != None and len($refGenomeSource.kmer.__str__) == 2:
137 #end if 136 #end if
138 #end if 137 #end if
139 #if $output.options == "advanced": 138 #if $output.options == "advanced":
140 #if $output.npath.__str__ != '': 139 #if $output.npath.__str__ != '':
141 --npath=$output.npath 140 --npath=$output.npath
141 #end if
142 #if $output.maxsearch.__str__ != '':
143 --maxsearch=$output.maxsearch
142 #end if 144 #end if
143 $output.quiet_if_excessive 145 $output.quiet_if_excessive
144 $output.show_refdiff 146 $output.show_refdiff
145 $output.clip_overlap 147 $output.clip_overlap
146 #end if 148 #end if
246 </param> 248 </param>
247 <when value="fastq"> 249 <when value="fastq">
248 <param name="fastq" type="data" format="fastq" label="Select a fastq dataset" /> 250 <param name="fastq" type="data" format="fastq" label="Select a fastq dataset" />
249 <conditional name="paired"> 251 <conditional name="paired">
250 <param name="ispaired" type="boolean" truevalue="yes" falsevalue="no" checked="false" label="Use Paired Reads?"/> 252 <param name="ispaired" type="boolean" truevalue="yes" falsevalue="no" checked="false" label="Use Paired Reads?"/>
251 <when value="no"/> 253 <when value="no">
254 <!--
255 Could allow multiple input fastq and set the force-single-end flag
256 force-single-end When multiple FASTQ files are provided on the command line, GSNAP assumes
257 they are match paired-end files. This flag treats each file as single-end.
258 -->
259 </when>
252 <when value="yes"> 260 <when value="yes">
253 <param name="fastq" type="data" format="fastq" label="Select the paired reads reverse dataset" /> 261 <param name="fastq" type="data" format="fastq" label="Select the paired reads reverse dataset" />
254 <param name="orientation" type="select" label="Orientation of paired-end reads" help=""> 262 <param name="orientation" type="select" label="Orientation of paired-end reads" help="">
255 <option value="FR">fwd-rev, typical Illumina default</option> 263 <option value="FR">fwd-rev, typical Illumina default</option>
256 <option value="RF">rev-fwd, for circularized inserts</option> 264 <option value="RF">rev-fwd, for circularized inserts</option>
469 <option value="advanced">Set Computation Options</option> 477 <option value="advanced">Set Computation Options</option>
470 </param> 478 </param>
471 <when value="default"/> 479 <when value="default"/>
472 <when value="advanced"> 480 <when value="advanced">
473 <param name="max_mismatches" type="float" value="" optional="true" label="Maximum number of mismatches allowed (uses default when negative)" 481 <param name="max_mismatches" type="float" value="" optional="true" label="Maximum number of mismatches allowed (uses default when negative)"
474 help="Defaults to the ultrafast level of ((readlength+2)/12 - 2)). 482 help="Maximum number of mismatches allowed (if not specified, then
475 If specified between 0.0 and 1.0, then treated as a fraction 483 defaults to the ultrafast level of ((readlength+index_interval-1)/kmer - 2))
484 (By default, the genome index interval is 3, but this can be changed
485 by providing a different value for -q to gmap_build when processing the genome.)
486 If specified between 0.0 and 1.0, then treated as a fraction
476 of each read length. Otherwise, treated as an integral number 487 of each read length. Otherwise, treated as an integral number
477 of mismatches (including indel and splicing penalties) 488 of mismatches (including indel and splicing penalties)
478 For RNA-Seq, you may need to increase this value slightly 489 For RNA-Seq, you may need to increase this value slightly
479 to align reads extending past the ends of an exon."> 490 to align reads extending past the ends of an exon.">
480 <validator type="in_range" message="The mismatches must >= 0." min="0."/> 491 <validator type="in_range" message="The mismatches must >= 0." min="0."/>
481 </param> 492 </param>
482 <param name="query_unk_mismatch" type="boolean" checked="false" truevalue="--query-unk-mismatch=1" falsevalue="" label="Count unknown (N) characters in the query as a mismatch"/> 493 <param name="query_unk_mismatch" type="boolean" checked="false" truevalue="--query-unk-mismatch=1" falsevalue="" label="Count unknown (N) characters in the query as a mismatch"/>
483 <param name="genome_unk_mismatch" type="boolean" checked="true" truevalue="" falsevalue="--genome-unk-mismatch=0" label="Count unknown (N) characters in the genome as a mismatch"/> 494 <param name="genome_unk_mismatch" type="boolean" checked="true" truevalue="" falsevalue="--genome-unk-mismatch=0" label="Count unknown (N) characters in the genome as a mismatch"/>
484 <param name="terminal_threshold" type="integer" value="" optional="true" label="Threshold for searching for a terminal alignment (default 2)" 495 <param name="maxsearch" type="integer" value="" optional="true" label="Maximum number of alignments to find (default 1000)"
485 help="(from one end of the read to the best possible position at the other end). For example, if this value is 2, then if GSNAP finds an exact or 496 help="Must be larger than paths, which is the number to report.
497 Keeping this number large will allow for random selection among multiple alignments.
498 Reducing this number can speed up the program. "/>
499
500 <param name="terminal_threshold" type="integer" value="" optional="true" label="Threshold for searching for a terminal alignment"
501 help="Threshold for searching for a terminal alignment (from one end of the
502 read to the best possible position at the other end) (default 2
503 for standard, atoi-stranded, and atoi-nonstranded mode; default 100
504 for cmet-stranded and cmet-nonstranded mode).
505 For example, if this value is 2, then if GSNAP finds an exact or
486 1-mismatch alignment, it will not try to find a terminal alignment. 506 1-mismatch alignment, it will not try to find a terminal alignment.
487 Note that this default value may not be low enough if you want to 507 Note that this default value may not be low enough if you want to
488 obtain terminal alignments for very short reads, although such reads 508 obtain terminal alignments for very short reads, although such reads
489 probably don't have enough specificity for terminal alignments anyway." /> 509 probably don't have enough specificity for terminal alignments anyway.
510 To turn off terminal alignments, set this to a high value, greater
511 than the value for max-mismatches.
512 "/>
490 <param name="indel_penalty" type="integer" value="" optional="true" label="Penalty for an indel (default 2)" 513 <param name="indel_penalty" type="integer" value="" optional="true" label="Penalty for an indel (default 2)"
491 help="Counts against mismatches allowed. To find indels, make indel-penalty less than or equal to max-mismatches. A value &lt; 2 can lead to false positives at read ends" /> 514 help="Counts against mismatches allowed. To find indels, make indel-penalty less than or equal to max-mismatches. A value &lt; 2 can lead to false positives at read ends" />
492 <param name="indel_endlength" type="integer" value="" optional="true" label="Minimum length at end required for indel alignments (default 4)" /> 515 <param name="indel_endlength" type="integer" value="" optional="true" label="Minimum length at end required for indel alignments (default 4)" />
493 <param name="max_middle_insertions" type="integer" value="" optional="true" label="Maximum number of middle insertions allowed (default 9)" /> 516 <param name="max_middle_insertions" type="integer" value="" optional="true" label="Maximum number of middle insertions allowed (default 9)" />
494 <param name="max_middle_deletions" type="integer" value="" optional="true" label="Maximum number of middle deletions allowed (default 30)" /> 517 <param name="max_middle_deletions" type="integer" value="" optional="true" label="Maximum number of middle deletions allowed (default 30)" />
495 <param name="max_end_insertions" type="integer" value="" optional="true" label="Maximum number of end insertions allowed (default 3)" /> 518 <param name="max_end_insertions" type="integer" value="" optional="true" label="Maximum number of end insertions allowed (default 3)" />
496 <param name="max_end_deletions" type="integer" value="" optional="true" label="Maximum number of end deletions allowed (default 6)" /> 519 <param name="max_end_deletions" type="integer" value="" optional="true" label="Maximum number of end deletions allowed (default 6)" />
497 <param name="suboptimal_levels" type="integer" value="" optional="true" label="Report suboptimal hits beyond best hit (default 0)" 520 <param name="suboptimal_levels" type="integer" value="" optional="true" label="Report suboptimal hits beyond best hit (default 0)"
498 help="All hits with best score plus suboptimal-levels are reported" /> 521 help="All hits with best score plus suboptimal-levels are reported" />
499 <param name="adapter_strip" type="select" label="Method for removing adapters from reads" 522 <param name="adapter_strip" type="select" label="Method for removing adapters from reads"
500 help="paired removes adapters from paired-end reads if a concordant or paired alignment cannot be found from the original read"> 523 help="Default is 'off'. To turn on, specify 'paired', which removes adapters
501 <option value="paired" selected="true">paired</option> 524 from paired-end reads if they appear to be present.">
502 <option value="off">off</option> 525 <option value="paired">paired</option>
526 <option value="off" selected="true">off</option>
503 </param> 527 </param>
504 <param name="trim_mismatch_score" type="integer" value="" optional="true" label="Score to use for mismatches when trimming at ends (default is -3)" 528 <param name="trim_mismatch_score" type="integer" value="" optional="true" label="Score to use for mismatches when trimming at ends (default is -3)"
505 help="to turn off trimming, specify 0 (Warning: turning trimming off will give false positive mismatches at the ends of reads)"/> 529 help="to turn off trimming, specify 0 (Warning: turning trimming off will give false positive mismatches at the ends of reads)"/>
506 <param name="trim_indel_score" type="integer" value="" optional="true" label="Score to use for indels when trimming at ends (default is -4)" 530 <param name="trim_indel_score" type="integer" value="" optional="true" label="Score to use for indels when trimming at ends (default is -4)"
507 help="to turn off trimming, specify 0 (Warning: turning trimming off will give false positive indels at the ends of reads)"/> 531 help="to turn off trimming, specify 0 (Warning: turning trimming off will give false positive indels at the ends of reads)"/>
521 545
522 <!-- Options for GMAP alignment within GSNAP --> 546 <!-- Options for GMAP alignment within GSNAP -->
523 <param name="gmap_mode" type="select" multiple="true" optional="true" display="checkboxes" label="Cases to use GMAP for complex alignments containing multiple splices or indels" 547 <param name="gmap_mode" type="select" multiple="true" optional="true" display="checkboxes" label="Cases to use GMAP for complex alignments containing multiple splices or indels"
524 help="Default: pairsearch,terminal,improve"> 548 help="Default: pairsearch,terminal,improve">
525 <option value="pairsearch" selected="true">pairsearch</option> 549 <option value="pairsearch" selected="true">pairsearch</option>
550 <option value="indel_knownsplice" selected="true">indel_knownsplice</option>
526 <option value="terminal" selected="true">terminal</option> 551 <option value="terminal" selected="true">terminal</option>
527 <option value="improve" selected="true">improve</option> 552 <option value="improve" selected="true">improve</option>
528 </param> 553 </param>
529 <param name="trigger_score_for_gmap" type="integer" value="" optional="true" label="GMAP pairsearch threshold (default 5)" 554 <param name="trigger_score_for_gmap" type="integer" value="" optional="true" label="GMAP pairsearch threshold (default 5)"
530 help="Try GMAP pairsearch on nearby genomic regions if best score (the total of both ends if paired-end) exceeds this value (default 5)" /> 555 help="Try GMAP pairsearch on nearby genomic regions if best score (the total of both ends if paired-end) exceeds this value (default 5)" />