annotate srst2v2.xml @ 0:ffd5306daa4c draft

planemo upload
author estrain
date Tue, 28 Nov 2017 22:46:01 -0500
parents
children 16c9fccf550d
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
1 <tool id="srst2v2" name="SRST2 - Short Read Sequence Typer (v2)" version="0.2.0">
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
2 <requirements>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
3 <requirement type="package" version="0.2.0">srst2</requirement>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
4 </requirements>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
5 <command detect_errors="exit_code"><![CDATA[
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
6 #if $paired_conditional.sPaired == "paired"
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
7 ln -s $paired_conditional.fastq1 sample_1.fastq;
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
8 ln -s $paired_conditional.fastq2 sample_2.fastq;
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
9 #end if
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
10
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
11 srst2
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
12
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
13 #if $paired_conditional.sPaired == "single"
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
14 --input_se $paired_conditional.fastq1
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
15 #else if $paired_conditional.sPaired == "paired"
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
16 --input_pe sample_1.fastq sample_2.fastq
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
17 #end if
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
18
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
19 --output srst2out
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
20 --save_scores
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
21 --mlst_definitions "$mlst_definitions"
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
22 --mlst_db "$mlst_db"
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
23 --mlst_delimiter $mlstdelim
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
24 --mlst_max_mismatch $mlst_max_mismatch
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
25
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
26 ]]></command>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
27 <inputs>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
28 <conditional name="paired_conditional">
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
29 <param name="sPaired" type="select" label="Single-End or Paired-End FASTQ?">
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
30 <option value="single">Single-end</option>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
31 <option value="paired">Paired-end</option>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
32 </param>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
33 <when value="single">
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
34 <param name="fastq1" type="data" format="fastq" label="FASTQ file" help="FASTQ" />
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
35 </when>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
36 <when value="paired">
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
37 <param name="fastq1" type="data" format="fastq" label="Forward FASTQ file" help="FASTQ" />
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
38 <param name="fastq2" type="data" format="fastq" label="Reverse FASTQ file" help="FASTQ" />
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
39 </when>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
40 </conditional>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
41
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
42 <param type="data" name="mlst_db" label="Fasta file of MLST alleles" format="fasta" />
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
43 <param type="data" name="mlst_definitions" label="ST definitions for MLST scheme" format="tabular" />
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
44 <param type="text" name="mlstdelim" value="_" format="txt" label="Character(s) separating gene name from allele number in MLST database (default &apos;_&apos;)" />
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
45 <param type="integer" name="mlst_max_mismatch" value="10" format="txt" label="Maximum number of mismatches per read for MLST allele calling (default 10)" />
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
46 </inputs>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
47
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
48 <outputs>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
49 <data format="txt" label="Scores" name="scores" from_work_dir="*.scores"/>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
50 <data format="bam" label="bam alignment" name="bam" from_work_dir="*.sorted.bam"/>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
51 <data format="pileup" label="pileup" name="pileup" from_work_dir="*.pileup"/>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
52 <data format="txt" label="Alleles" name="alleles" from_work_dir="*results.txt"/>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
53 </outputs>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
54
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
55 <help><![CDATA[
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
56
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
57 SRST2 - Short Read Sequence Typer (v2)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
58
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
59 This program is designed to take Illumina sequence data, a MLST database and/or a database of gene sequences (e.g. resistance genes, virulence genes, etc) and report the presence of STs and/or reference genes.
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
60
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
61
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
62
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
63 optional arguments:
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
64 -h, --help show this help message and exit
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
65 --version show program's version number and exit
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
66 --input_se INPUT_SE
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
67 Single end read file(s) for analysing (may be gzipped)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
68 --input_pe INPUT_PE
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
69 Paired end read files for analysing (may be gzipped)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
70 --merge_paired Switch on if all the input read sets belong to a
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
71 single sample, and you want to merge their data to get
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
72 a single result
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
73 --forward FORWARD Designator for forward reads (only used if NOT in
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
74 MiSeq format sample_S1_L001_R1_001.fastq.gz; otherwise
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
75 default is _1, i.e. expect forward reads as
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
76 sample_1.fastq.gz)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
77 --reverse REVERSE Designator for reverse reads (only used if NOT in
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
78 MiSeq format sample_S1_L001_R2_001.fastq.gz; otherwise
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
79 default is _2, i.e. expect forward reads as
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
80 sample_2.fastq.gz
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
81 --read_type READ_TYPE
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
82 Read file type (for bowtie2; default is q=fastq; other
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
83 options: qseq=solexa, f=fasta).
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
84 --mlst_db MLST_DB Fasta file of MLST alleles (optional)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
85 --mlst_delimiter MLST_DELIMITER
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
86 Character(s) separating gene name from allele number
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
87 in MLST database (default "-", as in arcc-1)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
88 --mlst_definitions MLST_DEFINITIONS
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
89 ST definitions for MLST scheme (required if mlst_db
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
90 supplied and you want to calculate STs)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
91 --mlst_max_mismatch MLST_MAX_MISMATCH
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
92 Maximum number of mismatches per read for MLST allele
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
93 calling (default 10)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
94 --gene_db GENE_DB
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
95 Fasta file/s for gene databases (optional)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
96 --no_gene_details Switch OFF verbose reporting of gene typing
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
97 --gene_max_mismatch GENE_MAX_MISMATCH
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
98 Maximum number of mismatches per read for gene
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
99 detection and allele calling (default 10)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
100 --min_coverage MIN_COVERAGE
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
101 Minimum %coverage cutoff for gene reporting (default
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
102 90)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
103 --max_divergence MAX_DIVERGENCE
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
104 Maximum %divergence cutoff for gene reporting (default
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
105 10)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
106 --min_depth MIN_DEPTH
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
107 Minimum mean depth to flag as dubious allele call
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
108 (default 5)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
109 --min_edge_depth MIN_EDGE_DEPTH
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
110 Minimum edge depth to flag as dubious allele call
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
111 (default 2)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
112 --prob_err PROB_ERR Probability of sequencing error (default 0.01)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
113 --truncation_score_tolerance TRUNCATION_SCORE_TOLERANCE
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
114 % increase in score allowed to choose non-truncated
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
115 allele
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
116 --stop_after STOP_AFTER
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
117 Stop mapping after this number of reads have been
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
118 mapped (otherwise map all)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
119 --other OTHER
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
120 Other arguments to pass to bowtie2 (must be escaped,
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
121 e.g. "\\--no-mixed".)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
122 --max_unaligned_overlap MAX_UNALIGNED_OVERLAP
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
123 Read discarded from alignment if either of its ends
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
124 has unaligned overlap with the reference that is
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
125 longer than this value (default 10)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
126 --mapq MAPQ Samtools -q parameter (default 1)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
127 --baseq BASEQ Samtools -Q parameter (default 20)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
128 --samtools_args SAMTOOLS_ARGS
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
129 Other arguments to pass to samtools mpileup (must be
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
130 escaped, e.g. "\\-A").
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
131 --output OUTPUT Prefix for srst2 output files
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
132 --log Switch ON logging to file (otherwise log to stdout)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
133 --save_scores Switch ON verbose reporting of all scores
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
134 --report_new_consensus
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
135 If a matching alleles is not found, report the
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
136 consensus allele. Note, only SNP differences are
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
137 considered, not indels.
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
138 --report_all_consensus
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
139 Report the consensus allele for the most likely
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
140 allele. Note, only SNP differences are considered, not
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
141 indels.
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
142 --use_existing_bowtie2_sam
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
143 Use existing SAM file generated by Bowtie2 if
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
144 available, otherwise they will be generated
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
145 --use_existing_pileup
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
146 Use existing pileups if available, otherwise they will
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
147 be generated
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
148 --use_existing_scores
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
149 Use existing scores files if available, otherwise they
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
150 will be generated
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
151 --keep_interim_alignment
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
152 Keep interim files (sam & unsorted bam), otherwise
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
153 they will be deleted after sorted bam is created
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
154 --threads THREADS Use multiple threads in Bowtie and Samtools
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
155 --prev_output PREV_OUTPUT
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
156 SRST2 results files to compile (any new results from
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
157 this run will also be incorporated)
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
158
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
159
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
160 ]]></help>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
161
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
162
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
163 <citations>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
164 <citation type="bibtex">
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
165 @misc{pope_dashnow_zobel_holt_raven_schultz_inouye_tomita_2014,
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
166 title={SRST2: Rapid genomic surveillance for public health and hospital microbiology labs},
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
167 url={https://genomemedicine.biomedcentral.com/articles/10.1186/s13073-014-0090-6},
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
168 journal={Genome Medicine}, publisher={BioMed Central},
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
169 author={Pope, Bernard J and Dashnow, Harriet and Zobel, Justin and Holt, Kathryn E and Raven, Lesley-Ann and Schultz, Mark B and Inouye, Michael and Tomita, Takehiro},
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
170 year={2014}, month={Nov}} ,
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
171 }</citation>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
172 </citations>
ffd5306daa4c planemo upload
estrain
parents:
diff changeset
173 </tool>