annotate breseq.xml @ 10:e21c4ceb0039 draft default tip

Uploaded
author dsobral
date Sat, 03 Mar 2018 11:47:47 -0500
parents 0e1caade4d38
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
1 <tool id="breseq" name="Breseq Variant Report" version="0.31.1" hidden="false">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
2 <description>Runs Breseq software on a set of fastq files</description>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
3
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
4 <requirements>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
5 <requirement type="package" version="0.31.1">breseq</requirement>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
6 </requirements>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
7
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
8 <command interpreter="python">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
9 breseq_wrapper.py
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
10
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
11 $outfile
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
12 $outfile.files_path
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
13
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
14 --num-processors \${GALAXY_SLOTS:-4}
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
15
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
16 #if str($reference.source) == "history":
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
17 #for $i, $s in enumerate( $reference.ref_series )
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
18 -r $s.own_genome
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
19 #end for
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
20 #else:
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
21 -r $reference.fixed_genome.fields.path
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
22 #end if
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
23 #for $i, $s in enumerate( $read_series )
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
24 ${s.input}
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
25 #end for
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
26
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
27 #if str($polymorphism.selection) == "yes":
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
28 --polymorphism-prediction
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
29 --polymorphism-reject-indel-homopolymer-length $polymorphism.indel_homopolymer_length
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
30 --polymorphism-reject-surrounding-homopolymer-length $polymorphism.surrounding_homopolymer_length
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
31 --polymorphism-minimum-coverage-each-strand $polymorphism.strand_coverage
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
32 --polymorphism-bias-cutoff $polymorphism.bias_pvalue
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
33 #end if
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
34
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
35 #if str($junction_reference.selection) == "yes":
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
36 #for $i, $s in enumerate( $junction_reference.j_series )
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
37 --junction-only-reference $s.jc_genome
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
38 #end for
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
39 #end if
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
40
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
41 ${cnv_evidence}
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
42
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
43 -b $minqvalue
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
44
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
45 </command>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
46
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
47 <stdio>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
48 <exit_code range="1:" level="fatal" description="Fatal ERROR exit code greater than 1" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
49 </stdio>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
50
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
51 <inputs>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
52 <!-- reference genome -->
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
53 <conditional name="reference">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
54 <param name="source" type="select" label="Will you select a reference genome from your history or use a built-in genome?" >
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
55 <option value="indexed">Use a built-in genome</option>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
56 <option value="history">Use one from the history</option>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
57 </param>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
58 <when value="indexed">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
59 <param name="fixed_genome" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact the Bioinformatics team">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
60 <options from_data_table="genbank_files">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
61 <filter type="sort_by" column="2"/>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
62 <validator type="no_options" message="No indexes are available for the selected input dataset"/>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
63 </options>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
64 </param>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
65 </when>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
66 <when value="history">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
67 <!-- <param name="own_genome" type="data" label="Select the reference genome (fasta or genbank)" /> -->
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
68 <repeat name="ref_series" title="Reference Genome" min="1">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
69 <param name="own_genome" type="data" label="Select the reference genome (fasta or genbank)" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
70 </repeat>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
71 </when>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
72 </conditional>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
73
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
74
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
75 <!-- input Fastq files -->
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
76 <repeat name="read_series" title="Read File" min="1">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
77 <param name="input" type="data" format="fastq" label="Dataset" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
78 </repeat>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
79
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
80
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
81 <!-- select polymorphism -->
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
82 <conditional name="polymorphism">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
83 <param name="selection" type="select" label="Perform polimorphism detection" help="Do you want to perform polimorphism detection in a population">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
84 <option value="no">Do not perform polymorphism detection</option>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
85 <option value="yes">Perform polymorphism detection</option>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
86 </param>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
87 <when value="yes">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
88 <param name="indel_homopolymer_length" type="integer" value="0" label="Reject insertion/deletion polymorphisms due to homopolymer repeats with this length or greater" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
89 <param name="surrounding_homopolymer_length" type="integer" value="0" label="Do not predict polymorphic base substitutions that create a homopolymer with this length on each side (with 2 TTATT->TTTTT is rejected)" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
90 <param name="strand_coverage" type="integer" value="3" label="Only accept polymorphisms if coverage in each strand is at least this" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
91 <param name="bias_pvalue" type="float" value="0.05" label="Only accept polymorphisms if pvalue of strand or read quality bias is greater than this" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
92 </when>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
93 <when value="no" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
94 </conditional>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
95
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
96 <!-- junction only reference(s) -->
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
97 <conditional name="junction_reference">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
98 <param name="selection" type="select" label="Detect external sequence insertion" help="You can select external sequences to detect insertions">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
99 <option value="no">Do not detect external sequence insertion</option>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
100 <option value="yes">Detect external sequence insertions</option>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
101 </param>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
102 <when value="yes">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
103 <repeat name="j_series" title="Junction-only references" min="1">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
104 <param name="jc_genome" type="data" label="Select an external sequence (fasta or genbank)" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
105 </repeat>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
106 </when>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
107 <when value="no" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
108 </conditional>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
109
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
110 <!-- Copy Number Evidence -->
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
111 <param name="cnv_evidence" type="select" label="Copy number variation prediction (experimental option)" help="Do you want to perform copy number variation prediction">
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
112 <option value="">Do not perform copy number variaion prediction</option>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
113 <option value="--cnv">Perform copy number variation prediction (--cnv)</option>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
114 </param>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
115
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
116 <param name="minqvalue" type="integer" value="3" label="Minimum Phred Q for a base to be considered" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
117
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
118
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
119 </inputs>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
120
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
121 <outputs>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
122 <data format="prezip.html" name="outfile" label="Breseq HTML report" />
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
123 </outputs>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
124
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
125 <help>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
126 **Breseq**
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
127
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
128 Breseq_ is a computational pipeline for finding mutations relative to a reference sequence in short-read DNA re-sequencing data for microbial sized genomes.
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
129
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
130 .. _Breseq: http://barricklab.org/twiki/bin/view/Lab/ToolsBacterialGenomeResequencing
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
131
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
132 ------
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
133
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
134 **Inputs**
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
135
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
136 Breseq accepts files in FASTQ format. It does not take pair-end information into account.
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
137
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
138 You can either run in clonal (consensus) mode or search for polymorphisms in a population.
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
139
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
140 You can also select an external sequence (eg. a transposon) to detect for insertions or horizontal transfer.
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
141
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
142
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
143 ------
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
144
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
145 **Outputs**
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
146
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
147 Breseq outputs a number of files. These are all condensed in a single zipped file.
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
148
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
149 It contains output files with the final results, accessible through ``output/index.html``
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
150
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
151 It also contains data files with accessory data, including:
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
152
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
153 - ``data/reference.fasta`` (file with reference genome: can be used in eg. IGV browser)
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
154 - ``data/reference.gff`` (file with genomic annotations: can be used in eg. IGV browser)
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
155 - ``data/areference.bam`` (file with read alignments: can be used in eg. IGV browser)
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
156 - ``data/unmatched.*`` (files with read that failed to align: can be used to build an assembly or to eg. blast against NCBI)
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
157
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
158 </help>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
159 </tool>
0e1caade4d38 Uploaded
dsobral
parents:
diff changeset
160