annotate bismark_wrapper/bismark_wrapper.xml @ 3:678f31a13093 draft

Uploaded
author bgruening
date Fri, 12 Oct 2012 09:29:51 -0400
parents 5226800b84ca
children a4bd52c4ed46
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
1 <tool id="bismark" name="Bismark" version="0.7.7.1">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
2 <!-- Wrapper compatible with Bismark version 0.7.7 -->
2
5226800b84ca Uploaded
bgruening
parents: 0
diff changeset
3 <description>bisulfite mapper</description>
0
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
4 <version_command>bismark --version</version_command>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
5 <requirements>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
6 <requirement type="package">bismark</requirement>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
7 <requirement type="package">bismark_genome_preparation</requirement>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
8 <requirement type="package" version="2.0.0-beta7">bowtie2</requirement>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
9 </requirements>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
10 <parallelism method="basic"></parallelism>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
11 <command interpreter="python">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
12 bismark_wrapper.py
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
13
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
14 ## Change this to accommodate the number of threads you have available.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
15 --num-threads 4
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
16
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
17 ##
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
18 ## Bismark Genome Preparation, if desired.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
19 ##
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
20
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
21 ## Handle reference file.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
22 #if $refGenomeSource.genomeSource == "history":
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
23 --own-file=$refGenomeSource.ownFile
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
24 #else:
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
25 --indexes-path ${refGenomeSource.index.fields.path}
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
26 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
27
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
28
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
29 ##
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
30 ## Input parameters
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
31 ##
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
32
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
33
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
34 #if $singlePaired.sPaired == "single":
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
35 --single-paired $singlePaired.input_singles
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
36
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
37 #if $singlePaired.input_singles.ext == "fastqillumina":
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
38 --phred64-quals
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
39 --fastq
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
40 #elif $singlePaired.input_singles.ext == "fastqsanger":
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
41 --fastq
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
42 #elif $singlePaired.input_singles.ext == "fasta":
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
43 --fasta
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
44 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
45 #else:
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
46 --mate-paired
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
47 --mate1 $singlePaired.input_mate1
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
48 --mate2 $singlePaired.input_mate2
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
49
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
50 #if $singlePaired.input_mate1.ext == "fastqillumina":
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
51 --phred64-quals
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
52 --fastq
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
53 #elif $singlePaired.input_mate1.ext == "fastqsanger":
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
54 --fastq
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
55 #elif $singlePaired.input_mate1.ext == "fasta":
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
56 --fasta
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
57 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
58
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
59 -I $singlePaired.minInsert
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
60 -X $singlePaired.maxInsert
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
61 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
62
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
63
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
64 ## for now hardcode the value for the required memory per thread in --best mode
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
65 --chunkmbs 512
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
66
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
67
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
68 #if $params.settingsType == "custom":
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
69
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
70 ## default 20
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
71 --seed-len $params.seed_len
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
72 ## default 0
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
73 --seed-mismatches $params.seed_mismatches
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
74 ## default 15
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
75 --seed-extention-attempts $params.seed_extention_attempts
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
76 ## default 2
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
77 --max-reseed $params.max_reseed
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
78
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
79 ## default 70
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
80 ##--maqerr $params.maqerr
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
81
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
82 ## default unlimited
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
83 #if $params.qupto != 0:
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
84 --qupto $params.qupto
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
85 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
86 #if $params.skip_reads != 0:
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
87 --skip-reads $params.skip_reads
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
88 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
89
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
90 ## if set, disable the original behaviour
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
91 $params.no_mixed
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
92 ## if set, disable the original behaviour
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
93 $params.no_discordant
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
94
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
95
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
96 ###if str($params.isReportOutput) == "yes":
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
97 ## --output-report-file $report_file
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
98 ###end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
99
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
100 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
101
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
102 ##
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
103 ## Output parameters.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
104 ##
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
105 --output $output
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
106 $suppress_header
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
107
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
108 #if str( $singlePaired.sPaired ) == "single"
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
109 #if $output_unmapped_reads_l
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
110 --output-unmapped-reads $output_unmapped_reads_l
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
111 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
112 #if $output_suppressed_reads_l
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
113 --output-suppressed-reads $output_suppressed_reads_l
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
114 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
115 #else
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
116 #if $output_unmapped_reads_l and $output_unmapped_reads_r
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
117 --output-unmapped-reads-l $output_unmapped_reads_l
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
118 --output-unmapped-reads-r $output_unmapped_reads_r
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
119 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
120 #if $output_suppressed_reads_l and $output_suppressed_reads_l
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
121 --output-suppressed-reads-l $output_suppressed_reads_l
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
122 --output-suppressed-reads-r $output_suppressed_reads_r
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
123 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
124 #end if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
125
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
126 </command>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
127 <inputs>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
128 <conditional name="refGenomeSource">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
129 <param name="genomeSource" type="select" label="Will you select a reference genome from your history or use a built-in index?" help="Built-ins were indexed using default options">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
130 <option value="indexed">Use a built-in index</option>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
131 <option value="history">Use one from the history</option>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
132 </param>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
133 <when value="indexed">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
134 <param name="index" type="select" label="Select a reference genome" help="If your genome of interest is not listed, contact your Galaxy admin">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
135 <options from_data_table="bismark_indexes">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
136 <filter type="sort_by" column="2"/>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
137 <validator type="no_options" message="No indexes are available for the selected input dataset"/>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
138 </options>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
139 </param>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
140 </when> <!-- build-in -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
141 <when value="history">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
142 <param name="ownFile" type="data" format="fasta" metadata_name="dbkey" label="Select the reference genome" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
143 </when> <!-- history -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
144 </conditional> <!-- refGenomeSource -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
145
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
146 <!-- Input Parameters -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
147 <conditional name="singlePaired">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
148 <param name="sPaired" type="select" label="Is this library mate-paired?">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
149 <option value="single">Single-end</option>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
150 <option value="paired">Paired-end</option>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
151 </param>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
152 <when value="single">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
153 <param name="input_singles" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
154 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
155 <when value="paired">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
156 <param name="input_mate1" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
157 <param name="input_mate2" type="data" format="fastqsanger,fastqillumina,fastq,fasta" label="FASTQ/FASTA file" help="FASTQ or FASTA files." />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
158 <param name="minInsert" type="integer" value="0" label="Minimum insert size for valid paired-end alignments" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
159 <param name="maxInsert" type="integer" value="250" label="Maximum insert size for valid paired-end alignments" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
160 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
161 </conditional>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
162
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
163
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
164 <conditional name="params">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
165 <param name="settingsType" type="select" label="Bismark settings to use" help="You can use the default settings or set custom values for any of Bismark's parameters.">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
166 <option value="default">Use Defaults</option>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
167 <option value="custom">Full parameter list</option>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
168 </param>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
169 <when value="default" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
170 <!-- Full/advanced params. -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
171 <when value="custom">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
172 <param name="seed_mismatches" type="integer" value="0" label="Number of mismatches to be allowed in a seed alignment during multiseed alignment" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
173 <param name="seed_len" type="integer" value="20" label="Length of the seed substrings to align during multiseed alignment" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
174 <!--
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
175 <param name="maqerr" type="integer" value="70" label="Maximum permitted total of quality values at all mismatched read positions throughout the entire alignment, not just in the 'seed'." />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
176 -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
177 <param name="seed_extention_attempts" type="integer" value="15" label="How many consecutive seed extension attempts can fail before Bowtie 2 moves on" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
178 <param name="max_reseed" type="integer" value="2" label="Maximum number of times Bowtie 2 will re-seed reads with repetitive seeds" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
179
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
180 <param name="qupto" type="integer" value="0" label="Only aligns the first N reads or read pairs from the input" help="Default is 0 and means 'no-limit'." />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
181 <param name="skip_reads" type="integer" value="0" label="Skip (i.e. do not align) the first N reads or read pairs from the input" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
182
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
183 <param name="no_discordant" type="boolean" truevalue="--no-discordant" falsevalue="" checked="False" label="Disable looking for discordant alignments if it cannot find any concordant alignments" help="" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
184 <param name="no_mixed" type="boolean" truevalue="--no-mixed" falsevalue="" checked="False" label="Disable Bowtie 2's behaviour to try to find alignments for the individual mates" help="" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
185
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
186 <param name="suppressed_read_file" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Write ambiguous reads to an extra output file." help="Write all reads which produce more than one valid alignment with the same number of lowest mismatches or other reads that fail to align uniquely." />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
187 <param name="unmapped_read_file" type="boolean" truevalue="true" falsevalue="false" checked="False" label="Write all reads that could not be aligned to a file" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
188 <!-- output Options -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
189 <!-- did not now if that is necessary and how it is possible to access that property in output
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
190 <param name="isReportOutput" type="select" label="Offer all report files concatenated in one file.">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
191 <option value="yes">yes</option>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
192 <option value="no">no</option>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
193 </param>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
194 -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
195 <!--end output options -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
196 </when> <!-- full -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
197 </conditional> <!-- params -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
198 <param name="suppress_header" type="boolean" truevalue="--suppress-header" falsevalue="" checked="False" label="Suppress the header in the output SAM file" help="Bowtie produces SAM with several lines of header information by default" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
199 </inputs>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
200 <outputs>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
201 <!-- that does not work
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
202 <data format="txt" name="report_file" label="${tool.name} on ${on_string}: Report">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
203 <filter>str($params.isReportOutput) == "yes"</filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
204 </data>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
205 -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
206 <data format="sam" name="output" label="${tool.name} on ${on_string}: mapped reads">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
207 <actions>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
208 <conditional name="refGenomeSource.genomeSource">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
209 <when value="indexed">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
210 <action type="metadata" name="dbkey">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
211 <option type="from_data_table" name="bowtie2_indexes" column="1" offset="0">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
212 <filter type="param_value" column="0" value="#" compare="startswith" keep="False"/>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
213 <filter type="param_value" ref="refGenomeSource.index" column="0"/>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
214 </option>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
215 </action>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
216 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
217 <when value="history">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
218 <action type="metadata" name="dbkey">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
219 <option type="from_param" name="refGenomeSource.ownFile" param_attribute="dbkey" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
220 </action>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
221 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
222 </conditional>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
223 </actions>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
224 </data>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
225
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
226 <data format="fastq" name="output_suppressed_reads_l" label="${tool.name} on ${on_string}: suppressed reads (L)">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
227 <filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
228 ((
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
229 params['settingsType'] == "custom" and
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
230 params['suppressed_read_file'] is True
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
231 ))
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
232 </filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
233 <actions>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
234 <conditional name="singlePaired.sPaired">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
235 <when value="single">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
236 <action type="format">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
237 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
238 </action>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
239 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
240 <when value="paired">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
241 <action type="format">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
242 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
243 </action>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
244 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
245 </conditional>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
246 </actions>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
247 </data>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
248
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
249 <data format="fastq" name="output_suppressed_reads_r" label="${tool.name} on ${on_string}: suppressed reads (R)">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
250 <filter>singlePaired['sPaired'] == "paired"</filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
251 <filter>params['settingsType'] == "custom"</filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
252 <filter>params['supressed_read_file'] is True</filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
253 <actions>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
254 <conditional name="singlePaired.sPaired">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
255 <when value="single">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
256 <action type="format">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
257 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
258 </action>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
259 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
260 <when value="paired">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
261 <action type="format">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
262 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
263 </action>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
264 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
265 </conditional>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
266 </actions>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
267 </data>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
268
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
269 <!-- Outout unmapped reads -->
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
270 <data format="fastq" name="output_unmapped_reads_l" label="${tool.name} on ${on_string}: unmapped reads (L)">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
271 <filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
272 ((
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
273 params['settingsType'] == "custom" and
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
274 params['unmapped_read_file'] is True
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
275 ))
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
276 </filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
277 <actions>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
278 <conditional name="singlePaired.sPaired">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
279 <when value="single">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
280 <action type="format">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
281 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
282 </action>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
283 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
284 <when value="paired">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
285 <action type="format">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
286 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
287 </action>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
288 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
289 </conditional>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
290 </actions>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
291 </data>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
292 <data format="fastq" name="output_unmapped_reads_r" label="${tool.name} on ${on_string}: unmapped reads (R)">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
293 <filter>singlePaired['sPaired'] == "paired"</filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
294 <filter>params['settingsType'] == "custom"</filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
295 <filter>params['unmapped_read_file'] is True</filter>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
296 <actions>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
297 <conditional name="singlePaired.sPaired">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
298 <when value="single">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
299 <action type="format">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
300 <option type="from_param" name="singlePaired.input_singles" param_attribute="ext" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
301 </action>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
302 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
303 <when value="paired">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
304 <action type="format">
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
305 <option type="from_param" name="singlePaired.input_mate1" param_attribute="ext" />
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
306 </action>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
307 </when>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
308 </conditional>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
309 </actions>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
310 </data>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
311
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
312
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
313 </outputs>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
314
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
315 <tests>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
316 </tests>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
317
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
318 <help>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
319
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
320 **What it does**
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
321
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
322 Bismark_ is a bisulfite mapper and methylation caller. Bismark takes in FastA or FastQ files and aligns the
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
323 reads to a specified bisulfite genome. Sequence reads are transformed into a bisulfite converted forward strand
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
324 version (C->T conversion) or into a bisulfite treated reverse strand (G->A conversion of the forward strand).
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
325 Each of these reads are then aligned to bisulfite treated forward strand index of a reference genome
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
326 (C->T converted) and a bisulfite treated reverse strand index of the genome (G->A conversion of the
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
327 forward strand, by doing this alignments will produce the same positions). These 4 instances of Bowtie (1 or 2)
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
328 are run in parallel. The sequence file(s) are then read in again sequence by sequence to pull out the original
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
329 sequence from the genome and determine if there were any protected C's present or not.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
330
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
331 .. _Bismark: http://www.bioinformatics.babraham.ac.uk/projects/bismark/
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
332
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
333 As of version 0.7.0 Bismark will only run 2 alignment threads for OT and OB in parallel, the 4 strand mode can be
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
334 re-enabled by using non_directional mode.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
335
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
336 It is developed by Krueger F and Andrews SR. at the Babraham Institute. Krueger F, Andrews SR. (2011) Bismark: a flexible aligner and methylation caller for Bisulfite-Seq applications. Bioinformatics, 27, 1571-2.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
337
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
338 ------
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
339
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
340 **Know what you are doing**
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
341
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
342 .. class:: warningmark
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
343
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
344 There is no such thing (yet) as an automated gearshift in short read mapping. It is all like stick-shift driving in San Francisco. In other words = running this tool with default parameters will probably not give you meaningful results. A way to deal with this is to **understand** the parameters by carefully reading the `documentation`__ and experimenting. Fortunately, Galaxy makes experimenting easy.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
345
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
346 .. __: http://www.bioinformatics.babraham.ac.uk/projects/bismark/
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
347
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
348 ------
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
349
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
350 **Input formats**
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
351
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
352 Bismark accepts files in either Sanger FASTQ format (galaxy type *fastqsanger*), Illumina FASTQ format (galaxy type *fastqillumina*) or FASTA format (galaxy type *fasta*). Use the FASTQ Groomer to prepare your files.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
353
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
354 ------
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
355
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
356 **A Note on Built-in Reference Genomes**
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
357
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
358 The default variant for all genomes is "Full", defined as all primary chromosomes (or scaffolds/contigs) including mitochondrial plus associated unmapped, plasmid, and other segments. When only one version of a genome is available in this tool, it represents the default "Full" variant. Some genomes will have more than one variant available. The "Canonical Male" or sometimes simply "Canonical" variant contains the primary chromosomes for a genome. For example a human "Canonical" variant contains chr1-chr22, chrX, chrY, and chrM. The "Canonical Female" variant contains the primary chromosomes excluding chrY.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
359
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
360 ------
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
361
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
362 The final output of Bismark is in SAM format by default.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
363
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
364 **Outputs**
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
365
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
366 The output is in SAM format, and has the following columns::
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
367
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
368 Column Description
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
369 -------- --------------------------------------------------------
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
370 1 QNAME seq-ID
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
371 2 FLAG this flag tries to take the strand a bisulfite read
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
372 originated from into account
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
373 (this is different from ordinary DNA alignment flags!)
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
374 3 RNAME chromosome
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
375 4 POS start position
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
376 5 MAPQ always 255
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
377 6 CIGAR extended CIGAR string
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
378 7 MRNM Mate Reference sequence NaMe ('=' if same as RNAME)
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
379 8 MPOS 1-based Mate POSition
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
380 9 ISIZE Inferred insert SIZE
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
381 10 SEQ query SEQuence on the same strand as the reference
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
382 11 QUAL Phred33 scale
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
383 12 NM-tag edit distance to the reference)
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
384 13 XX-tag base-by-base mismatches to the reference.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
385 This does not include indels.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
386 14 XM-tag methylation call string
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
387 15 XR-tag read conversion state for the alignment
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
388 16 XG-tag genome conversion state for the alignment
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
389
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
390
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
391 Each read of paired-end alignments is written out in a separate line in the above format.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
392
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
393
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
394 It looks like this (scroll sideways to see the entire example)::
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
395
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
396 QNAME FLAG RNAME POS MAPQ CIAGR MRNM MPOS ISIZE SEQ QUAL OPT
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
397 HWI-EAS91_1_30788AAXX:1:1:1761:343 4 * 0 0 * * 0 0 AAAAAAANNAAAAAAAAAAAAAAAAAAAAAAAAAAACNNANNGAGTNGNNNNNNNGCTTCCCACAGNNCTGG hhhhhhh;;hhhhhhhhhhh^hOhhhhghhhfhhhgh;;h;;hhhh;h;;;;;;;hhhhhhghhhh;;Phhh
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
398 HWI-EAS91_1_30788AAXX:1:1:1578:331 4 * 0 0 * * 0 0 GTATAGANNAATAAGAAAAAAAAAAATGAAGACTTTCNNANNTCTGNANNNNNNNTCTTTTTTCAGNNGTAG hhhhhhh;;hhhhhhhhhhhhhhhhhhhhhhhhhhhh;;h;;hhhh;h;;;;;;;hhhhhhhhhhh;;hhVh
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
399
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
400 -------
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
401
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
402 **Bismark settings**
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
403
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
404 All of the options have a default value. You can change any of them. If any Bismark function is missing please contact the tool author or your Galaxy admin.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
405
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
406 ------
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
407
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
408 **Bismark parameter list**
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
409
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
410 This is an exhaustive list of Bismark options:
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
411
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
412 ------
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
413
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
414 **OPTIONS**
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
415
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
416
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
417 Input::
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
418
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
419 --singles A comma- or space-separated list of files containing the reads to be aligned (e.g.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
420 lane1.fq,lane2.fq lane3.fq). Reads may be a mix of different lengths. Bismark will
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
421 produce one mapping result and one report file per input file.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
422
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
423 -1 mates1 Comma-separated list of files containing the #1 mates (filename usually includes
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
424 "_1"), e.g. flyA_1.fq,flyB_1.fq). Sequences specified with this option must
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
425 correspond file-for-file and read-for-read with those specified in mates2.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
426 Reads may be a mix of different lengths. Bismark will produce one mapping result
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
427 and one report file per paired-end input file pair.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
428
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
429 -2 mates2 Comma-separated list of files containing the #2 mates (filename usually includes
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
430 "_2"), e.g. flyA_1.fq,flyB_1.fq). Sequences specified with this option must
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
431 correspond file-for-file and read-for-read with those specified in mates1.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
432 Reads may be a mix of different lengths.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
433
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
434 -q/--fastq The query input files (specified as mate1,mate2 or singles are FASTQ
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
435 files (usually having extension .fg or .fastq). This is the default. See also
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
436 --solexa-quals.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
437
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
438 -f/--fasta The query input files (specified as mate1,mate2 or singles are FASTA
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
439 files (usually havin extension .fa, .mfa, .fna or similar). All quality values
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
440 are assumed to be 40 on the Phred scale.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
441
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
442 -s/--skip INT Skip (i.e. do not align) the first INT reads or read pairs from the input.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
443
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
444 -u/--upto INT Only aligns the first INT reads or read pairs from the input. Default: no limit.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
445
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
446 --phred33-quals FASTQ qualities are ASCII chars equal to the Phred quality plus 33. Default: on.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
447
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
448 --phred64-quals FASTQ qualities are ASCII chars equal to the Phred quality plus 64. Default: off.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
449
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
450 --solexa-quals Convert FASTQ qualities from solexa-scaled (which can be negative) to phred-scaled
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
451 (which can't). The formula for conversion is:
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
452 phred-qual = 10 * log(1 + 10 ** (solexa-qual/10.0)) / log(10). Used with -q. This
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
453 is usually the right option for use with (unconverted) reads emitted by the GA
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
454 Pipeline versions prior to 1.3. Works only for Bowtie 1. Default: off.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
455
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
456 --solexa1.3-quals Same as --phred64-quals. This is usually the right option for use with (unconverted)
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
457 reads emitted by GA Pipeline version 1.3 or later. Default: off.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
458
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
459
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
460 Alignment::
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
461
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
462 -n/--seedmms INT The maximum number of mismatches permitted in the "seed", i.e. the first L base pairs
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
463 of the read (where L is set with -l/--seedlen). This may be 0, 1, 2 or 3 and the
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
464 default is 1. This option is only available for Bowtie 1 (for Bowtie 2 see -N).
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
465
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
466 -l/--seedlen The "seed length"; i.e., the number of bases of the high quality end of the read to
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
467 which the -n ceiling applies. The default is 28. Bowtie (and thus Bismark) is faster for
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
468 larger values of -l. This option is only available for Bowtie 1 (for Bowtie 2 see -L).
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
469
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
470 -e/--maqerr INT Maximum permitted total of quality values at all mismatched read positions throughout
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
471 the entire alignment, not just in the "seed". The default is 70. Like Maq, bowtie rounds
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
472 quality values to the nearest 10 and saturates at 30. This value is not relevant for
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
473 Bowtie 2.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
474
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
475 --chunkmbs INT The number of megabytes of memory a given thread is given to store path descriptors in
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
476 --best mode. Best-first search must keep track of many paths at once to ensure it is
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
477 always extending the path with the lowest cumulative cost. Bowtie tries to minimize the
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
478 memory impact of the descriptors, but they can still grow very large in some cases. If
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
479 you receive an error message saying that chunk memory has been exhausted in --best mode,
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
480 try adjusting this parameter up to dedicate more memory to the descriptors. This value
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
481 is not relevant for Bowtie 2. Default: 512.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
482
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
483 -I/--minins INT The minimum insert size for valid paired-end alignments. E.g. if -I 60 is specified and
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
484 a paired-end alignment consists of two 20-bp alignments in the appropriate orientation
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
485 with a 20-bp gap between them, that alignment is considered valid (as long as -X is also
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
486 satisfied). A 19-bp gap would not be valid in that case. Default: 0.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
487
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
488 -X/--maxins INT The maximum insert size for valid paired-end alignments. E.g. if -X 100 is specified and
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
489 a paired-end alignment consists of two 20-bp alignments in the proper orientation with a
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
490 60-bp gap between them, that alignment is considered valid (as long as -I is also satisfied).
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
491 A 61-bp gap would not be valid in that case. Default: 500.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
492
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
493
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
494
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
495 Output::
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
496
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
497 --non_directional The sequencing library was constructed in a non strand-specific manner, alignments to all four
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
498 bisulfite strands will be reported. Default: OFF.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
499
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
500 (The current Illumina protocol for BS-Seq is directional, in which case the strands complementary
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
501 to the original strands are merely theoretical and should not exist in reality. Specifying directional
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
502 alignments (which is the default) will only run 2 alignment threads to the original top (OT)
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
503 or bottom (OB) strands in parallel and report these alignments. This is the recommended option
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
504 for sprand-specific libraries).
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
505
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
506 --sam-no-hd Suppress SAM header lines (starting with @). This might be useful when very large input files are
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
507 split up into several smaller files to run concurrently and the output files are to be merged.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
508
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
509 --quiet Print nothing besides alignments.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
510
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
511 --vanilla Performs bisulfite mapping with Bowtie 1 and prints the 'old' output (as in Bismark 0.5.X) instead
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
512 of SAM format output.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
513
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
514 -un/--unmapped Write all reads that could not be aligned to a file in the output directory. Written reads will
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
515 appear as they did in the input, without any translation of quality values that may have
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
516 taken place within Bowtie or Bismark. Paired-end reads will be written to two parallel files with _1
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
517 and _2 inserted in their filenames, i.e. _unmapped_reads_1.txt and unmapped_reads_2.txt. Reads
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
518 with more than one valid alignment with the same number of lowest mismatches (ambiguous mapping)
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
519 are also written to _unmapped_reads.txt unless the option --ambiguous is specified as well.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
520
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
521 --ambiguous Write all reads which produce more than one valid alignment with the same number of lowest
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
522 mismatches or other reads that fail to align uniquely to a file in the output directory.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
523 Written reads will appear as they did in the input, without any of the translation of quality
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
524 values that may have taken place within Bowtie or Bismark. Paired-end reads will be written to two
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
525 parallel files with _1 and _2 inserted in theit filenames, i.e. _ambiguous_reads_1.txt and
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
526 _ambiguous_reads_2.txt. These reads are not written to the file specified with --un.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
527
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
528 -o/--output_dir DIR Write all output files into this directory. By default the output files will be written into
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
529 the same folder as the input file(s). If the specified folder does not exist, Bismark will attempt
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
530 to create it first. The path to the output folder can be either relative or absolute.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
531
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
532 --temp_dir DIR Write temporary files to this directory instead of into the same directory as the input files. If
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
533 the specified folder does not exist, Bismark will attempt to create it first. The path to the
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
534 temporary folder can be either relative or absolute.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
535
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
536 ------
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
537
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
538 Bowtie 2 alignment options::
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
539
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
540 -N INT Sets the number of mismatches to allowed in a seed alignment during multiseed alignment.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
541 Can be set to 0 or 1. Setting this higher makes alignment slower (often much slower)
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
542 but increases sensitivity. Default: 0. This option is only available for Bowtie 2 (for
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
543 Bowtie 1 see -n).
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
544
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
545 -L INT Sets the length of the seed substrings to align during multiseed alignment. Smaller values
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
546 make alignment slower but more senstive. Default: the --sensitive preset of Bowtie 2 is
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
547 used by default, which sets -L to 20. This option is only available for Bowtie 2 (for
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
548 Bowtie 1 see -l).
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
549
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
550 --ignore-quals When calculating a mismatch penalty, always consider the quality value at the mismatched
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
551 position to be the highest possible, regardless of the actual value. I.e. input is treated
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
552 as though all quality values are high. This is also the default behavior when the input
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
553 doesn't specify quality values (e.g. in -f mode). This option is invariable and on by default.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
554
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
555
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
556 Bowtie 2 paired-end options::
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
557
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
558 --no-mixed This option disables Bowtie 2's behavior to try to find alignments for the individual mates if
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
559 it cannot find a concordant or discordant alignment for a pair. This option is invariable and
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
560 and on by default.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
561
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
562 --no-discordant Normally, Bowtie 2 looks for discordant alignments if it cannot find any concordant alignments.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
563 A discordant alignment is an alignment where both mates align uniquely, but that does not
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
564 satisfy the paired-end constraints (--fr/--rf/--ff, -I, -X). This option disables that behavior
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
565 and it is on by default.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
566
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
567
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
568 Bowtie 2 effort options::
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
569
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
570 -D INT Up to INT consecutive seed extension attempts can "fail" before Bowtie 2 moves on, using
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
571 the alignments found so far. A seed extension "fails" if it does not yield a new best or a
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
572 new second-best alignment. Default: 15.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
573
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
574 -R INT INT is the maximum number of times Bowtie 2 will "re-seed" reads with repetitive seeds.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
575 When "re-seeding," Bowtie 2 simply chooses a new set of reads (same length, same number of
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
576 mismatches allowed) at different offsets and searches for more alignments. A read is considered
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
577 to have repetitive seeds if the total number of seed hits divided by the number of seeds
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
578 that aligned at least once is greater than 300. Default: 2.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
579
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
580
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
581 Bowtie 2 Scoring options::
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
582
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
583 --score_min "func" Sets a function governing the minimum alignment score needed for an alignment to be considered
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
584 "valid" (i.e. good enough to report). This is a function of read length. For instance, specifying
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
585 L,0,-0.2 sets the minimum-score function f to f(x) = 0 + -0.2 * x, where x is the read length.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
586 See also: setting function options at http://bowtie-bio.sourceforge.net/bowtie2. The default is
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
587 L,0,-0.2.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
588
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
589
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
590 Bowtie 2 Reporting options::
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
591
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
592 --most_valid_alignments INT This used to be the Bowtie 2 parameter -M. As of Bowtie 2 version 2.0.0 beta7 the option -M is
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
593 deprecated. It will be removed in subsequent versions. What used to be called -M mode is still the
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
594 default mode, but adjusting the -M setting is deprecated. Use the -D and -R options to adjust the
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
595 effort expended to find valid alignments.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
596
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
597 For reference, this used to be the old (now deprecated) description of -M:
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
598 Bowtie 2 searches for at most INT+1 distinct, valid alignments for each read. The search terminates when it
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
599 can't find more distinct valid alignments, or when it finds INT+1 distinct alignments, whichever
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
600 happens first. Only the best alignment is reported. Information from the other alignments is used to
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
601 estimate mapping quality and to set SAM optional fields, such as AS:i and XS:i. Increasing -M makes
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
602 Bowtie 2 slower, but increases the likelihood that it will pick the correct alignment for a read that
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
603 aligns many places. For reads that have more than INT+1 distinct, valid alignments, Bowtie 2 does not
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
604 guarantee that the alignment reported is the best possible in terms of alignment score. -M is
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
605 always used and its default value is set to 10.
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
606
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
607 </help>
550ce7d37d4b Uploaded
bgruening
parents:
diff changeset
608 </tool>