annotate trimmomatic.xml @ 14:cb56fdcbe0a5 draft default tip

Uploaded
author simon-gladman
date Thu, 10 Jul 2014 14:38:53 -0400
parents 476184b9b2f7
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
1 <tool id="trimmomatic" name="Trimmomatic" version="1.1.0">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
2
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
3 <description>Trim adapters and otherwise cleanup fastq files in a pair aware manner using trimmomatic 0.32</description>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
4 <requirements>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
5 <requirement type="set_environment">JAR_PATH</requirement>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
6 </requirements>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
7
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
8 <command interpreter="perl">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
9 trimmomatic_wrapper.pl
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
10 paired ${paired.is_paired}
13
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
11 #if $paired.is_paired == "single":
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
12 fwdfile ${paired.forwards_file}
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
13 #end if
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
14 #if $paired.is_paired == "paired":
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
15 fwdfile ${paired.forwards_file}
1
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
16 revfile ${paired.reverse_file}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
17 #end if
13
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
18 #if $paired.is_paired == "collection":
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
19 fwdfile ${paired.collection_data.forward}
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
20 revfile ${paired.collection_data.reverse}
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
21 #end if
1
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
22 phred $phred
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
23 cutadapt ${adapt.adapters}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
24 #if $adapt.adapters:
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
25 adaptfile ${adapt.adapt_file}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
26 adaptseed ${adapt.adapt_seed}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
27 adaptpalindrome ${adapt.adapt_palindrome}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
28 adaptsimple ${adapt.adapt_simple}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
29 #end if
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
30 slidingwindow ${sliding.slidingwindow}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
31 #if $sliding.slidingwindow:
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
32 slidingsize ${sliding.slid_window}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
33 slidingqual ${sliding.slid_qual}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
34 #end if
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
35 trimleading ${leading.trimleading}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
36 #if $leading.trimleading:
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
37 leadingqual ${leading.lead_qual}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
38 #end if
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
39 trimtrailing ${trailing.trimtrailing}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
40 #if $trailing.trimtrailing:
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
41 trailingqual ${trailing.trail_qual}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
42 #end if
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
43 crop ${crop.cropend}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
44 #if $crop.cropend:
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
45 croplen ${crop.crop_len}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
46 #end if
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
47 headcrop ${headcrop.headcrop_s}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
48 #if $headcrop.headcrop_s:
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
49 headcroplen ${headcrop.headcrop_len}
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
50 #end if
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
51 minlen $minlen
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
52 log $log
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
53 #if $log == "True":
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
54 logfile $logfile
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
55 #end if
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
56 singles $singles
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
57 #if $paired.is_paired:
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
58 fwdpairs $fwdpairs
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
59 revpairs $revpairs
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
60 #end if
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
61 tool-dir \$JAR_PATH
4
e131e21fce1f Uploaded
simon-gladman
parents: 1
diff changeset
62 threads \${GALAXY_SLOTS:-4}
1
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
63 > $dummy_out
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
64 </command>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
65
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
66 <inputs>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
67
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
68 <conditional name="paired">
13
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
69 <!-- <param name="is_paired" type="boolean" checked="true" truevalue="paired" falsevalue="single" label="Paired end reads?" help="Do you have 2 separate paired end read files?"/> -->
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
70 <param name="is_paired" type="select" label="Read type selector" help="single file (not pair aware), two files (paired reads) or a dataset collection of pairs">
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
71 <option value="single" selected="true">Single File</option>
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
72 <option value="paired">Two Files</option>
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
73 <option value="collection">Single dataset collection pair</option>
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
74 </param>
1
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
75 <when value="paired">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
76 <param name="forwards_file" type="data" format="fastq,fastqsanger,fastqsolexa,fastqillumina" label="Direction 1 fastq reads to trim"/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
77 <param name="reverse_file" type="data" format="fastq,fastqsanger,fastqsolexa,fastqillumina" label="Direction 2 fastq reads to trim"/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
78 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
79 <when value="single">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
80 <param name="forwards_file" type="data" format="fastq,fastqsanger,fastqsolexa,fastqillumina" label="Fastq reads to trim"/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
81 </when>
13
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
82 <when value="collection">
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
83 <param name="collection_data" type="data_collection" format="fastq,fastqsanger,fastqsolexa,fastqillumina" label="Paired end dataset collection" collection_type="paired"/>
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
84 </when>
1
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
85 </conditional>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
86 <param name="phred" type="select" label="Quality encoding." help="Phred33 or Phred 64, probably Phred64">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
87 <option value="phred64">phred64</option>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
88 <option value="phred33" selected="True">phred33</option>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
89 </param>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
90
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
91 <conditional name="adapt">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
92 <param name="adapters" type="boolean" checked="false" falsevalue="False" truevalue="True" label="Clip Illumina adapters?" help="Cut adapter and other illumina-specific sequences from the read."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
93 <when value="True">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
94 <param name="adapt_file" type="data" format="fasta" label="Fasta of adapters to clip" help="Please supply a list of adapters to clip"/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
95 <param name="adapt_seed" type="integer" value="2" label="Seed mismatches" help="Specifies the maximum mismatch count which will still allow a full match to be performed."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
96 <param name="adapt_palindrome" type="integer" value="40" label="Palindrome clip threshold" help="Specifies how accurate the match between the two 'adapter ligated' reads must be for PE palindrome read alignment."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
97 <param name="adapt_simple" type="integer" value="15" label="Simple clip threshold" help="Specifies how accurate the match between any adapter etc. sequence must be against a read."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
98 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
99 <when value="False">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
100 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
101 </conditional>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
102
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
103 <conditional name="sliding">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
104 <param name="slidingwindow" type="boolean" checked="true" falsevalue="False" truevalue="True" label="Perform Sliding Window trimming?" help="Perform a sliding window trimming, cutting once the average quality within the window falls below a threshold."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
105 <when value="True">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
106 <param name="slid_window" type="integer" value="4" label="Sliding window size" help="Specifies the number of bases to average across"/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
107 <param name="slid_qual" type="integer" value="15" label="Average quality required" help="Specifies the average quality required."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
108 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
109 <when value="false">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
110 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
111 </conditional>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
112
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
113 <conditional name="leading">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
114 <param name="trimleading" type="boolean" checked="true" falsevalue="False" truevalue="True" label="Trim leading bases?" help="Cut bases off the start of a read, if below a threshold quality."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
115 <when value="True">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
116 <param name="lead_qual" type="integer" value="3" label="Minimum quality" help="Specifies the minimum quality required to keep a base."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
117 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
118 <when value="false">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
119 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
120 </conditional>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
121
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
122 <conditional name="trailing">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
123 <param name="trimtrailing" type="boolean" checked="true" falsevalue="False" truevalue="True" label="Trim trailing bases?" help="Cut bases off the end of a read, if below a threshold quality."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
124 <when value="True">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
125 <param name="trail_qual" type="integer" value="3" label="Minimum quality" help="Specifies the minimum quality required to keep a base."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
126 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
127 <when value="false">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
128 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
129 </conditional>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
130
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
131 <conditional name="crop">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
132 <param name="cropend" type="boolean" checked="false" falsevalue="False" truevalue="True" label="Crop reads?" help="Cut the read to a specified length."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
133 <when value="True">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
134 <param name="crop_len" type="integer" value="0" label="Number of bases" help="The number of bases to keep, from the start of the read."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
135 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
136 <when value="false">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
137 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
138 </conditional>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
139
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
140 <conditional name="headcrop">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
141 <param name="headcrop_s" type="boolean" checked="false" falsevalue="False" truevalue="True" label="Crop starts?" help="Cut the specified number of bases from the start of the read."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
142 <when value="True">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
143 <param name="headcrop_len" type="integer" value="0" label="Number of bases" help="The number of bases to remove from the start of the read."/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
144 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
145 <when value="false">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
146 </when>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
147 </conditional>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
148
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
149 <param name="minlen" type="integer" value="24" label="Minimum length read" help="Drop the read if it is below specified length"/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
150
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
151 <param name="logfile" type="boolean" checked="false" falsevalue="False" truevalue="True" label="Turn on log?" help="Detailed log of trims on each read. (Very large file!)"/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
152 </inputs>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
153
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
154 <outputs>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
155 <data name="log" format="tabular" label="${tool.name} on ${on_string}: Trimmomatic Log" hidden="True">
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
156 </data>
13
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
157 <data name="fwdpairs" format="input" label="${tool.name} on ${on_string}: Dir1 trimmed pairs">
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
158 <filter>(paired['is_paired']=="single")</filter>
1
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
159 </data>
13
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
160 <data name="revpairs" format="input" label="${tool.name} on ${on_string}: Dir2 trimmed pairs">
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
161 <filter>(paired['is_paired'] == "paired" or paired['is_paired'] == "collection")</filter>
1
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
162 </data>
13
476184b9b2f7 Uploaded
simon-gladman
parents: 11
diff changeset
163 <data name="singles" format="input" label="${tool.name} on ${on_string}: trimmed reads"/>
1
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
164 <data name="dummy_out" format="tabular" label="${tool.name} on ${on_string}: DEBUG OUTPUT" hidden="True"/>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
165 </outputs>
5
afc124ad65f0 Uploaded
simon-gladman
parents: 4
diff changeset
166
afc124ad65f0 Uploaded
simon-gladman
parents: 4
diff changeset
167 <stdio>
afc124ad65f0 Uploaded
simon-gladman
parents: 4
diff changeset
168 <exit_code range="1:" level="fatal" description="Trimmomatic error" />
afc124ad65f0 Uploaded
simon-gladman
parents: 4
diff changeset
169 </stdio>
1
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
170 <help>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
171 ***Trimmomatic***
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
172
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
173 A flexible read trimming tool for Illumina NGS data
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
174
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
175
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
176
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
177 Trimmomatic performs a variety of useful trimming tasks for illumina paired-end and single ended data.The selection of trimming steps and their associated parameters are supplied on the command line.
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
178
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
179 The current trimming steps are:
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
180
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
181 ILLUMINACLIP: Cut adapter and other illumina-specific sequences from the read.
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
182
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
183 SLIDINGWINDOW: Perform a sliding window trimming, cutting once the average quality within the window falls below a threshold.
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
184
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
185 LEADING: Cut bases off the start of a read, if below a threshold quality
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
186
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
187 TRAILING: Cut bases off the end of a read, if below a threshold quality
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
188
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
189 CROP: Cut the read to a specified length
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
190
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
191 HEADCROP: Cut the specified number of bases from the start of the read
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
192
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
193 MINLEN: Drop the read if it is below a specified length
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
194
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
195 **The Adapter Fasta**
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
196
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
197 Illumina adapter and other technical sequences are copyrighted by Illumina, which makes it illegal for us to make them available without a licence. As such, you need to get access to the illumina sequences from another source, and create an appropriate adapter FASTA.
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
198
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
199 To make this fasta, you must first understand how it will be used. Trimmomatic uses two strategies for adapter trimming: Palindrome and Simple
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
200
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
201 With 'simple' trimming, each adapter sequence is tested against the reads, and if a sufficiently accurate match is detected, the read is clipped appropriately.
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
202
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
203 'Palindrome' trimming is specifically designed for the case of 'reading through' a short fragment into the adapter sequence on the other end. In this approach, the appropriate adapter sequences are 'in silico ligated' onto the start of the reads, and the combined adapter+read sequences, forward and reverse are aligned. If they align in a manner which indicates 'read-through', the forward read is clipped and the reverse read dropped (since it contains no new data).
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
204
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
205 Naming of the sequences indicates how they should be used. For 'Palindrome' clipping, the sequence names should both start with 'Prefix', and end in '/1' for the forward adapter and '/2' for the reverse adapter.All other sequences are checked using 'simple' mode. Sequences with names ending in '/1' or '/2' will be checked only against the forward or reverse read. All other sequences will be checked against both the forward and reverse read. If you want to check for the reverse-complement of a specific sequence, you need to specifically include the reverse-complemented form of the sequence as well, with another name.
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
206
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
207 The thresholds used are a simplified log-likelihood approach. Each matching base adds just over 0.6, while each mismatch reduces the alignment score by Q/10. Therefore, a perfect match of a 20 base sequence will score just over 12, while 25 bases are needed to score 15. As such we recommend values between 12 - 15 for this parameter. For palindromic matches, the entire read sequence plus (partial) adapter sequences can be used - therefore this threshold can be higher, in the range of 30-40. The 'seed mismatch' parameter is used to make alignments more efficient, specifying the maximum base mismatch count in the 'seed' (16 bases). Typical values here are 1 or 2.
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
208
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
209 **Citation**
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
210
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
211 Lohse M, Bolger AM, Nagel A, Fernie AR, Lunn JE, Stitt M, Usadel B. RobiNA: a
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
212 user-friendly, integrated software solution for RNA-Seq-based transcriptomics.
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
213 Nucleic Acids Res. 2012 Jul;40(Web Server issue):W622-7.
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
214
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
215
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
216
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
217 **Contacts**
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
218
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
219 Anthony Bolger bolger at mpimp-golm dot mpg dot de
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
220
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
221 Federico M. Giorgi federico dot giorgi at gmail dot com
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
222
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
223 Wrapped for Galaxy by:
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
224
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
225 Simon Gladman (VBC/VLSCI) simon dot gladman at monash dot edu
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
226 </help>
6a5c492f34e4 Uploaded
simon-gladman
parents:
diff changeset
227 </tool>