annotate fastq_screen.xml @ 2:81a0c1c27ec8 draft default tip

Uploaded
author iuc
date Fri, 16 May 2014 19:46:52 -0400
parents 3480daf4ed27
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
8a8adbf98ecc First upload
iuc
parents:
diff changeset
1 <tool id="fastq_screen" name="fastq_screen" version="0.4.2">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
2 <description>Screen for contamination</description>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
3 <requirements>
2
81a0c1c27ec8 Uploaded
iuc
parents: 1
diff changeset
4 <requirement type="package" version="2.1.0">bowtie2</requirement>
0
8a8adbf98ecc First upload
iuc
parents:
diff changeset
5 <requirement type="package" version="0.4.2">fastq_screen</requirement>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
6 </requirements>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
7 <command>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
8 fastq_screen --aligner="bowtie2" --outdir="." --conf="$fastqrunconf"
8a8adbf98ecc First upload
iuc
parents:
diff changeset
9 #if $sampN &gt; 0:
8a8adbf98ecc First upload
iuc
parents:
diff changeset
10 --subset "$sampN"
8a8adbf98ecc First upload
iuc
parents:
diff changeset
11 #end if
8a8adbf98ecc First upload
iuc
parents:
diff changeset
12 "$input1"
8a8adbf98ecc First upload
iuc
parents:
diff changeset
13 #if $singlePaired.sPaired == "paired":
8a8adbf98ecc First upload
iuc
parents:
diff changeset
14 "$input2"
8a8adbf98ecc First upload
iuc
parents:
diff changeset
15 #end if
8a8adbf98ecc First upload
iuc
parents:
diff changeset
16 ; mv *_screen.png ${outpng} ; mv *_screen.txt ${outtext}
8a8adbf98ecc First upload
iuc
parents:
diff changeset
17 </command>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
18
8a8adbf98ecc First upload
iuc
parents:
diff changeset
19 <stdio>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
20 <regex match=".*" source="both" level="warning" description="fastqc_screen perl script output"/>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
21 </stdio>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
22
8a8adbf98ecc First upload
iuc
parents:
diff changeset
23 <inputs>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
24 <param name="jobName" type="text" size="120" value="fastq_screen" label="Job narrative (included in output names as a reminder)"
8a8adbf98ecc First upload
iuc
parents:
diff changeset
25 help="Only letters, numbers and underscores _ will be retained in this field">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
26 <sanitizer invalid_char="">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
27 <valid initial="string.letters,string.digits"><add value="_" /> </valid>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
28 </sanitizer>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
29 </param>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
30 <param name="sampN" type="integer" size="20" value="500000" label="Sample this number of reads. Set to 0 or less to use all"
8a8adbf98ecc First upload
iuc
parents:
diff changeset
31 help="Time/precision trade off - fewer reads takes a little less time trading off precision of the estimates."/>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
32 <conditional name="singlePaired">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
33 <param name="sPaired" type="select" label="Single ended or mate-pair ended reads in this library?">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
34 <option value="single" selected="true">Single-end</option>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
35 <option value="paired">Paired-end</option>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
36 </param>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
37 <when value="single">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
38 <param format="fastqsanger,fastq" name="input1" type="data" label="RNA-Seq FASTQ file" help="Nucleotide-space: Must have Sanger-scaled quality values with ASCII offset 33"/>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
39 </when>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
40 <when value="paired">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
41 <param format="fastqsanger,fastq" name="input1" type="data" label="RNA-Seq FASTQ file, forward reads" help="Nucleotide-space: Must have Sanger-scaled quality values with ASCII offset 33" />
8a8adbf98ecc First upload
iuc
parents:
diff changeset
42 <param format="fastqsanger,fastq" name="input2" type="data" label="RNA-Seq FASTQ file, reverse reads" help="Nucleotide-space: Must have Sanger-scaled quality values with ASCII offset 33" />
8a8adbf98ecc First upload
iuc
parents:
diff changeset
43 </when>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
44 </conditional>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
45
8a8adbf98ecc First upload
iuc
parents:
diff changeset
46 <!-- Genome source. -->
8a8adbf98ecc First upload
iuc
parents:
diff changeset
47 <repeat name="refGenomes" title="Installed organism reference sequences to check for alignment to your fastq" min="1"
8a8adbf98ecc First upload
iuc
parents:
diff changeset
48 help="For checking cell culture sequence for contamination, Mycoplasma Genitalium might be a good choice eg">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
49 <param name="ref" type="select" label="Bowtie2 reference genome">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
50 <options from_data_table="bowtie2_indexes">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
51 <filter type="sort_by" column="3"/>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
52 <validator type="no_options" message="No indexes are available for bowtie2"/>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
53 </options>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
54 </param>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
55 </repeat>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
56 </inputs>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
57
8a8adbf98ecc First upload
iuc
parents:
diff changeset
58 <outputs>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
59 <data format="tabular" name="outtext" label="${jobName}.xls"/>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
60 <data format="png" name="outpng" label="${jobName}.png"/>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
61 </outputs>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
62 <configfiles>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
63 <configfile name="fastqrunconf">
8a8adbf98ecc First upload
iuc
parents:
diff changeset
64 ###### autogenerated by fastq_screen.xml for fastq_screen run
2
81a0c1c27ec8 Uploaded
iuc
parents: 1
diff changeset
65 BOWTIE2 bowtie2
0
8a8adbf98ecc First upload
iuc
parents:
diff changeset
66 #for $refs in $refGenomes:
8a8adbf98ecc First upload
iuc
parents:
diff changeset
67 DATABASE $refs.ref.fields.value $refs.ref.fields.path BOWTIE2
8a8adbf98ecc First upload
iuc
parents:
diff changeset
68 #end for
8a8adbf98ecc First upload
iuc
parents:
diff changeset
69 </configfile>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
70 </configfiles>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
71
8a8adbf98ecc First upload
iuc
parents:
diff changeset
72 <help>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
73
8a8adbf98ecc First upload
iuc
parents:
diff changeset
74 **What it does**
8a8adbf98ecc First upload
iuc
parents:
diff changeset
75 This is a Galaxy wrapper exposing software from Babraham -fastq_screen_
8a8adbf98ecc First upload
iuc
parents:
diff changeset
76 Designed to search sequence data in fastq files for matches to contaminants or to check the likely
8a8adbf98ecc First upload
iuc
parents:
diff changeset
77 species.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
78 In QC checking, you can use it to look for (eg) sequence from contaminating mycoplasmae in cell cultures - it may be non-differential but it will be pro-inflammatory and, well, less than ideal.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
79
8a8adbf98ecc First upload
iuc
parents:
diff changeset
80 Here's the help from the perl script used by this wrapper:
8a8adbf98ecc First upload
iuc
parents:
diff changeset
81
8a8adbf98ecc First upload
iuc
parents:
diff changeset
82 Fastq Screen - Screen sequences against a panel of databases
8a8adbf98ecc First upload
iuc
parents:
diff changeset
83
8a8adbf98ecc First upload
iuc
parents:
diff changeset
84 Synopsis
8a8adbf98ecc First upload
iuc
parents:
diff changeset
85
8a8adbf98ecc First upload
iuc
parents:
diff changeset
86 fastq_screen [OPTION]... [FastQ FILE]...
8a8adbf98ecc First upload
iuc
parents:
diff changeset
87
8a8adbf98ecc First upload
iuc
parents:
diff changeset
88 Function
8a8adbf98ecc First upload
iuc
parents:
diff changeset
89
8a8adbf98ecc First upload
iuc
parents:
diff changeset
90 Fastq Screen is intended to be used as part of a QC pipeline.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
91 It allows you to take a sequence dataset and search it
8a8adbf98ecc First upload
iuc
parents:
diff changeset
92 against a set of bowtie databases. It will then generate
8a8adbf98ecc First upload
iuc
parents:
diff changeset
93 both a text and a graphical summary of the results to see if
8a8adbf98ecc First upload
iuc
parents:
diff changeset
94 the sequence dataset contains the kind of sequences you expect
8a8adbf98ecc First upload
iuc
parents:
diff changeset
95 or not.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
96
8a8adbf98ecc First upload
iuc
parents:
diff changeset
97 Options
8a8adbf98ecc First upload
iuc
parents:
diff changeset
98
8a8adbf98ecc First upload
iuc
parents:
diff changeset
99 --help -h Print program help and exit
8a8adbf98ecc First upload
iuc
parents:
diff changeset
100
8a8adbf98ecc First upload
iuc
parents:
diff changeset
101 --subset Don't use the whole sequence file to search, but
8a8adbf98ecc First upload
iuc
parents:
diff changeset
102 create a temporary dataset of this size. The
8a8adbf98ecc First upload
iuc
parents:
diff changeset
103 dataset created will be of approximately (within
8a8adbf98ecc First upload
iuc
parents:
diff changeset
104 a factor of 2) of this size. If the real dataset
8a8adbf98ecc First upload
iuc
parents:
diff changeset
105 is smaller than twice the specified size then the
8a8adbf98ecc First upload
iuc
parents:
diff changeset
106 whole dataset will be used. Subsets will be taken
8a8adbf98ecc First upload
iuc
parents:
diff changeset
107 evenly from throughout the whole original dataset
8a8adbf98ecc First upload
iuc
parents:
diff changeset
108
8a8adbf98ecc First upload
iuc
parents:
diff changeset
109 --paired Files are paired end. Files must be specified in
8a8adbf98ecc First upload
iuc
parents:
diff changeset
110 the correct order with pairs of files coming
8a8adbf98ecc First upload
iuc
parents:
diff changeset
111 immediately after one another. Results files will
8a8adbf98ecc First upload
iuc
parents:
diff changeset
112 be named after the first file in the pair if the
8a8adbf98ecc First upload
iuc
parents:
diff changeset
113 names differ between the two files.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
114
8a8adbf98ecc First upload
iuc
parents:
diff changeset
115 --outdir Specify a directory in which to save output files.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
116 If no directory is specified then output files
8a8adbf98ecc First upload
iuc
parents:
diff changeset
117 are saved into the same directory as the input
8a8adbf98ecc First upload
iuc
parents:
diff changeset
118 file.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
119
8a8adbf98ecc First upload
iuc
parents:
diff changeset
120 --illumina1_3 Assume that the quality values are in encoded in
8a8adbf98ecc First upload
iuc
parents:
diff changeset
121 Illumina v1.3 format. Defaults to Sanger format
8a8adbf98ecc First upload
iuc
parents:
diff changeset
122 if this flag is not specified
8a8adbf98ecc First upload
iuc
parents:
diff changeset
123
8a8adbf98ecc First upload
iuc
parents:
diff changeset
124 --quiet Supress all progress reports on stderr and only
8a8adbf98ecc First upload
iuc
parents:
diff changeset
125 report errors
8a8adbf98ecc First upload
iuc
parents:
diff changeset
126
8a8adbf98ecc First upload
iuc
parents:
diff changeset
127 --version Print the program version and exit
8a8adbf98ecc First upload
iuc
parents:
diff changeset
128
8a8adbf98ecc First upload
iuc
parents:
diff changeset
129 --threads Specify across how many threads bowtie will be
8a8adbf98ecc First upload
iuc
parents:
diff changeset
130 allowed to run. Overrides the default value set
8a8adbf98ecc First upload
iuc
parents:
diff changeset
131 in the conf file
8a8adbf98ecc First upload
iuc
parents:
diff changeset
132
8a8adbf98ecc First upload
iuc
parents:
diff changeset
133 --conf Manually specify a location for the configuration
8a8adbf98ecc First upload
iuc
parents:
diff changeset
134 file to be used for this run. If not specified
8a8adbf98ecc First upload
iuc
parents:
diff changeset
135 then the file will be taken from the same directory
8a8adbf98ecc First upload
iuc
parents:
diff changeset
136 as the fastq_screen program
8a8adbf98ecc First upload
iuc
parents:
diff changeset
137
8a8adbf98ecc First upload
iuc
parents:
diff changeset
138 --color FastQ files are in colorspace. This requires that
8a8adbf98ecc First upload
iuc
parents:
diff changeset
139 the libraries configures in the config file are
8a8adbf98ecc First upload
iuc
parents:
diff changeset
140 colorspace indices.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
141
8a8adbf98ecc First upload
iuc
parents:
diff changeset
142 --bowtie Specify extra parameters to be passed to bowtie.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
143 These parameters should be quoted to clearly
8a8adbf98ecc First upload
iuc
parents:
diff changeset
144 delimit bowtie parameters from fastq_screen
8a8adbf98ecc First upload
iuc
parents:
diff changeset
145 parameters. You should not try to use this option
8a8adbf98ecc First upload
iuc
parents:
diff changeset
146 to override the normal search or reporting options
8a8adbf98ecc First upload
iuc
parents:
diff changeset
147 for bowtie which are set automatically but it might
8a8adbf98ecc First upload
iuc
parents:
diff changeset
148 be useful to allow reads to be trimmed before
8a8adbf98ecc First upload
iuc
parents:
diff changeset
149 alignment etc.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
150
8a8adbf98ecc First upload
iuc
parents:
diff changeset
151 --bowtie2 Specify extra parameters to be passed to bowtie 2.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
152 These parameters should be quoted to clearly
8a8adbf98ecc First upload
iuc
parents:
diff changeset
153 delimit bowtie2 parameters from fastq_screen
8a8adbf98ecc First upload
iuc
parents:
diff changeset
154 parameters. You should not try to use this option
8a8adbf98ecc First upload
iuc
parents:
diff changeset
155 to override the normal search or reporting options
8a8adbf98ecc First upload
iuc
parents:
diff changeset
156 for bowtie which are set automatically but it might
8a8adbf98ecc First upload
iuc
parents:
diff changeset
157 be useful to allow reads to be trimmed before
8a8adbf98ecc First upload
iuc
parents:
diff changeset
158 alignment etc.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
159
8a8adbf98ecc First upload
iuc
parents:
diff changeset
160 --nohits Writes to a file the sequences that did not map to
8a8adbf98ecc First upload
iuc
parents:
diff changeset
161 any of the specified genome libraries. If the
8a8adbf98ecc First upload
iuc
parents:
diff changeset
162 subset option is also specified, only reads from
8a8adbf98ecc First upload
iuc
parents:
diff changeset
163 the temporary dataset that failed to align to the
8a8adbf98ecc First upload
iuc
parents:
diff changeset
164 reference genomes will be written to the output file.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
165
8a8adbf98ecc First upload
iuc
parents:
diff changeset
166 --aligner Specify the aligner to use for the mapping. Valid
8a8adbf98ecc First upload
iuc
parents:
diff changeset
167 arguments are 'bowtie' or 'bowtie2'.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
168
8a8adbf98ecc First upload
iuc
parents:
diff changeset
169
8a8adbf98ecc First upload
iuc
parents:
diff changeset
170 **Attributions**
8a8adbf98ecc First upload
iuc
parents:
diff changeset
171
8a8adbf98ecc First upload
iuc
parents:
diff changeset
172 Note that each component has its own license.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
173 Good luck with figuring out your obligations.
8a8adbf98ecc First upload
iuc
parents:
diff changeset
174
8a8adbf98ecc First upload
iuc
parents:
diff changeset
175 fastq_screen - see the web site at Fastq_screen_
8a8adbf98ecc First upload
iuc
parents:
diff changeset
176
8a8adbf98ecc First upload
iuc
parents:
diff changeset
177 Galaxy_ (that's what you are using right now!) for gluing everything together
8a8adbf98ecc First upload
iuc
parents:
diff changeset
178
8a8adbf98ecc First upload
iuc
parents:
diff changeset
179
8a8adbf98ecc First upload
iuc
parents:
diff changeset
180 Code and documentation comprising this tool was written by Ross Lazarus and that part is Licensed_ the same way as other rgenetics artefacts
8a8adbf98ecc First upload
iuc
parents:
diff changeset
181
8a8adbf98ecc First upload
iuc
parents:
diff changeset
182 .. _Fastq_screen: http://www.bioinformatics.babraham.ac.uk/projects/fastq_screen
8a8adbf98ecc First upload
iuc
parents:
diff changeset
183
8a8adbf98ecc First upload
iuc
parents:
diff changeset
184 .. _Galaxy: http://getgalaxy.org
8a8adbf98ecc First upload
iuc
parents:
diff changeset
185
8a8adbf98ecc First upload
iuc
parents:
diff changeset
186 .. _Licensed: https://www.gnu.org/licenses/lgpl.html
8a8adbf98ecc First upload
iuc
parents:
diff changeset
187
8a8adbf98ecc First upload
iuc
parents:
diff changeset
188 </help>
8a8adbf98ecc First upload
iuc
parents:
diff changeset
189 </tool>