annotate rgFastQC.xml @ 10:1f6fd7a898bd draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit 4b383d48868d7f3f6d35f242a0ee35953adcb037
author iuc
date Mon, 15 May 2017 08:34:27 -0400
parents 0a7c65540937
children f5a25a56ab9d
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
9
0a7c65540937 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit 168f7aeb0f9f38de6dec873f3cbf0c30014fdd72
iuc
parents: 8
diff changeset
1 <tool id="fastqc" name="FastQC" version="0.68">
3
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
2 <description>Read Quality reports</description>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
3 <requirements>
6
e8c90ad3cbf9 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit df4c0b0c6372e2984966e220fa42ecd8a3d370e8
devteam
parents: 5
diff changeset
4 <requirement type="package" version="0.11.5">fastqc</requirement>
3
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
5 </requirements>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
6 <stdio>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
7 <exit_code range="1:" />
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
8 <exit_code range=":-1" />
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
9 <regex match="Error:" />
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
10 <regex match="Exception:" />
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
11 </stdio>
6
e8c90ad3cbf9 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit df4c0b0c6372e2984966e220fa42ecd8a3d370e8
devteam
parents: 5
diff changeset
12 <command><![CDATA[
8
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
13 python '${__tool_directory__}/rgFastQC.py'
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
14 -i '$input_file'
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
15 -d '${html_file.files_path}'
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
16 -o '$html_file'
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
17 -t '$text_file'
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
18 -f '${input_file.ext}'
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
19 -j '${input_file.name}'
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
20 #if $contaminants.dataset and str($contaminants) > ''
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
21 -c '$contaminants'
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
22 #end if
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
23 #if $limits.dataset and str($limits) > ''
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
24 -l '$limits'
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
25 #end if
6
e8c90ad3cbf9 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit df4c0b0c6372e2984966e220fa42ecd8a3d370e8
devteam
parents: 5
diff changeset
26 ]]></command>
3
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
27 <inputs>
10
1f6fd7a898bd planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit 4b383d48868d7f3f6d35f242a0ee35953adcb037
iuc
parents: 9
diff changeset
28 <param format="fastq,fastq.gz,fastq.bz2,bam,sam" name="input_file" type="data"
1f6fd7a898bd planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit 4b383d48868d7f3f6d35f242a0ee35953adcb037
iuc
parents: 9
diff changeset
29 label="Short read data from your current history" />
6
e8c90ad3cbf9 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit df4c0b0c6372e2984966e220fa42ecd8a3d370e8
devteam
parents: 5
diff changeset
30 <param name="contaminants" type="data" format="tabular" optional="true" label="Contaminant list"
8
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
31 help="tab delimited file with 2 columns: name and sequence. For example: Illumina Small RNA RT Primer CAAGCAGAAGACGGCATACGA" />
3
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
32 <param name="limits" type="data" format="txt" optional="true" label="Submodule and Limit specifying file"
8
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
33 help="a file that specifies which submodules are to be executed (default=all) and also specifies the thresholds for each submodule's warning parameter" />
3
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
34 </inputs>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
35 <outputs>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
36 <data format="html" name="html_file" label="${tool.name} on ${on_string}: Webpage" />
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
37 <data format="txt" name="text_file" label="${tool.name} on ${on_string}: RawData" />
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
38 </outputs>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
39 <tests>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
40 <test>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
41 <param name="input_file" value="1000gsample.fastq" />
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
42 <param name="contaminants" value="fastqc_contaminants.txt" ftype="tabular" />
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
43 <output name="html_file" file="fastqc_report.html" ftype="html" lines_diff="100"/>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
44 <output name="text_file" file="fastqc_data.txt" ftype="txt" lines_diff="100"/>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
45 </test>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
46 <test>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
47 <param name="input_file" value="1000gsample.fastq" />
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
48 <param name="limits" value="fastqc_customlimits.txt" ftype="txt" />
6
e8c90ad3cbf9 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit df4c0b0c6372e2984966e220fa42ecd8a3d370e8
devteam
parents: 5
diff changeset
49 <output name="html_file" file="fastqc_report2.html" ftype="html" compare="sim_size" delta="4096"/>
e8c90ad3cbf9 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit df4c0b0c6372e2984966e220fa42ecd8a3d370e8
devteam
parents: 5
diff changeset
50 <output name="text_file" file="fastqc_data2.txt" ftype="txt" compare="sim_size"/>
3
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
51 </test>
7
ec73b7c83b2c planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit 8918618a5ef7bdca55a31cd919efa593044a376e
devteam
parents: 6
diff changeset
52 <test>
8
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
53 <param name="input_file" value="1000gsample.fastq.gz" ftype="fastq.gz" />
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
54 <param name="contaminants" value="fastqc_contaminants.txt" ftype="tabular" />
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
55 <output name="html_file" file="fastqc_report.html" ftype="html" lines_diff="100"/>
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
56 <output name="text_file" file="fastqc_data.txt" ftype="txt" lines_diff="100"/>
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
57 </test>
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
58 <test>
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
59 <param name="input_file" value="1000gsample.fastq.bz2" ftype="fastq.bz2" />
7
ec73b7c83b2c planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit 8918618a5ef7bdca55a31cd919efa593044a376e
devteam
parents: 6
diff changeset
60 <param name="contaminants" value="fastqc_contaminants.txt" ftype="tabular" />
ec73b7c83b2c planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit 8918618a5ef7bdca55a31cd919efa593044a376e
devteam
parents: 6
diff changeset
61 <output name="html_file" file="fastqc_report.html" ftype="html" lines_diff="100"/>
ec73b7c83b2c planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit 8918618a5ef7bdca55a31cd919efa593044a376e
devteam
parents: 6
diff changeset
62 <output name="text_file" file="fastqc_data.txt" ftype="txt" lines_diff="100"/>
ec73b7c83b2c planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit 8918618a5ef7bdca55a31cd919efa593044a376e
devteam
parents: 6
diff changeset
63 </test>
3
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
64 </tests>
36980a78cc83 Uploaded
devteam
parents: 2
diff changeset
65 <help>
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
66 .. class:: infomark
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
67
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
68 **Purpose**
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
69
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
70 FastQC aims to provide a simple way to do some quality control checks on raw
6
e8c90ad3cbf9 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit df4c0b0c6372e2984966e220fa42ecd8a3d370e8
devteam
parents: 5
diff changeset
71 sequence data coming from high throughput sequencing pipelines.
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
72 It provides a modular set of analyses which you can use to give a quick
6
e8c90ad3cbf9 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit df4c0b0c6372e2984966e220fa42ecd8a3d370e8
devteam
parents: 5
diff changeset
73 impression of whether your data has any problems of
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
74 which you should be aware before doing any further analysis.
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
75
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
76 The main functions of FastQC are:
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
77
8
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
78 - Import of data from BAM, SAM or FastQ/FastQ.gz/FastQ.bz2 files (any variant)
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
79 - Providing a quick overview to tell you in which areas there may be problems
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
80 - Summary graphs and tables to quickly assess your data
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
81 - Export of results to an HTML based permanent report
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
82 - Offline operation to allow automated generation of reports without running the interactive application
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
83
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
84 -----
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
85
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
86 .. class:: infomark
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
87
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
88 **FastQC**
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
89
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
90 This is a Galaxy wrapper. It merely exposes the external package FastQC_, which is documented at the FastQC_ website.
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
91 Kindly acknowledge it as well as this tool if you use it.
10
1f6fd7a898bd planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit 4b383d48868d7f3f6d35f242a0ee35953adcb037
iuc
parents: 9
diff changeset
92 FastQC incorporates the Picard-tools_ libraries for SAM/BAM processing.
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
93
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
94 The contaminants file parameter was borrowed from the independently developed
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
95 fastqcwrapper contributed to the Galaxy Community Tool Shed by J. Johnson.
1
67355741fbc3 Uploaded from GH
devteam
parents: 0
diff changeset
96 Adaptation to version 0.11.2 by T. McGowan.
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
97
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
98 -----
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
99
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
100 .. class:: infomark
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
101
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
102 **Inputs and outputs**
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
103
6
e8c90ad3cbf9 planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit df4c0b0c6372e2984966e220fa42ecd8a3d370e8
devteam
parents: 5
diff changeset
104 FastQC_ is the best place to look for documentation - it's very good.
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
105 A summary follows below for those in a tearing hurry.
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
106
7
ec73b7c83b2c planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/fastqc commit 8918618a5ef7bdca55a31cd919efa593044a376e
devteam
parents: 6
diff changeset
107 This wrapper will accept a Galaxy fastq, fastq.gz, fastq.bz2, sam or bam as the input read file to check.
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
108 It will also take an optional file containing a list of contaminants information, in the form of
1
67355741fbc3 Uploaded from GH
devteam
parents: 0
diff changeset
109 a tab-delimited file with 2 columns, name and sequence. As another option the tool takes a custom
67355741fbc3 Uploaded from GH
devteam
parents: 0
diff changeset
110 limits.txt file that allows setting the warning thresholds for the different modules and also specifies
67355741fbc3 Uploaded from GH
devteam
parents: 0
diff changeset
111 which modules to include in the output.
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
112
1
67355741fbc3 Uploaded from GH
devteam
parents: 0
diff changeset
113 The tool produces a basic text file and an HTML output file that contain all of the results, including the following:
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
114
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
115 - Basic Statistics
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
116 - Per base sequence quality
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
117 - Per sequence quality scores
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
118 - Per base sequence content
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
119 - Per base GC content
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
120 - Per sequence GC content
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
121 - Per base N content
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
122 - Sequence Length Distribution
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
123 - Sequence Duplication Levels
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
124 - Overrepresented sequences
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
125 - Kmer Content
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
126
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
127 All except Basic Statistics and Overrepresented sequences are plots.
9
0a7c65540937 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit 168f7aeb0f9f38de6dec873f3cbf0c30014fdd72
iuc
parents: 8
diff changeset
128 .. _FastQC: http://www.bioinformatics.babraham.ac.uk/projects/fastqc/
10
1f6fd7a898bd planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit 4b383d48868d7f3f6d35f242a0ee35953adcb037
iuc
parents: 9
diff changeset
129 .. _Picard-tools: https://broadinstitute.github.io/picard/
2
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
130 </help>
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
131 <citations>
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
132 <citation type="bibtex">
8
5b995cef2fbb planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastqc commit bff04a5409662a8968c50501487042a3a0c93702
iuc
parents: 7
diff changeset
133 @unpublished{andrews_s,
2
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
134 author = {Andrews, S.},
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
135 keywords = {bioinformatics, ngs, qc},
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
136 priority = {2},
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
137 title = {{FastQC A Quality Control tool for High Throughput Sequence Data}},
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
138 url = {http://www.bioinformatics.babraham.ac.uk/projects/fastqc/}
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
139 }
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
140 </citation>
bf15645bae10 Uploaded from GH
devteam
parents: 1
diff changeset
141 </citations>
0
d5e4121e45ed Imported from capsule None
devteam
parents:
diff changeset
142 </tool>