annotate ncPRO-QC.xml @ 13:8a50d975ad4d draft default tip

Uploaded
author jbrayet
date Thu, 28 Jan 2016 09:33:22 -0500
parents 66a97bd8742f
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
5
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
1 <tool id="ncPRO-QC" name="Alignment and QC">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
2 <description>of sRNA-seq data</description>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
3 <requirements>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
4 <container type="docker">institutcuriengsintegration/ncproseqgalaxy:1.6.5</container>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
5 </requirements>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
6 <command interpreter="bash">ncPRO-QC.sh
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
7 #for $i in $input_conditional.sampleNumber.samples
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
8 -i ${i.input}
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
9 #end for
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
10 #for $i in $input_conditional.sampleNumber.samples
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
11 -s ${i.sampleName}
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
12 #end for
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
13 #for $i in $input_conditional.sampleNumber.samples
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
14 -q ${i.fastqFormat}
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
15 #end for
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
16 -t $input_conditional.input_type
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
17 -n $projectName
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
18 -g $genome
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
19 -f $Rfam
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
20 -l $outlog
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
21 -r $report
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
22 -h $outhtml
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
23 -p $outpdf
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
24 #if $input_conditional.input_type == "fastq"
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
25 -a $input_conditional.mapping
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
26 #if $input_conditional.sampleNumber.numberOfSample == "1"
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
27 -o $outbam_0
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
28 #end if
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
29 #if $input_conditional.sampleNumber.numberOfSample == "2"
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
30 -o $outbam_1 -o $outbam_2
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
31 #end if
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
32 #if $input_conditional.sampleNumber.numberOfSample == "3"
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
33 -o $outbam_3 -o $outbam_4 -o $outbam_5
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
34 #end if
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
35 #if $input_conditional.sampleNumber.numberOfSample == "4"
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
36 -o $outbam_6 -o $outbam_7 -o $outbam_8 -o $outbam_9
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
37 #end if
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
38 #end if
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
39 -d ${__root_dir__}
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
40 </command>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
41 <inputs>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
42 <param name="projectName" type="text" value="Project_1" size="20" label="Give a project name" >
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
43 <sanitizer invalid_char="">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
44 <valid initial="string.letters,string.digits"><add value="_"/></valid>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
45 </sanitizer>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
46 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
47 <conditional name="input_conditional">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
48 <param name="input_type" type="select" label="Select your input file format" help="Raw datafile (fastq) or aligned file (BAM) are allowed. Different treatment will be performed according to the data type.">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
49 <option value="fastq" selected="true">fastq</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
50 <option value="bam">bam</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
51 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
52 <when value="fastq">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
53 <conditional name="sampleNumber">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
54 <param name="numberOfSample" type="select" label="Number of sample(s)">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
55 <option value="1" selected="true">1</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
56 <option value="2">2</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
57 <option value="3">3</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
58 <option value="4">4</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
59 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
60 <when value="1">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
61 <repeat name="samples" title="Sample Name" min="1" max="1" default="1">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
62 <param name="sampleName" type="text" value="input" size="30" label="Name">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
63 <sanitizer invalid_char="">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
64 <valid initial="string.letters,string.digits"><add value="_"/></valid>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
65 </sanitizer>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
66 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
67 <param name="fastqFormat" type="select" label="Fastq format">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
68 <option value="phred33" selected="true">phred33</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
69 <option value="solexa">solexa</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
70 <option value="solexa1.3">solexa1.3</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
71 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
72 <param name="input" type="data" format="fastq" label="Raw Input file"/>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
73 </repeat>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
74 </when>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
75 <when value="2">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
76 <repeat name="samples" title="Sample Name" min="2" max="2" default="2">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
77 <param name="sampleName" type="text" value="input" size="30" label="Name">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
78 <sanitizer invalid_char="">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
79 <valid initial="string.letters,string.digits"><add value="_"/></valid>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
80 </sanitizer>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
81 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
82 <param name="fastqFormat" type="select" label="Fastq format">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
83 <option value="phred33" selected="true">phred33</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
84 <option value="solexa">solexa</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
85 <option value="solexa1.3">solexa1.3</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
86 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
87 <param name="input" type="data" format="fastq" label="Raw Input file"/>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
88 </repeat>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
89 </when>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
90 <when value="3">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
91 <repeat name="samples" title="Sample Name" min="3" max="3" default="3">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
92 <param name="sampleName" type="text" value="input" size="30" label="Name">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
93 <sanitizer invalid_char="">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
94 <valid initial="string.letters,string.digits"><add value="_"/></valid>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
95 </sanitizer>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
96 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
97 <param name="fastqFormat" type="select" label="Fastq format">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
98 <option value="phred33" selected="true">phred33</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
99 <option value="solexa">solexa</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
100 <option value="solexa1.3">solexa1.3</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
101 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
102 <param name="input" type="data" format="fastq" label="Raw Input file"/>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
103 </repeat>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
104 </when>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
105 <when value="4">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
106 <repeat name="samples" title="Sample Name" min="4" max="4" default="4">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
107 <param name="sampleName" type="text" value="input" size="30" label="Name">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
108 <sanitizer invalid_char="">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
109 <valid initial="string.letters,string.digits"><add value="_"/></valid>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
110 </sanitizer>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
111 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
112 <param name="fastqFormat" type="select" label="Fastq format">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
113 <option value="phred33" selected="true">phred33</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
114 <option value="solexa">solexa</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
115 <option value="solexa1.3">solexa1.3</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
116 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
117 <param name="input" type="data" format="fastq" label="Raw Input file"/>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
118 </repeat>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
119 </when>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
120 </conditional>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
121 <param name="mapping" type="boolean" value="False" truevalue="True" falsevalue="False" label="Run Alignment" help="ncPRO-seq proposes to align the reads on a reference genome using the Bowtie aligner"/>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
122 </when>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
123 <when value="bam">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
124 <repeat name="samples" title="Sample Name" min="1" max="4" default="1">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
125 <param name="sampleName" type="text" value="input" size="30" label="Name">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
126 <sanitizer invalid_char="">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
127 <valid initial="string.letters,string.digits"><add value="_"/></valid>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
128 </sanitizer>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
129 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
130 <param name="input" type="data" format="bam" label="Input file"/>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
131 </repeat>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
132 </when>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
133 </conditional>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
134 <param name="genome" type="select" label="Select a reference genome">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
135 <option value="human_hg19">hg19</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
136 <option value="mouse_mm10">mm10</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
137 <option value="mouse_mm9">mm9</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
138 <option value="zebrafish_Zv9">Zv9</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
139 <option value="athaliana_TAIR9">TAIR9</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
140 <option value="zebrafinch_taeGut1">taeGut1</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
141 <option value="chicken_galGal3">galGal3</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
142 <option value="rat_rn4">rn4</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
143 <option value="rat_rn5">rn5</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
144 <option value="platypus_ornAna1">ornAna1</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
145 <option value="opossum_monDom5">monDom5</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
146 <option value="macaca_rheMac2">rheMac2</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
147 <option value="horse_equCab2">equCab2</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
148 <option value="dog_canFam2">canFam2</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
149 <option value="dmelanogaster_dm3">dm3</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
150 <option value="cow_bosTau4">bosTau4</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
151 <option value="celegans_ce6">ce6</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
152 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
153 <param name="Rfam" type="boolean" value="False" truevalue="True" falsevalue="False" label="Generate the annotation overview using the RFAM and RepeatMasker database (only for aligned data)" />
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
154 <!--<param name="Rmsk" type="boolean" value="False" truevalue="True" falsevalue="False" label="Rmsk overview" />-->
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
155 <param name="report" type="select" label="Select your report format" >
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
156 <option value="all" selected="True">html and pdf</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
157 <option value="html">html</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
158 <option value="pdf">pdf</option>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
159 </param>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
160 </inputs>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
161 <outputs>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
162 <data format="bam" name="outbam_0" label="ncPRO mapped file">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
163 <filter>((input_conditional['input_type'] == 'fastq') and (input_conditional['mapping'] == True) and (input_conditional['sampleNumber']['numberOfSample'] == '1'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
164 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
165 <data format="bam" name="outbam_1" label="ncPRO mapped file 1">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
166 <filter>((input_conditional['input_type'] == 'fastq') and (input_conditional['mapping'] == True) and (input_conditional['sampleNumber']['numberOfSample'] == '2'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
167 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
168 <data format="bam" name="outbam_2" label="ncPRO mapped file 2">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
169 <filter>((input_conditional['input_type'] == 'fastq') and (input_conditional['mapping'] == True) and (input_conditional['sampleNumber']['numberOfSample'] == '2'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
170 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
171 <data format="bam" name="outbam_3" label="ncPRO mapped file 1">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
172 <filter>((input_conditional['input_type'] == 'fastq') and (input_conditional['mapping'] == True) and (input_conditional['sampleNumber']['numberOfSample'] == '3'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
173 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
174 <data format="bam" name="outbam_4" label="ncPRO mapped file 2">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
175 <filter>((input_conditional['input_type'] == 'fastq') and (input_conditional['mapping'] == True) and (input_conditional['sampleNumber']['numberOfSample'] == '3'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
176 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
177 <data format="bam" name="outbam_5" label="ncPRO mapped file 3">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
178 <filter>((input_conditional['input_type'] == 'fastq') and (input_conditional['mapping'] == True) and (input_conditional['sampleNumber']['numberOfSample'] == '3'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
179 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
180 <data format="bam" name="outbam_6" label="ncPRO mapped file 1">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
181 <filter>((input_conditional['input_type'] == 'fastq') and (input_conditional['mapping'] == True) and (input_conditional['sampleNumber']['numberOfSample'] == '4'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
182 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
183 <data format="bam" name="outbam_7" label="ncPRO mapped file 2">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
184 <filter>((input_conditional['input_type'] == 'fastq') and (input_conditional['mapping'] == True) and (input_conditional['sampleNumber']['numberOfSample'] == '4'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
185 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
186 <data format="bam" name="outbam_8" label="ncPRO mapped file 3">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
187 <filter>((input_conditional['input_type'] == 'fastq') and (input_conditional['mapping'] == True) and (input_conditional['sampleNumber']['numberOfSample'] == '4'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
188 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
189 <data format="bam" name="outbam_9" label="ncPRO mapped file 4">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
190 <filter>((input_conditional['input_type'] == 'fastq') and (input_conditional['mapping'] == True) and (input_conditional['sampleNumber']['numberOfSample'] == '4'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
191 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
192 <data format="html" name="outhtml" label="ncPRO html report">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
193 <filter>((report == 'all') or (report == 'html'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
194 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
195 <data format="pdf" name="outpdf" label="ncPRO pdf report">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
196 <filter>((report == 'all') or (report == 'pdf'))</filter>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
197 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
198 <data format="txt" name="outlog" label="ncPRO log">
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
199 </data>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
200 </outputs>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
201 <help>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
202
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
203 **What does ncPRO-seq do?**
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
204
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
205 ------
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
206
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
207 ncPRO-seq is a tool for annotation and profiling of ncRNAs from smallRNA sequencing data. It aims to interrogate and perform detailed analysis on small RNAs derived from annotated non-coding regions in miRBase, Rfam and repeatMasker, and regions defined by users. A command line version and an online version are available at http://ncpro.curie.fr.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
208 If you use the ncPRO-seq tool for your analysis, please cite the following paper:
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
209 Chen C., Servant N., Toedling J., Sarazin A., Marchais A., Duvernois-Berthet E., Cognat V., Colot V., Voinnet O., Heard E., Ciaudo C. and Barillot E. (2012) ncPRO-seq: a tool for annotation and profiling analysis of ncRNAs from small RNA-seq. Bioinformatics, 28(23):3147-9.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
210
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
211 # Copyleft ↄ⃝ 2012 Institut Curie
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
212 # Author(s): Jocelyn Brayet, Laurene Syx, Chongjian Chen, Nicolas Servant (Institut Curie) 2012 - 2015
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
213 # Contact: bioinfo.ncproseq@curie.fr
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
214 # This software is distributed without any guarantee under the terms of the GNU General
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
215 # Public License, either Version 2, June 1991 or Version 3, June 2007.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
216
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
217 ------
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
218
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
219 **Input Formats**
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
220
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
221 Raw data files (fastq) or aligned files (BAM) are allowed. In all cases, ncPRO-seq will perform a quality control of your data.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
222
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
223 ------
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
224
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
225 **Quality Control of raw data**
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
226
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
227 -Base Composition Information
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
228
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
229 Display the proportion of each base position for which each of the four normal DNA bases has been called (or GC content). If you see strong biases which change in different bases then this usually indicates an overrepresented sequence which is contaminating your library. A bias which is consistent across all bases either indicates that the original library was sequence biased, or that there was a systematic problem during the sequencing of the library.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
230
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
231 -Quality Score
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
232
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
233 This view presents the quality values across all bases at each position in the FastQ file.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
234 The y-axis on the graph shows the mean quality scores. The higher the score the better the base call. The quality of calls on most platforms will degrade as the run progresses, so it is common to see base calls falling into the orange area towards the end of a read.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
235 We usually consider data with a mean quality higher than 20 to be of good quality.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
236
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
237 -Reads Length Distribution
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
238
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
239 The insert size distribution is the most important quality control in sRNA-seq data. ncPRO-seq provides two types of information, i.e. the abundant versus the distinct read length distribution. The abundant distribution considers all reads as they are described in the fastq file. The distinct distribution merges all duplicated sequences into one. This view usually decreases the importance of miRNAs to highlight other population-based ncRNAs.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
240
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
241 ------
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
242
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
243 **Reads Alignment**
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
244
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
245 In the case of raw data, ncPRO-seq offers to align the reads on a reference genome using the Bowtie aligner. A default alignment is performed to return the best read alignment with a few mismatches allowed (--best --strata -e 50 --nomaqround). Up to 20 locations for a given read are allowed (-a -m 20) in order to deal with ncRNAs repeated on the genome.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
246
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
247 ------
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
248
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
249 **Quality Control of aligned data**
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
250
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
251 -Mapping statistics
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
252
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
253 The proportions of reads with unique or multiple mapping sites in the genome, and of unmapped reads, are plotted. For sRNA-seq data, we usually expect to have a large proportion of unique hits.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
254
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
255 -Annotation overview
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
256
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
257 The reads annotation family is the most general overview, and counts the reads based on the following annotations: coding genes, ncRNAs from Rfam, smallRNAs from repeated regions, rRNAs, piRNAs from piRBase and precursor miRNAs from miRBase.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
258
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
259 -miRNA reads proportion (miRBase)
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
260
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
261 A dedicated plot is available for pre-miRNAs. In this step, abundant reads mapped in mature miRNA regions are counted, and plotted as the proportion of all mapped reads in the genome. The annotation file of mature miRNA is generated using files from miRBase. Each miRNA count is calculated using the intersection of the reads alignment with the precursor position.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
262 In a classical sRNA-seq experiment, we usually expect to have a high level of miRNAs (around 70%). This information can be used as a quality control for mammals. If a small proportion of miRNAs is observed, it means that another population of ncRNA predominates. This can be real biological information, or a contamination (tRNA, rRNA, etc.).
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
263
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
264 ------
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
265
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
266 **RFAM and RepeatMasker annotation overview**
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
267
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
268 After alignment, ncPRO-seq can give a first overview of your data annotation, by overlapping the aligned reads with the known annotations from the RFAM or RepeatMasker database.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
269
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
270 -ncRNA annotation (RFAM)
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
271
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
272 To compare the read expression in different repeat/Rfam families, we count the number of abundant reads in each family and plot the relative proportion.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
273 We catalogue non-coding RNA genes in Rfam annotation into five big classes: tRNA, rRNA, snRNA, snoRNA and others. Note that miRNA annotations are excluded in the Rfam noncoding RNA analyses to be replaced by the miRBase annotation.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
274
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
275 -Repeats annotation (RepeatMasker)
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
276
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
277 ncPRO-seq uses repeat annotations from the RepeatMasker database. We classify different repeats based on the name of the repeat family.
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
278
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
279 </help>
66a97bd8742f Uploaded
jbrayet
parents:
diff changeset
280 </tool>