comparison QDNAseq.xml @ 4:15a0f137bf82 draft default tip

Deleted selected files
author stef
date Tue, 30 Dec 2014 09:09:40 -0500
parents fbe7fe47991f
children
comparison
equal deleted inserted replaced
3:fbe7fe47991f 4:15a0f137bf82
1 <tool id="QDNAseq" name="QDNAseq" version="0.0.2" force_history_refresh="True">
2
3 <requirements>
4
5 <requirement type="package" version="0.1.18">samtools</requirement>
6 <!-- R 3.1.0 dependency will be used instead when available, now default R is used, see command -->
7 <!-- <requirement type="package" version="3.1.0">R</requirement> -->
8 <!-- <requirement type="package" version="1.0.5">qdnaseq</requirement> -->
9 <requirement type="set_environment">QDNASEQ_PATH</requirement>
10
11 </requirements>
12
13 <description>Quantitative copy number abberation detection</description>
14
15 <!-- change to /full/path/to/Rscript if required (eg /ccagc/lib/R/R-3.1.0/bin/Rscript) -->
16 <command interpreter="Rscript">
17 QDNAseq.R
18 $qdnaseq_cfg
19 \$QDNASEQ_PATH
20 </command>
21
22 <stdio>
23 <!-- Anything higher than 0 means the R script didnt finish (correctly) -->
24 <!-- Because different R packages deal with err/warn differently unable to waterproof this -->
25 <exit_code range="1:" level="fatal" description="R script didnt finish correctly, check log" />
26 </stdio>
27
28 <inputs>
29
30 <!-- ==================== -->
31 <!-- General inputs -->
32 <!-- ==================== -->
33
34 <!-- Job name: must contain non-whitespace chars -->
35 <param name="jobName" type="text" optional="false" label="Analysis/ouput name" help="Supply a name for the outputs to remind you what they contain" value="TEST">
36 <validator type="empty_field" />
37 <validator type="regex" message="This field should contain some non-whitespace character">.*\S</validator>
38 </param>
39
40 <!-- Bin Size: only certain sizes are supported by QDNAseq package -->
41 <param name="binSizes" type="select" optional="false" multiple="true" label="Select bin-sizes to use (kb)" help="Larger bin sizes provide faster analysis but lower resolution">
42 <option value="1000" selected="true">1Mb</option>
43 <option value="100" selected="true">100kb</option>
44 <option value="30">30kb</option>
45 <option value="15" selected="true">15kb</option>
46 <option value="5">5kb</option>
47 <option value="1">1kb</option>
48 </param>
49
50 <!-- Experiment type: only one type (SR50) supported now, maybe more in the future-->
51 <param name="experimentType" type="select" label="Type of sequencing data" help="Currently only single end reads of lenght 50 are supported within galaxy">
52 <option value="SR50">Single Reads of 50bp</option>
53 <!-- <option value="PE1000">PairedEnd1000</option> -->
54 </param>
55
56 <!-- ==================== -->
57 <!-- Input BAMs -->
58 <!-- ==================== -->
59 <param name="bams" type="data" multiple="true" optional="True" format="bam" label="Input BAMs" help="Select the BAM files to analyze" />
60
61 <!-- ==================== -->
62 <!-- Optional segmenting -->
63 <!-- ==================== -->
64 <param name="doSegment" type="select" label="Also perform segmentation" help="Segmentation collects bins with similar ratio into regions">
65 <option value="TRUE">yes</option>
66 <option value="FALSE">no</option>
67 </param>
68
69 <!-- ==================== -->
70 <!-- Option to use your own bin annotations file -->
71 <!-- ==================== -->
72 <conditional name="binannotations_source">
73 <param name="show" type="select" label="Bin annotations to use" help="Default bin-annotations are for GRCh37/hg19 and tuned for 50bp reads (single end)">
74 <option value="default">Default</option>
75 <option value="history">From history</option>
76 </param>
77 <when value="history">
78 <param name="binannotation_file" type="data" multiple="false" label="R data structure file (*.rds) with bin-annotations" help="If you made your own bin-annotations with the QDNAseq bioconductor package you can upload them to your history and select here" />
79 </when>
80 <when value="default">
81 <param name="binannotation_file" type="hidden" value="" />
82 </when>
83
84 </conditional>
85
86 <!-- ==================== -->
87 <!-- Optional advanced options -->
88 <!-- ==================== -->
89 <conditional name="advanced">
90 <param name="show" type="select" label="Use advanced options" help="Select yes to show and use filter and output options">
91 <option value="no">no</option>
92 <option value="yes">yes</option>
93 </param>
94 <when value="yes">
95
96 <param name="copynumbers_igv" type="select" label="Also output copynumber IGV file to history">
97 <option value="FALSE">no</option>
98 <option value="TRUE">yes</option>
99 </param>
100
101 <param name="undo_splits" type="select" label="undoSplits" help="If set to sdundo, see undoSD below">
102 <option value="sdundo">sdundo</option>
103 <option value="prune">prune</option>
104 <option value="none">none</option>
105 </param>
106
107 <param name="undoSD" size="10" type="float" value="1" label="undoSD" help='The number of SDs between means to keep a split if undo.splits="sdundo".' />
108
109 <param name="blacklist" type="select" label="Filter blacklisted bins (blacklist)" help="Will exclude all blacklisted bins in the binannotation if set">
110 <option value="TRUE">yes</option>
111 <option value="FALSE">no</option>
112 </param>
113
114 <param name="mappability" type="integer" value="0" min="0" max="100" label="Filter bins with lower mappability" help="Will exclude all bins will lower mappability than this number (0-100)" />
115
116 <!-- ==================== -->
117 <!-- Optional graphical/plotting options -->
118 <!-- ==================== -->
119 <param name="plot_width" size="3" type="integer" value="1440" label="Width of the png image produced" />
120 <param name="plot_height" size="3" type="integer" value="720" label="Height of the png image produced" />
121 <param name="exclude_chrs" type="select" multiple="true" label="Hide these chromosomes in plots" help="Currently only standard human chromosomes supported. NOTE: other filters might also exclude chromosomes">
122 <option value="1">1</option><option value="2">2</option>
123 <option value="3">3</option><option value="4">4</option>
124 <option value="5">5</option><option value="6">6</option>
125 <option value="7">7</option><option value="8">8</option>
126 <option value="9">9</option><option value="10">10</option>
127 <option value="11">11</option><option value="12">12</option>
128 <option value="13">13</option><option value="14">14</option>
129 <option value="15">15</option><option value="16">16</option>
130 <option value="17">17</option><option value="18">18</option>
131 <option value="19">19</option><option value="20">20</option>
132 <option value="21">21</option><option value="22">22</option>
133 <option value="X" selected="true">X</option>
134 <option value="Y" selected="true">Y</option>
135 </param>
136 </when>
137
138 <!-- need to set defaults because params are passed to R regardless of conditional opened/closed -->
139 <when value="no">
140 <param name="copynumbers_igv" type="hidden" value="FALSE" />
141 <param name="undoSD" type="hidden" value="1" />
142 <param name="undo_splits" type="hidden" value="sdundo" />
143 <param name="blacklist" type="hidden" value="TRUE" />
144 <param name="mappability" type="hidden" value="0" />
145 <param name="plot_width" type="hidden" value="1440" />
146 <param name="plot_height" type="hidden" value="720" />
147 <param name="exclude_chrs" type="hidden" value="X,Y" />
148 </when>
149 </conditional>
150
151 <!-- ==================== -->
152 <!-- Option to perform a test run with built in data -->
153 <!-- ==================== -->
154 <param name="debug" type="select" label="Run with test data" help="Use inbuilt LGG150 data instead of input BAMs">
155 <option value="FALSE">no</option>
156 <option value="TRUE">yes</option>
157 </param>
158
159 </inputs>
160 <!-- ==================== -->
161 <!-- Config file to pass params to R script -->
162 <!-- ==================== -->
163 <configfiles>
164 <configfile name="qdnaseq_cfg">
165 ## Desc: this file was sourced in QDNAseq R wrapper script
166 ## as means to pass all galaxy params to R
167
168 ## -----
169 ## required params
170 ## -----
171 TRUE -> inGalaxy
172 "${binSizes}" -> binSizesString
173 "${experimentType}" -> experimentType
174 "${jobName}" -> outputName
175
176 ## -----
177 ## extra main params
178 ## -----
179 "${htmlFile}" -> outputHtml
180 "${htmlFile.id}" -> outputId
181 "${__new_file_path__}" -> newFilePath
182
183 "${htmlFile.files_path}" -> outputPath
184 as.logical( "${doSegment}" ) -> doSegment
185 as.logical( "${debug}" ) -> debug
186
187 ## -----
188 ## own bin-annotations file options
189 ## -----
190 "${binannotations_source.binannotation_file}" -> binAnnotations
191
192 ## -----
193 ## advanced options
194 ## -----
195 as.double( "${advanced.undoSD}" ) -> undoSD
196 as.logical( "${advanced.blacklist}" ) -> filterBlacklistedBins
197 as.integer( "${advanced.mappability}" ) -> mappabilityCutoff
198 "${advanced.undo_splits}" -> undoSplits
199 as.logical( "${advanced.copynumbers_igv}" ) -> doOutputCopynumbersIgv
200
201 ## #for binSize in $binSizes}.split(",")#
202 ## "${binSize}kbp_${igvCopyNumbers}" -> copyNumbersIgvDatasetFile
203 ## #end for
204
205 ## -----
206 ## plot options
207 ## -----
208 as.integer( "${advanced.plot_width}" ) -> PLOT_WIDTH
209 as.integer( "${advanced.plot_height}" ) -> PLOT_HEIGHT
210 "${advanced.exclude_chrs}" -> excludeChrsString
211
212 ## -----
213 ## input BAMs init
214 ## -----
215 c() -> bamsPaths
216 c() -> bamsNames
217
218 #for bam in $bams#
219 c( bamsPaths, "${bam}" ) -> bamsPaths
220 c( bamsNames, "${bam.name}" ) -> bamsNames
221 #end for
222
223 </configfile>
224 </configfiles>
225
226 <!-- ==================== -->
227 <!-- Main output is an html based report -->
228 <!-- ==================== -->
229 <outputs>
230
231 <!-- main output is a html report -->
232 <!-- ...but there can be more outputs using the id of the htmlFile output -->
233 <data format="html" name="htmlFile" label="QDNAseq: ${jobName}" />
234
235 </outputs>
236
237 <!-- ==================== -->
238 <!-- Tests still to be done -->
239 <!-- ==================== -->
240
241 <!--
242 <tests>
243 <test>
244 <param name="input1" value="input1" />
245 <param name="input2" value="input2" />
246 </test>
247 </tests>
248 -->
249
250 <help>
251 .. class:: infomark
252
253 **Introduction**
254
255 This tool is a wrapper for the R Bioconductor package QDNAseq_
256
257 .. _QDNAseq: http://www.bioconductor.org/packages/release/bioc/html/QDNAseq.html
258
259 It determines the copy number state of human chromosomes 1 - 22 for (shallow coverage) whole genome sequencing data.
260
261 For questions/remarks about the galaxy part of this tool, see contact form here_
262
263 .. _here: http://www.stefs.nl/wp/contact
264
265 You can **test this tool** with built-in data by selecting the option "Run with test data" and press execute.
266
267 -----
268
269 .. class:: warningmark
270
271 As there is no R 3.1.0 galaxy-package yet (a requirement for QDNAseq), the **dependencies** need to be installed by hand and available to the user under which galaxy runs: R (3.1.0) and bioconductor package QDNAseq (>= 1.0.5). In case the default R is not 3.1.0, also the wrapper xml must be updated to include the correct path during installation of this tool.
272
273 .. class:: warningmark
274
275 The input BAMs are expected to be **single end reads of 50bp length** mapped to GRCh37/hg19 genome build. Other experiment setups are currently not tested or supported within galaxy. See the documentation of QDNAseq at bioconductor on how to deal with different setups (or keep fingers crossed ;) )
276
277 .. class:: warningmark
278
279 Requires **internet access** for downloading bin-annotations from bitbucket and to show some styling (css) of the final report
280
281 -----
282
283 **Citation**
284
285 For the underlying QDNAseq R package please cite:
286 Scheinin I, Sie D, Bengtsson H, van de Wiel MA, Olshen AB, van Thuijl HF, van Essen HF, Eijk PP, Rustenburg F, Meijer GA, Reijneveld JC, Wesseling P, Pinkel D, Albertson DG and Ylstra B (2014). “DNA copy number analysis of fresh and formalin-fixed specimens by shallow whole-genome sequencing with identification and exclusion of problematic regions in the genome assembly.” Genome Research. doi:10.1101/gr.175141.114.
287
288 See also the bioconductor package_ documentation.
289
290 .. _package: http://www.bioconductor.org/packages/release/bioc/html/QDNAseq.html
291
292 .. image:: LGG150_copynumber.png
293 .. image:: LGG150_copynumberSegmented.png
294
295 </help>
296
297 </tool>