comparison QDNAseq-export.xml @ 88:d2ea2b842c21 draft default tip

Uploaded
author stef
date Mon, 06 Jul 2015 06:29:19 -0400
parents
children
comparison
equal deleted inserted replaced
87:8391cdb7479c 88:d2ea2b842c21
1 <tool id="QDNAseq-export" name="QDNAseq-export" version="0.0.1" force_history_refresh="True">
2
3 <requirements>
4
5 <!-- No packaged dependencies are declared yet: the requirements below stay commented out until an R 3.1.0 package is available, so the default Rscript named in the command element is used instead -->
6 <!-- <requirement type="package" version="3.1.0">R</requirement> -->
7 <!-- <requirement type="package" version="1.2.2">qdnaseq</requirement> -->
8
9 </requirements>
10
11 <description>Export QDNAseq data to tabular</description>
12
13 <!-- Runs QDNAseq-export.R through Rscript with the generated config file ($cfg) as its only argument; change the interpreter to /full/path/to/Rscript if required (eg /ccagc/lib/R/R-3.1.0/bin/Rscript) -->
14 <command interpreter="Rscript">
15 QDNAseq-export.R
16 $cfg
17 </command>
18
19 <version_command interpreter="Rscript">QDNAseq-version.R</version_command>
20
21 <stdio>
22 <!-- Any exit code of 1 or higher means the R script didn't finish (correctly) -->
23 <!-- Different R packages handle errors/warnings differently, so this check cannot be made fully watertight; only the exit code is inspected here -->
24 <exit_code range="1:" level="fatal" description="R script finished too early, check log" />
25 </stdio>
26
27 <inputs>
28
29 <!-- ==================== -->
30 <!-- General inputs -->
31 <!-- ==================== -->
32
33 <!-- Job name: required, must be non-empty and free of whitespace and backslashes (it is reused in the output label and the R config file) -->
34 <param name="jobName" type="text" optional="false" label="Analysis/output name" help="Supply a name for the outputs to remind you what they contain" value="TEST">
35 <!-- '+' rather than '*' makes the regex reject an empty name as well, so the disabled empty_field validator is not needed -->
36 <validator type="regex" message="Name must be non-empty and contain no whitespace or backslash characters">^[^\s\\]+$</validator>
37 </param>
38
39 <!-- ==================== -->
40 <!-- Input RDS: one required dataset of format rds -->
41 <!-- ==================== -->
42 <param name="rdsFile" type="data" optional="False" format="rds" label="Input RDS file" help="RDS file should contain a QDNAseq R object (output of QDNAseq tool)" />
43
44 <!-- ==================== -->
45 <!-- Data level: which values to export (copynumber, segments or calls) -->
46 <!-- ==================== -->
47 <param name="data_level" type="select" label="Level of data to export" help="If segmentation and/or calling has been performed the segmented or called values can be exported instead of copynumber (normalized read counts)">
48 <option value="copynumber">copynumbers</option>
49 <option value="segments">segments</option>
50 <option value="calls">calls</option>
51 </param>
52
53 <!-- ==================== -->
54 <!-- Bin filtering: TRUE leaves filtered bins out of the export, FALSE includes them -->
55 <!-- ==================== -->
56 <param name="filter_bins" type="select" label="Include or exclude filtered bins" help="Each bin has a filter status. By default, bins that were excluded from the analysis are not sent to the output. Choose 'Include filtered bins' if you want to export those as well">
57 <option value="TRUE">Exclude filtered bins</option>
58 <option value="FALSE">Include filtered bins</option>
59 </param>
60
61 <!-- ==================== -->
62 <!-- Output type: BED can hold only one sample, so only that branch asks for a (1-based) sample index; tsv and igv pass an empty value -->
63 <!-- ==================== -->
64 <conditional name="output_format_selection">
65 <param name="output_format" type="select" label="Output format" help="All output is tabular, but depending on downstream use some formats are more handy than others">
66 <option value="tsv">TSV</option>
67 <option value="igv">IGV</option>
68 <option value="bed">BED</option>
69 </param>
70 <when value="bed">
71 <param name="sample_index" type="integer" optional="false" min="1" value="1" label="sample-index (integer)" help="The object can host multiple samples while the BED option can only export one. Therefore a sample index must be chosen for this output." />
72 </when>
73 <when value="tsv">
74 <param name="sample_index" type="hidden" value="" />
75 </when>
76 <when value="igv">
77 <param name="sample_index" type="hidden" value="" />
78 </when>
79
80 </conditional>
81
82 </inputs>
83
84 <!-- ==================== -->
85 <!-- Config file (passed as $cfg on the command line) that hands all Galaxy parameters to the R script as R assignments -->
86 <!-- ==================== -->
87 <configfiles>
88 <configfile name="cfg">
89 ## Desc: this file is sourced in QDNAseq-export.R wrapper script
90 ## as means to pass all galaxy params to R
91
92 "${jobName}" -> outputName
93 "${output_file}" -> outputFile
94 "${data_level}" -> dataLevel
95 "${output_format_selection.output_format}" -> outputFormat
96 "${rdsFile}" -> rdsFilePath
97 as.integer( "${output_format_selection.sample_index}" ) -> sampleIndex
98 as.logical( "${filter_bins}" ) -> filterBins
99
100 </configfile>
101 </configfiles>
102
103 <!-- ==================== -->
104 <!-- One tabular text file as output, labelled with the job name -->
105 <!-- ==================== -->
106 <outputs>
107 <data format="tabular" name="output_file" label="QDNAseq: ${jobName} export file" />
108 </outputs>
109
110 <help>
111
112 **Introduction**
113
114 This tool is a wrapper for the "exportBins" function of the R Bioconductor package QDNAseq_
115
116 .. _QDNAseq: http://www.bioconductor.org/packages/release/bioc/html/QDNAseq.html
117
118 -----
119
120 **What it does**
121
122 **Input:** The input for this tool is a QDNAseq R object in RDS (R data structure) format, an (optional) output file of the QDNAseq Galaxy tool. **Output:** Running this export tool provides you with one output text file. When either TSV or IGV is chosen as output format, the output file contains data of all samples present in the object. When BED is chosen as output format, output contains only one sample (by default the first). **OutputDataLevel:** The output data can be of three levels. If the object contains segmented and/or call values these can be chosen instead of the default copynumber (log2 transformed normalized read counts).
123
124 -----
125
126 **Output examples**
127
128 *Example BED output:*
129
130 ::
131
132 track name="SAMPLE1.bam" description="copynumber"
133 1 6000000 7000000 1:6000001-7000000 1.293 +
134 1 7000000 8000000 1:7000001-8000000 1.335 +
135
136 *Example TSV output:*
137
138 ::
139
140 feature chr start end SAMPLE1.bam SAMPLE2.bam
141 1:6000001-7000000 1 6000001 7000000 1.293 -0.979
142 1:7000001-8000000 1 7000001 8000000 1.335 -1.022
143
144 *Example IGV output (at segmented level):*
145
146 ::
147
148 #type=COPY_NUMBER
149 #track coords=1
150 chr start end feature SAMPLE1.bam SAMPLE2.bam
151 1 6000001 7000000 1:6000001-7000000 1.314 -1.0005
152 1 7000001 8000000 1:7000001-8000000 1.314 -1.0005
153
154 *Example IGV output (at called level):*
155
156 ::
157
158 #type=COPY_NUMBER
159 #track coords=1
160 chr start end feature SAMPLE1.bam SAMPLE2.bam
161 1 6000001 7000000 1:6000001-7000000 1 -1
162 1 7000001 8000000 1:7000001-8000000 1 -1
163
164 -----
165
166 .. class:: warningmark
167
168 As there is no R 3.1.0 Galaxy package yet (a requirement for QDNAseq) that works with all requirements, the **dependencies** need to be installed by hand and made available to the user under which Galaxy runs: R (>= 3.1.0) and Bioconductor package QDNAseq (>= 1.2.2). If the Rscript executable of this R installation is not reachable as "Rscript", the wrapper XML must also be updated to include the correct path during installation of this tool.
169
170 -----
171
172 **Citation**
173
174 For the underlying QDNAseq R package please cite:
175 Scheinin I, Sie D, Bengtsson H, van de Wiel MA, Olshen AB, van Thuijl HF, van Essen HF, Eijk PP, Rustenburg F, Meijer GA, Reijneveld JC, Wesseling P, Pinkel D, Albertson DG and Ylstra B (2014). “DNA copy number analysis of fresh and formalin-fixed specimens by shallow whole-genome sequencing with identification and exclusion of problematic regions in the genome assembly.” Genome Research. doi:10.1101/gr.175141.114.
176
177 See also the bioconductor package_ documentation.
178
179 .. _package: http://www.bioconductor.org/packages/release/bioc/html/QDNAseq.html
180
181 .. image:: LGG150_copynumber.png
182 .. image:: LGG150_copynumberSegmented.png
183
184 </help>
185
186 </tool>