annotate test/cnmops.xml @ 0:3ea49d2fa85f draft default tip

Uploaded
author ric
date Fri, 07 Oct 2016 05:08:11 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
1 <tool id="cnmops" name="cn.mops" version="1.0.0">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
2 <description>cnv caller</description>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
3 <requirements>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
4 <requirement type="package" version="1.16.2">bioconductor-cn.mops</requirement>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
5 </requirements>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
6 <command interpreter="Rscript">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
7 cnmops.R $args_file
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
8 </command>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
9 <configfiles>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
10 <configfile name="args_file">target=$targetFile
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
11 padding=$padding
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
12 mapping_mode=$mapping_mode
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
13 #for $i in $inputs
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
14 bam=${i.input}
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
15 bam_bai=${i.input.metadata.bam_index}
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
## Use the user-supplied label when one was entered; otherwise fall back to the dataset name.
16 #if str($i.label.value) != "":
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
17 bam_label=${i.label.value}
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
18 #else
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
19 bam_label=${i.input.dataset.name}
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
20 #end if
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
21 #end for
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
22 output=$output
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
23 #if str($advanced_options.advanced_options_select) == "yes"
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
24 advanced_mode=TRUE
## Each line is a literal key followed by the parameter value. These parameters are
## declared inside the "advanced_options" conditional, so they must be referenced
## as $advanced_options.<name>; no top-level variable with the bare name exists.
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
25 prior_impact=$advanced_options.prior_impact
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
26 cyc=$advanced_options.cyc
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
27 norm=$advanced_options.norm
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
28 norm_type=$advanced_options.norm_type
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
29 upper_threshold=$advanced_options.upper_threshold
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
30 lower_threshold=$advanced_options.lower_threshold
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
31 min_width=$advanced_options.min_width
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
32 seq_alg=$advanced_options.seq_alg
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
33 min_read_count=$advanced_options.min_read_count
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
34 use_median=$advanced_options.use_median
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
35 #end if
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
36 </configfile>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
37 </configfiles>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
38 <inputs>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
39 <param format="bed" name="targetFile" type="data" label="Target regions (BED)">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
40 <validator type="unspecified_build" />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
41 </param>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
42 <param name="padding" type="integer" value="100" label="Padding" help="Amount of padding (in bp) to add around each target region" />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
43 <param name="mapping_mode" type="select" label="Mapping mode" help="Select whether the mapping algorithm was run using paired or unpaired reads">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
44 <option value="paired" selected="true">paired</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
45 <option value="unpaired">unpaired</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
46 </param>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
47 <repeat name="inputs" title="BAM" min="2" help="Need to add more files? Use controls below.">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
48 <param format="bam" name="input" type="data" label="BAM file">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
49 <options>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
50 <filter type="data_meta" ref="targetFile" key="dbkey"/>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
51 </options>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
52 </param>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
53 <param name="label" type="text" size="30" value="" label="Label" help="Label to use in the output. If not given, the dataset name will be used instead">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
54 <validator type="regex" message="Spaces are not allowed">^\S*$</validator>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
55 </param>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
56 </repeat>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
57
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
58 <!-- Advanced options -->
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
59 <conditional name="advanced_options">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
60 <param name="advanced_options_select" type="select" label="Show advanced options">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
61 <option value="yes">Yes</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
62 <option value="no" selected="true">No</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
63 </param>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
64 <when value="yes">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
65 <param name="prior_impact" type="integer" value="10" label="Prior impact" help="Positive real value that reflects how strong the prior assumption affects the result. The higher the value the more samples will be assumed to have copy number 2." />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
66 <param name="cyc" type="integer" value="20" label="Cycles" help="Positive integer that sets the number of cycles for the algorithm. Usually after less than 15 cycles convergence is reached." />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
67 <param name="norm" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="true" label="Apply normalization" help="" />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
68 <param name="norm_type" type="select" label="Normalization type" help="Mode of the normalization technique. Read counts will be scaled sample-wise.">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
69 <option value="poisson" selected="true">poisson</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
70 <option value="mean">mean</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
71 <option value="min">min</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
72 <option value="median">median</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
73 <option value="quant">quant</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
74 <option value="mode">mode</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
75 </param>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
76 <param name="upper_threshold" type="float" value="0.55" label="Cut-off for copy number gains" help="All CNV calling values above this value will be called as gain. The value should be set close to the log2 of the expected foldchange for copy number 3 or 4." />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
77 <param name="lower_threshold" type="float" value="-0.8" label="Cut-off for copy number losses" help="All CNV calling values below this value will be called as loss. The value should be set close to the log2 of the expected foldchange for copy number 1 or 0." />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
78 <param name="min_width" type="integer" value="5" label="Minimum width" help="Minimum number of segments a CNV should span." />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
79 <param name="seq_alg" type="select" label="Segmentation algorithm" help="">
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
80 <option value="fast" selected="false">fast</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
81 <option value="DNAcopy">DNAcopy</option>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
82 </param>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
83 <param name="min_read_count" type="integer" value="1" label="Minimum read count" help="If all samples are below this value the algorithm will return the prior knowledge. This prevents the algorithm from being applied to segments with very low coverage." />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
84 <param name="use_median" type="boolean" truevalue="TRUE" falsevalue="FALSE" checked="false" label="Use median" help="Whether median instead of mean of a target region should be used for the CNV call." />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
85 </when>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
86 <when value="no" />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
87 </conditional>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
88 </inputs>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
89 <outputs>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
90 <data format="bed" name="output" label="${tool.name} on ${on_string}" />
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
91 </outputs>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
92 <help>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
93
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
94 **What it does**
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
95
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
96 This tool uses cn.mops (Copy Number estimation by a Mixture Of PoissonS) to call copy number variations
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
97 and aberrations (CNVs and CNAs) from targeted next generation sequencing (NGS) data.
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
98
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
99 **Output format**
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
100
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
101 ========== ========================
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
102 Column Description
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
103 ---------- ------------------------
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
104 chr Chromosome
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
105 starts Start of CNV region
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
106 ends End of CNV region
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
107 sampleName Name of the sample with CNV
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
108 median Median value of CNV
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
109 mean Mean value of CNV
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
110 CN Copy number class (see below)
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
111 ========== ========================
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
112
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
113 Copy number classes are identified as follows::
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
114
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
115 CN2: normal copy number for diploid samples
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
116 CN1: heterozygous deletion
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
117 CN0: homozygous deletion
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
118 CN3 - CN8: amplifications
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
119
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
120 For non-tumor samples the highest copy number class is 8 - higher copy numbers have not been reported.
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
121 CN8 is expected to have 4 times as many reads (four times as high coverage) as CN2.
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
122 For tumor samples very high copy numbers have been observed (e.g. CN64),
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
123 therefore the parameters of cn.mops have to be adjusted to allow for high copy numbers.
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
124 A way to set the parameters is given in https://gist.github.com/gklambauer/8955203
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
125
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
126 **License and citation**
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
127
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
128 This Galaxy tool is Copyright © 2015 `CRS4 Srl.`_ and is released under the `MIT license`_.
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
129
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
130 .. _CRS4 Srl.: http://www.crs4.it/
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
131 .. _MIT license: http://opensource.org/licenses/MIT
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
132
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
133 You can use this tool only if you agree to the license terms of: `cn.mops`_.
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
134
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
135 .. _cn.mops: http://bioconductor.org/packages/release/bioc/html/cn.mops.html
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
136
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
137 If you use this tool, please cite:
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
138
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
139 - |Cuccuru2014|_
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
140 - |Klambauer2012|_.
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
141
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
142 .. |Cuccuru2014| replace:: Cuccuru, G., Orsini, M., Pinna, A., Sbardellati, A., Soranzo, N., Travaglione, A., Uva, P., Zanetti, G., Fotia, G. (2014) Orione, a web-based framework for NGS analysis in microbiology. *Bioinformatics* 30(13), 1928-1929
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
143 .. _Cuccuru2014: http://bioinformatics.oxfordjournals.org/content/30/13/1928
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
144 .. |Klambauer2012| replace:: Klambauer, G., *et al.* (2012) cn.MOPS: Mixture of Poissons for Discovering Copy Number Variations in Next Generation Sequencing Data with a Low False Discovery Rate. *Nucleic Acids Research* 40, e69
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
145 .. _Klambauer2012: http://nar.oxfordjournals.org/content/40/9/e69
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
146 </help>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
147 <citations>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
148 <citation type="doi">10.1093/bioinformatics/btu135</citation>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
149 <citation type="doi">10.1093/nar/gks003</citation>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
150 </citations>
3ea49d2fa85f Uploaded
ric
parents:
diff changeset
151 </tool>