annotate bamCorrelate.xml @ 48:72d1d7c68bd3 draft

Uploaded
author bgruening
date Tue, 26 Aug 2014 13:48:56 -0400
parents b9feca1f07f0
children c0a054f2eff8
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
45
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
1 <tool id="deeptools_bamCorrelate" name="bamCorrelate" version="@WRAPPER_VERSION@.0">
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
2 <description>correlates pairs of BAM files</description>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
3 <expand macro="requirements" />
22
8710187d1eb5 Uploaded
bgruening
parents: 16
diff changeset
4 <expand macro="stdio" />
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
5 <macros>
34
934b9fccabd4 Uploaded
bgruening
parents: 33
diff changeset
6 <token name="@BINARY@">bamCorrelate</token>
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
7 <import>deepTools_macros.xml</import>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
8 </macros>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
9 <command>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
10 #set files=[]
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
11 #set labels=[]
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
12
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
13 @multiple_input_bams@
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
14
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
15 bamCorrelate
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
16
16
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
17 $mode.modeOpt
15
351cd1f8791b Uploaded
bgruening
parents: 14
diff changeset
18
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
19 @THREADS@
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
20
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
21 --bamfiles #echo " ".join($files)
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
22 --labels #echo " ".join($labels)
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
23 --fragmentLength $fragmentLength
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
24 --corMethod $corMethod
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
25
24
e43b4015b4cc Uploaded
bgruening
parents: 22
diff changeset
26 --plotFile $outFileName
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
27
29
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
28 #if $output.showOutputSettings == "yes"
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
29 --outRawCounts '$outFileRawCounts'
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
30 --outFileCorMatrix '$outFileCorMatrix'
24
e43b4015b4cc Uploaded
bgruening
parents: 22
diff changeset
31 --plotFileFormat $output.outFileFormat
e43b4015b4cc Uploaded
bgruening
parents: 22
diff changeset
32 #else:
e43b4015b4cc Uploaded
bgruening
parents: 22
diff changeset
33 --plotFileFormat 'png'
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
34 #end if
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
35
16
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
36 #if $mode.modeOpt == "bins":
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
37 --binSize '$mode.binSize'
45
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
38 --distanceBetweenBins '$mode.distanceBetweenBins'
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
39 $mode.doNotRemoveOutliers
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
40
16
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
41 #else:
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
42 --BED $mode.region_file
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
43 #end if
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
44
30
2e5b92e7f3cb Uploaded
bgruening
parents: 29
diff changeset
45 #### options available in both modes
2e5b92e7f3cb Uploaded
bgruening
parents: 29
diff changeset
46 #if str($mode.region.value) != '':
2e5b92e7f3cb Uploaded
bgruening
parents: 29
diff changeset
47 --region '$mode.region'
2e5b92e7f3cb Uploaded
bgruening
parents: 29
diff changeset
48 #end if
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
49
30
2e5b92e7f3cb Uploaded
bgruening
parents: 29
diff changeset
50 #if $mode.advancedOpt.showAdvancedOpt == "yes":
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
51
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
52 $mode.advancedOpt.doNotExtendPairedEnds
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
53 $mode.advancedOpt.ignoreDuplicates
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
54 $mode.advancedOpt.includeZeros
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
55
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
56 #if $mode.advancedOpt.minMappingQuality:
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
57 --minMappingQuality '$mode.advancedOpt.minMappingQuality'
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
58 #end if
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
59
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
60 #if $mode.advancedOpt.zMin:
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
61 --zMin $mode.advancedOpt.zMin
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
62 #end if
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
63 #if $mode.advancedOpt.zMax:
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
64 --zMax $mode.advancedOpt.zMax
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
65 #end if
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
66 --colorMap '$mode.advancedOpt.colorMap'
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
67
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
68 #end if
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
69 </command>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
70
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
71 <inputs>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
72 <expand macro="multiple_input_bams" />
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
73
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
74 <param name="fragmentLength" type="integer" value="300" min="1"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
75 label="Length of the average fragment size"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
76 help ="Reads will be extended to match this length unless they are paired-end, in which case they will be extended to match the fragment length. *NOTE*: If the BAM files contain mated and unmated paired-end reads, unmated reads will be extended to match the fragment length."/>
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
77
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
78 <param name="corMethod" type="select" label="Correlation method">
45
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
79 <option value="spearman" selected="True">Spearman</option>
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
80 <option value="pearson">Pearson</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
81 </param>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
82
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
83 <conditional name="mode">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
84 <param name="modeOpt" type="select" label="Choose computation mode"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
85 help="In the bins mode, the correlation is computed based on equal length bins. In the BED file mode, a list of genomic regions in BED format has to be given. For each region in the BED file the number of overlapping reads is counted in each of the BAM files. Then the correlation is computed.">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
86 <option value="bins" selected="true">Bins</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
87 <option value="BED-file">Limit correlation to certain regions (BED file)</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
88 </param>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
89 <when value="bins">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
90 <param name="binSize" type="integer" value="10000" min="1"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
91 label="Bin size in bp"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
92 help="Length in base pairs for a window used to sample the genome."/>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
93
45
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
94 <param name="distanceBetweenBins" type="integer" value="0" min="0"
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
95 label="Distance between bins"
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
96 help="By default, bamCorrelate considers consecutive bins of
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
97 the specified 'Bin size'. However, to reduce the
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
98 computation time, a larger distance between bins can
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
99 be given. Larger distances result in fewer bins being
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
100 considered"/>
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
101
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
102 <param name="doNotRemoveOutliers" type="boolean"
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
103 truevalue="--doNotRemoveOutliers" falsevalue="" label="Do not filter outliers"
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
104 help="By default, bins with very large counts are removed.
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
105 By setting this option, outliers will not be
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
106 removed. Bins with unusually large counts normally
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
107 correspond to regions in the genome that accumulate
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
108 a lot of reads, such as satellite regions. If outliers are not
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
109 removed, the Pearson correlation will wrongly report a
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
110 very high correlation; that's why, by default,
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
111 bamCorrelate tries to remove outliers using
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
112 the median absolute deviation (MAD) method applying a
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
113 threshold of 200 to only consider extremely large
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
114 deviations from the median."/>
b9feca1f07f0 Uploaded
bgruening
parents: 43
diff changeset
115
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
116 <expand macro="bamCorrelate_mode_actions" />
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
117 </when>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
118 <when value="BED-file">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
119 <param name="region_file" type="data" format="bed" label="Region file in BED format" help="Correlation is computed for the number of reads that overlap such regions."/>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
120 <expand macro="bamCorrelate_mode_actions" />
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
121 </when>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
122
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
123 </conditional>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
124
29
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
125 <conditional name="output">
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
126 <param name="showOutputSettings" type="select" label="Show advanced output settings" >
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
127 <option value="no" selected="true">no</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
128 <option value="yes">yes</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
129 </param>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
130 <when value="no" />
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
131 <when value="yes">
25
df9f0dbb1d2a Uploaded
bgruening
parents: 24
diff changeset
132 <expand macro="input_image_file_format"/>
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
133 <param name="saveRawCounts" type="boolean" label="Save the bin counts"/>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
134 <param name="saveCorMatrix" type="boolean" label="Save the correlation matrix"/>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
135 </when>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
136 </conditional>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
137
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
138 </inputs>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
139 <outputs>
25
df9f0dbb1d2a Uploaded
bgruening
parents: 24
diff changeset
140 <expand macro="output_image_file_format" />
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
141 <data format="tabular" name="outFileRawCounts" label="${tool.name} on ${on_string}: bin counts">
29
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
142 <filter>
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
143 ((
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
144 output['showOutputSettings'] == 'yes' and
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
145 output['saveRawCounts'] is True
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
146 ))
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
147 </filter>
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
148 </data>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
149 <data format="tabular" name="outFileCorMatrix" label="${tool.name} on ${on_string}: correlation matrix">
29
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
150 <filter>
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
151 ((
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
152 output['showOutputSettings'] == 'yes' and
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
153 output['saveCorMatrix'] is True
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
154 ))
60788be7b346 Uploaded
bgruening
parents: 25
diff changeset
155 </filter>
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
156 </data>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
157 </outputs>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
158 <help>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
159
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
160 **What it does**
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
161
5
1f312af2f8db Uploaded
bgruening
parents: 1
diff changeset
162 This tool is useful to assess the overall similarity of different BAM files. A typical application
1f312af2f8db Uploaded
bgruening
parents: 1
diff changeset
163 is to check the correlation between replicates or published data sets.
1f312af2f8db Uploaded
bgruening
parents: 1
diff changeset
164
6
c5847db0cb41 Uploaded
bgruening
parents: 5
diff changeset
165 The tool splits the genome into bins of a given length. For each bin, the number of reads
43
c5787c91cab8 Uploaded
bgruening
parents: 37
diff changeset
166 found in each BAM file is counted and a correlation (either Pearson or Spearman) is computed for all
c5787c91cab8 Uploaded
bgruening
parents: 37
diff changeset
167 pairs of BAM files. Finally, a heatmap is drawn based on the similarity of the samples.
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
168
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
169
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
170 .. image:: $PATH_TO_IMAGES/QC_bamCorrelate_humanSamples.png
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
171 :alt: Heatmap of RNA Polymerase II ChIP-seq
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
172
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
173
43
c5787c91cab8 Uploaded
bgruening
parents: 37
diff changeset
174 You can find more details on the bamCorrelate wiki page: https://github.com/fidelram/deepTools/wiki/QC#wiki-bamCorrelate
37
2f7edf06a5da Uploaded
bgruening
parents: 34
diff changeset
175
2f7edf06a5da Uploaded
bgruening
parents: 34
diff changeset
176
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
177 **Output files**:
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
178
43
c5787c91cab8 Uploaded
bgruening
parents: 37
diff changeset
179 - **diagnostic plot**: clustered heatmap displaying the values for each pair-wise correlation, see above for an example
c5787c91cab8 Uploaded
bgruening
parents: 37
diff changeset
180 - **data matrix** (optional): if you want to plot the correlation values using a different program, e.g. R, this matrix can be used
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
181
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
182
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
183 -----
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
184
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
185 @REFERENCES@
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
186
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
187 </help>
48
72d1d7c68bd3 Uploaded
bgruening
parents: 45
diff changeset
188 <expand macro="citations" />
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
189 </tool>