annotate bamCorrelate.xml @ 22:8710187d1eb5 draft

Uploaded
author bgruening
date Thu, 12 Dec 2013 18:11:46 -0500
parents d0667be9cb0c
children e43b4015b4cc
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
6
c5847db0cb41 Uploaded
bgruening
parents: 5
diff changeset
1 <tool id="deeptools_bamCorrelate" name="bamCorrelate" version="1.0.1">
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
2 <description>correlates pairs of BAM files</description>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
3 <expand macro="requirements" />
22
8710187d1eb5 Uploaded
bgruening
parents: 16
diff changeset
4 <expand macro="stdio" />
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
5 <macros>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
6 <import>deepTools_macros.xml</import>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
7 </macros>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
8 <command>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
9 #import tempfile
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
10 #set $temp_dir = os.path.abspath(tempfile.mkdtemp())
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
11
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
12 #set files=[]
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
13 #set labels=[]
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
14
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
15 @multiple_input_bams@
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
16
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
17 bamCorrelate
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
18
16
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
19 $mode.modeOpt
15
351cd1f8791b Uploaded
bgruening
parents: 14
diff changeset
20
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
21 @THREADS@
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
22
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
23 --bamfiles #echo " ".join($files)
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
24 --labels #echo " ".join($labels)
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
25
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
26 --fragmentLength $fragmentLength
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
27 --corMethod $corMethod
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
28
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
29 #set newoutFileName=str($outFileName)+".png"
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
30 --plotFile $newoutFileName
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
31
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
32 #if $outputOpt.showOutputOpt == "yes"
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
33 --outRawCounts '$outFileRawCounts'
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
34 --outFileCorMatrix '$outFileCorMatrix'
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
35 #end if
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
36
16
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
37 #if $mode.modeOpt == "bins":
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
38 --binSize '$mode.binSize'
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
39 --numberOfSamples '$mode.numberOfSamples'
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
40 #else:
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
41 --BED $mode.region_file
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
42 #end if
d0667be9cb0c Uploaded
bgruening
parents: 15
diff changeset
43
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
44 ## options available in both modes
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
45 #if $mode.advancedOpt.showAdvancedOpt == "yes":
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
46
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
47 #if str($mode.advancedOpt.region.value) != '':
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
48 --region '$mode.advancedOpt.region'
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
49 #end if
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
50
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
51 $mode.advancedOpt.doNotExtendPairedEnds
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
52 $mode.advancedOpt.ignoreDuplicates
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
53 $mode.advancedOpt.includeZeros
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
54
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
55 #if $mode.advancedOpt.minMappingQuality:
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
56 --minMappingQuality '$mode.advancedOpt.minMappingQuality'
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
57 #end if
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
58
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
59 #if $mode.advancedOpt.zMin:
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
60 --zMin $mode.advancedOpt.zMin
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
61 #end if
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
62 #if $mode.advancedOpt.zMax:
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
63 --zMax $mode.advancedOpt.zMax
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
64 #end if
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
65 --colorMap '$mode.advancedOpt.colorMap'
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
66
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
67 #end if
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
68
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
69 ; mv $newoutFileName $outFileName
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
70 ; rm $temp_dir -rf
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
71 </command>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
72
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
73 <inputs>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
74 <expand macro="multiple_input_bams" />
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
75
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
76 <param name="fragmentLength" type="integer" value="300" min="1"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
77 label="Length of the average fragment size"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
78 help ="Reads will be extended to match this length unless they are paired-end, in which case they will be extended to match the fragment length defined by the two mates. *NOTE*: If the BAM files contain mated and unmated paired-end reads, unmated reads will be extended to match the length given here."/>
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
79
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
80 <param name="corMethod" type="select" label="Correlation method">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
81 <option value="pearson">Pearson</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
82 <option value="spearman">Spearman</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
83 </param>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
84
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
85 <conditional name="mode">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
86 <param name="modeOpt" type="select" label="Choose computation mode"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
87 help="In the bins mode, the correlation is computed based on equal-length bins. In the BED file mode, a list of genomic regions in BED format has to be given. For each region in the BED file the number of overlapping reads is counted in each of the BAM files. Then the correlation is computed.">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
88 <option value="bins" selected="true">Bins</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
89 <option value="BED-file">Limit correlation to certain regions (BED file)</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
90 </param>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
91 <when value="bins">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
92 <param name="binSize" type="integer" value="10000" min="1"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
93 label="Bin size in bp"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
94 help="Length in base pairs for a window used to sample the genome."/>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
95
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
96 <param name="numberOfSamples" type="integer" value="100000" min="1"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
97 label="Number of samples"
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
98 help="Number of bins sampled from the genome for which the reads are counted and the correlation is computed."/>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
99 <expand macro="bamCorrelate_mode_actions" />
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
100 </when>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
101 <when value="BED-file">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
102 <param name="region_file" type="data" format="bed" label="Region file in BED format" help="Correlation is computed for the number of reads that overlap such regions."/>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
103 <expand macro="bamCorrelate_mode_actions" />
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
104 </when>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
105
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
106 </conditional>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
107
14
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
108 <conditional name="outputOpt">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
109 <param name="showOutputOpt" type="select" label="Show additional output options" >
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
110 <option value="no" selected="true">no</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
111 <option value="yes">yes</option>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
112 </param>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
113 <when value="no" />
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
114 <when value="yes">
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
115 <param name="saveRawCounts" type="boolean" label="Save the bin counts"/>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
116 <param name="saveCorMatrix" type="boolean" label="Save the correlation matrix"/>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
117 </when>
b0d64a9930d6 Uploaded
bgruening
parents: 10
diff changeset
118 </conditional>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
119
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
120 </inputs>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
121 <outputs>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
122 <data format="png" name="outFileName" />
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
123 <data format="tabular" name="outFileRawCounts" label="${tool.name} on ${on_string}: bin counts">
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
124 <filter>(outputOpt['showOutputOpt'] == 'yes' and outputOpt['saveRawCounts'] == True)</filter>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
125 </data>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
126 <data format="tabular" name="outFileCorMatrix" label="${tool.name} on ${on_string}: correlation matrix">
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
127 <filter>(outputOpt['showOutputOpt'] == 'yes' and outputOpt['saveCorMatrix'] == True)</filter>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
128 </data>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
129 </outputs>
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
130 <help>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
131
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
132 **What it does**
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
133
5
1f312af2f8db Uploaded
bgruening
parents: 1
diff changeset
134 This tool is useful to assess the overall similarity of different BAM files. A typical application
1f312af2f8db Uploaded
bgruening
parents: 1
diff changeset
135 is to check the correlation between replicates or published data sets.
1f312af2f8db Uploaded
bgruening
parents: 1
diff changeset
136
6
c5847db0cb41 Uploaded
bgruening
parents: 5
diff changeset
137 The tool splits the genome into bins of a given length. For each bin, the number of reads
5
1f312af2f8db Uploaded
bgruening
parents: 1
diff changeset
138 found in each BAM file is counted and a correlation is computed for all
1f312af2f8db Uploaded
bgruening
parents: 1
diff changeset
139 pairs of BAM files.
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
140
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
141
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
142 .. image:: $PATH_TO_IMAGES/QC_bamCorrelate_humanSamples.png
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
143 :alt: Heatmap of RNA Polymerase II ChIP-seq
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
144
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
145
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
146 **Output files**:
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
147
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
148 - diagnostic plot: a clustered heatmap produced by bamCorrelate that displays the value of each pair-wise correlation (see the example above)
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
149 - data matrix (optional): the correlation values, which can be used to plot them with a different program, e.g. R
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
150
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
151
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
152
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
153
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
154 -----
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
155
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
156 .. class:: infomark
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
157
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
158 @REFERENCES@
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
159
10
a68a771625d2 Uploaded
bgruening
parents: 9
diff changeset
160 </help>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
161 </tool>