annotate bamCorrelate.xml @ 2:4762b84d13f5 draft

Uploaded
author bgruening
date Mon, 05 Aug 2013 10:11:32 -0400
parents 21d563d5f2b2
children 1f312af2f8db
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
1 <tool id="bamCorrelate" name="bamCorrelate" version="1.0.1">
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
2 <description>corrlates pairs of bam files</description>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
3 <requirements>
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
4 <requirement type="package" version="1.5.1_59e067cce039cb93add04823c9f51cab202f8c2b">deepTools</requirement>
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
5 </requirements>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
6 <command>
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
7 #import tempfile
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
8 #set $temp_dir = os.path.abspath(tempfile.mkdtemp())
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
9
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
10 #set files=[]
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
11 #set labels=[]
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
12 #for $i in $inputs
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
13
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
14 #set $temp_input_handle = tempfile.NamedTemporaryFile( dir=$temp_dir )
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
15 #set $temp_input_path = $temp_input_handle.name
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
16 #silent $temp_input_handle.close()
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
17 #silent os.system("ln -s %s %s.bam" % (str($i.bamfile), $temp_input_path))
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
18 #silent os.system("ln -s %s %s.bam.bai" % (str($i.bamfile.metadata.bam_index), $temp_input_path))
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
19 #silent $files.append('%s.bam' % $temp_input_path)
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
20
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
21
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
22 ##set $files += [str($i.bamfile)]
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
23 #if str($i.label.value) != "":
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
24 #set $labels += ["\"%s\"" % ($i.label.value)]
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
25 #else
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
26 #set $labels += ["\"%s\"" % ($i.bamfile.name)]
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
27 #end if
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
28 #end for
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
29 bamCorrelate
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
30
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
31 ##ToDo
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
32 --numberOfProcessors 4
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
33
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
34 --bamfiles #echo " ".join($files)
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
35 --labels #echo " ".join($labels)
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
36
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
37 --fragmentLength $fragmentLength
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
38 --corMethod $corMethod
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
39
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
40 #set newoutFileName=str($outFileName)+".png"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
41 --plotFile $newoutFileName
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
42
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
43 #if $outputOpt.showOutputOpt == "yes"
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
44 --outRawCounts '$outFileRawCounts'
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
45 --outFileCorMatrix '$outFileCorMatrix'
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
46 #end if
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
47
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
48 #if $advancedOpt.showAdvancedOpt == "yes":
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
49 #if $advancedOpt.smoothLength:
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
50 --smoothLength '$advancedOpt.smoothLength'
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
51 #end if
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
52
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
53 #if str($advancedOpt.region.value) != '':
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
54 --region '$advancedOpt.region'
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
55 #end if
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
56
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
57 --binSize '$advancedOpt.binSize'
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
58 --numberOfSamples '$advancedOpt.numberOfSamples'
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
59
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
60 $advancedOpt.doNotExtendPairedEnds
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
61 $advancedOpt.ignoreDuplicates
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
62 $advancedOpt.includeZeros
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
63
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
64 #if $advancedOpt.minMappingQuality:
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
65 --minMappingQuality '$advancedOpt.minMappingQuality'
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
66 #end if
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
67 #end if
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
68 ; mv $newoutFileName $outFileName
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
69 ; rm $temp_dir -rf
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
70 </command>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
71
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
72 <inputs>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
73 <repeat name="inputs" title="Input files" min="2">
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
74 <param name="bamfile" type="data" format="bam"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
75 label="Bam file"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
76 help="The BAM file must be sorted and indexed."/>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
77 <param name="label" type="text" size="30" optional="true" value=""
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
78 label="Label"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
79 help="Label to use in the output. If not given the dataset name will be used instead."/>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
80 </repeat>
1
21d563d5f2b2 Uploaded
bgruening
parents: 0
diff changeset
81
0
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
82 <param name="fragmentLength" type="integer" value="300" min="1"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
83 label="Length of the average fragment size"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
84 help ="Reads will be extended to match this length unless they are paired-end, in which case they will be extended to match the fragment length. If this value is set to the read length or smaller, the read will not be extended. *Warning* the fragment length affects the normalization to 1x (see &quot;normalize coverage to 1x&quot;). The formula to normalize using the sequencing depth is genomeSize/(number of mapped reads * fragment length). *NOTE*: If the BAM files contain mated and unmated paired-end reads, unmated reads will be extended to match the fragment length."/>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
85
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
86 <param name="corMethod" type="select" label="Correlation method">
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
87 <option value="pearson">Pearson</option>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
88 <option value="spearman">Spearman</option>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
89 </param>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
90
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
91 <conditional name="advancedOpt">
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
92 <param name="showAdvancedOpt" type="select" label="Show advanced options" >
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
93 <option value="no" selected="true">no</option>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
94 <option value="yes">yes</option>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
95 </param>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
96 <when value="no" />
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
97 <when value="yes">
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
98 <param name="smoothLength" type="integer" value="1" optional="true" min="1"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
99 label="Smooth values using the following length (in bp)"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
100 help ="The smooth length defines a window, larger than the bin size, to average the number of reads. For example, if the bin size is set to 20 bp and the smooth length is set to 60 bp, then, for each bin size the average of it and its left and right neighbors is considered. Any value smaller than the bin size will be ignored and no smoothing will be applied."/>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
101
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
102 <param name="region" type="text" value=""
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
103 label="Region of the genome to limit the operation to"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
104 help="This is useful when testing parameters to reduce the computing time. The format is chr:start:end, for example &quot;chr10&quot; or &quot;chr10:456700:891000&quot;" />
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
105
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
106 <param name="binSize" type="integer" value="10000" min="1"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
107 label="Bin size in bp"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
108 help="Length in base pairs for a window used to sample the genome."/>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
109
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
110 <param name="numberOfSamples" type="integer" value="100000" min="1"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
111 label="Number of samples"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
112 help="Number of samples taken from the genome to compute the scaling factors"/>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
113
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
114 <param name="doNotExtendPairedEnds" type="boolean" truevalue="--doNotExtendPairedEnds" falsevalue=""
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
115 label="Do not extend paired ends"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
116 help="If set, reads are not extended to match the fragment length reported in the BAM file, instead they will be extended to match the fragment length. Default is to extend the reads if paired end information is available."/>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
117
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
118 <param name="ignoreDuplicates" type="boolean" truevalue="--ignoreDuplicates" falsevalue=""
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
119 label="Ignore duplicates"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
120 help="If set, reads that have the same orientation and start position will be considered only once. If reads are paired, the mate position also has to coincide to ignore a read." />
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
121
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
122 <param name="minMappingQuality" type="integer" optional="true" value="1" min="1"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
123 label="Minimum mapping quality"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
124 help= "If set, only reads that have a mapping quality score higher than the given value are considered"/>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
125
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
126 <param name="includeZeros" type="boolean" truevalue="--includeZeros" falsevalue=""
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
127 label ="Include zeros"
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
128 help ="If set, then zero counts that happen for *all* bam files given are included. The default behavior is to ignore those cases" />
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
129
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
130 </when>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
131 </conditional>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
132
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
133 <conditional name="outputOpt">
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
134 <param name="showOutputOpt" type="select" label="Show additional output options" >
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
135 <option value="no" selected="true">no</option>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
136 <option value="yes">yes</option>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
137 </param>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
138 <when value="no" />
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
139 <when value="yes">
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
140 <param name="saveRawCounts" type="boolean" label="Save the bin counts"/>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
141 <param name="saveCorMatrix" type="boolean" label="Save the correlation matrix"/>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
142 </when>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
143 </conditional>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
144
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
145 </inputs>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
146 <outputs>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
147 <data format="png" name="outFileName" />
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
148 <data format="tabular" name="outFileRawCounts" label="${tool.name} on ${on_string}: bin counts">
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
149 <filter>(outputOpt['showOutputOpt'] == 'yes' and outputOpt['saveRawCounts'] == True)</filter>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
150 </data>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
151 <data format="tabular" name="outFileCorMatrix" label="${tool.name} on ${on_string}: correlation matrix">
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
152 <filter>(outputOpt['showOutputOpt'] == 'yes' and outputOpt['saveCorMatrix'] == True)</filter>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
153 </data>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
154 </outputs>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
155 <help>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
156
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
157 **What it does**
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
158
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
159 Genomes are split into bins of given length. For each bin the number of reads
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
160 found for each of the bam files is counted. A correlation is computed for all
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
161 pairs of bam files.
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
162
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
163 -----
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
164
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
165 .. class:: infomark
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
166
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
167 Please acknowledge that this tool **is still in development** and we will be very happy to receive feedback from the users. If you run into any trouble please sent an email to `Fidel Ramirez`_.
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
168
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
169 This tool is developed by the `Bioinformatics and Deep-Sequencing Unit`_ at the `Max Planck Institute for Immunobiology and Epigenetics`_.
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
170
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
171
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
172 .. _Bioinformatics and Deep-Sequencing Unit: http://www3.ie-freiburg.mpg.de/facilities/research-facilities/bioinformatics-and-deep-sequencing-unit/
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
173 .. _Max Planck Institute for Immunobiology and Epigenetics: http://www3.ie-freiburg.mpg.de
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
174 .. _Fidel Ramirez: ramirez@ie-freiburg.mpg.de
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
175
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
176 </help>
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
177
09b65c12a75a Uploaded
bgruening
parents:
diff changeset
178 </tool>