Mercurial > repos > bgruening > deeptools
comparison computeGCBias.xml @ 10:a68a771625d2 draft
Uploaded
author | bgruening |
---|---|
date | Tue, 29 Oct 2013 17:26:28 -0400 |
parents | 73761f33f198 |
children | 351cd1f8791b |
comparison
equal
deleted
inserted
replaced
9:73761f33f198 | 10:a68a771625d2 |
---|---|
1 <tool id="deeptools_computeGCBias" name="computeGCBias" version="1.0.1"> | 1 <tool id="deeptools_computeGCBias" name="computeGCBias" version="1.0.1"> |
2 <description>to see whether your samples should be normalized for GC bias</description> | 2 <description>to see whether your samples should be normalized for GC bias</description> |
3 | 3 <expand macro="requirements" /> |
4 <requirements> | 4 <stdio> |
5 <requirement type="package" version="1.5.1_3e13687c89e951476776b15afb4bbbc3b906f761">deepTools</requirement> | 5 <exit_code range="0" level="warning" description="Warning" /> |
6 <requirement type="package" >deepTools</requirement> | 6 </stdio> |
7 </requirements> | 7 <macros> |
8 <stdio> | 8 <import>deepTools_macros.xml</import> |
9 <exit_code range="0" level="warning" description="Warning" /> | 9 </macros> |
10 </stdio> | 10 <command> |
11 <command> | 11 #import tempfile |
12 #import tempfile | 12 #set $temp_dir = os.path.abspath(tempfile.mkdtemp()) |
13 #set $temp_dir = os.path.abspath(tempfile.mkdtemp()) | |
14 | 13 |
15 #set $temp_bam_handle = tempfile.NamedTemporaryFile( dir=$temp_dir ) | 14 #set $temp_bam_handle = tempfile.NamedTemporaryFile( dir=$temp_dir ) |
16 #set $temp_bam_path = $temp_bam_handle.name + '.bam' | 15 #set $temp_bam_path = $temp_bam_handle.name + '.bam' |
17 #silent $temp_bam_handle.close() | 16 #silent $temp_bam_handle.close() |
18 #silent os.system("ln -s %s %s" % (str($bamInput), $temp_bam_path)) | 17 #silent os.system("ln -s %s %s" % (str($bamInput), $temp_bam_path)) |
19 #silent os.system("ln -s %s %s.bai" % (str($bamInput.metadata.bam_index), $temp_bam_path)) | 18 #silent os.system("ln -s %s %s.bai" % (str($bamInput.metadata.bam_index), $temp_bam_path)) |
20 | 19 |
21 computeGCBias | 20 computeGCBias |
22 | 21 |
23 ##ToDo | 22 @THREADS@ |
24 --numberOfProcessors 4 | |
25 | 23 |
26 --bamfile '$temp_bam_path' | 24 --bamfile '$temp_bam_path' |
27 --species '$species' | |
28 --GCbiasFrequenciesFile $outFileName | 25 --GCbiasFrequenciesFile $outFileName |
29 --fragmentLength $fragmentLength | 26 --fragmentLength $fragmentLength |
30 | 27 |
31 #if $source.ref_source=="history": | 28 @reference_genome_source@ |
32 --genome $source.input1 | 29 |
30 | |
31 #if $effectiveGenomeSize.effectiveGenomeSize_opt == "specific": | |
32 --effectiveGenomeSize $effectiveGenomeSize.effectiveGenomeSize | |
33 #else: | 33 #else: |
34 --genome "${source.input1_2bit.fields.path}" | 34 --effectiveGenomeSize $effectiveGenomeSize.effectiveGenomeSize_opt |
35 #end if | 35 #end if |
36 | |
36 | 37 |
37 #if $advancedOpt.showAdvancedOpt == "yes": | 38 #if $advancedOpt.showAdvancedOpt == "yes": |
38 #if str($advancedOpt.region.value) != '': | 39 #if str($advancedOpt.region.value) != '': |
39 --region '$advancedOpt.region' | 40 --region '$advancedOpt.region' |
40 #end if | 41 #end if |
41 | 42 |
42 --binSize '$advancedOpt.binSize' | |
43 --sampleSize '$advancedOpt.sampleSize' | 43 --sampleSize '$advancedOpt.sampleSize' |
44 --regionSize '$advancedOpt.regionSize' | 44 --regionSize '$advancedOpt.regionSize' |
45 | 45 |
46 #if $advancedOpt.filterOut: | 46 #if $advancedOpt.filterOut: |
47 --filterOut $advancedOpt.filterOut | 47 --filterOut $advancedOpt.filterOut |
64 ## #end if | 64 ## #end if |
65 ## #end if | 65 ## #end if |
66 | 66 |
67 ; rm $temp_dir -rf | 67 ; rm $temp_dir -rf |
68 | 68 |
69 </command> | 69 </command> |
70 <inputs> | 70 <inputs> |
71 | 71 |
72 <param name="bamInput" format="bam" type="data" label="Input BAM file" | 72 <param name="bamInput" format="bam" type="data" label="Input BAM file" |
73 help="The BAM file must be sorted."/> | 73 help="The BAM file must be sorted."/> |
74 <!--<param name="species" type="text" value="" label="Species name abbreviation" />--> | |
75 | 74 |
76 <param name="species" type="select" label="Species name abbreviation"> | 75 <expand macro="reference_genome_source" /> |
77 <option value="hg19">hg19</option> | 76 <expand macro="effectiveGenomeSize" /> |
78 <option value="ce10">ce10</option> | |
79 <option value="dm3">dm3</option> | |
80 <option value="mm9">mm9</option> | |
81 </param> | |
82 | 77 |
83 <conditional name="source"> | |
84 <param name="ref_source" type="select" label="Reference genome"> | |
85 <option value="cached">locally cached</option> | |
86 <option value="history">in your history</option> | |
87 </param> | |
88 <when value="cached"> | |
89 <param name="input1_2bit" type="select" label="Using reference genome" help="If your genome of interest is not listed, contact the Galaxy team"> | |
90 <options from_data_table="deepTools_seqs" /> | |
91 </param> | |
92 </when> | |
93 <when value="history"> | |
94 <param name="input1" type="data" format="twobit" label="Select a reference dataset in 2bit format" /> | |
95 </when> | |
96 </conditional> | |
97 <param name="fragmentLength" type="integer" value="300" min="1" | 78 <param name="fragmentLength" type="integer" value="300" min="1" |
98 label="Fragment length used for the sequencing" | 79 label="Fragment length used for the sequencing" |
99 help ="If paired-end reads are used, the fragment length is computed from the BAM file."/> | 80 help ="If paired-end reads are used, the fragment length is computed from the BAM file."/> |
100 | 81 |
101 <conditional name="advancedOpt"> | 82 <conditional name="advancedOpt"> |
106 <when value="no" /> | 87 <when value="no" /> |
107 <when value="yes"> | 88 <when value="yes"> |
108 <param name="region" type="text" value="" | 89 <param name="region" type="text" value="" |
109 label="Region of the genome to limit the operation to" | 90 label="Region of the genome to limit the operation to" |
110 help="This is useful when testing parameters to reduce the computing time. The format is chr:start:end, for example "chr10" or "chr10:456700:891000"" /> | 91 help="This is useful when testing parameters to reduce the computing time. The format is chr:start:end, for example "chr10" or "chr10:456700:891000"" /> |
111 | |
112 <param name="binSize" type="integer" value="50" min="1" | |
113 label="Bin size in bp" | |
114 help="Size of the bins in bp for the ouput of the bigwig/bedgraph file."/> | |
115 | 92 |
116 <param name="sampleSize" type="integer" value="50000000" min="1" | 93 <param name="sampleSize" type="integer" value="50000000" min="1" |
117 label="Number of sampling points to be considered" /> | 94 label="Number of sampling points to be considered" /> |
118 | 95 |
119 <param name="regionSize" type="integer" value="300" min="1" | 96 <param name="regionSize" type="integer" value="300" min="1" |
169 sequencing as it only depends on the respective reference genome (i.e. it will most likely vary between mouse and fruit fly due to their genome's different GC contents). | 146 sequencing as it only depends on the respective reference genome (i.e. it will most likely vary between mouse and fruit fly due to their genome's different GC contents). |
170 The OBSERVED values are based on the reads from the sequenced sample. Instead of noting how many genomic regions there are per GC content, we now count the reads per GC content. | 147 The OBSERVED values are based on the reads from the sequenced sample. Instead of noting how many genomic regions there are per GC content, we now count the reads per GC content. |
171 In an ideal sample without GC bias, the ratio of OBSERVED/EXPECTED values should be close to 1 regardless of the GC content. Due to PCR (over)amplifications, the majority of ChIP samples | 148 In an ideal sample without GC bias, the ratio of OBSERVED/EXPECTED values should be close to 1 regardless of the GC content. Due to PCR (over)amplifications, the majority of ChIP samples |
172 usually shows a significant bias towards reads with high GC content (>50%) | 149 usually shows a significant bias towards reads with high GC content (>50%) |
173 | 150 |
151 .. image:: $PATH_TO_IMAGES/QC_GCplots_input.png | |
152 | |
153 | |
154 **Output files**: | |
155 | |
156 - Diagnostic plot | |
157 | |
158 - box plot of absolute read numbers per genomic GC bin | |
159 - x-y plot of observed/expected read ratios per genomic GC content bin | |
160 | |
161 - Data matrix | |
162 | |
163 - to be used for GC correction with correctGCbias | |
164 | |
165 | |
174 ----- | 166 ----- |
175 | 167 |
176 .. class:: infomark | 168 .. class:: infomark |
177 | 169 |
178 If you would like to give us feedback or you run into any trouble, please send an email to deeptools@googlegroups.com | 170 @REFERENCES@ |
179 | 171 |
180 This tool is developed by the `Bioinformatics and Deep-Sequencing Unit`_ at the `Max Planck Institute for Immunobiology and Epigenetics`_. | 172 </help> |
181 | |
182 .. _Bioinformatics and Deep-Sequencing Unit: http://www3.ie-freiburg.mpg.de/facilities/research-facilities/bioinformatics-and-deep-sequencing-unit/ | |
183 .. _Max Planck Institute for Immunobiology and Epigenetics: http://www3.ie-freiburg.mpg.de | |
184 | |
185 </help> | |
186 </tool> | 173 </tool> |