Mercurial > repos > jjohnson > cistrome_ceas
comparison ceas.xml @ 0:4e52505adaa6
Imported from capsule None
author | jjohnson |
---|---|
date | Wed, 17 Sep 2014 15:03:26 -0400 |
parents | |
children |
comparison
equal
deleted
inserted
replaced
-1:000000000000 | 0:4e52505adaa6 |
---|---|
1 <tool name="CEAS: Enrichment on chromosome and annotation" id="ceas_ceas" version="0.1.0"> | |
2 <description>Annotate the given intervals and scores with genome features such as gene body</description> | |
3 <macros> | |
4 <import>ceas_macros.xml</import> | |
5 </macros> | |
6 <expand macro="requirements_bx" /> | |
7 <command> | |
8 #import os.path | |
9 #if $genegroup.enable == "yes" | |
10 #set $gngroups = str($genegroup.genelist) | |
11 #set $gnlabels = str($genegroup.label) | |
12 #for $m in $genegroup.more | |
13 #set $gngroups = $gngroups+","+str($m.genelist) | |
14 #set $gnlabels = $gnlabels+","+str($m.label) | |
15 #end for | |
16 #set $gngroupspara = "--gn-groups="+$gngroups | |
17 #set $gnlabelspara = "--gn-group-names='"+$gnlabels+"'"+str($genegroup.idtype.value) | |
18 #else | |
19 #set $gngroupspara = "" | |
20 #set $gnlabelspara = "" | |
21 #end if | |
22 #set $sizes = str($lowersize) + "," + str($middlesize) + "," + str($uppersize) | |
23 #set $bisizes = str($lowerbisize) + "," + str($upperbisize) | |
24 #if $wfile: | |
25 #if $wfile.extension == "bigwig" | |
26 ceasBW -w $wfile | |
27 #set dbkey = $wfile.metadata.dbkey | |
28 #set $length_file = os.path.join( os.path.abspath($__app__.config.len_file_path), $dbkey+".len" ) | |
29 -l $length_file | |
30 #else | |
31 ceas -w $wfile | |
32 #end if | |
33 #else | |
34 ceas | |
35 #end if | |
36 #if $bfile: | |
37 -b $bfile | |
38 #end if | |
39 #include source=$gtpath_ceasdb_ref# | |
40 --span=$span --pf-res=$pfres --sizes=$sizes --bisizes=$bisizes | |
41 --rel-dist=$reldist $gngroupspara $gnlabelspara --name=$name &> $log && | |
42 Rscript ceas_out.R && | |
43 #if $imagetype.__str__ == "PNG": | |
44 convert ceas_out.pdf ceas_out.png && convert ceas_out-*.png -append ceas_out_joint.png && | |
45 cp ceas_out_joint.png $output | |
46 #else | |
47 cp ceas_out.pdf $output | |
48 #end if | |
49 </command> | |
50 <inputs> | |
51 <expand macro="ceasdb_ref" /> | |
52 <param name="name" type="hidden" value="ceas_out"/> | |
53 <param format="wig,bigwig" name="wfile" type="data" label="wig / bigwig file" optional="true"> | |
54 <validator type="unspecified_build" /> | |
55 </param> | |
56 <param format="bed" name="bfile" type="data" label="BED file(maximum 100000 lines)" optional="true"> | |
57 <validator type="unspecified_build" /> | |
58 </param> | |
59 <param name="span" type="integer" label="Span" value="3000"> | |
60 <validator type="in_range" max="1000000" min="100" message="The Span is out of range, the parameter has to be between 100 to 1000000" /> | |
61 </param> | |
62 <param name="pfres" type="integer" label="Profiling resolution" value="50"> | |
63 <validator type="in_range" max="1000" min="10" message="The Profiling Resolution is out of range, the parameter has to be between 10 to 1000" /> | |
64 </param> | |
65 <param name="lowersize" type="text" label="Promoter/downstream lower-interval" value="1000" > | |
66 <validator type="in_range" max="10000" min="100" message="The lower-interval is out of range, the parameter has to be between 100 to 10000" /> | |
67 </param> | |
68 <param name="middlesize" type="text" label="Promoter/downstream middle-interval" value="2000" > | |
69 <validator type="in_range" max="10000" min="100" message="The middle-interval is out of range, the parameter has to be between 100 to 10000" /> | |
70 </param> | |
71 <param name="uppersize" type="text" label="Promoter/downstream upper-interval" value="3000"> | |
72 <validator type="in_range" max="10000" min="100" message="The upper-interval is out of range, the parameter has to be between 100 to 10000" /> | |
73 </param> | |
74 <param name="lowerbisize" type="text" label="Bi-Promoter lower range" value="2500"> | |
75 <validator type="in_range" max="10000" min="100" message="The lower-range is out of range, the parameter has to be between 100 to 10000" /> | |
76 </param> | |
77 <param name="upperbisize" type="text" label="Bi-Promoter upper range" value="5000"> | |
78 <validator type="in_range" max="10000" min="100" message="The upper-range is out of range, the parameter has to be between 100 to 10000" /> | |
79 </param> | |
80 <param name="reldist" type="integer" label="Relative distance" value="3000"> | |
81 <validator type="in_range" max="10000" min="100" message="The Relative distance is out of range, the parameter has to be between 100 to 10000" /> | |
82 </param> | |
83 <param type="select" name="imagetype" display="radio" label="Image Type"> | |
84 <option value="PNG">PNG format</option> | |
85 <option value="PDF">PDF format</option> | |
86 </param> | |
87 | |
88 <conditional name="genegroup"> | |
89 <param name="enable" type="select" label="Specify gene list in the signal profiling" force_select="true"> | |
90 <option value="no">No</option> | |
91 <option value="yes">Yes</option> | |
92 </param> | |
93 | |
94 <when value="no"> | |
95 </when> | |
96 | |
97 <when value="yes"> | |
98 <param format="text" name="genelist" type="data" label="Gene List" optional="false"/> | |
99 <param name="label" type="text" label="Gene List Label" optional="false" /> | |
100 <repeat name="more" title="Gene Lists"> | |
101 <param format="text" name="genelist" type="data" label="Gene List" optional="false"/> | |
102 <param name="label" type="text" label="Gene List Label" optional="false" /> | |
103 </repeat> | |
104 <param name="idtype" type="select" label="Are they ..."> | |
105 <option value="">refseq</option> | |
106 <option value=" --gname2">genesymbol</option> | |
107 </param> | |
108 </when> | |
109 </conditional> | |
110 | |
111 </inputs> | |
112 | |
113 <outputs> | |
114 <data format="png" name="output"> | |
115 <change_format> | |
116 <when input="imagetype" value="PDF" format="pdf" /> | |
117 </change_format> | |
118 </data> | |
119 <data format="txt" name="log" label="ceas job log" /> | |
120 </outputs> | |
121 <expand macro="stdio" /> | |
122 <tests> | |
123 <test> | |
124 <param name="wfile" value="treatment.wig" /> | |
125 <param name="bfile" value="peaks.bed" /> | |
126 <param name="span" value="3000" /> | |
127 <param name="pfres" value="50" /> | |
128 <param name="lowersize" value="1000" /> | |
129 <param name="middlesize" value="2000" /> | |
130 <param name="uppersize" value="3000" /> | |
131 <param name="lowerbisize" value="2500" /> | |
132 <param name="upperbisize" value="5000" /> | |
133 <param name="reldist" value="3000" /> | |
134 <param name="refsrc" value="history"/> | |
135 <param name="gdb" ftype="ceasdb" value="mm9.refGene.ceasdb"/> | |
136 <param name="imagetype" value="PDF" /> | |
137 <param name="enable" value="no" /> | |
138 <output name="log"> | |
139 <assert_contents> | |
140 <has_text_matching expression="See ceas_out.pdf for the graphical results of CEAS" /> | |
141 </assert_contents> | |
142 </output> | |
143 </test> | |
144 <test> | |
145 <param name="wfile" value="treatment.bigwig" /> | |
146 <param name="bfile" value="peaks.bed" /> | |
147 <param name="span" value="3000" /> | |
148 <param name="pfres" value="50" /> | |
149 <param name="lowersize" value="1000" /> | |
150 <param name="middlesize" value="2000" /> | |
151 <param name="uppersize" value="3000" /> | |
152 <param name="lowerbisize" value="2500" /> | |
153 <param name="upperbisize" value="5000" /> | |
154 <param name="reldist" value="3000" /> | |
155 <param name="refsrc" value="history"/> | |
156 <param name="gdb" ftype="ceasdb" value="mm9.refGene.ceasdb"/> | |
157 <param name="imagetype" value="PDF" /> | |
158 <param name="enable" value="no" /> | |
159 <output name="log"> | |
160 <assert_contents> | |
161 <has_text_matching expression="See ceas_out.pdf for the graphical results of CEAS" /> | |
162 </assert_contents> | |
163 </output> | |
164 </test> | |
165 </tests> | |
166 <help> | |
167 ** CEAS ** | |
168 This tool annotates the given intervals and scores with genome | |
169 features such as gene body. It's the major module in CEAS package | |
170 which is written by Hyunjin Gene Shin, published in Bioinformatics | |
171 (pubmed id:19689956). | |
172 | |
173 @EXTERNAL_DOCUMENTATION@ | |
174 | |
175 @CITATION_SECTION@ | |
176 | |
177 | |
178 .. class:: warningmark | |
179 | |
180 **NEED IMPROVEMENT** | |
181 | |
182 ----- | |
183 | |
184 **Parameters** | |
185 | |
186 - **WIGGLE file** contains the scores for the experiment in a wiggle | |
187 format file. Normally, it's produced by the peak calling tool. It's | |
188 optional. | |
189 - **BED file** contains the peak locations for the experiment in a BED | |
190 format file. | |
191 - **Span** from TSS and TTS in the gene-centered annotation. ChIP | |
192 regions within this range from TSS and TTS are considered when | |
193 calculating the coverage rates in promoter and downstream. | |
194 - **Profiling resolution** is the WIGGLE profiling resolution. | |
195 - **Promoter/downstream intervals** for ChIP region annotation are | |
196 comma-separated three values or a single value can be given. If a | |
197 single value is given, it will be segmented into three equal | |
198 fractions (ie, 3000 is equivalent to 1000,2000,3000) | |
199 - **BiPromoter ranges** is for ChIP region annotation. It's | |
200 comma-separated two values or a single value can be given. If a | |
201 single value is given, it will be segmented into two equal fractions | |
202 (ie, 5000 is equivalent to 2500,5000) | |
203 - **Relative distance** is the relative distance to TSS/TTS in WIGGLE file | |
204 profiling | |
205 - **Genome Annotation Version** to specify the annotations according to | |
206 the data set. The annotations are downloaded from UCSC genome site. | |
207 - **Image type** specify the output image format, either in PNG or in | |
208 PDF format. | |
209 - If **Specify gene list in the signal profiling** is set, you can specify | |
210 different gene groups for CEAS to put them together in the profile | |
211 figure. You need to select several **Gene List** files from history which | |
212 contains the RefSeq ids or Gene Symbols for each row, and | |
213 **Gene List Label** for each gene list file. | |
214 | |
215 ----- | |
216 | |
217 **Outputs** | |
218 | |
219 - **PNG/PDF file** is the result for CEAS analysis, containing 5 pages. | |
220 - **LOG file** for job log. If you see errors, please attached this in | |
221 the bug report | |
222 | |
223 ----- | |
224 | |
225 **script parameter list of CEAS 0.9.8** | |
226 | |
227 Options: | |
228 --version show program's version number and exit | |
229 -h, --help Show this help message and exit. | |
230 -b BED, --bed=BED BED file of ChIP regions. | |
231 -w WIG, --wig=WIG WIG file for either wig profiling or genome background | |
232 annotation. WARNING: --bg flag must be set for genome | |
233 background re-annotation. | |
234 -e EBED, --ebed=EBED BED file of extra regions of interest (eg, non-coding | |
235 regions) | |
236 -g GDB, --gt=GDB Gene annotation table (eg, a refGene table in sqlite3 | |
237 db format provided through the CEAS web, | |
238 http://liulab.dfci.harvard.edu/CEAS/download.html). | |
239 --name=NAME Experiment name. This will be used to name the output | |
240 files. If an experiment name is not given, the stem of | |
241 the input BED file name will be used instead (eg, if | |
242 'peaks.bed', 'peaks' will be used as a name.) | |
243 --sizes=SIZES Promoter (also dowsntream) sizes for ChIP region | |
244 annotation. Comma-separated three values or a single | |
245 value can be given. If a single value is given, it | |
246 will be segmented into three equal fractions (ie, 3000 | |
247 is equivalent to 1000,2000,3000), DEFAULT: | |
248 1000,2000,3000. WARNING: Values > 10000bp are | |
249 automatically set to 10000bp. | |
250 --bisizes=BISIZES Bidirectional-promoter sizes for ChIP region | |
251 annotation Comma-separated two values or a single | |
252 value can be given. If a single value is given, it | |
253 will be segmented into two equal fractions (ie, 5000 | |
254 is equivalent to 2500,5000) DEFAULT: 2500,5000bp. | |
255 WARNING: Values > 20000bp are automatically set to | |
256 20000bp. | |
257 --bg Run genome BG annotation again. WARNING: This flag is | |
258 effective only if a WIG file is given through -w | |
259 (--wig). Otherwise, ignored. | |
260 --span=SPAN Span from TSS and TTS in the gene-centered annotation. | |
261 ChIP regions within this range from TSS and TTS are | |
262 considered when calculating the coverage rates in | |
263 promoter and downstream, DEFAULT=3000bp | |
264 --pf-res=PF_RES Wig profiling resolution, DEFAULT: 50bp. WARNING: | |
265 Value smaller than the wig interval (resolution) may | |
266 cause aliasing error. | |
267 --rel-dist=REL_DIST Relative distance to TSS/TTS in wig profiling, | |
268 DEFAULT: 3000bp | |
269 --gn-groups=GN_GROUPS | |
270 Gene-groups of particular interest in wig profiling. | |
271 Each gene group file must have gene names in the 1st | |
272 column. The file names are separated by commas w/ no | |
273 space (eg, --gn-groups=top10.txt,bottom10.txt) | |
274 --gn-group-names=GN_NAMES | |
275 The names of the gene groups in --gn-groups. The gene | |
276 group names are separated by commas. (eg, --gn-group- | |
277 names='top 10%,bottom 10%'). These group names appear | |
278 in the legends of the wig profiling plots. If no group | |
279 names given, the groups are represented as 'Group 1, | |
280 Group2,...Group n'. | |
281 --gname2 Whether or not use the 'name2' column of the gene | |
282 annotation table when reading the gene IDs in the | |
283 files given through --gn-groups. This flag is | |
284 meaningful only with --gn-groups. | |
285 | |
286 </help> | |
287 | |
288 </tool> |