comparison ceas.xml @ 0:4e52505adaa6

Imported from capsule None
author jjohnson
date Wed, 17 Sep 2014 15:03:26 -0400
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:4e52505adaa6
1 <tool name="CEAS: Enrichment on chromosome and annotation" id="ceas_ceas" version="0.1.0">
2 <description>Annotate the given intervals and scores with genome features such as gene body</description>
3 <macros>
4 <import>ceas_macros.xml</import>
5 </macros>
6 <expand macro="requirements_bx" />
7 <command>
8 #import os.path
9 #if $genegroup.enable == "yes"
10 #set $gngroups = str($genegroup.genelist)
11 #set $gnlabels = str($genegroup.label)
12 #for $m in $genegroup.more
13 #set $gngroups = $gngroups+","+str($m.genelist)
14 #set $gnlabels = $gnlabels+","+str($m.label)
15 #end for
16 #set $gngroupspara = "--gn-groups="+$gngroups
17 #set $gnlabelspara = "--gn-group-names='"+$gnlabels+"'"+str($genegroup.idtype.value)
18 #else
19 #set $gngroupspara = ""
20 #set $gnlabelspara = ""
21 #end if
22 #set $sizes = str($lowersize) + "," + str($middlesize) + "," + str($uppersize)
23 #set $bisizes = str($lowerbisize) + "," + str($upperbisize)
24 #if $wfile:
25 #if $wfile.extension == "bigwig"
26 ceasBW -w $wfile
27 #set dbkey = $wfile.metadata.dbkey
28 #set $length_file = os.path.join( os.path.abspath($__app__.config.len_file_path), $dbkey+".len" )
29 -l $length_file
30 #else
31 ceas -w $wfile
32 #end if
33 #else
34 ceas
35 #end if
36 #if $bfile:
37 -b $bfile
38 #end if
39 #include source=$gtpath_ceasdb_ref#
40 --span=$span --pf-res=$pfres --sizes=$sizes --bisizes=$bisizes
41 --rel-dist=$reldist $gngroupspara $gnlabelspara --name=$name &amp;> $log &amp;&amp;
42 Rscript ceas_out.R &amp;&amp;
43 #if $imagetype.__str__ == "PNG":
44 convert ceas_out.pdf ceas_out.png &amp;&amp; convert ceas_out-*.png -append ceas_out_joint.png &amp;&amp;
45 cp ceas_out_joint.png $output
46 #else
47 cp ceas_out.pdf $output
48 #end if
49 </command>
50 <inputs>
51 <expand macro="ceasdb_ref" />
52 <param name="name" type="hidden" value="ceas_out"/>
53 <param format="wig,bigwig" name="wfile" type="data" label="wig / bigwig file" optional="true">
54 <validator type="unspecified_build" />
55 </param>
56 <param format="bed" name="bfile" type="data" label="BED file(maximum 100000 lines)" optional="true">
57 <validator type="unspecified_build" />
58 </param>
59 <param name="span" type="integer" label="Span" value="3000">
60 <validator type="in_range" max="1000000" min="100" message="The Span is out of range, the parameter has to be between 100 to 1000000" />
61 </param>
62 <param name="pfres" type="integer" label="Profiling resolution" value="50">
63 <validator type="in_range" max="1000" min="10" message="The Profiling Resolution is out of range, the parameter has to be between 10 to 1000" />
64 </param>
65 <param name="lowersize" type="text" label="Promoter/downstream lower-interval" value="1000" >
66 <validator type="in_range" max="10000" min="100" message="The lower-interval is out of range, the parameter has to be between 100 to 10000" />
67 </param>
68 <param name="middlesize" type="text" label="Promoter/downstream middle-interval" value="2000" >
69 <validator type="in_range" max="10000" min="100" message="The middle-interval is out of range, the parameter has to be between 100 to 10000" />
70 </param>
71 <param name="uppersize" type="text" label="Promoter/downstream upper-interval" value="3000">
72 <validator type="in_range" max="10000" min="100" message="The upper-interval is out of range, the parameter has to be between 100 to 10000" />
73 </param>
74 <param name="lowerbisize" type="text" label="Bi-Promoter lower range" value="2500">
75 <validator type="in_range" max="10000" min="100" message="The lower-range is out of range, the parameter has to be between 100 to 10000" />
76 </param>
77 <param name="upperbisize" type="text" label="Bi-Promoter upper range" value="5000">
78 <validator type="in_range" max="10000" min="100" message="The upper-range is out of range, the parameter has to be between 100 to 10000" />
79 </param>
80 <param name="reldist" type="integer" label="Relative distance" value="3000">
81 <validator type="in_range" max="10000" min="100" message="The Relative distance is out of range, the parameter has to be between 100 to 10000" />
82 </param>
83 <param type="select" name="imagetype" display="radio" label="Image Type">
84 <option value="PNG">PNG format</option>
85 <option value="PDF">PDF format</option>
86 </param>
87
88 <conditional name="genegroup">
89 <param name="enable" type="select" label="Specify gene list in the signal profiling" force_select="true">
90 <option value="no">No</option>
91 <option value="yes">Yes</option>
92 </param>
93
94 <when value="no">
95 </when>
96
97 <when value="yes">
98 <param format="text" name="genelist" type="data" label="Gene List" optional="false"/>
99 <param name="label" type="text" label="Gene List Label" optional="false" />
100 <repeat name="more" title="Gene Lists">
101 <param format="text" name="genelist" type="data" label="Gene List" optional="false"/>
102 <param name="label" type="text" label="Gene List Label" optional="false" />
103 </repeat>
104 <param name="idtype" type="select" label="Are they ...">
105 <option value="">refseq</option>
106 <option value=" --gname2">genesymbol</option>
107 </param>
108 </when>
109 </conditional>
110
111 </inputs>
112
113 <outputs>
114 <data format="png" name="output">
115 <change_format>
116 <when input="imagetype" value="PDF" format="pdf" />
117 </change_format>
118 </data>
119 <data format="txt" name="log" label="ceas job log" />
120 </outputs>
121 <expand macro="stdio" />
122 <tests>
123 <test>
124 <param name="wfile" value="treatment.wig" />
125 <param name="bfile" value="peaks.bed" />
126 <param name="span" value="3000" />
127 <param name="pfres" value="50" />
128 <param name="lowersize" value="1000" />
129 <param name="middlesize" value="2000" />
130 <param name="uppersize" value="3000" />
131 <param name="lowerbisize" value="2500" />
132 <param name="upperbisize" value="5000" />
133 <param name="reldist" value="3000" />
134 <param name="refsrc" value="history"/>
135 <param name="gdb" ftype="ceasdb" value="mm9.refGene.ceasdb"/>
136 <param name="imagetype" value="PDF" />
137 <param name="enable" value="no" />
138 <output name="log">
139 <assert_contents>
140 <has_text_matching expression="See ceas_out.pdf for the graphical results of CEAS" />
141 </assert_contents>
142 </output>
143 </test>
144 <test>
145 <param name="wfile" value="treatment.bigwig" />
146 <param name="bfile" value="peaks.bed" />
147 <param name="span" value="3000" />
148 <param name="pfres" value="50" />
149 <param name="lowersize" value="1000" />
150 <param name="middlesize" value="2000" />
151 <param name="uppersize" value="3000" />
152 <param name="lowerbisize" value="2500" />
153 <param name="upperbisize" value="5000" />
154 <param name="reldist" value="3000" />
155 <param name="refsrc" value="history"/>
156 <param name="gdb" ftype="ceasdb" value="mm9.refGene.ceasdb"/>
157 <param name="imagetype" value="PDF" />
158 <param name="enable" value="no" />
159 <output name="log">
160 <assert_contents>
161 <has_text_matching expression="See ceas_out.pdf for the graphical results of CEAS" />
162 </assert_contents>
163 </output>
164 </test>
165 </tests>
166 <help>
167 ** CEAS **
168 This tool annotates the given intervals and scores with genome
169 features such as gene body. It's the major module in CEAS package
170 which is written by Hyunjin Gene Shin, published in Bioinformatics
171 (pubmed id:19689956).
172
173 @EXTERNAL_DOCUMENTATION@
174
175 @CITATION_SECTION@
176
177
178 .. class:: warningmark
179
180 **NEED IMPROVEMENT**
181
182 -----
183
184 **Parameters**
185
186 - **WIGGLE file** contains the scores for the experiment in a wiggle
187 format file. Normally, it's produced by the peak calling tool. It's
188 optional.
189 - **BED file** contains the peak locations for the experiment in a BED
190 format file.
191 - **Span** from TSS and TTS in the gene-centered annotation. ChIP
192 regions within this range from TSS and TTS are considered when
193 calculating the coverage rates in promoter and downstream.
194 - **Profiling resolution** is the WIGGLE profiling resolution.
195 - **Promoter/downstream intervals** for ChIP region annotation are
196 comma-separated three values or a single value can be given. If a
197 single value is given, it will be segmented into three equal
198 fractions (ie, 3000 is equivalent to 1000,2000,3000)
199 - **BiPromoter ranges** is for ChIP region annotation. It's
200 comma-separated two values or a single value can be given. If a
201 single value is given, it will be segmented into two equal fractions
202 (ie, 5000 is equivalent to 2500,5000)
203 - **Relative distance** is the relative distance to TSS/TTS in WIGGLE file
204 profiling
205 - **Genome Annotation Version** to specify the annotations according to
206 the data set. The annotations are downloaded from UCSC genome site.
207 - **Image type** specify the output image format, either in PNG or in
208 PDF format.
209 - If **Specify gene list in the signal profiling** is set, you can specify
210 different gene groups for CEAS to put them together in the profile
211 figure. You need to select several **Gene List** files from history which
212 contains the RefSeq ids or Gene Symbols for each row, and
213 **Gene List Label** for each gene list file.
214
215 -----
216
217 **Outputs**
218
219 - **PNG/PDF file** is the result for CEAS analysis, containing 5 pages.
220 - **LOG file** for job log. If you see errors, please attached this in
221 the bug report
222
223 -----
224
225 **script parameter list of CEAS 0.9.8**
226
227 Options:
228 --version show program's version number and exit
229 -h, --help Show this help message and exit.
230 -b BED, --bed=BED BED file of ChIP regions.
231 -w WIG, --wig=WIG WIG file for either wig profiling or genome background
232 annotation. WARNING: --bg flag must be set for genome
233 background re-annotation.
234 -e EBED, --ebed=EBED BED file of extra regions of interest (eg, non-coding
235 regions)
236 -g GDB, --gt=GDB Gene annotation table (eg, a refGene table in sqlite3
237 db format provided through the CEAS web,
238 http://liulab.dfci.harvard.edu/CEAS/download.html).
239 --name=NAME Experiment name. This will be used to name the output
240 files. If an experiment name is not given, the stem of
241 the input BED file name will be used instead (eg, if
242 'peaks.bed', 'peaks' will be used as a name.)
243 --sizes=SIZES Promoter (also dowsntream) sizes for ChIP region
244 annotation. Comma-separated three values or a single
245 value can be given. If a single value is given, it
246 will be segmented into three equal fractions (ie, 3000
247 is equivalent to 1000,2000,3000), DEFAULT:
248 1000,2000,3000. WARNING: Values > 10000bp are
249 automatically set to 10000bp.
250 --bisizes=BISIZES Bidirectional-promoter sizes for ChIP region
251 annotation Comma-separated two values or a single
252 value can be given. If a single value is given, it
253 will be segmented into two equal fractions (ie, 5000
254 is equivalent to 2500,5000) DEFAULT: 2500,5000bp.
255 WARNING: Values > 20000bp are automatically set to
256 20000bp.
257 --bg Run genome BG annotation again. WARNING: This flag is
258 effective only if a WIG file is given through -w
259 (--wig). Otherwise, ignored.
260 --span=SPAN Span from TSS and TTS in the gene-centered annotation.
261 ChIP regions within this range from TSS and TTS are
262 considered when calculating the coverage rates in
263 promoter and downstream, DEFAULT=3000bp
264 --pf-res=PF_RES Wig profiling resolution, DEFAULT: 50bp. WARNING:
265 Value smaller than the wig interval (resolution) may
266 cause aliasing error.
267 --rel-dist=REL_DIST Relative distance to TSS/TTS in wig profiling,
268 DEFAULT: 3000bp
269 --gn-groups=GN_GROUPS
270 Gene-groups of particular interest in wig profiling.
271 Each gene group file must have gene names in the 1st
272 column. The file names are separated by commas w/ no
273 space (eg, --gn-groups=top10.txt,bottom10.txt)
274 --gn-group-names=GN_NAMES
275 The names of the gene groups in --gn-groups. The gene
276 group names are separated by commas. (eg, --gn-group-
277 names='top 10%,bottom 10%'). These group names appear
278 in the legends of the wig profiling plots. If no group
279 names given, the groups are represented as 'Group 1,
280 Group2,...Group n'.
281 --gname2 Whether or not use the 'name2' column of the gene
282 annotation table when reading the gene IDs in the
283 files given through --gn-groups. This flag is
284 meaningful only with --gn-groups.
285
286 </help>
287
288 </tool>