annotate ideas_preprocessor.xml @ 16:aaf64c0d7a0e draft

Uploaded
author greg
date Tue, 30 Jan 2018 09:34:17 -0500
parents 4d542da396a7
children 6ff92012abb7
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
1 <tool id="ideas_preprocessor" name="IDEAS Preprocessor" version="1.0.0">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
2 <description></description>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
3 <requirements>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
4 <requirement type="package" version="2.5.4">deeptools</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
5 <requirement type="package" version="1.10.4">r-data.table</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
6 <requirement type="package" version="1.4.4">r-optparse</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
7 <requirement type="package" version="1.6">samtools</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
8 <requirement type="package" version="357">ucsc-bigwigaverageoverbed</requirement>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
9 </requirements>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
10 <command detect_errors="exit_code"><![CDATA[
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
11 #set chromosome_windows = "chromosome_windows.txt"
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
12 #set ideaspre_input_config = "ideaspre_input_config.txt"
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
13 #set specify_chrom_windows = $specify_chrom_windows_cond.specify_chrom_windows
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
14 #set tmp_dir = "tmp"
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
15 mkdir $tmp_dir &&
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
16 mkdir $output.files_path &&
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
17 #if str($specify_chrom_windows) == "yes":
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
18 ##############################################
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
19 ## Using a bed file for defining chrom windows,
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
20 ## so categorize the window positions by
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
21 ## chromosome to enable the IDEAS -inv option.
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
22 ##############################################
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
23 cp '$gen_chromosome_windows' $chromosome_windows &&
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
24 #end if
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
25 ##############################################
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
26 ## Create the config file and prepare the data
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
27 ##############################################
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
28 cp '$gen_ideaspre_input_config' $ideaspre_input_config &&
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
29 sort $ideaspre_input_config -o $ideaspre_input_config &&
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
30 Rscript '$__tool_directory__/ideas_preprocessor.R'
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
31 --ideaspre_input_config '$ideaspre_input_config'
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
32 #if str($specify_chrom_windows) == "yes":
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
33 --chromosome_windows '$chromosome_windows'
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
34 --chrom_bed_input '$specify_chrom_windows_cond.chrom_bed_input'
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
35 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
36 --chrom_len_file '$chromInfo'
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
37 --window_size $specify_chrom_windows_cond.window_size
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
38 #set restrict_chromosomes = $specify_chrom_windows_cond.restrict_chromosomes_cond.restrict_chromosomes
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
39 #if str($restrict_chromosomes) == "yes":
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
40 #set chroms = []
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
41 #set chrom_repeat = $specify_chrom_windows_cond.restrict_chromosomes_cond.chrom_repeat
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
42 #for $i in $chrom_repeat
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
43 #silent $chroms.append(str($i.chrom))
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
44 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
45 --restrict_to_chroms '#echo ",".join($chroms)#'
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
46 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
47 #end if
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
48 #if str($bychr) == "true":
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
49 --bychr true
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
50 #end if
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
51 --reads_per_bp $reads_per_bp
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
52 #if str($exclude_bed_input) not in ["None", ""]:
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
53 --exclude_bed_input '$exclude_bed_input'
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
54 #end if
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
55 #if str($standardize_datasets) == "true":
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
56 --standardize_datasets true
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
57 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
58 --output '$output'
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
59 --output_hid $output.hid
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
60 --output_files_path '$output.files_path'
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
61 &> ideas_preprocessor_log.txt;
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
62 if [[ $? -ne 0 ]]; then
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
63 cp ideas_preprocessor_log.txt '$output';
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
64 exit 1;
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
65 fi
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
66 ]]></command>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
67 <configfiles>
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
68 <configfile name="gen_ideaspre_input_config"><![CDATA[#if str($cell_type_epigenetic_factor_cond.cell_type_epigenetic_factor) == "extract":
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
69 #set input_name_positions = $cell_type_epigenetic_factor_cond.input_name_positions
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
70 #for $i in $cell_type_epigenetic_factor_cond.input:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
71 #set file_name_with_ext = $i.name
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
72 #if str($file_name_with_ext).find("http") >= 0 or str($file_name_with_ext).find("ftp") >= 0:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
73 #set file_name_with_ext = $file_name_with_ext.split('/')[-1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
74 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
75 #assert str($file_name_with_ext).find("-") >= 0, "The selected input '%s' is invalid because it does not include the '-' character which is required when setting cell type and epigenetic factor names by extracting them from the input file names." % $file_name_with_ext
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
76 #set file_name = $file_name_with_ext.split(".")[0]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
77 #if str($input_name_positions) == "cell_first":
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
78 #set cell_type_name = $file_name.split("-")[0]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
79 #set epigenetic_factor_name = $file_name.split("-")[1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
80 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
81 #set cell_type_name = $file_name.split("-")[1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
82 #set epigenetic_factor_name = $file_name.split("-")[0]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
83 #end if
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
84 ${cell_type_name} ${epigenetic_factor_name} ${i} ${file_name} ${i.ext}
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
85 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
86 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
87 #for $input_items in $cell_type_epigenetic_factor_cond.input_repeat:
2
248b5f72fc02 Uploaded
greg
parents: 0
diff changeset
88 ${input_items.cell_type_name} ${input_items.epigenetic_factor_name} ${input_items.input} ${input_items.input.name.split("/")[-1].split(".")[0]} ${input_items.input.ext}
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
89 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
90 #end if]]></configfile>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
91 <configfile name="gen_chromosome_windows"><![CDATA[#if str($specify_chrom_windows_cond.specify_chrom_windows) == "yes":
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
92 #import collections
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
93 #set window_positions_by_chroms_odict = $collections.OrderedDict()
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
94 #for count, line in enumerate(open($specify_chrom_windows_cond.chrom_bed_input.file_name, 'r')):
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
95 #set $line = $line.strip()
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
96 #if not $line or $line.startswith('#'):
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
97 #continue
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
98 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
99 #set items = $line.split('\t')
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
100 #if $items[0] in $window_positions_by_chroms_odict:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
101 #set tup = $window_positions_by_chroms_odict[$items[0]]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
102 #set $tup[1] += 1
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
103 #set $window_positions_by_chroms_odict[$items[0]] = $tup
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
104 #else:
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
105 #set $window_positions_by_chroms_odict[$items[0]] = [$count, $count+1]
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
106 #end if
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
107 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
108 #for $chrom, $tup in $window_positions_by_chroms_odict.items():
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
109 ${chrom} ${tup[0]} ${tup[1]}
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
110 #end for
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
111 #end if]]></configfile>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
112 </configfiles>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
113 <inputs>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
114 <conditional name="cell_type_epigenetic_factor_cond">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
115 <param name="cell_type_epigenetic_factor" type="select" label="Set cell type and epigenetic factor names by">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
116 <option value="extract" selected="true">extracting them from the selected input file names</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
117 <option value="manual">manually setting them for each selected input</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
118 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
119 <when value="extract">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
120 <param name="input" type="data" format="bigwig,bam" multiple="True" label="BAM or BigWig files">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
121 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
122 <validator type="unspecified_build"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
123 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
124 <param name="input_name_positions" type="select" display="radio" label="Selected input file name pattern is" help="A '-' character must separate cell type and epigenetic factor names within the selected input file names">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
125 <option value="cell_first" selected="true">Cell type name - Epigenetic factor name</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
126 <option value="cell_last">Epigenetic factor name - Cell type name</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
127 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
128 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
129 <when value="manual">
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
130 <repeat name="input_repeat" title="Cell type, epigenetic factor and input" min="1">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
131 <param name="cell_type_name" type="text" value="" label="Cell type name">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
132 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
133 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
134 <param name="epigenetic_factor_name" type="text" value="" label="Epigenetic factor name">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
135 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
136 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
137 <param name="input" type="data" format="bigwig,bam" label="BAM or BigWig file">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
138 <validator type="empty_field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
139 <validator type="unspecified_build"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
140 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
141 </repeat>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
142 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
143 </conditional>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
144 <conditional name="specify_chrom_windows_cond">
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
145 <param name="specify_chrom_windows" type="select" label="Define chromosome window positions from a bed file?">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
146 <option value="no" selected="true">No</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
147 <option value="yes">Yes</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
148 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
149 <when value="no">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
150 <param name="window_size" type="integer" value="200" label="Window size in base pairs"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
151 <conditional name="restrict_chromosomes_cond">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
152 <param name="restrict_chromosomes" type="select" label="Restrict processing to specified chromosomes">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
153 <option value="no" selected="true">No</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
154 <option value="yes">Yes</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
155 </param>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
156 <when value="no"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
157 <when value="yes">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
158 <repeat name="chrom_repeat" title="Chromosomes" min="1">
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
159 <param name="chrom" type="text" value="" label="Chromosome" help="One chromosome (e.g., chr1, chr2, chrX) per text field"/>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
160 </repeat>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
161 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
162 </conditional>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
163 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
164 <when value="yes">
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
165 <param name="chrom_bed_input" type="data" format="bed" label="Select bed file for defining chromosome window positions">
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
166 <validator type="empty_dataset"/>
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
167 </param>
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
168 </when>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
169 </conditional>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
170 <param name="bychr" type="boolean" truevalue="true" falsevalue="" checked="False" label="Output chromosomes in separate files"/>
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
171 <param name="reads_per_bp" type="select" display="radio" label="Calculate the signal in each window using">
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
172 <option value="6" selected="true">mean</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
173 <option value="8">max</option>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
174 </param>
13
4d542da396a7 Uploaded
greg
parents: 11
diff changeset
175 <param name="exclude_bed_input" type="data" format="bed" optional="True" multiple="True" label="Select bed file(s) containing regions to exclude"/>
11
26eb979cf8d9 Uploaded
greg
parents: 8
diff changeset
176 <param name="standardize_datasets" type="boolean" truevalue="true" falsevalue="" checked="False" label="Standardize all datasets"/>
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
177 </inputs>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
178 <outputs>
4
f577a83e86c4 Uploaded
greg
parents: 2
diff changeset
179 <data name="output" format="ideaspre"/>
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
180 </outputs>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
181 <tests>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
182 <test>
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
183 <param name="input" value="e001-h3k4me3.bigwig" ftype="bigwig" dbkey="hg19"/>
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
184 <param name="specify_chrom_windows" value="yes"/>
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
185 <param name="chrom_bed_input" value="chrom_windows.bed" ftype="bed" dbkey="hg19"/>
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
186 <output name="output" file="output.ideaspre" ftype="ideaspre" />
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
187 </test>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
188 </tests>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
189 <help>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
190 **What it does**
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
191
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
192 Takes as input a list of epigenetic data sets (histones, chromatin accessibility, CpG methylation, TFs, etc.)
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
193 or any other whole-genome data sets (e.g., scores). Currently the supported data formats are BigWig and BAM.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
194 All data sets are mapped to a common genomic coordinate in a selected assembly (user-provided window size
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
195 or 200bp windows by default). The user can specify regions to be considered or removed from the analysis.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
196 The input data may come from one cell type/condition/individual/time point (although this approach does not
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
197 fully utilize the advantages of IDEAS), or from multiple cell types/conditions/individuals/time points. The
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
198 same set of epigenetic features may not be present in all cell types, in which case IDEAS performs imputation
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
199 of the missing tracks if specified. This tool produces a single dataset with the **IdeasPre** datatype for
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
200 use as input to the IDEAS tool.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
201
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
202 -----
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
203
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
204 **Required options**
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
205
16
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
206 * **Set cell type and epigenetic factor names by** - cell type and epigenetic factor names can be set manually or by extracting them from the names of the selected input datasets. The latter case requires all selected datasets to have names that contain a "-" character.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
207
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
208 * **BAM or BigWig files** - select one or more BAM or BigWig files from your history, making sure that the name of every selected input includes a "-" character (e.g., e001-h3k4me3.bigwig).
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
209 * **Cell type, Epigenetic factor and Input** - manually select any number of inputs, setting the cell type and epigenetic factor name for each. The combination of "cell type name" and "epigenetic factor name" must be unique for each input. For example, if you have replicate data you may want to specify the cell name as "rep1", "rep2", etc and the factor name as "rep1", "rep2", etc.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
210
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
211 * **Cell type name** - cell type name if specifying manually.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
212 * **Epigenetic factor name** - epigenetic factor name if specifying manually.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
213 * **BAM or BigWig file** - BAM or BigWig file.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
214 * **Selected input file name pattern is** - select the file name pattern, either **epigenetic factor name-cell type name** or **cell type name-epigenetic factor name**.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
215
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
216 * **Define chromosome window positions from a bed file** - select "No" to run whole genome segmentation or select "Yes" to segment genomes within the unit of the windows defined by the bed file. This file can be in BED3, BED4 or BED5 format, but only the first three columns (chromosome, start position, end position) will be used.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
217
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
218 * **Window size in base pairs** - Window size in base pairs if specifying manually.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
219 * **Restrict processing to specified chromosomes** - select "Yes" to restrict processing to specified chromosomes.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
220
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
221 * **Chromosomes** - enter the chromosomes to process, one chromosome (e.g., chr1, chr2, chrX) per text field; add another field for each additional chromosome.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
222
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
223 * **Select bed file for defining chromosome window positions** - select a bed file for specifying the chromosome window positions.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
224
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
225 * **Output chromosomes in separate files** - select "Yes" to produce separate files for each chromosome, allowing you to run IDEAS on different chromosomes separately.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
226 * **Calculate the signal in each window using** - use the bigWigAverageOverBed utility from the UCSC genome browser to calculate the signal (i.e., the number of reads per bp) in each window.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
227 * **Select bed file(s) containing regions to exclude** - select one or more bed files that contain regions you'd like excluded from your datasets.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
228 * **Standardize all datasets** - select "Yes" to standardize all datasets (e.g., reads / total_reads * 20 million) so that the signals from different cell types become comparable - your datasets can be read counts, logp-values or fold change.
aaf64c0d7a0e Uploaded
greg
parents: 13
diff changeset
229
0
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
230 </help>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
231 <citations>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
232 <citation type="doi">10.1093/nar/gkw278</citation>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
233 </citations>
f060a0fbd4fe Uploaded
greg
parents:
diff changeset
234 </tool>