annotate bsmap.xml @ 6:54492fec12ba draft

Uploaded
author eugen
date Thu, 16 Aug 2012 04:13:30 -0400
parents baf099f2e5fa
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
1 <tool id="bsmap" name="BSMAP Mapper">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
2 <requirements>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
3 <requirement type='package'>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
4 bsmap
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
5 </requirement>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
6 </requirements>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
7 <command interpreter="bash">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
8 bsmap_wrapper.sh
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
9 ##Reference genome
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
10 ref="${reference.fields.path}"
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
11 ##Output files (SAM output, BSMAP summary)
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
12 mapped=$mapped
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
13 ##Temp directory
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
14 tempdir=$mapped.files_path
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
15 summary=$summary
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
16 #if str($singlePaired.sPaired) == "single":
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
17 library="single"
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
18 mate1=$singlePaired.sInput1
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
19 #if str($singlePaired.sParams.sSettingsType) == "full":
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
20 fullparam=true
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
21 qual=$singlePaired.sParams.qual
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
22 threshold=$singlePaired.sParams.threshold
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
23 lowqual=$singlePaired.sParams.lowqual
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
24 adapter=$singlePaired.sParams.adapter
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
25 firstn=$singlePaired.sParams.firstn
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
26 repeat_reads=$singlePaired.sParams.repeat_reads
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
27 seed_size=$singlePaired.sParams.seed_size
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
28 mismatch=$singlePaired.sParams.mismatch
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
29 equal_best=$singlePaired.sParams.equal_best
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
30 start=$singlePaired.sParams.start
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
31 end=$singlePaired.sParams.end
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
32 index_interval=$singlePaired.sParams.index_interval
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
33 seed_random=$singlePaired.sParams.seed_random
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
34 rrbs=$singlePaired.sParams.rrbs
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
35 mode=$singlePaired.sParams.mode
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
36 align_info=$singlePaired.sParams.align_info
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
37 #end if
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
38 #else:
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
39 library="paired"
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
40 mate1=$singlePaired.pInput1
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
41 mate2=$singlePaired.pInput2
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
42 unpaired=$unpaired
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
43 #if str($singlePaired.pParams.pSettingsType) == "full":
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
44 fullparam=true
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
45 qual=$singlePaired.pParams.qual
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
46 threshold=$singlePaired.pParams.threshold
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
47 lowqual=$singlePaired.pParams.lowqual
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
48 adapter=$singlePaired.pParams.adapter
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
49 firstn=$singlePaired.pParams.firstn
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
50 repeat_reads=$singlePaired.pParams.repeat_reads
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
51 seed_size=$singlePaired.pParams.seed_size
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
52 mismatch=$singlePaired.pParams.mismatch
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
53 equal_best=$singlePaired.pParams.equal_best
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
54 start=$singlePaired.pParams.start
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
55 end=$singlePaired.pParams.end
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
56 index_interval=$singlePaired.pParams.index_interval
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
57 seed_random=$singlePaired.pParams.seed_random
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
58 rrbs=$singlePaired.pParams.rrbs
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
59 mode=$singlePaired.pParams.mode
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
60 align_info=$singlePaired.pParams.align_info
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
61 maxinsert=$singlePaired.pParams.maxinsert
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
62 mininsert=$singlePaired.pParams.mininsert
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
63 #end if
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
64 #end if
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
65 </command>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
66 <inputs>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
67 <param name="reference" type="select" label="Select a reference genome">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
68 <options from_data_table="bsmap_fasta">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
69 <filter type="sort_by" column="2" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
70 <validator type="no_options" message="No reference genomes are available" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
71 </options>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
72 </param>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
73
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
74 <conditional name="singlePaired">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
75 <param name="sPaired" type="select" label="Is this library mate-paired?">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
76 <option value="single">Single-end</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
77 <option value="paired">Paired-end</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
78 </param>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
79 <when value="single">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
80 <param name="sInput1" type="data" format="fastq,fasta" label="FASTQ file" help="Must have ASCII encoded quality scores"/>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
81 <conditional name="sParams">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
82 <param name="sSettingsType" type="select" label="BSMAP settings to use" help="For most mapping needs use Commonly used settings. If you want full control use Full parameter list">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
83 <option value="preSet">Commonly used</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
84 <option value="full">Full parameter list</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
85 </param>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
86 <when value="preSet" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
87 <when value="full">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
88 <param name="qual" type="select" label="Select the type of FastQ qualities">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
89 <option value="33">phred33-quals</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
90 <option value="64">phred64-quals</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
91 </param>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
92 <param name="threshold" type="integer" value="0" label="Quality threshold in trimming" help="0-40, default=0 (no trim)" min="0" max="40" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
93 <param name="lowqual" type="integer" value="5" label="Filter low-quality reads containing >n Ns" help="default=5" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
94 <param name="adapter" type="text" value="none" label="3-end adapter sequence" help="default: none (no trim)" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
95 <param name="firstn" type="integer" value="144" label="Map the first N nucleotides of the read" help="default:144 (map the whole read)" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
96
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
97 <param name="repeat_reads" type="select" label="How to report repeat hits">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
98 <option value="0">none(unique hit only)</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
99 <option value="1">random one</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
100 </param>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
101
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
102 <param name="seed_size" type="integer" value="16" label="Seed size" min="8" max="16" help="default=16(WGBS mode), 12(RRBS mode)" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
103 <param name="mismatch" type="integer" value="2" label="Maximum number of mismatches allowed on a read" max="15" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
104 <param name="equal_best" type="integer" value="20" label="Maximum number of equal best hits to count" max="1000" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
105 <param name="start" type="integer" value="1" label="Start from the Nth read or read pair" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
106 <param name="end" type="integer" value="4294967295" label="End at the Nth read or read pair" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
107 <param name="index_interval" type="integer" value="4" label="Index interval" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
108 <param name="seed_random" type="integer" value="-1" label="Seed for random number generation used in selecting multiple hits" help="other seed values generate pseudo random number based on read index number, to allow reproducible mapping results" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
109 <param name="rrbs" type="text" value="none" label="Activate RRBS mapping mode and set restriction enzyme digestion sites" help="digestion position marked by '-', example: -D C-CGG for MspI digestion. default: none (whole genome shotgun bisulfite mapping mode)" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
110 <param name="mode" type="select" label="Set mapping strand information">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
111 <option value="0">only map to 2 forward strands</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
112 <option value="1">map SE or PE reads to all 4 strands</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
113 </param>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
114 <param name="align_info" type="text" value="none" label="Set alignment information for the additional nucleotide transition" help="is in the form of two different nucleotides N1N2,indicating N1 in the reads could be mapped to N2 in the reference sequences. default: -M TC, corresponds to C=>U(T) transition in bisulfite conversion. example: -M GA could be used to detect A=>I(G) transition in RNA editing." />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
115 </when> <!-- full -->
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
116 </conditional> <!-- sParams -->
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
117 </when> <!-- single -->
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
118
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
119 <when value="paired">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
120 <param name="pInput1" type="data" format="fastq,fasta" label="Forward FASTQ file" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
121 <param name="pInput2" type="data" format="fastq,fasta" label="Reverse FASTQ file" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
122
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
123 <conditional name="pParams">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
124 <param name="pSettingsType" type="select" label="BSMAP settings to use" help="For most mapping needs use Commonly used settings. If you want full control use Full parameter list">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
125 <option value="preSet">Commonly used</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
126 <option value="full">Full parameter list</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
127 </param>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
128 <when value="preSet" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
129 <when value="full">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
130 <param name="qual" type="select" label="Select the type of FastQ qualities">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
131 <option value="33">phred33-quals</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
132 <option value="64">phred64-quals</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
133 </param>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
134
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
135 <param name="mininsert" type="integer" value="28" label="Minimal insert size allowed" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
136 <param name="maxinsert" type="integer" value="500" label="Maximal insert size allowed" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
137
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
138 <param name="threshold" type="integer" value="0" label="Quality threshold in trimming" help="0-40, default=0 (no trim)" min="0" max="40" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
139 <param name="lowqual" type="integer" value="5" label="Filter low-quality reads containing >n Ns" help="default=5" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
140 <param name="adapter" type="text" value="none" label="3-end adapter sequence" help="default: none (no trim)" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
141 <param name="firstn" type="integer" value="144" label="Map the first N nucleotides of the read" help="default:144 (map the whole read)" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
142
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
143 <param name="repeat_reads" type="select" label="How to report repeat hits">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
144 <option value="0">none(unique hit only)</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
145 <option value="1">random one</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
146 </param>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
147
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
148 <param name="seed_size" type="integer" value="16" label="Seed size" min="8" max="16" help="default=16(WGBS mode), 12(RRBS mode)" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
149 <param name="mismatch" type="integer" value="2" label="Maximum number of mismatches allowed on a read" max="15" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
150 <param name="equal_best" type="integer" value="20" label="Maximum number of equal best hits to count" max="1000" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
151 <param name="start" type="integer" value="1" label="Start from the Nth read or read pair" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
152 <param name="end" type="integer" value="4294967295" label="End at the Nth read or read pair" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
153 <param name="index_interval" type="integer" value="4" label="Index interval" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
154 <param name="seed_random" type="integer" value="-1" label="Seed for random number generation used in selecting multiple hits" help="other seed values generate pseudo random number based on read index number, to allow reproducible mapping results" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
155 <param name="rrbs" type="text" value="none" label="Activate RRBS mapping mode and set restriction enzyme digestion sites" help="digestion position marked by '-', example: -D C-CGG for MspI digestion. default: none (whole genome shotgun bisulfite mapping mode)" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
156 <param name="mode" type="select" label="Set mapping strand information">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
157 <option value="0">only map to 2 forward strands</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
158 <option value="1">map SE or PE reads to all 4 strands</option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
159 </param>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
160 <param name="align_info" type="text" value="none" label="Set alignment information for the additional nucleotide transition" help="is in the form of two different nucleotides N1N2,indicating N1 in the reads could be mapped to N2 in the reference sequences. default: -M TC, corresponds to C=>U(T) transition in bisulfite conversion. example: -M GA could be used to detect A=>I(G) transition in RNA editing." />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
161
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
162
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
163 </when> <!-- full -->
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
164 </conditional> <!-- pParams -->
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
165 </when> <!-- paired -->
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
166 </conditional> <!-- singlePaired -->
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
167
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
168
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
169 </inputs>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
170 <outputs>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
171 <data name="mapped" format="sam" label="BSMAP Mapped Reads">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
172 <actions>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
173 <action type="metadata" name="dbkey">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
174 <option type="from_data_table" name="bsmap_fasta" column="1" offset="0">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
175 <filter type="param_value" column="0" value="#" compare="startswith" keep="False"/>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
176 <filter type="param_value" ref="reference" column="0"/>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
177 </option>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
178 </action>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
179 </actions>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
180 </data>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
181 <data name="summary" format="txt" label="BSMAP Mapping Summary" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
182 <data name="unpaired" format ="sam" label="BSMAP Unpaired Hits">
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
183 <filter>(singlePaired['sPaired'] == 'paired')</filter>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
184 </data>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
185
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
186 </outputs>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
187 <help>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
188 **What it does**
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
189
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
190 BSMAP_ is a short-read mapping program for bisulfite sequencing reads. It has the following features:
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
191
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
192 - read length up to 144 nt, allow up to 15 mismatches, gap size up to 3 bp.
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
193
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
194 - support single-end and paired-end mapping, as well as multi-threaded mapping.
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
195
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
196 - support both "Lister protocol" (sequence 2 forward strands only) and "Cokus protocol" (sequence all 4 bisulfite converted strands)
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
197
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
198 - reads are directly mapped to original reference genome sequence, no need to preprocess the reads and reference genome to convert C to T.
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
199
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
200 - support both whole genome bisulfite sequencing (WGBS) mode and reduced representation bisulfite sequencing (RRBS) mode, allow changing the digestion site information to support different digestion enzymes for RRBS.
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
201
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
202 - allow trimming adapter sequences and low-quality nucleotides from the 3' end of reads
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
203
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
204 - allow trade off between speed/memory usage/mapping sensitivity. For human genome, the RRBS mode uses ~3GB. In WGBS mode, the typical memory usage is ~9GB, but can be as low as 5GB.
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
205
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
206 - allow alignment for other nucleotide transitions, for example, can be set to detect the A=>I(G) transition in RNA editing.
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
207
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
208 .. _BSMAP: http://code.google.com/p/bsmap/
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
209
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
210 **Input formats**
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
211
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
212 BSMAP accepts files in FASTA/FASTQ format.
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
213
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
214 **Outputs**
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
215
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
216 The output contains the following files:
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
217
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
218 - mapped reads in SAM format
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
219
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
220 - mapping summary
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
221
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
222 - unpaired hits (only for paired-end mapping)
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
223
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
224 </help>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
225
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
226 <tests>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
227 <test>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
228 <param name="sPaired" value="single" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
229 <param name="reference" value="bismark" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
230 <param name="sInput1" ftype="fastq" value="bismark_test_single.fastq" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
231 <param name="sSettingsType" value="preSet" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
232 <output name="mapped" ftype="sam" file="bismark_result_single_1.SAM" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
233 <output name="summary" ftype="txt" file="bismark_result_single_2.txt" />
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
234 </test>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
235 </tests>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
236 </tool>
baf099f2e5fa Uploaded
eugen
parents:
diff changeset
237