annotate rsem_calculate_expression.xml @ 1:73a9e9df80da draft

Uploaded
author yboursin
date Wed, 25 May 2016 10:08:02 -0400
parents 7146e81bc886
children c29f1fd1c8b6
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
1 <tool id="rsem_calculate_expression" name="RSEM calculate expression" version="EBA2016-v1">
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
2 <description>RNA-Seq by Expectation-Maximization</description>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
3 <requirements>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
4 <requirement type="package" version="1.2.28">rsem</requirement>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
5 <requirement type="package" version="1.1.2">bowtie</requirement>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
6 <requirement type="package" version="2.2.6">bowtie2</requirement>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
7 </requirements>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
8 <command>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
9 rsem-calculate-expression
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
10 ## --tag string
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
11 #if $seedlength:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
12 --seed-length $seedlength
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
13 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
14 --forward-prob $forward_prob
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
15 #if $rsem_options.fullparams == 'fullset':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
16 ## Fragment info
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
17 #if $rsem_options.fragment_length_mean:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
18 --fragment-length-mean $rsem_options.fragment_length_mean
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
19 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
20 #if $rsem_options.fragment_length_min:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
21 --fragment-length-min $rsem_options.fragment_length_min
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
22 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
23 #if $rsem_options.fragment_length_sd:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
24 --fragment-length-sd $rsem_options.fragment_length_sd
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
25 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
26 #if $rsem_options.fragment_length_max:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
27 --fragment-length-max $rsem_options.fragment_length_max
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
28 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
29 ## RSPD
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
30 #if $rsem_options.rspd.estimate == 'yes':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
31 --estimate-rspd
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
32 #if $rsem_options.rspd.num_rspd_bins:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
33 --num-rspd-bins $rsem_options.rspd.num_rspd_bins
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
34 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
35 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
36 ## Calculate 95% credibility intervals and posterior mean estimates.
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
37 #if $rsem_options.ci == 'yes':
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
38 --calc-ci
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
39 --ci-memory 2048
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
40 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
41 #end if
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
42 ## Calculate PME
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
43 $rsem_options.pme
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
44 --num-threads \${GALAXY_SLOTS:-4}
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
45 #if str($input.usebowtie.bowtie) == "one":
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
46 #if $input.format != 'bam' and $input.usebowtie.bowtie_options.fullparams == 'fullset':
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
47 ## Bowtie params
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
48 #if $input.usebowtie.bowtie_options.bowtie_e:
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
49 --bowtie-e $input.usebowtie.bowtie_options.bowtie_e
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
50 #end if
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
51 #if $input.usebowtie.bowtie_options.bowtie_m:
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
52 --bowtie-m $input.usebowtie.bowtie_options.bowtie_m
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
53 #end if
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
54 #if $input.usebowtie.bowtie_options.bowtie_n:
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
55 --bowtie-n $input.usebowtie.bowtie_options.bowtie_n
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
56 #end if
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
57 #end if
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
58
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
59 #elif str($input.usebowtie.bowtie) == "two":
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
60 --bowtie2
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
61 #end if
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
62
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
63 ## Outputs
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
64 #if $rsem_outputs.result_bams == 'none':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
65 --no-bam-output
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
66 #else
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
67 #if $rsem_outputs.result_bams == 'both':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
68 --output-genome-bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
69 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
70 $rsem_outputs.sampling_for_bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
71 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
72 ## Input data
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
73 #if $input.format=="fastq"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
74 $input.fastq_select
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
75 #if $input.fastq.matepair=="single":
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
76 $input.fastq.singlefastq
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
77 #elif $input.fastq.matepair=="paired":
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
78 --paired-end
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
79 $input.fastq.fastq1
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
80 $input.fastq.fastq2
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
81 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
82 #elif $input.format=="fasta"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
83 --no-qualities
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
84 #if $input.fasta.matepair=="single":
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
85 $input.fasta.singlefasta
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
86 #elif $input.fasta.matepair=="paired":
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
87 --paired-end
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
88 $input.fasta.fasta1
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
89 $input.fasta.fasta2
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
90 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
91 #elif $input.format=="sam"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
92 #if $input.matepair=="paired":
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
93 --paired-end
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
94 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
95 #if $input.rsem_sam._extension == 'sam':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
96 --sam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
97 #elif $input.rsem_sam._extension == 'bam':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
98 --bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
99 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
100 $input.rsem_sam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
101 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
102 ## RSEM reference
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
103 #if $reference.refSrc == 'history':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
104 ${reference.rsem_ref.extra_files_path}/${reference.rsem_ref.metadata.reference_name}
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
105 #elif $reference.refSrc == 'cached':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
106 ${reference.index.fields.path}
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
107 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
108 ## sample_name: use a hard coded name so we can pull out galaxy outputs
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
109 rsem_output
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
110 ## direct output into logfile
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
111 > $log
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
112 </command>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
113 <macros>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
114 <macro name="rsem_options">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
115 <param name="seedlength" type="integer" value="25" optional="true" label="Seed length used by the read aligner" help="Providing the correct value for this parameter is important for RSEM's accuracy if the data are single-end reads. RSEM uses this value for Bowtie's seed length parameter. The minimum value is 25. (Default:25)">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
116 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
117 <param name="forward_prob" type="select" label="Is the library strand specific?">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
118 <option value="0.5" selected="true">No</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
119 <option value="1">Yes, the reads (or first reads from paired-end libraries) are only in the forward orientation</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
120 <option value="0">Yes, the reads (or first reads from paired-end libraries) are only in the reverse orientation</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
121 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
122 <conditional name="rsem_options">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
123 <param name="fullparams" type="select" label="Additional RSEM options">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
124 <option value="default">Use RSEM Defaults</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
125 <option value="fullset">Set Additional RSEM Options</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
126 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
127 <when value="default"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
128 <when value="fullset">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
129 <param name="fragment_length_min" type="integer" value="1" optional="true" label="Minimum read/insert length." help=" This is also the value for the bowtie -I option">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
130 <validator type="in_range" message="0 or greater" min="0" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
131 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
132 <param name="fragment_length_max" type="integer" value="1000" optional="true" label="Maximum read/insert length." help=" This is also the value for the bowtie -X option">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
133 <validator type="in_range" message="0 or greater" min="0" max="1000000"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
134 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
135 <param name="fragment_length_mean" type="float" value="" optional="true" label="Fragment length mean (single-end data only)" help="The mean of the fragment length distribution, which is assumed to be a Gaussian. (Default: -1, which disables use of the fragment length distribution)">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
136 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
137 <param name="fragment_length_sd" type="float" value="" optional="true" label="The standard deviation of the fragment length distribution (single-end data only)" help="Default 0, which assumes that all fragments are of the same length, given by the rounded value of fragment length mean. ">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
138 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
139 <conditional name="rspd">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
140 <param name="estimate" type="select" lanel="Read Start Position Distribution (RSPD)"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
141 help="Set this option if you want to estimate the read start position distribution (RSPD) from data. Otherwise, RSEM will use a uniform RSPD.">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
142 <option value="no" selected="true">Use a uniform RSPD</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
143 <option value="yes">Estimate and correct for a non-uniform RSPD</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
144 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
145 <when value="no"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
146 <when value="yes">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
147 <param name="num_rspd_bins" type="integer" value="20" optional="true" label="Number of bins in the RSPD." help="Use of the default setting of 20 is recommended.">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
148 <validator type="in_range" message="" min="0" max="100"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
149 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
150 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
151 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
152 <param name="ci" type="select" label="Calculate 95% Credibility Intervals">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
153 <option value="no" selected="true">no</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
154 <option value="yes">yes</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
155 </param>
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
156
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
157 <param name="pme" type="boolean" truevalue="--calc-pme" falsevalue="" label="Calculate posterior mean estimates ? (collapsed Gibbs sampler)" />
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
158 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
159 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
160 </macro>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
161 <macro name="bowtie_options">
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
162 <conditional name="usebowtie">
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
163 <param name="bowtie" type="select" label="Use bowtie 1 or 2 ?">
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
164 <option value="one" selected="true">Bowtie 1</option>
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
165 <option value="two">Bowtie 2</option>
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
166 </param>
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
167 <when value="one">
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
168 <conditional name="bowtie_options">
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
169 <param name="fullparams" type="select" label="bowtie settings">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
170 <option value="default">use bowtie defaults</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
171 <option value="fullset">set bowtie options</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
172 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
173 <when value="default"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
174 <when value="fullset">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
175 <param name="bowtie_n" type="integer" value="2" optional="true" label="Bowtie mismatches" help="Bowtie parameter max # of mismatches in the seed. (Range: 0-3, Default: 2) ">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
176 <validator type="in_range" message="max # of mismatches in the seed between 0 and 3" min="0" max="3"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
177 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
178 <param name="bowtie_e" type="integer" value="99999999" label="Maximum sum of quality scores at mismatched positions in read alignments. This is also the value for the Bowtie -e option">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
179 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
180 <param name="bowtie_m" type="integer" value="200" label="Discard alignments for reads with number of alignments greater than">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
181 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
182 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
183 </conditional>
1
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
184 </when>
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
185 <when value="two" />
73a9e9df80da Uploaded
yboursin
parents: 0
diff changeset
186 </conditional>
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
187 </macro>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
188 <macro name="sampling_for_bam">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
189 <param name="sampling_for_bam" type="boolean" truevalue="--sampling-for-bam" falsevalue="" checked="false" label="Use sampling for BAM">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
190 <help> When RSEM generates a BAM file, instead of outputing all alignments a read has with their posterior probabilities, one alignment is sampled according to the posterior probabilities. The sampling procedure includes the alignment to the "noise" transcript, which does not appear in the BAM file. Only the sampled alignment has a weight of 1. All other alignments have weight 0. If the "noise" transcript is sampled, all alignments appeared in the BAM file should have weight 0. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
191 </help>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
192 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
193 </macro>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
194 </macros>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
195
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
196 <inputs>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
197 <param name="sample" type="text" value="rsem_sample" label="Sample name" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
198 <conditional name="reference">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
199 <param name="refSrc" type="select" label="RSEM Reference Source">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
200 <option value="cached">Locally cached</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
201 <option value="history">From your history</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
202 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
203 <when value="cached">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
204 <param name="index" type="select" label="Select RSEM reference" help="Select from a list of pre-indexed references. If you don't see anything consult the wrapper's documentation on how to create or download a reference">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
205 <options from_data_table="rsem_indexes">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
206 <filter type="sort_by" column="2" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
207 <validator type="no_options" message="No indexes are available" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
208 </options>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
209 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
210 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
211 <when value="history">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
212 <param name="rsem_ref" type="data" format="rsem_ref" label="RSEM reference" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
213 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
214 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
215 <conditional name="input">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
216 <param name="format" type="select" label="RSEM Input file type">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
217 <option value="fastq">FASTQ</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
218 <option value="fasta">FASTA</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
219 <option value="sam">SAM/BAM</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
220 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
221 <when value="fastq">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
222 <param name="fastq_select" size="15" type="select" label="FASTQ type" >
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
223 <option value="--phred33-quals" selected="true">phred33 qualities (default for sanger)</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
224 <option value="--solexa-quals">solexa qualities</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
225 <option value="--phred64-quals">phred64 qualities</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
226 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
227 <conditional name="fastq">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
228 <param name="matepair" type="select" label="Library type">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
229 <option value="single">Single End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
230 <option value="paired">Paired End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
231 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
232 <when value="single">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
233 <param name="singlefastq" type="data" format="fastq" label="FASTQ file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
234 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
235 <when value="paired">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
236 <param name="fastq1" type="data" format="fastq" label="Read 1 fastq file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
237 <param name="fastq2" type="data" format="fastq" label="Read 2 fastq file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
238 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
239 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
240 <expand macro="bowtie_options"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
241 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
242 <when value="fasta">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
243 <conditional name="fasta">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
244 <param name="matepair" type="select" label="Library Type">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
245 <option value="single">Single End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
246 <option value="paired">Paired End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
247 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
248 <when value="single">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
249 <param name="singlefasta" type="data" format="fasta" label="fasta file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
250 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
251 <when value="paired">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
252 <param name="fasta1" type="data" format="fasta" label="Read 1 fasta file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
253 <param name="fasta2" type="data" format="fasta" label="Read 2 fasta file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
254 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
255 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
256 <expand macro="bowtie_options"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
257 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
258 <when value="sam">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
259 <!-- convert-sam-for-rsem /ref/mouse_125 input.sam -o input_for_rsem.sam -->
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
260 <param name="matepair" type="select" label="Library Type">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
261 <option value="single">Single End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
262 <option value="paired">Paired End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
263 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
264 <param name="rsem_sam" type="data" format="rsem_sam" label="RSEM formatted SAM file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
265 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
266 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
267 <expand macro="rsem_options"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
268 <conditional name="rsem_outputs">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
269 <param name="result_bams" type="select" label="Create bam results files"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
270 help="In addition to the transcript-coordinate-based BAM file output, also output a BAM file with the read alignments in genomic coordinates" >
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
271 <option value="none">No BAM results files</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
272 <option value="default" selected="true">Transcript BAM results file</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
273 <option value="both">Transcript and genome BAM results files</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
274 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
275 <when value="none"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
276 <when value="default">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
277 <expand macro="sampling_for_bam"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
278 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
279 <when value="both">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
280 <expand macro="sampling_for_bam"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
281 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
282 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
283 </inputs>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
284 <stdio>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
285 <exit_code range="1:" level="fatal" description="Error Running RSEM" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
286 </stdio>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
287 <outputs>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
288 <data format="tabular" name="gene_abundances" label="${sample}.gene_abundances" from_work_dir="rsem_output.genes.results"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
289 <data format="tabular" name="isoform_abundances" label="${sample}.isoform_abundances" from_work_dir="rsem_output.isoforms.results"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
290 <data format="bam" name="transcript_bam" label="${sample}.transcript.bam" from_work_dir="rsem_output.transcript.bam" >
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
291 <filter>rsem_outputs['result_bams'] != "none"</filter>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
292 </data>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
293 <data format="bam" name="transcript_sorted_bam" label="${sample}.transcript.bam" from_work_dir="rsem_output.transcript.sorted.bam" >
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
294 <filter>rsem_outputs['result_bams'] != "none"</filter>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
295 </data>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
296 <data format="bam" name="genome_bam" label="${sample}.genome.bam" from_work_dir="rsem_output.genome.bam">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
297 <filter>rsem_outputs['result_bams'] == "both"</filter>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
298 </data>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
299 <data format="bam" name="genome_sorted_bam" label="${sample}.genome.sorted.bam" from_work_dir="rsem_output.genome.sorted.bam">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
300 <filter>rsem_outputs['result_bams'] == "both"</filter>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
301 </data>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
302 <data format="txt" name="log" label="${sample}.rsem_log"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
303 </outputs>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
304 <tests>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
305 <test>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
306 <param name="sample" value="rsem_sample"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
307 <param name="refSrc" value="history"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
308 <param name="rsem_ref" value="RSEM_ref_reference.rsem_ref" ftype="rsem_ref"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
309 <param name="format" value="fastq"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
310 <param name="matepair" value="single"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
311 <param name="singlefastq" value="test.fastq" ftype="fastqsanger"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
312 <param name="result_bams" value="none"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
313 <output name="gene_abundances">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
314 <assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
315 <has_text text="ENST00000423562,ENST00000438504,ENST00000488147,ENST00000538476,ENST00000541675" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
316 </assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
317 </output>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
318 <output name="isoform_abundances">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
319 <assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
320 <has_text text="ENST00000332831" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
321 </assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
322 </output>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
323 <output name="log">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
324 <assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
325 <has_text text="Expression Results are written" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
326 </assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
327 </output>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
328 </test>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
329 </tests>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
330 <help>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
331
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
332
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
333 RSEM HOME PAGE - http://deweylab.biostat.wisc.edu/rsem/
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
334
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
335 NAME
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
336 rsem-calculate-expression
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
337
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
338 SYNOPSIS
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
339 rsem-calculate-expression [options] upstream_read_file(s) reference_name sample_name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
340 rsem-calculate-expression [options] --paired-end upstream_read_file/s downstream_read_file/s reference_name sample_name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
341 rsem-calculate-expression [options] --sam/--bam [--paired-end] input reference_name sample_name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
342
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
343 ARGUMENTS
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
344 upstream_read_files/s
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
345 Comma-separated list of files containing single-end reads or
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
346 upstream reads for paired-end data. By default, these files are
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
347 assumed to be in FASTQ format. If the --no-qualities option is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
348 specified, then FASTA format is expected.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
349
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
350 downstream_read_file/s
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
351 Comma-separated list of files containing downstream reads which are
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
352 paired with the upstream reads. By default, these files are assumed
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
353 to be in FASTQ format. If the --no-qualities option is specified,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
354 then FASTA format is expected.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
355
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
356 input
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
357 SAM/BAM formatted input file. If "-" is specified for the filename,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
358 SAM/BAM input is instead assumed to come from standard input. RSEM
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
359 requires all alignments of the same read group together. For
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
360 paired-end reads, RSEM also requires the two mates of any alignment
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
361 be adjacent. See Description section for how to make input file obey
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
362 RSEM's requirements.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
363
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
364 reference_name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
365 The name of the reference used. The user must have run
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
366 'rsem-prepare-reference' with this reference_name before running
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
367 this program.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
368
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
369 sample_name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
370 The name of the sample analyzed. All output files are prefixed by
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
371 this name (e.g., sample_name.genes.results)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
372
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
373 OPTIONS
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
374
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
375 --paired-end
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
376 Input reads are paired-end reads. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
377
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
378 --no-qualities
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
379 Input reads do not contain quality scores. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
380
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
381 --strand-specific
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
382 The RNA-Seq protocol used to generate the reads is strand specific,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
383 i.e., all (upstream) reads are derived from the forward strand. This
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
384 option is equivalent to --forward-prob=1.0. With this option set, if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
385 RSEM runs the Bowtie aligner, the '--norc' Bowtie option will be
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
386 used, which disables alignment to the reverse strand of transcripts.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
387 (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
388
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
389 --sam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
390 Input file is in SAM format. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
391
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
392 --bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
393 Input file is in BAM format. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
394
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
395 --sam-header-info [file]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
396 RSEM reads header information from input by default. If this option
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
397 is on, header information is read from the specified file. For the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
398 format of the file, please see SAM official website. (Default: "")
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
399
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
400 -p/--num-threads [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
401 Number of threads to use. Both Bowtie and expression estimation will
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
402 use this many threads. (Default: 1)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
403
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
404 --no-bam-output
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
405 Do not output any BAM file. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
406
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
407 --output-genome-bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
408 Generate a BAM file, 'sample_name.genome.bam', with alignments
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
409 mapped to genomic coordinates and annotated with their posterior
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
410 probabilities. In addition, RSEM will call samtools (included in
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
411 RSEM package) to sort and index the bam file.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
412 'sample_name.genome.sorted.bam' and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
413 'sample_name.genome.sorted.bam.bai' will be generated. (Default:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
414 off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
415
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
416 --sampling-for-bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
417 When RSEM generates a BAM file, instead of outputing all alignments
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
418 a read has with their posterior probabilities, one alignment is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
419 sampled and outputed according to the posterior probabilities. If
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
420 the sampling result is that the read comes from the "noise"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
421 transcript, nothing is outputed. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
422
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
423 --calc-ci
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
424 Calculate 95% credibility intervals and posterior mean estimates.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
425 (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
426
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
427 --seed-length [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
428 Seed length used by the read aligner. Providing the correct value is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
429 important for RSEM. If RSEM runs Bowtie, it uses this value for
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
430 Bowtie's seed length parameter. Any read with its or at least one of
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
431 its mates' (for paired-end reads) length less than this value will
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
432 be ignored. If the references are not added poly(A) tails, the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
433 minimum allowed value is 5, otherwise, the minimum allowed value is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
434 25. Note that this script will only check if the value less or equal than
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
435 5 and give a warning message if the value less than 25 but greter or equal than
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
436 5. (Default: 25)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
437
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
438 --tag [string]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
439 The name of the optional field used in the SAM input for identifying
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
440 a read with too many valid alignments. The field should have the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
441 format [tagName]:i:[value], where a [value] bigger than 0 indicates
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
442 a read with too many alignments. (Default: "")
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
443
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
444 --bowtie-path [path]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
445 The path to the bowtie executables. (Default: the path to the bowtie
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
446 executables is assumed to be in the user's PATH environment
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
447 variable)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
448
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
449 --bowtie-n [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
450 (Bowtie parameter) max # of mismatches in the seed. (Range: 0-3,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
451 Default: 2)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
452
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
453 --bowtie-e [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
454 (Bowtie parameter) max sum of mismatch quality scores across the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
455 alignment. (Default: 99999999)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
456
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
457 --bowtie-m [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
458 (Bowtie parameter) suppress all alignments for a read if greater then [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
459 valid alignments exist. (Default: 200)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
460
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
461 --bowtie-chunkmbs [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
462 (Bowtie parameter) memory allocated for best first alignment
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
463 calculation (Default: 0 - use bowtie's default)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
464
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
465 --phred33-quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
466 Input quality scores are encoded as Phred+33. (Default: on)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
467
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
468 --phred64-quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
469 Input quality scores are encoded as Phred+64 (default for GA
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
470 Pipeline ver. less than 1.3). (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
471
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
472 --solexa-quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
473 Input quality scores are solexa encoded (from GA Pipeline ver. less
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
474 than 1.3). (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
475
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
476 --forward-prob [double]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
477 Probability of generating a read from the forward strand of a
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
478 transcript. Set to 1 for a strand-specific protocol where all
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
479 (upstream) reads are derived from the forward strand, 0 for a
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
480 strand-specific protocol where all (upstream) read are derived from
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
481 the reverse strand, or 0.5 for a non-strand-specific protocol.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
482 (Default: 0.5)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
483
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
484 --fragment-length-min [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
485 Minimum read/insert length allowed. This is also the value for the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
486 bowtie -I option. (Default: 1)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
487
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
488 --fragment-length-max [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
489 Maximum read/insert length allowed. This is also the value for the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
490 bowtie -X option. (Default: 1000)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
491
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
492 --fragment-length-mean [double]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
493 (single-end data only) The mean of the fragment length distribution,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
494 which is assumed to be a Gaussian. (Default: -1, which disables use
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
495 of the fragment length distribution)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
496
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
497 --fragment-length-sd [double]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
498 (single-end data only) The standard deviation of the fragment length
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
499 distribution, which is assumed to be a Gaussian. (Default: 0, which
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
500 assumes that all fragments are of the same length, given by the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
501 rounded value of --fragment-length-mean)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
502
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
503 --estimate-rspd
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
504 Set this option if you want to estimate the read start position
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
505 distribution (RSPD) from data. Otherwise, RSEM will use a uniform
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
506 RSPD. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
507
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
508 --num-rspd-bins [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
509 Number of bins in the RSPD. Only relevant when '--estimate-rspd' is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
510 specified. Use of the default setting is recommended. (Default: 20)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
511
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
512 --ci-memory [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
513 Maximum size (in memory, MB) of the auxiliary buffer used for
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
514 computing credibility intervals (CI). Set it larger for a faster CI
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
515 calculation. However, leaving 2 GB memory free for other usage is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
516 recommended. (Default: 1024)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
517
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
518 --keep-intermediate-files
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
519 Keep temporary files generated by RSEM. RSEM creates a temporary
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
520 directory, 'sample_name.temp', into which it puts all intermediate
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
521 output files. If this directory already exists, RSEM overwrites all
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
522 files generated by previous RSEM runs inside of it. By default,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
523 after RSEM finishes, the temporary directory is deleted. Set this
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
524 option to prevent the deletion of this directory and the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
525 intermediate files inside of it. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
526
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
527 --time
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
528 Output time consumed by each step of RSEM to 'sample_name.time'.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
529 (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
530
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
531 -q/--quiet
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
532 Suppress the output of logging information. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
533
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
534 -h/--help
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
535 Show help information.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
536
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
537 DESCRIPTION
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
538 In its default mode, this program aligns input reads against a reference
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
539 transcriptome with Bowtie and calculates expression values using the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
540 alignments. RSEM assumes the data are single-end reads with quality
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
541 scores, unless the '--paired-end' or '--no-qualities' options are
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
542 specified. Users may use an alternative aligner by specifying one of the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
543 --sam and --bam options, and providing an alignment file in the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
544 specified format. However, users should make sure that they align
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
545 against the indices generated by 'rsem-prepare-reference' and the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
546 alignment file satisfies the requirements mentioned in ARGUMENTS
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
547 section.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
548
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
549 One simple way to make the alignment file satisfying RSEM's requirements
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
550 (assuming the aligner used put mates in a paired-end read adjacent) is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
551 to use 'convert-sam-for-rsem' script. This script only accept SAM format
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
552 files as input. If a BAM format file is obtained, please use samtools to
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
553 convert it to a SAM file first. For example, if '/ref/mouse_125' is the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
554 'reference_name' and the SAM file is named 'input.sam', you can run the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
555 following command:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
556
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
557 convert-sam-for-rsem /ref/mouse_125 input.sam -o input_for_rsem.sam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
558
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
559 For details, please refer to 'convert-sam-for-rsem's documentation page.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
560
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
561 The SAM/BAM format RSEM uses is v1.4. However, it is compatible with old
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
562 SAM/BAM format. However, RSEM cannot recognize 0x100 in the FLAG field.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
563 In addition, RSEM requires SEQ and QUAL are not '*'.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
564
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
565 The user must run 'rsem-prepare-reference' with the appropriate
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
566 reference before using this program.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
567
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
568 For single-end data, it is strongly recommended that the user provide
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
569 the fragment length distribution parameters (--fragment-length-mean and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
570 --fragment-length-sd). For paired-end data, RSEM will automatically
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
571 learn a fragment length distribution from the data.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
572
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
573 Please note that some of the default values for the Bowtie parameters
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
574 are not the same as those defined for Bowtie itself.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
575
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
576 The temporary directory and all intermediate files will be removed when
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
577 RSEM finishes unless '--keep-intermediate-files' is specified.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
578
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
579 With the '--calc-ci' option, 95% credibility intervals and posterior
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
580 mean estimates will be calculated in addition to maximum likelihood
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
581 estimates.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
582
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
583 OUTPUT
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
584 sample_name.genes.results
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
585 File containing gene level expression estimates. The format of each
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
586 line in this file is:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
587
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
588 gene_id expected_counts tau_value [pmc_value tau_pme_value
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
589 tau_ci_lower_bound tau_ci_upper_bound] transcript_id_list
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
590
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
591 Fields are separated by the tab character. Fields within "[]" are
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
592 only presented if '--calc-ci' is set. pme stands for posterior mean
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
593 estimation. pmc stands for posterior mean counts. ci_lower_bound(l)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
594 means the lower bound of the credibility intervals,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
595 ci_upper_bound(u) means the upper bound of the credibility
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
596 intervals. So the credibility interval is [l, u].
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
597 'transcript_id_list' is a space-separated list of transcript_ids
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
598 belonging to the gene. If no gene information is provided, this file
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
599 has the same content as 'sample_name.isoforms.results'.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
600
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
601 sample_name.isoforms.results
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
602 File containing isoform level expression values. The format of each
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
603 line in this file is:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
604
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
605 transcript_id expected_counts tau_value [pmc_value tau_pme_value
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
606 tau_ci_lower_bound tau_ci_upper_bound] gene_id
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
607
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
608 Fields are separated by the tab character. 'gene_id' is the gene_id
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
609 of the gene which this transcript belongs to. If no gene information
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
610 is provided, 'gene_id' and 'transcript_id' are the same.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
611
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
612 sample_name.transcript.bam, sample_name.transcript.sorted.bam and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
613 sample_name.transcript.sorted.bam.bai
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
614 Only generated when --no-bam-output is not specified.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
615
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
616 'sample_name.transcript.bam' is a BAM-formatted file of read
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
617 alignments in transcript coordinates. The MAPQ field of each
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
618 alignment is set to min(100, floor(-10 * log10(1.0 - w) + 0.5)),
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
619 where w is the posterior probability of that alignment being the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
620 true mapping of a read. In addition, RSEM pads a new tag ZW:f:value,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
621 where value is a single precision floating number representing the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
622 posterior probability.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
623
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
624 'sample_name.transcript.sorted.bam' and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
625 'sample_name.transcript.sorted.bam.bai' are the sorted BAM file and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
626 indices generated by samtools (included in RSEM package).
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
627
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
628 sample_name.genome.bam, sample_name.genome.sorted.bam and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
629 sample_name.genome.sorted.bam.bai
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
630 Only generated when --no-bam-output is not specified and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
631 --output-genome-bam is specified.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
632
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
633 'sample_name.genome.bam' is a BAM-formatted file of read alignments
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
634 in genomic coordinates. Alignments of reads that have identical
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
635 genomic coordinates (i.e., alignments to different isoforms that
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
636 share the same genomic region) are collapsed into one alignment. The
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
637 MAPQ field of each alignment is set to min(100, floor(-10 *
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
638 log10(1.0 - w) + 0.5)), where w is the posterior probability of that
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
639 alignment being the true mapping of a read. In addition, RSEM pads a
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
640 new tag ZW:f:value, where value is a single precision floating
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
641 number representing the posterior probability. If an alignment is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
642 spliced, a XS:A:value tag is also added, where value is either '+'
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
643 or '-' indicating the strand of the transcript it aligns to.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
644
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
645 'sample_name.genome.sorted.bam' and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
646 'sample_name.genome.sorted.bam.bai' are the sorted BAM file and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
647 indices generated by samtools (included in RSEM package).
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
648
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
649 sample_name.sam.gz
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
650 Only generated when the input files are raw reads instead of SAM/BAM
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
651 format files
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
652
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
653 It is the gzipped SAM output produced by bowtie aligner.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
654
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
655 sample_name.time
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
656 Only generated when --time is specified.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
657
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
658 It contains time (in seconds) consumed by aligning reads, estimating
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
659 expression levels and calculating credibility intervals.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
660
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
661 sample_name.stat
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
662 This is a folder instead of a file. All model related statistics are
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
663 stored in this folder. Use 'rsem-plot-model' can generate plots
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
664 using this folder.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
665
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
666 EXAMPLES
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
667 Assume the path to the bowtie executables is in the user's PATH
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
668 environment variable. Reference files are under '/ref' with name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
669 'mouse_125'.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
670
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
671 1) '/data/mmliver.fq', single-end reads with quality scores. Quality
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
672 scores are encoded as for 'GA pipeline version >= 1.3'. We want to use 8
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
673 threads and generate a genome BAM file:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
674
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
675 rsem-calculate-expression --phred64-quals \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
676 -p 8 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
677 --output-genome-bam \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
678 /data/mmliver.fq \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
679 /ref/mouse_125 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
680 mmliver_single_quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
681
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
682 2) '/data/mmliver_1.fq' and '/data/mmliver_2.fq', paired-end reads with
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
683 quality scores. Quality scores are in SANGER format. We want to use 8
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
684 threads and do not generate a genome BAM file:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
685
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
686 rsem-calculate-expression -p 8 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
687 --paired-end \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
688 /data/mmliver_1.fq \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
689 /data/mmliver_2.fq \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
690 /ref/mouse_125 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
691 mmliver_paired_end_quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
692
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
693 3) '/data/mmliver.fa', single-end reads without quality scores. We want
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
694 to use 8 threads:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
695
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
696 rsem-calculate-expression -p 8 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
697 --no-qualities \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
698 /data/mmliver.fa \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
699 /ref/mouse_125 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
700 mmliver_single_without_quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
701
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
702 4) Data are the same as 1). We want to take a fragment length
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
703 distribution into consideration. We set the fragment length mean to 150
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
704 and the standard deviation to 35. In addition to a BAM file, we also
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
705 want to generate credibility intervals. We allow RSEM to use 1GB of
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
706 memory for CI calculation:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
707
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
708 rsem-calculate-expression --bowtie-path /sw/bowtie \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
709 --phred64-quals \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
710 --fragment-length-mean 150.0 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
711 --fragment-length-sd 35.0 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
712 -p 8 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
713 --output-genome-bam \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
714 --calc-ci \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
715 --ci-memory 1024 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
716 /data/mmliver.fq \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
717 /ref/mouse_125 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
718 mmliver_single_quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
719
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
720 5) '/data/mmliver_paired_end_quals.bam', paired-end reads with quality
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
721 scores. We want to use 8 threads:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
722
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
723 rsem-calculate-expression --paired-end \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
724 --bam \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
725 -p 8 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
726 /data/mmliver_paired_end_quals.bam \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
727 /ref/mouse_125 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
728 mmliver_paired_end_quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
729 </help>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
730 </tool>