annotate rsem_calculate_expression.xml @ 0:7146e81bc886 draft

Uploaded
author yboursin
date Wed, 25 May 2016 08:35:34 -0400
parents
children 73a9e9df80da
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
1 <tool id="rsem_calculate_expression" name="RSEM calculate expression" version="1.1.17">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
2 <description>RNA-Seq by Expectation-Maximization</description>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
3 <requirements>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
4 <requirement type="package" version="1.2.28">rsem</requirement>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
5 <requirement type="package" version="1.1.2">bowtie</requirement>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
6 <requirement type="package" version="2.2.6">bowtie2</requirement>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
7 </requirements>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
8 <command>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
9 rsem-calculate-expression
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
10 ## --tag string
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
11 #if $seedlength:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
12 --seed-length $seedlength
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
13 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
14 --forward-prob $forward_prob
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
15 #if $rsem_options.fullparams == 'fullset':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
16 ## Fragment info
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
17 #if $rsem_options.fragment_length_mean:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
18 --fragment-length-mean $rsem_options.fragment_length_mean
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
19 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
20 #if $rsem_options.fragment_length_min:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
21 --fragment-length-min $rsem_options.fragment_length_min
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
22 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
23 #if $rsem_options.fragment_length_sd:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
24 --fragment-length-sd $rsem_options.fragment_length_sd
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
25 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
26 #if $rsem_options.fragment_length_max:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
27 --fragment-length-max $rsem_options.fragment_length_max
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
28 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
29 ## RSPD
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
30 #if $rsem_options.rspd.estimate == 'yes':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
31 --estimate-rspd
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
32 #if $rsem_options.rspd.num_rspd_bins:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
33 --num-rspd-bins $rsem_options.rspd.num_rspd_bins
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
34 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
35 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
36 ## Calculate 95% credibility intervals and posterior mean estimates.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
37 #if $rsem_options.useci.ci == 'yes':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
38 --calc-ci
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
39 #if $rsem_options.useci.cimem:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
40 --ci-memory $rsem_options.useci.cimem
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
41 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
42 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
43 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
44 ## --num-threads $GALAXY_SLOTS
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
45 #if $input.format != 'sam' and $input.bowtie_options.fullparams == 'fullset':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
46 ## Bowtie params: the bowtie_options conditional is nested inside the input conditional and only exists for fastq/fasta input, so it is skipped for SAM/BAM input
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
47 #if $input.bowtie_options.bowtie_e:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
48 --bowtie-e $input.bowtie_options.bowtie_e
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
49 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
50 #if $input.bowtie_options.bowtie_m:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
51 --bowtie-m $input.bowtie_options.bowtie_m
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
52 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
53 #if $input.bowtie_options.bowtie_n:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
54 --bowtie-n $input.bowtie_options.bowtie_n
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
55 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
56 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
57 ## Outputs
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
58 #if $rsem_outputs.result_bams == 'none':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
59 --no-bam-output
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
60 #else
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
61 #if $rsem_outputs.result_bams == 'both':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
62 --output-genome-bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
63 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
64 $rsem_outputs.sampling_for_bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
65 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
66 ## Input data
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
67 #if $input.format=="fastq"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
68 $input.fastq_select
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
69 #if $input.fastq.matepair=="single":
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
70 $input.fastq.singlefastq
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
71 #elif $input.fastq.matepair=="paired":
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
72 --paired-end
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
73 $input.fastq.fastq1
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
74 $input.fastq.fastq2
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
75 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
76 #elif $input.format=="fasta"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
77 --no-qualities
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
78 #if $input.fasta.matepair=="single":
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
79 $input.fasta.singlefasta
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
80 #elif $input.fasta.matepair=="paired":
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
81 --paired-end
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
82 $input.fasta.fasta1
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
83 $input.fasta.fasta2
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
84 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
85 #elif $input.format=="sam"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
86 #if $input.matepair=="paired":
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
87 --paired-end
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
88 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
89 #if $input.rsem_sam._extension == 'sam':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
90 --sam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
91 #elif $input.rsem_sam._extension == 'bam':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
92 --bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
93 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
94 $input.rsem_sam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
95 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
96 ## RSEM reference
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
97 #if $reference.refSrc == 'history':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
98 ${reference.rsem_ref.extra_files_path}/${reference.rsem_ref.metadata.reference_name}
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
99 #elif $reference.refSrc == 'cached':
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
100 ${reference.index.fields.path}
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
101 #end if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
102 ## sample_name: use a hard coded name so we can pull out galaxy outputs
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
103 rsem_output
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
104 ## direct output into logfile
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
105 > $log
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
106 </command>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
107 <macros>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
108 <macro name="rsem_options">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
109 <param name="seedlength" type="integer" value="25" optional="true" label="Seed length used by the read aligner" help="Providing the correct value for this parameter is important for RSEM's accuracy if the data are single-end reads. RSEM uses this value for Bowtie's seed length parameter. The minimum value is 25. (Default:25)">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
110 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
111 <param name="forward_prob" type="select" label="Is the library strand specific?">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
112 <option value="0.5" selected="true">No</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
113 <option value="1">Yes, the reads (or first reads from paired-end libraries) are only in the forward orientation</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
114 <option value="0">Yes, the reads (or first reads from paired-end libraries) are only in the reverse orientation</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
115 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
116 <conditional name="rsem_options">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
117 <param name="fullparams" type="select" label="Additional RSEM options">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
118 <option value="default">Use RSEM Defaults</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
119 <option value="fullset">Set Additional RSEM Options</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
120 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
121 <when value="default"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
122 <when value="fullset">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
123 <param name="fragment_length_min" type="integer" value="1" optional="true" label="Minimum read/insert length." help=" This is also the value for the bowtie -I option">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
124 <validator type="in_range" message="0 or greater" min="0" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
125 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
126 <param name="fragment_length_max" type="integer" value="1000" optional="true" label="Maximum read/insert length." help=" This is also the value for the bowtie -X option">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
127 <validator type="in_range" message="0 or greater" min="0" max="1000000"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
128 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
129 <param name="fragment_length_mean" type="float" value="" optional="true" label="Fragment length mean (single-end data only)" help="The mean of the fragment length distribution, which is assumed to be a Gaussian. (Default: -1, which disables use of the fragment length distribution)">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
130 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
131 <param name="fragment_length_sd" type="float" value="" optional="true" label="The standard deviation of the fragment length distribution (single-end data only)" help="Default 0, which assumes that all fragments are of the same length, given by the rounded value of fragment length mean. ">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
132 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
133 <conditional name="rspd">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
134 <param name="estimate" type="select" label="Read Start Position Distribution (RSPD)"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
135 help="Set this option if you want to estimate the read start position distribution (RSPD) from data. Otherwise, RSEM will use a uniform RSPD.">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
136 <option value="no" selected="true">Use a uniform RSPD</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
137 <option value="yes">Estimate and correct for a non-uniform RSPD</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
138 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
139 <when value="no"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
140 <when value="yes">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
141 <param name="num_rspd_bins" type="integer" value="20" optional="true" label="Number of bins in the RSPD." help="Use of the default setting of 20 is recommended.">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
142 <validator type="in_range" message="" min="0" max="100"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
143 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
144 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
145 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
146 <conditional name="useci">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
147 <param name="ci" type="select" label="Calculate 95% Credibility Intervals">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
148 <option value="no" selected="true">no</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
149 <option value="yes">yes</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
150 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
151 <when value="no"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
152 <when value="yes">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
153 <param name="cimem" size="4" type="text" value="1024" label="Amount of memory in (MB) for computing CI" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
154 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
155 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
156 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
157 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
158 </macro>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
159 <macro name="bowtie_options">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
160 <conditional name="bowtie_options">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
161 <param name="fullparams" type="select" label="bowtie settings">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
162 <option value="default">use bowtie defaults</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
163 <option value="fullset">set bowtie options</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
164 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
165 <when value="default"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
166 <when value="fullset">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
167 <param name="bowtie_n" type="integer" value="2" optional="true" label="Bowtie mismatches" help="Bowtie parameter max # of mismatches in the seed. (Range: 0-3, Default: 2) ">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
168 <validator type="in_range" message="max # of mismatches in the seed between 0 and 3" min="0" max="3"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
169 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
170 <param name="bowtie_e" type="integer" value="99999999" label="Maximum sum of quality scores at mismatched positions in read alignments. This is also the value for the Bowtie -e option">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
171 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
172 <param name="bowtie_m" type="integer" value="200" label="Discard alignments for reads with number of alignments greater than">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
173 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
174 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
175 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
176 </macro>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
177 <macro name="sampling_for_bam">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
178 <param name="sampling_for_bam" type="boolean" truevalue="--sampling-for-bam" falsevalue="" checked="false" label="Use sampling for BAM">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
179 <help> When RSEM generates a BAM file, instead of outputting all alignments a read has with their posterior probabilities, one alignment is sampled according to the posterior probabilities. The sampling procedure includes the alignment to the "noise" transcript, which does not appear in the BAM file. Only the sampled alignment has a weight of 1. All other alignments have weight 0. If the "noise" transcript is sampled, all alignments appearing in the BAM file should have weight 0. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
180 </help>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
181 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
182 </macro>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
183 </macros>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
184
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
185 <inputs>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
186 <param name="sample" type="text" value="rsem_sample" label="Sample name" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
187 <conditional name="reference">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
188 <param name="refSrc" type="select" label="RSEM Reference Source">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
189 <option value="cached">Locally cached</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
190 <option value="history">From your history</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
191 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
192 <when value="cached">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
193 <param name="index" type="select" label="Select RSEM reference" help="Select from a list of pre-indexed references. If you don't see anything consult the wrapper's documentation on how to create or download a reference">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
194 <options from_data_table="rsem_indexes">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
195 <filter type="sort_by" column="2" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
196 <validator type="no_options" message="No indexes are available" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
197 </options>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
198 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
199 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
200 <when value="history">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
201 <param name="rsem_ref" type="data" format="rsem_ref" label="RSEM reference" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
202 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
203 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
204 <conditional name="input">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
205 <param name="format" type="select" label="RSEM Input file type">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
206 <option value="fastq">FASTQ</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
207 <option value="fasta">FASTA</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
208 <option value="sam">SAM/BAM</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
209 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
210 <when value="fastq">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
211 <param name="fastq_select" size="15" type="select" label="FASTQ type" >
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
212 <option value="--phred33-quals" selected="true">phred33 qualities (default for sanger)</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
213 <option value="--solexa-quals">solexa qualities</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
214 <option value="--phred64-quals">phred64 qualities</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
215 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
216 <conditional name="fastq">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
217 <param name="matepair" type="select" label="Library type">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
218 <option value="single">Single End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
219 <option value="paired">Paired End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
220 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
221 <when value="single">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
222 <param name="singlefastq" type="data" format="fastq" label="FASTQ file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
223 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
224 <when value="paired">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
225 <param name="fastq1" type="data" format="fastq" label="Read 1 fastq file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
226 <param name="fastq2" type="data" format="fastq" label="Read 2 fastq file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
227 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
228 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
229 <expand macro="bowtie_options"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
230 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
231 <when value="fasta">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
232 <conditional name="fasta">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
233 <param name="matepair" type="select" label="Library Type">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
234 <option value="single">Single End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
235 <option value="paired">Paired End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
236 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
237 <when value="single">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
238 <param name="singlefasta" type="data" format="fasta" label="fasta file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
239 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
240 <when value="paired">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
241 <param name="fasta1" type="data" format="fasta" label="Read 1 fasta file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
242 <param name="fasta2" type="data" format="fasta" label="Read 2 fasta file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
243 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
244 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
245 <expand macro="bowtie_options"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
246 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
247 <when value="sam">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
248 <!-- convert-sam-for-rsem /ref/mouse_125 input.sam -o input_for_rsem.sam -->
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
249 <param name="matepair" type="select" label="Library Type">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
250 <option value="single">Single End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
251 <option value="paired">Paired End Reads</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
252 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
253 <param name="rsem_sam" type="data" format="rsem_sam" label="RSEM formatted SAM file" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
254 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
255 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
256 <expand macro="rsem_options"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
257 <conditional name="rsem_outputs">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
258 <param name="result_bams" type="select" label="Create bam results files"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
259 help="In addition to the transcript-coordinate-based BAM file output, also output a BAM file with the read alignments in genomic coordinates" >
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
260 <option value="none">No BAM results files</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
261 <option value="default" selected="true">Transcript BAM results file</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
262 <option value="both">Transcript and genome BAM results files</option>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
263 </param>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
264 <when value="none"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
265 <when value="default">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
266 <expand macro="sampling_for_bam"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
267 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
268 <when value="both">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
269 <expand macro="sampling_for_bam"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
270 </when>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
271 </conditional>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
272 </inputs>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
273 <stdio>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
274 <exit_code range="1:" level="fatal" description="Error Running RSEM" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
275 </stdio>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
276 <outputs>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
277 <data format="tabular" name="gene_abundances" label="${sample}.gene_abundances" from_work_dir="rsem_output.genes.results"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
278 <data format="tabular" name="isoform_abundances" label="${sample}.isoform_abundances" from_work_dir="rsem_output.isoforms.results"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
279 <data format="bam" name="transcript_bam" label="${sample}.transcript.bam" from_work_dir="rsem_output.transcript.bam" >
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
280 <filter>rsem_outputs['result_bams'] != "none"</filter>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
281 </data>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
282 <data format="bam" name="transcript_sorted_bam" label="${sample}.transcript.sorted.bam" from_work_dir="rsem_output.transcript.sorted.bam" >
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
283 <filter>rsem_outputs['result_bams'] != "none"</filter>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
284 </data>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
285 <data format="bam" name="genome_bam" label="${sample}.genome.bam" from_work_dir="rsem_output.genome.bam">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
286 <filter>rsem_outputs['result_bams'] == "both"</filter>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
287 </data>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
288 <data format="bam" name="genome_sorted_bam" label="${sample}.genome.sorted.bam" from_work_dir="rsem_output.genome.sorted.bam">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
289 <filter>rsem_outputs['result_bams'] == "both"</filter>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
290 </data>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
291 <data format="txt" name="log" label="${sample}.rsem_log"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
292 </outputs>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
293 <tests>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
294 <test>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
295 <param name="sample" value="rsem_sample"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
296 <param name="refSrc" value="history"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
297 <param name="rsem_ref" value="RSEM_ref_reference.rsem_ref" ftype="rsem_ref"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
298 <param name="format" value="fastq"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
299 <param name="matepair" value="single"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
300 <param name="singlefastq" value="test.fastq" ftype="fastqsanger"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
301 <param name="result_bams" value="none"/>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
302 <output name="gene_abundances">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
303 <assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
304 <has_text text="ENST00000423562,ENST00000438504,ENST00000488147,ENST00000538476,ENST00000541675" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
305 </assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
306 </output>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
307 <output name="isoform_abundances">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
308 <assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
309 <has_text text="ENST00000332831" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
310 </assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
311 </output>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
312 <output name="log">
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
313 <assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
314 <has_text text="Expression Results are written" />
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
315 </assert_contents>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
316 </output>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
317 </test>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
318 </tests>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
319 <help>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
320
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
321
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
322 RSEM HOME PAGE - http://deweylab.biostat.wisc.edu/rsem/
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
323
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
324 NAME
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
325 rsem-calculate-expression
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
326
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
327 SYNOPSIS
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
328 rsem-calculate-expression [options] upstream_read_file(s) reference_name sample_name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
329 rsem-calculate-expression [options] --paired-end upstream_read_file/s downstream_read_file/s reference_name sample_name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
330 rsem-calculate-expression [options] --sam/--bam [--paired-end] input reference_name sample_name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
331
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
332 ARGUMENTS
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
333 upstream_read_file/s
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
334 Comma-separated list of files containing single-end reads or
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
335 upstream reads for paired-end data. By default, these files are
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
336 assumed to be in FASTQ format. If the --no-qualities option is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
337 specified, then FASTA format is expected.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
338
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
339 downstream_read_file/s
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
340 Comma-separated list of files containing downstream reads which are
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
341 paired with the upstream reads. By default, these files are assumed
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
342 to be in FASTQ format. If the --no-qualities option is specified,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
343 then FASTA format is expected.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
344
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
345 input
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
346 SAM/BAM formatted input file. If "-" is specified for the filename,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
347 SAM/BAM input is instead assumed to come from standard input. RSEM
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
348 requires all alignments of the same read to be grouped together. For
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
349 paired-end reads, RSEM also requires the two mates of any alignment
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
350 be adjacent. See the DESCRIPTION section for how to make the input file obey
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
351 RSEM's requirements.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
352
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
353 reference_name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
354 The name of the reference used. The user must have run
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
355 'rsem-prepare-reference' with this reference_name before running
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
356 this program.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
357
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
358 sample_name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
359 The name of the sample analyzed. All output files are prefixed by
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
360 this name (e.g., sample_name.genes.results)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
361
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
362 OPTIONS
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
363
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
364 --paired-end
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
365 Input reads are paired-end reads. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
366
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
367 --no-qualities
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
368 Input reads do not contain quality scores. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
369
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
370 --strand-specific
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
371 The RNA-Seq protocol used to generate the reads is strand specific,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
372 i.e., all (upstream) reads are derived from the forward strand. This
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
373 option is equivalent to --forward-prob=1.0. With this option set, if
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
374 RSEM runs the Bowtie aligner, the '--norc' Bowtie option will be
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
375 used, which disables alignment to the reverse strand of transcripts.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
376 (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
377
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
378 --sam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
379 Input file is in SAM format. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
380
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
381 --bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
382 Input file is in BAM format. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
383
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
384 --sam-header-info [file]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
385 RSEM reads header information from input by default. If this option
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
386 is on, header information is read from the specified file. For the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
387 format of the file, please see SAM official website. (Default: "")
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
388
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
389 -p/--num-threads [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
390 Number of threads to use. Both Bowtie and expression estimation will
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
391 use this many threads. (Default: 1)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
392
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
393 --no-bam-output
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
394 Do not output any BAM file. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
395
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
396 --output-genome-bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
397 Generate a BAM file, 'sample_name.genome.bam', with alignments
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
398 mapped to genomic coordinates and annotated with their posterior
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
399 probabilities. In addition, RSEM will call samtools (included in
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
400 RSEM package) to sort and index the bam file.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
401 'sample_name.genome.sorted.bam' and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
402 'sample_name.genome.sorted.bam.bai' will be generated. (Default:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
403 off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
404
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
405 --sampling-for-bam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
406 When RSEM generates a BAM file, instead of outputting all alignments
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
407 a read has with their posterior probabilities, one alignment is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
408 sampled and output according to the posterior probabilities. If
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
409 the sampling result is that the read comes from the "noise"
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
410 transcript, nothing is output. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
411
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
412 --calc-ci
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
413 Calculate 95% credibility intervals and posterior mean estimates.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
414 (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
415
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
416 --seed-length [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
417 Seed length used by the read aligner. Providing the correct value is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
418 important for RSEM. If RSEM runs Bowtie, it uses this value for
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
419 Bowtie's seed length parameter. Any read with its or at least one of
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
420 its mates' (for paired-end reads) length less than this value will
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
421 be ignored. If poly(A) tails were not added to the references, the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
422 minimum allowed value is 5, otherwise, the minimum allowed value is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
423 25. Note that this script will only check if the value is greater than or equal to
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
424 5 and give a warning message if the value is less than 25 but greater than or equal to
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
425 5. (Default: 25)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
426
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
427 --tag [string]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
428 The name of the optional field used in the SAM input for identifying
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
429 a read with too many valid alignments. The field should have the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
430 format [tagName]:i:[value], where a [value] bigger than 0 indicates
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
431 a read with too many alignments. (Default: "")
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
432
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
433 --bowtie-path [path]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
434 The path to the bowtie executables. (Default: the path to the bowtie
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
435 executables is assumed to be in the user's PATH environment
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
436 variable)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
437
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
438 --bowtie-n [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
439 (Bowtie parameter) max # of mismatches in the seed. (Range: 0-3,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
440 Default: 2)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
441
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
442 --bowtie-e [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
443 (Bowtie parameter) max sum of mismatch quality scores across the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
444 alignment. (Default: 99999999)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
445
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
446 --bowtie-m [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
447 (Bowtie parameter) suppress all alignments for a read if more than [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
448 valid alignments exist. (Default: 200)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
449
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
450 --bowtie-chunkmbs [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
451 (Bowtie parameter) memory allocated for best first alignment
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
452 calculation (Default: 0 - use bowtie's default)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
453
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
454 --phred33-quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
455 Input quality scores are encoded as Phred+33. (Default: on)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
456
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
457 --phred64-quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
458 Input quality scores are encoded as Phred+64 (default for GA
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
459 Pipeline ver. 1.3 or later). (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
460
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
461 --solexa-quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
462 Input quality scores are solexa encoded (from GA Pipeline ver. less
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
463 than 1.3). (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
464
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
465 --forward-prob [double]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
466 Probability of generating a read from the forward strand of a
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
467 transcript. Set to 1 for a strand-specific protocol where all
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
468 (upstream) reads are derived from the forward strand, 0 for a
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
469 strand-specific protocol where all (upstream) reads are derived from
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
470 the reverse strand, or 0.5 for a non-strand-specific protocol.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
471 (Default: 0.5)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
472
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
473 --fragment-length-min [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
474 Minimum read/insert length allowed. This is also the value for the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
475 bowtie -I option. (Default: 1)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
476
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
477 --fragment-length-max [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
478 Maximum read/insert length allowed. This is also the value for the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
479 bowtie -X option. (Default: 1000)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
480
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
481 --fragment-length-mean [double]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
482 (single-end data only) The mean of the fragment length distribution,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
483 which is assumed to be a Gaussian. (Default: -1, which disables use
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
484 of the fragment length distribution)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
485
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
486 --fragment-length-sd [double]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
487 (single-end data only) The standard deviation of the fragment length
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
488 distribution, which is assumed to be a Gaussian. (Default: 0, which
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
489 assumes that all fragments are of the same length, given by the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
490 rounded value of --fragment-length-mean)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
491
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
492 --estimate-rspd
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
493 Set this option if you want to estimate the read start position
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
494 distribution (RSPD) from data. Otherwise, RSEM will use a uniform
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
495 RSPD. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
496
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
497 --num-rspd-bins [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
498 Number of bins in the RSPD. Only relevant when '--estimate-rspd' is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
499 specified. Use of the default setting is recommended. (Default: 20)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
500
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
501 --ci-memory [int]
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
502 Maximum size (in memory, MB) of the auxiliary buffer used for
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
503 computing credibility intervals (CI). Set it larger for a faster CI
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
504 calculation. However, leaving 2 GB memory free for other usage is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
505 recommended. (Default: 1024)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
506
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
507 --keep-intermediate-files
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
508 Keep temporary files generated by RSEM. RSEM creates a temporary
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
509 directory, 'sample_name.temp', into which it puts all intermediate
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
510 output files. If this directory already exists, RSEM overwrites all
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
511 files generated by previous RSEM runs inside of it. By default,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
512 after RSEM finishes, the temporary directory is deleted. Set this
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
513 option to prevent the deletion of this directory and the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
514 intermediate files inside of it. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
515
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
516 --time
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
517 Output time consumed by each step of RSEM to 'sample_name.time'.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
518 (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
519
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
520 -q/--quiet
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
521 Suppress the output of logging information. (Default: off)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
522
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
523 -h/--help
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
524 Show help information.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
525
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
526 DESCRIPTION
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
527 In its default mode, this program aligns input reads against a reference
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
528 transcriptome with Bowtie and calculates expression values using the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
529 alignments. RSEM assumes the data are single-end reads with quality
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
530 scores, unless the '--paired-end' or '--no-qualities' options are
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
531 specified. Users may use an alternative aligner by specifying one of the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
532 --sam and --bam options, and providing an alignment file in the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
533 specified format. However, users should make sure that they align
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
534 against the indices generated by 'rsem-prepare-reference' and the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
535 alignment file satisfies the requirements mentioned in ARGUMENTS
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
536 section.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
537
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
538 One simple way to make the alignment file satisfy RSEM's requirements
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
539 (assuming the aligner used puts mates in a paired-end read adjacent) is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
540 to use the 'convert-sam-for-rsem' script. This script only accepts SAM format
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
541 files as input. If a BAM format file is obtained, please use samtools to
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
542 convert it to a SAM file first. For example, if '/ref/mouse_125' is the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
543 'reference_name' and the SAM file is named 'input.sam', you can run the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
544 following command:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
545
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
546 convert-sam-for-rsem /ref/mouse_125 input.sam -o input_for_rsem.sam
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
547
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
548 For details, please refer to 'convert-sam-for-rsem's documentation page.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
549
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
550 The SAM/BAM format RSEM uses is v1.4. However, it is compatible with old
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
551 SAM/BAM format. Note that RSEM cannot recognize 0x100 in the FLAG field.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
552 In addition, RSEM requires that SEQ and QUAL are not '*'.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
553
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
554 The user must run 'rsem-prepare-reference' with the appropriate
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
555 reference before using this program.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
556
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
557 For single-end data, it is strongly recommended that the user provide
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
558 the fragment length distribution parameters (--fragment-length-mean and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
559 --fragment-length-sd). For paired-end data, RSEM will automatically
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
560 learn a fragment length distribution from the data.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
561
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
562 Please note that some of the default values for the Bowtie parameters
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
563 are not the same as those defined for Bowtie itself.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
564
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
565 The temporary directory and all intermediate files will be removed when
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
566 RSEM finishes unless '--keep-intermediate-files' is specified.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
567
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
568 With the '--calc-ci' option, 95% credibility intervals and posterior
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
569 mean estimates will be calculated in addition to maximum likelihood
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
570 estimates.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
571
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
572 OUTPUT
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
573 sample_name.genes.results
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
574 File containing gene level expression estimates. The format of each
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
575 line in this file is:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
576
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
577 gene_id expected_counts tau_value [pmc_value tau_pme_value
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
578 tau_ci_lower_bound tau_ci_upper_bound] transcript_id_list
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
579
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
580 Fields are separated by the tab character. Fields within "[]" are
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
581 only presented if '--calc-ci' is set. pme stands for posterior mean
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
582 estimation. pmc stands for posterior mean counts. ci_lower_bound(l)
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
583 means the lower bound of the credibility intervals,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
584 ci_upper_bound(u) means the upper bound of the credibility
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
585 intervals. So the credibility interval is [l, u].
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
586 'transcript_id_list' is a space-separated list of transcript_ids
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
587 belonging to the gene. If no gene information is provided, this file
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
588 has the same content as 'sample_name.isoforms.results'.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
589
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
590 sample_name.isoforms.results
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
591 File containing isoform level expression values. The format of each
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
592 line in this file is:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
593
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
594 transcript_id expected_counts tau_value [pmc_value tau_pme_value
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
595 tau_ci_lower_bound tau_ci_upper_bound] gene_id
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
596
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
597 Fields are separated by the tab character. 'gene_id' is the gene_id
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
598 of the gene which this transcript belongs to. If no gene information
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
599 is provided, 'gene_id' and 'transcript_id' are the same.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
600
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
601 sample_name.transcript.bam, sample_name.transcript.sorted.bam and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
602 sample_name.transcript.sorted.bam.bai
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
603 Only generated when --no-bam-output is not specified.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
604
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
605 'sample_name.transcript.bam' is a BAM-formatted file of read
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
606 alignments in transcript coordinates. The MAPQ field of each
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
607 alignment is set to min(100, floor(-10 * log10(1.0 - w) + 0.5)),
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
608 where w is the posterior probability of that alignment being the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
609 true mapping of a read. In addition, RSEM pads a new tag ZW:f:value,
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
610 where value is a single-precision floating-point number representing the
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
611 posterior probability.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
612
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
613 'sample_name.transcript.sorted.bam' and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
614 'sample_name.transcript.sorted.bam.bai' are the sorted BAM file and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
615 indices generated by samtools (included in RSEM package).
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
616
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
617 sample_name.genome.bam, sample_name.genome.sorted.bam and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
618 sample_name.genome.sorted.bam.bai
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
619 Only generated when --no-bam-output is not specified and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
620 --output-genome-bam is specified.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
621
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
622 'sample_name.genome.bam' is a BAM-formatted file of read alignments
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
623 in genomic coordinates. Alignments of reads that have identical
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
624 genomic coordinates (i.e., alignments to different isoforms that
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
625 share the same genomic region) are collapsed into one alignment. The
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
626 MAPQ field of each alignment is set to min(100, floor(-10 *
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
627 log10(1.0 - w) + 0.5)), where w is the posterior probability of that
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
628 alignment being the true mapping of a read. In addition, RSEM pads a
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
629 new tag ZW:f:value, where value is a single-precision floating-point
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
630 number representing the posterior probability. If an alignment is
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
631 spliced, a XS:A:value tag is also added, where value is either '+'
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
632 or '-' indicating the strand of the transcript it aligns to.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
633
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
634 'sample_name.genome.sorted.bam' and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
635 'sample_name.genome.sorted.bam.bai' are the sorted BAM file and
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
636 indices generated by samtools (included in RSEM package).
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
637
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
638 sample_name.sam.gz
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
639 Only generated when the input files are raw reads instead of SAM/BAM
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
640 format files
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
641
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
642 It is the gzipped SAM output produced by bowtie aligner.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
643
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
644 sample_name.time
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
645 Only generated when --time is specified.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
646
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
647 It contains time (in seconds) consumed by aligning reads, estimating
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
648 expression levels and calculating credibility intervals.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
649
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
650 sample_name.stat
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
651 This is a folder instead of a file. All model related statistics are
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
652 stored in this folder. 'rsem-plot-model' can be used to generate plots
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
653 using this folder.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
654
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
655 EXAMPLES
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
656 Assume the path to the bowtie executables is in the user's PATH
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
657 environment variable. Reference files are under '/ref' with name
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
658 'mouse_125'.
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
659
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
660 1) '/data/mmliver.fq', single-end reads with quality scores. Quality
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
661 scores are encoded as for 'GA pipeline version >= 1.3'. We want to use 8
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
662 threads and generate a genome BAM file:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
663
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
664 rsem-calculate-expression --phred64-quals \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
665 -p 8 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
666 --output-genome-bam \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
667 /data/mmliver.fq \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
668 /ref/mouse_125 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
669 mmliver_single_quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
670
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
671 2) '/data/mmliver_1.fq' and '/data/mmliver_2.fq', paired-end reads with
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
672 quality scores. Quality scores are in SANGER format. We want to use 8
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
673 threads and not generate a genome BAM file:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
674
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
675 rsem-calculate-expression -p 8 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
676 --paired-end \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
677 /data/mmliver_1.fq \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
678 /data/mmliver_2.fq \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
679 /ref/mouse_125 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
680 mmliver_paired_end_quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
681
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
682 3) '/data/mmliver.fa', single-end reads without quality scores. We want
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
683 to use 8 threads:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
684
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
685 rsem-calculate-expression -p 8 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
686 --no-qualities \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
687 /data/mmliver.fa \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
688 /ref/mouse_125 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
689 mmliver_single_without_quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
690
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
691 4) Data are the same as 1). We want to take a fragment length
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
692 distribution into consideration. We set the fragment length mean to 150
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
693 and the standard deviation to 35. In addition to a BAM file, we also
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
694 want to generate credibility intervals. We allow RSEM to use 1GB of
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
695 memory for CI calculation:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
696
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
697 rsem-calculate-expression --bowtie-path /sw/bowtie \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
698 --phred64-quals \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
699 --fragment-length-mean 150.0 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
700 --fragment-length-sd 35.0 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
701 -p 8 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
702 --output-genome-bam \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
703 --calc-ci \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
704 --ci-memory 1024 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
705 /data/mmliver.fq \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
706 /ref/mouse_125 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
707 mmliver_single_quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
708
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
709 5) '/data/mmliver_paired_end_quals.bam', paired-end reads with quality
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
710 scores. We want to use 8 threads:
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
711
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
712 rsem-calculate-expression --paired-end \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
713 --bam \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
714 -p 8 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
715 /data/mmliver_paired_end_quals.bam \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
716 /ref/mouse_125 \
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
717 mmliver_paired_end_quals
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
718 </help>
7146e81bc886 Uploaded
yboursin
parents:
diff changeset
719 </tool>