annotate rsem_calculate_expression.xml @ 0:64d45f959303

Uploaded
author jjohnson
date Mon, 11 Nov 2013 13:54:43 -0500
parents
children 1ff2fc8da328
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
1 <tool id="rsem_calculate_expression" name="RSEM calculate expression" version="1.1.17">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
2 <description>RNA-Seq by Expectation-Maximization</description>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
3 <requirements>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
4 <requirement type="package" version="1.1.17">rsem</requirement>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
5 <requirement type="package" version="0.1.19">samtools</requirement>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
6 <requirement type="package" version="1.0.0">bowtie</requirement>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
7 </requirements>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
8 <command interpreter="perl">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
9 rsem-calculate-expression
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
10 --calc-ci $useci.ci
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
11 --fragment-length-mean $fraglenmean
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
12 --fragment-length-min $fraglenmin
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
13 --fragment-length-sd $fraglensd
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
14 --fragment-length-max $fraglenmax
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
15 --bowtie-e $bowtie_e
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
16 --bowtie-m $bowtie_m
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
17
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
18 #if $input.format=="fastq"
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
19 ## IF FASTQ AND SINGLE END READS (DEFAULTS)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
20 #if $input.fastqmatepair.matepair=="single" #rsem-wrapper-1.1.17.pl --bam_genome $bam_genome --bamtype $bamtype
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
21 --seed-length $seedlength $input.fastq_select --estimate-rspd $rspd --forward-prob
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
22 $fprob -p $cpus --bowtie-n $bowtie_mis --output-genome-bam --single_fastq $singlefastq
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
23 --output $output --isoformfile $isoforms --bamfile $bam_res --log $log
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
24 --sampling-for-bam $sampling_for_bam --reference ${index.fields.path}
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
25 #end if
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
26 ## IF FASTQ AND PAIRED END READS (DEFAULTS)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
27 #if $input.fastqmatepair.matepair=="paired" #rsem-wrapper-1.1.17.pl --bam_genome $bam_genome --bamtype $bamtype
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
28 --paired-end --seed-length $seedlength --estimate-rspd $rspd $input.fastq_select --forward-prob $fprob -p $cpus
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
29 --bowtie-n $bowtie_mis --output-genome-bam --fastq1 $fastq1 --fastq2 $fastq2 --output
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
30 $output --isoformfile $isoforms --bamfile $bam_res --log $log --sampling-for-bam
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
31 $sampling_for_bam --reference ${index.fields.path}
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
32 #end if
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
33 #end if
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
34 #if $input.format=="fasta"
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
35 ## IF FASTA AND SINGLE END READS (DEFAULTS)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
36 #if $input.fastamatepair.matepair=="single" #rsem-wrapper-1.1.17.pl --bam_genome $bam_genome --bamtype $bamtype
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
37 --no-qualities --seed-length $seedlength --estimate-rspd $rspd --forward-prob $fprob -p $cpus --bowtie-n $bowtie_mis
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
38 --output-genome-bam --single_fasta $single_fasta --output $output --isoformfile
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
39 $isoforms --bamfile $bam_res --log $log --sampling-for-bam $sampling_for_bam --reference
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
40 ${index.fields.path}
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
41 #end if
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
42 ## IF FASTA AND PAIRED END READS (DEFAULTS)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
43 #if $input.fastamatepair.matepair=="paired" #rsem-wrapper-1.1.17.pl --bam_genome $bam_genome --bamtype $bamtype
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
44 --no-qualities --paired-end --seed-length $seedlength --estimate-rspd $rspd --forward-prob $fprob -p $cpus
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
45 --bowtie-n $bowtie_mis --output-genome-bam --fasta1 $fasta1 --fasta2 $fasta2 --output
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
46 $output --isoformfile $isoforms --bamfile $bam_res --log $log --sampling-for-bam
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
47 $sampling_for_bam --reference ${index.fields.path}
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
48 #end if
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
49 #end if
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
50
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
51 </command>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
52
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
53 <inputs>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
54 <param name="sample" type="text" format="txt" label="Sample label" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
55 <conditional name="input">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
56 <param name="format" type="select" label="Input file type">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
57 <option value="fastq">FASTQ</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
58 <option value="fasta">FASTA</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
59 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
60 <when value="fastq">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
61 <param name="fastq_select" size="15" type="select" label="FASTQ type" >
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
62 <option value="--phred33-quals">phred33 qualities</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
63 <option value="--solexa-quals">solexa qualities</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
64 <option value="--phred64-quals">phred64 qualities</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
65 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
66
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
67 <conditional name="fastqmatepair">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
68 <when value="single">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
69 <param name="singlefastq" type="data" checked="yes" format="fastq" label="FASTQ file" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
70 </when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
71 <when value="paired">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
72 <param name="fastq1" type="data" format="fastq" label="Read 1 fastq file" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
73 <param name="fastq2" type="data" format="fastq" label="Read 2 fastq file" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
74 </when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
75 <param name="matepair" type="select" label="Library type">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
76 <option value="single">Single End Reads</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
77 <option value="paired">Paired End Reads</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
78 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
79 </conditional>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
80 </when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
81 <when value="fasta">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
82 <conditional name="fastamatepair">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
83 <param name="matepair" type="select" label="Library Type">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
84 <option value="single">Single End Reads</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
85 <option value="paired">Paired End Reads</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
86 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
87 <when value="single">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
88 <param name="single_fasta" type="data" checked="yes" format="fasta" label="fasta file" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
89 </when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
90 <when value="paired">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
91 <param name="fasta1" type="data" format="fasta" label="Read 1 fasta file" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
92 <param name="fasta2" type="data" format="fasta" label="Read 2 fasta file" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
93 </when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
94 </conditional>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
95 </when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
96 <when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
97 <conditional name="fastamatepair">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
98 <param name="matepair" type="select" label="Library Type" >
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
99 <option value="single">Single End Reads</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
100 <option value="paired">Paired End Reads</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
101 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
102 <when value="single">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
103 <param name="singlefastq" type="data" checked="yes" format="fastq" label="FASTQ file" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
104 </when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
105 <when value="paired">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
106 <param name="fastq1" type="data" format="fastq" label="Read 1 FASTQ file" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
107 <param name="fastq2" type="data" format="fastq" label="Read 2 FASTQ file" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
108 </when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
109 </conditional>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
110 </when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
111 </conditional>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
112 <param name="fprob" type="select" >
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
113 <label>Is the library strand specific?</label>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
114 <option value="0.5">No</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
115 <option value="1">Yes, the reads (or first reads from paired-end libraries) are only in the forward orientation</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
116 <option value="0">Yes, the reads (or first reads from paired-end libraries) are only in the reverse orientation</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
117 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
118
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
119 <param name="index" type="select" label="Select RSEM reference" help="Select from a list of pre-indexed references. If you don't see anything consult the wrapper's documentation on how to create or download a reference">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
120 <options from_data_table="rsem_indexes">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
121 <filter type="sort_by" column="2" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
122 <validator type="no_options" message="No indexes are available" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
123 </options>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
124 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
125 <param name="fraglenmean" size="4" type="text" value="-1" label="Fragment length mean (single-end data only)" help="The mean of the fragment length distribution, which is assumed to be a Gaussian. (Default: -1, which disables use of the fragment length distribution)" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
126 <param name="fraglensd" size="4" type="text" value="0" label="The standard deviation of the fragment length distribution (single-end data only)" help="Default 0, which assumes that all fragments are of the same length, given by the rounded value of fragment length mean. " />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
127
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
128 <param name="bamtype" type="select" label="Create genome bam file" help="In addition to the transcript-coordinate-based BAM file output, also output a BAM file with the read alignments in genomic coordinates" >
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
129 <option value="no">no</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
130 <option value="yes">yes</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
131 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
132 <param name="sampling_for_bam" type="select" format="text" help="When RSEM generates a BAM file, instead of outputing all alignments a read has with their posterior probabilities, one alignment is sampled and outputed according to the posterior probabilities. If the sampling result is that the read comes from the noise transcript, nothing is outputed. (Default: off)">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
133 <label>Sample Bam File</label>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
134 <option value="no">no</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
135 <option value="yes">yes</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
136 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
137 <param name="rspd" type="select" format="text" help="Set this option if you want to estimate the read start position distribution (RSPD) from data. Otherwise, RSEM will use a uniform RSPD. (Default: off)">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
138 <label>Estimate and correct for a non-uniform read start position distribution (RSPD)</label>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
139 <option value="no">no</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
140 <option value="yes">yes</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
141 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
142
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
143 <!-- <conditional name="fullpar">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
144 <param name="fullpar" type="select" label="Full list of parameters" help="use
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
145 full list for linting all the parameters in RSEM">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
146 <option value="default">Default</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
147 <option value="fullset">Full Set</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
148 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
149 <when value="fullset"> -->
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
150 <!-- <param name="testing" size="4" type="text" value="" label="Advanced Parameters" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
151 -->
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
152 <conditional name="useci">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
153 <param name="ci" type="select" label="Calculate 95% Credibility Intervals">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
154 <option value="no">no</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
155 <option value="yes">yes</option>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
156 </param>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
157 <when value="yes">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
158 <param name="cimem" size="4" type="text" value="1024" label="Amount of memory in (MB) for computing CI" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
159 </when>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
160 </conditional>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
161 <param name="fraglenmin" size="4" type="text" value="1" label="Minimum read/insert length. Minimum read/insert length allowed. This is also the value for the bowtie -X option" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
162 <param name="fraglenmax" size="4" type="text" value="1000" label="Maximum read/insert length. Minimum read/insert length allowed. This is also the value for the bowtie -l option" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
163 <param name="bowtie_mis" size="2" type="text" value="2" label="Bowtie mismatches" help="Bowtie parameter max # of mismatches in the seed. (Range: 0-3, Default: 2) "/>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
164 <param name="bowtie_e" size="4" type="text" value="99999999" label="Maximum sum of quality scores at mismatched positions in read alignments. This is also the value for the Bowtie -e option" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
165 <param name="bowtie_m" size="4" type="text" value="200" label="Discard alignments for reads with number of alignments greater than" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
166 <param name="seedlength" size="2" type="text" value="25" label="Seed length used by the read aligner" help="Providing the correct value for this parameter is important for RSEM's accuracy if the data are single-end reads. RSEM uses this value for Bowtie's seed length parameter. The minimum value is 25. (Default:25)" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
167 <param name="cpus" size="2" type="integer" value="1" label="Number of threads to use" help="Number of threads to use. Both Bowtie and expression estimation will use this many threads. (Default: 1)" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
168 <!-- </when> --> <!-- </conditional> -->
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
169 </inputs>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
170 <stdio>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
171 <exit_code range="1:" level="fatal" description="Error Running RSEM" />
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
172 </stdio>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
173 <outputs>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
174 <data format="tabular" name="output" label="${sample}.gene_abundances"/>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
175 <data format="tabular" name="isoforms" label="${sample}.isoform_abundances"/>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
176 <data format="bam" name="bam_res" label="${sample}.transcript.bam"/>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
177 <data format="bam" name="bam_genome" label="${sample}.genome.bam">
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
178 <filter>bamtype == "yes"</filter>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
179 </data>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
180
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
181 <data format="txt" name="log" label="${sample}.rsem_log"/>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
182 </outputs>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
183 <help>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
184
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
185
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
186 RSEM HOME PAGE - http://deweylab.biostat.wisc.edu/rsem/
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
187
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
188 NAME
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
189 rsem-calculate-expression
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
190
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
191 SYNOPSIS
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
192 rsem-calculate-expression [options] upstream_read_file(s) reference_name sample_name
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
193 rsem-calculate-expression [options] --paired-end upstream_read_file/s downstream_read_file/s reference_name sample_name
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
194 rsem-calculate-expression [options] --sam/--bam [--paired-end] input reference_name sample_name
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
195
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
196 ARGUMENTS
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
197 upstream_read_files/s
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
198 Comma-separated list of files containing single-end reads or
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
199 upstream reads for paired-end data. By default, these files are
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
200 assumed to be in FASTQ format. If the --no-qualities option is
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
201 specified, then FASTA format is expected.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
202
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
203 downstream_read_file/s
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
204 Comma-separated list of files containing downstream reads which are
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
205 paired with the upstream reads. By default, these files are assumed
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
206 to be in FASTQ format. If the --no-qualities option is specified,
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
207 then FASTA format is expected.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
208
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
209 input
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
210 SAM/BAM formatted input file. If "-" is specified for the filename,
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
211 SAM/BAM input is instead assumed to come from standard input. RSEM
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
212 requires all alignments of the same read group together. For
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
213 paired-end reads, RSEM also requires the two mates of any alignment
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
214 be adjacent. See Description section for how to make input file obey
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
215 RSEM's requirements.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
216
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
217 reference_name
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
218 The name of the reference used. The user must have run
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
219 'rsem-prepare-reference' with this reference_name before running
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
220 this program.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
221
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
222 sample_name
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
223 The name of the sample analyzed. All output files are prefixed by
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
224 this name (e.g., sample_name.genes.results)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
225
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
226 OPTIONS
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
227
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
228 --paired-end
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
229 Input reads are paired-end reads. (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
230
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
231 --no-qualities
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
232 Input reads do not contain quality scores. (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
233
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
234 --strand-specific
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
235 The RNA-Seq protocol used to generate the reads is strand specific,
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
236 i.e., all (upstream) reads are derived from the forward strand. This
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
237 option is equivalent to --forward-prob=1.0. With this option set, if
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
238 RSEM runs the Bowtie aligner, the '--norc' Bowtie option will be
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
239 used, which disables alignment to the reverse strand of transcripts.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
240 (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
241
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
242 --sam
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
243 Input file is in SAM format. (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
244
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
245 --bam
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
246 Input file is in BAM format. (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
247
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
248 --sam-header-info [file]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
249 RSEM reads header information from input by default. If this option
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
250 is on, header information is read from the specified file. For the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
251 format of the file, please see SAM official website. (Default: "")
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
252
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
253 -p/--num-threads [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
254 Number of threads to use. Both Bowtie and expression estimation will
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
255 use this many threads. (Default: 1)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
256
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
257 --no-bam-output
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
258 Do not output any BAM file. (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
259
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
260 --output-genome-bam
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
261 Generate a BAM file, 'sample_name.genome.bam', with alignments
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
262 mapped to genomic coordinates and annotated with their posterior
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
263 probabilities. In addition, RSEM will call samtools (included in
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
264 RSEM package) to sort and index the bam file.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
265 'sample_name.genome.sorted.bam' and
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
266 'sample_name.genome.sorted.bam.bai' will be generated. (Default:
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
267 off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
268
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
269 --sampling-for-bam
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
270 When RSEM generates a BAM file, instead of outputing all alignments
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
271 a read has with their posterior probabilities, one alignment is
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
272 sampled and outputed according to the posterior probabilities. If
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
273 the sampling result is that the read comes from the "noise"
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
274 transcript, nothing is outputed. (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
275
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
276 --calc-ci
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
277 Calculate 95% credibility intervals and posterior mean estimates.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
278 (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
279
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
280 --seed-length [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
281 Seed length used by the read aligner. Providing the correct value is
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
282 important for RSEM. If RSEM runs Bowtie, it uses this value for
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
283 Bowtie's seed length parameter. Any read with its or at least one of
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
284 its mates' (for paired-end reads) length less than this value will
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
285 be ignored. If the references are not added poly(A) tails, the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
286 minimum allowed value is 5, otherwise, the minimum allowed value is
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
287 25. Note that this script will only check if the value less or equal than
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
288 5 and give a warning message if the value less than 25 but greter or equal than
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
289 5. (Default: 25)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
290
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
291 --tag [string]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
292 The name of the optional field used in the SAM input for identifying
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
293 a read with too many valid alignments. The field should have the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
294 format [tagName]:i:[value], where a [value] bigger than 0 indicates
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
295 a read with too many alignments. (Default: "")
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
296
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
297 --bowtie-path [path]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
298 The path to the bowtie executables. (Default: the path to the bowtie
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
299 executables is assumed to be in the user's PATH environment
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
300 variable)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
301
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
302 --bowtie-n [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
303 (Bowtie parameter) max # of mismatches in the seed. (Range: 0-3,
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
304 Default: 2)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
305
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
306 --bowtie-e [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
307 (Bowtie parameter) max sum of mismatch quality scores across the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
308 alignment. (Default: 99999999)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
309
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
310 --bowtie-m [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
311 (Bowtie parameter) suppress all alignments for a read if greater then [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
312 valid alignments exist. (Default: 200)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
313
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
314 --bowtie-chunkmbs [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
315 (Bowtie parameter) memory allocated for best first alignment
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
316 calculation (Default: 0 - use bowtie's default)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
317
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
318 --phred33-quals
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
319 Input quality scores are encoded as Phred+33. (Default: on)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
320
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
321 --phred64-quals
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
322 Input quality scores are encoded as Phred+64 (default for GA
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
323 Pipeline ver. less than 1.3). (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
324
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
325 --solexa-quals
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
326 Input quality scores are solexa encoded (from GA Pipeline ver. less
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
327 than 1.3). (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
328
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
329 --forward-prob [double]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
330 Probability of generating a read from the forward strand of a
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
331 transcript. Set to 1 for a strand-specific protocol where all
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
332 (upstream) reads are derived from the forward strand, 0 for a
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
333 strand-specific protocol where all (upstream) read are derived from
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
334 the reverse strand, or 0.5 for a non-strand-specific protocol.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
335 (Default: 0.5)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
336
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
337 --fragment-length-min [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
338 Minimum read/insert length allowed. This is also the value for the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
339 bowtie -I option. (Default: 1)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
340
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
341 --fragment-length-max [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
342 Maximum read/insert length allowed. This is also the value for the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
343 bowtie -X option. (Default: 1000)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
344
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
345 --fragment-length-mean [double]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
346 (single-end data only) The mean of the fragment length distribution,
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
347 which is assumed to be a Gaussian. (Default: -1, which disables use
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
348 of the fragment length distribution)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
349
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
350 --fragment-length-sd [double]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
351 (single-end data only) The standard deviation of the fragment length
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
352 distribution, which is assumed to be a Gaussian. (Default: 0, which
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
353 assumes that all fragments are of the same length, given by the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
354 rounded value of --fragment-length-mean)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
355
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
356 --estimate-rspd
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
357 Set this option if you want to estimate the read start position
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
358 distribution (RSPD) from data. Otherwise, RSEM will use a uniform
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
359 RSPD. (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
360
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
361 --num-rspd-bins [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
362 Number of bins in the RSPD. Only relevant when '--estimate-rspd' is
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
363 specified. Use of the default setting is recommended. (Default: 20)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
364
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
365 --ci-memory [int]
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
366 Maximum size (in memory, MB) of the auxiliary buffer used for
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
367 computing credibility intervals (CI). Set it larger for a faster CI
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
368 calculation. However, leaving 2 GB memory free for other usage is
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
369 recommended. (Default: 1024)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
370
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
371 --keep-intermediate-files
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
372 Keep temporary files generated by RSEM. RSEM creates a temporary
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
373 directory, 'sample_name.temp', into which it puts all intermediate
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
374 output files. If this directory already exists, RSEM overwrites all
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
375 files generated by previous RSEM runs inside of it. By default,
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
376 after RSEM finishes, the temporary directory is deleted. Set this
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
377 option to prevent the deletion of this directory and the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
378 intermediate files inside of it. (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
379
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
380 --time
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
381 Output time consumed by each step of RSEM to 'sample_name.time'.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
382 (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
383
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
384 -q/--quiet
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
385 Suppress the output of logging information. (Default: off)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
386
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
387 -h/--help
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
388 Show help information.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
389
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
390 DESCRIPTION
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
391 In its default mode, this program aligns input reads against a reference
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
392 transcriptome with Bowtie and calculates expression values using the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
393 alignments. RSEM assumes the data are single-end reads with quality
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
394 scores, unless the '--paired-end' or '--no-qualities' options are
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
395 specified. Users may use an alternative aligner by specifying one of the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
396 --sam and --bam options, and providing an alignment file in the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
397 specified format. However, users should make sure that they align
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
398 against the indices generated by 'rsem-prepare-reference' and the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
399 alignment file satisfies the requirements mentioned in ARGUMENTS
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
400 section.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
401
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
402 One simple way to make the alignment file satisfying RSEM's requirements
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
403 (assuming the aligner used put mates in a paired-end read adjacent) is
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
404 to use 'convert-sam-for-rsem' script. This script only accept SAM format
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
405 files as input. If a BAM format file is obtained, please use samtools to
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
406 convert it to a SAM file first. For example, if '/ref/mouse_125' is the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
407 'reference_name' and the SAM file is named 'input.sam', you can run the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
408 following command:
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
409
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
410 convert-sam-for-rsem /ref/mouse_125 input.sam -o input_for_rsem.sam
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
411
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
412 For details, please refer to 'convert-sam-for-rsem's documentation page.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
413
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
414 The SAM/BAM format RSEM uses is v1.4. However, it is compatible with old
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
415 SAM/BAM format. However, RSEM cannot recognize 0x100 in the FLAG field.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
416 In addition, RSEM requires SEQ and QUAL are not '*'.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
417
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
418 The user must run 'rsem-prepare-reference' with the appropriate
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
419 reference before using this program.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
420
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
421 For single-end data, it is strongly recommended that the user provide
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
422 the fragment length distribution parameters (--fragment-length-mean and
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
423 --fragment-length-sd). For paired-end data, RSEM will automatically
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
424 learn a fragment length distribution from the data.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
425
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
426 Please note that some of the default values for the Bowtie parameters
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
427 are not the same as those defined for Bowtie itself.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
428
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
429 The temporary directory and all intermediate files will be removed when
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
430 RSEM finishes unless '--keep-intermediate-files' is specified.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
431
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
432 With the '--calc-ci' option, 95% credibility intervals and posterior
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
433 mean estimates will be calculated in addition to maximum likelihood
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
434 estimates.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
435
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
436 OUTPUT
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
437 sample_name.genes.results
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
438 File containing gene level expression estimates. The format of each
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
439 line in this file is:
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
440
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
441 gene_id expected_counts tau_value [pmc_value tau_pme_value
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
442 tau_ci_lower_bound tau_ci_upper_bound] transcript_id_list
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
443
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
444 Fields are separated by the tab character. Fields within "[]" are
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
445 only presented if '--calc-ci' is set. pme stands for posterior mean
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
446 estimation. pmc stands for posterior mean counts. ci_lower_bound(l)
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
447 means the lower bound of the credibility intervals,
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
448 ci_upper_bound(u) means the upper bound of the credibility
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
449 intervals. So the credibility interval is [l, u].
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
450 'transcript_id_list' is a space-separated list of transcript_ids
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
451 belonging to the gene. If no gene information is provided, this file
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
452 has the same content as 'sample_name.isoforms.results'.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
453
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
454 sample_name.isoforms.results
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
455 File containing isoform level expression values. The format of each
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
456 line in this file is:
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
457
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
458 transcript_id expected_counts tau_value [pmc_value tau_pme_value
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
459 tau_ci_lower_bound tau_ci_upper_bound] gene_id
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
460
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
461 Fields are separated by the tab character. 'gene_id' is the gene_id
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
462 of the gene which this transcript belongs to. If no gene information
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
463 is provided, 'gene_id' and 'transcript_id' are the same.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
464
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
465 sample_name.transcript.bam, sample_name.transcript.sorted.bam and
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
466 sample_name.transcript.sorted.bam.bai
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
467 Only generated when --no-bam-output is not specified.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
468
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
469 'sample_name.transcript.bam' is a BAM-formatted file of read
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
470 alignments in transcript coordinates. The MAPQ field of each
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
471 alignment is set to min(100, floor(-10 * log10(1.0 - w) + 0.5)),
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
472 where w is the posterior probability of that alignment being the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
473 true mapping of a read. In addition, RSEM pads a new tag ZW:f:value,
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
474 where value is a single precision floating number representing the
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
475 posterior probability.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
476
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
477 'sample_name.transcript.sorted.bam' and
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
478 'sample_name.transcript.sorted.bam.bai' are the sorted BAM file and
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
479 indices generated by samtools (included in RSEM package).
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
480
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
481 sample_name.genome.bam, sample_name.genome.sorted.bam and
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
482 sample_name.genome.sorted.bam.bai
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
483 Only generated when --no-bam-output is not specified and
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
484 --output-genome-bam is specified.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
485
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
486 'sample_name.genome.bam' is a BAM-formatted file of read alignments
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
487 in genomic coordinates. Alignments of reads that have identical
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
488 genomic coordinates (i.e., alignments to different isoforms that
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
489 share the same genomic region) are collapsed into one alignment. The
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
490 MAPQ field of each alignment is set to min(100, floor(-10 *
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
491 log10(1.0 - w) + 0.5)), where w is the posterior probability of that
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
492 alignment being the true mapping of a read. In addition, RSEM pads a
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
493 new tag ZW:f:value, where value is a single precision floating
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
494 number representing the posterior probability. If an alignment is
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
495 spliced, a XS:A:value tag is also added, where value is either '+'
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
496 or '-' indicating the strand of the transcript it aligns to.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
497
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
498 'sample_name.genome.sorted.bam' and
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
499 'sample_name.genome.sorted.bam.bai' are the sorted BAM file and
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
500 indices generated by samtools (included in RSEM package).
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
501
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
502 sample_name.sam.gz
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
503 Only generated when the input files are raw reads instead of SAM/BAM
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
504 format files
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
505
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
506 It is the gzipped SAM output produced by bowtie aligner.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
507
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
508 sample_name.time
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
509 Only generated when --time is specified.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
510
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
511 It contains time (in seconds) consumed by aligning reads, estimating
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
512 expression levels and calculating credibility intervals.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
513
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
514 sample_name.stat
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
515 This is a folder instead of a file. All model related statistics are
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
516 stored in this folder. Use 'rsem-plot-model' can generate plots
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
517 using this folder.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
518
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
519 EXAMPLES
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
520 Assume the path to the bowtie executables is in the user's PATH
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
521 environment variable. Reference files are under '/ref' with name
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
522 'mouse_125'.
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
523
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
524 1) '/data/mmliver.fq', single-end reads with quality scores. Quality
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
525 scores are encoded as for 'GA pipeline version >= 1.3'. We want to use 8
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
526 threads and generate a genome BAM file:
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
527
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
528 rsem-calculate-expression --phred64-quals \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
529 -p 8 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
530 --output-genome-bam \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
531 /data/mmliver.fq \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
532 /ref/mouse_125 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
533 mmliver_single_quals
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
534
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
535 2) '/data/mmliver_1.fq' and '/data/mmliver_2.fq', paired-end reads with
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
536 quality scores. Quality scores are in SANGER format. We want to use 8
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
537 threads and do not generate a genome BAM file:
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
538
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
539 rsem-calculate-expression -p 8 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
540 --paired-end \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
541 /data/mmliver_1.fq \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
542 /data/mmliver_2.fq \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
543 /ref/mouse_125 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
544 mmliver_paired_end_quals
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
545
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
546 3) '/data/mmliver.fa', single-end reads without quality scores. We want
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
547 to use 8 threads:
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
548
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
549 rsem-calculate-expression -p 8 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
550 --no-qualities \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
551 /data/mmliver.fa \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
552 /ref/mouse_125 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
553 mmliver_single_without_quals
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
554
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
555 4) Data are the same as 1). We want to take a fragment length
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
556 distribution into consideration. We set the fragment length mean to 150
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
557 and the standard deviation to 35. In addition to a BAM file, we also
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
558 want to generate credibility intervals. We allow RSEM to use 1GB of
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
559 memory for CI calculation:
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
560
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
561 rsem-calculate-expression --bowtie-path /sw/bowtie \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
562 --phred64-quals \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
563 --fragment-length-mean 150.0 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
564 --fragment-length-sd 35.0 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
565 -p 8 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
566 --output-genome-bam \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
567 --calc-ci \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
568 --ci-memory 1024 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
569 /data/mmliver.fq \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
570 /ref/mouse_125 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
571 mmliver_single_quals
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
572
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
573 5) '/data/mmliver_paired_end_quals.bam', paired-end reads with quality
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
574 scores. We want to use 8 threads:
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
575
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
576 rsem-calculate-expression --paired-end \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
577 --bam \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
578 -p 8 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
579 /data/mmliver_paired_end_quals.bam \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
580 /ref/mouse_125 \
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
581 mmliver_paired_end_quals
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
582 </help>
64d45f959303 Uploaded
jjohnson
parents:
diff changeset
583 </tool>