annotate inner_distance.xml @ 5:31a43978eaa9 draft default tip

Uploaded
author bgruening
date Sat, 25 Apr 2015 10:07:21 -0400
parents 49ed5952a8b8
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
1 <tool id="rseqc_inner_distance" name="Inner Distance" version="2.4">
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
2 <description>calculate the inner distance (or insert size) between two paired RNA reads</description>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
3 <requirements>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
4 <requirement type="package" version="3.0.3">R</requirement>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
5 <requirement type="package" version="1.7.1">numpy</requirement>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
6 <requirement type="package" version="2.4">rseqc</requirement>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
7 </requirements>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
8 <command>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
9 inner_distance.py -i $input -o output -r $refgene
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
10
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
11 #if $bounds.hasLowerBound
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
12 -l $bounds.lowerBound
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
13 #end if
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
14
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
15 #if $bounds2.hasUpperBound
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
16 -u $bounds2.upperBound
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
17 #end if
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
18
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
19 #if $steps.step
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
20 -s $steps.stepSize
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
21 #end if
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
22 </command>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
23 <stdio>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
24 <exit_code range="1:" level="fatal" description="An error occured during execution, see stderr and stdout for more information" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
25 <regex match="[Ee]rror" source="both" description="An error occured during execution, see stderr and stdout for more information" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
26 </stdio>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
27 <inputs>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
28 <param name="input" type="data" format="bam,sam" label="input bam/sam file" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
29 <param name="refgene" type="data" format="bed" label="reference gene model" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
30 <conditional name="bounds">
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
31 <param name="hasLowerBound" type="boolean" label="Specify lower bound" value="false"/>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
32 <when value="true">
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
33 <param name="lowerBound" type="integer" value="-250" label="Estimated Lower Bound (bp, default=-250)" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
34 </when>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
35 </conditional>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
36 <conditional name="bounds2">
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
37 <param name="hasUpperBound" type="boolean" label="Specify upper bound" value="false" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
38 <when value="true">
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
39 <param name="upperBound" type="integer" value="250" label="Estimated Upper Bound (bp, default=250)" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
40 </when>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
41 </conditional>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
42 <conditional name="steps">
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
43 <param name="step" type="boolean" label="Specify step size" value="false" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
44 <when value="true">
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
45 <param name="stepSize" type="integer" value="5" label="Step size (bp, default=5)" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
46 </when>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
47 </conditional>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
48 </inputs>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
49 <outputs>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
50 <data format="txt" name="outputtxt" from_work_dir="output.inner_distance.txt" label="${tool.name} on ${on_string} (Text)"/>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
51 <data format="txt" name="outputfreqtxt" from_work_dir="output.inner_distance_freq.txt" label="${tool.name} on ${on_string} (Freq Text)" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
52 <data format="pdf" name="outputpdf" from_work_dir="output.inner_distance_plot.pdf" label="${tool.name} on ${on_string} (PDF)" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
53 <data format="txt" name="outputr" from_work_dir="output.inner_distance_plot.r" label="${tool.name} on ${on_string} (R Script)" />
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
54 </outputs>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
55 <help>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
56 inner_distance.py
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
57 +++++++++++++++++
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
58
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
59 This module is used to calculate the inner distance (or insert size) between two paired RNA
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
60 reads. The distance is the mRNA length between two paired fragments. We first determine the
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
61 genomic (DNA) size between two paired reads: D_size = read2_start - read1_end, then
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
62
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
63 * if two paired reads map to the same exon: inner distance = D_size
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
64 * if two paired reads map to different exons: inner distance = D_size - intron_size
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
65 * if two paired reads map to a non-exonic region (such as an intron or intergenic region): inner distance = D_size
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
66 * The inner distance may be a negative value if the two fragments overlap.
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
67
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
68 NOTE: Not all read pairs are used to estimate the inner distance distribution. Low-quality
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
69 reads, PCR duplicates, and multi-mapped reads are skipped.
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
70
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
71 Inputs
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
72 ++++++++++++++
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
73
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
74 Input BAM/SAM file
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
75 Alignment file in BAM/SAM format.
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
76
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
77 Reference gene model
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
78 Gene model in BED format.
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
79
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
80 Estimated Upper/Lower Bounds (defaults=250 and -250)
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
81 Estimated upper/lower bounds of inner distance (bp).
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
82
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
83 Step size (default=5)
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
84 Step size of histogram
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
85
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
86
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
87 Output
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
88 ++++++++++++++
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
89
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
90 1. output.inner_distance.txt:
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
91 - first column is read ID
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
92 - second column is inner distance. Could be a negative value if the PE reads overlap or because of a mapping error (e.g. Read1_start &lt; Read2_start, while Read1_end >> Read2_end due to spliced mapping of read1)
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
93 - third column indicates how paired reads were mapped: PE_within_same_exon, PE_within_diff_exon, PE_reads_overlap
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
94 2. output.inner_distance_freq.txt:
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
95 - inner distance starts
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
96 - inner distance ends
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
97 - number of read pairs
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
98 - note the first 2 columns are left side half open interval
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
99 3. output.inner_distance_plot.r: R script to generate histogram
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
100 4. output.inner_distance_plot.pdf: histogram plot
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
101
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
102 .. image:: http://rseqc.sourceforge.net/_images/inner_distance.png
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
103 :height: 600 px
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
104 :width: 600 px
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
105 :scale: 80 %
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
106
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
107
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
108 -----
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
109
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
110 About RSeQC
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
111 +++++++++++
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
112
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
113 The RSeQC_ package provides a number of useful modules that can comprehensively evaluate high throughput sequence data especially RNA-seq data. "Basic modules" quickly inspect sequence quality, nucleotide composition bias, PCR bias and GC bias, while "RNA-seq specific modules" investigate sequencing saturation status of both splicing junction detection and expression estimation, mapped reads clipping profile, mapped reads distribution, coverage uniformity over gene body, reproducibility, strand specificity and splice junction annotation.
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
114
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
115 The RSeQC package is licensed under the GNU GPL v3 license.
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
116
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
117 .. image:: http://rseqc.sourceforge.net/_static/logo.png
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
118
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
119 .. _RSeQC: http://rseqc.sourceforge.net/
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
120
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
121
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
122 </help>
49ed5952a8b8 Uploaded
lparsons
parents:
diff changeset
123 </tool>