annotate summarize_unique_barcodes.xml @ 11:f6265e05c55c draft

Uploaded
author nikos
date Wed, 05 Nov 2014 10:00:47 -0500
parents 33e625bef2b9
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
10
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
1 <tool id="rna_probing_summarize" version="1.0.0" name="Summarize Unique Barcodes" force_history_refresh="True">
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
2 <description></description>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
3
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
4 <requirements>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
5 <requirement type="package" version="4.1.0">gnu_awk</requirement>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
6 <requirement type="package" version="0.1.19">samtools</requirement>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
7 <requirement type="package" version="3.1.1">R_3_1_1</requirement>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
8 <requirement type="set_environment">RNA_PROBING_SCRIPT_PATH</requirement>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
9 </requirements>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
10
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
11 <command interpreter="bash">
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
12 summarize_unique_barcodes.sh
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
13
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
14 ## Inputs
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
15 -f $input1 -b $input2
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
16
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
17 ##
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
18
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
19 #if str( $k2n ) == 'True':
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
20 -k
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
21 #end if
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
22
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
23 #if str( $priming.flag ) == 'True':
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
24 -p $priming.position
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
25 #end if
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
26
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
27 #if str( $trimming ) == 'True':
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
28 -t
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
29 #end if
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
30
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
31 -r \$RNA_PROBING_SCRIPT_PATH
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
32 </command>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
33
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
34 <!-- basic error handling -->
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
35 <stdio>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
36 <regex match="Error" level="fatal" description="" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
37 </stdio>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
38
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
39 <inputs>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
40 <param format="bam" name="input1" type="data" label="Aligned Reads" help="BAM format." />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
41 <param format="tabular" name="input2" type="data" optional="True" label="Barcodes" help="Produced by Debarcoding tool." />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
42 <param name="k2n" type="boolean" checked="False" truevalue="True" falsevalue="False" label="Produce k2n file" help="Check the box if you ran the tool and received a warning message to produce the k2n file. Necessary if you want to use 'HRF-Seq' method in 'Normalize' tool. Warning: Can be very slow!" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
43 <param name="trimming" type="boolean" checked="True" truevalue="True" falsevalue="False" label="Trim untemplated nucleotides" help="" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
44 <conditional name="priming">
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
45 <param name="flag" type="select" label="Set priming position" help="Set the priming position manually.">
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
46 <option value="False">No</option>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
47 <option value="True">Yes</option>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
48 </param>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
49 <when value="True">
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
50 <param name="position" type="integer" value="0" min="0" label="Priming position" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
51 </when>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
52 <when value="False" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
53 </conditional>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
54 </inputs>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
55
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
56 <outputs>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
57 <data format="tabular" name="trimming_stats" label="${tool.name} on ${on_string}: Trimming stats" from_work_dir="output_dir/trimming_stats.txt">
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
58 <filter>trimming is True</filter>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
59 </data>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
60 <data format="tabular" name="unique_barcodes" label="${tool.name} on ${on_string}: Unique Barcodes" from_work_dir="output_dir/unique_barcodes.txt">
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
61 <filter> input2 != None </filter>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
62 </data>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
63 <data format="tabular" name="read_counts" label="${tool.name} on ${on_string}: Read Counts" from_work_dir="output_dir/read_counts.txt" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
64 <data format="txt" name="k2n_file" label="${tool.name} on ${on_string}: k2n file" from_work_dir="output_dir/k2n.txt">
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
65 <filter> k2n is True </filter>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
66 </data>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
67 </outputs>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
68
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
69 <tests>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
70 <test>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
71 <param name="input1" value="aligned.bam" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
72 <param name="input2" value="barcodes.txt" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
73 <param name="k2n" value="True" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
74 <param name="trimming" value="True" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
75 <output name="trimming_stats" file="trimming_stats.txt" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
76 <output name="unique_barcodes" file="unique_barcodes.txt" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
77 <output name="read_counts" file="read_counts.txt" />
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
78 </test>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
79 </tests>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
80
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
81 <help>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
82 **What it does**
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
83
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
84 *Summarize Unique Barcodes* counts the number of unique random barcodes and reads associated with each sequenced fragment. A fragment is understood as 1) a pair consisting of a Reverse Transcriptase (RT) termination site and an RT priming site in paired-end sequencing, or 2) an RT termination site in single-end sequencing. For non-barcoded sequencing, it only counts the reads matching each fragment.
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
85
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
86 ------
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
87
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
88 **Inputs**
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
89
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
90 *Summarize Unique Barcodes* takes a file containing the Aligned Reads in BAM_ format (required) and a tabular file with the Barcodes (optional) produced by the *Preprocessing* tool of the *RNA probing* suite.
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
91
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
92 .. _BAM: http://samtools.github.io/hts-specs/SAMv1.pdf
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
93
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
94 -------
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
95
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
96 **Parameters**
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
97
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
98 **Produce k2n file** - A file that contains a sequence of numbers where the n-th element tells how many unique cDNA molecules give rise to observing n unique barcodes in a given sample. Required for calculating Estimated Unique Counts (EUCs) in the *Normalize* tool.
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
99
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
100 **Trim untemplated nucleotides** - Untemplated nucleotides can be added to cDNA 3’ ends via the terminal transferase activity of reverse transcriptase, which offsets the location of the read-end mapping and leads to erroneous assignment of reactivity information to nucleotides upstream of those which have reacted (Schmidt and Mueller, 1999; Talkish et al., 2014). Turning this parameter on will remove those nucleotides.
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
101
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
102 Recommended for methods based on detecting reverse transcription termination sites (e.g. DMS-Seq, HRF-Seq or SHAPE-Seq), and not for methods based on ligating the linker directly to RNA (e.g. PARS or FragSeq).
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
103
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
104 **Set priming position** - Applicable when the priming site is fixed.
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
105
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
106 ------
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
107
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
108 **Outputs**
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
109
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
110 **Unique Barcodes** (if a Barcode file is given) is a tabular file with 4 columns.
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
111
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
112 ====== ==========================================================
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
113 Column Description
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
114 ====== ==========================================================
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
115 1 Transcript identifier
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
116 2 RT termination site (start)
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
117 3 RT priming site (end)
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
118 4 Count of unique barcodes associated with fragments matching the first three columns
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
119 ====== ==========================================================
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
120
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
121 .
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
122
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
123 **Read Counts** is similar to Unique Barcodes, but the fourth column is a count of reads matching the first three columns.
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
124
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
125 **k2n file** as described above.
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
126
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
127 **Trimming Stats** reports statistics of trimming untemplated nucleotides from read ends.
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
128
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
129 </help>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
130
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
131 <citations>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
132 <citation type="doi">10.1093/nar/gku167</citation>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
133 <citation type="doi">10.1093/nar/27.21.e31-i</citation>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
134 <citation type="doi">10.1261/rna.042218.113</citation>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
135 </citations>
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
136
33e625bef2b9 Uploaded
nikos
parents:
diff changeset
137 </tool>