annotate star_fusion.xml @ 0:5ff7593a7220 draft

Uploaded
author jjohnson
date Wed, 04 Oct 2017 15:23:36 -0400
parents
children 5748e43a73e0
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
1 <tool id="star_fusion" name="STAR-Fusion" version="1.1.0" profile="17.01">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
2 <description>detect fusion genes in RNA-Seq data</description>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
3 <requirements>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
4 <!-- Bio-conda -->
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
5 <requirement type="package" version="1.1.0">star-fusion</requirement>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
6 </requirements>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
7
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
8 <stdio>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
9 <regex match="command not found" source="stderr" level="fatal"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
10 <regex match="EXITING because of INPUT ERROR" source="stderr" level="fatal"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
11 <regex match="FATAL ERROR" source="stderr" level="fatal"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
12
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
13 <regex match="Warning:" source="stderr" level="warning"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
14 <regex match="CMD:" source="stderr" level="warning"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
15
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
16 <regex match="-done creating index file:" source="stderr" level="warning"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
17 <regex match="-parsing GTF file:" source="stderr" level="warning"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
18 <regex match="-building interval tree" source="stderr" level="warning"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
19 <regex match="-parsing fusion evidence:" source="stderr" level="warning"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
20 <regex match="-mapping reads to genes" source="stderr" level="warning"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
21 <regex match="-outputting fusion candidates to file:" source="stderr" level="warning"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
22
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
23 <regex match="Process complete" source="stderr" level="warning"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
24 </stdio>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
25
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
26 <version_command>STAR-Fusion --version 2>&amp;1 | grep version | grep -o -E "software version.*?"</version_command>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
27
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
28 <command><![CDATA[
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
29 #if reference.reference_type_selector == 'cached':
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
30 ln -s '$reference.ctat_resource_lib' tmp_star_fusion_genome_dir
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
31 #else
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
32 ## 1. ensure the blastn file is provided as *.gz
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
33 if file --mime-type '${reference.blast_pairs}' | grep -q /gzip\$; then
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
34 gzip_suffix='' ;
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
35 else
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
36 ## Older versions of gzip do not support the -k option to keep
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
37 ## the original file - this should be an universion solution
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
38
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
39 gzip -1 -c -- '${reference.blast_pairs}' > '${reference.blast_pairs}.gz' &&
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
40 gzip_suffix='.gz' ;
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
41 fi &&
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
42
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
43 ## 2. create reference index - using \$(pwd) is necessary, probably because the perl script changes work directory
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
44 ## - @todo once write a decent STAR and STAR Fusion data manager
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
45 prep_genome_lib.pl
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
46 --genome_fa '${reference.fasta_type.ownFile}'
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
47 --gtf '${reference.geneModel}'
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
48 --blast_pairs "${reference.blast_pairs}\$gzip_suffix"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
49 --CPU \${GALAXY_SLOTS:-1}
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
50 --output_dir "\$(pwd)/tmp_star_fusion_genome_dir"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
51 #end if
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
52 &&
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
53
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
54 ## Link in fastq files so they have appropriate extensions
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
55 #if str($input_params.input_source) != "use_chimeric":
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
56 #if $input_params.left_fq.is_of_type("fastq.gz"):
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
57 #set read1 = 'input_1.fastq.gz'
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
58 #else:
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
59 #set read1 = 'input_1.fastq'
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
60 #end if
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
61 ln -f -s '${input_params.left_fq}' ${read1} &&
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
62
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
63 #if $input_params.right_fq:
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
64 #if $input_params.right_fq.is_of_type("fastq.gz"):
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
65 #set read2 = 'input_2.fastq.gz'
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
66 #else:
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
67 #set read2 = 'input_2.fastq'
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
68 #end if
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
69 ln -f -s '${input_params.right_fq}' ${read2} &&
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
70 #end if
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
71 #end if
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
72
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
73 ## 3. Run STAR-Fusion
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
74 STAR-Fusion
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
75 #if str($input_params.input_source) == "use_chimeric":
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
76 --chimeric_junction '${input_params.chimeric_junction}'
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
77 #else:
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
78 --left_fq ${read1}
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
79 #if $input_params.right_fq:
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
80 --right_fq ${read2}
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
81 #end if
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
82 #end if
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
83
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
84 --genome_lib_dir "\$(pwd)/tmp_star_fusion_genome_dir"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
85
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
86 str($input_params.optional_outputs).replace(',',' ')
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
87
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
88 #if str($params.settingsType) == "full":
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
89 --min_junction_reads $params.min_junction_reads
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
90 --min_sum_frags $params.min_sum_frags
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
91 --max_promiscuity $params.max_promiscuity
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
92 --min_novel_junction_support $params.min_novel_junction_support
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
93 --min_alt_pct_junction $params.min_alt_pct_junction
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
94 --aggregate_novel_junction_dist $params.aggregate_novel_junction_dist
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
95 --E $params.E
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
96 #end if
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
97 --CPU \${GALAXY_SLOTS:-1}
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
98 ]]></command>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
99
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
100 <inputs>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
101 <conditional name="reference">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
102 <param name="reference_type_selector" type="select" label="Star Fusion Genome Reference Source">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
103 <option value="cached">Locally Cached sequences</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
104 <option value="build" selected="true">Sequences from your history</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
105 </param>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
106 <when value="cached">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
107 <param name="ctat_resource_lib" type="select" label="Genome to search">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
108 <options from_data_table="ctat_resource">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
109 <column name="dbkey" index="1"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
110 <column name="name" index="2"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
111 <column name="value" index="3"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
112 </options>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
113 </param>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
114 </when>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
115 <when value="build">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
116 <!-- Genome source. -->
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
117 <conditional name="fasta_type">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
118 <param name="fasta_type_selector" type="select" label="Source for sequence to search">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
119 <option value="cached">Locally Cached sequences</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
120 <option value="history" selected="true">Sequences from your history</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
121 </param>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
122 <when value="cached">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
123 <param name="ownFile"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
124 type="select" label="Genome to search">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
125 <options from_data_table="all_fasta">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
126 <column name="dbkey" index="1"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
127 <column name="name" index="2"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
128 <column name="value" index="3"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
129 </options>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
130 </param>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
131 </when>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
132 <when value="history">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
133 <param name="ownFile"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
134 type="data"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
135 format="fasta"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
136 label="Select the reference genome (FASTA file)"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
137 </when>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
138 </conditional>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
139 <param name="geneModel"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
140 type="data"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
141 format="gff3,gtf"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
142 label="Gene model (gff3,gtf) file for splice junctions and fusion gene detection"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
143 <param name="blast_pairs"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
144 type="data"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
145 format="tabular"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
146 label="Result of BLAST+-blastn of the reference fasta sequence with itself"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
147 help="Run blastn with '-outputfmt 6' or choose 'Tabular (standard 12 columns)' in the Galaxy wrapper. For human data it is recommended to obtain it from here: https://data.broadinstitute.org/Trinity/CTAT_RESOURCE_LIB/"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
148 </when>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
149 </conditional>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
150
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
151
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
152 <conditional name="input_params">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
153 <param name="input_source"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
154 type="select"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
155 label="Use output from earlier STAR run or let STAR Fusion control running STAR">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
156 <option value="use_chimeric">Use output from earlier STAR</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
157 <option value="use_fastq">Let STAR Fusion control running STAR</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
158 </param>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
159 <when value="use_chimeric">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
160 <param name="chimeric_junction"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
161 type="data"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
162 format="interval"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
163 argument="--chimeric_junction"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
164 label="Chimeric junction file from STAR (with STAR-Fusion settings)"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
165 <param name="optional_outputs" type="select" multiple="true" label="Additional Outputs">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
166 <option value="--annotate">--annotate</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
167 <option value="--examine_coding_effect">--examine_coding_effect</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
168 </param>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
169 </when>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
170 <when value="use_fastq">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
171 <param name="left_fq"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
172 type="data"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
173 format="fastqsanger,fastqsanger.gz"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
174 argument="--left_fq"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
175 label="left.fq file"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
176 <param name="right_fq"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
177 type="data"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
178 format="fastqsanger,fastqsanger.gz"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
179 optional="true"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
180 argument="--right_fq"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
181 label="right.fq file (actually optional, but highly recommended)"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
182 <param name="optional_outputs" type="select" multiple="true" label="Additional Outputs">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
183 <option value="--annotate">--annotate</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
184 <option value="--examine_coding_effect">--examine_coding_effect</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
185 <option value="--extract_fusion_reads">--extract_fusion_reads</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
186 </param>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
187 </when>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
188 </conditional>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
189
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
190 <conditional name="params">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
191 <param name="settingsType" type="select" label="Settings to use" help="You can use the default settings or set custom values for any STAR Fusion parameter.">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
192 <option value="default" selected="true">Use Defaults</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
193 <option value="full">Full parameter list</option>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
194 </param>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
195 <when value="default" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
196 <when value="full"><!-- Full/advanced params. -->
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
197 <param name="min_junction_reads"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
198 type="integer" value="1"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
199 label="minimum number of junction-spanning reads required."
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
200 argument="--min_junction_reads"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
201 <param name="min_sum_frags"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
202 type="integer"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
203 value="2"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
204 label="minimum fusion support = (#junction_reads + #spanning_frags)"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
205 argument="--min_sum_frags"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
206 <param name="max_promiscuity"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
207 type="integer"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
208 value="3"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
209 label="maximum number of partners allowed for a given fusion"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
210 argument="--max_promiscuity"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
211 <param name="min_novel_junction_support"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
212 type="integer"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
213 value="3"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
214 label="minimum of 3 junction reads required if breakpoint lacks involvement of only reference junctions"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
215 argument="--min_novel_junction_support"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
216 <param name="min_alt_pct_junction"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
217 type="float"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
218 value="10"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
219 label="10% of the dominant isoform junction support"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
220 argument="--min_alt_pct_junction"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
221 <param name="aggregate_novel_junction_dist"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
222 type="integer"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
223 value="5"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
224 label="non-ref junctions within 5 are merged into single calls"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
225 argument="--aggregate_novel_junction_dist"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
226 <param name="E"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
227 type="float"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
228 value="0.001"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
229 label="E-value threshold for blast searches"
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
230 argument="-E"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
231 </when>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
232 </conditional>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
233 </inputs>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
234
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
235 <outputs>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
236 <data format="bam" name="out_bam" label="${tool.name} on ${on_string}: Aligned.sortedByCoord.out.bam" from_work_dir="star-fusion.fusion_candidates.final"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
237 <data format="fastqsanger" name="output_reads_1" label="${tool.name} on ${on_string}: fusion_evidence_reads_1" from_work_dir="star-fusion.fusion_evidence_reads_1.fq">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
238 <filter>input_params['input_source'] == 'use_fastq' and str(input_params['optional_outputs']).find('extract_fusion_reads') > 0</filter>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
239 </data>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
240 <data format="fastqsanger" name="output_reads_2" label="${tool.name} on ${on_string}: fusion_evidence_reads_2" from_work_dir="star-fusion.fusion_evidence_reads_2.fq">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
241 <filter>input_params['input_source'] == 'use_fastq' and str(input_params['optional_outputs']).find('extract_fusion_reads') > 0</filter>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
242 </data>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
243 <data format="tabular" name="output_final" label="${tool.name} on ${on_string}: fusion_predictions.tsv" from_work_dir="star-fusion.fusion_predictions.tsv"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
244 <data format="tabular" name="output_final" label="${tool.name} on ${on_string}: fusion_predictions.abridged.tsv" from_work_dir="star-fusion.fusion_predictions.abridged.tsv"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
245 <data format="tabular" name="output_final" label="${tool.name} on ${on_string}: fusion_predictions.abridged.annotated.tsv" from_work_dir="star-fusion.fusion_predictions.abridged.annotated.tsv">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
246 <filter>str(input_params['optional_outputs']).find('annotate') > 0 and not str(input_params['optional_outputs']).find('examine_coding_effect') > 0</filter>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
247 </data>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
248 <data format="tabular" name="output_final" label="${tool.name} on ${on_string}: fusion_predictions.abridged.coding_effect.tsv" from_work_dir="star-fusion.fusion_predictions.abridged.coding_effect.tsv">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
249 <filter>str(input_params['optional_outputs']).find('examine_coding_effect') > 0 and not str(input_params['optional_outputs']).find('annotate') > 0</filter>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
250 </data>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
251 <data format="tabular" name="output_final" label="${tool.name} on ${on_string}: fusion_predictions.abridged.annotated.coding_effect.tsv" from_work_dir="star-fusion.fusion_predictions.abridged.annotated.coding_effect.tsv">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
252 <filter>str(input_params['optional_outputs']).find('annotate') > 0 and str(input_params['optional_outputs']).find('examine_coding_effect') > 0</filter>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
253 </data>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
254 </outputs>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
255
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
256 <tests>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
257 <test>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
258 <param name="input_source" value="use_chimeric" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
259 <param name="chimeric_junction" ftype="interval" value="test1.tabular" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
260 <param name="fasta_type_selector" value="history" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
261 <param name="ownFile" ftype="fasta" value="test1.fa" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
262 <param name="geneModel" ftype="gtf" value="test1.gtf" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
263 <param name="blast_pairs" ftype="tabular" value="test1-test1.blastn.tabular" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
264 <param name="settingsType" value="default" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
265
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
266 <!-- Last column of the results contains data in a random order so exact matching is not feasible -->
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
267 <output name="output_final">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
268 <assert_contents>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
269 <has_line line="#fusion_name&#009;JunctionReads&#009;SpanningFrags&#009;Splice_type&#009;LeftGene&#009;LeftBreakpoint&#009;RightGene&#009;RightBreakpoint&#009;JunctionReads&#009;SpanningFrags" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
270 <has_text text="GENE1--GENE2&#009;24&#009;0&#009;INCL_NON_REF_SPLICE&#009;GENE1^GENE1&#009;chr1:240:+&#009;GENE2^GENE2&#009;chr2:241:+" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
271 </assert_contents>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
272 </output>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
273 </test>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
274 <test>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
275 <param name="input_source" value="use_fastq" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
276 <param name="left_fq" ftype="fastqsanger" value="test1.fastqsanger"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
277 <param name="fasta_type_selector" value="history" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
278 <param name="ownFile" ftype="fasta" value="test1.fa" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
279 <param name="geneModel" ftype="gtf" value="test1.gtf" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
280 <param name="blast_pairs" ftype="tabular" value="test1-test1.blastn.tabular" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
281 <param name="settingsType" value="default" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
282
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
283 <!-- Last column of the results contains data in a random order so exact matching is not feasible -->
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
284 <output name="output_final">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
285 <assert_contents>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
286 <has_line line="#fusion_name&#009;JunctionReads&#009;SpanningFrags&#009;Splice_type&#009;LeftGene&#009;LeftBreakpoint&#009;RightGene&#009;RightBreakpoint&#009;JunctionReads&#009;SpanningFrags" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
287 <has_text text="GENE1--GENE2&#009;24&#009;0&#009;INCL_NON_REF_SPLICE&#009;GENE1^GENE1&#009;chr1:240:+&#009;GENE2^GENE2&#009;chr2:241:+" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
288 </assert_contents>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
289 </output>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
290 </test>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
291 <test>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
292 <param name="input_source" value="use_fastq" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
293 <param name="left_fq" ftype="fastqsanger.gz" value="test1.fastqsanger.gz"/>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
294 <param name="fasta_type_selector" value="history" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
295 <param name="ownFile" ftype="fasta" value="test1.fa" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
296 <param name="geneModel" ftype="gtf" value="test1.gtf" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
297 <param name="blast_pairs" ftype="tabular" value="test1-test1.blastn.tabular" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
298 <param name="settingsType" value="default" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
299
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
300 <!-- Last column of the results contains data in a random order so exact matching is not feasible -->
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
301 <output name="output_final">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
302 <assert_contents>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
303 <has_line line="#fusion_name&#009;JunctionReads&#009;SpanningFrags&#009;Splice_type&#009;LeftGene&#009;LeftBreakpoint&#009;RightGene&#009;RightBreakpoint&#009;JunctionReads&#009;SpanningFrags" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
304 <has_text text="GENE1--GENE2&#009;24&#009;0&#009;INCL_NON_REF_SPLICE&#009;GENE1^GENE1&#009;chr1:240:+&#009;GENE2^GENE2&#009;chr2:241:+" />
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
305 </assert_contents>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
306 </output>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
307 </test>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
308 </tests>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
309 <help>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
310 **What it does**
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
311
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
312 STAR-Fusion is a component of the Trinity Cancer Transcriptome Analysis Toolkit (CTAT). STAR-Fusion uses the STAR aligner to identify candidate fusion transcripts supported by Illumina reads. STAR-Fusion further processes the output generated by the STAR aligner to map junction reads and spanning reads to a reference annotation set.
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
313
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
314 **Input: files required to run STAR-Fusion**
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
315 - A genome reference sequence (FASTA-format)
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
316 - A corresponding protein-coding gene annotation set (GTF/GFF Format)
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
317 - A last-matching gene pairs file - in Galaxy you can create such files with the *ncbi_blast_plus* tool suite containing *blastn*: https://toolshed.g2.bx.psu.edu/view/devteam/ncbi_blast_plus
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
318 - A STAR chimeric/junction output file - this is optional as STAR Fusion can control running STAR as well.
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
319
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
320 The authors of STAR Fusion have made some of these files avaialble at: https://data.broadinstitute.org/Trinity/CTAT_RESOURCE_LIB/. The gene annotations in each case are restricted to the protein-coding and lincRNA transcripts.
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
321 More info: https://github.com/STAR-Fusion/STAR-Fusion/wiki
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
322
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
323 </help>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
324
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
325 <citations>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
326 <citation type="bibtex">
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
327 @unpublished{star_fusion,
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
328 author = {Brian Haas and Nicolas Stransky and Daniel Nicorici},
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
329 title = {STAR-Fusion},
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
330 url = {https://github.com/STAR-Fusion/STAR-Fusion}
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
331 }
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
332 </citation>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
333 </citations>
5ff7593a7220 Uploaded
jjohnson
parents:
diff changeset
334 </tool>