annotate strelka.xml @ 0:88141dfd5db1 draft

Uploaded
author morinlab
date Thu, 18 Aug 2016 19:34:55 -0400
parents
children 9c9f2706c5e1
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
1 <tool id="strelka" name="Strelka" version="1.0.14">
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
2 <description>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
3 detects somatic SNVs and small indels in tumour/normal pairs
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
4 </description>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
5 <macros>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
6 <import>citations.xml</import>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
7 </macros>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
8 <requirements>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
9 <requirement type="set_environment">STRELKA_INSTALL_DIR</requirement>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
10 <requirement type="set_environment">STRELKA_REPOSITORY_DIR</requirement>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
11 </requirements>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
12 <command detect_errors="aggressive">
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
13
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
14 <!-- LINK BAM INDEX -->
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
15 ln -s $normal normal.bam;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
16 ln -s $normal.metadata.bam_index normal.bam.bai;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
17 ln -s $tumour tumour.bam;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
18 ln -s $tumour.metadata.bam_index tumour.bam.bai;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
19
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
20 <!-- CREATE CONFIG FILE -->
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
21 touch config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
22 #if #depthfilters == "genome":
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
23 echo "isSkipDepthFilters = 0" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
24 echo "maxInputDepth = 10000" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
25 echo "depthFilterMultiple = 3.0" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
26 #elif #depthfilters == "exome":
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
27 echo "isSkipDepthFilters = 1" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
28 echo "maxInputDepth = 10000" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
29 echo "depthFilterMultiple = 3.0" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
30 #elif #depthfilters == "targeted":
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
31 echo "isSkipDepthFilters = 1" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
32 echo "maxInputDepth = 10000" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
33 echo "depthFilterMultiple = 3.0" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
34 #else:
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
35 echo "isSkipDepthFilters = "$isSkipDepthFilters >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
36 echo "maxInputDepth = "$maxInputDepth >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
37 echo "depthFilterMultiple = "$depthFilterMultiple >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
38 #end if
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
39 echo "snvMaxFilteredBasecallFrac = "$advancedsettings.snvMaxFilteredBasecallFrac >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
40 echo "snvMaxSpanningDeletionFrac = "$advancedsettings.snvMaxSpanningDeletionFrac >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
41 echo "indelMaxRefRepeat = "$advancedsettings.indelMaxRefRepeat >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
42 echo "indelMaxWindowFilteredBasecallFrac = "$advancedsettings.indelMaxWindowFilteredBasecallFrac >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
43 echo "indelMaxIntHpolLength = "$advancedsettings.indelMaxIntHpolLength >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
44 echo "ssnvPrior = "$advancedsettings.ssnvPrior >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
45 echo "sindelPrior = "$advancedsettings.sindelPrior >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
46 echo "ssnvNoise = "$advancedsettings.ssnvNoise >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
47 echo "sindelNoise = "$advancedsettings.sindelNoise >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
48 echo "ssnvNoiseStrandBiasFrac = "$advancedsettings.ssnvNoiseStrandBiasFrac >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
49 echo "minTier1Mapq = "$advancedsettings.minTier1Mapq >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
50 echo "minTier2Mapq = "$advancedsettings.minTier2Mapq >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
51 echo "ssnvQuality_LowerBound = "$advancedsettings.ssnvQuality_LowerBound >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
52 echo "sindelQuality_LowerBound = "$advancedsettings.sindelQuality_LowerBound >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
53 echo "isWriteRealignedBam = 0" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
54 echo "binSize = 25000000" >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
55 echo "extraStrelkaArguments = " >> config.ini;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
56
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
57 <!-- INDEX GENOME IF HISTORY -->
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
58 #if $reference_source == "history":
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
59 ln -s $reference_source.ref_file ref.fa;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
60 samtools faidx ref.fa;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
61 #end if
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
62
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
63 <!-- CREATE ORIGINAL STRELKA MAKEFILE -->
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
64 \$STRELKA_INSTALL_DIR/bin/configureStrelkaWorkflow.pl
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
65 --normal \$(pwd)/normal.bam
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
66 --tumor \$(pwd)/tumour.bam
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
67 #if $reference_source == "history":
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
68 --ref ref.fa
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
69 #else:
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
70 --ref ${reference_source.ref_file.fields.path}
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
71 #end if
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
72 --config \$(pwd)/config.ini
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
73
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
74 #if $interval_file
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
75
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
76 <!-- CREATE SUB-MAKEFILE IF PARALLELISM TURNED ON -->
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
77 cp ./strelkaAnalysis/Makefile ./;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
78
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
79 \$REPOSITORY_STRELKA_DIR/parse_strelka_makefile.py
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
80 --makefile Makefile
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
81 --chrom \$(cat $interval_file | cut -f1)
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
82 --output ./strelkaAnalysis/Makefile;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
83
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
84 #end if
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
85
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
86 <!-- RUN STRELKA -->
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
87 cd strelkaAnalysis;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
88 make -j \${GALAXY_SLOTS:-1};
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
89
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
90 #if $interval_file
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
91
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
92 <!-- OUTPUT FOR PARALLEL OPTION - TO BE MERGED -->
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
93 cat ./chromosomes/\$(cat $interval_file | cut -f1)/all.somatic.snvs.vcf > $snvs;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
94 cat ./chromosomes/\$(cat $interval_file | cut -f1)/all.somatic.indels.vcf > $indels;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
95
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
96 #else
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
97
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
98 <!-- OUTPUT FOR NORMAL OPTION - ALREADY MERGED -->
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
99 cat ./results/all.somatic.snvs.vcf > $snvs;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
100 cat ./results/all.somatic.indels.vcf > $indels;
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
101
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
102 #end if
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
103 </command>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
104 <inputs>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
105 <conditional name="reference_source">
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
106 <param label="Choose the source for the reference genome" name="reference_source_selector" type="select">
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
107 <option value="cached">Use a built-in genome</option>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
108 <option value="history">Use a genome from the history</option>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
109 </param>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
110 <when value="cached">
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
111 <param label="Reference Genome File" name="ref_file" type="select" >
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
112 <options from_data_table="fasta_indexes" />
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
113 </param>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
114 </when>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
115 <when value="history">
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
116 <param label="Reference Genome File" name="ref_file" type="data" format="fasta" />
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
117 </when>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
118 </conditional>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
119 <param type="data" format="bam" name="normal" label="Normal Alignment File" />
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
120 <param type="data" format="bam" name="tumour" label="Tumour Alignment File" />
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
121 <param type="data" format="txt" optional="true" name="interval_file" label="Chromosomes" help="Restrict SNV calls to the following list of chromosomes (one per line)" />
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
122 <conditional type="depthfilters">
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
123 <param type="select" name="seqType" label="What Type of Sequencing?">
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
124 <option value="genome" selected="true">Whole Genome</option>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
125 <option value="exome">Exome</option>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
126 <option value="targeted">Targeted</option>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
127 <option value="other">What are you hiding from me?</option>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
128 </param>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
129 <when value="other">
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
130 <param name="isSkipDepthFilters" type="boolean" label="Skip Reads Above Depth Threshold?" help="Should we skip reads if they exist above the chromosome average depth multiplied by the Depth Filter Multiple? Should only be true for Whole Genome Sequencing." checked="true" truevalue="0" falsevalue="1"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
131 <param name="depthFilterMultiple" type="float" label="Depth Filter Multiple" value="3.0"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
132 <param name="maxInputDepth" type="integer" label="Max Input Depth" value="10000" help="The upper bound on input depth to load into memory. This filter should not occur with Deep Targeted Sequencing but should occur with Exome or Whole Genome Sequencing. Set to 0 to turn off" min="0"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
133 </when>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
134 </conditional>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
135 <section name="advancedsettings" title="Advanced Settings" expanded="False">
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
136 <param type="float" name="snvMaxFilteredBasecallFrac" value="0.4" label="SNV Max Filtered Basecall Fraction" help="Filter SNV calls when greater than this fraction of basecalls have been removed by a mismatch density filter in either sample."/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
137 <param type="float" name="snvMaxSpanningDeletionFrac" value="0.75" label="SNV Max Spanning Deletion Fraction" help="Filter SNV calls at sites where greater than this fraction of overlapping reads contain deletions which span the SNV call site."/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
138 <param type="integer" name="indelMaxRefRepeat" value="8" label="Indel Max Reference Homopolymer Length" help="Filter Indel calls if they represent an expansion or contraction of a repeated pattern with a repeat count greater than this value in the reference."/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
139 <param type="float" name="indelMaxWindowFilteredBasecallFrac" value="0.3" label="Indel Max Window Filtered Basecall Fraction" help="Filter Indel calls if greater than this fraction of basecalls in a window extending 50 bases to each side of the indel's call positions have been removed by the mismatch density filter."/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
140 <param type="integer" name="indelMaxIntHpolLength" value="14" label="Indel Max Interrupted Homopolymers Length" help="Filter Indel calls if the longest homopolymer which can be found intersecting or adjacent to the called indel when a single non-homopolymer base is allowed is greater than this length."/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
141 <param type="float" name="ssnvPrior" value="0.000001" label="SNV Prior Probability"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
142 <param type="float" name="sindelPrior" value="0.000001" label="Indel Prior Probability"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
143 <param type="float" name="ssnvNoise" value="0.0000005" label="SNV Noise Probability"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
144 <param type="float" name="sindelNoise" value="0.000001" label="Indel Noise Probability"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
145 <param type="float" name="ssnvNoiseStrandBiasFrac" value="0.5" label="SNV Noise Fraction Attributed to Strand Bias"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
146 <param type="integer" name="minTier1Mapq" value="20" label="Min Tier1 Mapping Quality"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
147 <param type="integer" name="minTier2Mapq" value="5" label="Min Tier2 Mapping Quality"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
148 <param type="integer" name="ssnvQuality_LowerBound" value="15" label="SNV Quality Score Lower Bound"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
149 <param type="integer" name="sindelQuality_LowerBound" value="30" label="Indel Quality Score Lower Bound"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
150 </section>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
151 </inputs>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
152 <outputs>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
153 <data format="vcf" name="snvs" label="Strelka SNVs"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
154 <data format="vcf" name="indels" label="Strelka indels"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
155 </outputs>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
156 <tests>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
157 <test>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
158 <param name="normal" value="test.normal.bam"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
159 <param name="tumour" value="test.tumour.bam"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
160 <param name="reference_source" value="history"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
161 <param name="ref_file" value="test.fa"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
162 <output name="snvs" ftype="vcf" file="somatic.all.somatic.snvs.vcf" lines_diff="2"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
163 <output name="indels" ftype="vcf" file="somatic.all.somatic.indels.vcf" lines_diff="2"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
164 </test>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
165 </tests>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
166 <help>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
167
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
168 This tool generates VCF files by calling Strelka, a Somatic Nucleotide Variant Caller, on Tumour Normal Pairs.
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
169
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
170 </help>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
171 <citations>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
172 <expand macro="morinlab_citation"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
173 <expand macro="galaxy_citation"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
174 <expand macro="strelka_citation"/>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
175 </citations>
88141dfd5db1 Uploaded
morinlab
parents:
diff changeset
176 </tool>