annotate freebayes.xml @ 0:5af352c58c24 draft default tip

Uploaded
author dave
date Wed, 02 Oct 2019 09:26:15 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
5af352c58c24 Uploaded
dave
parents:
diff changeset
1 <tool id="freebayes" name="FreeBayes" version="@DEPENDENCY_VERSION@">
5af352c58c24 Uploaded
dave
parents:
diff changeset
2 <description>bayesian genetic variant detector</description>
5af352c58c24 Uploaded
dave
parents:
diff changeset
3 <macros>
5af352c58c24 Uploaded
dave
parents:
diff changeset
4 <import>macros.xml</import>
5af352c58c24 Uploaded
dave
parents:
diff changeset
5 </macros>
5af352c58c24 Uploaded
dave
parents:
diff changeset
6 <expand macro="requirements">
5af352c58c24 Uploaded
dave
parents:
diff changeset
7 <requirement type="package" version="4.1.3">gawk</requirement>
5af352c58c24 Uploaded
dave
parents:
diff changeset
8 <requirement type="package" version="20170422">parallel</requirement>
5af352c58c24 Uploaded
dave
parents:
diff changeset
9 </expand>
5af352c58c24 Uploaded
dave
parents:
diff changeset
10 <command detect_errors="exit_code"><![CDATA[
5af352c58c24 Uploaded
dave
parents:
diff changeset
11 ##set up input files
5af352c58c24 Uploaded
dave
parents:
diff changeset
12
5af352c58c24 Uploaded
dave
parents:
diff changeset
13 #set $reference_fasta_filename = "localref.fa"
5af352c58c24 Uploaded
dave
parents:
diff changeset
14
5af352c58c24 Uploaded
dave
parents:
diff changeset
15 #if str( $reference_source.reference_source_selector ) == "history":
5af352c58c24 Uploaded
dave
parents:
diff changeset
16 ln -s -f '${reference_source.ref_file}' '${reference_fasta_filename}' &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
17 samtools faidx '${reference_fasta_filename}' 2>&1 || echo "Error running samtools faidx for FreeBayes" >&2 &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
18 #else:
5af352c58c24 Uploaded
dave
parents:
diff changeset
19 #set $reference_fasta_filename = str( $reference_source.ref_file.fields.path )
5af352c58c24 Uploaded
dave
parents:
diff changeset
20 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
21
5af352c58c24 Uploaded
dave
parents:
diff changeset
22 #if $reference_source.batchmode.processmode == 'merge':
5af352c58c24 Uploaded
dave
parents:
diff changeset
23 #set $input_bamfiles = $reference_source.batchmode.input_bams
5af352c58c24 Uploaded
dave
parents:
diff changeset
24 #else:
5af352c58c24 Uploaded
dave
parents:
diff changeset
25 #set $input_bamfiles = [ $reference_source.batchmode.input_bams ]
5af352c58c24 Uploaded
dave
parents:
diff changeset
26 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
27
5af352c58c24 Uploaded
dave
parents:
diff changeset
28 #for $bam_count, $input_bam in enumerate( $input_bamfiles ):
5af352c58c24 Uploaded
dave
parents:
diff changeset
29 ln -s -f '${input_bam}' 'b_${bam_count}.bam' &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
30 ln -s -f '${input_bam.metadata.bam_index}' 'b_${bam_count}.bam.bai' &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
31 #end for
5af352c58c24 Uploaded
dave
parents:
diff changeset
32
5af352c58c24 Uploaded
dave
parents:
diff changeset
33 ## Tabixize optional input_variant_vcf file (for --variant-input option)
5af352c58c24 Uploaded
dave
parents:
diff changeset
34 #if ( str( $options_type.options_type_selector ) == 'cline' or str( $options_type.options_type_selector ) == 'full' ) and str( $options_type.optional_inputs.optional_inputs_selector ) == 'set' and str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf":
5af352c58c24 Uploaded
dave
parents:
diff changeset
35 ln -s -f '${options_type.optional_inputs.input_variant_type.input_variant_vcf}' input_variant_vcf.vcf.gz &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
36 ln -s -f '${Tabixized_input}' input_variant_vcf.vcf.gz.tbi &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
37 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
38
5af352c58c24 Uploaded
dave
parents:
diff changeset
39 ##if the user has specified a region or target file, just use that instead of calculating a set of unique regions
5af352c58c24 Uploaded
dave
parents:
diff changeset
40 #if str( $target_limit_type.target_limit_type_selector ) == "limit_by_target_file":
5af352c58c24 Uploaded
dave
parents:
diff changeset
41 ln -s '${target_limit_type.input_target_bed}' regions_all.bed &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
42 #elif str( $target_limit_type.target_limit_type_selector ) == "limit_by_region":
5af352c58c24 Uploaded
dave
parents:
diff changeset
43 printf '${target_limit_type.region_chromosome}\t${target_limit_type.region_start}\t${target_limit_type.region_end}' > regions_all.bed &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
44 #else
5af352c58c24 Uploaded
dave
parents:
diff changeset
45 ##divide up the regions in the bam file for efficient processing
5af352c58c24 Uploaded
dave
parents:
diff changeset
46 #for $bam_count, $input_bam in enumerate( $input_bamfiles ):
5af352c58c24 Uploaded
dave
parents:
diff changeset
47 samtools view -H b_${bam_count}.bam |
5af352c58c24 Uploaded
dave
parents:
diff changeset
48 grep '^@SQ' |
5af352c58c24 Uploaded
dave
parents:
diff changeset
49 cut -f 2- |
5af352c58c24 Uploaded
dave
parents:
diff changeset
50 awk '{ gsub("^SN:","",$1); gsub("^LN:","",$2); print $1"\t0\t"$2; }' >> regions_all.bed &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
51 #end for
5af352c58c24 Uploaded
dave
parents:
diff changeset
52 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
53
5af352c58c24 Uploaded
dave
parents:
diff changeset
54 sort -u regions_all.bed > regions_uniq.bed &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
55 ## split into even small chunks, this has some disatvantages and will not be used for the moment
5af352c58c24 Uploaded
dave
parents:
diff changeset
56 ## bedtools makewindows -b regions_uniq.bed -w 10000000 -s 9990000 > regions.bed &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
57
5af352c58c24 Uploaded
dave
parents:
diff changeset
58 mkdir vcf_output failed_alleles trace &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
59
5af352c58c24 Uploaded
dave
parents:
diff changeset
60 ## Finished setting up inputs
5af352c58c24 Uploaded
dave
parents:
diff changeset
61
5af352c58c24 Uploaded
dave
parents:
diff changeset
62 for i in `cat regions_uniq.bed | awk '{print $1":"$2".."$3}'`;
5af352c58c24 Uploaded
dave
parents:
diff changeset
63 do
5af352c58c24 Uploaded
dave
parents:
diff changeset
64 echo "
5af352c58c24 Uploaded
dave
parents:
diff changeset
65
5af352c58c24 Uploaded
dave
parents:
diff changeset
66 ## COMMAND LINE STARTS HERE
5af352c58c24 Uploaded
dave
parents:
diff changeset
67
5af352c58c24 Uploaded
dave
parents:
diff changeset
68 freebayes
5af352c58c24 Uploaded
dave
parents:
diff changeset
69
5af352c58c24 Uploaded
dave
parents:
diff changeset
70 --region '\$i'
5af352c58c24 Uploaded
dave
parents:
diff changeset
71
5af352c58c24 Uploaded
dave
parents:
diff changeset
72 #for $bam_count, $input_bam in enumerate( $input_bamfiles ):
5af352c58c24 Uploaded
dave
parents:
diff changeset
73 --bam 'b_${bam_count}.bam'
5af352c58c24 Uploaded
dave
parents:
diff changeset
74 #end for
5af352c58c24 Uploaded
dave
parents:
diff changeset
75 --fasta-reference '${reference_fasta_filename}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
76
5af352c58c24 Uploaded
dave
parents:
diff changeset
77 ## Outputs
5af352c58c24 Uploaded
dave
parents:
diff changeset
78 --vcf './vcf_output/part_\$i.vcf'
5af352c58c24 Uploaded
dave
parents:
diff changeset
79
5af352c58c24 Uploaded
dave
parents:
diff changeset
80 ## Coverage
5af352c58c24 Uploaded
dave
parents:
diff changeset
81 #if str($coverage_options.coverage_options_selector) == "set":
5af352c58c24 Uploaded
dave
parents:
diff changeset
82 @COVERAGE@
5af352c58c24 Uploaded
dave
parents:
diff changeset
83 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
84
5af352c58c24 Uploaded
dave
parents:
diff changeset
85 ##advanced options
5af352c58c24 Uploaded
dave
parents:
diff changeset
86 #if str( $options_type.options_type_selector ) == "simple":
5af352c58c24 Uploaded
dave
parents:
diff changeset
87 #pass
5af352c58c24 Uploaded
dave
parents:
diff changeset
88 #elif str( $options_type.options_type_selector ) == "simple_w_filters":
5af352c58c24 Uploaded
dave
parents:
diff changeset
89 --standard-filters
5af352c58c24 Uploaded
dave
parents:
diff changeset
90 #elif str( $options_type.options_type_selector ) == "naive":
5af352c58c24 Uploaded
dave
parents:
diff changeset
91 --haplotype-length 0
5af352c58c24 Uploaded
dave
parents:
diff changeset
92 --min-alternate-count 1
5af352c58c24 Uploaded
dave
parents:
diff changeset
93 --min-alternate-fraction 0.05
5af352c58c24 Uploaded
dave
parents:
diff changeset
94 --pooled-continuous
5af352c58c24 Uploaded
dave
parents:
diff changeset
95 --report-monomorphic
5af352c58c24 Uploaded
dave
parents:
diff changeset
96 #elif str( $options_type.options_type_selector ) == "naive_w_filters":
5af352c58c24 Uploaded
dave
parents:
diff changeset
97 --haplotype-length 0
5af352c58c24 Uploaded
dave
parents:
diff changeset
98 --min-alternate-count 1
5af352c58c24 Uploaded
dave
parents:
diff changeset
99 --min-alternate-fraction 0.05
5af352c58c24 Uploaded
dave
parents:
diff changeset
100 --pooled-continuous
5af352c58c24 Uploaded
dave
parents:
diff changeset
101 --report-monomorphic
5af352c58c24 Uploaded
dave
parents:
diff changeset
102 --standard-filters
5af352c58c24 Uploaded
dave
parents:
diff changeset
103 #elif str( $options_type.options_type_selector ) == "full":
5af352c58c24 Uploaded
dave
parents:
diff changeset
104 #if str( $options_type.optional_inputs.optional_inputs_selector ) == 'set':
5af352c58c24 Uploaded
dave
parents:
diff changeset
105 ${options_type.optional_inputs.report_monomorphic}
5af352c58c24 Uploaded
dave
parents:
diff changeset
106
5af352c58c24 Uploaded
dave
parents:
diff changeset
107 #if $options_type.optional_inputs.output_trace_option:
5af352c58c24 Uploaded
dave
parents:
diff changeset
108 --trace ./trace/part_'\$i'.txt
5af352c58c24 Uploaded
dave
parents:
diff changeset
109 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
110 #if $options_type.optional_inputs.output_failed_alleles_option:
5af352c58c24 Uploaded
dave
parents:
diff changeset
111 --failed-alleles ./failed_alleles/part_'\$i'.bed
5af352c58c24 Uploaded
dave
parents:
diff changeset
112 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
113 #if $options_type.optional_inputs.samples:
5af352c58c24 Uploaded
dave
parents:
diff changeset
114 --samples '${options_type.optional_inputs.samples}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
115 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
116 #if $options_type.optional_inputs.populations:
5af352c58c24 Uploaded
dave
parents:
diff changeset
117 --populations '${options_type.optional_inputs.populations}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
118 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
119 #if $options_type.optional_inputs.A:
5af352c58c24 Uploaded
dave
parents:
diff changeset
120 --cnv-map '${options_type.optional_inputs.A}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
121 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
122 #if str( $options_type.optional_inputs.input_variant_type.input_variant_type_selector ) == "provide_vcf":
5af352c58c24 Uploaded
dave
parents:
diff changeset
123 --variant-input 'input_variant_vcf.vcf.gz' ## input_variant_vcf.vcf.gz is symlinked to a galaxy-generated dataset in "Tabixize optional input_variant_vcf file" section of the command line above
5af352c58c24 Uploaded
dave
parents:
diff changeset
124 ${options_type.optional_inputs.input_variant_type.only_use_input_alleles}
5af352c58c24 Uploaded
dave
parents:
diff changeset
125 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
126 #if $options_type.optional_inputs.haplotype_basis_alleles:
5af352c58c24 Uploaded
dave
parents:
diff changeset
127 --haplotype-basis-alleles '${options_type.optional_inputs.haplotype_basis_alleles}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
128 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
129 #if $options_type.optional_inputs.observation_bias:
5af352c58c24 Uploaded
dave
parents:
diff changeset
130 --observation-bias '${options_type.optional_inputs.observation_bias}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
131 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
132 #if $options_type.optional_inputs.contamination_estimates:
5af352c58c24 Uploaded
dave
parents:
diff changeset
133 --contamination-estimates '${options_type.optional_inputs.contamination_estimates}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
134 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
135 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
136
5af352c58c24 Uploaded
dave
parents:
diff changeset
137 ## REPORTING
5af352c58c24 Uploaded
dave
parents:
diff changeset
138 #if str( $options_type.reporting.reporting_selector ) == "set":
5af352c58c24 Uploaded
dave
parents:
diff changeset
139 --pvar ${options_type.reporting.pvar}
5af352c58c24 Uploaded
dave
parents:
diff changeset
140 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
141 ## POPULATION MODEL
5af352c58c24 Uploaded
dave
parents:
diff changeset
142 #if str( $options_type.population_model.population_model_selector ) == "set":
5af352c58c24 Uploaded
dave
parents:
diff changeset
143 --theta ${options_type.population_model.T}
5af352c58c24 Uploaded
dave
parents:
diff changeset
144 --ploidy ${options_type.population_model.P}
5af352c58c24 Uploaded
dave
parents:
diff changeset
145 ${options_type.population_model.J}
5af352c58c24 Uploaded
dave
parents:
diff changeset
146 ${options_type.population_model.K}
5af352c58c24 Uploaded
dave
parents:
diff changeset
147 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
148
5af352c58c24 Uploaded
dave
parents:
diff changeset
149 ## REFERENCE ALLELE
5af352c58c24 Uploaded
dave
parents:
diff changeset
150 #if str( $options_type.reference_allele.reference_allele_selector ) == "set":
5af352c58c24 Uploaded
dave
parents:
diff changeset
151 ${options_type.reference_allele.Z}
5af352c58c24 Uploaded
dave
parents:
diff changeset
152 --reference-quality '${options_type.reference_allele.reference_quality}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
153 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
154
5af352c58c24 Uploaded
dave
parents:
diff changeset
155 ## ALLELE SCOPE
5af352c58c24 Uploaded
dave
parents:
diff changeset
156 #if str( $options_type.allele_scope.allele_scope_selector ) == "set":
5af352c58c24 Uploaded
dave
parents:
diff changeset
157 ${options_type.allele_scope.I}
5af352c58c24 Uploaded
dave
parents:
diff changeset
158 ${options_type.allele_scope.i}
5af352c58c24 Uploaded
dave
parents:
diff changeset
159 ${options_type.allele_scope.X}
5af352c58c24 Uploaded
dave
parents:
diff changeset
160 ${options_type.allele_scope.u}
5af352c58c24 Uploaded
dave
parents:
diff changeset
161 ${options_type.allele_scope.no_partial_observations}
5af352c58c24 Uploaded
dave
parents:
diff changeset
162
5af352c58c24 Uploaded
dave
parents:
diff changeset
163 -n ${options_type.allele_scope.n}
5af352c58c24 Uploaded
dave
parents:
diff changeset
164
5af352c58c24 Uploaded
dave
parents:
diff changeset
165 --haplotype-length ${options_type.allele_scope.haplotype_length}
5af352c58c24 Uploaded
dave
parents:
diff changeset
166 --min-repeat-size ${options_type.allele_scope.min_repeat_length}
5af352c58c24 Uploaded
dave
parents:
diff changeset
167 --min-repeat-entropy ${options_type.allele_scope.min_repeat_entropy}
5af352c58c24 Uploaded
dave
parents:
diff changeset
168 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
169
5af352c58c24 Uploaded
dave
parents:
diff changeset
170 ## REALIGNMENT
5af352c58c24 Uploaded
dave
parents:
diff changeset
171 ${options_type.O}
5af352c58c24 Uploaded
dave
parents:
diff changeset
172
5af352c58c24 Uploaded
dave
parents:
diff changeset
173 ##INPUT FILTERS
5af352c58c24 Uploaded
dave
parents:
diff changeset
174 #if str( $options_type.input_filters.input_filters_selector ) == "set":
5af352c58c24 Uploaded
dave
parents:
diff changeset
175 ${options_type.input_filters.use_duplicate_reads}
5af352c58c24 Uploaded
dave
parents:
diff changeset
176 -m ${options_type.input_filters.m}
5af352c58c24 Uploaded
dave
parents:
diff changeset
177 -q ${options_type.input_filters.q}
5af352c58c24 Uploaded
dave
parents:
diff changeset
178 -R ${options_type.input_filters.R}
5af352c58c24 Uploaded
dave
parents:
diff changeset
179 -Y ${options_type.input_filters.Y}
5af352c58c24 Uploaded
dave
parents:
diff changeset
180 -e ${options_type.input_filters.e}
5af352c58c24 Uploaded
dave
parents:
diff changeset
181 -F ${options_type.input_filters.F}
5af352c58c24 Uploaded
dave
parents:
diff changeset
182 -C ${options_type.input_filters.C}
5af352c58c24 Uploaded
dave
parents:
diff changeset
183 -G ${options_type.input_filters.G}
5af352c58c24 Uploaded
dave
parents:
diff changeset
184
5af352c58c24 Uploaded
dave
parents:
diff changeset
185 #if str( $options_type.input_filters.mismatch_filters.mismatch_filters_selector ) == "set":
5af352c58c24 Uploaded
dave
parents:
diff changeset
186 -Q ${options_type.input_filters.mismatch_filters.Q}
5af352c58c24 Uploaded
dave
parents:
diff changeset
187 #if str($options_type.input_filters.mismatch_filters.U)
5af352c58c24 Uploaded
dave
parents:
diff changeset
188 -U ${options_type.input_filters.mismatch_filters.U}
5af352c58c24 Uploaded
dave
parents:
diff changeset
189 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
190 -z ${options_type.input_filters.mismatch_filters.z}
5af352c58c24 Uploaded
dave
parents:
diff changeset
191
5af352c58c24 Uploaded
dave
parents:
diff changeset
192 --read-snp-limit ${options_type.input_filters.mismatch_filters.read_snp_limit}
5af352c58c24 Uploaded
dave
parents:
diff changeset
193 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
194
5af352c58c24 Uploaded
dave
parents:
diff changeset
195 --min-coverage ${options_type.input_filters.min_coverage}
5af352c58c24 Uploaded
dave
parents:
diff changeset
196 --min-alternate-qsum ${options_type.input_filters.min_alternate_qsum}
5af352c58c24 Uploaded
dave
parents:
diff changeset
197 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
198
5af352c58c24 Uploaded
dave
parents:
diff changeset
199 ## POPULATION AND MAPPABILITY PRIORS
5af352c58c24 Uploaded
dave
parents:
diff changeset
200 #if str( $options_type.population_mappability_priors.population_mappability_priors_selector ) == "set":
5af352c58c24 Uploaded
dave
parents:
diff changeset
201 ${options_type.population_mappability_priors.k}
5af352c58c24 Uploaded
dave
parents:
diff changeset
202 ${options_type.population_mappability_priors.w}
5af352c58c24 Uploaded
dave
parents:
diff changeset
203 ${options_type.population_mappability_priors.V}
5af352c58c24 Uploaded
dave
parents:
diff changeset
204 ${options_type.population_mappability_priors.a}
5af352c58c24 Uploaded
dave
parents:
diff changeset
205 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
206
5af352c58c24 Uploaded
dave
parents:
diff changeset
207 ## GENOTYPE LIKELIHOODS
5af352c58c24 Uploaded
dave
parents:
diff changeset
208 #if str( $options_type.genotype_likelihoods.genotype_likelihoods_selector ) == "set":
5af352c58c24 Uploaded
dave
parents:
diff changeset
209 ${$options_type.genotype_likelihoods.experimental_gls}
5af352c58c24 Uploaded
dave
parents:
diff changeset
210
5af352c58c24 Uploaded
dave
parents:
diff changeset
211 --base-quality-cap ${$options_type.genotype_likelihoods.base_quality_cap}
5af352c58c24 Uploaded
dave
parents:
diff changeset
212 --prob-contamination ${$options_type.genotype_likelihoods.prob_contamination}
5af352c58c24 Uploaded
dave
parents:
diff changeset
213 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
214
5af352c58c24 Uploaded
dave
parents:
diff changeset
215 ## ALGORITHMIC FEATURES
5af352c58c24 Uploaded
dave
parents:
diff changeset
216 #if str( $options_type.algorithmic_features.algorithmic_features_selector ) == "set":
5af352c58c24 Uploaded
dave
parents:
diff changeset
217 -B '${options_type.algorithmic_features.B}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
218 -W '${options_type.algorithmic_features.W}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
219 -D '${options_type.algorithmic_features.D}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
220
5af352c58c24 Uploaded
dave
parents:
diff changeset
221 #if str($options_type.algorithmic_features.genotype_variant_threshold)
5af352c58c24 Uploaded
dave
parents:
diff changeset
222 -S ${options_type.algorithmic_features.genotype_variant_threshold}
5af352c58c24 Uploaded
dave
parents:
diff changeset
223 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
224
5af352c58c24 Uploaded
dave
parents:
diff changeset
225 ${options_type.algorithmic_features.N}
5af352c58c24 Uploaded
dave
parents:
diff changeset
226 ${options_type.algorithmic_features.j}
5af352c58c24 Uploaded
dave
parents:
diff changeset
227 ${options_type.algorithmic_features.H}
5af352c58c24 Uploaded
dave
parents:
diff changeset
228 ${options_type.algorithmic_features.genotype_qualities}
5af352c58c24 Uploaded
dave
parents:
diff changeset
229 ${options_type.algorithmic_features.report_genotype_likelihood_max}
5af352c58c24 Uploaded
dave
parents:
diff changeset
230
5af352c58c24 Uploaded
dave
parents:
diff changeset
231 --genotyping-max-banddepth ${options_type.algorithmic_features.genotyping_max_banddepth}
5af352c58c24 Uploaded
dave
parents:
diff changeset
232 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
233 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
234
5af352c58c24 Uploaded
dave
parents:
diff changeset
235 ";
5af352c58c24 Uploaded
dave
parents:
diff changeset
236 done > freebayes_commands.sh &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
237
5af352c58c24 Uploaded
dave
parents:
diff changeset
238 cat freebayes_commands.sh |
5af352c58c24 Uploaded
dave
parents:
diff changeset
239 parallel --will-cite -j \${GALAXY_SLOTS:-1} &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
240
5af352c58c24 Uploaded
dave
parents:
diff changeset
241 ## make VCF header
5af352c58c24 Uploaded
dave
parents:
diff changeset
242 grep "^#" "./vcf_output/part_\$i.vcf" > header.txt &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
243
5af352c58c24 Uploaded
dave
parents:
diff changeset
244 for i in `cat regions_uniq.bed | awk '{print $1":"$2".."$3}'`;
5af352c58c24 Uploaded
dave
parents:
diff changeset
245 do
5af352c58c24 Uploaded
dave
parents:
diff changeset
246 ## if this fails then it bails out the script
5af352c58c24 Uploaded
dave
parents:
diff changeset
247 cat "./vcf_output/part_\$i.vcf" | grep -v "^#" || true
5af352c58c24 Uploaded
dave
parents:
diff changeset
248 ;
5af352c58c24 Uploaded
dave
parents:
diff changeset
249 done | sort -k1,1 -k2,2n -k5,5 -u | cat header.txt - > '${output_vcf}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
250
5af352c58c24 Uploaded
dave
parents:
diff changeset
251 #if str( $options_type.options_type_selector ) == "full":
5af352c58c24 Uploaded
dave
parents:
diff changeset
252 #if str( $options_type.optional_inputs.optional_inputs_selector ) == 'set':
5af352c58c24 Uploaded
dave
parents:
diff changeset
253 #if $options_type.optional_inputs.output_failed_alleles_option:
5af352c58c24 Uploaded
dave
parents:
diff changeset
254 &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
255 for i in `cat regions.bed | awk '{print $1":"$2".."$3}'`;
5af352c58c24 Uploaded
dave
parents:
diff changeset
256 do
5af352c58c24 Uploaded
dave
parents:
diff changeset
257 cat "./failed_alleles/part_\$i.bed"
5af352c58c24 Uploaded
dave
parents:
diff changeset
258 ;
5af352c58c24 Uploaded
dave
parents:
diff changeset
259 done > '${output_failed_alleles_bed}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
260 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
261
5af352c58c24 Uploaded
dave
parents:
diff changeset
262 #if $options_type.optional_inputs.output_trace_option:
5af352c58c24 Uploaded
dave
parents:
diff changeset
263 &&
5af352c58c24 Uploaded
dave
parents:
diff changeset
264 for i in `cat regions.bed | awk '{print $1":"$2".."$3}'`;
5af352c58c24 Uploaded
dave
parents:
diff changeset
265 do
5af352c58c24 Uploaded
dave
parents:
diff changeset
266 cat './trace/part_\$i.txt'
5af352c58c24 Uploaded
dave
parents:
diff changeset
267 ;
5af352c58c24 Uploaded
dave
parents:
diff changeset
268 done > '${output_trace}'
5af352c58c24 Uploaded
dave
parents:
diff changeset
269 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
270 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
271 #end if
5af352c58c24 Uploaded
dave
parents:
diff changeset
272 ]]></command>
5af352c58c24 Uploaded
dave
parents:
diff changeset
273
5af352c58c24 Uploaded
dave
parents:
diff changeset
274 <inputs>
5af352c58c24 Uploaded
dave
parents:
diff changeset
275 <conditional name="reference_source">
5af352c58c24 Uploaded
dave
parents:
diff changeset
276 <param name="reference_source_selector" type="select" label="Choose the source for the reference genome">
5af352c58c24 Uploaded
dave
parents:
diff changeset
277 <option value="cached">Locally cached</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
278 <option value="history">History</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
279 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
280 <when value="cached">
5af352c58c24 Uploaded
dave
parents:
diff changeset
281 <expand macro="input_bam">
5af352c58c24 Uploaded
dave
parents:
diff changeset
282 <expand macro="validation" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
283 </expand>
5af352c58c24 Uploaded
dave
parents:
diff changeset
284 <param name="ref_file" type="select" label="Using reference genome">
5af352c58c24 Uploaded
dave
parents:
diff changeset
285 <options from_data_table="fasta_indexes" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
286 <validator type="no_options" message="A built-in reference genome is not available for the build associated with the selected input dataset"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
287 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
288 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
289 <when value="history"> <!-- FIX ME!!!! -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
290 <expand macro="input_bam" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
291 <param name="ref_file" type="data" format="fasta" label="Use the following dataset as the reference sequence"
5af352c58c24 Uploaded
dave
parents:
diff changeset
292 help="You can upload a FASTA sequence to the history and use it as reference" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
293 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
294 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
295 <conditional name="target_limit_type">
5af352c58c24 Uploaded
dave
parents:
diff changeset
296 <param name="target_limit_type_selector" type="select" label="Limit variant calling to a set of regions?" help="Sets --targets or --region options">
5af352c58c24 Uploaded
dave
parents:
diff changeset
297 <option value="do_not_limit" selected="true">Do not limit</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
298 <option value="limit_by_target_file">Limit by target file</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
299 <option value="limit_by_region">Limit to region</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
300 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
301 <when value="do_not_limit" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
302 <when value="limit_by_target_file">
5af352c58c24 Uploaded
dave
parents:
diff changeset
303 <param name="input_target_bed" argument="--targets" type="data" format="bed" label="Limit analysis to regions in this BED dataset" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
304 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
305 <when value="limit_by_region">
5af352c58c24 Uploaded
dave
parents:
diff changeset
306 <param name="region_chromosome" argument="--region" type="text" label="Region Chromosome" value="" /> <!--only once? -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
307 <param name="region_start" type="integer" label="Region Start" value="" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
308 <param name="region_end" type="integer" label="Region End" value="" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
309 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
310 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
311 <conditional name="coverage_options">
5af352c58c24 Uploaded
dave
parents:
diff changeset
312 <param name="coverage_options_selector" type="select" label="Read coverage"
5af352c58c24 Uploaded
dave
parents:
diff changeset
313 help="Sets --min-coverage, --limit-coverage, and --skip-coverage">
5af352c58c24 Uploaded
dave
parents:
diff changeset
314 <option value="do_not_set" selected="true">Use defaults</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
315 <option value="set">Specify coverage options</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
316 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
317 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
318 <expand macro="par_min_cov" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
319 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
320 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
321 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
322 <conditional name="options_type">
5af352c58c24 Uploaded
dave
parents:
diff changeset
323 <param name="options_type_selector" type="select" label="Choose parameter selection level"
5af352c58c24 Uploaded
dave
parents:
diff changeset
324 help="Select how much control over the freebayes run you need">
5af352c58c24 Uploaded
dave
parents:
diff changeset
325 <option value="simple" selected="true">1. Simple diploid calling</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
326 <option value="simple_w_filters">2. Simple diploid calling with filtering and coverage</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
327 <option value="naive">3. Frequency-based pooled calling</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
328 <option value="naive_w_filters">4. Frequency-based pooled calling with filtering and coverage</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
329 <option value="full">5. Full list of options</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
330 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
331 <when value="full">
5af352c58c24 Uploaded
dave
parents:
diff changeset
332
5af352c58c24 Uploaded
dave
parents:
diff changeset
333 <conditional name="optional_inputs">
5af352c58c24 Uploaded
dave
parents:
diff changeset
334 <param name="optional_inputs_selector" type="select" label="Additional inputs"
5af352c58c24 Uploaded
dave
parents:
diff changeset
335 help="Sets --samples, --populations, --cnv-map, --trace, --failed-alleles, --variant-input, --only-use-input-alleles, --haplotype-basis-alleles, --report-all-haplotype-alleles, --report-monomorphic options, --observation-bias, and --contamination-estimates">
5af352c58c24 Uploaded
dave
parents:
diff changeset
336 <option value="do_not_set" selected="true">Do not provide additional inputs</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
337 <option value="set">Provide additional inputs</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
338 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
339 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
340 <param name="output_failed_alleles_option" argument="--failed-alleles" type="boolean" truevalue="--failed-alleles" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
341 label="Write out failed alleles file" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
342 <param name="output_trace_option" argument="--trace" type="boolean" truevalue="--trace" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
343 label="Write out algorithm trace file" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
344 <param argument="--samples" type="data" format="txt"
5af352c58c24 Uploaded
dave
parents:
diff changeset
345 label="Limit analysis to samples listed (one per line) in this dataset" optional="true"
5af352c58c24 Uploaded
dave
parents:
diff changeset
346 help="By default FreeBayes will analyze all samples in its input BAM datasets" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
347 <param argument="--populations" type="data" format="txt" optional="true"
5af352c58c24 Uploaded
dave
parents:
diff changeset
348 label="Populations dataset"
5af352c58c24 Uploaded
dave
parents:
diff changeset
349 help="Each line of this dataset should list a sample and a population which it is part of. The population-based bayesian inference model will then be partitioned on the basis of the populations" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
350 <param name="A" argument="--cnv-map" type="data" format="bed" optional="true"
5af352c58c24 Uploaded
dave
parents:
diff changeset
351 label="Read a copy number map from a BED dataset"
5af352c58c24 Uploaded
dave
parents:
diff changeset
352 help="The BED dataset should have the format: 'reference sequence, start, end, sample name, copy number' for each region in each sample which does not have the default copy number as set by --ploidy. If not specified, copy number is set to as specified by --ploidy" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
353 <conditional name="input_variant_type">
5af352c58c24 Uploaded
dave
parents:
diff changeset
354 <param name="input_variant_type_selector" type="select" label="Provide variants dataset">
5af352c58c24 Uploaded
dave
parents:
diff changeset
355 <option value="do_not_provide" selected="true">Do not provide</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
356 <option value="provide_vcf">Provide VCF dataset</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
357 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
358 <when value="do_not_provide" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
359 <when value="provide_vcf">
5af352c58c24 Uploaded
dave
parents:
diff changeset
360 <param name="input_variant_vcf" argument="--variant-input" type="data" format="vcf_bgzip"
5af352c58c24 Uploaded
dave
parents:
diff changeset
361 label="Use variants reported in this VCF dataset as input to the algorithm">
5af352c58c24 Uploaded
dave
parents:
diff changeset
362 <conversion name="Tabixized_input" type="tabix" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
363 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
364 <param name="only_use_input_alleles" argument="--only-use-input-alleles" type="boolean" truevalue="--only-use-input-alleles" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
365 label="Only provide variant calls and genotype likelihoods for sites in VCF" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
366 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
367 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
368 <param name="haplotype_basis_alleles" argument="--haplotype-basis-alleles" type="data" format="vcf" optional="true"
5af352c58c24 Uploaded
dave
parents:
diff changeset
369 label="Only use variant alleles provided in this input VCF for the construction of complex or haplotype alleles" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
370 <param name="report_monomorphic" argument="--report-monomorphic" type="boolean" truevalue="--report-monomorphic" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
371 label="Report even loci which appear to be monomorphic, and report all considered alleles, even those which are not in called genotypes" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
372 <param name="observation_bias" argument="--observation-bias" type="data" format="tabular" optional="true"
5af352c58c24 Uploaded
dave
parents:
diff changeset
373 label="Load read length-dependent allele observation biases from"
5af352c58c24 Uploaded
dave
parents:
diff changeset
374 help="The format is [length] [alignment efficiency relative to reference] where the efficiency is 1 if there is no relative observation bias" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
375 <param name="contamination_estimates" argument="--contamination-estimates" type="data" format="tabular" optional="true"
5af352c58c24 Uploaded
dave
parents:
diff changeset
376 label="Upload per-sample estimates of contamination from"
5af352c58c24 Uploaded
dave
parents:
diff changeset
377 help="The format should be: sample p(read=R|genotype=AR) p(read=A|genotype=AA) Sample '*' can be used to set default contamination estimates" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
378 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
379 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
380 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
381
5af352c58c24 Uploaded
dave
parents:
diff changeset
382 <!-- reporting -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
383 <conditional name="reporting">
5af352c58c24 Uploaded
dave
parents:
diff changeset
384 <param name="reporting_selector" type="select" label="Reporting options" help="Sets -P --pvar option">
5af352c58c24 Uploaded
dave
parents:
diff changeset
385 <option value="do_not_set" selected="true">Use defaults</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
386 <option value="set">Set reporting options</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
387 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
388 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
389 <param argument="--pvar" type="float" value="0.0"
5af352c58c24 Uploaded
dave
parents:
diff changeset
390 label="Report sites if the probability that there is a polymorphism at the site is greater than"
5af352c58c24 Uploaded
dave
parents:
diff changeset
391 help="Note that post-filtering is generally recommended over the use of this parameter" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
392 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
393 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
394 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
395
5af352c58c24 Uploaded
dave
parents:
diff changeset
396 <!-- population model -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
397 <conditional name="population_model">
5af352c58c24 Uploaded
dave
parents:
diff changeset
398 <param name="population_model_selector" type="select" label="Population model options"
5af352c58c24 Uploaded
dave
parents:
diff changeset
399 help="Sets --theta, --ploidy, --pooled-discrete, and --pooled-continuous options">
5af352c58c24 Uploaded
dave
parents:
diff changeset
400 <option value="do_not_set" selected="true">Use defaults</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
401 <option value="set">Set population model options</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
402 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
403 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
404 <param name="T" argument="--theta" type="float" value="0.001"
5af352c58c24 Uploaded
dave
parents:
diff changeset
405 label="The expected mutation rate or pairwise nucleotide diversity among the population under analysis"
5af352c58c24 Uploaded
dave
parents:
diff changeset
406 help="This serves as the single parameter to the Ewens Sampling Formula prior model" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
407 <param name="P" argument="--ploidy" type="integer" value="2"
5af352c58c24 Uploaded
dave
parents:
diff changeset
408 label="Set ploidy for the analysis" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
409 <param name="J" argument="--pooled-discrete" type="boolean" truevalue="-J" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
410 label="Assume that samples result from pooled sequencing"
5af352c58c24 Uploaded
dave
parents:
diff changeset
411 help="Model pooled samples using discrete genotypes across pools. When using this flag, set --ploidy to the number of alleles in each sample or use the --cnv-map to define per-sample ploidy" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
412 <param name="K" argument="--poled-continuous" type="boolean" truevalue="-K" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
413 label="Output all alleles which pass input filters, regardles of genotyping outcome or model" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
414 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
415 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
416 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
417
5af352c58c24 Uploaded
dave
parents:
diff changeset
418 <!-- reference allele -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
419 <conditional name="reference_allele">
5af352c58c24 Uploaded
dave
parents:
diff changeset
420 <param name="reference_allele_selector" type="select" label="Reference allele options"
5af352c58c24 Uploaded
dave
parents:
diff changeset
421 help="Sets --use-reference-allele and --reference-quality options">
5af352c58c24 Uploaded
dave
parents:
diff changeset
422 <option value="do_not_set" selected="true">Use defaults</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
423 <option value="set">Set reference allele options</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
424 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
425 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
426 <param name="Z" argument="--use-reference-allele" type="boolean" truevalue="-Z" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
427 label="Include the reference allele in the analysis as if it is another sample from the same population" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
428 <param name="reference_quality" argument="--reference-quality" type="text" value="100,60"
5af352c58c24 Uploaded
dave
parents:
diff changeset
429 label="Assign mapping quality of MQ (100) to the reference allele at each site and base quality of BQ (60)" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
430 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
431 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
432 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
433
5af352c58c24 Uploaded
dave
parents:
diff changeset
434 <!-- allelic scope -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
435 <conditional name="allele_scope">
5af352c58c24 Uploaded
dave
parents:
diff changeset
436 <param name="allele_scope_selector" type="select" label="Allelic scope options"
5af352c58c24 Uploaded
dave
parents:
diff changeset
437 help="Sets -I, i, -X, -u, -n, --haplotype-length, --min-repeat-size, --min-repeat-entropy, and --no-partial-observations options">
5af352c58c24 Uploaded
dave
parents:
diff changeset
438 <option value="do_not_set" selected="true">Use defaults</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
439 <option value="set">Set alleic scope options</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
440 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
441 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
442 <param name="I" argument="--no-snps" type="boolean" truevalue="-I" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
443 label="Ignore SNP alleles" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
444 <param name="i" argument="--no-indels" type="boolean" truevalue="-i" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
445 label="Ignore indels alleles" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
446 <param name="X" argument="--no-mnps" type="boolean" truevalue="-X" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
447 label="Ignore multi-nucleotide polymorphisms, MNPs" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
448 <param name="u" argument="--no-complex" type="boolean" truevalue="-u" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
449 label="Ignore complex events (composites of other classes)" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
450 <param name="n" argument="--use-best-n-alleles" type="integer" value="0"
5af352c58c24 Uploaded
dave
parents:
diff changeset
451 label="How many best SNP alleles to evaluate"
5af352c58c24 Uploaded
dave
parents:
diff changeset
452 help="Alleles are ranked by the sum of supporting quality scores. Set to 0 to evaluate all" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
453 <param name="haplotype_length" argument="--haplotype-length" type="integer" value="3"
5af352c58c24 Uploaded
dave
parents:
diff changeset
454 label="Allow haplotype calls with contiguous embedded matches of up to (nucleotides)" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
455 <param name="min_repeat_length" argument="--min-repeat-size" type="integer" value="5"
5af352c58c24 Uploaded
dave
parents:
diff changeset
456 label="When assembling observations across repeats, require the total repeat length at least this many bp" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
457 <param name="min_repeat_entropy" argument="--min-repeat-entropy" type="integer" value="1"
5af352c58c24 Uploaded
dave
parents:
diff changeset
458 label="To detect interrupted repeats, build across sequence until it has entropy > (bits per bp)" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
459 <param name="no_partial_observations" argument="--no-partial-observations" type="boolean" truevalue="--no-partial-observations" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
460 label="Exclude observations which do not fully span the dynamically-determined detection window"
5af352c58c24 Uploaded
dave
parents:
diff changeset
461 help="By default, FreeBayes uses all observations, dividing partial support across matching haplotypes when generating haplotypes" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
462 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
463 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
464 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
465
5af352c58c24 Uploaded
dave
parents:
diff changeset
466 <!-- indel realignment -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
467 <param name="O" argument="--dont-left-align-indels" type="boolean" truevalue="-O" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
468 label="Turn off left-alignment of indels" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
469
5af352c58c24 Uploaded
dave
parents:
diff changeset
470 <!-- input filters -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
471 <conditional name="input_filters">
5af352c58c24 Uploaded
dave
parents:
diff changeset
472 <param name="input_filters_selector" type="select" label="Input filters"
5af352c58c24 Uploaded
dave
parents:
diff changeset
473 help="Sets -4, -m, -q, -R, -Y, -Q, -U, -z, -&#36;, -e, -0, -F, -C, -3, -G, and -&#33; options">
5af352c58c24 Uploaded
dave
parents:
diff changeset
474 <option value="do_not_set" selected="true">No input filters (default)</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
475 <option value="set">Set input filters</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
476 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
477 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
478 <param name="use_duplicate_reads" argument="--use-duplicate-reads" type="boolean" truevalue="--use-duplicate-reads" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
479 label="Include duplicate-marked alignments in the analysis" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
480 <param name="m" argument="--min-mapping-quality" type="integer" value="1"
5af352c58c24 Uploaded
dave
parents:
diff changeset
481 label="Exclude alignments from analysis if they have a mapping quality less than" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
482 <param name="q" argument="--min-base-quality" type="integer" value="0"
5af352c58c24 Uploaded
dave
parents:
diff changeset
483 label="Exclude alleles from analysis if their supporting base quality less than" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
484 <param name="R" argument="--min-supporting-allele-qsum" type="integer" value="0"
5af352c58c24 Uploaded
dave
parents:
diff changeset
485 label="Consider any allele in which the sum of qualities of supporting observations is at least" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
486 <param name="Y" argument="--min-supporting-mapping-qsum" type="integer" value="0"
5af352c58c24 Uploaded
dave
parents:
diff changeset
487 label="Consider any allele in which and the sum of mapping qualities of supporting reads is at least" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
488 <conditional name="mismatch_filters">
5af352c58c24 Uploaded
dave
parents:
diff changeset
489 <param name="mismatch_filters_selector" type="select" label="Mismatch filters"
5af352c58c24 Uploaded
dave
parents:
diff changeset
490 help="Sets -Q, -U, -z, and &#36; options">
5af352c58c24 Uploaded
dave
parents:
diff changeset
491 <option value="do_not_set" selected="true">No mismatch filters (default)</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
492 <option value="set">Set mismatch filters</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
493 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
494 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
495 <param name="Q" argument="--mismatch-base-quality-threshold" type="integer" value="10"
5af352c58c24 Uploaded
dave
parents:
diff changeset
496 label="Count mismatches toward -U (option below) if the base quality of the mismatch is >=" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
497 <param name="U" type="integer" argument="--read-mismatch-limit" value="1000" optional="true"
5af352c58c24 Uploaded
dave
parents:
diff changeset
498 label="Exclude reads with more than N mismatches where each mismatch has base quality >= mismatch-base-quality-threshold (option above)"
5af352c58c24 Uploaded
dave
parents:
diff changeset
499 help="default=~unbounded" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
500 <param name="z" argument="--read-max-mismatch-fraction" type="float" value="1.0" min="0.0" max="1.0"
5af352c58c24 Uploaded
dave
parents:
diff changeset
501 label="Exclude reads with more than N [0,1] fraction of mismatches where each mismatch has base quality >= mismatch-base-quality-threshold (second option above)" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
502 <param name="read_snp_limit" argument="--read-snp-limit" type="integer" value="1000"
5af352c58c24 Uploaded
dave
parents:
diff changeset
503 label="Exclude reads with more than N base mismatches, ignoring gaps with quality >= mismatch-base-quality-threshold (third option above)"
5af352c58c24 Uploaded
dave
parents:
diff changeset
504 help="default=~unbounded" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
505 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
506 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
507 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
508 <param name="e" argument="--read-indel-limit" type="integer" value="1000"
5af352c58c24 Uploaded
dave
parents:
diff changeset
509 label="Exclude reads with more than this number of separate gaps"
5af352c58c24 Uploaded
dave
parents:
diff changeset
510 help="default=~unbounded" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
511 <param name="standard_filters" argument="--standard-filters" type="boolean" truevalue="-0" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
512 label="Use stringent input base and mapping quality filters"
5af352c58c24 Uploaded
dave
parents:
diff changeset
513 help="Equivalent to -m 30 -q 20 -R 0 -S 0" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
514 <param name="F" argument="--min-alternate-fraction" type="float" value="0.05"
5af352c58c24 Uploaded
dave
parents:
diff changeset
515 label="Require at least this fraction of observations supporting an alternate allele within a single individual in the in order to evaluate the position" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
516 <param name="C" argument="--min-alternate-count" type="integer" value="2"
5af352c58c24 Uploaded
dave
parents:
diff changeset
517 label="Require at least this count of observations supporting an alternate allele within a single individual in order to evaluate the position" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
518 <param name="min_alternate_qsum" argument="--min-alternate-qsum" type="integer" value="0"
5af352c58c24 Uploaded
dave
parents:
diff changeset
519 label="Require at least this sum of quality of observations supporting an alternate allele within a single individual in order to evaluate the position" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
520 <param name="G" argument="--min-alternate-total" type="integer" value="1"
5af352c58c24 Uploaded
dave
parents:
diff changeset
521 label="Require at least this count of observations supporting an alternate allele within the total population in order to use the allele in analysis" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
522 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
523 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
524 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
525
5af352c58c24 Uploaded
dave
parents:
diff changeset
526 <!-- population and mappability priors -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
527 <conditional name="population_mappability_priors">
5af352c58c24 Uploaded
dave
parents:
diff changeset
528 <param name="population_mappability_priors_selector" type="select" label="Population and mappability priors"
5af352c58c24 Uploaded
dave
parents:
diff changeset
529 help="Sets -k, -w, -V, and -a options">
5af352c58c24 Uploaded
dave
parents:
diff changeset
530 <option value="do_not_set" selected="true">Use defaults</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
531 <option value="set">Set population and mappability priors</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
532 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
533 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
534 <param name="k" argument="--no-population-priors" type="boolean" truevalue="-k" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
535 label="No population priors"
5af352c58c24 Uploaded
dave
parents:
diff changeset
536 help="Equivalent to --pooled-discrete --hwe-priors-off and removal of Ewens Sampling Formula component of priors" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
537 <param name="w" argument="--hwe-priors-off" type="boolean" truevalue="-w" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
538 label="Disable estimation of the probability of the combination arising under HWE given the allele frequency as estimated by observation frequency" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
539 <param name="V" argument="--binomial-obs-priors-off" type="boolean" truevalue="-V" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
540 label="Disable incorporation of prior expectations about observations"
5af352c58c24 Uploaded
dave
parents:
diff changeset
541 help="Uses read placement probability, strand balance probability, and read position (5&#39;'-3&#39;') probability" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
542 <param name="a" argument="--allele-balance-priors-off" type="boolean" truevalue="-a" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
543 label="Disable use of aggregate probability of observation balance between alleles as a component of the priors" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
544 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
545 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
546 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
547
5af352c58c24 Uploaded
dave
parents:
diff changeset
548 <!-- genotype likelihoods -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
549 <conditional name="genotype_likelihoods">
5af352c58c24 Uploaded
dave
parents:
diff changeset
550 <param name="genotype_likelihoods_selector" type="select" label="Genotype likelihood options"
5af352c58c24 Uploaded
dave
parents:
diff changeset
551 help="Sets --base-quality-cap, --experimental-gls, and --prob-contamination options">
5af352c58c24 Uploaded
dave
parents:
diff changeset
552 <option value="do_not_set" selected="true">Use defaults</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
553 <option value="set">Set genotype likelihood options</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
554 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
555 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
556 <param name="base_quality_cap" argument="--base-quality-cap" type="integer" value="0"
5af352c58c24 Uploaded
dave
parents:
diff changeset
557 label="Limit estimated observation quality by capping base quality at" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
558 <param name="experimental_gls" argument="--experimental-gls" type="boolean" truevalue="--experimental-gls" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
559 label="Generate genotype likelihoods using 'effective base depth' metric qual = 1-BaseQual * 1-MapQual"
5af352c58c24 Uploaded
dave
parents:
diff changeset
560 help="Incorporate partial observations. This is the default when contamination estimates are provided. Optimized for diploid samples" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
561 <param name="prob_contamination" argument="--prob-contamination" type="float" value="10e-9"
5af352c58c24 Uploaded
dave
parents:
diff changeset
562 label="An estimate of contamination to use for all samples" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
563 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
564 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
565 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
566
5af352c58c24 Uploaded
dave
parents:
diff changeset
567 <!-- algorithmic features -->
5af352c58c24 Uploaded
dave
parents:
diff changeset
568 <conditional name="algorithmic_features">
5af352c58c24 Uploaded
dave
parents:
diff changeset
569 <param name="algorithmic_features_selector" type="select" label="Algorithmic features"
5af352c58c24 Uploaded
dave
parents:
diff changeset
570 help="Sets --report-genotypes-likelihood-max, -B, --genotyping-max-banddepth, -W, -N, S, -j, -H, -D, -= options">
5af352c58c24 Uploaded
dave
parents:
diff changeset
571 <option value="do_not_set" selected="true">Use defaults</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
572 <option value="set">Set algorithmic features</option>
5af352c58c24 Uploaded
dave
parents:
diff changeset
573 </param>
5af352c58c24 Uploaded
dave
parents:
diff changeset
574 <when value="set">
5af352c58c24 Uploaded
dave
parents:
diff changeset
575 <param name="report_genotype_likelihood_max" argument="--report-genotype-likelihood-max" type="boolean" truevalue="--report-genotype-likelihood-max" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
576 label="Report genotypes using the maximum-likelihood estimate provided from genotype likelihoods" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
577 <param name="B" argument="--genotyping-max-iterations" type="integer" value="1000"
5af352c58c24 Uploaded
dave
parents:
diff changeset
578 label="Iterate no more than N times during genotyping step" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
579 <param name="genotyping_max_banddepth" argument="--genotyping-max-banddepth" type="integer" value="6"
5af352c58c24 Uploaded
dave
parents:
diff changeset
580 label="Integrate no deeper than the Nth best genotype by likelihood when genotyping" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
581 <param name="W" argument="--posterior-integration-limits" type="text" value="1,3"
5af352c58c24 Uploaded
dave
parents:
diff changeset
582 label="Integrate all genotype combinations in our posterior space which include no more than N (1) samples with their Mth (3) best data likelihood" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
583 <param name="N" argument="--exclude-unobserved-genotypes" type="boolean" truevalue="--exclude-unobserved-genotypes" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
584 label="Skip sample genotypings for which the sample has no supporting reads" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
585 <param name="genotype_variant_threshold" argument="--genotype-variant-threshold" type="integer" value="" optional="true"
5af352c58c24 Uploaded
dave
parents:
diff changeset
586 label="Limit posterior integration to samples where the second-best genotype likelihood is no more than log(N) from the highest genotype likelihood for the sample"
5af352c58c24 Uploaded
dave
parents:
diff changeset
587 help="default=~unbounded" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
588 <param name="j" argument="--use-mapping-quality" type="boolean" truevalue="-j" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
589 label="Use mapping quality of alleles when calculating data likelihoods" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
590 <param name="H" argument="--harmonic-indel-quality" type="boolean" truevalue="-H" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
591 label="Use a weighted sum of base qualities around an indel, scaled by the distance from the indel"
5af352c58c24 Uploaded
dave
parents:
diff changeset
592 help="By default, FreeBayes uses a minimum Base Quality in flanking sequence" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
593 <param name="D" argument="--read-dependence-factor" type="float" value="0.9"
5af352c58c24 Uploaded
dave
parents:
diff changeset
594 label="Incorporate non-independence of reads by scaling successive observations by this factor during data likelihood calculations" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
595 <param name="genotype_qualities" argument="--genotype-qualities" type="boolean" truevalue="--genotype-qualities" falsevalue="" checked="false"
5af352c58c24 Uploaded
dave
parents:
diff changeset
596 label="Calculate the marginal probability of genotypes and report as GQ in each sample field in the VCF output" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
597 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
598 <when value="do_not_set" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
599 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
600 </when>
5af352c58c24 Uploaded
dave
parents:
diff changeset
601 <when value="simple" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
602 <when value="simple_w_filters" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
603 <when value="naive" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
604 <when value="naive_w_filters" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
605 </conditional>
5af352c58c24 Uploaded
dave
parents:
diff changeset
606 </inputs>
5af352c58c24 Uploaded
dave
parents:
diff changeset
607 <outputs>
5af352c58c24 Uploaded
dave
parents:
diff changeset
608 <data format="vcf" name="output_vcf" label="${tool.name} on ${on_string} (variants)" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
609 <data format="bed" name="output_failed_alleles_bed" label="${tool.name} on ${on_string} (failed alleles)">
5af352c58c24 Uploaded
dave
parents:
diff changeset
610 <filter>( options_type['options_type_selector'] == 'cline' or options_type['options_type_selector'] == 'full' ) and options_type['optional_inputs']['optional_inputs_selector'] == 'set' and options_type['optional_inputs']['output_failed_alleles_option'] is True</filter>
5af352c58c24 Uploaded
dave
parents:
diff changeset
611 </data>
5af352c58c24 Uploaded
dave
parents:
diff changeset
612 <data format="txt" name="output_trace" label="${tool.name} on ${on_string} (trace)">
5af352c58c24 Uploaded
dave
parents:
diff changeset
613 <filter>( options_type['options_type_selector'] == 'cline' or options_type['options_type_selector'] == 'full' ) and options_type['optional_inputs']['optional_inputs_selector'] == 'set' and options_type['optional_inputs']['output_trace_option'] is True</filter>
5af352c58c24 Uploaded
dave
parents:
diff changeset
614 </data>
5af352c58c24 Uploaded
dave
parents:
diff changeset
615 </outputs>
5af352c58c24 Uploaded
dave
parents:
diff changeset
616 <tests>
5af352c58c24 Uploaded
dave
parents:
diff changeset
617 <test>
5af352c58c24 Uploaded
dave
parents:
diff changeset
618 <param name="reference_source_selector" value="history" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
619 <param name="processmode" value="individual" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
620 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
621 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
622 <param name="options_type_selector" value="simple"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
623 <output name="output_vcf" file="freebayes-phix174-test1.vcf" lines_diff="4" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
624 </test>
5af352c58c24 Uploaded
dave
parents:
diff changeset
625 <test>
5af352c58c24 Uploaded
dave
parents:
diff changeset
626 <param name="reference_source_selector" value="history" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
627 <param name="processmode" value="individual" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
628 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
629 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
630 <param name="options_type_selector" value="naive_w_filters"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
631 <param name="min_coverage" value="14"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
632 <output name="output_vcf" file="freebayes-phix174-test2.vcf" lines_diff="4" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
633 </test>
5af352c58c24 Uploaded
dave
parents:
diff changeset
634 <test>
5af352c58c24 Uploaded
dave
parents:
diff changeset
635 <param name="reference_source_selector" value="history" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
636 <param name="processmode" value="individual" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
637 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
638 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
639 <param name="options_type_selector" value="naive_w_filters"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
640 <param name="min_coverage" value="14"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
641 <output name="output_vcf" file="freebayes-phix174-test3.vcf" lines_diff="4" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
642 </test>
5af352c58c24 Uploaded
dave
parents:
diff changeset
643 <test>
5af352c58c24 Uploaded
dave
parents:
diff changeset
644 <param name="reference_source_selector" value="history" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
645 <param name="processmode" value="individual" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
646 <param name="ref_file" ftype="fasta" value="freebayes-phix174.fasta"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
647 <param name="input_bams" ftype="bam" value="freebayes-phix174.bam"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
648 <param name="options_type_selector" value="full"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
649 <param name="population_model_selector" value="set"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
650 <param name="P" value="1"/>
5af352c58c24 Uploaded
dave
parents:
diff changeset
651 <output name="output_vcf" file="freebayes-phix174-test4.vcf" lines_diff="4" />
5af352c58c24 Uploaded
dave
parents:
diff changeset
652 </test>
5af352c58c24 Uploaded
dave
parents:
diff changeset
653 </tests>
5af352c58c24 Uploaded
dave
parents:
diff changeset
654 <help><![CDATA[
5af352c58c24 Uploaded
dave
parents:
diff changeset
655 **What it does**
5af352c58c24 Uploaded
dave
parents:
diff changeset
656
5af352c58c24 Uploaded
dave
parents:
diff changeset
657 FreeBayes is a Bayesian genetic variant detector designed to find small polymorphisms, specifically SNPs (single-nucleotide polymorphisms), indels (insertions and deletions), MNPs (multi-nucleotide polymorphisms), and complex events (composite insertion and substitution events) smaller than the length of a short-read sequencing alignment.
5af352c58c24 Uploaded
dave
parents:
diff changeset
658
5af352c58c24 Uploaded
dave
parents:
diff changeset
659 See https://github.com/ekg/freebayes for details on FreeBayes.
5af352c58c24 Uploaded
dave
parents:
diff changeset
660
5af352c58c24 Uploaded
dave
parents:
diff changeset
661 ------
5af352c58c24 Uploaded
dave
parents:
diff changeset
662
5af352c58c24 Uploaded
dave
parents:
diff changeset
663 **Description**
5af352c58c24 Uploaded
dave
parents:
diff changeset
664
5af352c58c24 Uploaded
dave
parents:
diff changeset
665 Provided some BAM dataset(s) and a reference sequence, FreeBayes will produce a VCF dataset describing SNPs, indels, and complex variants in samples in the input alignments.
5af352c58c24 Uploaded
dave
parents:
diff changeset
666
5af352c58c24 Uploaded
dave
parents:
diff changeset
667 By default, FreeBayes will consider variants supported by at least 2 observations in a single sample (-C) and also by at least 20% of the reads from a single sample (-F). These settings are suitable to low to high depth sequencing in haploid and diploid samples, but users working with polyploid or pooled samples may wish to adjust them depending on the characteristics of their sequencing data.
5af352c58c24 Uploaded
dave
parents:
diff changeset
668
5af352c58c24 Uploaded
dave
parents:
diff changeset
669 FreeBayes is capable of calling variant haplotypes shorter than a read length where multiple polymorphisms segregate on the same read. The maximum distance between polymorphisms phased in this way is determined by the --max-complex-gap, which defaults to 3bp. In practice, this can comfortably be set to half the read length.
5af352c58c24 Uploaded
dave
parents:
diff changeset
670
5af352c58c24 Uploaded
dave
parents:
diff changeset
671 Ploidy may be set to any level (-p), but by default all samples are assumed to be diploid. FreeBayes can model per-sample and per-region variation in copy-number (-A) using a copy-number variation map.
5af352c58c24 Uploaded
dave
parents:
diff changeset
672
5af352c58c24 Uploaded
dave
parents:
diff changeset
673 FreeBayes can act as a frequency-based pooled caller and describe variants and haplotypes in terms of observation frequency rather than called genotypes. To do so, use --pooled-continuous and set input filters to a suitable level. Allele observation counts will be described by AO and RO fields in the VCF output.
5af352c58c24 Uploaded
dave
parents:
diff changeset
674
5af352c58c24 Uploaded
dave
parents:
diff changeset
675 -------
5af352c58c24 Uploaded
dave
parents:
diff changeset
676
5af352c58c24 Uploaded
dave
parents:
diff changeset
677 **Galaxy-specific options**
5af352c58c24 Uploaded
dave
parents:
diff changeset
678
5af352c58c24 Uploaded
dave
parents:
diff changeset
679 Galaxy allows five levels of control over FreeBayes options, provided by the **Choose parameter selection level** menu option. These are:
5af352c58c24 Uploaded
dave
parents:
diff changeset
680
5af352c58c24 Uploaded
dave
parents:
diff changeset
681 1. *Simple diploid calling*: The simplest possible FreeBayes application. Equivalent to using FreeBayes with only a BAM input and no other parameter options.
5af352c58c24 Uploaded
dave
parents:
diff changeset
682 2. *Simple diploid calling with filtering and coverage*: Same as #1 plus two additional options: -0 (standard filters: --min-mapping-quality 30 --min-base-quality 20 --min-supporting-allele-qsum 0 --genotype-variant-threshold 0) and --min-coverage.
5af352c58c24 Uploaded
dave
parents:
diff changeset
683 3. *Frequency-based pooled calling*: This is equivalent to using FreeBayes with the following options: --haplotype-length 0 --min-alternate-count 1 --min-alternate-fraction 0 --pooled-continuous --report-monomorphic. This is the best choice for calling variants in mixtures such as viral, bacterial, or organellar genomes.
5af352c58c24 Uploaded
dave
parents:
diff changeset
684 4. *Frequency-based pooled calling with filtering and coverage*: Same as #3 but adds -0 and --min-coverage like in #2.
5af352c58c24 Uploaded
dave
parents:
diff changeset
685 5. *Complete list of all options*: Gives you full control by exposing all FreeBayes options as Galaxy parameters.
5af352c58c24 Uploaded
dave
parents:
diff changeset
686
5af352c58c24 Uploaded
dave
parents:
diff changeset
687 ------
5af352c58c24 Uploaded
dave
parents:
diff changeset
688
5af352c58c24 Uploaded
dave
parents:
diff changeset
689 **Command-line parameters**
5af352c58c24 Uploaded
dave
parents:
diff changeset
690
5af352c58c24 Uploaded
dave
parents:
diff changeset
691 **Input**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
692
5af352c58c24 Uploaded
dave
parents:
diff changeset
693 --bam FILE The file or set of BAM files to be analyzed.
5af352c58c24 Uploaded
dave
parents:
diff changeset
694 --bam-list FILE A file containing a list of BAM files to be analyzed.
5af352c58c24 Uploaded
dave
parents:
diff changeset
695
5af352c58c24 Uploaded
dave
parents:
diff changeset
696 --stdin Read BAM input on stdin.
5af352c58c24 Uploaded
dave
parents:
diff changeset
697 --fasta-reference FILE Use FILE as the reference sequence for analysis.
5af352c58c24 Uploaded
dave
parents:
diff changeset
698 An index file (FILE.fai) will be created if none exists.
5af352c58c24 Uploaded
dave
parents:
diff changeset
699 If neither --targets nor --region are specified, FreeBayes
5af352c58c24 Uploaded
dave
parents:
diff changeset
700 will analyze every position in this reference.
5af352c58c24 Uploaded
dave
parents:
diff changeset
701 --targets FILE Limit analysis to targets listed in the BED-format FILE.
5af352c58c24 Uploaded
dave
parents:
diff changeset
702 --region <chrom>:<start>-<end> Limit analysis to the specified region, 0-base coordinates,
5af352c58c24 Uploaded
dave
parents:
diff changeset
703 end_position not included (same as BED format).
5af352c58c24 Uploaded
dave
parents:
diff changeset
704 Either '-' or '..' maybe used as a separator.
5af352c58c24 Uploaded
dave
parents:
diff changeset
705 --samples FILE Limit analysis to samples listed (one per line) in the FILE.
5af352c58c24 Uploaded
dave
parents:
diff changeset
706 By default FreeBayes will analyze all samples in its input
5af352c58c24 Uploaded
dave
parents:
diff changeset
707 BAM files.
5af352c58c24 Uploaded
dave
parents:
diff changeset
708 --populations FILE Each line of FILE should list a sample and a population which
5af352c58c24 Uploaded
dave
parents:
diff changeset
709 it is part of. The population-based bayesian inference model
5af352c58c24 Uploaded
dave
parents:
diff changeset
710 will then be partitioned on the basis of the populations.
5af352c58c24 Uploaded
dave
parents:
diff changeset
711 --cnv-map FILE Read a copy number map from the BED file FILE, which has
5af352c58c24 Uploaded
dave
parents:
diff changeset
712 either a sample-level ploidy:
5af352c58c24 Uploaded
dave
parents:
diff changeset
713 sample_name copy_number
5af352c58c24 Uploaded
dave
parents:
diff changeset
714 or a region-specific format:
5af352c58c24 Uploaded
dave
parents:
diff changeset
715 seq_name start end sample_name copy_number
5af352c58c24 Uploaded
dave
parents:
diff changeset
716 ... for each region in each sample which does not have the
5af352c58c24 Uploaded
dave
parents:
diff changeset
717 default copy number as set by --ploidy. These fields can be delimited
5af352c58c24 Uploaded
dave
parents:
diff changeset
718 by space or tab.
5af352c58c24 Uploaded
dave
parents:
diff changeset
719
5af352c58c24 Uploaded
dave
parents:
diff changeset
720 **Output**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
721
5af352c58c24 Uploaded
dave
parents:
diff changeset
722 --vcf FILE Output VCF-format results to FILE. (default: stdout)
5af352c58c24 Uploaded
dave
parents:
diff changeset
723 --gvcf Write gVCF output, which indicates coverage in uncalled regions.
5af352c58c24 Uploaded
dave
parents:
diff changeset
724 --gvcf-chunk NUM When writing gVCF output emit a record for every NUM bases.
5af352c58c24 Uploaded
dave
parents:
diff changeset
725 --gvcf-dont-use-chunk When writing the gVCF output emit a record for all bases if
5af352c58c24 Uploaded
dave
parents:
diff changeset
726 set to "true" , will also route an int to --gvcf-chunk
5af352c58c24 Uploaded
dave
parents:
diff changeset
727 similar to --output-mode EMIT_ALL_SITES from GATK
5af352c58c24 Uploaded
dave
parents:
diff changeset
728 --variant-input VCF Use variants reported in VCF file as input to the algorithm.
5af352c58c24 Uploaded
dave
parents:
diff changeset
729 Variants in this file will included in the output even if
5af352c58c24 Uploaded
dave
parents:
diff changeset
730 there is not enough support in the data to pass input filters.
5af352c58c24 Uploaded
dave
parents:
diff changeset
731 --only-use-input-alleles Only provide variant calls and genotype likelihoods for sites
5af352c58c24 Uploaded
dave
parents:
diff changeset
732 and alleles which are provided in the VCF input, and provide
5af352c58c24 Uploaded
dave
parents:
diff changeset
733 output in the VCF for all input alleles, not just those which
5af352c58c24 Uploaded
dave
parents:
diff changeset
734 have support in the data.
5af352c58c24 Uploaded
dave
parents:
diff changeset
735 --haplotype-basis-alleles VCF When specified, only variant alleles provided in this input
5af352c58c24 Uploaded
dave
parents:
diff changeset
736 VCF will be used for the construction of complex or haplotype
5af352c58c24 Uploaded
dave
parents:
diff changeset
737 alleles.
5af352c58c24 Uploaded
dave
parents:
diff changeset
738 --report-all-haplotype-alleles At sites where genotypes are made over haplotype alleles,
5af352c58c24 Uploaded
dave
parents:
diff changeset
739 provide information about all alleles in output, not only
5af352c58c24 Uploaded
dave
parents:
diff changeset
740 those which are called.
5af352c58c24 Uploaded
dave
parents:
diff changeset
741 --report-monomorphic Report even loci which appear to be monomorphic, and report all
5af352c58c24 Uploaded
dave
parents:
diff changeset
742 considered alleles, even those which are not in called genotypes.
5af352c58c24 Uploaded
dave
parents:
diff changeset
743 Loci which do not have any potential alternates have '.' for ALT.
5af352c58c24 Uploaded
dave
parents:
diff changeset
744 --pvar N Report sites if the probability that there is a polymorphism
5af352c58c24 Uploaded
dave
parents:
diff changeset
745 at the site is greater than N. default: 0.0. Note that post-
5af352c58c24 Uploaded
dave
parents:
diff changeset
746 filtering is generally recommended over the use of this parameter.
5af352c58c24 Uploaded
dave
parents:
diff changeset
747 --strict-vcf Generate strict VCF format (FORMAT/GQ will be an int)
5af352c58c24 Uploaded
dave
parents:
diff changeset
748
5af352c58c24 Uploaded
dave
parents:
diff changeset
749 **Population model**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
750
5af352c58c24 Uploaded
dave
parents:
diff changeset
751 --theta N The expected mutation rate or pairwise nucleotide diversity
5af352c58c24 Uploaded
dave
parents:
diff changeset
752 among the population under analysis. This serves as the
5af352c58c24 Uploaded
dave
parents:
diff changeset
753 single parameter to the Ewens Sampling Formula prior model
5af352c58c24 Uploaded
dave
parents:
diff changeset
754 default: 0.001
5af352c58c24 Uploaded
dave
parents:
diff changeset
755 --ploidy N Sets the default ploidy for the analysis to N. default: 2
5af352c58c24 Uploaded
dave
parents:
diff changeset
756 --pooled-discrete Assume that samples result from pooled sequencing.
5af352c58c24 Uploaded
dave
parents:
diff changeset
757 Model pooled samples using discrete genotypes across pools.
5af352c58c24 Uploaded
dave
parents:
diff changeset
758 When using this flag, set --ploidy to the number of
5af352c58c24 Uploaded
dave
parents:
diff changeset
759 alleles in each sample or use the --cnv-map to define
5af352c58c24 Uploaded
dave
parents:
diff changeset
760 per-sample ploidy.
5af352c58c24 Uploaded
dave
parents:
diff changeset
761 --pooled-continuous Output all alleles which pass input filters, regardles of
5af352c58c24 Uploaded
dave
parents:
diff changeset
762 genotyping outcome or model.
5af352c58c24 Uploaded
dave
parents:
diff changeset
763
5af352c58c24 Uploaded
dave
parents:
diff changeset
764 **Reference allele**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
765
5af352c58c24 Uploaded
dave
parents:
diff changeset
766 --use-reference-allele This flag includes the reference allele in the analysis as
5af352c58c24 Uploaded
dave
parents:
diff changeset
767 if it is another sample from the same population.
5af352c58c24 Uploaded
dave
parents:
diff changeset
768 --reference-quality MQ,BQ Assign mapping quality of MQ to the reference allele at each
5af352c58c24 Uploaded
dave
parents:
diff changeset
769 site and base quality of BQ. default: 100,60
5af352c58c24 Uploaded
dave
parents:
diff changeset
770
5af352c58c24 Uploaded
dave
parents:
diff changeset
771 **Allele scope**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
772
5af352c58c24 Uploaded
dave
parents:
diff changeset
773 --use-best-n-alleles N Evaluate only the best N SNP alleles, ranked by sum of
5af352c58c24 Uploaded
dave
parents:
diff changeset
774 supporting quality scores. (Set to 0 to use all; default: all)
5af352c58c24 Uploaded
dave
parents:
diff changeset
775 --max-complex-gap
5af352c58c24 Uploaded
dave
parents:
diff changeset
776 --haplotype-length N Allow haplotype calls with contiguous embedded matches of up
5af352c58c24 Uploaded
dave
parents:
diff changeset
777 to this length. Set N=-1 to disable clumping. (default: 3)
5af352c58c24 Uploaded
dave
parents:
diff changeset
778 --min-repeat-size When assembling observations across repeats, require the total repeat
5af352c58c24 Uploaded
dave
parents:
diff changeset
779 length at least this many bp. (default: 5)
5af352c58c24 Uploaded
dave
parents:
diff changeset
780 --min-repeat-entropy N To detect interrupted repeats, build across sequence until it has
5af352c58c24 Uploaded
dave
parents:
diff changeset
781 entropy > N bits per bp. Set to 0 to turn off. (default: 1)
5af352c58c24 Uploaded
dave
parents:
diff changeset
782 --no-partial-observations Exclude observations which do not fully span the dynamically-determined
5af352c58c24 Uploaded
dave
parents:
diff changeset
783 detection window. (default, use all observations, dividing partial
5af352c58c24 Uploaded
dave
parents:
diff changeset
784 support across matching haplotypes when generating haplotypes.)
5af352c58c24 Uploaded
dave
parents:
diff changeset
785
5af352c58c24 Uploaded
dave
parents:
diff changeset
786 **Indel realignment**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
787
5af352c58c24 Uploaded
dave
parents:
diff changeset
788 --dont-left-align-indels Turn off left-alignment of indels, which is enabled by default.
5af352c58c24 Uploaded
dave
parents:
diff changeset
789
5af352c58c24 Uploaded
dave
parents:
diff changeset
790 **Input filters**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
791
5af352c58c24 Uploaded
dave
parents:
diff changeset
792 --use-duplicate-reads Include duplicate-marked alignments in the analysis.
5af352c58c24 Uploaded
dave
parents:
diff changeset
793 default: exclude duplicates marked as such in alignments
5af352c58c24 Uploaded
dave
parents:
diff changeset
794 --min-mapping-quality Q Exclude alignments from analysis if they have a mapping
5af352c58c24 Uploaded
dave
parents:
diff changeset
795 quality less than Q. default: 1
5af352c58c24 Uploaded
dave
parents:
diff changeset
796 --min-base-quality Q Exclude alleles from analysis if their supporting base
5af352c58c24 Uploaded
dave
parents:
diff changeset
797 quality is less than Q. default: 0
5af352c58c24 Uploaded
dave
parents:
diff changeset
798 --min-supporting-allele-qsum Q Consider any allele in which the sum of qualities of supporting
5af352c58c24 Uploaded
dave
parents:
diff changeset
799 observations is at least Q. default: 0
5af352c58c24 Uploaded
dave
parents:
diff changeset
800 --min-supporting-mapping-qsum Q Consider any allele in which and the sum of mapping qualities of
5af352c58c24 Uploaded
dave
parents:
diff changeset
801 supporting reads is at least Q. default: 0
5af352c58c24 Uploaded
dave
parents:
diff changeset
802 --mismatch-base-quality-threshold Q Count mismatches toward --read-mismatch-limit if the base
5af352c58c24 Uploaded
dave
parents:
diff changeset
803 quality of the mismatch is >= Q. default: 10
5af352c58c24 Uploaded
dave
parents:
diff changeset
804 --read-mismatch-limit N Exclude reads with more than N mismatches where each mismatch
5af352c58c24 Uploaded
dave
parents:
diff changeset
805 has base quality >= mismatch-base-quality-threshold.
5af352c58c24 Uploaded
dave
parents:
diff changeset
806 default: ~unbounded
5af352c58c24 Uploaded
dave
parents:
diff changeset
807 --read-max-mismatch-fraction N Exclude reads with more than N [0,1] fraction of mismatches where
5af352c58c24 Uploaded
dave
parents:
diff changeset
808 each mismatch has base quality >= mismatch-base-quality-threshold
5af352c58c24 Uploaded
dave
parents:
diff changeset
809 default: 1.0
5af352c58c24 Uploaded
dave
parents:
diff changeset
810 --read-snp-limit N Exclude reads with more than N base mismatches, ignoring gaps
5af352c58c24 Uploaded
dave
parents:
diff changeset
811 with quality >= mismatch-base-quality-threshold.
5af352c58c24 Uploaded
dave
parents:
diff changeset
812 default: ~unbounded
5af352c58c24 Uploaded
dave
parents:
diff changeset
813 --read-indel-limit N Exclude reads with more than N separate gaps.
5af352c58c24 Uploaded
dave
parents:
diff changeset
814 default: ~unbounded
5af352c58c24 Uploaded
dave
parents:
diff changeset
815 --standard-filters Use stringent input base and mapping quality filters
5af352c58c24 Uploaded
dave
parents:
diff changeset
816 Equivalent to -m 30 -q 20 -R 0 -S 0
5af352c58c24 Uploaded
dave
parents:
diff changeset
817 --min-alternate-fraction N Require at least this fraction of observations supporting
5af352c58c24 Uploaded
dave
parents:
diff changeset
818 an alternate allele within a single individual in the
5af352c58c24 Uploaded
dave
parents:
diff changeset
819 in order to evaluate the position. default: 0.05
5af352c58c24 Uploaded
dave
parents:
diff changeset
820 --min-alternate-count N Require at least this count of observations supporting
5af352c58c24 Uploaded
dave
parents:
diff changeset
821 an alternate allele within a single individual in order
5af352c58c24 Uploaded
dave
parents:
diff changeset
822 to evaluate the position. default: 2
5af352c58c24 Uploaded
dave
parents:
diff changeset
823 --min-alternate-qsum N Require at least this sum of quality of observations supporting
5af352c58c24 Uploaded
dave
parents:
diff changeset
824 an alternate allele within a single individual in order
5af352c58c24 Uploaded
dave
parents:
diff changeset
825 to evaluate the position. default: 0
5af352c58c24 Uploaded
dave
parents:
diff changeset
826 --min-alternate-total N Require at least this count of observations supporting
5af352c58c24 Uploaded
dave
parents:
diff changeset
827 an alternate allele within the total population in order
5af352c58c24 Uploaded
dave
parents:
diff changeset
828 to use the allele in analysis. default: 1
5af352c58c24 Uploaded
dave
parents:
diff changeset
829 --min-coverage N Require at least this coverage to process a site. default: 0
5af352c58c24 Uploaded
dave
parents:
diff changeset
830 --limit-coverage N Downsample per-sample coverage to this level if greater than this coverage.
5af352c58c24 Uploaded
dave
parents:
diff changeset
831 default: no limit
5af352c58c24 Uploaded
dave
parents:
diff changeset
832 --skip-coverage N Skip processing of alignments overlapping positions with coverage >N.
5af352c58c24 Uploaded
dave
parents:
diff changeset
833 This filters sites above this coverage, but will also reduce data nearby.
5af352c58c24 Uploaded
dave
parents:
diff changeset
834 default: no limit
5af352c58c24 Uploaded
dave
parents:
diff changeset
835
5af352c58c24 Uploaded
dave
parents:
diff changeset
836 **Population priors**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
837
5af352c58c24 Uploaded
dave
parents:
diff changeset
838 --no-population-priors Equivalent to --pooled-discrete --hwe-priors-off and removal of
5af352c58c24 Uploaded
dave
parents:
diff changeset
839 Ewens Sampling Formula component of priors.
5af352c58c24 Uploaded
dave
parents:
diff changeset
840
5af352c58c24 Uploaded
dave
parents:
diff changeset
841 **Mappability priors**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
842
5af352c58c24 Uploaded
dave
parents:
diff changeset
843 --hwe-priors-off Disable estimation of the probability of the combination
5af352c58c24 Uploaded
dave
parents:
diff changeset
844 arising under HWE given the allele frequency as estimated
5af352c58c24 Uploaded
dave
parents:
diff changeset
845 by observation frequency.
5af352c58c24 Uploaded
dave
parents:
diff changeset
846 --binomial-obs-priors-off Disable incorporation of prior expectations about observations.
5af352c58c24 Uploaded
dave
parents:
diff changeset
847 Uses read placement probability, strand balance probability,
5af352c58c24 Uploaded
dave
parents:
diff changeset
848 and read position (5'-3') probability.
5af352c58c24 Uploaded
dave
parents:
diff changeset
849 --allele-balance-priors-off Disable use of aggregate probability of observation balance between alleles
5af352c58c24 Uploaded
dave
parents:
diff changeset
850 as a component of the priors.
5af352c58c24 Uploaded
dave
parents:
diff changeset
851
5af352c58c24 Uploaded
dave
parents:
diff changeset
852 **Genotype likelihoods**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
853
5af352c58c24 Uploaded
dave
parents:
diff changeset
854 --observation-bias FILE Read length-dependent allele observation biases from FILE.
5af352c58c24 Uploaded
dave
parents:
diff changeset
855 The format is [length] [alignment efficiency relative to reference]
5af352c58c24 Uploaded
dave
parents:
diff changeset
856 where the efficiency is 1 if there is no relative observation bias.
5af352c58c24 Uploaded
dave
parents:
diff changeset
857 --base-quality-cap Q Limit estimated observation quality by capping base quality at Q.
5af352c58c24 Uploaded
dave
parents:
diff changeset
858 --prob-contamination F An estimate of contamination to use for all samples. default: 10e-9
5af352c58c24 Uploaded
dave
parents:
diff changeset
859 --legacy-gls Use legacy (polybayes equivalent) genotype likelihood calculations
5af352c58c24 Uploaded
dave
parents:
diff changeset
860 --contamination-estimates FILE A file containing per-sample estimates of contamination, such as
5af352c58c24 Uploaded
dave
parents:
diff changeset
861 those generated by VerifyBamID. The format should be:
5af352c58c24 Uploaded
dave
parents:
diff changeset
862 sample p(read=R|genotype=AR) p(read=A|genotype=AA)
5af352c58c24 Uploaded
dave
parents:
diff changeset
863 Sample '*' can be used to set default contamination estimates.
5af352c58c24 Uploaded
dave
parents:
diff changeset
864
5af352c58c24 Uploaded
dave
parents:
diff changeset
865 **Algorithmic features**::
5af352c58c24 Uploaded
dave
parents:
diff changeset
866
5af352c58c24 Uploaded
dave
parents:
diff changeset
867 --report-genotype-likelihood-max Report genotypes using the maximum-likelihood estimate provided
5af352c58c24 Uploaded
dave
parents:
diff changeset
868 from genotype likelihoods.
5af352c58c24 Uploaded
dave
parents:
diff changeset
869 --genotyping-max-iterations N Iterate no more than N times during genotyping step. default: 1000.
5af352c58c24 Uploaded
dave
parents:
diff changeset
870 --genotyping-max-banddepth N Integrate no deeper than the Nth best genotype by likelihood when
5af352c58c24 Uploaded
dave
parents:
diff changeset
871 genotyping. default: 6.
5af352c58c24 Uploaded
dave
parents:
diff changeset
872 --posterior-integration-limits N,M Integrate all genotype combinations in our posterior space
5af352c58c24 Uploaded
dave
parents:
diff changeset
873 which include no more than N samples with their Mth best
5af352c58c24 Uploaded
dave
parents:
diff changeset
874 data likelihood. default: 1,3.
5af352c58c24 Uploaded
dave
parents:
diff changeset
875 --exclude-unobserved-genotypes Skip sample genotypings for which the sample has no supporting reads.
5af352c58c24 Uploaded
dave
parents:
diff changeset
876 --genotype-variant-threshold N Limit posterior integration to samples where the second-best
5af352c58c24 Uploaded
dave
parents:
diff changeset
877 genotype likelihood is no more than log(N) from the highest
5af352c58c24 Uploaded
dave
parents:
diff changeset
878 genotype likelihood for the sample. default: ~unbounded
5af352c58c24 Uploaded
dave
parents:
diff changeset
879 --use-mapping-quality Use mapping quality of alleles when calculating data likelihoods.
5af352c58c24 Uploaded
dave
parents:
diff changeset
880 --harmonic-indel-quality Use a weighted sum of base qualities around an indel, scaled by the
5af352c58c24 Uploaded
dave
parents:
diff changeset
881 distance from the indel. By default use a minimum BQ in flanking sequence.
5af352c58c24 Uploaded
dave
parents:
diff changeset
882 --read-dependence-factor N Incorporate non-independence of reads by scaling successive
5af352c58c24 Uploaded
dave
parents:
diff changeset
883 observations by this factor during data likelihood
5af352c58c24 Uploaded
dave
parents:
diff changeset
884 calculations. default: 0.9
5af352c58c24 Uploaded
dave
parents:
diff changeset
885 --genotype-qualities Calculate the marginal probability of genotypes and report as GQ in
5af352c58c24 Uploaded
dave
parents:
diff changeset
886 each sample field in the VCF output.
5af352c58c24 Uploaded
dave
parents:
diff changeset
887
5af352c58c24 Uploaded
dave
parents:
diff changeset
888 ------
5af352c58c24 Uploaded
dave
parents:
diff changeset
889
5af352c58c24 Uploaded
dave
parents:
diff changeset
890 **Acknowledgments**
5af352c58c24 Uploaded
dave
parents:
diff changeset
891
5af352c58c24 Uploaded
dave
parents:
diff changeset
892 The initial version of the wrapper was produced by Dan Blankenberg and upgraded by Anton Nekrutenko.
5af352c58c24 Uploaded
dave
parents:
diff changeset
893 TNG was developed by Bjoern Gruening.
5af352c58c24 Uploaded
dave
parents:
diff changeset
894 ]]>
5af352c58c24 Uploaded
dave
parents:
diff changeset
895 </help>
5af352c58c24 Uploaded
dave
parents:
diff changeset
896 <expand macro="citations">
5af352c58c24 Uploaded
dave
parents:
diff changeset
897 <citation type="bibtex">
5af352c58c24 Uploaded
dave
parents:
diff changeset
898 @article{Tange2011a,
5af352c58c24 Uploaded
dave
parents:
diff changeset
899 title = {GNU Parallel - The Command-Line Power Tool},
5af352c58c24 Uploaded
dave
parents:
diff changeset
900 author = {O. Tange},
5af352c58c24 Uploaded
dave
parents:
diff changeset
901 address = {Frederiksberg, Denmark},
5af352c58c24 Uploaded
dave
parents:
diff changeset
902 journal = {;login: The USENIX Magazine},
5af352c58c24 Uploaded
dave
parents:
diff changeset
903 month = {Feb},
5af352c58c24 Uploaded
dave
parents:
diff changeset
904 number = {1},
5af352c58c24 Uploaded
dave
parents:
diff changeset
905 volume = {36},
5af352c58c24 Uploaded
dave
parents:
diff changeset
906 url = {http://www.gnu.org/s/parallel},
5af352c58c24 Uploaded
dave
parents:
diff changeset
907 year = {2011},
5af352c58c24 Uploaded
dave
parents:
diff changeset
908 pages = {42-47}
5af352c58c24 Uploaded
dave
parents:
diff changeset
909 }
5af352c58c24 Uploaded
dave
parents:
diff changeset
910 </citation>
5af352c58c24 Uploaded
dave
parents:
diff changeset
911 </expand>
5af352c58c24 Uploaded
dave
parents:
diff changeset
912 </tool>