annotate bcftools_norm.xml @ 29:91a6f019e1a9 draft

Uploaded
author wrtz
date Fri, 15 Jan 2016 11:54:12 -0500
parents dfba0f0b3edd
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
13
22d009d35145 Uploaded
wrtz
parents:
diff changeset
1 <tool id="bcftools_norm" name="BCFtools norm" version="1.0.0">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
2 <description>Left-align and normalize indels, check if REF alleles match reference, change multiallelic format</description>
25
dfba0f0b3edd Uploaded
wrtz
parents: 13
diff changeset
3 <requirements>
dfba0f0b3edd Uploaded
wrtz
parents: 13
diff changeset
4 <requirement type="package" version="1.3">bcftools</requirement>
dfba0f0b3edd Uploaded
wrtz
parents: 13
diff changeset
5 </requirements>
13
22d009d35145 Uploaded
wrtz
parents:
diff changeset
6 <command>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
7 #if str( $input_file_index ) != "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
8 ln -s -f $input input_file.${input.ext} &amp;&amp;
22d009d35145 Uploaded
wrtz
parents:
diff changeset
9 ln -s -f $input_file_index input_file.${input.ext}.tbi &amp;&amp;
22d009d35145 Uploaded
wrtz
parents:
diff changeset
10 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
11 #if str( $fasta_ref_cond.set_fasta_ref ).lower() == "true":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
12 #if str( $fasta_ref_cond.fasta_ref_index ) != "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
13 ln -s -f $fasta_ref_cond.fasta_ref fasta_ref_file.${fasta_ref_cond.fasta_ref.ext}.fa &amp;&amp;
22d009d35145 Uploaded
wrtz
parents:
diff changeset
14 ln -s -f $fasta_ref_cond.fasta_ref_index fasta_ref_file.${fasta_ref_cond.fasta_ref.ext}.fa.fai &amp;&amp;
22d009d35145 Uploaded
wrtz
parents:
diff changeset
15 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
16 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
17 bcftools norm
22d009d35145 Uploaded
wrtz
parents:
diff changeset
18 --output "${output_file}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
19 --output-type "${output_type}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
20 #if str( $regions_file ) != "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
21 --regions-file "${regions_file}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
22 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
23 #if str( $regions ) != "":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
24 --regions "${regions}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
25 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
26 #if str( $targets_file ) != "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
27 --targets-file "${targets_file}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
28 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
29 #if str( $targets ) != "":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
30 --targets "${targets}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
31 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
32 #if str( $check_ref_cond.set_check_ref ).lower() == "true":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
33 #if str( $check_ref_cond.warn ) == "true":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
34 #if str( $check_ref_cond.check_ref ) == "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
35 --check-ref "w"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
36 #else
22d009d35145 Uploaded
wrtz
parents:
diff changeset
37 --check-ref "w${check_ref_cond.check_ref}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
38 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
39 #elif str( $check_ref_cond.check_ref ) != "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
40 --check-ref "${check_ref_cond.check_ref}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
41 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
42 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
43 #if str( $fasta_ref_cond.set_fasta_ref ).lower() == "true":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
44 #if str( $fasta_ref_cond.fasta_ref_index ) != "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
45 --fasta-ref "fasta_ref_file.${fasta_ref_cond.fasta_ref.ext}.fa"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
46 #else
22d009d35145 Uploaded
wrtz
parents:
diff changeset
47 --fasta-ref "${fasta_ref_cond.fasta_ref}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
48 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
49 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
50 #if str( $multiallelics_cond.set_multiallelics ).lower() == "true":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
51 #if str( $multiallelics_cond.minus_or_plus ) == "minus":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
52 #if str ( $multiallelics_cond.multiallelics ) != "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
53 --multiallelics "-${multiallelics_cond.multiallelics}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
54 #else
22d009d35145 Uploaded
wrtz
parents:
diff changeset
55 --multiallelics "-"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
56 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
57 #else
22d009d35145 Uploaded
wrtz
parents:
diff changeset
58 #if str ( $multiallelics_cond.multiallelics ) != "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
59 --multiallelics "+${multiallelics_cond.multiallelics}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
60 #else
22d009d35145 Uploaded
wrtz
parents:
diff changeset
61 --multiallelics "+"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
62 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
63 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
64 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
65 #if str( $rm_dup ) != "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
66 --rm-dup "${rm_dup}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
67 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
68 ${do_not_normalize}
22d009d35145 Uploaded
wrtz
parents:
diff changeset
69 ${strict_filter}
22d009d35145 Uploaded
wrtz
parents:
diff changeset
70 #if str( $site_win ) != "":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
71 --site-win "${site_win}"
22d009d35145 Uploaded
wrtz
parents:
diff changeset
72 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
73 #if str( $input_file_index ) != "None":
22d009d35145 Uploaded
wrtz
parents:
diff changeset
74 input_file.${input.ext}
22d009d35145 Uploaded
wrtz
parents:
diff changeset
75 #else
22d009d35145 Uploaded
wrtz
parents:
diff changeset
76 $input
22d009d35145 Uploaded
wrtz
parents:
diff changeset
77 #end if
22d009d35145 Uploaded
wrtz
parents:
diff changeset
78 </command>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
79 <inputs>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
80 <param name="input" type="data" format="vcf,bcf,bgzip" label="VCF or BCF input file" help="Input file can optionally be compressed and indexed using Bgzip and Tabix Galaxy tools. In this case, select bgzipped file here and index below."/>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
81 <param name="input_file_index" type="data" optional="true" label="Input file index" help="Tabix-generated index for input file. Run Tabix Galaxy tool on bgzipped input file to create index."/>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
82 <param name="output_type" type="select" label="Output data type" help="-O">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
83 <option value="v" selected="true">VCF</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
84 <option value="b">BCF</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
85 </param>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
86 <param name="regions_file" type="data" optional="true" label="Regions file" help="-R. Regions specified in a VCF, BED, or tab-delimited file with columns CHROM, POS, and, optionally, POS_TO."/>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
87 <param name="regions" type="text" size="80" optional="True" label="Regions list" help="-r. Comma-separated list of regions. Format: chr|chr:pos|chr:from-to|chr:from-[,...]">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
88 <sanitizer invalid_char="">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
89 <valid initial="string.letters,string.digits"><add value="-:,._"/> </valid> <!-- allow any contig name made of letters, digits, '.', '_' (e.g. chrX, chrM, scaffold_1), not only names spelled with c/h/r -->
22d009d35145 Uploaded
wrtz
parents:
diff changeset
90 </sanitizer>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
91 </param>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
92 <param name="targets_file" type="data" optional="true" label="Targets file" help="-T. Targets specified in a VCF, BED, or tab-delimited file with columns CHROM, POS, and, optionally, POS_TO."/>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
93 <param name="targets" type="text" size="80" optional="True" label="Targets list" help="-t. Comma-separated list of targets. Format: [^]chr|chr:pos|chr:from-to|chr:from-[,...]">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
94 <sanitizer invalid_char="">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
95 <valid initial="string.letters,string.digits"><add value="-:,._^"/> </valid> <!-- allow any contig name made of letters, digits, '.', '_' (e.g. chrX, chrM, scaffold_1); '^' keeps the exclusion prefix -->
22d009d35145 Uploaded
wrtz
parents:
diff changeset
96 </sanitizer>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
97 </param>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
98 <conditional name="fasta_ref_cond">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
99 <param name="set_fasta_ref" type="boolean" checked="False" label="Specify FASTA reference sequence" help="-f" />
22d009d35145 Uploaded
wrtz
parents:
diff changeset
100 <when value="true">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
101 <param name="fasta_ref" type="data" label="FASTA reference file" help="Reference sequence. Using this option turns on left-alignment and normalization. Set corresponding index below." />
22d009d35145 Uploaded
wrtz
parents:
diff changeset
102 <param name="fasta_ref_index" type="data" optional="True" label="FASTA reference index" help="Run Faidx (SAMtools) Galaxy tool on above reference file to create index. Errors can arise if this index is not specified." />
22d009d35145 Uploaded
wrtz
parents:
diff changeset
103 </when>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
104 </conditional>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
105 <param name="do_not_normalize" type="boolean" checked="False" truevalue="--do-not-normalize" falsevalue="" label="Turn off indel normalization" help="-N. Indel normalization automatically occurs when FASTA reference is used. Use this option to disable this behavior." />
22d009d35145 Uploaded
wrtz
parents:
diff changeset
106 <conditional name="check_ref_cond">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
107 <param name="set_check_ref" type="boolean" checked="False" label="Check REF" help="-c. Choose action when an incorrect or missing REF allele is encountered." />
22d009d35145 Uploaded
wrtz
parents:
diff changeset
108 <when value="true">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
109 <param name="check_ref" type="select" optional="True" label="Action" help="Action when an incorrect or missing REF allele is encountered.">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
110 <option value="e">Exit program</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
111 <option value="x">Exclude incorrect/missing sites</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
112 <option value="s">Set or fix incorrect/missing sites (requires FASTA reference)</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
113 </param>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
114 <param name="warn" type="boolean" checked="False" label="Warn" help="Warn when an incorrect or missing REF allele is encountered." />
22d009d35145 Uploaded
wrtz
parents:
diff changeset
115 </when>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
116 </conditional>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
117 <param name="rm_dup" type="select" optional="True" label="Remove duplicates" help="-d. For given variant type, if a record is present in multiple files, output only the first instance.">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
118 <option value="snps">SNPs</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
119 <option value="indels">Indels</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
120 <option value="both">Both (SNPs and indels)</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
121 <option value="any">Any</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
122 </param>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
123 <conditional name="multiallelics_cond">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
124 <param name="set_multiallelics" type="boolean" checked="False" label="Modify multiallelic sites" help="-m. Split multiallelic sites into biallelic records, or join biallelic sites into multiallelic records." />
22d009d35145 Uploaded
wrtz
parents:
diff changeset
125 <when value="true">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
126 <param name="minus_or_plus" type="select" label="Split or join">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
127 <option value="minus" selected="true">Split multiallelic sites into biallelic records</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
128 <option value="plus">Join biallelic sites into multiallelic records</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
129 </param>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
130 <param name="multiallelics" type="select" optional="True" label="Sites to split/join" help="">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
131 <option value="snps">SNPs (only SNP records are split/joined)</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
132 <option value="indels">Indels (only indel records are split/joined)</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
133 <option value="both">Both (SNPs and indels are merged separately into two records)</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
134 <option value="any">Any (SNPs and indels are merged into a single record)</option>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
135 </param>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
136 </when>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
137 </conditional>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
138 <param name="strict_filter" type="boolean" checked="False" truevalue="--strict-filter" falsevalue="" label="Strict PASS filter" help="-s. When merging biallelics into multiallelics, merged site has value PASS only if all sites being merged have value PASS." />
22d009d35145 Uploaded
wrtz
parents:
diff changeset
139 <param name="site_win" type="integer" optional="true" label="Position window" help="-w. Maximum distance between two records to consider when locally sorting variants which changed position during the realignment." />
22d009d35145 Uploaded
wrtz
parents:
diff changeset
140 </inputs>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
141 <outputs>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
142 <data name="output_file" format="vcf" label="${tool.name} on ${on_string}">
22d009d35145 Uploaded
wrtz
parents:
diff changeset
143 <change_format>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
144 <when input="output_type" value="b" format="bcf" />
22d009d35145 Uploaded
wrtz
parents:
diff changeset
145 </change_format>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
146 </data>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
147 </outputs>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
148 <help>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
149 **About this tool**
22d009d35145 Uploaded
wrtz
parents:
diff changeset
150
22d009d35145 Uploaded
wrtz
parents:
diff changeset
151 **BCFtools norm**: Left-align and normalize indels, check if REF alleles match the reference, split multiallelic sites into multiple rows, recover multiallelics from multiple rows. Left-alignment and normalization will only be applied if the --fasta-ref option is supplied.
22d009d35145 Uploaded
wrtz
parents:
diff changeset
152
22d009d35145 Uploaded
wrtz
parents:
diff changeset
153 Please see https://samtools.github.io/bcftools/bcftools.html for more info on options.
22d009d35145 Uploaded
wrtz
parents:
diff changeset
154 </help>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
155 </tool>
22d009d35145 Uploaded
wrtz
parents:
diff changeset
156