comparison annotate_variants.xml @ 3:d6ec32ce882b draft default tip

Uploaded
author wolma
date Tue, 28 Mar 2017 04:34:04 -0400
parents
children
comparison
equal deleted inserted replaced
2:7f7028112439 3:d6ec32ce882b
1 <tool id="annotate_variants" name="Variant Annotation" version="0.1.7.3">
2 <description>Predict the effects of SNPs and indels on known genes in the reference genome using SnpEff</description>
3 <macros>
4 <import>toolshed_macros.xml</import>
5 </macros>
6 <expand macro="requirements" />
7 <version_command>mimodd version -q</version_command>
8 <command>
9 mimodd annotate
10
11 "$inputfile"
12
13 #if $str($annotool.name)=='snpeff':
14 --genome "${annotool.genomeVersion}"
15 #if $annotool.ori_output:
16 --snpeff-out "$snpeff_file"
17 #end if
18 #if $annotool.stats:
19 --stats "$summary_file"
20 #end if
21 ${annotool.snpeff_settings.chr} ${annotool.snpeff_settings.no_us} ${annotool.snpeff_settings.no_ds} ${annotool.snpeff_settings.no_intron} ${annotool.snpeff_settings.no_intergenic} ${annotool.snpeff_settings.no_utr}
22 #if $annotool.snpeff_settings.min_cov:
23 --minC "${annotool.snpeff_settings.min_cov}"
24 #end if
25 #if $annotool.snpeff_settings.min_qual:
26 --minQ "${annotool.snpeff_settings.min_qual}"
27 #end if
28 #if $annotool.snpeff_settings.ud:
29 --ud "${annotool.snpeff_settings.ud}"
30 #end if
31 #end if
32
33 --ofile "$outputfile"
34 #if $str($formatting.oformat) == "text":
35 --oformat text
36 #end if
37 #if $str($formatting.oformat) == "html":
38 #if $formatting.formatter_file:
39 --link "${formatting.formatter_file}"
40 #end if
41 #if $formatting.species
42 --species "${formatting.species}"
43 #end if
44 #end if
45
46 #if $str($grouping):
47 --grouping $grouping
48 #end if
49 --verbose
50 </command>
51
52 <inputs>
53 <param format="vcf" label="vcf inputfile to be annotated" name="inputfile" type="data" />
54 <param label="Group variants by" name="grouping" type="select">
55 <option value="">order in the input file</option>
56 <option value="by_sample">sample</option>
57 <option value="by_genes">most affected genes</option>
58 </param>
59 <conditional name="formatting">
60 <param label="Format of the annotation output file" name="oformat" type="select">
61 <option value="html">HTML</option>
62 <option value="text">Tab-separated plain text</option>
63 </param>
64 <when value="html">
65 <param format="txt" label="Optional file with hyperlink formatting instructions" name="formatter_file" optional="true" type="data" />
66 <param help="Overwrite the species guess from the SnpEff genome, often not necessary" label="Species" name="species" type="text" />
67 </when>
68 </conditional>
69 <conditional name="annotool">
70 <param help="Select SnpEff here, if you want to have the vcf input annotated with genomic feature information. Select None if you do not want additional annotation, if you do not have SnpEff installed, or if you have no appropriate SnpEff annotation file for the input." label="Use this tool to annotate the input file" name="name" type="select">
71 <option value="snpeff">SnpEff</option>
72 <option value="None">None</option>
73 </param>
74 <when value="snpeff">
75 <param format="tabular" label="genome list" name="genome_list" type="data" />
76 <param label="Genome" name="genomeVersion" type="select">
77 <options from_dataset="genome_list">
78 <column index="0" name="name" />
79 <column index="1" name="value" />
80 </options>
81 </param>
82 <param checked="true" label="Keep the original SnpEff output" name="ori_output" type="boolean" />
83 <param checked="true" label="Produce a summary file of results" name="stats" type="boolean" />
84
85 <conditional name="snpeff_settings">
86 <param help="This section lets you specify the detailed parameter settings for the SnpEff tool." label="SnpEff-specific parameter settings" name="detail_level" type="select">
87 <option value="default">default settings</option>
88 <option value="change">change settings</option>
89 </param>
90 <when value="default">
91 ## default settings for SnpEff
92 <param name="chr" type="hidden" value="" />
93 <param name="min_cov" type="hidden" value="" />
94 <param name="min_qual" type="hidden" value="" />
95 <param name="no_ds" type="hidden" value="" />
96 <param name="no_us" type="hidden" value="" />
97 <param name="no_intron" type="hidden" value="" />
98 <param name="no_intergenic" type="hidden" value="" />
99 <param name="no_utr" type="hidden" value="" />
100 <param name="ud" type="hidden" value="" />
101 </when>
102 <when value="change">
103 <param checked="false" falsevalue="" label="prepend 'chr' to chromosome names, e.g., 'chr7' instead of '7'" name="chr" truevalue="-chr" type="boolean" />
104 <param help="do not include variants with a coverage lower than this value" label="minimum coverage (default = not used)" name="min_cov" optional="true" type="integer" />
105 <param help="do not include variants with a quality lower than this value" label="minimum quality (default = not used)" name="min_qual" optional="true" type="integer" />
106 <param checked="false" falsevalue="" help="annotation of effects on the downstream region of genes can be suppressed" label="do not show downstream changes" name="no_ds" truevalue="--no-downstream" type="boolean" />
107 <param checked="false" falsevalue="" help="annotation of effects on the upstream region of genes can be suppressed" label="do not show upstream changes" name="no_us" truevalue="--no-upstream" type="boolean" />
108 <param checked="false" falsevalue="" help="annotation of effects on introns of genes can be suppressed" label="do not show intron changes" name="no_intron" truevalue="--no-intron" type="boolean" />
109 <param checked="false" falsevalue="" help="annotation of effects on intergenic regions can be suppressed" label="do not show intergenic changes" name="no_intergenic" truevalue="--no-intergenic" type="boolean" />
110 <param checked="false" falsevalue="" help="annotation of effects on the untranslated regions of genes can be suppressed" label="do not show UTR changes" name="no_utr" truevalue="--no-utr" type="boolean" />
111 <param help="specify the upstream/downstream interval length, i.e., variants more than INTERVAL nts from the next annotated gene are considered to be intergenic" label="upstream downstream interval length (default = 5000 bases)" name="ud" optional="true" type="integer" />
112 </when>
113 </conditional>
114 </when>
115 </conditional>
116 </inputs>
117
118 <outputs>
119 <data format="html" name="outputfile">
120 <change_format>
121 <when format="tabular" input="formatting.oformat" value="text" />
122 </change_format>
123 </data>
124 <data format="vcf" name="snpeff_file">
125 <filter>(annotool['name']=="snpeff" and annotool['ori_output'])</filter>
126 </data>
127 <data format="html" name="summary_file">
128 <filter>(annotool['name']=="snpeff" and annotool['stats'])</filter>
129 </data>
130 </outputs>
131
132 <help>
133 .. class:: infomark
134
135 **What it does**
136
137 The tool turns a variant list in VCF format into a more readable summary table listing variant sites and effects.
138
139 If installed, the variant annotation tool SnpEff can be used transparently to determine the genomic features, e.g., genes or transcripts, affected by the variants.
140
141 Use of this feature requires that you have an appropriate SnpEff genome file installed on the host machine. You can use the *List installed SnpEff genomes* tool to generate a list of all available SnpEff genomes.
142 This list can then be used (by selecting the dataset as the *genome list*) to populate the *genome* dropdown menu, from which you can select the SnpEff genome file to be used for the annotation.
143
144 As output file formats HTML or plain text are supported.
145 In HTML mode, variant positions and/or affected genomic features can be turned into hyperlinks to corresponding views in web-based genome browsers and databases.
146
147 The behavior of this feature depends on:
148
149 1) Recognition of the species that is analyzed
150
151 You can declare the species you are working with using the *Species* text field.
152 If you are not declaring the species explicitly, but are choosing SnpEff for effect annotation, the tool will usually be able to auto-detect the species from the SnpEff genome you are using.
153 If no species gets assigned in either way, no hyperlinks will be generated and the html output will look essentially like plain text.
154
155 2) Available hyperlink formatting rules for this species
156
157 When the species has been recognized, the tool checks if you have selected an *optional file with hyperlink formatting instructions*.
158 If you did and that file contains an entry matching the recognized species, that entry will be used as a template to construct the hyperlinks.
159 If no matching entry is found in the file, an error will be raised.
160
161 If you did not supply a hyperlink formatting instruction file, the tool will consult an internal lookup table to see if it finds default rules for the construction of the hyperlinks for the species.
162 If not, no hyperlinks will be generated and the html output will look essentially like plain text.
163
164 **TIP:**
165 MiModD's internal hyperlink formatting lookup tables are maintained and growing with every new version, but since weblinks are changing frequently as well, it is possible that you will encounter broken hyperlinks for your species of interest. In such a case, you can resort to two things: `tell us about the problem`_ to make sure it gets fixed in the next release and, in the meantime, use a custom file with hyperlink formatting instructions to overwrite the default entry for your species.
166
167 .. _tell us about the problem: mailto:mimodd@googlegroups.com
168 </help>
169 </tool>