annotate polyphen2_web/polyphen2_web.xml @ 3:3c40b02934ad draft default tip

Uploaded
author saketkc
date Tue, 07 Oct 2014 18:56:07 -0400
parents f8f4ad14f5a6
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
1 <tool id="polyphen2_web" name="PolyPhen-2 Webservice">
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
2 <description>Compute functional impact of SNVs </description>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
3 <requirements>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
4 <requirement type="package" version="4.1.0">beautifulsoup4</requirement>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
5 <requirement type="python-module">bs4</requirement>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
6 </requirements>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
7 <command interpreter="python">
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
8 polyphen2_web.py --ucscdb $ucscdb
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
9 --model $model
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
10 --filter $filter
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
11 --function $function
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
12 --input $input
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
13 --log $log_file
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
14 --full $full_file
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
15 --short $short_file
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
16 --snp $snp_file
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
17 </command>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
18 <inputs>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
19 <param format="txt" name="input" type="data" label="Variants File" />
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
20 <param name="ucscdb" type="select" label="Genome Assembly">
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
21 <option value="hg19">GRCh37/hg19</option>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
22 <option value="hg18">NCBI36/hg18</option>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
23 </param>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
24 <param name="model" type="select" label="Classifier Model">
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
25 <option value="HumDiv">HumDiv</option>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
26 <option value="HumVar">HumVar</option>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
27 </param>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
28 <param name="filter" type="select" label="Transcripts">
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
29 <option value="All">All</option>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
30 <option value="Canonical">Canonical</option>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
31 <option value="CCDS">CCDS</option>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
32 </param>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
33 <param name="function" type="select" label="Annotations">
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
34 <option value="c">Canonical</option>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
35 <option value="m">CCDS</option>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
36 <option value="All">All</option>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
37 </param>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
38 </inputs>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
39 <outputs>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
40 <data format="tabular" name="log_file" label="${tool.name} on ${on_string}: log" />
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
41 <data format="tabular" name="full_file" label="${tool.name} on ${on_string}: full"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
42 <data format="tabular" name="short_file" label="${tool.name} on ${on_string}: short"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
43 <data format="tabular" name="snp_file" label="${tool.name} on ${on_string}: snp"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
44 </outputs>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
45
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
46 <tests>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
47 <test>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
48 <param name="input" value="polyphen2_input.txt"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
49 <param name="ucscdb" value="hg19"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
50 <param name="model" value="HumDiv"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
51 <param name="filter" value="All"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
52 <param name="function" value="All"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
53 <output name="log_file" file="polyphen2_log.txt"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
54 <output name="full_file" file="polyphen2_full.txt"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
55 <output name="short_file" file="polyphen2_short.txt"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
56 <output name="snp_file" file="polyphen2_snp.txt"/>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
57 </test>
3
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
58 <test>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
59 <param name="input" value="polyphen_input.txt"/>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
60 <param name="ucscdb" value="hg19"/>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
61 <param name="model" value="HumDiv"/>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
62 <param name="filter" value="All"/>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
63 <param name="function" value="All"/>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
64 <output name="log_file" file="polyphen_output_log.tsv"/>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
65 <output name="full_file" file="polyphen_output_full.tsv"/>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
66 <output name="short_file" file="polyphen_output_short.tsv"/>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
67 <output name="snp_file" file="polyphen_output_snp.tsv"/>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
68 </test>
3c40b02934ad Uploaded
saketkc
parents: 2
diff changeset
69
0
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
70 </tests>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
71 <help>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
72 **What it does**
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
73 This tool interacts with the Web Version of Polyphen2 hosted at http://genetics.bwh.harvard.edu/pph2/
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
74
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
75 PolyPhen-2 (Polymorphism Phenotyping v2) is a software tool which predicts possible impact of amino acid substitutions
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
76 on the structure and function of human proteins using straightforward physical and evolutionary comparative considerations.
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
77
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
78 .. class:: infomark
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
79
2
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
80 *Classifier model* used by the probabilistic predictor:
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
81
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
82 -HumDiv is preferred for evaluating rare alleles, dense mapping of regions identified by genome-wide association studies,
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
83 and analysis of natural selection. HumDiv model uses 5% / 10% FPR thresholds for “probably damaging” / “possibly damaging” predictions
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
84
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
85
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
86 -HumVar is better suited for diagnostics of Mendelian diseases which requires distinguishing mutations with drastic effects
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
87 from all the remaining human variation, including abundant mildly deleterious alleles.
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
88 HumVar model uses 10% / 20% FPR thresholds for “probably damaging” / “possibly damaging” predictions
0
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
89
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
90 .. class:: infomark
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
91
2
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
92 *Transcripts* A set of Transcripts on which genomic SNPs will be mapped:
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
93
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
94
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
95 -*All* includes all UCSC knownGene transcripts (highly redundant)
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
96
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
97 -*Canonical* includes UCSC knownCanonical subset
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
98
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
99 -*CCDS* further restricts knownCanonical subset to those transcripts which are also annotated as part of NCBI CCDS.
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
100
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
101
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
102 .. class:: infomark
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
103
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
104 *Annotations* for the following functional categories of genomic SNPs will be included in the output:
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
105
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
106
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
107 -*All*: coding-synon, introns, nonsense missense utr-3, utr-5.
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
108
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
109
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
110 -*Coding*: coding-synon, nonsense. missense
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
111
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
112
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
113 -*Missense*: missense.
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
114
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
115
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
116
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
117 .. class:: warningmark
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
118
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
119 Note that PolyPhen-2 predictions are always produced for missense
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
120
0
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
121
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
122 .. class:: infomark
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
123
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
124
2
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
125 Input format:
0
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
126
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
127
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
128 chr22:30421786 A/T
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
129
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
130 chr22:29446079 A/G
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
131
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
132 chr22:40814500 A/G
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
133
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
134 chr22:40815256 C/T
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
135
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
136
2
f8f4ad14f5a6 Uploaded
saketkc
parents: 0
diff changeset
137
0
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
138 **Citations**
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
139
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
140 If you use this tool please cite:
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
141
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
142 Adzhubei IA, Schmidt S, Peshkin L, Ramensky VE, Gerasimova A, Bork P, Kondrashov AS, Sunyaev SR. Nat Methods 7(4):248-249 (2010).
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
143 "A method and server for predicting damaging missense mutations."
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
144
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
145 </help>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
146 </tool>
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
147
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
148
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
149
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
150
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
151
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
152
b319f980c9e6 Uploaded
saketkc
parents:
diff changeset
153