comparison snpSift_caseControl.xml @ 24:f22f28cd881e

Update for snpEff v3.2
author Jim Johnson <jj@umn.edu>
date Tue, 07 May 2013 14:58:15 -0500
parents 50c1a8ff6c82
children
comparison
equal deleted inserted replaced
23:50c1a8ff6c82 24:f22f28cd881e
1 <tool id="snpSift_caseControl" name="SnpSift CaseControl" version="3.1"> 1 <tool id="snpSift_caseControl" name="SnpSift CaseControl" version="3.2">
2 <description>Count samples are in 'case' and 'control' groups.</description> 2 <description>Count samples are in 'case' and 'control' groups.</description>
3 <!-- 3 <!--
4 You will need to change the path to wherever your installation is. 4 You will need to change the path to wherever your installation is.
5 You can change the amount of memory used, just change the -Xmx parameter (e.g. use -Xmx2G for 2Gb of memory) 5 You can change the amount of memory used, just change the -Xmx parameter (e.g. use -Xmx2G for 2Gb of memory)
6 --> 6 -->
7 <requirements> 7 <requirements>
8 <requirement type="package" version="3.1">snpEff</requirement> 8 <requirement type="package" version="3.2">snpEff</requirement>
9 </requirements> 9 </requirements>
10 <command> 10 <command>
11 java -Xmx1G -jar \$JAVA_JAR_PATH/SnpSift.jar casControl -q $hhCase $hhControl $caseControStr $input > $output 11 java -Xmx1G -jar \$JAVA_JAR_PATH/SnpSift.jar caseControl -q
12 </command> 12 #if $name.__str__.strip() != '':
13 <inputs> 13 -name $name
14 <param format="vcf" name="input" type="data" label="VCF input"/> 14 #end if
15 <param name="hhCase" type="select" label="Hom/Het case"> 15 #if $ctrl.ctrl_src == 'caseString':
16 <option value="any">Any</option> 16 '$ctrl.caseControlStr'
17 <option value="hom">Homozygous</option> 17 #else
18 <option value="het">Heterozygous</option> 18 -tfam "$ctrl.tfam"
19 </param> 19 #end if
20 <param name="hhControl" type="select" label="Hom/Het control"> 20 $input > $output
21 <option value="any">Any</option> 21 </command>
22 <option value="hom">Homozygous</option> 22 <inputs>
23 <option value="het">Heterozygous</option> 23 <param format="vcf" name="input" type="data" label="VCF input"/>
24 </param> 24 <conditional name="ctrl">
25 <param name="caseControStr" type="text" label="Case / Control" size="50"/> 25 <param name="ctrl_src" type="select" label="Case Control defined in">
26 </inputs> 26 <option value="caseString">Case Control String</option>
27 <outputs> 27 <option value="tfam">TFAM</option>
28 <data format="vcf" name="output" /> 28 </param>
29 </outputs> 29 <when value="caseString">
30 <param name="caseControlStr" type="text" label="Case / Control column designation" size="50">
31 <help>
32 Case and control are defined by a string containing plus and minus symbols {'+', '-', '0'} where '+' is case, '-' is control and '0' is neutral
33 </help>
34 <validator type="regex" message="must be only plus(+), minus(-), or zero(0) characters">[+-0]+</validator>
35 </param>
36 </when>
37 <when value="tfam">
38 <param format="tabular" name="tfam" type="data" label="PLINK TFAM file"/>
39 </when>
40 </conditional>
41 <param name="name" type="text" optional="true" label="name" help="name to append to the 'Cases' or 'Controls' tags">
42 <validator type="regex" message="Use only valid ID characters">[_a-zA-Z0-9]+</validator>
43 </param>
44 </inputs>
45 <outputs>
46 <data format="vcf" name="output" />
47 </outputs>
30 <stdio> 48 <stdio>
31 <exit_code range=":-1" level="fatal" description="Error: Cannot open file" /> 49 <exit_code range=":-1" level="fatal" description="Error: Cannot open file" />
32 <exit_code range="1:" level="fatal" description="Error" /> 50 <exit_code range="1:" level="fatal" description="Error" />
33 </stdio> 51 </stdio>
52 <tests>
34 53
35 <help> 54 <test>
55 <param name="input" ftype="vcf" value="test.private.01.vcf"/>
56 <param name="ctrl_src" value="caseString"/>
57 <param name="caseControlStr" value="--"/>
58 <output name="output">
59 <assert_contents>
60 <has_text text="Cases=0,0,0;" />
61 <has_text text="Controls=0,0,0;" />
62 </assert_contents>
63 </output>
64 </test>
36 65
37 Count samples are in 'case' and 'control' groups. You can count 'homozygous', 'heterozygous' or 'any' variants. Case and control are defined by a string containing plus and minus symbols ('+' and '-') where '+' is case and '-' is control. This command adds two annotations to the VCF file. 66 <test>
67 <param name="input" ftype="vcf" value="test.private.02.vcf"/>
68 <param name="ctrl_src" value="caseString"/>
69 <param name="caseControlStr" value="--"/>
70 <output name="output">
71 <assert_contents>
72 <has_text text="Cases=0,0,0;" />
73 <has_text text="Controls=2,0,4;" />
74 </assert_contents>
75 </output>
76 </test>
77
78 <test>
79 <param name="input" ftype="vcf" value="test.private.02.vcf"/>
80 <param name="name" value=""/>
81 <param name="ctrl_src" value="caseString"/>
82 <param name="caseControlStr" value="-+"/>
83 <output name="output">
84 <assert_contents>
85 <has_text text="Cases=1,0,2;" />
86 <has_text text="Controls=1,0,2;" />
87 </assert_contents>
88 </output>
89 </test>
90
91 </tests>
92
93 <help>
94
95 **SnpSift CaseControl**
96
97 Allows you to count how many samples are in 'case' group and a 'control' group. You can count 'homozygous', 'heterozygous' or 'any' variants.
98
99 Case and control are defined by a string containing plus and minus symbols {'+', '-', '0'} where '+' is case, '-' is control and '0' is neutral.
100
101 This command adds two annotations to the VCF file:
102
103 - **CaseControl**: Two comma separated numbers numbers representing the number of samples that have the variant in the case and the control group. Example:
104
105 "CaseControl=3,4" *the variant is present in 3 cases and 4 controls.*
106
107
108 - **CaseControlP**: A p-value (Fisher exact test) that the number of cases is N or more. Example:
109
110 "CaseControl=4,0;CaseControlP=3.030303e-02" *in this case the pValue of having 4 or more cases and zero controls is 0.03*
111
112
113 For example, if we have ten samples (which means ten genotype columns in the VCF file), the first four are 'case' and the last six are 'control', so the description string would be "++++------". Let's say we want to distinguish genotypes that are homozygous in 'case' and either homozygous or heterozygous in 'control'. We would set:
114
115 - Hom/Het case = "hom"
116
117 - Hom/Het control = "any"
118
119 - Case / Control column designation = ""++++------"
120
38 121
39 For details about this tool, please go to http://snpeff.sourceforge.net/SnpSift.html#casecontrol 122 For details about this tool, please go to http://snpeff.sourceforge.net/SnpSift.html#casecontrol
40 123
41 </help> 124 </help>
42 </tool> 125 </tool>