annotate cgatools/tools/cg_cgatools/snpdiff.xml @ 12:e59abf6c3d0b draft

Uploaded
author bcrain-completegenomics
date Thu, 14 Jun 2012 13:44:48 -0400
parents e183f52194a5
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
8
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
1 <tool id="cga_snpdiff" name="snpdiff" version="0.0.1">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
2
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
3 <description>compares snp calls to a Complete Genomics variant file.</description> <!--adds description in toolbar-->
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
4
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
5 <requirements>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
6 <requirement type="binary">cgatools</requirement>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
7 </requirements>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
8
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
9 <command> <!--run executable-->
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
10 cgatools snpdiff
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
11 --reference $crr.fields.path
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
12 --variants $varfile
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
13 --genotypes $genotype
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
14 --output-prefix cg_
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
15 --reports `echo ${report1} ${report2} ${report3} | sed 's/ */,/g'`
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
16 </command>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
17
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
18 <outputs>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
19 <data format="tabular" name="output1" from_work_dir="cg_Output.tsv" label="${tool.name} on ${on_string}: Output">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
20 <filter>(report1 == 'Output')</filter>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
21 </data>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
22 <data format="tabular" name="output2" from_work_dir="cg_Verbose.tsv" label="${tool.name} on ${on_string}: Verbose">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
23 <filter>(report2 == 'Verbose')</filter>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
24 </data>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
25 <data format="tabular" name="output3" from_work_dir="cg_Stats.tsv" label="${tool.name} on ${on_string}: Stats">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
26 <filter>(report3 == 'Stats')</filter>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
27 </data>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
28 </outputs>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
29
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
30 <inputs>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
31 <!--form field to select crr file-->
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
32 <param name="crr" type="select" label="Genome build">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
33 <options from_data_table="cg_crr_files" />
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
34 </param>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
35
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
36 <!--conditional to select variant file input-->
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
37 <conditional name="data_sources">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
38 <param name="data_source" type="select" label="Where is the input varfile?">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
39 <option value="in" selected="true">imported into Galaxy</option>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
40 <option value="out">located outside Galaxy (available only for local Galaxy instances)</option>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
41 </param>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
42 <when value="in">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
43 <!--form field to select variant files-->
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
44 <param name="varfile" type="data" format="cg_var" label="Var file">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
45 <validator type="unspecified_build" />
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
46 <validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
47 metadata_name="dbkey" metadata_column="1"
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
48 message="cgatools is not currently available for this build."/>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
49 </param>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
50 </when>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
51 <when value="out">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
52 <!--form field to select crr file-->
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
53 <param name="varfile" type="text" label="Variant file (/path/file_name)" size="40" help="Variant file can be compressed (gz, bz2)."/>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
54 </when>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
55 </conditional>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
56
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
57 <!--conditional to select genotypes file input-->
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
58 <param name="genotype" type="data" format="tabular" label="Genotypes file with SNP calls" help="The genotypes file is a tab-delimited file with at
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
59 least the following columns (additional columns may be given): Chromosome (Required), Offset0Based (Required), GenotypesStrand (Optional), Genotypes (Optional)">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
60 <validator type="unspecified_build" />
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
61 <validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
62 metadata_name="dbkey" metadata_column="1"
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
63 message="cgatools is not currently available for this build."/>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
64 </param>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
65
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
66 <param name="report1" type="select" label="Report Output">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
67 <option value="">no</option>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
68 <option value="Output">yes</option>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
69 </param>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
70 <param name="report2" type="select" label="Report Verbose">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
71 <option value="">no</option>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
72 <option value="Verbose">yes</option>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
73 </param>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
74 <param name="report3" type="select" label="Report Stats">
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
75 <option value="">no</option>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
76 <option value="Stats">yes</option>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
77 </param>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
78
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
79 </inputs>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
80
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
81 <help>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
82
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
83 **What it does**
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
84
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
85 This tool ompares snp calls to a Complete Genomics variant file.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
86
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
87 cgatools: http://sourceforge.net/projects/cgatools/files/
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
88
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
89 -----
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
90
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
91 **cgatools Manual**::
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
92
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
93 COMMAND NAME
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
94 snpdiff - Compares snp calls to a Complete Genomics variant file.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
95
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
96 DESCRIPTION
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
97 Compares the snp calls in the "genotypes" file to the calls in a Complete
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
98 Genomics variant file. The genotypes file is a tab-delimited file with at
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
99 least the following columns (additional columns may be given):
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
100
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
101 Chromosome (Required) The name of the chromosome.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
102 Offset0Based (Required) The 0-based offset in the chromosome.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
103 GenotypesStrand (Optional) The strand of the calls in the Genotypes
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
104 column (+ or -, defaults to +).
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
105 Genotypes (Optional) The calls, one per allele. The following
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
106 calls are recognized:
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
107 A,C,G,T A called base.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
108 N A no-call.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
109 - A deleted base.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
110 . A non-snp variation.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
111
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
112 The output is a tab-delimited file consisting of the columns of the
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
113 original genotypes file, plus the following additional columns:
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
114
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
115 Reference The reference base at the given position.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
116 VariantFile The calls made by the variant file, one per allele.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
117 The character codes are the same as is described for
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
118 the Genotypes column.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
119 DiscordantAlleles (Only if Genotypes is present) The number of
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
120 Genotypes alleles that are discordant with calls in
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
121 the VariantFile. If the VariantFile is described as
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
122 haploid at the given position but the Genotypes is
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
123 diploid, then each genotype allele is compared
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
124 against the haploid call of the VariantFile.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
125 NoCallAlleles (Only if Genotypes is present) The number of
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
126 Genotypes alleles that were no-called by the
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
127 VariantFile. If the VariantFile is described as
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
128 haploid at the given position but the Genotypes is
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
129 diploid, then a VariantFile no-call is counted twice.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
130
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
131 The verbose output is a tab-delimited file consisting of the columns of the
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
132 original genotypes file, plus the following additional columns:
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
133
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
134 Reference The reference base at the given position.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
135 VariantFile The call made by the variant file for one allele (there is
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
136 a line in this file for each allele). The character codes
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
137 are the same as is described for the Genotypes column.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
138 [CALLS] The rest of the columns are pasted in from the VariantFile,
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
139 describing the variant file line used to make the call.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
140
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
141 The stats output is a comma-separated file with several tables describing
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
142 the results of the snp comparison, for each diploid genotype. The tables
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
143 all describe the comparison result (column headers) versus the genotype
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
144 classification (row labels) in different ways. The "Locus classification"
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
145 tables have the most detailed match classifications, while the "Locus
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
146 concordance" tables roll these match classifications up into "discordance"
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
147 and "no-call". A locus is considered discordant if it is discordant for
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
148 either allele. A locus is considered no-call if it is concordant for both
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
149 alleles but has a no-call on either allele. The "Allele concordance"
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
150 describes the comparison result on a per-allele basis.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
151
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
152 OPTIONS
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
153 -h [ --help ]
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
154 Print this help message.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
155
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
156 --reference arg
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
157 The input crr file.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
158
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
159 --variants arg
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
160 The input variant file.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
161
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
162 --genotypes arg
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
163 The input genotypes file.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
164
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
165 --output-prefix arg
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
166 The path prefix for all output reports.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
167
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
168 --reports arg (=Output,Verbose,Stats)
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
169 Comma-separated list of reports to generate. A report is one of:
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
170 Output The output genotypes file.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
171 Verbose The verbose output file.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
172 Stats The stats output file.
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
173
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
174 SUPPORTED FORMAT_VERSION
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
175 0.3 or later
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
176 </help>
e183f52194a5 Uploaded
bcrain-completegenomics
parents:
diff changeset
177 </tool>