annotate cgatools_suite/tools/cgatools/calldiff.xml @ 7:96829b1b73ea draft

Uploaded
author bcrain-completegenomics
date Wed, 06 Jun 2012 16:58:26 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
7
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
1 <tool id="cga_calldiff" name="calldiff(beta)" version="0.0.1">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
2
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
3 <description>compares two Complete Genomics variant files.</description> <!--adds description in toolbar-->
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
4
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
5 <requirements>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
6 <requirement type="binary">cgatools</requirement>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
7 </requirements>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
8
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
9 <command> <!--run executable-->
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
10 cgatools calldiff --beta
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
11 --reference '${crr.fields.path}' <!--paths are quoted so one containing spaces stays a single argument-->
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
12 --variantsA '$data_sources.inputA'
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
13 --variantsB '$data_sources.inputB'
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
14 $validation
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
15 $diploid
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
16 --locus-stats-column-count $column
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
17 --max-hypothesis-count $hypothesis
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
18 --output-prefix cg_
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
19 --reports `echo ${report1} ${report2} ${report3} ${report4} ${report5} ${somatic.report6} | tr ' ' ','` <!--echo collapses the blanks left by unselected reports; tr then turns each remaining single space into a comma-->
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
20 #if $somatic.report6 == "SomaticOutput"
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
21 --genome-rootA '$somatic.genomeA' <!--directories are quoted so one containing spaces stays a single argument-->
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
22 --genome-rootB '$somatic.genomeB'
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
23 --calibration-root '$somatic.calibration'
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
24 #end if
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
25 </command>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
26
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
27 <outputs>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
28 <data format="tabular" name="output1" from_work_dir="cg_SuperlocusOutput.tsv" label="${tool.name} on ${on_string}: SuperlocusOutput">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
29 <filter>(report1 == 'SuperlocusOutput')</filter>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
30 </data>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
31 <data format="tabular" name="output2" from_work_dir="cg_SuperlocusStats.tsv" label="${tool.name} on ${on_string}: SuperlocusStats">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
32 <filter>(report2 == 'SuperlocusStats')</filter>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
33 </data>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
34 <data format="tabular" name="output3" from_work_dir="cg_LocusOutput.tsv" label="${tool.name} on ${on_string}: LocusOutput">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
35 <filter>(report3 == 'LocusOutput')</filter>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
36 </data>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
37 <data format="tabular" name="output4" from_work_dir="cg_LocusStats.tsv" label="${tool.name} on ${on_string}: LocusStats">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
38 <filter>(report4 == 'LocusStats')</filter>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
39 </data>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
40 <data format="tabular" name="output5a" from_work_dir="cg_VariantsA.tsv" label="${tool.name} on ${on_string}: VariantsA">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
41 <filter>(report5 == 'VariantOutput')</filter>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
42 </data>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
43 <data format="tabular" name="output5b" from_work_dir="cg_VariantsB.tsv" label="${tool.name} on ${on_string}: VariantsB">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
44 <filter>(report5 == 'VariantOutput')</filter>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
45 </data>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
46 <data format="tabular" name="output6" from_work_dir="cg_SomaticOutput.tsv" label="${tool.name} on ${on_string}: SomaticOutput">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
47 <filter>(somatic['report6'] == 'SomaticOutput')</filter>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
48 </data>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
49 </outputs>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
50
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
51 <inputs>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
52 <!--form field to select crr file-->
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
53 <param name="crr" type="select" label="Genome build">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
54 <options from_data_table="cg_crr_files" />
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
55 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
56
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
57 <!--conditional to select variant file input-->
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
58 <conditional name="data_sources">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
59 <param name="data_source" type="select" label="Where are the input varfiles?">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
60 <option value="in" selected="true">imported into Galaxy</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
61 <option value="out">located outside Galaxy (available only for local Galaxy instances)</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
62 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
63 <when value="in">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
64 <!--form field to select variant files-->
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
65 <param name="inputA" type="data" format="cg_var" label="Dataset A">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
66 <validator type="unspecified_build" />
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
67 <validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
68 metadata_name="dbkey" metadata_column="1"
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
69 message="cgatools is not currently available for this build."/>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
70 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
71 <param name="inputB" type="data" format="cg_var" label="Dataset B">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
72 <validator type="unspecified_build" />
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
73 <validator type="dataset_metadata_in_file" filename="cg_crr_files.loc"
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
74 metadata_name="dbkey" metadata_column="1"
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
75 message="cgatools is not currently available for this build."/>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
76 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
77 </when>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
78 <when value="out">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
79 <!--form fields to enter the paths of variant files located outside Galaxy-->
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
80 <param name="inputA" type="text" label="Variant file A (path/file_name)" size="300" help="Variant files can be compressed (gz, bz2)."/>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
81 <param name="inputB" type="text" label="Variant file B (path/file_name)" size="300" help="Variant files can be compressed (gz, bz2)."/>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
82 </when>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
83 </conditional>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
84
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
85 <param name="diploid" type="select" label="Use diploid variant model" help="Uses varScoreEAF instead of varScoreVAF in somatic score computations. Also, uses diploid variant model instead of variable allele mixture model.">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
86 <option value="">no</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
87 <option value="--diploid">yes</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
88 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
89
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
90 <param name="column" type="integer" label="Number of columns for locus compare classification in the locus stats file (default 15)" value="15"/>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
91
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
92 <param name="hypothesis" type="integer" label="Maximum number of possible phasings to consider for a superlocus (default 32)" value="32"/>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
93
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
94 <param name="validation" type="select" label="Reference cover validation" help="Turns on/off validation that all bases of a chromosome are covered by calls of the variant file.">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
95 <option value="">on</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
96 <option value="--no-reference-cover-validation">off</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
97 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
98
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
99 <param name="report1" type="select" label="Report SuperlocusOutput">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
100 <option value="">no</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
101 <option value="SuperlocusOutput">yes</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
102 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
103 <param name="report2" type="select" label="Report SuperlocusStats">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
104 <option value="">no</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
105 <option value="SuperlocusStats">yes</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
106 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
107 <param name="report3" type="select" label="Report LocusOutput">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
108 <option value="">no</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
109 <option value="LocusOutput">yes</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
110 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
111 <param name="report4" type="select" label="Report LocusStats">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
112 <option value="">no</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
113 <option value="LocusStats">yes</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
114 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
115 <param name="report5" type="select" label="Report VariantOutput" help="Both variant files annotated by comparison results. If the somatic output report is requested, file A is also annotated with the same score ranks as produced in that report.">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
116 <option value="">no</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
117 <option value="VariantOutput">yes</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
118 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
119
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
120 <conditional name="somatic">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
121 <param name="report6" type="select" label="Report SomaticOutput" help="This report can only be generated on local Galaxy instances. Report for the list of simple variations that are present only in file 'A', annotated with the score that indicates the probability of the variation being truly somatic. Note: generating this report slows calldiff by 10x-20x.">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
122 <option value="">no</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
123 <option value="SomaticOutput">yes</option>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
124 </param>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
125 <when value="SomaticOutput">
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
126 <param name="genomeA" type="text" size="300" label="Directory for genome A (path/dir)" help="The 'A' genome directory, for example /data/GS00118-DNA_A01; this directory is expected to contain ASM/REF and ASM/EVIDENCE subdirectories."/>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
127 <param name="genomeB" type="text" size="300" label="Directory for genome B (path/dir)" help="The 'B' genome directory"/>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
128 <param name="calibration" type="text" size="300" label="Directory calibration data (path/dir)" help="The directory containing calibration data. For example, there should exist a file calibration-root/0.0.0/metrics.tsv. Calibration data can be downloaded from ftp://ftp.completegenomics.com/ScoreCalibrationFiles/var-calibration-v1.tgz"/>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
129 </when>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
130 </conditional>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
131
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
132 </inputs>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
133
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
134 <help>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
135
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
136 **What it does**
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
137
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
138 This tool compares two Complete Genomics variant files.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
139
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
140 cgatools: http://sourceforge.net/projects/cgatools/files/
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
141
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
142 -----
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
143
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
144 **cgatools Manual**::
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
145
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
146 COMMAND NAME
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
147 calldiff - Compares two Complete Genomics variant files.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
148
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
149 DESCRIPTION
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
150 Compares two Complete Genomics variant files. Divides the genome up into
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
151 superloci of nearby variants, then compares the superloci. Also refines the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
152 comparison to determine per-call or per-locus comparison results.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
153
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
154 Comparison results are usually described by a semi-colon separated string,
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
155 one per allele. Each allele's comparison result is one of the following
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
156 classifications:
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
157
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
158 ref-identical The alleles of the two variant files are identical, and
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
159 they are consistent with the reference.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
160 alt-identical The alleles of the two variant files are identical, and
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
161 they are inconsistent with the reference.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
162 ref-consistent The alleles of the two variant files are consistent,
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
163 and they are consistent with the reference.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
164 alt-consistent The alleles of the two variant files are consistent,
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
165 and they are inconsistent with the reference.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
166 onlyA The alleles of the two variant files are inconsistent,
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
167 and only file A is inconsistent with the reference.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
168 onlyB The alleles of the two variant files are inconsistent,
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
169 and only file B is inconsistent with the reference.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
170 mismatch The alleles of the two variant files are inconsistent,
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
171 and they are both inconsistent with the reference.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
172 phase-mismatch The two variant files would be consistent if the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
173 hapLink field had been empty, but they are
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
174 inconsistent.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
175 ploidy-mismatch The superlocus did not have uniform ploidy.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
176
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
177 In some contexts, this classification is rolled up into a simplified
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
178 classification, which is one of "identical", "consistent", "onlyA",
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
179 "onlyB", or "mismatch".
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
180
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
181 A good place to start looking at the results is the superlocus-output file.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
182 It has columns defined as follows:
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
183
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
184 SuperlocusId An identifier given to the superlocus.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
185 Chromosome The name of the chromosome.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
186 Begin The 0-based offset of the start of the superlocus.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
187 End The 0-based offset of the base one past the end of the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
188 superlocus.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
189 Classification The match classification of the superlocus.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
190 Reference The reference sequence.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
191 AllelesA A semicolon-separated list of the alleles (one per
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
192 haplotype) for variant file A, for the phasing with the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
193 best comparison result.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
194 AllelesB A semicolon-separated list of the alleles (one per
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
195 haplotype) for variant file B, for the phasing with the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
196 best comparison result.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
197
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
198 The locus-output file contains, for each locus in file A and file B that is
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
199 not consistent with the reference, an annotated set of calls for the locus.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
200 The calls are annotated with the following columns:
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
201
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
202 SuperlocusId The id of the superlocus containing the locus.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
203 File The variant file (A or B).
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
204 LocusClassification The locus classification is determined by the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
205 varType column of the call that is inconsistent
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
206 with the reference, concatenated with a
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
207 modifier that describes whether the locus is
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
208 heterozygous, homozygous, or contains no-calls.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
209 If there is no one variant in the locus (i.e.,
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
210 it is heterozygous alt-alt), the locus
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
211 classification begins with "other".
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
212 LocusDiffClassification The match classification for the locus. This is
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
213 defined to be the best of the comparison of the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
214 locus to the same region in the other file, or
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
215 the comparison of the superlocus.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
216
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
217 The somatic output file contains a list of putative somatic variations of
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
218 genome A. The output includes only those loci that can be classified as
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
219 snp, del, ins or sub in file A, and are called reference in the file B.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
220 Every locus is annotated with the following columns:
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
221
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
222 VarCvgA The totalReadCount from file A for this locus
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
223 (computed on the fly if file A is not a
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
224 masterVar file).
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
225 VarScoreA The varScoreVAF from file A, or varScoreEAF if
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
226 the "--diploid" option is used.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
227 RefCvgB The maximum of the uniqueSequenceCoverage
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
228 values for the locus in genome B.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
229 RefScoreB Minimum of the reference scores of the locus in
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
230 genome B.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
231 SomaticCategory The category used for determining the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
232 calibrated scores and the SomaticRank.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
233 VarScoreACalib The calibrated variant score of file A, under
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
234 the model selected by using or not using the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
235 "--diploid" option, and corrected for the count
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
236 of heterozygous variants observed in this
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
237 genome. See user guide for more information.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
238 VarScoreBCalib The calibrated reference score of file B, under
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
239 the model selected by using or not using the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
240 "--diploid" option, and corrected for the count
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
241 of heterozygous variants observed in this
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
242 genome. See user guide for more information.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
243 SomaticRank The estimated rank of this somatic mutation,
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
244 amongst all true somatic mutations within this
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
245 SomaticCategory. The value is a number between
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
246 0 and 1; a value of 0.012 means, for example,
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
247 that an estimated 1.2% of the true somatic
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
248 mutations in this somaticCategory have a
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
249 somaticScore less than the somaticScore for
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
250 this mutation. See user guide for more
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
251 information.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
252 SomaticScore An integer that provides a total order on
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
253 quality for all somatic mutations. It is equal
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
254 to -10*log10( P(false)/P(true) ), under the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
255 assumption that this genome has a rate of
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
256 somatic mutation equal to 1/Mb for
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
257 SomaticCategory snp, 1/10Mb for SomaticCategory
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
258 ins, 1/10Mb for SomaticCategory del, and 1/20Mb
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
259 for SomaticCategory sub. The computation is
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
260 based on the assumptions described in the user
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
261 guide, and is affected by choice of variant
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
262 model selected by using or not using the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
263 "--diploid" option.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
264 SomaticQuality Equal to VQHIGH for all somatic mutations where
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
265 SomaticScore &gt;= -10. Otherwise, this column is
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
266 empty.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
267
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
268 OPTIONS
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
269 -h [ --help ]
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
270 Print this help message.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
271
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
272 --reference arg
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
273 The input crr file.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
274
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
275 --variantsA arg
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
276 The "A" input variant file.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
277
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
278 --variantsB arg
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
279 The "B" input variant file.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
280
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
281 --output-prefix arg
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
282 The path prefix for all output reports.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
283
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
284 --reports arg (=SuperlocusOutput,SuperlocusStats,LocusOutput,LocusStats)
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
285 Comma-separated list of reports to generate. (Beware any reports whose
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
286 name begins with "Debug".) A report is one of:
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
287 SuperlocusOutput Report for superlocus classification.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
288 SuperlocusStats Report for superlocus classification stats.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
289 LocusOutput Report for locus classification.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
290 LocusStats Report for locus stats.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
291 VariantOutput Both variant files annotated by comparison
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
292 results. If the somatic output report is
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
293 requested, file A is also annotated with the
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
294 same score ranks as produced in that report.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
295 SomaticOutput Report for the list of simple variations that
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
296 are present only in file "A", annotated with
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
297 the score that indicates the probability of
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
298 the variation being truly somatic. Requires
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
299 beta, genome-rootA, and genome-rootB options
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
300 to be provided as well. Note: generating this
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
301 report slows calldiff by 10x-20x.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
302 DebugCallOutput Report for call classification.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
303 DebugSuperlocusOutput Report for debug superlocus information.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
304 DebugSomaticOutput Report for distribution estimates used for
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
305 somatic rescoring. Only produced if
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
306 SomaticOutput is also turned on.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
307
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
308 --diploid
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
309 Uses varScoreEAF instead of varScoreVAF in somatic score computations.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
310 Also, uses diploid variant model instead of variable allele mixture
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
311 model.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
312
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
313 --locus-stats-column-count arg (=15)
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
314 The number of columns for locus compare classification in the locus
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
315 stats file.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
316
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
317 --max-hypothesis-count arg (=32)
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
318 The maximum number of possible phasings to consider for a superlocus.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
319
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
320 --no-reference-cover-validation
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
321 Turns off validation that all bases of a chromosome are covered by
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
322 calls of the variant file.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
323
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
324 --genome-rootA arg
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
325 The "A" genome directory, for example /data/GS00118-DNA_A01; this
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
326 directory is expected to contain ASM/REF and ASM/EVIDENCE
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
327 subdirectories.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
328
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
329 --genome-rootB arg
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
330 The "B" genome directory.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
331
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
332 --calibration-root arg
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
333 The directory containing calibration data. For example, there should
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
334 exist a file calibration-root/0.0.0/metrics.tsv.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
335
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
336 --beta
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
337 This flag enables the SomaticOutput report, which is beta
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
338 functionality.
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
339
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
340 SUPPORTED FORMAT_VERSION
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
341 0.3 or later
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
342 </help>
96829b1b73ea Uploaded
bcrain-completegenomics
parents:
diff changeset
343 </tool>