annotate vcftools_compare.xml @ 0:937918765b6e draft default tip

Uploaded
author devteam
date Sun, 24 Nov 2013 11:01:23 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
937918765b6e Uploaded
devteam
parents:
diff changeset
1 <tool id="vcftools_compare" name="Compare" version="0.1">
937918765b6e Uploaded
devteam
parents:
diff changeset
2 <description>multiple VCF datasets</description>
937918765b6e Uploaded
devteam
parents:
diff changeset
3
937918765b6e Uploaded
devteam
parents:
diff changeset
4 <requirements>
937918765b6e Uploaded
devteam
parents:
diff changeset
5 <requirement type="package">tabix</requirement>
937918765b6e Uploaded
devteam
parents:
diff changeset
6 <requirement type="package" version="0.1.11">vcftools</requirement>
937918765b6e Uploaded
devteam
parents:
diff changeset
7 </requirements>
937918765b6e Uploaded
devteam
parents:
diff changeset
8
937918765b6e Uploaded
devteam
parents:
diff changeset
9 <command>
937918765b6e Uploaded
devteam
parents:
diff changeset
10 ## Preprocess each dataset (sort, bgzip-compress, tabix-index) and collect the resulting file names.
937918765b6e Uploaded
devteam
parents:
diff changeset
11 #set dataset_names = []
937918765b6e Uploaded
devteam
parents:
diff changeset
12 #for $input in $inputs:
937918765b6e Uploaded
devteam
parents:
diff changeset
13 ## Sort records by chromosome, then numerically by position. Header lines (those starting with a hash) are written first in their original order so the VCF header is not scrambled by sort; the hash in the grep patterns is backslash-escaped so Cheetah does not treat it as a directive.
937918765b6e Uploaded
devteam
parents:
diff changeset
14 ( grep '^\#' ${input.file} ; grep -v '^\#' ${input.file} | sort -k1,1 -k2,2n ) > ${input.name}.vcf.sorted ;
937918765b6e Uploaded
devteam
parents:
diff changeset
15
937918765b6e Uploaded
devteam
parents:
diff changeset
16 ## Compress.
937918765b6e Uploaded
devteam
parents:
diff changeset
17 bgzip ${input.name}.vcf.sorted ;
937918765b6e Uploaded
devteam
parents:
diff changeset
18
937918765b6e Uploaded
devteam
parents:
diff changeset
19 ## Index.
937918765b6e Uploaded
devteam
parents:
diff changeset
20 tabix -p vcf ${input.name}.vcf.sorted.gz ;
937918765b6e Uploaded
devteam
parents:
diff changeset
21
937918765b6e Uploaded
devteam
parents:
diff changeset
22 #silent dataset_names.append( str($input.name) + '.vcf.sorted.gz' )
937918765b6e Uploaded
devteam
parents:
diff changeset
23 #end for
937918765b6e Uploaded
devteam
parents:
diff changeset
24
937918765b6e Uploaded
devteam
parents:
diff changeset
25 ## Compare the prepared datasets; sed strips the '.vcf.sorted.gz' suffix so the report shows the user-supplied dataset names.
937918765b6e Uploaded
devteam
parents:
diff changeset
26 vcf-compare -w ${window} ${ignore_indels} #echo ' '.join( dataset_names )# | sed 's/\.vcf\.sorted\.gz//g' > ${output}
937918765b6e Uploaded
devteam
parents:
diff changeset
27 </command>
937918765b6e Uploaded
devteam
parents:
diff changeset
28 <inputs>
937918765b6e Uploaded
devteam
parents:
diff changeset
29 <repeat name="inputs" title="Datasets to Compare" min="2">
937918765b6e Uploaded
devteam
parents:
diff changeset
30 <param name="name" label="Dataset name" type="text" />
937918765b6e Uploaded
devteam
parents:
diff changeset
31 <param name="file" label="Dataset" type="data" format="vcf"/>
937918765b6e Uploaded
devteam
parents:
diff changeset
32 </repeat>
937918765b6e Uploaded
devteam
parents:
diff changeset
33 <param name="window" label="Comparison window" type="integer" min="0" value="0" help="In repetitive sequences, the same indel can be called at different positions. Consider records this far apart as matching (be it a SNP or an indel)."/>
937918765b6e Uploaded
devteam
parents:
diff changeset
34
937918765b6e Uploaded
devteam
parents:
diff changeset
35 <param name="ignore_indels" label="Ignore indels" type="select" help="Exclude sites containing indels from genotype comparison">
937918765b6e Uploaded
devteam
parents:
diff changeset
36 <option value="" selected="True">No</option>
937918765b6e Uploaded
devteam
parents:
diff changeset
37 <option value="--ignore-indels">Yes</option>
937918765b6e Uploaded
devteam
parents:
diff changeset
38 </param>
937918765b6e Uploaded
devteam
parents:
diff changeset
39 </inputs>
937918765b6e Uploaded
devteam
parents:
diff changeset
40
937918765b6e Uploaded
devteam
parents:
diff changeset
41 <outputs>
937918765b6e Uploaded
devteam
parents:
diff changeset
42 <data name="output" format="tabular"/>
937918765b6e Uploaded
devteam
parents:
diff changeset
43 </outputs>
937918765b6e Uploaded
devteam
parents:
diff changeset
44
937918765b6e Uploaded
devteam
parents:
diff changeset
45 <stdio>
937918765b6e Uploaded
devteam
parents:
diff changeset
46 <regex match=".*" source="both" level="log" description="tool progress"/>
937918765b6e Uploaded
devteam
parents:
diff changeset
47 </stdio>
937918765b6e Uploaded
devteam
parents:
diff changeset
48
937918765b6e Uploaded
devteam
parents:
diff changeset
49 <tests>
937918765b6e Uploaded
devteam
parents:
diff changeset
50 <!-- Cannot specify multiple repeats in test framework right now, so no tests possible. -->
937918765b6e Uploaded
devteam
parents:
diff changeset
51 </tests>
937918765b6e Uploaded
devteam
parents:
diff changeset
52
937918765b6e Uploaded
devteam
parents:
diff changeset
53 <help>
937918765b6e Uploaded
devteam
parents:
diff changeset
54 Please see the VCFtools `documentation`__ for help and further information.
937918765b6e Uploaded
devteam
parents:
diff changeset
55
937918765b6e Uploaded
devteam
parents:
diff changeset
56 .. __: http://vcftools.sourceforge.net/docs.html
937918765b6e Uploaded
devteam
parents:
diff changeset
57 </help>
937918765b6e Uploaded
devteam
parents:
diff changeset
58 </tool>