annotate add_fst_column.py @ 0:99a67ac88802 default tip

Uploaded
author rico
date Thu, 05 Apr 2012 14:22:50 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
99a67ac88802 Uploaded
rico
parents:
diff changeset
1 #!/usr/bin/env python
99a67ac88802 Uploaded
rico
parents:
diff changeset
2
99a67ac88802 Uploaded
rico
parents:
diff changeset
3 # <command interpreter="python">
99a67ac88802 Uploaded
rico
parents:
diff changeset
4 # add_fst_column.py "$input" "$p1_input" "$p2_input" "$data_source.choice" "$data_source.min_value" "$retain" "$discard_fixed" "$biased" "$output"
99a67ac88802 Uploaded
rico
parents:
diff changeset
5 # #for $individual, $individual_col in zip($input.dataset.metadata.individual_names, $input.dataset.metadata.individual_columns)
99a67ac88802 Uploaded
rico
parents:
diff changeset
6 # #set $arg = '%s:%s' % ($individual_col, $individual)
99a67ac88802 Uploaded
rico
parents:
diff changeset
7 # "$arg"
99a67ac88802 Uploaded
rico
parents:
diff changeset
8 # #end for
99a67ac88802 Uploaded
rico
parents:
diff changeset
9 # </command>
99a67ac88802 Uploaded
rico
parents:
diff changeset
10
99a67ac88802 Uploaded
rico
parents:
diff changeset
11 import sys
99a67ac88802 Uploaded
rico
parents:
diff changeset
12 import subprocess
99a67ac88802 Uploaded
rico
parents:
diff changeset
13 from Population import Population
99a67ac88802 Uploaded
rico
parents:
diff changeset
14
99a67ac88802 Uploaded
rico
parents:
diff changeset
15 ################################################################################
99a67ac88802 Uploaded
rico
parents:
diff changeset
16
99a67ac88802 Uploaded
rico
parents:
diff changeset
def build_command(prog, snp_table, genotypes, min_reads, min_qual, retain,
                  discard_fixed, biased, p1_columns, p2_columns):
    """Return the argument list used to invoke the external program.

    The list starts with ``prog`` followed by the seven option values in
    the order given, then one ``<column>:1`` entry for every column of
    population 1 and one ``<column>:2`` entry for every column of
    population 2.
    """
    command = [prog, snp_table, genotypes, min_reads, min_qual, retain,
               discard_fixed, biased]
    command.extend('{0}:1'.format(column) for column in p1_columns)
    command.extend('{0}:2'.format(column) for column in p2_columns)
    return command


def run_command(command, output_path):
    """Run ``command`` with stdout redirected to ``output_path``.

    Returns the child's return code.  The output file is closed even when
    the program cannot be started.
    """
    with open(output_path, 'w') as fh:
        proc = subprocess.Popen(command, bufsize=-1, stdin=None, stdout=fh,
                                stderr=sys.stderr)
        return proc.wait()


def load_subpopulation(path, p_total, number):
    """Load a population file and check it against the full SNP table.

    Returns the loaded ``Population``, or ``None`` (after writing a message
    to stderr) when ``p_total`` is not a superset of it.
    """
    population = Population()
    population.from_population_file(path)
    if not p_total.is_superset(population):
        sys.stderr.write(
            'There is an individual in population {0} that is not in the '
            'SNP table\n'.format(number))
        return None
    return population


def main(argv):
    """Validate the inputs, run ``Fst_column`` and return an exit status.

    ``argv`` has the layout of ``sys.argv``: ten positional values (input,
    p1_input, p2_input, genotypes, min_reads, min_qual, retain,
    discard_fixed, biased, output) followed by at least one individual
    metadata tag.

    NOTE(review): the <command> template in the file header lists only nine
    positional arguments before the per-individual tags, while this script
    unpacks ten -- confirm against the tool XML.

    Returns 1 on a usage or validation error; otherwise the return code of
    the ``Fst_column`` process, so that a failing run is no longer reported
    as success.
    """
    if len(argv) < 12:
        sys.stderr.write("Usage\n")
        return 1

    (input_path, p1_input, p2_input, genotypes, min_reads, min_qual,
     retain, discard_fixed, biased, output) = argv[1:11]
    individual_metadata = argv[11:]

    p_total = Population()
    p_total.from_tag_list(individual_metadata)

    # Population 1 is validated before population 2 is even read, matching
    # the order in which errors were reported originally.
    p1 = load_subpopulation(p1_input, p_total, 1)
    if p1 is None:
        return 1

    p2 = load_subpopulation(p2_input, p_total, 2)
    if p2 is None:
        return 1

    command = build_command('Fst_column', input_path, genotypes, min_reads,
                            min_qual, retain, discard_fixed, biased,
                            p1.column_list(), p2.column_list())

    # A negative return code (child killed by a signal) still yields a
    # non-zero process exit status when handed to sys.exit().
    return run_command(command, output)


if __name__ == '__main__':
    sys.exit(main(sys.argv))
99a67ac88802 Uploaded
rico
parents:
diff changeset
69