Mercurial > repos > devteam > pileup_interval
annotate pileup_interval.py @ 3:d78f28cae91b draft default tip
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_interval commit 8b2095c59ecc2e94c58a42e2e04dbcecdc823dbf"
| author | devteam |
|---|---|
| date | Fri, 15 Jan 2021 11:38:35 +0000 |
| parents | 8afc93a5f9ae |
| children |
| rev | line source |
|---|---|
| 0 | 1 #!/usr/bin/env python |
| 2 | |
| 3 """ | |
| 4 Condenses pileup format into ranges of bases. | |
| 5 | |
| 6 usage: %prog [options] | |
| 7 -i, --input=i: Input pileup file | |
| 8 -o, --output=o: Output pileup | |
| 9 -c, --coverage=c: Coverage | |
| 10 -f, --format=f: Pileup format | |
| 11 -b, --base=b: Base to select | |
| 12 -s, --seq_column=s: Sequence column | |
| 13 -l, --loc_column=l: Base location column | |
| 14 -r, --base_column=r: Reference base column | |
| 15 -C, --cvrg_column=C: Coverage column | |
| 16 """ | |
| 17 import sys | |
| 18 | |
|
3
d78f28cae91b
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_interval commit 8b2095c59ecc2e94c58a42e2e04dbcecdc823dbf"
devteam
parents:
0
diff
changeset
|
19 from bx.cookbook import doc_optparse |
|
d78f28cae91b
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_interval commit 8b2095c59ecc2e94c58a42e2e04dbcecdc823dbf"
devteam
parents:
0
diff
changeset
|
20 |
| 0 | 21 |
def _column_indexes(options):
    """Return the zero-based (seq, loc, base, cov) column indexes.

    The 'six' and 'ten' formats use fixed layouts; for 'ten' the base column
    depends on ``options.base``. Any other format value falls back to the
    one-based column numbers supplied on the command line.
    """
    if options.format == 'six':
        return 0, 1, 2, 3
    if options.format == 'ten':
        base_index = 2 if options.base == 'first' else 3
        return 0, 1, base_index, 7
    return (
        int(options.seq_column) - 1,
        int(options.loc_column) - 1,
        int(options.base_column) - 1,
        int(options.cvrg_column) - 1,
    )


def _write_interval(out, seq, start, end, bases):
    """Write one interval line: seq, start - 1, end and the joined bases."""
    # start - 1 presumably converts a 1-based pileup position to a 0-based
    # interval start -- confirm against the tool's documented output format.
    out.write('%s\t%s\t%s\t%s\n' % (seq, start - 1, end, ''.join(bases)))


def __main__():
    """Condense a pileup file into intervals of consecutive covered bases.

    Options are parsed from the module docstring via ``doc_optparse``. Lines
    are read from ``options.input`` until end of file or the first blank
    line. Consecutive positions on the same sequence whose coverage is at
    least ``options.coverage`` are merged and written to ``options.output``
    as one tab-separated line per interval.

    Exits through ``sys.exit`` with an explanatory message when a line is
    missing a selected column (IndexError) or a location/coverage field is
    not an integer (ValueError).
    """
    # Parse Command Line
    options, _ = doc_optparse.parse(__doc__)
    coverage = int(options.coverage)
    # The context manager guarantees both handles are closed even when a
    # malformed line aborts the run through sys.exit().
    with open(options.input, 'r') as fin, open(options.output, 'w') as fout:
        seq_index, loc_index, base_index, cov_index = _column_indexes(options)
        last_seq = ''
        last_loc = -1
        start_loc = -1  # -1 means "no interval currently open"
        bases = []
        for line in fin:
            if line.strip() == '':
                # A blank line ends processing, exactly like end of file.
                break
            parts = line.split('\t')
            try:
                seq = parts[seq_index]
                loc = int(parts[loc_index])
                base = parts[base_index]
                cov = int(parts[cov_index])
            except IndexError as ei:
                if options.format == 'ten':
                    sys.exit('It appears that you have selected 10 columns while your file has 6. Make sure that the number of columns you specify matches the number in your file.\n' + str(ei))
                else:
                    sys.exit('There appears to be something wrong with your column index values.\n' + str(ei))
            except ValueError as ev:
                if options.format == 'six':
                    sys.exit('It appears that you have selected 6 columns while your file has 10. Make sure that the number of columns you specify matches the number in your file.\n' + str(ev))
                else:
                    sys.exit('There appears to be something wrong with your column index values.\n' + str(ev))
            covered = cov >= coverage
            contiguous = loc == last_loc + 1 or last_loc == -1
            same_seq = seq == last_seq or last_seq == ''
            if contiguous and covered and same_seq:
                # Extend the open interval, or open one at this position.
                if start_loc == -1:
                    start_loc = loc
                bases.append(base)
            else:
                # A gap, a sequence change or a low-coverage base closes the
                # open interval; a covered base immediately opens a new one.
                if bases:
                    _write_interval(fout, last_seq, start_loc, last_loc, bases)
                if covered:
                    start_loc = loc
                    bases = [base]
                else:
                    start_loc = -1
                    bases = []
            last_seq = seq
            last_loc = loc
        # Flush the interval still open when the input ended.
        if bases:
            _write_interval(fout, last_seq, start_loc, last_loc, bases)
| 109 | |
|
3
d78f28cae91b
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_interval commit 8b2095c59ecc2e94c58a42e2e04dbcecdc823dbf"
devteam
parents:
0
diff
changeset
|
110 |
|
d78f28cae91b
"planemo upload for repository https://github.com/galaxyproject/tools-devteam/tree/master/tools/pileup_interval commit 8b2095c59ecc2e94c58a42e2e04dbcecdc823dbf"
devteam
parents:
0
diff
changeset
|
# Run the tool only when this file is executed as a script, so importing the
# module does not trigger command-line parsing or file I/O.
if __name__ == "__main__":
    __main__()
