Mercurial > repos > abims-sbr > blastalign
annotate scripts/S01_phylip2fasta.py @ 3:49017ea906b5 draft
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit cf1b9c905931ca2ca25faa4844d45c908756472f
author | abims-sbr |
---|---|
date | Wed, 17 Jan 2018 08:55:00 -0500 |
parents | 92615a423389 |
children | 0d2da4c020dc |
rev | line source |
---|---|
2
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
1 #!/usr/bin/python |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
2 |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
3 ## AUTHOR: Eric Fontanillas |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
4 ## LAST VERSION: 20/08/14 by Julie BAFFARD |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
5 |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
6 ## DESCRIPTION: formatting a phylip format (as used with PAML) into fasta format |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
7 |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
8 import string, os, sys |
3
49017ea906b5
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit cf1b9c905931ca2ca25faa4844d45c908756472f
abims-sbr
parents:
2
diff
changeset
|
9 """ |
2
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
10 if len(sys.argv) == 1: |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
11 print "put arguments!!" |
3
49017ea906b5
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit cf1b9c905931ca2ca25faa4844d45c908756472f
abims-sbr
parents:
2
diff
changeset
|
12 print "USAGE: S01_phylip2fasta.py INPUT OUTPUT" |
49017ea906b5
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit cf1b9c905931ca2ca25faa4844d45c908756472f
abims-sbr
parents:
2
diff
changeset
|
13 """ |
2
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
14 |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
## INPUT
# Both the input and the output path are required. Without this check a
# missing argument surfaces as an IndexError traceback on sys.argv[...].
if len(sys.argv) < 3:
    print("USAGE: S01_phylip2fasta.py INPUT OUTPUT")
    sys.exit(1)

if os.path.isfile(sys.argv[1]):
    f1 = sys.argv[1]
else:
    print("No existing phylip file ; exiting ...")
    # sys.exit() does not depend on the `site` module the way the bare
    # exit() helper does; a non-zero status reports the failure to the caller.
    sys.exit(1)

F1 = open(f1, 'r')

## OUTPUT
f2 = sys.argv[2]
F2 = open(f2, 'w')
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
27 |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
28 ###### def1 ###### |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
29 # In a phylip multiple alignment, this function reformats each "name<TAB>sequence" line into a fasta record (">name" line followed by the sequence line) |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
30 |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
def format(File_IN):
    """Convert tab-separated "name<TAB>sequence" lines into fasta text.

    File_IN -- object exposing readline(); every line read from it is
               treated as one record (the caller skips any header first).

    Returns a tuple (fichier, c):
      fichier -- the fasta text: for each record a ">name" line followed
                 by the sequence line.
      c       -- the number of readline() calls made, i.e. the number of
                 lines read plus one for the call that hit end-of-file
                 (same value the historical implementation returned).

    Raises ValueError when a non-blank line contains no tab separator.
    """
    records = []
    c = 0
    while True:
        c = c + 1
        line = File_IN.readline()
        if not line:
            break

        # Remove only the line terminator. Slicing off the last character
        # unconditionally would drop a real residue when the final line has
        # no trailing newline, and would leave a '\r' on CRLF input.
        line = line.rstrip("\r\n")
        if not line.strip():
            # Blank lines carry no record; skip them instead of crashing.
            continue

        fields = line.split("\t")  # [name, sequence, ...]
        if len(fields) < 2:
            raise ValueError(
                "line %d has no tab-separated sequence: %r" % (c, line)
            )

        records.append(">" + fields[0] + "\n" + fields[1] + "\n")

    # Join once at the end rather than growing a string inside the loop.
    return ("".join(records), c)
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
46 #-#-#-#-#-#-#-#-#-#-# |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
47 |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
48 ################### |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
49 ### RUN RUN RUN ### |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
50 ################### |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
51 |
92615a423389
planemo upload for repository https://github.com/abims-sbr/adaptsearch commit 44a89d5eeb82789bfc643b33c11f391281b6374b
abims-sbr
parents:
diff
changeset
|
# Convert the opened input (F1) and write the fasta text to the opened
# output (F2). The try/finally guarantees both handles are closed (and the
# output flushed) even if the conversion raises.
try:
    F1.readline()  ## jump the first line

    fichier_txt, c = format(F1)  ### DEF1 ###

    F2.write(fichier_txt)
finally:
    F1.close()
    F2.close()