annotate convert_multiple_dta_to_csv.py @ 12:c4c40e20871c draft

Uploaded
author mb2013
date Wed, 20 Nov 2013 07:19:00 -0500
parents 692262de2de2
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
6
692262de2de2 Uploaded
mb2013
parents:
diff changeset
1 #Converter of multiple dta files to one csv
692262de2de2 Uploaded
mb2013
parents:
diff changeset
2 #M.Baak
692262de2de2 Uploaded
mb2013
parents:
diff changeset
3 #13-11-2013
692262de2de2 Uploaded
mb2013
parents:
diff changeset
4 #last update: 13-11-2013
692262de2de2 Uploaded
mb2013
parents:
diff changeset
5
692262de2de2 Uploaded
mb2013
parents:
diff changeset
6 import sys
692262de2de2 Uploaded
mb2013
parents:
diff changeset
7 import os
692262de2de2 Uploaded
mb2013
parents:
diff changeset
8
692262de2de2 Uploaded
mb2013
parents:
diff changeset
9
692262de2de2 Uploaded
mb2013
parents:
diff changeset
# Positional command-line arguments: the first two are the output paths
# handed to convert_dta, every remaining argument is an input file.
file_outputname, file_outputname2 = sys.argv[1], sys.argv[2]
file_name = sys.argv[3:]
692262de2de2 Uploaded
mb2013
parents:
diff changeset
13
692262de2de2 Uploaded
mb2013
parents:
diff changeset
def convert_dta(file_name,file_outputname,file_outputname2):
    """Merge the coordinates of several dta files into one CSV file.

    Every input file is read line by line. The first line of a file is
    taken as the sample name: spaces are replaced by underscores, then the
    first character and the last four characters are dropped before it is
    written (one name per input file) to ``file_outputname2``. Every line
    that consists of exactly three single-space-separated fields is parsed
    as three floats and appended to ``file_outputname`` as ``x,y,z``.

    Args:
        file_name: sequence of paths of the input files, processed in order.
        file_outputname: path of the CSV file that receives the coordinates.
        file_outputname2: path of the file that receives the sample names.

    Raises:
        ValueError: if a line with exactly three fields (the first line of
            a file included) holds a field that is not a valid float.
        IOError/OSError: if one of the files cannot be opened.
    """
    # Context managers guarantee that both output files and every input
    # file are flushed and closed, even when a malformed line raises.
    with open(file_outputname, 'w') as output, \
            open(file_outputname2, 'w') as output2:
        for path in file_name:
            header = ""  # stays empty when the input file has no lines

            with open(path, 'r') as read_file:
                # A single pass over the file; the line index is only
                # needed to recognise the first (sample name) line.
                for line_index, raw_line in enumerate(read_file):
                    line = raw_line.strip()
                    # NOTE(review): fields are split on one single space,
                    # so tab- or multi-space-separated rows are skipped --
                    # confirm this matches the dta files in use.
                    fields = line.split(' ')

                    if line_index == 0:
                        header = line.replace(' ', '_')  # name of sample

                    # Deliberately not an elif: a first line with exactly
                    # three fields is also treated as a coordinate row.
                    if len(fields) == 3:
                        output.write("%f,%f,%f\n" % (float(fields[0]),
                                                     float(fields[1]),
                                                     float(fields[2])))

            # Drop the first character and the last four characters of the
            # sample name before writing it.
            output2.write("%s\n" % (header[1:-4]))
692262de2de2 Uploaded
mb2013
parents:
diff changeset
41
692262de2de2 Uploaded
mb2013
parents:
diff changeset
# Run the conversion with the paths taken from the command line.
convert_dta(
    file_name,
    file_outputname,
    file_outputname2,
)
692262de2de2 Uploaded
mb2013
parents:
diff changeset
43
692262de2de2 Uploaded
mb2013
parents:
diff changeset
44
692262de2de2 Uploaded
mb2013
parents:
diff changeset
45
692262de2de2 Uploaded
mb2013
parents:
diff changeset
46