comparison correlation_matrix.py @ 4:4a76c97c3dd0 draft default tip

Uploaded
author sauria
date Thu, 27 Apr 2017 17:32:19 -0400
parents 89009e9b7eb0
children
comparison
equal deleted inserted replaced
3:89009e9b7eb0 4:4a76c97c3dd0
6 import scipy.stats 6 import scipy.stats
7 7
8 def main(): 8 def main():
9 parser = generate_parser() 9 parser = generate_parser()
10 args = parser.parse_args() 10 args = parser.parse_args()
11 data, rnames = load_data(args) 11 data, names = load_data(args)
12 corr = find_correlations(data, args) 12 corr = find_correlations(data, args)
13 save_data(corr, names, args) 13 save_data(corr, names, args)
14 14
15 def load_data(args): 15 def load_data(args):
16 infile = open(args.input) 16 infile = open(args.input)
17 names = [] 17 names = []
18 cnames = None 18 cnames = None
19 data = [] 19 data = []
20 if args.column: 20 if args.column:
21 cnames = infile.readline().split() 21 cnames = infile.readline().split()
22 if args.rows: 22 if args.row:
23 cnames = cnames[1:] 23 cnames = cnames[1:]
24 temp = infile.readline() 24 temp = infile.readline()
25 if args.int: 25 if args.int:
26 dtype = int 26 dtype = int
27 else: 27 else:
39 names = None 39 names = None
40 data = numpy.array(data) 40 data = numpy.array(data)
41 if args.features: 41 if args.features:
42 data = data.T 42 data = data.T
43 names = cnames 43 names = cnames
44 return data, names, cnames 44 return data, names
45 45
46 def find_correlations(data, args): 46 def find_correlations(data, args):
47 corr = numpy.ones((data.shape[0], data.shape[0]), dtype=numpy.float32) 47 corr = numpy.ones((data.shape[0], data.shape[0]), dtype=numpy.float32)
48 if args.test == 'pearson': 48 if args.test == 'pearson':
49 findcorr = scipy.stats.pearsonr 49 findcorr = scipy.stats.pearsonr