Mercurial > repos > sauria > create_correlation_matrix
comparison correlation_matrix.py @ 3:89009e9b7eb0 draft
Uploaded
author | sauria |
---|---|
date | Thu, 27 Apr 2017 17:28:27 -0400 |
parents | f0c8cdd78e28 |
children | 4a76c97c3dd0 |
comparison
equal
deleted
inserted
replaced
2:f0c8cdd78e28 | 3:89009e9b7eb0 |
---|---|
6 import scipy.stats | 6 import scipy.stats |
7 | 7 |
8 def main(): | 8 def main(): |
9 parser = generate_parser() | 9 parser = generate_parser() |
10 args = parser.parse_args() | 10 args = parser.parse_args() |
11 data, names = load_data(args) | 11 data, rnames = load_data(args) |
12 corr = find_correlations(data, args) | 12 corr = find_correlations(data, args) |
13 save_data(corr, names, args) | 13 save_data(corr, names, args) |
14 | 14 |
15 def load_data(args): | 15 def load_data(args): |
16 infile = open(args.input) | 16 infile = open(args.input) |
17 names = [] | 17 names = [] |
18 cnames = None | |
18 data = [] | 19 data = [] |
19 if args.column: | 20 if args.column: |
20 temp = infile.readline() | 21 cnames = infile.readline().split() |
22 if args.rows: | |
23 cnames = cnames[1:] | |
21 temp = infile.readline() | 24 temp = infile.readline() |
22 if args.int: | 25 if args.int: |
23 dtype = int | 26 dtype = int |
24 else: | 27 else: |
25 dtype = float | 28 dtype = float |
35 if len(names) == 0: | 38 if len(names) == 0: |
36 names = None | 39 names = None |
37 data = numpy.array(data) | 40 data = numpy.array(data) |
38 if args.features: | 41 if args.features: |
39 data = data.T | 42 data = data.T |
40 return data, names | 43 names = cnames |
44 return data, names, cnames | |
41 | 45 |
42 def find_correlations(data, args): | 46 def find_correlations(data, args): |
43 corr = numpy.ones((data.shape[0], data.shape[0]), dtype=numpy.float32) | 47 corr = numpy.ones((data.shape[0], data.shape[0]), dtype=numpy.float32) |
44 if args.test == 'pearson': | 48 if args.test == 'pearson': |
45 findcorr = scipy.stats.pearsonr | 49 findcorr = scipy.stats.pearsonr |