Mercurial > repos > sauria > create_correlation_matrix
comparison correlation_matrix.py @ 4:4a76c97c3dd0 draft default tip
Uploaded
author | sauria |
---|---|
date | Thu, 27 Apr 2017 17:32:19 -0400 |
parents | 89009e9b7eb0 |
children |
comparison (legend: equal, deleted, inserted, replaced)
3:89009e9b7eb0 | 4:4a76c97c3dd0 |
---|---|
6 import scipy.stats | 6 import scipy.stats |
7 | 7 |
8 def main(): | 8 def main(): |
9 parser = generate_parser() | 9 parser = generate_parser() |
10 args = parser.parse_args() | 10 args = parser.parse_args() |
11 data, rnames = load_data(args) | 11 data, names = load_data(args) |
12 corr = find_correlations(data, args) | 12 corr = find_correlations(data, args) |
13 save_data(corr, names, args) | 13 save_data(corr, names, args) |
14 | 14 |
15 def load_data(args): | 15 def load_data(args): |
16 infile = open(args.input) | 16 infile = open(args.input) |
17 names = [] | 17 names = [] |
18 cnames = None | 18 cnames = None |
19 data = [] | 19 data = [] |
20 if args.column: | 20 if args.column: |
21 cnames = infile.readline().split() | 21 cnames = infile.readline().split() |
22 if args.rows: | 22 if args.row: |
23 cnames = cnames[1:] | 23 cnames = cnames[1:] |
24 temp = infile.readline() | 24 temp = infile.readline() |
25 if args.int: | 25 if args.int: |
26 dtype = int | 26 dtype = int |
27 else: | 27 else: |
39 names = None | 39 names = None |
40 data = numpy.array(data) | 40 data = numpy.array(data) |
41 if args.features: | 41 if args.features: |
42 data = data.T | 42 data = data.T |
43 names = cnames | 43 names = cnames |
44 return data, names, cnames | 44 return data, names |
45 | 45 |
46 def find_correlations(data, args): | 46 def find_correlations(data, args): |
47 corr = numpy.ones((data.shape[0], data.shape[0]), dtype=numpy.float32) | 47 corr = numpy.ones((data.shape[0], data.shape[0]), dtype=numpy.float32) |
48 if args.test == 'pearson': | 48 if args.test == 'pearson': |
49 findcorr = scipy.stats.pearsonr | 49 findcorr = scipy.stats.pearsonr |