annotate pscan_chip/pscan_chip_g.cpp @ 10:5e2af7c006b0 draft default tip

Uploaded
author fz77
date Mon, 17 Nov 2014 10:15:57 -0500
parents 6a5cfb8a872f
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
9
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1 // Pscan-ChIP 1.1
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2 // // Copyright (C) 2013 Federico Zambelli and Giulio Pavesi
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
3 // //
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
4 // // This program is free software: you can redistribute it and/or modify
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
5 // // it under the terms of the GNU General Public License as published by
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
6 // // the Free Software Foundation, either version 3 of the License, or
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
7 // // (at your option) any later version.
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
8 // //
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
9 // // This program is distributed in the hope that it will be useful,
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
10 // // but WITHOUT ANY WARRANTY; without even the implied warranty of
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
11 // // MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
12 // // GNU General Public License for more details.
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
13 // //
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
14 // // You should have received a copy of the GNU General Public License
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
15 // // along with this program. If not, see <http://www.gnu.org/licenses/>.
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
16 // //
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
17 // // If you find Pscan-ChIP useful in your research please cite our paper:
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
18 // //
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
19 // // Zambelli F, Pesole G, Pavesi G. PscanChIP: Finding over-represented
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
20 // // transcription factor-binding site motifs and their correlations in sequences from
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
21 // // ChIP-Seq experiments.
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
22 // // Nucleic Acids Res. 2013 Jul;41(Web Server issue):W535-43.
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
23
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
24 #include <string>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
25 #include <iostream>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
26 #include <fstream>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
27 #include <vector>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
28 #include <sstream>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
29 #include <math.h>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
30 #include <map>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
31 #include <cstdlib>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
32 #include <gsl/gsl_randist.h>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
33 #include <gsl/gsl_cdf.h>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
34 #include <string.h>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
35 #include <ctime>
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
36
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
37 using namespace std;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
38
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
39 const double MIN_ADD_FREQ = 0.01, EPSILON = pow(10,-21), INF = pow(10,21), /*POS_VIS_THRESHOLD = pow(10,-5),*/ DIST_RATIO_THRESHOLD = 3, DIST_PV_THRESHOLD = pow(10,-5);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
40 const unsigned int MAX_REG_SIZE = 3000, ALPHABET_SIZE = 4, TOP_P = 1, DIST_HIT_THRESHOLD = 10;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
41 //const char ALPHABET[4] = {'A','C','G','T'}, RC_ALPHABET[4] = {'T','G','C','A'};
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
42 char VI['T' + 1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
43 string regfile, genome, matrixfile, additional_matrixfile, outfile, bgfile, selected, obstf, GALAXY_OUTPUT;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
44 unsigned int RSIZE = 150, MAX_L = 0, W_SIZE = 10, W_STEP = 5;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
45 bool SECOND_BEST_POS = false, SINGLE_STRAND = false, VERBOSE = false, GET_SEQUENCES = false, POSITIONAL = false, SINGLE_MATRIX = false, SPEARMAN = false, TWOBIT = false, QUIET = false; //NAIVE = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
46 ofstream fasta_out;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
47 double SINGLE_MATRIX_BG_AVG = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
48
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
49 struct mpoint
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
50 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
51 unsigned int x;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
52 unsigned int y;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
53 };
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
54
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
55 struct bg
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
56 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
57 unsigned int Size;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
58 double Avg, Var;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
59 };
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
60
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
61 class sequence
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
62 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
63 private:
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
64 string Chr, Name;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
65 char *Seq;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
66 unsigned int Start, End, E_Rank;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
67 char Strand, AntiStrand;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
68 bool good;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
69 public:
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
70 sequence(string*, ifstream*, unsigned int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
71 sequence(string*, unsigned int, string, unsigned int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
72 char strand();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
73 char antistrand();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
74 string chr();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
75 unsigned int start();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
76 unsigned int end();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
77 unsigned int e_rank();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
78 string name();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
79 char* seq();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
80 bool is_good();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
81 double score();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
82 int mpos();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
83 };
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
84
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
85 class matrix
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
86 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
87 friend void scanner(vector<matrix>*, vector<sequence>*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
88 private:
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
89 void normalizer();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
90 void to_log();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
91 void avg();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
92 void max_min();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
93 void rev_c();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
94 double get_M_value(int, char);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
95 double get_rc_M_value(int, char);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
96 void calc_var(double);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
97 void calc_W_param(double);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
98 void welch_test(double);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
99 void welch_test_bg(double);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
100 // void welch_test_bg_G(double);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
101 void welch_test_pos(double);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
102 void z_test_pos(double);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
103 unsigned int L, bg_Size, BIN_NUM;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
104 double **M;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
105 double **rc_M;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
106 double max_score, min_score, t, dof, t_bg, dof_bg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
107 double spearman;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
108 string Name, Id;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
109 bool O_U, O_U_bg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
110 vector<bool> W_O_U;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
111 bool good, BG;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
112 bool norm_sec_step;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
113 vector<double> v_score, vF_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
114 vector<unsigned int> v_pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
115 vector<bool> v_strand;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
116 vector<vector<double> > W_R_v_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
117 vector<double> W_R_Avg, W_R_Var, W_R_pvalue, W_R_T_pvalue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
118 double R_Avg, F_Avg, R_Var, F_Var, /*G_Avg, G_Var,*/ pvalue, W_Avg, W_Var;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
119 double bg_Avg, bg_Var, pvalue_bg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
120 public:
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
121 matrix(vector<string>*, map<string,bg>*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
122 void display();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
123 bool is_good();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
124 string name();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
125 string id();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
126 string o_or_u();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
127 string o_or_u_bg();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
128 int W_o_or_u(unsigned int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
129 void scan(vector<sequence>*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
130 double scan_seq_ds(char*, bool, unsigned int, vector<double>*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
131 double scan_seq_ss(char*, bool, unsigned int, char, vector<double>*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
132 double scan_seq_ds_second_best(char*, unsigned int, unsigned int *, bool *, int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
133 double scan_seq_ss_second_best(char*, unsigned int, unsigned int *, bool *, unsigned int, bool);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
134 double get_score_at(unsigned int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
135 unsigned int get_pos_at(unsigned int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
136 unsigned int length();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
137 bool get_strand_at(unsigned int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
138 bool have_bg();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
139 unsigned int bin_num();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
140 double get_R_Avg();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
141 double get_F_Avg();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
142 double get_bg_Avg();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
143 double get_R_Var();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
144 double get_F_Var();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
145 double max();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
146 double min();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
147 double get_pvalue();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
148 double get_pvalue_bg();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
149 double get_W_pvalue(unsigned int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
150 double get_W_R_Avg_at_pos(unsigned int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
151 double get_t();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
152 double get_dof();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
153 double get_spearman();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
154 double get_W_Avg();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
155 double get_W_R_T_pvalue(unsigned int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
156 };
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
157
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
158 void command_line_parser(int, char**);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
159 void acquire_regions(vector<sequence>*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
160 void acquire_matrices(vector<matrix>*, map<string,bg>*, string*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
161 void acquire_background(map<string,bg>*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
162 void scanner(vector<matrix>*, vector<sequence>*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
163 void main_output(vector<matrix>*, vector<sequence>*, unsigned int);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
164 void main_output_single_matrix(vector<matrix>*, vector<sequence>*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
165 void distance_analysis(vector<matrix>*, vector<sequence>*, unsigned int, multimap <double, vector<matrix>::iterator>*);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
166 void display_help();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
167
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
168 int main(int argc, char **argv)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
169 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
170 srand(time(NULL));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
171
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
172 vector<sequence> Seq;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
173 vector<matrix> Mat;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
174 map<string,bg> Bg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
175 VI['A'] = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
176 VI['C'] = 1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
177 VI['G'] = 2;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
178 VI['T'] = 3;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
179 VI['N'] = 4;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
180
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
181 obstf.clear();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
182
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
183 command_line_parser(argc, argv);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
184
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
185 if(GET_SEQUENCES)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
186 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
187 string outfile = regfile;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
188 outfile += ".fasta";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
189 fasta_out.open(outfile.c_str(), ios::out);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
190 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
191
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
192 if(!regfile.empty() && !matrixfile.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
193 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
194 if(!bgfile.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
195 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
196 if(!QUIET) cerr << "\nAcquiring background file... ";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
197 acquire_background(&Bg);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
198 if(!QUIET) cerr << "done" << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
199 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
200
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
201 if(!QUIET) cerr << "\nReading binding profiles...";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
202 acquire_matrices(&Mat, &Bg, &matrixfile);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
203
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
204 if(!additional_matrixfile.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
205 acquire_matrices(&Mat, &Bg, &additional_matrixfile);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
206
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
207 if(Mat.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
208 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
209 if(!QUIET) cerr << "\nZero valid matrices acquired. Quitting..." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
210 exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
211 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
212
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
213 if(!QUIET) cerr << "done: " << Mat.size() << " binding profiles acquired. Max matrix length = " << MAX_L << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
214
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
215 if(Mat.size() == 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
216 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
217 if(!QUIET) cerr << "\nSwitching to single matrix mode..." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
218 SINGLE_MATRIX = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
219 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
220
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
221 if(!QUIET) cerr << "\nAcquiring regions...";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
222 acquire_regions(&Seq);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
223 if(!QUIET) cerr << "done: " << Seq.size() << " unique regions acquired." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
224
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
225 if(Seq.size() <= 2)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
226 POSITIONAL = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
227
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
228 if(Seq.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
229 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
230 if(!QUIET) cerr << "\nZero regions to work on! Exiting..." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
231 exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
232 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
233
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
234 if(GET_SEQUENCES)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
235 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
236 fasta_out.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
237 exit(0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
238 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
239
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
240 // for(unsigned int i = 0; i < Mat.size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
241 // Mat[i].display();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
242
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
243 if(!QUIET) cerr << "\nScanning...";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
244 scanner(&Mat, &Seq);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
245
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
246 if(!QUIET) cerr << "\nWriting output..." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
247
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
248 if(!SINGLE_MATRIX)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
249 main_output(&Mat, &Seq, Seq.size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
250 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
251 main_output_single_matrix(&Mat, &Seq);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
252
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
253 if(!QUIET) cerr << "\nOutput written in file: " << outfile << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
254
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
255 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
256 else if(GET_SEQUENCES && !regfile.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
257 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
258 if(!QUIET) cerr << "\nAcquiring regions...";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
259 acquire_regions(&Seq);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
260 if(!QUIET) cerr << "done: " << Seq.size() << " unique regions acquired." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
261
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
262 fasta_out.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
263 exit(0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
264 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
265 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
266 display_help();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
267
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
268
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
269 /* for(unsigned int i = 0; i < Seq.size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
270 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
271 cout << ">" << i+1 << '\t' << Seq[i].name() << '\t' << Seq[i].start() << '\t' << Seq[i].end() << '\t'
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
272 << Mat[0].get_score_at(i) << '\t' << Mat[0].get_pos_at(i) << '\t' << Mat[0].get_strand_at(i) << '\t'
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
273 << "Max = " << Mat[0].max() << '\t' << "Min = " << Mat[0].min()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
274 << endl << Seq[i].seq() << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
275 cout << ">" << i+1 << '\t' << Seq[i].name() << '\t' << "UPSTREAM" << endl << Seq[i].uf_seq() << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
276 cout << ">" << i+1 << '\t' << Seq[i].name() << '\t' << "DOWNSTREAM" << endl << Seq[i].df_seq() << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
277 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
278 */
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
279
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
280 return 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
281 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
282
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
283 void display_help()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
284 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
285 if(!QUIET) cerr << endl << "Syntax: pscan_chip -r region_file.bed -M matrixfile.wil -g genome [-pos] [-wsize window_size] [-wstep window_step] [-bg background_file] [-s region_size]" << endl << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
286 exit(0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
287 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
288
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
289 void main_output_single_matrix(vector<matrix> *Mat, vector<sequence> *Seq)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
290 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
291 outfile = regfile;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
292 outfile += ".";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
293 outfile += Mat->at(0).id();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
294
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
295 string outfile2 = outfile;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
296
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
297 outfile += ".ris";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
298 outfile2 += ".all.ris";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
299
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
300 if(!GALAXY_OUTPUT.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
301 outfile = GALAXY_OUTPUT;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
302
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
303 multimap <double, string> outmap;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
304
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
305 ofstream out(outfile.c_str(), ios::out);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
306 ofstream out2(outfile2.c_str(), ios::out);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
307
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
308 if(!out)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
309 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
310 if(!QUIET) cerr << "\nError! Can't open output file: " << outfile << " for writing..." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
311 exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
312 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
313
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
314 out << "CHR\tREG_START\tREG_END\tREG_STRAND\tABS_SITE_START\tABS_SITE_END\tREL_SITE_START\tREL_SITE_END\tSITE_STRAND\tSCORE\tSITE";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
315 out2 << "CHR\tREG_START\tREG_END\tREG_STRAND\tABS_SITE_START\tABS_SITE_END\tREL_SITE_START\tREL_SITE_END\tSITE_STRAND\tSCORE\tSITE";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
316
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
317 // if(SPEARMAN)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
318 // out << "\tE_RANK";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
319
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
320 if(SECOND_BEST_POS)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
321 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
322 out << "\tSB_POS\tSB_SCORE\tSB_OLIGO\tSB_STRAND" << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
323 out2 << "\tSB_POS\tSB_SCORE\tSB_OLIGO\tSB_STRAND" << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
324 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
325 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
326 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
327 out << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
328 out2 << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
329 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
330
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
331 matrix *M = &Mat->at(0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
332
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
333 /* if(SINGLE_MATRIX_BG_AVG == 0) //QUESTO SERVE PER QUANDO NON C'E' IL VALORE DI BACKGROUND!
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
334 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
335 double loc_avg = 0, loc_stdev = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
336
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
337 for(unsigned int i = 0; i < Seq->size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
338 loc_avg += M->get_score_at(i);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
339
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
340 loc_avg /= Seq->size();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
341
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
342 for(unsigned int i = 0; i < Seq->size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
343 loc_stdev += pow(M->get_score_at(i) - loc_avg, 2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
344
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
345 loc_stdev /= (Seq->size() - 1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
346
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
347 loc_stdev = sqrt(loc_stdev);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
348
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
349 SINGLE_MATRIX_BG_AVG = loc_avg - (2*loc_stdev);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
350
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
351 if(!QUIET) cerr << "\nSMBG = " << SINGLE_MATRIX_BG_AVG;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
352 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
353 */
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
354 char Oligo[M->length() + 1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
355
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
356 Oligo[M->length()] = '\0';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
357
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
358 for(unsigned int i = 0; i < Seq->size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
359 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
360 // if(!QUIET) cerr << endl << M->get_score_at(i) << '\t' << M->get_bg_Avg() << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
361
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
362 // if(M->get_score_at(i) < SINGLE_MATRIX_BG_AVG) //ONLY REPORT OCCURRENCES WITH SCORE >= BG_AVG
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
363 // continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
364
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
365 // if(!QUIET) cerr << "passed";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
366
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
367 ostringstream outbuf;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
368
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
369 sequence *S = &Seq->at(i);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
370
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
371 strncpy(Oligo, S->seq() + RSIZE/2 + (M->get_pos_at(i) - M->length()/2), M->length());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
372
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
373 outbuf << S->chr() << '\t' << S->start() << '\t' << S->end() << '\t' << S->strand() << '\t'
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
374 << S->start() + M->get_pos_at(i) - M->length()/2 << '\t' << S->start() + M->get_pos_at(i) + M->length()/2 << '\t'
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
375 << (int)((M->get_pos_at(i) - M->length()/2) - RSIZE/2) << '\t' << (int)((M->get_pos_at(i) + M->length()/2 - 1) - RSIZE/2)<< '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
376
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
377 if(S->strand() == '+')
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
378 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
379 if(!M->get_strand_at(i))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
380 outbuf << S->strand();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
381 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
382 outbuf << S->antistrand();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
383 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
384 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
385 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
386 if(!M->get_strand_at(i))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
387 outbuf << S->antistrand();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
388 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
389 outbuf << S->strand();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
390 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
391
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
392 outbuf << '\t' << M->get_score_at(i) << '\t' << Oligo;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
393
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
394 // if(SPEARMAN)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
395 // outbuf << '\t' << S->e_rank();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
396
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
397 if(SECOND_BEST_POS)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
398 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
399 if(SINGLE_STRAND)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
400 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
401 bool s;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
402 unsigned int P;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
403 double score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
404
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
405 score = M->scan_seq_ss_second_best(S->seq() + (RSIZE/2), RSIZE, &P, &s,M->get_pos_at(i), S->strand());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
406
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
407 strncpy(Oligo, S->seq() + RSIZE/2 + P, M->length());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
408
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
409 outbuf << '\t' << P << '\t' << score << '\t' << Oligo;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
410 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
411 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
412 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
413 bool s;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
414 unsigned int P;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
415 double score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
416
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
417 score = M->scan_seq_ds_second_best(S->seq() + (RSIZE/2), RSIZE, &P, &s, (int)M->get_pos_at(i));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
418
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
419 strncpy(Oligo, S->seq() + RSIZE/2 + P, M->length());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
420
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
421 outbuf << '\t' << (int)P - (int)RSIZE/2 << '\t' << score << '\t' << Oligo << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
422
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
423 if(s)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
424 outbuf << '-';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
425 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
426 outbuf << '+';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
427 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
428
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
429 outbuf << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
430 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
431 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
432 outbuf << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
433
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
434 outmap.insert(make_pair(M->get_score_at(i),outbuf.str()));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
435 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
436
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
437 multimap<double,string>::reverse_iterator mi = outmap.rbegin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
438
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
439 // unsigned int count = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
440
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
441 while(mi != outmap.rend())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
442 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
443 // if(count >= outmap.size()/2 && outmap.size() > 1) //SOLO LA MIGLIORE META' DELLE OCCORRENZE!!!
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
444 // break;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
445 if(mi->first >= SINGLE_MATRIX_BG_AVG || mi == outmap.rbegin())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
446 out << mi->second;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
447
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
448 out2 << mi->second;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
449
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
450 mi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
451 // count++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
452 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
453
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
454 out.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
455 out2.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
456 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
457 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
458
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
459 void main_output(vector<matrix> *Mat, vector<sequence> *Seq, unsigned int SIZE)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
460 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
461 multimap <double, vector<matrix>::iterator> S_map;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
462 outfile = regfile;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
463
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
464 outfile += ".res";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
465
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
466 if(!GALAXY_OUTPUT.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
467 outfile = GALAXY_OUTPUT;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
468
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
469 ofstream out(outfile.c_str(),ios::out);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
470
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
471 if(!out)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
472 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
473 if(!QUIET) cerr << "\nError! Can't open output file: " << outfile << " for writing..." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
474 exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
475 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
476
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
477 out << "NAME\tID\tREG_N\tL_PVALUE O/U\tG_PVALUE O/U\tR_AVG\tR_STDEV\tF_AVG\tBG_AVG";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
478
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
479 if(SPEARMAN)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
480 out << "\tSP_COR";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
481
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
482 if(POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
483 out << "\tPREF_POS\tPREF_POS_PV\n";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
484 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
485 out << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
486
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
487 vector<matrix>::iterator vi = Mat->begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
488
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
489 while(vi != Mat->end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
490 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
491 if(S_map.find(vi->get_pvalue()) != S_map.end()) //GFI WORKAROUND
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
492 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
493 if(S_map.find(vi->get_pvalue())->second->get_pvalue_bg() < vi->get_pvalue_bg())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
494 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
495 S_map.insert(make_pair(vi->get_pvalue() + pow(10,-240), vi));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
496 vi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
497 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
498 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
499 else if((S_map.find(vi->get_pvalue())->second->get_pvalue_bg() > vi->get_pvalue_bg()))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
500 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
501 S_map.insert(make_pair(vi->get_pvalue() - pow(10,-240), vi));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
502 vi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
503 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
504 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
505 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
506 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
507 if(S_map.find(vi->get_pvalue())->second->get_spearman() > vi->get_spearman())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
508 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
509 S_map.insert(make_pair(vi->get_pvalue() + pow(10,-240), vi));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
510 vi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
511 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
512 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
513 else if(S_map.find(vi->get_pvalue())->second->get_spearman() <= vi->get_spearman())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
514 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
515 S_map.insert(make_pair(vi->get_pvalue() - pow(10,-240), vi));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
516 vi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
517 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
518 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
519 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
520
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
521 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
522 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
523 S_map.insert(make_pair(vi->get_pvalue(), vi));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
524
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
525 vi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
526 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
527
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
528 multimap <double, vector<matrix>::iterator>::iterator mi = S_map.begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
529
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
530 while(mi != S_map.end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
531 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
532 double pv1, pv2;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
533
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
534 pv1 = mi->second->get_pvalue() * Mat->size();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
535
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
536 if(pv1 > 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
537 pv1 = 1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
538
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
539 pv2 = mi->second->get_pvalue_bg() * Mat->size();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
540
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
541 if(pv2 > 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
542 pv2 = 1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
543
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
544 out << mi->second->name() << '\t' << mi->second->id() << '\t' << SIZE << '\t' << pv1 << ' ' << mi->second->o_or_u() << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
545
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
546 if(mi->second->have_bg())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
547 out << pv2 << ' ' << mi->second->o_or_u_bg() << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
548 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
549 out << "N/A N/A\t";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
550
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
551 out << mi->second->get_R_Avg() << '\t' << pow(mi->second->get_R_Var(), 0.5) << '\t' << mi->second->get_F_Avg() << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
552
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
553 if(mi->second->have_bg())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
554 out << mi->second->get_bg_Avg() << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
555 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
556 out << "N/A" << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
557
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
558 if(SPEARMAN)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
559 out << mi->second->get_spearman() << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
560
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
561 if(POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
562 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
563 double min_pv = 1, min_pv_c;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
564 unsigned int min_pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
565
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
566 for(unsigned int i = 0; i < mi->second->bin_num() - 1; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
567 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
568 if(mi->second->get_W_pvalue(i) <= min_pv) //&& mi->second->W_o_or_u(i) == 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
569 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
570 min_pv = mi->second->get_W_pvalue(i);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
571 min_pos = i;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
572 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
573 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
574
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
575 min_pv_c = min_pv * (mi->second->bin_num() * Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
576
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
577 if(min_pv_c > 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
578 min_pv_c = 1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
579
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
580 out << '[' << (int)(((W_STEP * min_pos) + mi->second->length()/2) - RSIZE/2) << ',' << (int)(((W_STEP * min_pos) + W_SIZE) + mi->second->length()/2 - RSIZE/2) << ']' << '\t' << min_pv_c;// << '\t' << mi->second->get_W_R_T_pvalue(min_pos) << '\t' << min_pv_c;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
581 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
582
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
583 out << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
584
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
585 mi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
586 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
587
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
588 if(POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
589 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
590 out << endl << endl << "POSITIONAL ANALYSIS: W_SIZE = " << W_SIZE << " W_STEP = " << W_STEP << endl << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
591
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
592 out << "NAME\tID\t";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
593
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
594 mi = S_map.begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
595
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
596 for(int i = -(int)(RSIZE/2); i <= (int)((RSIZE/2) - W_SIZE); i += W_STEP)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
597 out << i /*<< '|' << i + (int)(W_SIZE - 1)*/ << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
598
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
599 out << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
600
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
601 while(mi != S_map.end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
602 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
603 /* bool gflag = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
604
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
605 for(unsigned int i = 0; i < mi->second->bin_num() - 1; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
606 if(mi->second->get_W_pvalue(i) <= POS_VIS_THRESHOLD)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
607 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
608 gflag = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
609 break;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
610 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
611
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
612 if(!gflag)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
613 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
614 mi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
615 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
616 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
617 */
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
618 out << mi->second->name() << '\t' << mi->second->id() << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
619
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
620 for(unsigned int i = 0; i < mi->second->bin_num() - 1; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
621 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
622 // out << (-log(mi->second->get_W_pvalue(i))/log(10)) * mi->second->W_o_or_u(i) << '\t';//<< " [" << mi->second->W_o_or_u(i) << "]\t";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
623 //
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
624 double bpv = mi->second->get_W_pvalue(i) * (mi->second->bin_num() * Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
625
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
626 if(bpv > 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
627 bpv = 1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
628
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
629 out << bpv << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
630 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
631
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
632 out << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
633
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
634 mi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
635 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
636
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
637 if(!obstf.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
638 distance_analysis(Mat, Seq, SIZE, &S_map);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
639 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
640
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
641 out.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
642
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
643 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
644 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
645
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
646 void distance_analysis(vector<matrix> *Mat, vector<sequence> *Seq, unsigned int SIZE, multimap <double, vector<matrix>::iterator> *S_map)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
647 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
648 string dist_outfile = regfile, dist2_outfile = regfile, dist3_outfile = regfile;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
649
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
650 dist_outfile += ".dist";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
651 dist2_outfile += ".exp_dist";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
652 dist3_outfile += ".pv_dist";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
653
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
654 ofstream out(dist_outfile.c_str()), out2, out3;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
655
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
656 if(!obstf.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
657 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
658 out2.open(dist2_outfile.c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
659 out3.open(dist3_outfile.c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
660
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
661 out2 << "TF/EXP_HITS\t";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
662 out3 << "TF/PVALUE\t";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
663 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
664
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
665 out << "TF1|TF2/HITS\t";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
666
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
667 for(int p = -(int)(RSIZE - 1); p < (int)RSIZE; p++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
668 out << p << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
669
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
670 out << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
671
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
672 if(!obstf.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
673 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
674 for(int p = -(int)(RSIZE - 1); p < (int)RSIZE; p++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
675 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
676 out2 << p << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
677 out3 << p << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
678 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
679
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
680 out2 << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
681 out3 << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
682 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
683
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
684 multimap <double, vector<matrix>::iterator>::iterator MRI = S_map->begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
685 unsigned int LCOUNT = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
686
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
687 while(MRI != S_map->end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
688 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
689 if((MRI->second->get_pvalue_bg() > DIST_PV_THRESHOLD || MRI->second->o_or_u_bg() == "UNDER") &&
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
690 (MRI->second->get_pvalue() > DIST_PV_THRESHOLD || MRI->second->o_or_u() == "UNDER") )
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
691 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
692 MRI++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
693 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
694 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
695
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
696 // if(!QUIET) cerr << endl << MRI->second->name() << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
697
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
698 LCOUNT++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
699
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
700 map<int, double> R_dist_map;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
701
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
702 if(!obstf.empty() && obstf == MRI->second->id())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
703 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
704 map<int, unsigned int> M_hit_distr;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
705
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
706 for(unsigned int a = 0; a < SIZE; a++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
707 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
708 map<int, unsigned int>::iterator mi;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
709
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
710 if(!MRI->second->get_strand_at(a))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
711 mi = M_hit_distr.find(MRI->second->get_pos_at(a));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
712 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
713 mi = M_hit_distr.find(RSIZE - MRI->second->get_pos_at(a));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
714
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
715 if(mi == M_hit_distr.end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
716 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
717 if(!MRI->second->get_strand_at(a))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
718 M_hit_distr[MRI->second->get_pos_at(a)] = 1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
719 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
720 M_hit_distr[RSIZE - MRI->second->get_pos_at(a)] = 1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
721 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
722 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
723 mi->second++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
724 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
725
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
726 map<int, unsigned int>::iterator mi = M_hit_distr.begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
727
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
728 while(mi != M_hit_distr.end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
729 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
730 for(int b = 0; b < RSIZE; b++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
731 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
732 int dpos = mi->first - b;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
733
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
734 map<int, double>::iterator ri = R_dist_map.find(dpos);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
735
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
736 if(ri == R_dist_map.end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
737 R_dist_map[dpos] = mi->second;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
738 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
739 ri->second += mi->second;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
740
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
741 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
742
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
743 mi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
744 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
745
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
746 map<int, double>::iterator ri = R_dist_map.begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
747 double risum = SIZE * RSIZE;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
748
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
749 out2 << MRI->second->name() << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
750
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
751 while(ri != R_dist_map.end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
752 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
753 ri->second /= risum;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
754 out2 << ri->second*SIZE << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
755 ri++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
756 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
757
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
758 out2 << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
759 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
760
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
761 // multimap <double, vector<matrix>::iterator>::iterator MRI2 = MRI;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
762 multimap <double, vector<matrix>::iterator>::iterator MRI2 = S_map->begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
763
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
764 while(MRI2 != S_map->end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
765 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
766 vector<unsigned int> hit_v((RSIZE*2) - 1, 0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
767
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
768 if(MRI2 == MRI)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
769 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
770 vector<unsigned int> SBPOS;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
771 // vector<bool> SBSTRAND;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
772
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
773 if(SINGLE_STRAND)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
774 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
775 for(unsigned int i = 0; i < Seq->size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
776 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
777 bool s;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
778 unsigned int P;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
779 double score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
780
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
781 score = MRI->second->scan_seq_ss_second_best(Seq->at(i).seq() + (RSIZE/2), RSIZE, &P, &s, MRI->second->get_pos_at(i), Seq->at(i).strand());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
782 SBPOS.push_back(P);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
783 // SBSTRAND.push_back(s);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
784 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
785
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
786 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
787 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
788 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
789 for(unsigned int i = 0; i < Seq->size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
790 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
791 bool s;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
792 unsigned int P;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
793 double score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
794
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
795 score = MRI->second->scan_seq_ds_second_best(Seq->at(i).seq() + (RSIZE/2), RSIZE, &P, &s, (int)MRI->second->get_pos_at(i));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
796
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
797 SBPOS.push_back(P + MRI->second->length()/2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
798 // SBSTRAND.push_back(s);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
799
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
800 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
801 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
802
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
803 for(unsigned int k = 0; k < SIZE; k++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
804 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
805 int dist;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
806
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
807 if(!MRI->second->get_strand_at(k))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
808 dist = (int)SBPOS.at(k) - (int)MRI->second->get_pos_at(k);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
809 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
810 dist = ((int)(RSIZE-1) - (int)SBPOS.at(k)) - ((int)(RSIZE - 1) - (int)MRI->second->get_pos_at(k));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
811
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
812 hit_v.at((RSIZE-1) + dist)++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
813 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
814
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
815 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
816 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
817 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
818 for(unsigned int k = 0; k < SIZE; k++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
819 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
820 int dist;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
821
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
822 if(!MRI->second->get_strand_at(k))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
823 dist = (int)MRI2->second->get_pos_at(k) - (int)MRI->second->get_pos_at(k);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
824 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
825 dist = ((int)(RSIZE - 1 ) - (int)MRI2->second->get_pos_at(k)) - ((int)(RSIZE - 1 ) - (int)MRI->second->get_pos_at(k));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
826
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
827 // if(!QUIET) cerr << endl << (int)((RSIZE-1) + dist) << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
828
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
829 hit_v.at((RSIZE-1) + dist)++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
830 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
831 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
832
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
833 if((!obstf.empty() && obstf == MRI->second->id()) || obstf.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
834 out << MRI->second->name() << "|" << MRI2->second->name() << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
835
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
836 if(!obstf.empty() && obstf == MRI->second->id())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
837 out3 << MRI->second->name() << "|" << MRI2->second->name() << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
838
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
839 for(unsigned int p = 0; p < (RSIZE*2) - 1; p++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
840 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
841 if((!obstf.empty() && obstf == MRI->second->id()) || obstf.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
842 out << hit_v[p] << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
843
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
844 if(!obstf.empty() && obstf == MRI->second->id())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
845 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
846 map<int, double>::iterator ri = R_dist_map.find(p - (RSIZE - 1));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
847
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
848 if(hit_v[p] >= DIST_HIT_THRESHOLD && hit_v[p]/(ri->second * SIZE) >= DIST_RATIO_THRESHOLD)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
849 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
850 double pv = gsl_cdf_binomial_Q(hit_v[p], ri->second, SIZE);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
851
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
852 if(pv <= DIST_PV_THRESHOLD)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
853 out3 << pv << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
854 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
855 out3 << "NA" << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
856 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
857 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
858 out3 << "NA" << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
859 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
860 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
861
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
862 if((!obstf.empty() && obstf == MRI->second->id()) || obstf.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
863 out << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
864
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
865 if(!obstf.empty() && obstf == MRI->second->id())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
866 out3 << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
867
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
868 MRI2++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
869 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
870
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
871 MRI++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
872 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
873
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
874 out.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
875
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
876 if(!obstf.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
877 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
878 out2.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
879 out3.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
880 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
881
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
882 if(!LCOUNT)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
883 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
884 remove(dist_outfile.c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
885
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
886 if(!obstf.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
887 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
888 remove(dist2_outfile.c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
889 remove(dist3_outfile.c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
890 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
891 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
892
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
893 if(!QUIET) cerr << "\nDistance analysis written in file: " << dist_outfile << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
894
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
895 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
896 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
897
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
898 void scanner(vector<matrix> *Mat, vector<sequence> *Seq)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
899 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
900 for(unsigned int i = 0; i < Mat->size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
901 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
902 if(VERBOSE)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
903 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
904 if(!QUIET) cerr << "\nScanning sequences for "
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
905 << Mat->at(i).name() << " (" << Mat->at(i).id() << ")"<< endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
906 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
907
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
908 Mat->at(i).scan(Seq);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
909 Mat->at(i).calc_var((double)Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
910
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
911 if(POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
912 Mat->at(i).calc_W_param((double)Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
913
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
914 if(VERBOSE)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
915 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
916 if(!QUIET) cerr << "\nRegions avg = " << Mat->at(i).R_Avg << '\t' << "Flanks avg = " << Mat->at(i).F_Avg << '\t'
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
917 << "Regions devstd = " << pow(Mat->at(i).R_Var,0.5) << '\t' << "Flanks devstd = " << pow(Mat->at(i).F_Var,0.5);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
918 if(!QUIET) cerr << "\nDoing Welch's t test... ";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
919 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
920
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
921 Mat->at(i).welch_test((double)Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
922
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
923 if(Mat->at(i).have_bg())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
924 Mat->at(i).welch_test_bg((double)Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
925
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
926 if(POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
927 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
928 // Mat->at(i).welch_test_pos((double)Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
929 Mat->at(i).z_test_pos((double)Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
930 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
931
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
932 if(VERBOSE)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
933 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
934 if(!QUIET) cerr << "done. Pvalue = " << Mat->at(i).get_pvalue() << ' ' << Mat->at(i).o_or_u() << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
935 if(!QUIET) cerr << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
936 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
937 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
938
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
939 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
940 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
941
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
942 void acquire_matrices(vector<matrix> *Mat, map<string,bg> *Bg, string *matfile)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
943 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
944 ifstream in(matfile->c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
945 string line;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
946
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
947 if(!in)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
948 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
949 if(!QUIET) cerr << "Can't find " << *matfile << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
950 exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
951 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
952
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
953 while(getline(in,line))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
954 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
955 if(line.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
956 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
957
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
958 vector<string> mbuf;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
959 mbuf.push_back(line);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
960
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
961 for(unsigned int i = 0; i < ALPHABET_SIZE; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
962 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
963 getline(in,line);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
964
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
965 if(!line.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
966 mbuf.push_back(line);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
967 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
968
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
969 if(mbuf.size() == ALPHABET_SIZE + 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
970 Mat->push_back(matrix(&mbuf,Bg));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
971 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
972
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
973 in.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
974
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
975 vector<matrix>::iterator vi = Mat->begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
976
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
977 while(vi != Mat->end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
978 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
979 if(!vi->is_good())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
980 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
981 vi = Mat->erase(vi);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
982 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
983 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
984
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
985 vi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
986 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
987
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
988 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
989 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
990
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
991 void acquire_background(map<string, bg> *Bg)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
992 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
993 ifstream in(bgfile.c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
994
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
995 if(!in)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
996 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
997 if(!QUIET) cerr << "\nWarning: background file " << bgfile << " not found..." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
998 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
999 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1000
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1001 string line;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1002
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1003 getline(in,line);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1004
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1005 while(getline(in, line))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1006 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1007 istringstream str(line);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1008 string id, trash;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1009 bg nbg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1010
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1011 str >> trash >> id >> nbg.Size >> trash >> trash >> trash >> trash >> nbg.Avg >> nbg.Var;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1012
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1013 nbg.Var = pow(nbg.Var,2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1014
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1015 Bg->insert(make_pair(id,nbg));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1016 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1017
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1018 in.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1019 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1020 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1021
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1022 void acquire_regions(vector<sequence> *Seq)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1023 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1024 ifstream in(regfile.c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1025 // map<string, vector<string> > Regs;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1026 map<string, map<unsigned int, string> > Regs; //PREVENT REG DUPLICATES
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1027 map<string, map<unsigned int, unsigned int > > M_RANK;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1028
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1029 if(!in)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1030 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1031 if(!QUIET) cerr << "Can't find " << regfile << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1032 exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1033 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1034
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1035 string line;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1036
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1037 unsigned int r_count = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1038
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1039 while(getline(in,line))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1040 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1041 if(line.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1042 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1043
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1044 if(line[0] == '#')
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1045 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1046
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1047 for(unsigned int i = 0; i < 3; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1048 line[i] = tolower(line[i]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1049
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1050 for(unsigned int i = 3; i < line.size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1051 line[i] = toupper(line[i]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1052
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1053 istringstream str(line);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1054 string chr;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1055 unsigned int start, end, mp;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1056
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1057 str >> chr >> start >> end;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1058
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1059 // Regs[chr].push_back(line);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1060 mp = start + ((end - start)/2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1061
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1062 if(mp > (RSIZE + RSIZE/2) + 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1063 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1064 Regs[chr][mp] = line;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1065
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1066 // if(!QUIET) cerr << endl << line;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1067
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1068 if(M_RANK.find(chr) != M_RANK.end()) //PREVENT REGIONS PRESENT MORE THAN ONCE TO DO TOO MUCH MESS WITH SPEARMAN CORRELATION
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1069 if(M_RANK[chr].find(mp) != M_RANK[chr].end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1070 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1071
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1072 M_RANK[chr][mp] = r_count;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1073 r_count++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1074 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1075 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1076 if(!QUIET) cerr << "\nSkipping region: too close to chromosome start..." << endl << line << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1077 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1078
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1079 in.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1080
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1081 map<string, map<unsigned int, string> >::iterator mi = Regs.begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1082
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1083 if(!TWOBIT)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1084 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1085 while(mi != Regs.end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1086 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1087 string file = genome;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1088 file += "/";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1089 file += mi->first;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1090 file += ".raw";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1091
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1092 in.open(file.c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1093
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1094 if(!in)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1095 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1096 if(!QUIET) cerr << "\nCan't find " << file << ". Skipping chromosome:\n" << mi->first << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1097
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1098 if(SPEARMAN)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1099 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1100 if(!QUIET) cerr << "\nSpearman correlation disabled..." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1101 SPEARMAN = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1102 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1103
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1104 mi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1105 in.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1106 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1107 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1108
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1109 map<unsigned int, string>::iterator si = mi->second.begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1110
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1111 while(si != mi->second.end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1112 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1113 Seq->push_back(sequence(&si->second, &in, M_RANK[mi->first][si->first]));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1114 si++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1115 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1116
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1117 in.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1118 mi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1119 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1120 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1121 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1122 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1123 ostringstream str;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1124 ofstream outfile;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1125 str << ".pchip." << rand() << ".tmp";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1126 string tmp1 = str.str();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1127 outfile.open(tmp1.c_str(), ios::out);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1128 vector<string> k1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1129 vector<unsigned int> k2;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1130
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1131 while(mi != Regs.end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1132 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1133 map<unsigned int, string>::iterator si = mi->second.begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1134
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1135 while(si != mi->second.end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1136 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1137 unsigned int Start, End;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1138
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1139 Start = si->first - RSIZE;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1140 End = si->first + RSIZE + 1 + MAX_L;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1141
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1142 outfile << mi->first << '\t' << Start << '\t' << End << '\t' << "." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1143
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1144 k1.push_back(mi->first);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1145 k2.push_back(si->first);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1146
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1147 si++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1148 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1149
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1150 mi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1151 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1152
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1153 string cline = "twoBitToFa -bedPos -bed=";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1154 cline += str.str();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1155 str << ".fa";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1156 cline += " ";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1157 cline += genome;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1158 /* cline += "/";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1159 cline += genome;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1160 cline += ".2bit "; */
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1161 cline += " ";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1162 cline += str.str();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1163
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1164 // if(!QUIET) cerr << endl << "TwoBit command line:\n" << cline << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1165
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1166 if(system(cline.c_str()) != 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1167 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1168 if(!QUIET) cerr << endl << "twoBitToFa returned non 0 error code... aborting pscan_chip run!\n" << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1169 exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1170 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1171 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1172 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1173 ifstream in(str.str().c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1174 string seq;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1175 seq.clear();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1176
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1177 if(!in)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1178 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1179 if(!QUIET) cerr << endl << "Can't access twoBitToFa output file! Aborting pscan_chip run!\n" << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1180 exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1181 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1182
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1183 unsigned int scount = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1184
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1185 while(getline(in,line))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1186 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1187 if(line.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1188 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1189
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1190 if(line[0] == '>')
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1191 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1192 if(seq.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1193 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1194 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1195 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1196 Seq->push_back(sequence(&seq, M_RANK[k1.at(scount)][k2.at(scount)], k1.at(scount), k2.at(scount)));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1197 seq.clear();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1198 scount++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1199 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1200 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1201 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1202 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1203 seq += line;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1204 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1205
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1206 Seq->push_back(sequence(&seq, M_RANK[k1.at(scount)][k2.at(scount)], k1.at(scount), k2.at(scount))); //LAST SEQUENCE!
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1207
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1208 in.close();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1209 remove(str.str().c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1210 remove(tmp1.c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1211 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1212
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1213 // exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1214 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1215
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1216 vector<sequence>::iterator vi = Seq->begin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1217
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1218 while(vi != Seq->end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1219 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1220 if(!vi->is_good())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1221 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1222 vi = Seq->erase(vi);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1223 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1224 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1225
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1226 vi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1227 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1228
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1229 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1230 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1231
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1232 void command_line_parser(int argc, char **argv)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1233 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1234 if(argc == 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1235 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1236
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1237 for(int i = 1; i < argc; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1238 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1239 string buf = argv[i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1240
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1241 if(buf == "-r")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1242 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1243 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1244 regfile = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1245 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1246 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1247
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1248 if(buf == "-g")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1249 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1250 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1251 genome = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1252 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1253 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1254
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1255 if(buf == "-s")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1256 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1257 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1258 RSIZE = atoi(argv[++i]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1259 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1260 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1261 if(buf == "-bgavg")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1262 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1263 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1264 SINGLE_MATRIX_BG_AVG = atof(argv[++i]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1265 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1266 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1267 if(buf == "-M")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1268 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1269 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1270 matrixfile = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1271 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1272 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1273 if(buf == "-MADD")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1274 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1275 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1276 additional_matrixfile = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1277 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1278 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1279 if(buf == "-m")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1280 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1281 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1282 selected = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1283 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1284 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1285
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1286 if(buf == "-bg")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1287 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1288 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1289 bgfile = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1290 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1291 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1292 if(buf == "-go")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1293 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1294 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1295 GALAXY_OUTPUT = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1296 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1297 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1298 if(buf == "-obs")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1299 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1300 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1301 obstf = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1302
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1303 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1304 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1305 if(buf == "-ss")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1306 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1307 SINGLE_STRAND = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1308 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1309 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1310 if(buf == "-2bit")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1311 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1312 TWOBIT = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1313 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1314 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1315 if(buf == "-quiet")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1316 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1317 QUIET = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1318 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1319 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1320 if(buf == "-sbp")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1321 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1322 SECOND_BEST_POS = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1323 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1324 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1325 if(buf == "-fasta")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1326 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1327 GET_SEQUENCES = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1328 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1329 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1330 if(buf == "-pos")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1331 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1332 POSITIONAL = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1333 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1334 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1335 if(buf == "-spear")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1336 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1337 SPEARMAN = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1338 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1339 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1340 if(buf == "-wsize")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1341 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1342 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1343 W_SIZE = atoi(argv[++i]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1344
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1345 W_STEP = W_SIZE / 2;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1346 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1347 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1348 /* if(buf == "-wstep")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1349 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1350 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1351 W_STEP = atoi(argv[++i]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1352 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1353 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1354
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1355 if(buf == "-fast")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1356 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1357 FAST_SCAN = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1358 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1359 }*/
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1360 /* if(buf == "-naive")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1361 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1362 NAIVE = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1363 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1364 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1365 */
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1366 if(buf == "-v")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1367 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1368 VERBOSE = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1369 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1370 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1371 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1372 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1373 if(!QUIET) cerr << "\nUnknown option: " << buf << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1374 exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1375 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1376
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1377 /* if(buf == "-Q")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1378 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1379 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1380 idfile = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1381 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1382 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1383 if(buf == "-ql")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1384 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1385 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1386 q_idlist = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1387 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1388 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1389 if(buf == "-imgm")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1390 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1391 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1392 bg_for_img = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1393 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1394 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1395 if(buf == "-magic")
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1396 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1397 if(i < argc - 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1398 magic = argv[++i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1399 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1400 }*/
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1401 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1402
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1403 if(RSIZE > MAX_REG_SIZE)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1404 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1405 if(!QUIET) cerr << "\nRegion size exceeds " << MAX_REG_SIZE << "..." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1406 exit(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1407 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1408
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1409 if(RSIZE % W_SIZE != 0 || W_SIZE % 2 != 0 || RSIZE / W_SIZE < 5)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1410 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1411 if(!QUIET) cerr << "\nWindow size must be even and both an exact divisor of region size and at least five times smaller of it: positional analysis disabled." << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1412 POSITIONAL = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1413 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1414
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1415 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1416 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1417
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1418 //SEQUENCE CLASS BEGIN
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1419
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1420 sequence::sequence(string *seq, unsigned int R, string chr, unsigned int mp) //CONSTRUCTOR FOR 2BIT INPUT
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1421 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1422 Chr = chr;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1423 Strand = '+';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1424 AntiStrand = '-';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1425 E_Rank = R;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1426 good = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1427
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1428 Start = mp - RSIZE/2;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1429 End = (mp + RSIZE/2) - 1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1430
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1431 for(unsigned int i = 0; i < seq->size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1432 seq->at(i) = toupper(seq->at(i));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1433
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1434 Seq = new char[(RSIZE*2) + 1 + MAX_L];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1435
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1436 // if(!QUIET) cerr << "\nseq.size = " << seq->size() << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1437 // if(!QUIET) cerr << "\narray.size = " << (RSIZE*2) + 1 + MAX_L << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1438
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1439 strcpy(Seq, seq->c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1440
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1441 if(seq->size() != RSIZE*2 + MAX_L + 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1442 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1443 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1444 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1445 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1446
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1447 if(GET_SEQUENCES)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1448 fasta_out << ">" << Chr << '\t' << Start + 1 << '\t' << End + 1 << endl << seq->substr(RSIZE/2, RSIZE) << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1449
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1450 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1451 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1452
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1453 sequence::sequence(string *line, ifstream *in, unsigned int R)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1454 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1455 istringstream str(*line);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1456 string trash;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1457 int buf_s, buf_e, mp;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1458 good = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1459
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1460 E_Rank = R;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1461
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1462 str >> Chr >> buf_s >> buf_e >> Name >> trash >> Strand;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1463
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1464 if(Strand == 'R')
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1465 Strand = '-';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1466
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1467 if(Strand != '+' && Strand != '-')
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1468 Strand = '+';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1469
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1470 if(Strand == '+')
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1471 AntiStrand = '-';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1472 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1473 AntiStrand = '+';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1474
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1475 mp = buf_s + ((buf_e - buf_s)/2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1476
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1477 Start = mp - RSIZE/2;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1478 End = (mp + RSIZE/2) - 1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1479
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1480 // Seq = new char[RSIZE + 1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1481 // UF_Seq = new char[(RSIZE/2) + 1 + MAX_L/2];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1482 // DF_Seq = new char[(RSIZE/2) + 1 + MAX_L/2];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1483
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1484 Seq = new char[(RSIZE*2) + 1 + MAX_L];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1485
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1486 in->seekg((Start) - RSIZE/2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1487
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1488 in->get(Seq, (RSIZE*2 + 1) + MAX_L);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1489
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1490 if(in->gcount() != RSIZE*2 + MAX_L)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1491 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1492 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1493 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1494 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1495
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1496 if(GET_SEQUENCES)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1497 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1498 char *out_seq;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1499 out_seq = new char[RSIZE + 1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1500
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1501 in->seekg(Start);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1502 in->get(out_seq, (RSIZE + 1));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1503
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1504 fasta_out << ">" << Chr << '\t' << Start + 1 << '\t' << End + 1 << '\t' << "---" << '\t' << buf_s << '\t' << buf_e << '\t' << endl << out_seq << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1505
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1506 delete[] out_seq;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1507 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1508
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1509 /*in->seekg(((Start - 1) - RSIZE/2) - (MAX_L/2));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1510
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1511 in->get(UF_Seq, RSIZE/2 + 1 + MAX_L /2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1512
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1513 if(in->gcount() != RSIZE/2 + (MAX_L/2))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1514 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1515 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1516 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1517 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1518
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1519 in->get(Seq, RSIZE + 1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1520
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1521 if(in->gcount() != RSIZE)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1522 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1523 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1524 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1525 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1526
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1527 in->get(DF_Seq, RSIZE/2 + 1 + (MAX_L/2));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1528
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1529 if(in->gcount() != RSIZE/2 + (MAX_L/2))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1530 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1531 */
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1532
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1533 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1534 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1535
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1536 unsigned int sequence::e_rank()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1537 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1538 return E_Rank;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1539 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1540
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1541 string sequence::chr()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1542 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1543 return Chr;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1544 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1545
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1546 /*string* sequence::seq()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1547 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1548 return &Seq;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1549 }*/
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1550
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1551 char* sequence::seq()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1552 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1553 return Seq;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1554 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1555
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1556 char sequence::strand()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1557 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1558 return Strand;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1559 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1560
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1561 char sequence::antistrand()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1562 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1563 return AntiStrand;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1564 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1565
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1566 /*char* sequence::uf_seq()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1567 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1568 return UF_Seq;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1569 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1570
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1571 char* sequence::df_seq()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1572 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1573 return DF_Seq;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1574 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1575 */
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1576 string sequence::name()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1577 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1578 return Name;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1579 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1580
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1581 unsigned int sequence::start()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1582 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1583 return Start;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1584 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1585
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1586 unsigned int sequence::end()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1587 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1588 return End;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1589 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1590
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1591 bool sequence::is_good()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1592 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1593 return good;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1594 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1595
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1596 // SEQUENCE CLASS END
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1597
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1598 // MATRIX CLASS BEGIN
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1599
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1600 matrix::matrix(vector<string>* mbuf, map<string, bg> *Bg)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1601 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1602 string buf;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1603 istringstream bstr(mbuf->at(1)), nstr(mbuf->at(0));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1604 L = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1605 R_Avg = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1606 F_Avg = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1607 R_Var = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1608 F_Var = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1609 bg_Avg = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1610 bg_Var = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1611
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1612 BIN_NUM = RSIZE / W_STEP;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1613
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1614 W_R_Avg.resize(BIN_NUM, 0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1615 W_R_Var.resize(BIN_NUM, 0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1616 W_R_pvalue.resize(BIN_NUM, 0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1617 W_R_T_pvalue.resize(BIN_NUM,0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1618 spearman = 42;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1619
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1620 O_U = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1621 O_U_bg = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1622 W_O_U.resize(BIN_NUM, 0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1623
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1624 BG = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1625 good = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1626 norm_sec_step = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1627
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1628 while(bstr >> buf)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1629 L++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1630
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1631 if(L > RSIZE/2)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1632 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1633 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1634 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1635 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1636
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1637 if(L > MAX_L)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1638 MAX_L = L;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1639
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1640 if(!mbuf->at(0).empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1641 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1642 if(mbuf->at(0).at(0) != '>')
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1643 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1644 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1645 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1646 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1647 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1648 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1649 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1650 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1651 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1652 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1653
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1654 // Name = mbuf->at(0).substr(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1655 nstr >> Id >> Name;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1656
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1657 Id = Id.substr(1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1658
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1659 if(!selected.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1660 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1661 // cerr << endl << selected << '\t' << Id << '\t' << Name << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1662
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1663 if(selected != Id && selected != Name)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1664 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1665 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1666 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1667 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1668 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1669
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1670 if(!Bg->empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1671 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1672 map<string,bg>::iterator mi = Bg->find(Id);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1673
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1674 if(mi == Bg->end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1675 mi = Bg->find(Name);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1676
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1677 if(mi != Bg->end())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1678 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1679 bg_Avg = mi->second.Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1680 bg_Var = mi->second.Var;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1681 bg_Size = mi->second.Size;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1682 BG = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1683 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1684 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1685 if(!QUIET) cerr << "\nWarning: no background for matrix: " << Id << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1686 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1687
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1688 M = new double*[L];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1689 rc_M = new double*[L];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1690
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1691 for(unsigned int i = 1; i < ALPHABET_SIZE + 1; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1692 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1693 istringstream str(mbuf->at(i));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1694
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1695 unsigned int count = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1696
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1697 while(str >> buf)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1698 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1699 if(i == 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1700 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1701 M[count] = new double[ALPHABET_SIZE + 1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1702 rc_M[count] = new double[ALPHABET_SIZE + 1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1703 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1704
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1705 M[count][i-1] = atof(buf.c_str());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1706 count++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1707
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1708 if(count > L)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1709 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1710 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1711 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1712 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1713 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1714
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1715 if(count != L)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1716 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1717 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1718 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1719 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1720 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1721
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1722 normalizer();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1723 to_log();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1724 rev_c();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1725 avg();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1726 max_min();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1727 // set_top_pos();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1728
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1729 if(min_score == max_score)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1730 good = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1731
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1732 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1733 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1734
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1735 void matrix::display()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1736 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1737 if(!QUIET) cerr << "\n>" << Name << '\t' << good << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1738
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1739 for(unsigned int i = 0; i < ALPHABET_SIZE; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1740 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1741 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1742 if(!QUIET) cerr << M[j][i] << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1743
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1744 if(!QUIET) cerr << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1745 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1746
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1747 if(!QUIET) cerr << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1748
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1749 // for(unsigned int i = 0; i < TOP_P; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1750 // if(!QUIET) cerr << "TOP[" << i+1 << "] = " << top_pos[i] + 1 << "-" << top_char[i] << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1751
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1752 if(!QUIET) cerr << "\n\n>" << Name << '\t' << good << '\t' << "RC" << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1753
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1754 for(unsigned int i = 0; i < ALPHABET_SIZE; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1755 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1756 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1757 if(!QUIET) cerr << rc_M[j][i] << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1758
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1759 if(!QUIET) cerr << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1760 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1761
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1762 if(!QUIET) cerr << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1763
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1764 // for(unsigned int i = 0; i < TOP_P; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1765 // if(!QUIET) cerr << "TOP[" << i+1 << "] = " << rc_top_pos[i] + 1 << "-" << rc_top_char[i] << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1766
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1767 if(!QUIET) cerr << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1768
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1769 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1770 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1771
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1772 bool matrix::is_good()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1773 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1774 return good;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1775 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1776
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1777
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1778 void matrix::normalizer()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1779 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1780 double *sums = new double[L];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1781
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1782 for(int x = 0; x < L; x++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1783 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1784 sums[x] = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1785
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1786 for(int y = 0; y < ALPHABET_SIZE; y++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1787 sums[x] += M[x][y];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1788 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1789
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1790 for(int x = 0; x < L; x++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1791 for(int y = 0; y < ALPHABET_SIZE; y++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1792 M[x][y] /= sums[x];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1793
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1794 delete[] sums;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1795
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1796 if(!norm_sec_step)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1797 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1798 for(int x = 0; x < L; x++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1799 for(int y = 0; y < ALPHABET_SIZE; y++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1800 M[x][y] += MIN_ADD_FREQ;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1801
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1802 norm_sec_step = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1803
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1804 normalizer();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1805 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1806
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1807 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1808
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1809 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1810
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1811 void matrix::to_log()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1812 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1813 for(int x = 0; x < L; x++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1814 for(int y = 0; y < ALPHABET_SIZE; y++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1815 M[x][y] = log(M[x][y]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1816
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1817 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1818 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1819
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1820 void matrix::avg()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1821 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1822 // mat_avg = new double[L];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1823
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1824 for(int x = 0; x < L; x++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1825 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1826 double buf = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1827
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1828 for(int y = 0; y < ALPHABET_SIZE; y++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1829 buf += M[x][y];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1830
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1831 // mat_avg[x] = buf/ALPHABET_SIZE;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1832 M[x][ALPHABET_SIZE] = buf/ALPHABET_SIZE;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1833 rc_M[(L-1) -x][ALPHABET_SIZE] = buf/ALPHABET_SIZE;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1834 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1835
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1836 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1837 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1838
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1839 void matrix::max_min()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1840 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1841 double min, max;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1842
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1843 max_score = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1844 min_score = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1845
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1846 for(int x = 0; x < L; x++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1847 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1848 min = M[x][0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1849 max = M[x][0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1850
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1851 for(int y = 1; y < ALPHABET_SIZE; y++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1852 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1853 if(M[x][y] < min)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1854 min = M[x][y];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1855
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1856 if(M[x][y] > max)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1857 max = M[x][y];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1858 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1859
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1860 min_score += min;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1861 max_score += max;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1862 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1863
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1864 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1865 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1866
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1867 void matrix::rev_c()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1868 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1869 for(unsigned int x = 0; x < L; x++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1870 for(unsigned int y = 0; y < ALPHABET_SIZE; y++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1871 rc_M[(L - 1) - x][(ALPHABET_SIZE - 1) - y] = M[x][y];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1872
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1873 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1874 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1875
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1876 void matrix::scan(vector<sequence> *Seq)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1877 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1878 v_score.reserve(Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1879 vF_score.reserve(Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1880 v_pos.reserve(Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1881 v_strand.reserve(Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1882
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1883 if(POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1884 W_R_v_score.reserve(Seq->size());
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1885
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1886 unsigned int progress;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1887
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1888 if(!SINGLE_STRAND)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1889 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1890 for(unsigned int i = 0; i < Seq->size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1891 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1892 if(VERBOSE)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1893 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1894 progress = (unsigned int)(((double)(i+1)/(double)Seq->size()) * 100);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1895
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1896 if(!(progress%5))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1897 if(!QUIET) cerr << progress << '%';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1898 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1899
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1900 double max_flank_u, max_flank_d;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1901 vector<double> W_buf(BIN_NUM, 0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1902
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1903 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1904 double r_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1905
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1906 max_flank_u = scan_seq_ds(Seq->at(i).seq() , true, RSIZE/2, &W_buf);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1907 r_score = scan_seq_ds(Seq->at(i).seq() + (RSIZE/2) , false, RSIZE, &W_buf);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1908 max_flank_d = scan_seq_ds(Seq->at(i).seq() + ((RSIZE/2)*3) , true, RSIZE/2, &W_buf);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1909
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1910 R_Avg += r_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1911
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1912 /* if(r_score < max_flank_u || r_score < max_flank_d)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1913 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1914 if(max_flank_u > max_flank_d)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1915 G_Avg += max_flank_u;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1916 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1917 G_Avg += max_flank_d;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1918 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1919 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1920 G_Avg += r_score;*/
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1921
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1922 if(POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1923 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1924 // for(unsigned int i = 0; i < BIN_NUM; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1925 // W_R_Avg[i] += W_buf[i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1926
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1927 W_R_v_score.push_back(W_buf);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1928 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1929
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1930 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1931
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1932 if(max_flank_u > max_flank_d)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1933 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1934 F_Avg += max_flank_u;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1935 vF_score.push_back(max_flank_u);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1936 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1937 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1938 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1939 F_Avg += max_flank_d;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1940 vF_score.push_back(max_flank_d);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1941 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1942
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1943
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1944 if(VERBOSE)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1945 if(!(progress%5))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1946 if(!QUIET) cerr << (char)13;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1947 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1948 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1949 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1950 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1951 for(unsigned int i = 0; i < Seq->size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1952 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1953
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1954 if(VERBOSE)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1955 if(!QUIET) cerr << (unsigned int)(((double)(i+1)/(double)Seq->size()) * 100) << '%';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1956
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1957 double max_flank_u, max_flank_d;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1958 vector<double> W_buf(BIN_NUM, 0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1959
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1960 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1961
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1962 double r_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1963
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1964 max_flank_u = scan_seq_ss(Seq->at(i).seq() , true, RSIZE/2, Seq->at(i).strand(), &W_buf);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1965 r_score += scan_seq_ss(Seq->at(i).seq() + (RSIZE/2) , false, RSIZE, Seq->at(i).strand(), &W_buf);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1966 max_flank_d = scan_seq_ss(Seq->at(i).seq() + ((RSIZE/2)*3), true, RSIZE/2, Seq->at(i).strand(), &W_buf);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1967
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1968 R_Avg += r_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1969
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1970 /* if(r_score < max_flank_u || r_score < max_flank_d)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1971 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1972 if(max_flank_u > max_flank_d)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1973 G_Avg += max_flank_u;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1974 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1975 G_Avg += max_flank_d;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1976 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1977 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1978 G_Avg += r_score;*/
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1979
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1980 if(POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1981 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1982 // for(unsigned int i = 0; i < BIN_NUM; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1983 // W_R_Avg[i] += W_buf[i];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1984
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1985 W_R_v_score.push_back(W_buf);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1986 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1987 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1988
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1989 if(max_flank_u > max_flank_d)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1990 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1991 F_Avg += max_flank_u;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1992 vF_score.push_back(max_flank_u);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1993 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1994 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1995 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1996 F_Avg += max_flank_d;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1997 vF_score.push_back(max_flank_d);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1998 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
1999
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2000 if(VERBOSE)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2001 if(!QUIET) cerr << (char)13;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2002 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2003 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2004
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2005 R_Avg /= Seq->size();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2006 F_Avg /= Seq->size();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2007 // G_Avg /= Seq->size();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2008
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2009 // for(unsigned int i = 0; i < BIN_NUM; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2010 // W_R_Avg[i] /= Seq->size();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2011
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2012 if(SPEARMAN)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2013 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2014 multimap<double, unsigned int> SRM;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2015
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2016 for(unsigned int i = 0; i < v_score.size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2017 SRM.insert(make_pair(v_score[i], i));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2018
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2019 multimap<double, unsigned int>::reverse_iterator mmi = SRM.rbegin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2020 int sr = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2021 double d = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2022
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2023 while(mmi != SRM.rend())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2024 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2025 // if(!QUIET) cerr << endl << mmi->first << '\t' << sr << '\t' << Seq->at(mmi->second).e_rank() << '\t' << this->name();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2026
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2027 d += pow((sr - (int)Seq->at(mmi->second).e_rank()), 2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2028 sr++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2029 mmi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2030 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2031
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2032 d *= 6;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2033
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2034 // if(!QUIET) cerr << endl << "d = " << d << "\tden = " << (Seq->size() * (pow(Seq->size(), 2) - 1)) << '\t' << "ssize = " << Seq->size();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2035
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2036 d /= (Seq->size() * (pow(Seq->size(), 2) - 1));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2037
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2038 spearman = 1 - d;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2039 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2040
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2041 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2042 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2043
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2044 void matrix::calc_var(double S)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2045 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2046 for(unsigned int i = 0; i < S; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2047 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2048 R_Var += pow(v_score[i] - R_Avg,2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2049 F_Var += pow(vF_score[i] - F_Avg,2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2050
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2051 /* if(v_score[i] >= vF_score[i])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2052 G_Var += pow(v_score[i] - G_Avg,2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2053 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2054 G_Var += pow(vF_score[i] - G_Avg,2);*/
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2055 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2056
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2057 if(S > 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2058 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2059 R_Var /= (S - 1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2060 F_Var /= (S - 1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2061 // G_Var /= (S - 1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2062 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2063
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2064 if(R_Var == 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2065 R_Var += EPSILON;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2066
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2067 if(F_Var == 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2068 F_Var += EPSILON;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2069
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2070 // if(G_Var == 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2071 // G_Var += EPSILON;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2072
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2073 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2074 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2075
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2076 void matrix::calc_W_param(double S)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2077 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2078 if(S > 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2079 S = S/2; //SOLO PER LA PRIMA META' DELLE SEQUENZE!!!
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2080
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2081 W_Avg = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2082 W_Var = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2083
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2084 multimap<double, unsigned int> score_seq_map;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2085
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2086 for(unsigned int i = 0; i < v_score.size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2087 score_seq_map.insert(make_pair(v_score.at(i), i));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2088
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2089 multimap<double, unsigned int>::reverse_iterator mi = score_seq_map.rbegin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2090
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2091 for(unsigned int i = 0; i < S; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2092 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2093 for(unsigned int j = 0; j < BIN_NUM; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2094 W_R_Avg[j] += W_R_v_score[mi->second][j];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2095
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2096 // if(!QUIET) cerr << Name << '\t' << mi->first << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2097
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2098 mi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2099 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2100
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2101 for(unsigned int j = 0; j < BIN_NUM; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2102 W_R_Avg[j] /= S;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2103
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2104 mi = score_seq_map.rbegin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2105
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2106 for(unsigned int i = 0; i < S; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2107 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2108 for(unsigned int j = 0; j < BIN_NUM; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2109 W_R_Var[j] += pow(W_R_v_score[mi->second][j] - W_R_Avg[j],2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2110
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2111 mi++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2112 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2113
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2114 /* for(unsigned int i = 0; i < S; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2115 for(unsigned int j = 0; j < BIN_NUM; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2116 W_R_Var[j] += pow(W_R_v_score[i][j] - W_R_Avg[j],2);*/
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2117
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2118 if(S > 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2119 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2120 for(unsigned int j = 0; j < BIN_NUM; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2121 W_R_Var[j] /= (S - 1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2122 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2123
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2124 for(unsigned int j = 0; j < BIN_NUM; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2125 if(W_R_Var[j] == 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2126 W_R_Var[j] += EPSILON;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2127
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2128 for(unsigned int j = 0; j < BIN_NUM - 1; j++) //THE LAST BIN IS WASTED SINCE IT IS AN HALF BIN
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2129 W_Avg += W_R_Avg[j];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2130
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2131 W_Avg /= (BIN_NUM - 1);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2132
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2133 for(unsigned int j = 0; j < BIN_NUM - 1; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2134 W_Var += pow(W_R_Avg[j] - W_Avg, 2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2135
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2136 W_Var /= (BIN_NUM - 2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2137
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2138 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2139 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2140
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2141 void matrix::welch_test(double S)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2142 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2143 t = R_Avg - F_Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2144
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2145 if(t == 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2146 t = EPSILON;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2147
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2148 t /= pow((R_Var/S) + (F_Var/S),0.5);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2149
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2150 dof = pow((R_Var/S) + (F_Var/S),2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2151
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2152 dof /= (pow(R_Var,2)/((pow(S,2)) * (S-1))) + (pow(F_Var,2)/((pow(S,2)) * (S-1)));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2153
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2154 if(t > 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2155 pvalue = gsl_cdf_tdist_Q(t,dof);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2156 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2157 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2158 pvalue = gsl_cdf_tdist_P(t,dof);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2159 O_U = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2160 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2161
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2162 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2163 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2164
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2165 void matrix::z_test_pos(double S)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2166 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2167 // if(!QUIET) cerr << endl << Name;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2168
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2169 for(unsigned int i = 0; i < BIN_NUM; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2170 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2171 double se = sqrt(W_R_Var.at(i)), z;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2172 se /= sqrt(S/2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2173
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2174 z = W_R_Avg.at(i) - W_Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2175 z /=se;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2176
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2177 if(z >= 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2178 W_O_U.at(i) = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2179
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2180 W_R_pvalue.at(i) = gsl_cdf_ugaussian_Q(z);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2181
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2182 // if(!QUIET) cerr << endl << "W_R_Avg.at(i) " << W_R_Avg.at(i) << '\t' << W_Avg << '\t' << W_R_pvalue.at(i) << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2183
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2184 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2185
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2186 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2187 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2188
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2189 void matrix::welch_test_pos(double S)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2190 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2191 if(S > 1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2192 S = S/2; //SOLO LA PRIMA META' DELLE SEQUENZE!!!
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2193
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2194 // if(!QUIET) cerr << "\nRAVG = " << W_Avg << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2195 for(unsigned int i = 0; i < BIN_NUM; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2196 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2197 double T, DOF;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2198
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2199 T = W_R_Avg.at(i) - W_Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2200
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2201 // if(!QUIET) cerr << W_R_Avg.at(i) << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2202
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2203 // if(!QUIET) cerr << endl << Name << endl << "T = " << T << '\t' << W_R_Avg.at(i) << '\t' << W_Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2204
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2205 if(T == 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2206 T = EPSILON;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2207
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2208 T /= pow((W_R_Var.at(i)/S) + (W_Var/S),0.5);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2209
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2210 DOF = pow((W_R_Var.at(i)/S) + (W_Var/S),2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2211
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2212 DOF /= (pow(W_R_Var.at(i),2)/((pow(S,2)) * (S-1))) + (pow(W_Var,2)/((pow(S,2)) * (S-1)));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2213
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2214 if(T > 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2215 W_R_T_pvalue.at(i) = gsl_cdf_tdist_Q(T,DOF);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2216 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2217 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2218 W_R_T_pvalue.at(i) = gsl_cdf_tdist_P(T,DOF);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2219 W_O_U.at(i) = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2220 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2221
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2222 // if(!QUIET) cerr << "\tPV= " << W_R_pvalue.at(i);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2223
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2224 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2225
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2226 // if(!QUIET) cerr << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2227
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2228 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2229 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2230
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2231 void matrix::welch_test_bg(double S1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2232 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2233 double S2 = bg_Size;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2234
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2235 // if(!QUIET) cerr << Name << '\t' << R_Avg << '\t' << bg_Avg << '\t' << R_Var << '\t' << bg_Var << '\t' << S1 << '\t' << S2 << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2236
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2237 t_bg = R_Avg - bg_Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2238
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2239 if(t_bg == 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2240 t_bg = EPSILON;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2241
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2242 t_bg /= pow((R_Var/S1) + (bg_Var/S2),0.5);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2243
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2244 dof_bg = pow((R_Var/S1) + (bg_Var/S2),2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2245
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2246 dof_bg /= (pow(R_Var,2)/((pow(S1,2)) * (S1-1))) + (pow(bg_Var,2)/((pow(S2,2)) * (S2-1)));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2247
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2248 if(t_bg > 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2249 pvalue_bg = gsl_cdf_tdist_Q(t_bg,dof_bg);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2250 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2251 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2252 pvalue_bg = gsl_cdf_tdist_P(t_bg,dof_bg);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2253 O_U_bg = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2254 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2255
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2256 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2257 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2258
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2259 /*void matrix::welch_test_bg_G(double S1)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2260 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2261 double S2 = bg_Size;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2262
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2263 // if(!QUIET) cerr << Name << '\t' << R_Avg << '\t' << bg_Avg << '\t' << R_Var << '\t' << bg_Var << '\t' << S1 << '\t' << S2 << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2264
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2265 t_bg = G_Avg - bg_Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2266
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2267 if(t_bg == 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2268 t_bg = EPSILON;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2269
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2270 t_bg /= pow((G_Var/S1) + (bg_Var/S2),0.5);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2271
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2272 dof_bg = pow((G_Var/S1) + (bg_Var/S2),2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2273
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2274 dof_bg /= (pow(G_Var,2)/((pow(S1,2)) * (S1-1))) + (pow(bg_Var,2)/((pow(S2,2)) * (S2-1)));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2275
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2276 if(t_bg > 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2277 pvalue_bg = gsl_cdf_tdist_Q(t_bg,dof_bg);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2278 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2279 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2280 pvalue_bg = gsl_cdf_tdist_P(t_bg,dof_bg);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2281 O_U_bg = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2282 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2283
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2284 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2285 }*/
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2286
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2287 double matrix::scan_seq_ds(char *S, bool flank, unsigned int l, vector<double> *W_buf)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2288 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2289 unsigned int pos = 0, max_pos = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2290 double seq_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2291 bool strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2292
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2293 l -= L/2;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2294
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2295 while(pos < l)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2296 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2297
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2298 double pos_score[2] = {0,0};
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2299
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2300 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2301 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2302 pos_score[0] += get_M_value(j, S[pos+j]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2303 pos_score[1] += get_rc_M_value(j, S[pos+j]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2304 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2305
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2306 if(seq_score < pos_score[0] || !pos)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2307 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2308 seq_score = pos_score[0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2309 max_pos = pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2310 strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2311 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2312 if(seq_score < pos_score[1])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2313 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2314 seq_score = pos_score[1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2315 max_pos = pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2316 strand = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2317 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2318
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2319 if(!flank && POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2320 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2321 unsigned int vpos = pos / W_STEP;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2322
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2323 if(W_buf->at(vpos) < pos_score[0] || !(pos % W_STEP))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2324 W_buf->at(vpos) = pos_score[0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2325
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2326 if(W_buf->at(vpos) < pos_score[1])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2327 W_buf->at(vpos) = pos_score[1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2328
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2329 if(vpos)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2330 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2331 if(W_buf->at(vpos - 1) < pos_score[0])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2332 W_buf->at(vpos - 1) = pos_score[0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2333
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2334 if(W_buf->at(vpos - 1) < pos_score[1])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2335 W_buf->at(vpos - 1) = pos_score[1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2336 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2337 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2338
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2339 pos++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2340 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2341
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2342 seq_score = 1 + (seq_score - max_score)/(max_score - min_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2343
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2344 if(!flank && POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2345 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2346 // if(!QUIET) cerr << endl << Name << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2347
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2348 unsigned int binm = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2349
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2350 for(unsigned int i = 0; i < BIN_NUM; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2351 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2352 if(W_buf->at(i) != 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2353 W_buf->at(i) = 1 + (W_buf->at(i) - max_score)/(max_score - min_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2354 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2355 binm++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2356 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2357
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2358 BIN_NUM -= binm;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2359 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2360
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2361 if(!flank)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2362 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2363 v_score.push_back(seq_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2364 v_pos.push_back(max_pos + L/2);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2365 v_strand.push_back(strand);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2366 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2367
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2368 return seq_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2369 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2370
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2371 double matrix::scan_seq_ss_second_best(char *S, unsigned int l, unsigned int *P, bool *s, unsigned int POS, bool seq_strand)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2372 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2373 unsigned int pos = 0, max_pos = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2374 double seq_score = min_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2375 bool strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2376
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2377 while(pos < l)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2378 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2379 if(pos == POS)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2380 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2381 pos++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2382 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2383 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2384
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2385 double pos_score[2] = {0,0};
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2386
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2387 if(seq_strand == '+')
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2388 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2389 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2390 pos_score[0] += get_M_value(j, S[pos+j]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2391 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2392 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2393 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2394 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2395 pos_score[0] += get_rc_M_value(j, S[pos+j]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2396 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2397
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2398 if(seq_score < pos_score[0])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2399 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2400 seq_score = pos_score[0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2401 max_pos = pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2402 strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2403 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2404
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2405
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2406 pos++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2407 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2408
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2409 seq_score = 1 + (seq_score - max_score)/(max_score - min_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2410
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2411 *P = max_pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2412 *s = strand;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2413
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2414 return seq_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2415 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2416
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2417 double matrix::scan_seq_ds_second_best(char *S, unsigned int l, unsigned int *P, bool *s, int POS)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2418 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2419 int pos = 0, max_pos = 0, count = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2420 double seq_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2421 bool strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2422
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2423 POS -= L/2;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2424 l -= L/2;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2425
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2426 while(pos < l)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2427 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2428 // if(pos == POS)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2429 if(pos >= (POS - L) && pos <= (POS + L))
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2430 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2431 pos++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2432 continue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2433 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2434
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2435 double pos_score[2] = {0,0};
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2436
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2437 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2438 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2439 pos_score[0] += get_M_value(j, S[pos+j]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2440 pos_score[1] += get_rc_M_value(j, S[pos+j]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2441 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2442
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2443 if(seq_score < pos_score[0] || !count)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2444 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2445 seq_score = pos_score[0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2446 max_pos = pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2447 strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2448 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2449 if(seq_score < pos_score[1])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2450 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2451 seq_score = pos_score[1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2452 max_pos = pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2453 strand = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2454 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2455
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2456 pos++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2457 count++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2458 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2459
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2460 seq_score = 1 + (seq_score - max_score)/(max_score - min_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2461
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2462 *P = max_pos ;//+ L/2;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2463 *s = strand;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2464
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2465 return seq_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2466 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2467
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2468
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2469
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2470 /*double matrix::scan_seq_ds_quick(char *S, bool flank, unsigned int l)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2471 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2472 unsigned int pos = 0, max_pos = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2473 double seq_score = min_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2474 bool strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2475
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2476 while(pos < l)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2477 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2478 double pos_score[2] = {0,0};
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2479
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2480 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2481 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2482 pos_score[0] += get_M_value(p_pos[j], S[pos+p_pos[j]]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2483
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2484 if((pos_score[0] + p_max[j+1]) <= seq_score)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2485 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2486 pos_score[0] = min_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2487 break;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2488 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2489
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2490 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2491
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2492 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2493 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2494 pos_score[1] += get_rc_M_value(rc_p_pos[j], S[pos+rc_p_pos[j]]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2495
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2496 if((pos_score[1] + p_max[j+1]) <= seq_score)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2497 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2498 pos_score[1] = min_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2499 break;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2500 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2501 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2502
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2503 if(seq_score < pos_score[0])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2504 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2505 seq_score = pos_score[0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2506 max_pos = pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2507 strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2508 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2509 if(seq_score < pos_score[1])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2510 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2511 seq_score = pos_score[1];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2512 max_pos = pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2513 strand = true;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2514 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2515
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2516 pos++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2517 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2518
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2519 seq_score = 1 + (seq_score - max_score)/(max_score - min_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2520
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2521 if(!flank)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2522 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2523 v_score.push_back(seq_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2524 v_pos.push_back(max_pos);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2525 v_strand.push_back(strand);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2526 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2527
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2528
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2529 return seq_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2530 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2531 */
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2532 double matrix::scan_seq_ss(char *S, bool flank, unsigned int l, char seq_strand, vector<double> *W_buf)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2533 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2534 unsigned int pos = 0, max_pos = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2535 double seq_score = min_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2536 bool strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2537
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2538 while(pos < l)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2539 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2540 double pos_score[2] = {0,0};
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2541
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2542 if(seq_strand == '+')
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2543 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2544 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2545 pos_score[0] += get_M_value(j, S[pos+j]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2546 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2547 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2548 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2549 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2550 pos_score[0] += get_rc_M_value(j, S[pos+j]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2551 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2552
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2553 if(seq_score < pos_score[0])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2554 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2555 seq_score = pos_score[0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2556 max_pos = pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2557 strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2558 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2559
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2560 if(!flank && POSITIONAL)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2561 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2562 unsigned int vpos = pos / W_STEP;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2563
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2564 if(W_buf->at(vpos) < pos_score[0])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2565 W_buf->at(vpos) = pos_score[0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2566
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2567 if(vpos)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2568 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2569 if(W_buf->at(vpos - 1) < pos_score[0])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2570 W_buf->at(vpos - 1) = pos_score[0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2571 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2572 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2573
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2574 pos++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2575 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2576
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2577 seq_score = 1 + (seq_score - max_score)/(max_score - min_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2578
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2579 if(POSITIONAL && !flank)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2580 for(unsigned int i = 0; i < W_buf->size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2581 W_buf->at(i) = 1 + (W_buf->at(i) - max_score)/(max_score - min_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2582
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2583 if(!flank)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2584 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2585 v_score.push_back(seq_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2586 v_pos.push_back(max_pos);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2587 v_strand.push_back(strand);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2588 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2589
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2590 return seq_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2591 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2592
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2593 /* double matrix::scan_seq_ss_quick(char *S, bool flank, unsigned int l, char seq_strand)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2594 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2595 unsigned int pos = 0, max_pos = 0;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2596 double seq_score = min_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2597 bool strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2598
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2599 while(pos < l)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2600 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2601 double pos_score[2] = {0,0};
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2602
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2603 if(seq_strand == '+')
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2604 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2605 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2606 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2607 pos_score[0] += get_M_value(p_pos[j], S[pos+p_pos[j]]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2608
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2609 if((pos_score[0] + p_max[j+1]) <= seq_score)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2610 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2611 pos_score[0] = min_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2612 break;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2613 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2614
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2615
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2616 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2617 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2618 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2619 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2620 for(unsigned int j = 0; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2621 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2622 pos_score[0] += get_rc_M_value(rc_p_pos[j], S[pos+rc_p_pos[j]]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2623
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2624 if((pos_score[0] + p_max[j+1]) <= seq_score)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2625 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2626 pos_score[0] = min_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2627 break;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2628 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2629
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2630 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2631 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2632
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2633 if(seq_score < pos_score[0])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2634 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2635 seq_score = pos_score[0];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2636 max_pos = pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2637 strand = false;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2638 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2639
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2640 pos++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2641 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2642
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2643 seq_score = 1 + (seq_score - max_score)/(max_score - min_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2644
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2645 if(!flank)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2646 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2647 v_score.push_back(seq_score);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2648 v_pos.push_back(max_pos);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2649 v_strand.push_back(strand);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2650 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2651
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2652 return seq_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2653 }*/
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2654
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2655 double matrix::get_M_value(int pos, char C)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2656 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2657 return M[pos][VI[C]];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2658 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2659
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2660 double matrix::get_rc_M_value(int pos, char C)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2661 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2662 return rc_M[pos][VI[C]];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2663 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2664
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2665 /*
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2666 void matrix::set_top_pos()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2667 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2668 multimap<double, mpoint> Tmap;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2669 vector<double> p_max_buf, rc_p_max_buf;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2670
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2671 for(unsigned int x = 0; x < L; x++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2672 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2673 for(unsigned int y = 0; y < ALPHABET_SIZE; y++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2674 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2675 mpoint p;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2676
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2677 p.x = x;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2678 p.y = y;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2679
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2680 Tmap.insert(make_pair(M[x][y],p));
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2681
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2682 if(!y)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2683 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2684 p_max_buf.push_back(M[x][y]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2685 rc_p_max_buf.push_back(rc_M[x][y]);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2686 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2687 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2688 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2689 if(M[x][y] > p_max_buf.back())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2690 p_max_buf[p_max_buf.size() - 1] = M[x][y];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2691
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2692 if(rc_M[x][y] > rc_p_max_buf.back())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2693 rc_p_max_buf[rc_p_max_buf.size() - 1] = rc_M[x][y];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2694 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2695
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2696 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2697
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2698 // if(!QUIET) cerr << endl << p_max_buf.back();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2699 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2700
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2701 multimap<double, mpoint>::reverse_iterator ri = Tmap.rbegin();
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2702
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2703 for(unsigned int i = 0; i < TOP_P; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2704 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2705 top_pos[i] = ri->second.x;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2706 top_char[i] = ALPHABET[ri->second.y];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2707
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2708 rc_top_pos[i] = (L - 1) - ri->second.x;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2709 rc_top_char[i] = RC_ALPHABET[ri->second.y];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2710
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2711 ri++;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2712 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2713
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2714 // if(!QUIET) cerr << endl << name() << '\t' << max_score << '\t' << min_score << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2715
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2716 while(p_max.size() != p_max_buf.size())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2717 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2718 double buf = -INF;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2719 unsigned int pos;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2720
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2721 for(unsigned int i = 0; i < p_max_buf.size(); i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2722 if(p_max_buf.at(i) > buf)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2723 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2724 pos = i;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2725 buf = p_max_buf.at(i);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2726 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2727
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2728 p_pos.push_back(pos);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2729 rc_p_pos.push_back((L - 1) - pos);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2730
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2731 p_max.push_back(buf);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2732
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2733 p_max_buf[pos] = -INF;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2734 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2735
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2736 for(unsigned int i = 0; i < L; i++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2737 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2738 //if(!QUIET) cerr << p_max[i] << "//"<< '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2739
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2740 for(unsigned int j = i + 1; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2741 p_max[i] += p_max[j];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2742
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2743 // for(unsigned int j = i + 1; j < L; j++)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2744 // rc_p_max[i] += rc_p_max[j];
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2745
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2746 // if(!QUIET) cerr << p_max[i] << "(" << p_pos[i] << ")" << rc_p_max[i] << '\t';
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2747 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2748
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2749 p_max.push_back(0); //WE NEED A 0 AT THE END OF THE VECTOR!
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2750 // rc_p_max.push_back(0);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2751
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2752 // if(!QUIET) cerr << endl;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2753
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2754 return;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2755 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2756 */
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2757 double matrix::get_score_at(unsigned int a)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2758 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2759 return v_score.at(a);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2760 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2761 unsigned int matrix::get_pos_at(unsigned int a)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2762 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2763 return v_pos.at(a);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2764 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2765 bool matrix::get_strand_at(unsigned int a)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2766 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2767 return v_strand.at(a);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2768 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2769
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2770 double matrix::max()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2771 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2772 return max_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2773 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2774
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2775 double matrix::min()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2776 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2777 return min_score;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2778 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2779
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2780 string matrix::name()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2781 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2782 if(!Name.empty())
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2783 return Name;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2784 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2785 return Id;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2786 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2787
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2788 string matrix::id()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2789 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2790 return Id;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2791 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2792
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2793 double matrix::get_pvalue()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2794 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2795 return pvalue;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2796 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2797
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2798 double matrix::get_pvalue_bg()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2799 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2800 return pvalue_bg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2801 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2802
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2803 double matrix::get_W_pvalue(unsigned int pos)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2804 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2805 return W_R_pvalue.at(pos);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2806 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2807
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2808 double matrix::get_W_R_Avg_at_pos(unsigned int pos)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2809 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2810 return W_R_Avg.at(pos);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2811 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2812
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2813 string matrix::o_or_u()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2814 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2815 if(O_U)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2816 return "UNDER";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2817 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2818 return "OVER";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2819 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2820
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2821 string matrix::o_or_u_bg()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2822 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2823 if(O_U_bg)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2824 return "UNDER";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2825 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2826 return "OVER";
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2827 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2828
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2829 int matrix::W_o_or_u(unsigned int pos)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2830 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2831 if(W_O_U[pos])
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2832 return -1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2833 else
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2834 return 1;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2835 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2836
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2837 double matrix::get_R_Avg()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2838 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2839 return R_Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2840 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2841 double matrix::get_F_Avg()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2842 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2843 return F_Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2844 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2845 double matrix::get_R_Var()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2846 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2847 return R_Var;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2848 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2849 double matrix::get_F_Var()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2850 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2851 return F_Var;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2852 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2853 double matrix::get_bg_Avg()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2854 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2855 return bg_Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2856 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2857
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2858 double matrix::get_t()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2859 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2860 return t;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2861 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2862
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2863 double matrix::get_dof()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2864 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2865 return dof;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2866 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2867
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2868 bool matrix::have_bg()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2869 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2870 return BG;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2871 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2872
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2873 unsigned int matrix::bin_num()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2874 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2875 return BIN_NUM;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2876 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2877
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2878 unsigned int matrix::length()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2879 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2880 return L;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2881 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2882
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2883 double matrix::get_spearman()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2884 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2885 double s = spearman;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2886
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2887 s *= 10000;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2888
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2889 if(s > 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2890 s = floor(s);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2891 else if(s < 0)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2892 s = ceil(s);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2893
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2894 s /= 10000;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2895
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2896 return s;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2897 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2898
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2899 double matrix::get_W_Avg()
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2900 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2901 return W_Avg;
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2902 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2903
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2904 double matrix::get_W_R_T_pvalue(unsigned int i)
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2905 {
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2906 return W_R_T_pvalue.at(i);
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2907 }
6a5cfb8a872f Uploaded
fz77
parents:
diff changeset
2908 // MATRIX CLASS END