annotate execute_dwt_var_perFeature.pl @ 0:083bf4961ff1 draft

Imported from capsule None
author devteam
date Thu, 23 Jan 2014 12:31:14 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
1 #!/usr/bin/perl -w
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
2 # Author: Erika Kvikstad
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
3
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
4 use warnings;
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
5 use IO::Handle;
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
6 use POSIX qw(floor ceil);
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
7
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
# Command line: input table, comma-separated column numbers, significance
# level, and the two output paths (p-value table and PDF of plots).
$usage = "execute_dwt_var_perFeature.pl [TABULAR.in] [FEATURE] [ALPHA] [TABULAR.out] [PDF.out] \n";
die $usage unless @ARGV == 5;

#get the input arguments
my $inputFile = $ARGV[0];
my @features = split(/,/,$ARGV[1]);
my $alpha = $ARGV[2];
my $outFile1 = $ARGV[3];
my $outFile2 = $ARGV[4];

# FEATURE and ALPHA are later pasted verbatim into generated R source, so
# anything that is not a plain number would become R code.  Validate them
# before any output file is touched.
die "No feature column given\n$usage" unless @features;
for my $column (@features) {
    # $column aliases the array element, so the trimmed value is stored back.
    $column =~ s/\A\s+//;
    $column =~ s/\s+\z//;
    die "Feature column '$column' is not a positive integer\n$usage"
        unless $column =~ /\A[1-9][0-9]*\z/;
}
my $features_count = scalar(@features);

$alpha =~ s/\A\s+//;
$alpha =~ s/\s+\z//;
die "ALPHA '$alpha' must be a number strictly between 0 and 1\n$usage"
    unless $alpha =~ /\A(?:[0-9]+\.?[0-9]*|\.[0-9]+)(?:[eE][-+]?[0-9]+)?\z/
        && $alpha > 0
        && $alpha < 1;

# Nothing in this script reads from or prints to these handles; the R script
# accesses the same files by path.  Opening them here makes an unreadable
# input or an unwritable output fail immediately, and creates/truncates the
# two output files.
open (INPUT, "<", $inputFile) or die("Could not open file $inputFile: $! \n");
open (OUTPUT2, ">", $outFile1) or die("Could not open file $outFile1: $! \n");
open (OUTPUT3, ">", $outFile2) or die("Could not open file $outFile2: $! \n");
#open (ERROR, ">", "error.txt") or die ("Could not open file error.txt \n");

# choosing meaningful names for the output files
$pvalue = $outFile1;
$pdf = $outFile2;
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
27
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
# write R script
# The generated R source is written to this fixed file name in the current
# working directory.
$r_script = "get_dwt_varPermut.r";

open(Rcmd, ">", $r_script) or die "Cannot open $r_script: $! \n\n";

# First part of the R script: package loading plus the definition of
# dwt_var_permut_getMax().  For every column it is given, that function
#   * stops unless the column is numeric and its length is a power of two,
#   * computes the wavelet variance at each scale,
#   * builds a null distribution from 1000 random permutations of the column,
#   * plots the observed variance together with the alpha/2 and 1-alpha/2
#     rows of the sorted null distribution,
#   * derives a one-sided p-value per scale (right tail when the observed
#     variance is at or above the null median, left tail otherwise),
# and returns a character matrix with columns Wavelet/Variance/Pvalue/Test.
#
# The text contains no Perl variables, so a non-interpolating here-document
# is used and the R code needs no backslash escapes.
print Rcmd <<'END_R_FUNCTION';

######################################################################
# plot multiscale wavelet variance
# create null bands by permuting the original data series
# generate plots and table of wavelet variance including p-values
######################################################################
options(echo = FALSE)
#library("Rwave");
#library("wavethresh");
#library("waveslim");
# turn off diagnostics for de-bugging only, turn back on for functional tests on test
suppressMessages(require("Rwave",quietly=TRUE,warn.conflicts = FALSE));
suppressMessages(require("wavethresh",quietly=TRUE,warn.conflicts = FALSE));
suppressMessages(require("waveslim",quietly=TRUE,warn.conflicts = FALSE));
suppressMessages(require("bitops",quietly=TRUE,warn.conflicts = FALSE));

# to determine if data is properly formatted 2^N observations
is.power2<- function(x){x && !(bitAnd(x,x - 1));}

# dwt : discrete wavelet transform using Haar wavelet filter, simplest wavelet function but later can modify to let user-define the wavelet filter function
dwt_var_permut_getMax <- function(data, names, alpha, filter = 1,family="DaubExPhase", bc = "symmetric", method = "kendall", wf = "haar", boundary = "reflection") {
    max_var = NULL;
    matrix = NULL;
    title = NULL;
    final_pvalue = NULL;
    J = NULL;
    scale = NULL;
    out = NULL;

    print(class(data));
    print(names);
    print(alpha);

    par(mar=c(5,4,4,3),oma = c(4, 4, 3, 2), xaxt = "s", cex = 1, las = 1);

    title<-c("Wavelet","Variance","Pvalue","Test");
    print(title);

    for(i in 1:length(names)){
        temp = NULL;
        results = NULL;
        wave1.dwt = NULL;
        # start a fresh table for this feature so rows of earlier features
        # are not appended to final_pvalue a second time
        out = NULL;

        # if data fails formatting check, do something

        print(is.numeric(as.matrix(data)[, i]));
        if(!is.numeric(as.matrix(data)[, i]))
            stop("data must be a numeric vector");

        print(length(as.matrix(data)[, i]));
        print(is.power2(length(as.matrix(data)[, i])));
        if(!is.power2(length(as.matrix(data)[, i])))
            stop("data length must be a power of two");


        J <- wd(as.matrix(data)[, i], filter.number = filter, family=family, bc = bc)$nlevels;
        print(J);
        temp <- vector(length = J);
        wave1.dwt <- dwt(as.matrix(data)[, i], wf = wf, J, boundary = boundary);
        #print(wave1.dwt);

        temp <- wave.variance(wave1.dwt)[-(J+1), 1];
        print(temp);

        #permutations code :
        feature1 = NULL;
        null = NULL;
        var_lower=limit_lower=NULL;
        var_upper=limit_upper=NULL;
        med = NULL;

        # row indices into the sorted null distribution; keep the lower one
        # at 1 or above, otherwise a very small alpha selects row 0 (nothing)
        limit_lower = max(1, alpha/2*1000);
        print(limit_lower);
        limit_upper = (1-alpha/2)*1000;
        print(limit_upper);

        feature1 = as.matrix(data)[,i];
        for (k in 1:1000) {
            nk_1 = NULL;
            null.levels = NULL;
            var = NULL;
            null_wave1 = NULL;

            nk_1 = sample(feature1, length(feature1), replace = FALSE);
            null.levels <- wd(nk_1, filter.number = filter,family=family ,bc = bc)$nlevels;
            var <- vector(length = length(null.levels));
            null_wave1 <- dwt(nk_1, wf = wf, J, boundary = boundary);
            var<- wave.variance(null_wave1)[-(null.levels+1), 1];
            null= rbind(null, var);
        }
        null <- apply(null, 2, sort, na.last = TRUE);
        var_lower <- null[limit_lower, ];
        var_upper <- null[limit_upper, ];
        med <- (apply(null, 2, median, na.rm = TRUE));

        # plot
        results <- cbind(temp, var_lower, var_upper);
        print(results);
        matplot(results, type = "b", pch = "*", lty = 1, col = c(1, 2, 2),xaxt='n',xlab="Wavelet Scale",ylab="Wavelet variance" );
        mtext(names[i], side = 3, line = 0.5, cex = 1);
        axis(1, at = 1:J , labels=c(2^(0:(J-1))), las = 3, cex.axis = 1);

        # get pvalues by comparison to null distribution
        #out <- (names[i]);
        for (m in 1:length(temp)){
            print(paste("scale", m, sep = " "));
            print(paste("var", temp[m], sep = " "));
            print(paste("med", med[m], sep = " "));
            pv = tail =scale = NULL;
            scale=2^(m-1);
            #out <- c(out, format(temp[m], digits = 3));
            if (temp[m] >= med[m]){
                # R tail test
                print("R");
                tail <- "R";
                pv <- (length(which(null[, m] >= temp[m])))/(length(na.exclude(null[, m])));

            } else {
                if (temp[m] < med[m]){
                    # L tail test
                    print("L");
                    tail <- "L";
                    pv <- (length(which(null[, m] <= temp[m])))/(length(na.exclude(null[, m])));
                }
            }
            print(pv);
            out<-rbind(out,c(paste("Scale", scale, sep="_"),format(temp[m], digits = 3),pv,tail));
        }
        final_pvalue <-rbind(final_pvalue, out);
    }
    colnames(final_pvalue) <- title;
    return(final_pvalue);
}
END_R_FUNCTION
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
166
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
# Escape text so it can be placed between double quotes in R source:
# a backslash or double quote in a path would otherwise end the R string
# early or be read as an R escape sequence.
sub _r_string_body {
    my ($text) = @_;
    $text = '' unless defined $text;
    $text =~ s/(["\\])/\\$1/g;
    return $text;
}

my $r_input_path  = _r_string_body($inputFile);
my $r_pdf_path    = _r_string_body($pdf);
my $r_pvalue_path = _r_string_body($pvalue);

# Second part of the R script: read the input table (no header row) and open
# the PDF device that receives one plot per requested column.
print Rcmd "
# execute
# read in data
data_test = final = NULL;
sub = sub_names = NULL;
data_test <- read.delim(\"$r_input_path\",header=FALSE);
pdf(file = \"$r_pdf_path\", width = 11, height = 8)\n";

# One stanza per requested column: stop if the column does not exist, then
# run the analysis on that column and append its rows to 'final'.
foreach my $feature (@features) {
    print Rcmd "
if ($feature > ncol(data_test))
stop(\"column $feature doesn't exist\");
sub<-data_test[,$feature];
#sub_names <- colnames(data_test);
sub_names<-colnames(data_test)[$feature];
final <- rbind(final,dwt_var_permut_getMax(sub, sub_names,$alpha));\n";
}

# Final part: close the PDF and write the accumulated table, tab-separated.
print Rcmd "

dev.off();
write.table(final, file = \"$r_pvalue_path\", sep = \"\\t\", quote = FALSE, row.names = FALSE);

#eof\n";
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
192
083bf4961ff1 Imported from capsule None
devteam
parents:
diff changeset
# Close the generated R script before R reads it.  Buffered write errors
# (for example a full disk) are only reported by close, so check it.
close(Rcmd) or die "Could not finish writing $r_script: $!\n";

# Run the script through the shell, which performs the < and > redirections;
# R's standard output is captured in "$r_script.out".
my $r_exit = system("R --no-restore --no-save --no-readline < $r_script > $r_script.out");
if ($r_exit == -1) {
    # system returns -1 when the command could not be started at all.
    die "Could not start R: $!\n";
}
elsif ($r_exit & 127) {
    # The low 7 bits of the wait status hold the terminating signal.
    die "R was killed by signal " . ($r_exit & 127) . "\n";
}
elsif ($r_exit != 0) {
    # The exit code proper is in the high byte of the wait status.
    die "R exited with status " . ($r_exit >> 8) . "; see $r_script.out\n";
}

#close the input and output and error files
close(OUTPUT3);
close(OUTPUT2);
close(INPUT);