annotate batch-consistency-plot.r @ 7:d3b45fab16f8 draft

Uploaded
author modencode-dcc
date Fri, 18 Jan 2013 17:30:34 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
7
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
1 # 1-20-10 Qunhua Li
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
2 #
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
3 # This program first plots the correspondence curve and the IDR threshold plot
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
4 # (i.e. number of selected peaks vs IDR) for each pair of samples
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
5 #
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
6 # usage:
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
7 # Rscript batch-consistency-plot.r [npairs] [output.prefix] [input.file.prefix 1, 2, 3 ...]
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
8 # [npairs]: integer, number of consistency analyses
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
9 # (e.g. if 2 replicates, npairs=1; if 3 replicates, npairs=3)
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
10 # [output.prefix]: output directory and file name prefix for the plot, e.g. /plots/idrPlot ("-plot.ps" is appended to it)
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
11 # [input.file.prefix 1, 2, 3]: prefixes of the output files from batch-consistency-analysis2, which are the input files for the merged analysis (i.e. saved.file.prefix; see below for examples). Multiple prefixes can be given; for each one, the files <prefix>-uri.sav and <prefix>-em.sav are loaded.
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
12 #
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
13
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
14 args <- commandArgs(trailingOnly=T)
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
15 npair <- args[1] # number of curves to plot on the same figure
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
16 output.file.prefix <- args[2] # file name for plot, generated from script at the outer level
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
17 df.txt <- 10
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
18 ntemp <- as.numeric(npair)
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
19 saved.file.prefix <- list() # identifier of filenames that contain the em and URI results
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
20 source("/mnt/galaxyTools/galaxy-central/tools/modENCODE_DCC_tools/idr/functions-all-clayton-12-13.r")
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
21
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
22 uri.list <- list()
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
23 uri.list.match <- list()
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
24 ez.list <- list()
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
25 legend.txt <- c()
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
26 em.output.list <- list()
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
27 uri.output.list <- list()
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
28
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
29 for(i in 1:npair){
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
30 saved.file.prefix[i] <- args[2+i]
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
31
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
32 load(paste(saved.file.prefix[i], "-uri.sav", sep=""))
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
33 load(paste(saved.file.prefix[i], "-em.sav", sep=""))
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
34
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
35 uri.output.list[[i]] <- uri.output
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
36 em.output.list[[i]] <- em.output
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
37
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
38 ez.list[[i]] <- get.ez.tt.all(em.output, uri.output.list[[i]]$data12.enrich$merge1,
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
39 uri.output.list[[i]]$data12.enrich$merge2) # reverse =T for error rate
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
40
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
41 # URI for all peaks
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
42 uri.list[[i]] <- uri.output$uri.n
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
43 # URI for matched peaks
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
44 uri.match <- get.uri.matched(em.output$data.pruned, df=df.txt)
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
45 uri.list.match[[i]] <- uri.match$uri.n
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
46
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
47 file.name <- unlist(strsplit(as.character(saved.file.prefix[i]), "/"))
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
48
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
49 legend.txt[i] <- paste(i, "=", file.name[length(file.name)])
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
50
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
51 }
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
52
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
53 plot.uri.file <- paste(output.file.prefix, "-plot.ps", sep="")
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
54
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
55 ############# plot and report output
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
56 # plot correspondence curve for each pair,
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
57 # plot number of selected peaks vs IDR
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
58 # plot all into 1 file
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
59 postscript(paste(output.file.prefix, "-plot.ps", sep=""))
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
60 par(mfcol=c(2,3), mar=c(5,6,4,2)+0.1)
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
61 plot.uri.group(uri.list, NULL, file.name=NULL, c(1:npair), title.txt="all peaks")
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
62 plot.uri.group(uri.list.match, NULL, file.name=NULL, c(1:npair), title.txt="matched peaks")
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
63 plot.ez.group(ez.list, plot.dir=NULL, file.name=NULL, legend.txt=c(1:npair), y.lim=c(0, 0.6))
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
64 plot(0, 1, type="n", xlim=c(0,1), ylim=c(0,1), xlab="", ylab="", xaxt="n", yaxt="n") # legends
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
65 legend(0, 1, legend.txt, cex=0.6)
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
66
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
67 dev.off()
d3b45fab16f8 Uploaded
modencode-dcc
parents:
diff changeset
68