annotate mpagenomics_normalize-7dc6ce39fb89/extractCN.R @ 0:84b13b0e2b85

Uploaded
author sblanck
date Thu, 07 May 2015 08:22:36 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
1 args<-commandArgs(TRUE)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
2
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
3 chrom=args[1]
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
4 dataset=args[2]
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
5 output=args[3]
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
6 tmp_dir=args[4]
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
7 input=args[5]
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
8 tumorcsv=args[6]
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
9 signal=args[7]
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
10 snp=type.convert(args[8])
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
11 user=args[9]
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
12 symmetrize=args[10]
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
13
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
14 library(MPAgenomics)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
15 workdir=file.path(tmp_dir, "mpagenomics",user)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
16 setwd(workdir)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
17
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
18
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
19 if (grepl("all",tolower(chrom)) | chrom=="None") {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
20 chrom_vec=c(1:25)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
21 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
22 chrom_tmp <- strsplit(chrom,",")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
23 chrom_vecstring <-unlist(chrom_tmp)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
24 chrom_vec <- as.numeric(chrom_vecstring)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
25 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
26 if (signal == "CN")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
27 {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
28 if (input == "dataset") {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
29 if (tumorcsv== "None")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
30 {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
31 CN=getCopyNumberSignal(dataset,chromosome=chrom_vec, onlySNP=snp)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
32
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
33 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
34 CN=getCopyNumberSignal(dataset,chromosome=chrom_vec, normalTumorArray=tumorcsv, onlySNP=snp)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
35 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
36 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
37 input_tmp <- strsplit(input,",")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
38 input_tmp_vecstring <-unlist(input_tmp)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
39 input_vecstring = sub("^([^.]*).*", "\\1", input_tmp_vecstring)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
40 if (tumorcsv== "None")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
41 {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
42 CN=getCopyNumberSignal(dataset,chromosome=chrom_vec, listOfFiles=input_vecstring, onlySNP=snp)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
43 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
44 CN=getCopyNumberSignal(dataset,chromosome=chrom_vec, normalTumorArray=tumorcsv, listOfFiles=input_vecstring, onlySNP=snp )
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
45 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
46 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
47
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
48 list_chr=names(CN)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
49 CN_global=data.frame(check.names = FALSE)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
50 for (i in list_chr) {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
51 chr_data=data.frame(CN[[i]],check.names = FALSE)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
52 CN_global=rbind(CN_global,chr_data)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
53 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
54 names(CN_global)[names(CN_global)=="featureNames"] <- "probeName"
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
55 write.table(format(CN_global), output, row.names = FALSE, quote = FALSE, sep = "\t")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
56
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
57 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
58 if (symmetrize=="TRUE") {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
59 if (input == "dataset") {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
60 input_vecstring = getListOfFiles(dataset)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
61 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
62 input_tmp <- strsplit(input,",")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
63 input_tmp_vecstring <-unlist(input_tmp)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
64 input_vecstring = sub("^([^.]*).*", "\\1", input_tmp_vecstring)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
65 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
66
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
67 symFracB_global=data.frame(check.names = FALSE)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
68
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
69 for (currentFile in input_vecstring) {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
70 cat(paste0("extracting signal from ",currentFile,".\n"))
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
71 currentSymFracB=data.frame()
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
72 symFracB=getSymFracBSignal(dataset,chromosome=chrom_vec,file=currentFile,normalTumorArray=tumorcsv)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
73 list_chr=names(symFracB)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
74 for (i in list_chr) {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
75 cat(paste0(" extracting ",i,".\n"))
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
76 chr_data=data.frame(symFracB[[i]]$tumor,check.names = FALSE)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
77 currentSymFracB=rbind(currentSymFracB,chr_data)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
78
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
79 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
80 if (is.null(symFracB_global) || nrow(symFracB_global)==0) {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
81 symFracB_global=currentSymFracB
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
82 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
83 symFracB_global=cbind(symFracB_global,currentFile=currentSymFracB[[3]])
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
84 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
85 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
86 names(symFracB_global)[names(symFracB_global)=="featureNames"] <- "probeName"
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
87
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
88 write.table(format(symFracB_global), output, row.names = FALSE, quote = FALSE, sep = "\t")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
89 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
90 if (input == "dataset") {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
91 if (tumorcsv== "None")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
92 {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
93 fracB=getFracBSignal(dataset,chromosome=chrom_vec)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
94
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
95 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
96 fracB=getFracBSignal(dataset,chromosome=chrom_vec, normalTumorArray=tumorcsv)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
97 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
98 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
99 input_tmp <- strsplit(input,",")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
100 input_tmp_vecstring <-unlist(input_tmp)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
101 input_vecstring = sub("^([^.]*).*", "\\1", input_tmp_vecstring)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
102 if (tumorcsv== "None")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
103 {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
104 fracB=getFracBSignal(dataset,chromosome=chrom_vec, listOfFiles=input_vecstring)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
105 } else {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
106 fracB=getFracBSignal(dataset,chromosome=chrom_vec, normalTumorArray=tumorcsv, listOfFiles=input_vecstring)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
107 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
108 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
109 #formatage des données
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
110 list_chr=names(fracB)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
111 fracB_global=data.frame(check.names = FALSE)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
112 for (i in list_chr) {
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
113 chr_data=data.frame(fracB[[i]]$tumor,check.names = FALSE)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
114 fracB_global=rbind(fracB_global,chr_data)
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
115 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
116 names(fracB_global)[names(fracB_global)=="featureNames"] <- "probeName"
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
117 write.table(format(fracB_global), output, row.names = FALSE, quote = FALSE, sep = "\t")
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
118 }
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
119
84b13b0e2b85 Uploaded
sblanck
parents:
diff changeset
120 }