annotate QDNAseq.R @ 75:defea65cad01 draft

Uploaded
author stef
date Thu, 06 Nov 2014 05:10:48 -0500
parents 0feb7fa37245
children 4588384edba1
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
1 #!/usr/bin/Rscript
336697c6f7fa Uploaded
stef
parents:
diff changeset
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
3 ## --------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
4 ## prints all arguments as msg
336697c6f7fa Uploaded
stef
parents:
diff changeset
5 ## --------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
6 catMsg <- function( msg=c() ){
336697c6f7fa Uploaded
stef
parents:
diff changeset
7 cat( MAIN_NAME, paste( msg, collapse="" ), "\n", sep='')
336697c6f7fa Uploaded
stef
parents:
diff changeset
8 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
9 ## --------------------
28
40ae95ad9d8c Uploaded
stef
parents: 26
diff changeset
10 ## return the location of this script
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
11 ## --------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
12 getScriptPath <- function(){
336697c6f7fa Uploaded
stef
parents:
diff changeset
13 cmd.args <- commandArgs()
336697c6f7fa Uploaded
stef
parents:
diff changeset
14 m <- regexpr("(?<=^--file=).+", cmd.args, perl=TRUE)
336697c6f7fa Uploaded
stef
parents:
diff changeset
15 script.dir <- dirname(regmatches(cmd.args, m))
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
16 if( length(script.dir) == 0 ) stop("[ERR] Can't determine script dir: please call the script with Rscript\n")
4351c7715275 Uploaded
stef
parents: 40
diff changeset
17 if( length(script.dir) > 1 ) stop("[ERR] Can't determine script dir: more than one '--file' argument detected\n")
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
18 return(script.dir)
336697c6f7fa Uploaded
stef
parents:
diff changeset
19 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
20 ## --------------------
28
40ae95ad9d8c Uploaded
stef
parents: 26
diff changeset
21 ## Some html creation functions
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
22 ## --------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
23 htmlTableRow <- function( string_array=c() ){
336697c6f7fa Uploaded
stef
parents:
diff changeset
24 td_cells <- ''
336697c6f7fa Uploaded
stef
parents:
diff changeset
25 for ( i in string_array ){
336697c6f7fa Uploaded
stef
parents:
diff changeset
26 td_cells <- paste( td_cells, '<td>', i, '</td>', sep='' )
336697c6f7fa Uploaded
stef
parents:
diff changeset
27 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
28 return( paste( "<tr>", td_cells, "</tr>") )
336697c6f7fa Uploaded
stef
parents:
diff changeset
29 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
30 htmlLink <- function( path, desc="LINK" ){
336697c6f7fa Uploaded
stef
parents:
diff changeset
31 return( paste( '<a href="', path, '">', desc, "</a>", sep='') )
336697c6f7fa Uploaded
stef
parents:
diff changeset
32 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
33 ## --------------------
28
40ae95ad9d8c Uploaded
stef
parents: 26
diff changeset
34 ## constructs a list with input bam file info
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
35 ## --------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
36 makeBamFileList <- function( paths, names ){
336697c6f7fa Uploaded
stef
parents:
diff changeset
37 tmp <- list()
336697c6f7fa Uploaded
stef
parents:
diff changeset
38 l1 <- length(paths)
336697c6f7fa Uploaded
stef
parents:
diff changeset
39 l2 <- length(names)
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
40 if ( l1 != l2 ) stop( "Unequal amount of bam-paths (", l1, ") and -names (", l2, ") in makeBamFileList!!!\n" )
72
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
41 if ( l1 == 0 ){ return(tmp) } # empty list in debug mode
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
42
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
43 for ( i in 1:length(paths) ){
336697c6f7fa Uploaded
stef
parents:
diff changeset
44 path <- paths[i]
336697c6f7fa Uploaded
stef
parents:
diff changeset
45 name <- names[i]
336697c6f7fa Uploaded
stef
parents:
diff changeset
46 file <- basename(path)
336697c6f7fa Uploaded
stef
parents:
diff changeset
47
336697c6f7fa Uploaded
stef
parents:
diff changeset
48 tmp[[ file ]] <- name
336697c6f7fa Uploaded
stef
parents:
diff changeset
49 tmp[[ 'all_paths' ]] <- c( tmp[[ 'all_paths' ]], path )
336697c6f7fa Uploaded
stef
parents:
diff changeset
50 tmp[[ 'all_files' ]] <- c( tmp[[ 'all_files' ]], file )
336697c6f7fa Uploaded
stef
parents:
diff changeset
51 tmp[[ 'all_names' ]] <- c( tmp[[ 'all_names' ]], name )
336697c6f7fa Uploaded
stef
parents:
diff changeset
52 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
53 return( tmp )
336697c6f7fa Uploaded
stef
parents:
diff changeset
54 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
55
336697c6f7fa Uploaded
stef
parents:
diff changeset
56 ## --------------------
28
40ae95ad9d8c Uploaded
stef
parents: 26
diff changeset
57 ## copied code for extracting the regions by segment call status
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
58 ## --------------------
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
59 fuseRegions <- function( obj, minRatio=0 ) {
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
60 if ( ncol(obj) > 1 ) stop('Please specify which sample...')
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
61
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
62 data <- data.frame( obj@featureData@data[,1:3], copynumber(obj), segmented(obj), check.names=FALSE, stringsAsFactors=FALSE)
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
63 colnames( data ) <- c( "chr", "start", "end", "log2", "segmentval" )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
64
336697c6f7fa Uploaded
stef
parents:
diff changeset
65 fused.data <- data.frame()
336697c6f7fa Uploaded
stef
parents:
diff changeset
66 curr.bin <- 1
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
67 for ( chr in unique( data$chr ) ) {
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
68 chr.data <- data[ data$chr == chr, ]
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
69 prev.bin <- curr.bin
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
70 prev.log2 <- chr.data[ 1, 'log2' ]
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
71 prev.segm <- chr.data[ 1, 'segmentval' ]
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
72 start <- chr.data[ 1, 'start' ]
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
73
336697c6f7fa Uploaded
stef
parents:
diff changeset
74 if ( nrow(chr.data) > 1) {
336697c6f7fa Uploaded
stef
parents:
diff changeset
75 for ( i in 2:nrow(chr.data) ) {
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
76 curr.bin <- curr.bin + 1
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
77 curr.segm <- chr.data[ i, 'segmentval']
336697c6f7fa Uploaded
stef
parents:
diff changeset
78
336697c6f7fa Uploaded
stef
parents:
diff changeset
79 if ( curr.segm != prev.segm ) {
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
80 fused.data <- rbind( fused.data, data.frame( chr=chr, start=start, end=chr.data[ i-1, 'end'], segmentval=round(prev.segm, digits=DECIMALS) ) )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
81 prev.segm <- curr.segm
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
82 prev.bin <- curr.bin
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
83 start <- chr.data[ i, 'start']
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
84 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
85 }
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
86 fused.data <- rbind( fused.data, data.frame( chr=chr, start=start, end=chr.data[ i-1, 'end'], segmentval=round(prev.segm, digits=DECIMALS) ) )
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
87 }else{
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
88 fused.data <- rbind( fused.data, data.frame( chr=chr, start=start, end=chr.data[ i-1, 'end'], segmentval=round(prev.segm, digits=DECIMALS) ) )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
89 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
90 }
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
91 ## remove regions with low amplitude
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
92 fused.data <- fused.data[ abs(fused.data$segmentval) >= minRatio, ]
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
93 fused.data
336697c6f7fa Uploaded
stef
parents:
diff changeset
94 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
95
336697c6f7fa Uploaded
stef
parents:
diff changeset
96 ## DESC: takes the output of fuse.regions and outputs a txt file per sample
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
97 outputRegionsFromList <- function ( regionsList, outputBasename, outputDir="./", binSize, storeList ){
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
98 if ( missing(regionsList) ) stop( 'Please provide regionsList...' )
336697c6f7fa Uploaded
stef
parents:
diff changeset
99 if ( missing(outputBasename) ) stop( 'Please provide outputBasename...' )
336697c6f7fa Uploaded
stef
parents:
diff changeset
100 if ( !is.list(regionsList) ) stop( 'Input not a list...?' )
336697c6f7fa Uploaded
stef
parents:
diff changeset
101 if ( length(regionsList) < 1 ) stop( 'List seems empty...?' )
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
102 if ( file.exists( outputDir ) ) catMsg( c(" Using dir ", outputDir, " for output") )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
103 else dir.create( outputDir )
336697c6f7fa Uploaded
stef
parents:
diff changeset
104
336697c6f7fa Uploaded
stef
parents:
diff changeset
105 ## have to set R output options otherwise scientific method is used at some point
336697c6f7fa Uploaded
stef
parents:
diff changeset
106 options( "scipen"=100 )
336697c6f7fa Uploaded
stef
parents:
diff changeset
107
336697c6f7fa Uploaded
stef
parents:
diff changeset
108 sampleCount <- length( regionsList )
336697c6f7fa Uploaded
stef
parents:
diff changeset
109 sampleNames <- names( regionsList )
336697c6f7fa Uploaded
stef
parents:
diff changeset
110 bedgraphColumns <- c( 'chr', 'start', 'end', 'segmentval' )
30
647143d0c884 Uploaded
stef
parents: 29
diff changeset
111
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
112 catMsg( c( " There are ", sampleCount, " samples found in input list") )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
113
336697c6f7fa Uploaded
stef
parents:
diff changeset
114 for ( sample in sampleNames ){
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
115 catMsg( c(" Working on sample ", sample ) )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
116 regionCount <- nrow( regionsList[[sample]] )
336697c6f7fa Uploaded
stef
parents:
diff changeset
117
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
118 outSampleBase <- paste( outputBasename, '_', sample, '_', binSize, 'kbp', sep='')
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
119 outBedgraphFile <- paste( outSampleBase, '.bedGraph', sep="" )
336697c6f7fa Uploaded
stef
parents:
diff changeset
120 outBedgraphPath <- paste( outputDir, '/', outBedgraphFile, sep="" )
336697c6f7fa Uploaded
stef
parents:
diff changeset
121
336697c6f7fa Uploaded
stef
parents:
diff changeset
122 ## ---------- BEDGRAPH ----------
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
123 txt <- paste( "track type=bedGraph color=0,100,0 altColor=255,0,0 name=", sample," description=segmented_regions_from_QDNAseq_",binSize,"kbp\n", sep="")
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
124 sink( outBedgraphPath )
336697c6f7fa Uploaded
stef
parents:
diff changeset
125 cat( txt )
336697c6f7fa Uploaded
stef
parents:
diff changeset
126 sink()
336697c6f7fa Uploaded
stef
parents:
diff changeset
127 write.table( regionsList[[sample]][,bedgraphColumns], outBedgraphPath, quote=F, sep="\t", row.names=F, append=T, col.names=F)
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
128 #outFiles[[sample]] <- c( outBedgraphFile )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
129 storeList[[ paste( binSize, sample, 'bedgraph', sep="_")]] <- outBedgraphFile
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
130 }
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
131 return(storeList)
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
132 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
133
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
134
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
135 ## ==================================================
336697c6f7fa Uploaded
stef
parents:
diff changeset
136 ## Start of analysis
336697c6f7fa Uploaded
stef
parents:
diff changeset
137 ## ==================================================
74
0feb7fa37245 Uploaded
stef
parents: 73
diff changeset
138 ## ==================================================
0feb7fa37245 Uploaded
stef
parents: 73
diff changeset
139 ## Start of analysis
0feb7fa37245 Uploaded
stef
parents: 73
diff changeset
140 ## ==================================================
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
141 MAIN_NAME <- '[INFO] '
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
142 catMsg( "Starting QDNAseq wrapper" )
336697c6f7fa Uploaded
stef
parents:
diff changeset
143 catMsg( "Loading R libraries" )
73
4db025c51b6e Uploaded
stef
parents: 72
diff changeset
144 catMsg( R.version.string )
4db025c51b6e Uploaded
stef
parents: 72
diff changeset
145
74
0feb7fa37245 Uploaded
stef
parents: 73
diff changeset
146 ## supress msg to allow R to finish with non-error msg
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
147 suppressWarnings( suppressMessages( library( QDNAseq, quietly = TRUE ) ) )
336697c6f7fa Uploaded
stef
parents:
diff changeset
148 suppressWarnings( suppressMessages( library( CGHcall, quietly = TRUE ) ) )
25
8509c112abaa Uploaded
stef
parents: 2
diff changeset
149
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
150 ## only one param: the tmp config file
336697c6f7fa Uploaded
stef
parents:
diff changeset
151 cmdLineArgs <- commandArgs(TRUE)
336697c6f7fa Uploaded
stef
parents:
diff changeset
152 config <- cmdLineArgs[1]
74
0feb7fa37245 Uploaded
stef
parents: 73
diff changeset
153 TOOL_PATH <- cmdLineArgs[2]
0feb7fa37245 Uploaded
stef
parents: 73
diff changeset
154 CSS_FILE <- paste( TOOL_PATH, '/static/css/QDNAseq.css', sep="" )
0feb7fa37245 Uploaded
stef
parents: 73
diff changeset
155 DECIMALS <- 3
0feb7fa37245 Uploaded
stef
parents: 73
diff changeset
156 WEB_LINK <- 'http://www.bioconductor.org/packages/release/bioc/html/QDNAseq.html'
0feb7fa37245 Uploaded
stef
parents: 73
diff changeset
157 PURE_CSS <- 'http://yui.yahooapis.com/pure/0.5.0/pure-min.css'
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
158
336697c6f7fa Uploaded
stef
parents:
diff changeset
159 ## sourcing the config file will load all input params
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
160 ## many variables are imported via sourced "config"
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
161 source( config )
336697c6f7fa Uploaded
stef
parents:
diff changeset
162
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
163 ## desparate tries to make png text scale well, damn you R...!
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
164 PLOT_RES <- min( PLOT_WIDTH, PLOT_HEIGHT ) / 6.3
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
165 PAR_SET <- list( pch=22 )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
166
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
167 systemUser <- system("whoami",T)
4351c7715275 Uploaded
stef
parents: 40
diff changeset
168 qdnaseqVersion <- packageDescription( "QDNAseq" )$Version
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
169 rVersion <- R.version.string
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
170 startTime <- Sys.time()
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
171 analysisStart <- as.character( startTime )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
172 catMsg( c("QDNAseq version: ", qdnaseqVersion) )
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
173 catMsg( c( rVersion ) )
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
174
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
175 ## get the comma separated list of chromosomes to exclude
336697c6f7fa Uploaded
stef
parents:
diff changeset
176 excludeChrs <- unlist( strsplit( excludeChrsString, ",") )
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
177 binSizes <- as.numeric( unlist( strsplit( binSizesString, ",") ) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
178
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
179
336697c6f7fa Uploaded
stef
parents:
diff changeset
180 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
181 ## DEBUG
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
182 if ( debug ){
72
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
183 catMsg( c("Analysis run by user: ", systemUser ) )
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
184 catMsg( c("DEBUG SessionInfo: " ) )
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
185 print( sessionInfo() )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
186 }
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
187 ## /DEBUG
336697c6f7fa Uploaded
stef
parents:
diff changeset
188 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
189
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
190 ## prepare output dir
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
191 if ( !file.exists( outputPath) ){
336697c6f7fa Uploaded
stef
parents:
diff changeset
192 dir.create( outputPath )
336697c6f7fa Uploaded
stef
parents:
diff changeset
193 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
194
336697c6f7fa Uploaded
stef
parents:
diff changeset
195 ## copy source config file to output dir to include it in output zip
72
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
196 if ( inGalaxy ){
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
197 file.copy( config, paste(outputPath, 'galaxyConfigFile.R', sep='/') )
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
198 }
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
199
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
200 ## setup bam filelist for easy retrieval later
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
201 fileList <- makeBamFileList( bamsPaths, bamsNames )
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
202 bamCount <- length( fileList[[ 'all_paths' ]] )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
203
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
204 gzipOutputName <- paste( 'QDNAseqResults_', outputName, '.zip', sep='' )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
205 gzipOutputPath <- paste( outputPath, '/', gzipOutputName, sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
206 htmlOutputName <- 'index.html'
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
207 htmlOutputPath <- paste( outputPath, '/', htmlOutputName, sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
208
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
209 plotted_images <- list() # to keep track of images for later linking
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
210 regions <- list() # will contain the segments
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
211 outputFiles <- list()
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
212
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
213 ## ------------------------
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
214 ## in case of debug just use inbuilt LGG data for speedup
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
215 if ( debug ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
216 binSizes <- c(15)
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
217 bamsPaths <- c( "BUILD_IN_DATA")
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
218 bamsNames <- c( "LGG150")
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
219 fileList <- makeBamFileList( bamsPaths, bamsNames )
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
220 bamCount <- length( fileList[[ 'all_paths' ]] )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
221 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
222
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
223 for ( binSize in binSizes ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
224
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
225 ## ------------------------
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
226 ## construct output file-names and -paths
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
227 ## ------------------------
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
228 robjReadCoName <- paste( binSize, 'kbp_QDNAseqReadCounts.rds', sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
229 robjCopyNrName <- paste( binSize, 'kbp_QDNAseqCopyNumbers.rds', sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
230 igvCopyNrName <- paste( binSize, 'kbp_QDNAseqCopyNumbers.igv', sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
231 robjSegmntName <- paste( binSize, 'kbp_QDNAseqCopyNumbersSegmented.rds', sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
232 regiOutputName <- paste( binSize, 'kbp_QDNAseqRegions.rds', sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
233 noiseImgName <- paste( binSize, 'kbp_QDNAseqNoiseplot.png', sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
234
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
235 robjReadCoPath <- paste( outputPath, '/', robjReadCoName, sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
236 robjCopyNrPath <- paste( outputPath, '/', robjCopyNrName, sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
237 robjSegmntPath <- paste( outputPath, '/', robjSegmntName, sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
238 robjRegionPath <- paste( outputPath, '/', regiOutputName, sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
239 igvCopyNrPath <- paste( outputPath, '/', igvCopyNrName, sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
240 noiseImgPath <- paste( outputPath, '/', noiseImgName, sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
241
72
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
242 binAnnFile <- paste( TOOL_PATH, '/static/binannotation/', binSize, 'kbp_binAnnotations.rds', sep="" )
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
243 if ( file.exists(binAnnFile) ){
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
244 binAnnotations <- readRDS( binAnnFile )
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
245 catMsg( c("Using local binAnnotations file" ) )
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
246 }else{
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
247 binAnnotations <- getBinAnnotations( binSize=binSize, type=experimentType )
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
248 }
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
249
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
250 ## in case of debug just use inbuilt LGG data for speedup
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
251 if ( debug ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
252 data(LGG150)
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
253 readCounts <- LGG150
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
254 }else{
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
255 ## provide bamnames because in galaxy everyting is called "dataset_###"
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
256 readCounts <- binReadCounts( binAnnotations, bamfiles=fileList[[ 'all_paths' ]], bamnames=fileList[[ 'all_names' ]] )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
257 }
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
258
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
259 readCountsFiltered <- applyFilters( readCounts, residual=TRUE, blacklist=filterBlacklistedBins, mappability=mappabilityCutoff, chromosomes=excludeChrs )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
260 readCountsFiltered <- estimateCorrection( readCountsFiltered )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
261 copyNumbers <- correctBins( readCountsFiltered )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
262 copyNumbersNormalized <- normalizeBins( copyNumbers )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
263 copyNumbersSmooth <- smoothOutlierBins( copyNumbersNormalized )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
264 sampleNames <- readCountsFiltered@phenoData@data$name
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
265
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
266 ## save objects to output dir
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
267 saveRDS( readCountsFiltered, robjReadCoPath );
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
268 saveRDS( copyNumbersSmooth, robjCopyNrPath );
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
269 exportBins( copyNumbersSmooth, file=igvCopyNrPath, format="igv" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
270
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
271 ## also save objects for galaxy history output if requested
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
272 if ( doOutputCopynumbersIgv ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
273 #@ a bit hacky galaxy way to allow an unknown number of output files based on param selection
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
274 #@ see: https://wiki.galaxyproject.org/Admin/Tools/Multiple%20Output%20Files
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
275 historyName <- paste(binSize, 'kbp-IGV', sep="")
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
276 igvFile <- paste( newFilePath, "/primary_", outputId, "_", historyName, "_visible_txt", sep="" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
277 exportBins( copyNumbersSmooth, file=igvFile, format="igv" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
278 catMsg( c("Exported igv file to history for ", binSize, "kbp bin") )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
279 }
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
280
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
281 ## proceed with calling if requested
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
282 if ( doSegment ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
283 copyNumbersSegmented <- segmentBins( copyNumbersSmooth, undo.splits=undoSplits, undo.SD=undoSD )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
284 copyNumbersSegmented <- normalizeSegmentedBins( copyNumbersSegmented )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
285 cgh <- makeCgh( copyNumbersSegmented )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
286 saveRDS( copyNumbersSegmented, robjSegmntPath );
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
287 }
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
288
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
289 ## ------------------------
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
290 ## create output files
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
291 ## ------------------------
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
292 png( noiseImgPath, width=PLOT_HEIGHT, height=PLOT_HEIGHT, res=PLOT_RES );
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
293 par( PAR_SET )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
294 noisePlot( readCountsFiltered, main=paste( "Noise Plot ", binSize, "kbp", sep=''), col="darkgreen" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
295 dev.off()
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
296
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
297 binSize <- as.character( binSize ) # to avoid R using it as array index... (*#$^@ you R!)
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
298 binSizeString <- paste( binSize, 'kbp', sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
299
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
300 for (i in 1:length(sampleNames) ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
301
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
302 sample <- sampleNames[i]
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
303 usedReads <- readCountsFiltered@phenoData@data$used.reads[i]
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
304 catMsg( c("Creating plots for sample: ", sample, " (", binSizeString, ")" ) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
305
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
306 type <- 'CopyNumbers'
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
307 img_file <- paste( sample, '_', binSize, 'kbp_QDNAseq', type, '.png', sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
308 img_file_path <- paste( outputPath, '/', img_file, sep='' )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
309
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
310 ## COPYNUMBER PLOT
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
311 png( img_file_path, width=PLOT_WIDTH, height=PLOT_HEIGHT, res=PLOT_RES );
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
312 par( PAR_SET )
68
68a090cffb6f Uploaded
stef
parents: 67
diff changeset
313 plot( copyNumbersSmooth[ ,sample ], main=paste(sample, ": CopyNumbers", sep="") )
69
b4477584bb03 Uploaded
stef
parents: 68
diff changeset
314 mtext( paste( binSizeString, " bins", sep=""), 3 )
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
315 abline( h=c(-2,-1,1,2,3,4), lty=1, lwd=0.5, col="grey" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
316 dev.off()
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
317
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
318 plotted_images[[ paste(binSize, sample, type, sep="_" ) ]] <- img_file
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
319
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
320 if ( doSegment ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
321 type <- 'Segmented'
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
322 img_file <- paste( sample, '_', binSize, 'kbp_QDNAseq', type, '.png', sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
323 img_file_path <- paste( outputPath, '/', img_file, sep='' )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
324
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
325 ## COPYNUMBER PLOT
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
326 png( img_file_path, width=PLOT_WIDTH, height=PLOT_HEIGHT, res=PLOT_RES );
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
327 par( PAR_SET )
69
b4477584bb03 Uploaded
stef
parents: 68
diff changeset
328 plot( copyNumbersSegmented[ ,sample ], main=paste(sample, ": CopyNumbers and Segments", sep="") )
b4477584bb03 Uploaded
stef
parents: 68
diff changeset
329 mtext( paste( "(", binSizeString, " bins)", sep=""), 3 )
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
330 abline( h=c(-2,-1,1,2,3,4), lty=1, lwd=0.5, col="grey" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
331 dev.off()
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
332
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
333 plotted_images[[ paste(binSize, sample, type, sep="_" ) ]] <- img_file
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
334
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
335 catMsg( c(" Fusing regions of sample: ", sample) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
336 regions[[ sample ]] <- fuseRegions( cgh[, sample] )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
337
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
338 region_count <- nrow( data.frame( regions[[ sample ]] ) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
339 catMsg( c( ' sample "', sample, '" has ', region_count, " regions" ) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
340 plotted_images[[ paste(binSize, sample, 'region_count', sep="_" ) ]] <- region_count
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
341 }
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
342
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
343 ## add USED read counts
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
344 plotted_images[[ paste(binSize, sample, 'usedReads', sep="_" ) ]] <- usedReads
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
345 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
346
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
347 if ( doSegment ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
348 saveRDS( regions, robjRegionPath )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
349 plotted_images <- outputRegionsFromList( regions, outputBasename=outputName, outputDir=outputPath, binSize=binSize, storeList=plotted_images )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
350 }
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
351 }# end bin
28
40ae95ad9d8c Uploaded
stef
parents: 26
diff changeset
352
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
353
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
354 ## ----- debug -----
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
355 #catMsg( "done" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
356 #q(status=0)
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
357 ## ---- /debug -----
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
358
336697c6f7fa Uploaded
stef
parents:
diff changeset
359
336697c6f7fa Uploaded
stef
parents:
diff changeset
360 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
361 ## prepare output
336697c6f7fa Uploaded
stef
parents:
diff changeset
362 ## ------------------------
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
363 catMsg( "...zipping output")
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
364 zip_cmd <- paste( "zip -j", gzipOutputPath, paste(outputPath,'/*',sep='') ) ## -j is for removing dirs from the tree
336697c6f7fa Uploaded
stef
parents:
diff changeset
365 system( zip_cmd )
336697c6f7fa Uploaded
stef
parents:
diff changeset
366
336697c6f7fa Uploaded
stef
parents:
diff changeset
367 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
368 ## get filesizes for report
336697c6f7fa Uploaded
stef
parents:
diff changeset
369 ## ------------------------
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
370 zippedSize <- paste( round( file.info( gzipOutputPath )[["size"]] / 1e+6, digits=2 ), 'MB' )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
371 endTime <- Sys.time()
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
372 timeDiff <- format( round( endTime - startTime, 3 ) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
373 analysisEnd <- as.character( endTime )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
374
336697c6f7fa Uploaded
stef
parents:
diff changeset
375 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
376 ## creating html output to be linked to from the middle galaxy pane
336697c6f7fa Uploaded
stef
parents:
diff changeset
377 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
378 sink( file = htmlOutputPath, type = "output" )
336697c6f7fa Uploaded
stef
parents:
diff changeset
379 cat( "<html>\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
380 cat( "<head>\n")
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
381
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
382 cat( "\t", '<title>QDNAseq Report | ', outputName,'</title>', "\n", sep='' )
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
383 cat( "\t", '<link rel="stylesheet" href="', PURE_CSS, '">', "\n", sep='' )
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
384 cat( "\t<style>\n", sep='')
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
385 ## include CSS into html file, makes it more portable
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
386 cat( "\t\t", readLines( CSS_FILE ), sep="\n\t\t" )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
387 #cat( "\t\th1 {color:red;}", "\n")
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
388 cat( "\n\t</style>\n" )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
389
336697c6f7fa Uploaded
stef
parents:
diff changeset
390 cat( "\n</head>\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
391 cat( "\n<body>\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
392
336697c6f7fa Uploaded
stef
parents:
diff changeset
393 cat( "<h1>QDNAseq Report</h1>", "\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
394
336697c6f7fa Uploaded
stef
parents:
diff changeset
395 cat( '<h3 class="qdnaseq">About this analysis</h3>', "\n")
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
396 cat( '<p>This page provides access to all results. To have a local copy of this report just download the <a href="', gzipOutputName, '" class="button">zipfile</a> with all output (', zippedSize, ')</p>', "\n", sep='')
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
397
336697c6f7fa Uploaded
stef
parents:
diff changeset
398 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
399 ## table with general info
336697c6f7fa Uploaded
stef
parents:
diff changeset
400 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
401 cat( '<h3 class="qdnaseq">Settings</h3><p>', "\n")
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
402 cat( '<table class="pure-table pure-table-striped"><tbody>' )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
403 cat( htmlTableRow( c( "AnalysisName", outputName ) ) )
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
404 cat( htmlTableRow( c( "AnalysisStart", analysisStart ) ) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
405 cat( htmlTableRow( c( "AnalysisEnd", analysisEnd ) ) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
406 cat( htmlTableRow( c( "AnalysisTime", timeDiff ) ) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
407 cat( htmlTableRow( c( "BinSizes (kbp)", paste(binSizes,collapse=", ") ) ) )
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
408 cat( htmlTableRow( c( "R info", rVersion ) ) )
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
409 cat( htmlTableRow( c( "QDNAseq info", qdnaseqVersion ) ) )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
410
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
411 sampleStrings <- c()
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
412 for ( galaxyName in fileList[[ 'all_files' ]] ){
336697c6f7fa Uploaded
stef
parents:
diff changeset
413 sampleName <- fileList[[ galaxyName ]]
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
414 sampleStrings <- c( sampleStrings, paste( galaxyName, ' (', sampleName, ')', sep='' ) )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
415 }
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
416 cat( htmlTableRow( c( "InputBams", paste( sampleStrings, collapse=", ") ) ) )
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
417
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
418 cat( "</tbody></table></p>", "\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
419
336697c6f7fa Uploaded
stef
parents:
diff changeset
420 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
421 ## list with links to all output files
336697c6f7fa Uploaded
stef
parents:
diff changeset
422 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
423 cat( '<h3 class="qdnaseq">Output files</h3><p>', "\n")
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
424 cat( '<p>This table contains output files that can be used for local downstream analysis with the bioconductor QDNAseq package. For each bin-size / data-level there is a R data structure file with data of all samples. See ', htmlLink( WEB_LINK, 'the bioconductor QDNAseq documentation' ), ' for more information on how to work with these files</p>', "\n", sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
425 cat( '<table class="pure-table pure-table-striped">', "\n" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
426 cat( '<thead><th>Type</th>', as.vector( mapply( paste, "<th>", binSizes, "kbp</th>", sep="" ) ),'</thead>', "\n" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
427 cat( "<tbody>", "\n")
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
428 files <- list()
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
429 fileTypes <- c( 'ReadCounts.rds', 'CopyNumbers.rds' )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
430 if ( doSegment ){ fileTypes <- c( fileTypes, 'CopyNumbersSegmented.rds') }
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
431
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
432 for ( fileType in fileTypes ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
433 fileNames <- mapply( paste, binSizes, paste( 'kbp_QDNAseq', fileType, sep=''), sep='')
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
434 fileLinks <- mapply( htmlLink, fileNames, paste( binSizes, "kbp", sep="" ) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
435 cat( htmlTableRow( c( fileType, fileLinks ) ) )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
436 }
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
437 cat( "\n</tbody></table></p>", "\n")
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
438
336697c6f7fa Uploaded
stef
parents:
diff changeset
439 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
440 ## table with links to files
336697c6f7fa Uploaded
stef
parents:
diff changeset
441 ## ------------------------
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
442 ratio <- PLOT_WIDTH / PLOT_HEIGHT
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
443 width <- 960; height <- width / ratio ## bigger img
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
444 width_t <- 100; height_t <- 40 ## thumb img
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
445
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
446 cat( '<h3 class="qdnaseq">Results: overview</h3><p>', "\n")
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
447 cat( '<p>This table contains the visual results of the copy number aberration analysis. You can click on an image to jump to the larger version. If segmentation was performed as well the number of segments is shown and a file with genomic regions can be downloaded (just remember to inspect the results carefully as this is a more exprimental step).</p>', "\n", sep='')
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
448 plots_html <- ''
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
449
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
450 colspan <- 1
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
451 binHeader <- "<th>Image</th>"
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
452 if ( doSegment ){ # extra column with segment info
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
453 colspan <- 2
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
454 binHeader <- "<th>Image</th><th>Segments</th>"
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
455 }
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
456 cat( '<table class="pure-table pure-table-striped">', "\n" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
457 cat( '<thead><tr><th></th><th></th>', as.vector( mapply( paste, "<th colspan=\"", colspan,"\">", binSizes, "kbp</th>", sep="" ) ), '</tr></thead>' )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
458 cat( '<thead><tr><th>Sample / File</th><th>Reads</th>', rep( binHeader, length(binSizes) ), '</tr></thead>' )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
459 cat( '<tbody>' )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
460
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
461 for ( bam_file in bamsNames ){
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
462
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
463 usedReads <- plotted_images[[ paste(binSize, bam_file, 'usedReads', sep="_" ) ]]
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
464 usedReads <- format( as.integer(usedReads), digits=4, decimal.mark=".", big.mark="," )
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
465 htmlRow <- paste( '<tr><td>', bam_file, '</td><td>', usedReads, '</td>', sep='' )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
466
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
467 for ( binSize in binSizes ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
468
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
469 ## add thumbnails to table with links to anchors on html page
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
470 copy_img <- plotted_images[[ paste(binSize, bam_file, 'CopyNumbers', sep="_" ) ]]
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
471 html_copy_thumb <- htmlLink( path=paste('#', copy_img, sep=''), paste('<img src="',copy_img,'" alt="', bam_file, '" width="', width_t, '" height="', height_t, '">', sep='') )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
472 html_copy_img <- htmlLink( path=copy_img, paste('<img id="', copy_img,'" src="',copy_img,'" alt="',bam_file, '" width="', width, '" height="', height, '">', sep='') )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
473 html_segm_img <- ''
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
474 html_bedGraph <- ''
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
475 region_count <- ''
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
476 htmlRow <- paste( htmlRow, '<td>', html_copy_thumb, '</td>' )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
477
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
478 if ( doSegment ){
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
479 segm_img <- plotted_images[[ paste(binSize, bam_file, 'Segmented', sep="_" ) ]]
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
480 region_count <- plotted_images[[ paste(binSize, bam_file, 'region_count', sep="_" ) ]]
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
481
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
482 html_bedGraph <- htmlLink( path=plotted_images[[ paste(binSize, bam_file, 'bedgraph', sep="_" ) ]], 'bedGraph' )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
483 html_segm_img <- htmlLink( path=segm_img, paste('<img id="', segm_img,'" src="', segm_img,'" alt="', bam_file, '" width="', width, '" height="', height,'">', sep='') )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
484 htmlRow <- paste( htmlRow, '<td>', region_count, ' (', html_bedGraph, ')</td>', sep="" )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
485 }
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
486 plots_html <- paste( plots_html, html_copy_img, "\n", html_segm_img, "\n<br \\>\n", sep='' )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
487 }
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
488 plots_html <- paste( plots_html, "\n<hr \\>\n", sep='' )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
489 ## add info to overview table, including small thumbnails
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
490 htmlRow <- paste( htmlRow, '</tr>', sep='' )
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
491 cat( htmlRow, "\n" )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
492 }
336697c6f7fa Uploaded
stef
parents:
diff changeset
493 cat( "</tbody></table></p>", "\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
494
336697c6f7fa Uploaded
stef
parents:
diff changeset
495 ## ------------------------
336697c6f7fa Uploaded
stef
parents:
diff changeset
496 ## section with various output shown
336697c6f7fa Uploaded
stef
parents:
diff changeset
497 ## ------------------------
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
498 cat( '<h3 class="qdnaseq">Results: Sample plots</h3><p>', "\n")
64
2f0af8970aea Uploaded
stef
parents: 59
diff changeset
499 ## now include (large) images in html page
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
500 cat( plots_html, "\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
501 cat( "\n</p></body>\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
502 cat( "\n</html>\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
503 sink()
336697c6f7fa Uploaded
stef
parents:
diff changeset
504
336697c6f7fa Uploaded
stef
parents:
diff changeset
505 ## ------------------------
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
506 ## creating main html output for galaxy history
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
507 ## ------------------------
72
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
508 if ( inGalaxy ){ # dont create when running outside Galaxy
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
509 sink( file = outputHtml, type = "output" )
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
510
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
511 cat( "<head>", "\n")
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
512 cat( "\t", '<link rel="stylesheet" href="', PURE_CSS, '">', "\n", sep='' )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
513
336697c6f7fa Uploaded
stef
parents:
diff changeset
514 cat( "<style>", "\n")
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
515 ## include CSS directly into html file
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
516 cat( paste( "\t", '/* the css here originates from ', CSS_FILE,' */', "\n") )
336697c6f7fa Uploaded
stef
parents:
diff changeset
517 cat( paste( "\t", readLines( CSS_FILE, n = -1)), sep="\n" )
336697c6f7fa Uploaded
stef
parents:
diff changeset
518 cat( "</style>", "\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
519 cat( "</head>", "\n")
336697c6f7fa Uploaded
stef
parents:
diff changeset
520
336697c6f7fa Uploaded
stef
parents:
diff changeset
521 cat( '<h1>QDNAseq Results (', outputName,')</h1>', "\n", sep="")
59
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
522 cat( '<p>Explore <a href="', htmlOutputName, '" class="button">the results</a> directly within galaxy</p>', "\n", sep="")
bfe9d9b7e261 Uploaded
stef
parents: 56
diff changeset
523 cat( '<p>Or download a <a href="', gzipOutputName, '" class="button">zipfile</a> with all output (', zippedSize, ')</p>', "\n", sep="" )
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
524
72
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
525 sink()
fb2dfd8ba417 Uploaded
stef
parents: 69
diff changeset
526 }
2
336697c6f7fa Uploaded
stef
parents:
diff changeset
527
42
4351c7715275 Uploaded
stef
parents: 40
diff changeset
528 ## ------------------------
4351c7715275 Uploaded
stef
parents: 40
diff changeset
529 ## create final zip and quit with status 0 to tell galaxy all was fine
4351c7715275 Uploaded
stef
parents: 40
diff changeset
530 ## ------------------------
4351c7715275 Uploaded
stef
parents: 40
diff changeset
531 catMsg( "zipping all output")
4351c7715275 Uploaded
stef
parents: 40
diff changeset
532 system( paste( "zip -j ", gzipOutputPath, paste(outputPath,'/', htmlOutputName, sep='') ) )
4351c7715275 Uploaded
stef
parents: 40
diff changeset
533 catMsg( "done" )
25
8509c112abaa Uploaded
stef
parents: 2
diff changeset
534 q(status=0)