annotate QDNAseq.R @ 27:f89205f51e27 draft default tip

Uploaded
author stef
date Mon, 06 Jul 2015 05:41:08 -0400
parents 4943308e95fc
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
1 #!/usr/bin/Rscript
d4d58887f008 Uploaded
stef
parents:
diff changeset
2
d4d58887f008 Uploaded
stef
parents:
diff changeset
3 ## --------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
4 ## prints all arguments as msg
d4d58887f008 Uploaded
stef
parents:
diff changeset
5 ## --------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
6 catMsg <- function( msg=c() ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
7 cat( MAIN_NAME, paste( msg, collapse="" ), "\n", sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
8 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
9 ## --------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
10 ## return the location of this script
d4d58887f008 Uploaded
stef
parents:
diff changeset
11 ## --------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
12 getScriptPath <- function(){
d4d58887f008 Uploaded
stef
parents:
diff changeset
13 cmd.args <- commandArgs()
d4d58887f008 Uploaded
stef
parents:
diff changeset
14 m <- regexpr("(?<=^--file=).+", cmd.args, perl=TRUE)
d4d58887f008 Uploaded
stef
parents:
diff changeset
15 script.dir <- dirname(regmatches(cmd.args, m))
d4d58887f008 Uploaded
stef
parents:
diff changeset
16 if( length(script.dir) == 0 ) stop("[ERR] Can't determine script dir: please call the script with Rscript\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
17 if( length(script.dir) > 1 ) stop("[ERR] Can't determine script dir: more than one '--file' argument detected\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
18 return(script.dir)
d4d58887f008 Uploaded
stef
parents:
diff changeset
19 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
20 ## --------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
21 ## Some html creation functions
d4d58887f008 Uploaded
stef
parents:
diff changeset
22 ## --------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
23 htmlTableRow <- function( string_array=c() ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
24 td_cells <- ''
d4d58887f008 Uploaded
stef
parents:
diff changeset
25 for ( i in string_array ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
26 td_cells <- paste( td_cells, '<td>', i, '</td>', sep='' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
27 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
28 return( paste( "<tr>", td_cells, "</tr>") )
d4d58887f008 Uploaded
stef
parents:
diff changeset
29 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
30 htmlLink <- function( path, desc="LINK" ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
31 return( paste( '<a href="', path, '">', desc, "</a>", sep='') )
d4d58887f008 Uploaded
stef
parents:
diff changeset
32 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
33 ## --------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
34 ## constructs a list with input bam file info
d4d58887f008 Uploaded
stef
parents:
diff changeset
35 ## --------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
36 makeBamFileList <- function( paths, names ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
37 tmp <- list()
d4d58887f008 Uploaded
stef
parents:
diff changeset
38 l1 <- length(paths)
d4d58887f008 Uploaded
stef
parents:
diff changeset
39 l2 <- length(names)
d4d58887f008 Uploaded
stef
parents:
diff changeset
40 if ( l1 != l2 ) stop( "Unequal amount of bam-paths (", l1, ") and -names (", l2, ") in makeBamFileList!!!\n" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
41 if ( l1 == 0 ){ return(tmp) } # empty list in debug mode
d4d58887f008 Uploaded
stef
parents:
diff changeset
42
d4d58887f008 Uploaded
stef
parents:
diff changeset
43 for ( i in 1:length(paths) ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
44 path <- paths[i]
d4d58887f008 Uploaded
stef
parents:
diff changeset
45 name <- names[i]
d4d58887f008 Uploaded
stef
parents:
diff changeset
46 file <- basename(path)
d4d58887f008 Uploaded
stef
parents:
diff changeset
47
d4d58887f008 Uploaded
stef
parents:
diff changeset
48 tmp[[ file ]] <- name
d4d58887f008 Uploaded
stef
parents:
diff changeset
49 tmp[[ 'all_paths' ]] <- c( tmp[[ 'all_paths' ]], path )
d4d58887f008 Uploaded
stef
parents:
diff changeset
50 tmp[[ 'all_files' ]] <- c( tmp[[ 'all_files' ]], file )
d4d58887f008 Uploaded
stef
parents:
diff changeset
51 tmp[[ 'all_names' ]] <- c( tmp[[ 'all_names' ]], name )
d4d58887f008 Uploaded
stef
parents:
diff changeset
52 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
53 return( tmp )
d4d58887f008 Uploaded
stef
parents:
diff changeset
54 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
55
d4d58887f008 Uploaded
stef
parents:
diff changeset
56 ## --------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
57 ## copied code for extracting the regions by segment call status
d4d58887f008 Uploaded
stef
parents:
diff changeset
58 ## --------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
59 fuseRegions <- function( obj, minRatio=0 ) {
d4d58887f008 Uploaded
stef
parents:
diff changeset
60 if ( ncol(obj) > 1 ) stop('Please specify which sample...')
d4d58887f008 Uploaded
stef
parents:
diff changeset
61
d4d58887f008 Uploaded
stef
parents:
diff changeset
62 data <- data.frame( obj@featureData@data[,1:3], copynumber(obj), segmented(obj), check.names=FALSE, stringsAsFactors=FALSE)
d4d58887f008 Uploaded
stef
parents:
diff changeset
63 colnames( data ) <- c( "chr", "start", "end", "log2", "segmentval" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
64
d4d58887f008 Uploaded
stef
parents:
diff changeset
65 fused.data <- data.frame()
d4d58887f008 Uploaded
stef
parents:
diff changeset
66 curr.bin <- 1
d4d58887f008 Uploaded
stef
parents:
diff changeset
67 for ( chr in unique( data$chr ) ) {
d4d58887f008 Uploaded
stef
parents:
diff changeset
68 chr.data <- data[ data$chr == chr, ]
d4d58887f008 Uploaded
stef
parents:
diff changeset
69 prev.bin <- curr.bin
d4d58887f008 Uploaded
stef
parents:
diff changeset
70 prev.log2 <- chr.data[ 1, 'log2' ]
d4d58887f008 Uploaded
stef
parents:
diff changeset
71 prev.segm <- chr.data[ 1, 'segmentval' ]
d4d58887f008 Uploaded
stef
parents:
diff changeset
72 start <- chr.data[ 1, 'start' ]
d4d58887f008 Uploaded
stef
parents:
diff changeset
73
d4d58887f008 Uploaded
stef
parents:
diff changeset
74 if ( nrow(chr.data) > 1) {
d4d58887f008 Uploaded
stef
parents:
diff changeset
75 for ( i in 2:nrow(chr.data) ) {
d4d58887f008 Uploaded
stef
parents:
diff changeset
76 curr.bin <- curr.bin + 1
d4d58887f008 Uploaded
stef
parents:
diff changeset
77 curr.segm <- chr.data[ i, 'segmentval']
d4d58887f008 Uploaded
stef
parents:
diff changeset
78
d4d58887f008 Uploaded
stef
parents:
diff changeset
79 if ( curr.segm != prev.segm ) {
d4d58887f008 Uploaded
stef
parents:
diff changeset
80 fused.data <- rbind( fused.data, data.frame( chr=chr, start=start, end=chr.data[ i-1, 'end'], segmentval=round(prev.segm, digits=DECIMALS) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
81 prev.segm <- curr.segm
d4d58887f008 Uploaded
stef
parents:
diff changeset
82 prev.bin <- curr.bin
d4d58887f008 Uploaded
stef
parents:
diff changeset
83 start <- chr.data[ i, 'start']
d4d58887f008 Uploaded
stef
parents:
diff changeset
84 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
85 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
86 fused.data <- rbind( fused.data, data.frame( chr=chr, start=start, end=chr.data[ i-1, 'end'], segmentval=round(prev.segm, digits=DECIMALS) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
87 }else{
d4d58887f008 Uploaded
stef
parents:
diff changeset
88 fused.data <- rbind( fused.data, data.frame( chr=chr, start=start, end=chr.data[ i-1, 'end'], segmentval=round(prev.segm, digits=DECIMALS) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
89 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
90 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
91 ## remove regions with low amplitude
d4d58887f008 Uploaded
stef
parents:
diff changeset
92 fused.data <- fused.data[ abs(fused.data$segmentval) >= minRatio, ]
d4d58887f008 Uploaded
stef
parents:
diff changeset
93 fused.data
d4d58887f008 Uploaded
stef
parents:
diff changeset
94 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
95
d4d58887f008 Uploaded
stef
parents:
diff changeset
96 ## DESC: takes the output of fuse.regions and outputs a txt file per sample
d4d58887f008 Uploaded
stef
parents:
diff changeset
97 outputRegionsFromList <- function ( regionsList, outputBasename, outputDir="./", binSize, storeList ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
98 if ( missing(regionsList) ) stop( 'Please provide regionsList...' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
99 if ( missing(outputBasename) ) stop( 'Please provide outputBasename...' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
100 if ( !is.list(regionsList) ) stop( 'Input not a list...?' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
101 if ( length(regionsList) < 1 ) stop( 'List seems empty...?' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
102 if ( file.exists( outputDir ) ) catMsg( c(" Using dir ", outputDir, " for output") )
d4d58887f008 Uploaded
stef
parents:
diff changeset
103 else dir.create( outputDir )
d4d58887f008 Uploaded
stef
parents:
diff changeset
104
d4d58887f008 Uploaded
stef
parents:
diff changeset
105 ## have to set R output options otherwise scientific method is used at some point
d4d58887f008 Uploaded
stef
parents:
diff changeset
106 options( "scipen"=100 )
d4d58887f008 Uploaded
stef
parents:
diff changeset
107
d4d58887f008 Uploaded
stef
parents:
diff changeset
108 sampleCount <- length( regionsList )
d4d58887f008 Uploaded
stef
parents:
diff changeset
109 sampleNames <- names( regionsList )
d4d58887f008 Uploaded
stef
parents:
diff changeset
110 bedgraphColumns <- c( 'chr', 'start', 'end', 'segmentval' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
111
d4d58887f008 Uploaded
stef
parents:
diff changeset
112 catMsg( c( " There are ", sampleCount, " samples found in input list") )
d4d58887f008 Uploaded
stef
parents:
diff changeset
113
d4d58887f008 Uploaded
stef
parents:
diff changeset
114 for ( sample in sampleNames ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
115 catMsg( c(" Working on sample ", sample ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
116 regionCount <- nrow( regionsList[[sample]] )
d4d58887f008 Uploaded
stef
parents:
diff changeset
117
d4d58887f008 Uploaded
stef
parents:
diff changeset
118 outSampleBase <- paste( outputBasename, '_', sample, '_', binSize, 'kbp', sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
119 outBedgraphFile <- paste( outSampleBase, '.bedGraph', sep="" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
120 outBedgraphPath <- paste( outputDir, '/', outBedgraphFile, sep="" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
121
d4d58887f008 Uploaded
stef
parents:
diff changeset
122 ## ---------- BEDGRAPH ----------
d4d58887f008 Uploaded
stef
parents:
diff changeset
123 txt <- paste( "track type=bedGraph color=0,100,0 altColor=255,0,0 name=", sample," description=segmented_regions_from_QDNAseq_",binSize,"kbp\n", sep="")
d4d58887f008 Uploaded
stef
parents:
diff changeset
124 sink( outBedgraphPath )
d4d58887f008 Uploaded
stef
parents:
diff changeset
125 cat( txt )
d4d58887f008 Uploaded
stef
parents:
diff changeset
126 sink()
d4d58887f008 Uploaded
stef
parents:
diff changeset
127 write.table( regionsList[[sample]][,bedgraphColumns], outBedgraphPath, quote=F, sep="\t", row.names=F, append=T, col.names=F)
d4d58887f008 Uploaded
stef
parents:
diff changeset
128 #outFiles[[sample]] <- c( outBedgraphFile )
d4d58887f008 Uploaded
stef
parents:
diff changeset
129 storeList[[ paste( binSize, sample, 'bedgraph', sep="_")]] <- outBedgraphFile
d4d58887f008 Uploaded
stef
parents:
diff changeset
130 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
131 return(storeList)
d4d58887f008 Uploaded
stef
parents:
diff changeset
132 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
133
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
134 ## ==================================================
4943308e95fc Uploaded
stef
parents: 21
diff changeset
135 ## Unused but potential usefull code
4943308e95fc Uploaded
stef
parents: 21
diff changeset
136 ## ==================================================
4943308e95fc Uploaded
stef
parents: 21
diff changeset
137 #@ a bit hacky galaxy way to allow an unknown number of output files based on param selection
4943308e95fc Uploaded
stef
parents: 21
diff changeset
138 #@ see: https://wiki.galaxyproject.org/Admin/Tools/Multiple%20Output%20Files
4943308e95fc Uploaded
stef
parents: 21
diff changeset
139 #historyName <- paste(binSize, 'kbp-IGV', sep="")
4943308e95fc Uploaded
stef
parents: 21
diff changeset
140 #igvFile <- paste( newFilePath, "/primary_", outputId, "_", historyName, "_visible_txt", sep="" )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
141
d4d58887f008 Uploaded
stef
parents:
diff changeset
142 ## ==================================================
d4d58887f008 Uploaded
stef
parents:
diff changeset
143 ## Start of analysis
d4d58887f008 Uploaded
stef
parents:
diff changeset
144 ## ==================================================
18
b711e34e73dc Uploaded
stef
parents: 12
diff changeset
145 MAIN_NAME <- '[INFO] '
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
146 catMsg( "Starting QDNAseq wrapper" )
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
147 #catMsg( R.version.string )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
148 catMsg( "Loading R libraries" )
7
1181e22c2b5a Uploaded
stef
parents: 6
diff changeset
149
12
6936ad89f369 Uploaded
stef
parents: 9
diff changeset
150 ## supress msg to allow R to finish with non-error msg
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
151 suppressWarnings( suppressMessages( library( QDNAseq, quietly = TRUE ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
152 suppressWarnings( suppressMessages( library( CGHcall, quietly = TRUE ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
153
12
6936ad89f369 Uploaded
stef
parents: 9
diff changeset
154 ## only one param: the tmp config file
6936ad89f369 Uploaded
stef
parents: 9
diff changeset
155 cmdLineArgs <- commandArgs(TRUE)
6936ad89f369 Uploaded
stef
parents: 9
diff changeset
156 config <- cmdLineArgs[1]
20
f31856c25082 Uploaded
stef
parents: 19
diff changeset
157 TOOL_PATH <- cmdLineArgs[2]
12
6936ad89f369 Uploaded
stef
parents: 9
diff changeset
158 CSS_FILE <- paste( TOOL_PATH, '/static/css/QDNAseq.css', sep="" )
6936ad89f369 Uploaded
stef
parents: 9
diff changeset
159 DECIMALS <- 3
6936ad89f369 Uploaded
stef
parents: 9
diff changeset
160 WEB_LINK <- 'http://www.bioconductor.org/packages/release/bioc/html/QDNAseq.html'
6936ad89f369 Uploaded
stef
parents: 9
diff changeset
161 PURE_CSS <- 'http://yui.yahooapis.com/pure/0.5.0/pure-min.css'
6936ad89f369 Uploaded
stef
parents: 9
diff changeset
162
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
163 ## sourcing the config file will load all input params
d4d58887f008 Uploaded
stef
parents:
diff changeset
164 ## many variables are imported via sourced "config"
d4d58887f008 Uploaded
stef
parents:
diff changeset
165 source( config )
d4d58887f008 Uploaded
stef
parents:
diff changeset
166
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
167 ## if calling requested we always need segmenting first as well
4943308e95fc Uploaded
stef
parents: 21
diff changeset
168 if ( doCall ){ doSegment <- TRUE }
4943308e95fc Uploaded
stef
parents: 21
diff changeset
169
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
170 ## desparate tries to make png text scale well, damn you R...!
d4d58887f008 Uploaded
stef
parents:
diff changeset
171 PLOT_RES <- min( PLOT_WIDTH, PLOT_HEIGHT ) / 6.3
d4d58887f008 Uploaded
stef
parents:
diff changeset
172 PAR_SET <- list( pch=22 )
d4d58887f008 Uploaded
stef
parents:
diff changeset
173
d4d58887f008 Uploaded
stef
parents:
diff changeset
174 systemUser <- system("whoami",T)
d4d58887f008 Uploaded
stef
parents:
diff changeset
175 qdnaseqVersion <- packageDescription( "QDNAseq" )$Version
d4d58887f008 Uploaded
stef
parents:
diff changeset
176 rVersion <- R.version.string
d4d58887f008 Uploaded
stef
parents:
diff changeset
177 startTime <- Sys.time()
d4d58887f008 Uploaded
stef
parents:
diff changeset
178 analysisStart <- as.character( startTime )
d4d58887f008 Uploaded
stef
parents:
diff changeset
179 catMsg( c("QDNAseq version: ", qdnaseqVersion) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
180 catMsg( c( rVersion ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
181
d4d58887f008 Uploaded
stef
parents:
diff changeset
182 ## get the comma separated list of chromosomes to exclude
d4d58887f008 Uploaded
stef
parents:
diff changeset
183 excludeChrs <- unlist( strsplit( excludeChrsString, ",") )
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
184
4943308e95fc Uploaded
stef
parents: 21
diff changeset
185 ## format binSizes back to integers because stupid galaxy doesn't do what I want
4943308e95fc Uploaded
stef
parents: 21
diff changeset
186 #print( binSizesString )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
187 binSizes <- gsub( 'kb', '', binSizesString ) # remove the kb string to get integers
4943308e95fc Uploaded
stef
parents: 21
diff changeset
188 #print( binSizes )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
189 binSizes <- gsub( 'bin', '', binSizes ) # remove the kb string to get integers
4943308e95fc Uploaded
stef
parents: 21
diff changeset
190 #print( binSizes )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
191 binSizes <- as.numeric( unlist( strsplit( binSizes, ",") ) )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
192 #print( binSizes )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
193
d4d58887f008 Uploaded
stef
parents:
diff changeset
194
d4d58887f008 Uploaded
stef
parents:
diff changeset
195 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
196 ## DEBUG
d4d58887f008 Uploaded
stef
parents:
diff changeset
197 if ( debug ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
198 catMsg( c("Analysis run by user: ", systemUser ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
199 catMsg( c("DEBUG SessionInfo: " ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
200 print( sessionInfo() )
d4d58887f008 Uploaded
stef
parents:
diff changeset
201 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
202 ## /DEBUG
d4d58887f008 Uploaded
stef
parents:
diff changeset
203 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
204
d4d58887f008 Uploaded
stef
parents:
diff changeset
205 ## prepare output dir
d4d58887f008 Uploaded
stef
parents:
diff changeset
206 if ( !file.exists( outputPath) ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
207 dir.create( outputPath )
d4d58887f008 Uploaded
stef
parents:
diff changeset
208 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
209
d4d58887f008 Uploaded
stef
parents:
diff changeset
210 ## copy source config file to output dir to include it in output zip
d4d58887f008 Uploaded
stef
parents:
diff changeset
211 if ( inGalaxy ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
212 file.copy( config, paste(outputPath, 'galaxyConfigFile.R', sep='/') )
d4d58887f008 Uploaded
stef
parents:
diff changeset
213 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
214
d4d58887f008 Uploaded
stef
parents:
diff changeset
215 ## setup bam filelist for easy retrieval later
d4d58887f008 Uploaded
stef
parents:
diff changeset
216 fileList <- makeBamFileList( bamsPaths, bamsNames )
d4d58887f008 Uploaded
stef
parents:
diff changeset
217 bamCount <- length( fileList[[ 'all_paths' ]] )
d4d58887f008 Uploaded
stef
parents:
diff changeset
218
d4d58887f008 Uploaded
stef
parents:
diff changeset
219 gzipOutputName <- paste( 'QDNAseqResults_', outputName, '.zip', sep='' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
220 gzipOutputPath <- paste( outputPath, '/', gzipOutputName, sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
221 htmlOutputName <- 'index.html'
d4d58887f008 Uploaded
stef
parents:
diff changeset
222 htmlOutputPath <- paste( outputPath, '/', htmlOutputName, sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
223
d4d58887f008 Uploaded
stef
parents:
diff changeset
224 plotted_images <- list() # to keep track of images for later linking
d4d58887f008 Uploaded
stef
parents:
diff changeset
225 regions <- list() # will contain the segments
d4d58887f008 Uploaded
stef
parents:
diff changeset
226
d4d58887f008 Uploaded
stef
parents:
diff changeset
227 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
228 ## in case of debug just use inbuilt LGG data for speedup
d4d58887f008 Uploaded
stef
parents:
diff changeset
229 if ( debug ){
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
230 catMsg( c("Built in data only contains binsize 15kb so overriding chosen binSizes to single 15kb") )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
231 binSizes <- c(15)
d4d58887f008 Uploaded
stef
parents:
diff changeset
232 bamsPaths <- c( "BUILD_IN_DATA")
d4d58887f008 Uploaded
stef
parents:
diff changeset
233 bamsNames <- c( "LGG150")
d4d58887f008 Uploaded
stef
parents:
diff changeset
234 fileList <- makeBamFileList( bamsPaths, bamsNames )
d4d58887f008 Uploaded
stef
parents:
diff changeset
235 bamCount <- length( fileList[[ 'all_paths' ]] )
d4d58887f008 Uploaded
stef
parents:
diff changeset
236 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
237
d4d58887f008 Uploaded
stef
parents:
diff changeset
238 for ( binSize in binSizes ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
239
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
240 catMsg( c("Starting analysis for binSize: ", binSize) )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
241 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
242 ## construct output file-names and -paths
d4d58887f008 Uploaded
stef
parents:
diff changeset
243 ## ------------------------
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
244 rdsReadName <- paste( binSize, 'kbp_QDNAseqReadCounts.rds', sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
245 rdsCopyName <- paste( binSize, 'kbp_QDNAseqCopyNumbers.rds', sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
246 rdsSegmName <- paste( binSize, 'kbp_QDNAseqCopyNumbersSegmented.rds', sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
247 rdsCallName <- paste( binSize, 'kbp_QDNAseqCopyNumbersCalled.rds', sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
248 igvCopyName <- paste( binSize, 'kbp_QDNAseqCopyNumbers.igv', sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
249 igvSegmName <- paste( binSize, 'kbp_QDNAseqCopyNumbersSegmented.igv', sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
250 igvCallName <- paste( binSize, 'kbp_QDNAseqCopyNumbersCalled.igv', sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
251
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
252 regiOutputName <- paste( binSize, 'kbp_QDNAseqRegions.rds', sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
253 noiseImgName <- paste( binSize, 'kbp_QDNAseqNoiseplot.png', sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
254
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
255 rdsRegiPath <- paste( outputPath, '/', regiOutputName, sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
256 noiseImgPath <- paste( outputPath, '/', noiseImgName, sep='')
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
257
d4d58887f008 Uploaded
stef
parents:
diff changeset
258 binAnnFile <- paste( TOOL_PATH, '/static/binannotation/', binSize, 'kbp_binAnnotations.rds', sep="" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
259 if ( file.exists(binAnnFile) ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
260 binAnnotations <- readRDS( binAnnFile )
d4d58887f008 Uploaded
stef
parents:
diff changeset
261 catMsg( c("Using local binAnnotations file" ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
262 }else{
d4d58887f008 Uploaded
stef
parents:
diff changeset
263 binAnnotations <- getBinAnnotations( binSize=binSize, type=experimentType )
d4d58887f008 Uploaded
stef
parents:
diff changeset
264 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
265
d4d58887f008 Uploaded
stef
parents:
diff changeset
266 ## in case of debug just use inbuilt LGG data for speedup
d4d58887f008 Uploaded
stef
parents:
diff changeset
267 if ( debug ){
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
268 data( LGG150 )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
269 readCounts <- LGG150
d4d58887f008 Uploaded
stef
parents:
diff changeset
270 }else{
d4d58887f008 Uploaded
stef
parents:
diff changeset
271 ## provide bamnames because in galaxy everyting is called "dataset_###"
d4d58887f008 Uploaded
stef
parents:
diff changeset
272 readCounts <- binReadCounts( binAnnotations, bamfiles=fileList[[ 'all_paths' ]], bamnames=fileList[[ 'all_names' ]] )
d4d58887f008 Uploaded
stef
parents:
diff changeset
273 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
274
d4d58887f008 Uploaded
stef
parents:
diff changeset
275 readCountsFiltered <- applyFilters( readCounts, residual=TRUE, blacklist=filterBlacklistedBins, mappability=mappabilityCutoff, chromosomes=excludeChrs )
d4d58887f008 Uploaded
stef
parents:
diff changeset
276 readCountsFiltered <- estimateCorrection( readCountsFiltered )
d4d58887f008 Uploaded
stef
parents:
diff changeset
277 copyNumbers <- correctBins( readCountsFiltered )
d4d58887f008 Uploaded
stef
parents:
diff changeset
278 copyNumbersNormalized <- normalizeBins( copyNumbers )
d4d58887f008 Uploaded
stef
parents:
diff changeset
279 copyNumbersSmooth <- smoothOutlierBins( copyNumbersNormalized )
d4d58887f008 Uploaded
stef
parents:
diff changeset
280 sampleNames <- readCountsFiltered@phenoData@data$name
d4d58887f008 Uploaded
stef
parents:
diff changeset
281
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
282 ## set file to output if output requested
4943308e95fc Uploaded
stef
parents: 21
diff changeset
283 outputData <- copyNumbersSmooth
4943308e95fc Uploaded
stef
parents: 21
diff changeset
284 outputType <- 'copynumber'
4943308e95fc Uploaded
stef
parents: 21
diff changeset
285 outputLogT <- TRUE
4943308e95fc Uploaded
stef
parents: 21
diff changeset
286 rdsReadPath <- paste( outputPath, '/', rdsReadName, sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
287 saveRDS( readCounts, rdsReadPath );
4943308e95fc Uploaded
stef
parents: 21
diff changeset
288 rdsPath <- paste( outputPath, '/', rdsCopyName, sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
289 igvPath <- paste( outputPath, '/', igvCopyName, sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
290
4943308e95fc Uploaded
stef
parents: 21
diff changeset
291 ## proceed with segmenting / calling if requested
4943308e95fc Uploaded
stef
parents: 21
diff changeset
292 if ( doSegment ){
27
f89205f51e27 Uploaded
stef
parents: 23
diff changeset
293 copyNumbersSegmented <- segmentBins( copyNumbersSmooth, undo.splits=undoSplits, undo.SD=undoSD, transformFun=c("sqrt") )
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
294 copyNumbersSegmented <- normalizeSegmentedBins( copyNumbersSegmented )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
295 outputData <- copyNumbersSegmented
4943308e95fc Uploaded
stef
parents: 21
diff changeset
296 outputType <- 'segments'
27
f89205f51e27 Uploaded
stef
parents: 23
diff changeset
297 igvPath <- paste( outputPath, '/', igvSegmName, sep='')
f89205f51e27 Uploaded
stef
parents: 23
diff changeset
298 rdsPath <- paste( outputPath, '/', rdsSegmName, sep='')
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
299 }
4943308e95fc Uploaded
stef
parents: 21
diff changeset
300 if ( doCall ){
4943308e95fc Uploaded
stef
parents: 21
diff changeset
301 copyNumbersCalled <- callBins(copyNumbersSegmented)
4943308e95fc Uploaded
stef
parents: 21
diff changeset
302 outputData <- copyNumbersCalled
4943308e95fc Uploaded
stef
parents: 21
diff changeset
303 outputType <- 'calls'
4943308e95fc Uploaded
stef
parents: 21
diff changeset
304 outputLogT <- FALSE # call values should not be transformed at output
4943308e95fc Uploaded
stef
parents: 21
diff changeset
305 rdsPath <- paste( outputPath, '/', rdsCallName, sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
306 igvPath <- paste( outputPath, '/', igvCallName, sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
307 }
4943308e95fc Uploaded
stef
parents: 21
diff changeset
308
4943308e95fc Uploaded
stef
parents: 21
diff changeset
309 ## save the QDNAseq objects and tsv file of highest level (calls or segments)
4943308e95fc Uploaded
stef
parents: 21
diff changeset
310 saveRDS( outputData, rdsPath );
4943308e95fc Uploaded
stef
parents: 21
diff changeset
311 exportBins( outputData, file=igvPath, format="igv", type=outputType, logTransform=outputLogT )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
312
d4d58887f008 Uploaded
stef
parents:
diff changeset
313 ## also save objects for galaxy history output if requested
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
314 if ( txt2history ){
4943308e95fc Uploaded
stef
parents: 21
diff changeset
315 fileId <- paste('txt_', binSize, sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
316 historyOutputPath <- historyOutputFiles[[ fileId ]]
4943308e95fc Uploaded
stef
parents: 21
diff changeset
317 catMsg( c("About to export igv/txt file to history for ", binSize, "kbp bin") )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
318 exportBins( outputData, file=historyOutputPath, format="igv", type=outputType, logTransform=outputLogT )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
319 }
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
320 if ( rds2history ){
4943308e95fc Uploaded
stef
parents: 21
diff changeset
321 fileId <- paste('rds_', binSize, sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
322 rdsHistoryOutputPath <- historyOutputFiles[[ fileId ]]
4943308e95fc Uploaded
stef
parents: 21
diff changeset
323 catMsg( c("About to export rds file to history for ", binSize, "kbp bin") )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
324 saveRDS( outputData, file=rdsHistoryOutputPath )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
325 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
326
d4d58887f008 Uploaded
stef
parents:
diff changeset
327 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
328 ## create output files
d4d58887f008 Uploaded
stef
parents:
diff changeset
329 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
330 png( noiseImgPath, width=PLOT_HEIGHT, height=PLOT_HEIGHT, res=PLOT_RES );
d4d58887f008 Uploaded
stef
parents:
diff changeset
331 par( PAR_SET )
d4d58887f008 Uploaded
stef
parents:
diff changeset
332 noisePlot( readCountsFiltered, main=paste( "Noise Plot ", binSize, "kbp", sep=''), col="darkgreen" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
333 dev.off()
d4d58887f008 Uploaded
stef
parents:
diff changeset
334
d4d58887f008 Uploaded
stef
parents:
diff changeset
335 binSize <- as.character( binSize ) # to avoid R using it as array index... (*#$^@ you R!)
d4d58887f008 Uploaded
stef
parents:
diff changeset
336 binSizeString <- paste( binSize, 'kbp', sep='')
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
337 cgh <- makeCgh( outputData ) # needed for fuseRegions function
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
338
d4d58887f008 Uploaded
stef
parents:
diff changeset
339 for (i in 1:length(sampleNames) ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
340
d4d58887f008 Uploaded
stef
parents:
diff changeset
341 sample <- sampleNames[i]
d4d58887f008 Uploaded
stef
parents:
diff changeset
342 usedReads <- readCountsFiltered@phenoData@data$used.reads[i]
d4d58887f008 Uploaded
stef
parents:
diff changeset
343 catMsg( c("Creating plots for sample: ", sample, " (", binSizeString, ")" ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
344
d4d58887f008 Uploaded
stef
parents:
diff changeset
345 type <- 'CopyNumbers'
d4d58887f008 Uploaded
stef
parents:
diff changeset
346 img_file <- paste( sample, '_', binSize, 'kbp_QDNAseq', type, '.png', sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
347 img_file_path <- paste( outputPath, '/', img_file, sep='' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
348
d4d58887f008 Uploaded
stef
parents:
diff changeset
349 ## COPYNUMBER PLOT
d4d58887f008 Uploaded
stef
parents:
diff changeset
350 png( img_file_path, width=PLOT_WIDTH, height=PLOT_HEIGHT, res=PLOT_RES );
d4d58887f008 Uploaded
stef
parents:
diff changeset
351 par( PAR_SET )
d4d58887f008 Uploaded
stef
parents:
diff changeset
352 plot( copyNumbersSmooth[ ,sample ], main=paste(sample, ": CopyNumbers", sep="") )
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
353 mtext( paste( "(", binSizeString, " bins)", sep=""), 3 )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
354 abline( h=c(-2,-1,1,2,3,4), lty=1, lwd=0.5, col="grey" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
355 dev.off()
d4d58887f008 Uploaded
stef
parents:
diff changeset
356
d4d58887f008 Uploaded
stef
parents:
diff changeset
357 plotted_images[[ paste(binSize, sample, type, sep="_" ) ]] <- img_file
d4d58887f008 Uploaded
stef
parents:
diff changeset
358
d4d58887f008 Uploaded
stef
parents:
diff changeset
359 if ( doSegment ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
360 type <- 'Segmented'
d4d58887f008 Uploaded
stef
parents:
diff changeset
361 img_file <- paste( sample, '_', binSize, 'kbp_QDNAseq', type, '.png', sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
362 img_file_path <- paste( outputPath, '/', img_file, sep='' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
363
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
364 ## COPYNUMBER + SEGMENTS PLOT
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
365 png( img_file_path, width=PLOT_WIDTH, height=PLOT_HEIGHT, res=PLOT_RES );
d4d58887f008 Uploaded
stef
parents:
diff changeset
366 par( PAR_SET )
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
367 plot( copyNumbersSegmented[ ,sample ], main=paste(sample, ": CopyNumbers (Segmented)", sep="") )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
368 mtext( paste( "(", binSizeString, " bins)", sep=""), 3 )
d4d58887f008 Uploaded
stef
parents:
diff changeset
369 abline( h=c(-2,-1,1,2,3,4), lty=1, lwd=0.5, col="grey" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
370 dev.off()
d4d58887f008 Uploaded
stef
parents:
diff changeset
371
d4d58887f008 Uploaded
stef
parents:
diff changeset
372 plotted_images[[ paste(binSize, sample, type, sep="_" ) ]] <- img_file
d4d58887f008 Uploaded
stef
parents:
diff changeset
373
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
374 ## if segmented we can also retrieve the segment locations
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
375 catMsg( c(" Fusing regions of sample: ", sample) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
376 regions[[ sample ]] <- fuseRegions( cgh[, sample] )
d4d58887f008 Uploaded
stef
parents:
diff changeset
377
d4d58887f008 Uploaded
stef
parents:
diff changeset
378 region_count <- nrow( data.frame( regions[[ sample ]] ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
379 catMsg( c( ' sample "', sample, '" has ', region_count, " regions" ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
380 plotted_images[[ paste(binSize, sample, 'region_count', sep="_" ) ]] <- region_count
d4d58887f008 Uploaded
stef
parents:
diff changeset
381 }
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
382
4943308e95fc Uploaded
stef
parents: 21
diff changeset
383 if ( doCall ){
4943308e95fc Uploaded
stef
parents: 21
diff changeset
384 type <- 'Called'
4943308e95fc Uploaded
stef
parents: 21
diff changeset
385 img_file <- paste( sample, '_', binSize, 'kbp_QDNAseq', type, '.png', sep='')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
386 img_file_path <- paste( outputPath, '/', img_file, sep='' )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
387
4943308e95fc Uploaded
stef
parents: 21
diff changeset
388 ## COPYNUMBER + SEGMENTS + CALLS PLOT
4943308e95fc Uploaded
stef
parents: 21
diff changeset
389 png( img_file_path, width=PLOT_WIDTH, height=PLOT_HEIGHT, res=PLOT_RES );
4943308e95fc Uploaded
stef
parents: 21
diff changeset
390 par( PAR_SET )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
391 plot( copyNumbersCalled[ ,sample ], main=paste(sample, ": CopyNumbers (Segmented and Called)", sep="") )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
392 mtext( paste( "(", binSizeString, " bins)", sep=""), 3 )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
393 abline( h=c(-2,-1,1,2,3,4), lty=1, lwd=0.5, col="grey" )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
394 dev.off()
4943308e95fc Uploaded
stef
parents: 21
diff changeset
395
4943308e95fc Uploaded
stef
parents: 21
diff changeset
396 plotted_images[[ paste(binSize, sample, type, sep="_" ) ]] <- img_file
4943308e95fc Uploaded
stef
parents: 21
diff changeset
397 }
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
398
d4d58887f008 Uploaded
stef
parents:
diff changeset
399 ## add USED read counts
d4d58887f008 Uploaded
stef
parents:
diff changeset
400 plotted_images[[ paste(binSize, sample, 'usedReads', sep="_" ) ]] <- usedReads
d4d58887f008 Uploaded
stef
parents:
diff changeset
401 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
402
d4d58887f008 Uploaded
stef
parents:
diff changeset
403 if ( doSegment ){
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
404 saveRDS( regions, rdsRegiPath )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
405 plotted_images <- outputRegionsFromList( regions, outputBasename=outputName, outputDir=outputPath, binSize=binSize, storeList=plotted_images )
d4d58887f008 Uploaded
stef
parents:
diff changeset
406 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
407 }# end bin
d4d58887f008 Uploaded
stef
parents:
diff changeset
408
d4d58887f008 Uploaded
stef
parents:
diff changeset
409
d4d58887f008 Uploaded
stef
parents:
diff changeset
410 ## ----- debug -----
d4d58887f008 Uploaded
stef
parents:
diff changeset
411 #catMsg( "done" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
412 #q(status=0)
d4d58887f008 Uploaded
stef
parents:
diff changeset
413 ## ---- /debug -----
d4d58887f008 Uploaded
stef
parents:
diff changeset
414
d4d58887f008 Uploaded
stef
parents:
diff changeset
415
d4d58887f008 Uploaded
stef
parents:
diff changeset
416 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
417 ## prepare output
d4d58887f008 Uploaded
stef
parents:
diff changeset
418 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
419 catMsg( "...zipping output")
d4d58887f008 Uploaded
stef
parents:
diff changeset
420 zip_cmd <- paste( "zip -j", gzipOutputPath, paste(outputPath,'/*',sep='') ) ## -j is for removing dirs from the tree
d4d58887f008 Uploaded
stef
parents:
diff changeset
421 system( zip_cmd )
d4d58887f008 Uploaded
stef
parents:
diff changeset
422
d4d58887f008 Uploaded
stef
parents:
diff changeset
423 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
424 ## get filesizes for report
d4d58887f008 Uploaded
stef
parents:
diff changeset
425 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
426 zippedSize <- paste( round( file.info( gzipOutputPath )[["size"]] / 1e+6, digits=2 ), 'MB' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
427 endTime <- Sys.time()
d4d58887f008 Uploaded
stef
parents:
diff changeset
428 timeDiff <- format( round( endTime - startTime, 3 ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
429 analysisEnd <- as.character( endTime )
d4d58887f008 Uploaded
stef
parents:
diff changeset
430
d4d58887f008 Uploaded
stef
parents:
diff changeset
431 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
432 ## creating html output to be linked to from the middle galaxy pane
d4d58887f008 Uploaded
stef
parents:
diff changeset
433 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
434 sink( file = htmlOutputPath, type = "output" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
435 cat( "<html>\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
436 cat( "<head>\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
437
d4d58887f008 Uploaded
stef
parents:
diff changeset
438 cat( "\t", '<title>QDNAseq Report | ', outputName,'</title>', "\n", sep='' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
439 cat( "\t", '<link rel="stylesheet" href="', PURE_CSS, '">', "\n", sep='' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
440 cat( "\t<style>\n", sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
441 ## include CSS into html file, makes it more portable
d4d58887f008 Uploaded
stef
parents:
diff changeset
442 cat( "\t\t", readLines( CSS_FILE ), sep="\n\t\t" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
443 #cat( "\t\th1 {color:red;}", "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
444 cat( "\n\t</style>\n" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
445
d4d58887f008 Uploaded
stef
parents:
diff changeset
446 cat( "\n</head>\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
447 cat( "\n<body>\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
448
d4d58887f008 Uploaded
stef
parents:
diff changeset
449 cat( "<h1>QDNAseq Report</h1>", "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
450
d4d58887f008 Uploaded
stef
parents:
diff changeset
451 cat( '<h3 class="qdnaseq">About this analysis</h3>', "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
452 cat( '<p>This page provides access to all results. To have a local copy of this report just download the <a href="', gzipOutputName, '" class="button">zipfile</a> with all output (', zippedSize, ')</p>', "\n", sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
453
d4d58887f008 Uploaded
stef
parents:
diff changeset
454 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
455 ## table with general info
d4d58887f008 Uploaded
stef
parents:
diff changeset
456 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
457 cat( '<h3 class="qdnaseq">Settings</h3><p>', "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
458 cat( '<table class="pure-table pure-table-striped"><tbody>' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
459 cat( htmlTableRow( c( "AnalysisName", outputName ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
460 cat( htmlTableRow( c( "AnalysisStart", analysisStart ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
461 cat( htmlTableRow( c( "AnalysisEnd", analysisEnd ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
462 cat( htmlTableRow( c( "AnalysisTime", timeDiff ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
463 cat( htmlTableRow( c( "BinSizes (kbp)", paste(binSizes,collapse=", ") ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
464 cat( htmlTableRow( c( "R info", rVersion ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
465 cat( htmlTableRow( c( "QDNAseq info", qdnaseqVersion ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
466
d4d58887f008 Uploaded
stef
parents:
diff changeset
467 sampleStrings <- c()
d4d58887f008 Uploaded
stef
parents:
diff changeset
468 for ( galaxyName in fileList[[ 'all_files' ]] ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
469 sampleName <- fileList[[ galaxyName ]]
d4d58887f008 Uploaded
stef
parents:
diff changeset
470 sampleStrings <- c( sampleStrings, paste( galaxyName, ' (', sampleName, ')', sep='' ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
471 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
472 cat( htmlTableRow( c( "InputBams", paste( sampleStrings, collapse=", ") ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
473
d4d58887f008 Uploaded
stef
parents:
diff changeset
474 cat( "</tbody></table></p>", "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
475
d4d58887f008 Uploaded
stef
parents:
diff changeset
476 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
477 ## list with links to all output files
d4d58887f008 Uploaded
stef
parents:
diff changeset
478 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
479 cat( '<h3 class="qdnaseq">Output files</h3><p>', "\n")
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
480 cat( '<p>This table contains output files that can be used for local downstream analysis with the bioconductor QDNAseq package. For each bin-size / data-level there is a R data structure file with data of all samples. See ', htmlLink( WEB_LINK, 'the bioconductor QDNAseq documentation' ), ' for more information on how to work with these files.</p>', "\n", sep='')
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
481 cat( '<table class="pure-table pure-table-striped">', "\n" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
482 cat( '<thead><th>Type</th>', as.vector( mapply( paste, "<th>", binSizes, "kbp</th>", sep="" ) ),'</thead>', "\n" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
483 cat( "<tbody>", "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
484 files <- list()
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
485 #fileTypes <- c( 'ReadCounts.rds', 'CopyNumbers.rds' )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
486 fileTypes <- c( 'ReadCounts.rds' )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
487 if ( doCall ){
4943308e95fc Uploaded
stef
parents: 21
diff changeset
488 fileTypes <- c( fileTypes, 'CopyNumbersCalled.rds')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
489 }else if ( doSegment ){
4943308e95fc Uploaded
stef
parents: 21
diff changeset
490 fileTypes <- c( fileTypes, 'CopyNumbersSegmented.rds')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
491 }else {
4943308e95fc Uploaded
stef
parents: 21
diff changeset
492 fileTypes <- c( fileTypes, 'CopyNumbers.rds')
4943308e95fc Uploaded
stef
parents: 21
diff changeset
493 }
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
494
d4d58887f008 Uploaded
stef
parents:
diff changeset
495 for ( fileType in fileTypes ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
496 fileNames <- mapply( paste, binSizes, paste( 'kbp_QDNAseq', fileType, sep=''), sep='')
d4d58887f008 Uploaded
stef
parents:
diff changeset
497 fileLinks <- mapply( htmlLink, fileNames, paste( binSizes, "kbp", sep="" ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
498 cat( htmlTableRow( c( fileType, fileLinks ) ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
499 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
500 cat( "\n</tbody></table></p>", "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
501
d4d58887f008 Uploaded
stef
parents:
diff changeset
502 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
503 ## table with links to files
d4d58887f008 Uploaded
stef
parents:
diff changeset
504 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
505 ratio <- PLOT_WIDTH / PLOT_HEIGHT
d4d58887f008 Uploaded
stef
parents:
diff changeset
506 width <- 960; height <- width / ratio ## bigger img
d4d58887f008 Uploaded
stef
parents:
diff changeset
507 width_t <- 100; height_t <- 40 ## thumb img
d4d58887f008 Uploaded
stef
parents:
diff changeset
508
d4d58887f008 Uploaded
stef
parents:
diff changeset
509 cat( '<h3 class="qdnaseq">Results: overview</h3><p>', "\n")
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
510 cat( '<p>This table contains the visual results of the copy number aberration analysis. You can click on an image to jump to the larger version. If segmentation was performed as well the number of segments is shown and a file with genomic regions can be downloaded (just remember to inspect the results carefully as this is, together with optional calling afterwards, a more experimental type of analysis).</p>', "\n", sep='')
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
511 plots_html <- ''
d4d58887f008 Uploaded
stef
parents:
diff changeset
512
d4d58887f008 Uploaded
stef
parents:
diff changeset
513 colspan <- 1
d4d58887f008 Uploaded
stef
parents:
diff changeset
514 binHeader <- "<th>Image</th>"
d4d58887f008 Uploaded
stef
parents:
diff changeset
515 if ( doSegment ){ # extra column with segment info
d4d58887f008 Uploaded
stef
parents:
diff changeset
516 colspan <- 2
d4d58887f008 Uploaded
stef
parents:
diff changeset
517 binHeader <- "<th>Image</th><th>Segments</th>"
d4d58887f008 Uploaded
stef
parents:
diff changeset
518 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
519 cat( '<table class="pure-table pure-table-striped">', "\n" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
520 cat( '<thead><tr><th></th><th></th>', as.vector( mapply( paste, "<th colspan=\"", colspan,"\">", binSizes, "kbp</th>", sep="" ) ), '</tr></thead>' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
521 cat( '<thead><tr><th>Sample / File</th><th>Reads</th>', rep( binHeader, length(binSizes) ), '</tr></thead>' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
522 cat( '<tbody>' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
523
d4d58887f008 Uploaded
stef
parents:
diff changeset
524 for ( bam_file in bamsNames ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
525
d4d58887f008 Uploaded
stef
parents:
diff changeset
526 usedReads <- plotted_images[[ paste(binSize, bam_file, 'usedReads', sep="_" ) ]]
d4d58887f008 Uploaded
stef
parents:
diff changeset
527 usedReads <- format( as.integer(usedReads), digits=4, decimal.mark=".", big.mark="," )
d4d58887f008 Uploaded
stef
parents:
diff changeset
528 htmlRow <- paste( '<tr><td>', bam_file, '</td><td>', usedReads, '</td>', sep='' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
529
d4d58887f008 Uploaded
stef
parents:
diff changeset
530 for ( binSize in binSizes ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
531
d4d58887f008 Uploaded
stef
parents:
diff changeset
532 ## add thumbnails to table with links to anchors on html page
d4d58887f008 Uploaded
stef
parents:
diff changeset
533 copy_img <- plotted_images[[ paste(binSize, bam_file, 'CopyNumbers', sep="_" ) ]]
d4d58887f008 Uploaded
stef
parents:
diff changeset
534 html_copy_thumb <- htmlLink( path=paste('#', copy_img, sep=''), paste('<img src="',copy_img,'" alt="', bam_file, '" width="', width_t, '" height="', height_t, '">', sep='') )
d4d58887f008 Uploaded
stef
parents:
diff changeset
535 html_copy_img <- htmlLink( path=copy_img, paste('<img id="', copy_img,'" src="',copy_img,'" alt="',bam_file, '" width="', width, '" height="', height, '">', sep='') )
d4d58887f008 Uploaded
stef
parents:
diff changeset
536 html_segm_img <- ''
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
537 html_call_img <- ''
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
538 html_bedGraph <- ''
d4d58887f008 Uploaded
stef
parents:
diff changeset
539 region_count <- ''
d4d58887f008 Uploaded
stef
parents:
diff changeset
540 htmlRow <- paste( htmlRow, '<td>', html_copy_thumb, '</td>' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
541
d4d58887f008 Uploaded
stef
parents:
diff changeset
542 if ( doSegment ){
d4d58887f008 Uploaded
stef
parents:
diff changeset
543 segm_img <- plotted_images[[ paste(binSize, bam_file, 'Segmented', sep="_" ) ]]
d4d58887f008 Uploaded
stef
parents:
diff changeset
544 region_count <- plotted_images[[ paste(binSize, bam_file, 'region_count', sep="_" ) ]]
d4d58887f008 Uploaded
stef
parents:
diff changeset
545
d4d58887f008 Uploaded
stef
parents:
diff changeset
546 html_bedGraph <- htmlLink( path=plotted_images[[ paste(binSize, bam_file, 'bedgraph', sep="_" ) ]], 'bedGraph' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
547 html_segm_img <- htmlLink( path=segm_img, paste('<img id="', segm_img,'" src="', segm_img,'" alt="', bam_file, '" width="', width, '" height="', height,'">', sep='') )
d4d58887f008 Uploaded
stef
parents:
diff changeset
548 htmlRow <- paste( htmlRow, '<td>', region_count, ' (', html_bedGraph, ')</td>', sep="" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
549 }
23
4943308e95fc Uploaded
stef
parents: 21
diff changeset
550 if ( doCall ){
4943308e95fc Uploaded
stef
parents: 21
diff changeset
551 call_img <- plotted_images[[ paste(binSize, bam_file, 'Called', sep="_" ) ]]
4943308e95fc Uploaded
stef
parents: 21
diff changeset
552 html_call_img <- htmlLink( path=call_img, paste('<img id="', call_img,'" src="', call_img,'" alt="', bam_file, '" width="', width, '" height="', height,'">', sep='') )
4943308e95fc Uploaded
stef
parents: 21
diff changeset
553 }
4943308e95fc Uploaded
stef
parents: 21
diff changeset
554 plots_html <- paste( plots_html, html_copy_img, "\n", html_segm_img, "\n", html_call_img, "\n<br \\>\n", sep='' )
6
d4d58887f008 Uploaded
stef
parents:
diff changeset
555 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
556 plots_html <- paste( plots_html, "\n<hr \\>\n", sep='' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
557 ## add info to overview table, including small thumbnails
d4d58887f008 Uploaded
stef
parents:
diff changeset
558 htmlRow <- paste( htmlRow, '</tr>', sep='' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
559 cat( htmlRow, "\n" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
560 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
561 cat( "</tbody></table></p>", "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
562
d4d58887f008 Uploaded
stef
parents:
diff changeset
563 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
564 ## section with various output shown
d4d58887f008 Uploaded
stef
parents:
diff changeset
565 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
566 cat( '<h3 class="qdnaseq">Results: Sample plots</h3><p>', "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
567 ## now include (large) images in html page
d4d58887f008 Uploaded
stef
parents:
diff changeset
568 cat( plots_html, "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
569 cat( "\n</p></body>\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
570 cat( "\n</html>\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
571 sink()
d4d58887f008 Uploaded
stef
parents:
diff changeset
572
d4d58887f008 Uploaded
stef
parents:
diff changeset
573 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
574 ## creating main html output for galaxy history
d4d58887f008 Uploaded
stef
parents:
diff changeset
575 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
576 if ( inGalaxy ){ # dont create when running outside Galaxy
d4d58887f008 Uploaded
stef
parents:
diff changeset
577 sink( file = outputHtml, type = "output" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
578
d4d58887f008 Uploaded
stef
parents:
diff changeset
579 cat( "<head>", "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
580 cat( "\t", '<link rel="stylesheet" href="', PURE_CSS, '">', "\n", sep='' )
d4d58887f008 Uploaded
stef
parents:
diff changeset
581
d4d58887f008 Uploaded
stef
parents:
diff changeset
582 cat( "<style>", "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
583 ## include CSS directly into html file
d4d58887f008 Uploaded
stef
parents:
diff changeset
584 cat( paste( "\t", '/* the css here originates from ', CSS_FILE,' */', "\n") )
d4d58887f008 Uploaded
stef
parents:
diff changeset
585 cat( paste( "\t", readLines( CSS_FILE, n = -1)), sep="\n" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
586 cat( "</style>", "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
587 cat( "</head>", "\n")
d4d58887f008 Uploaded
stef
parents:
diff changeset
588
d4d58887f008 Uploaded
stef
parents:
diff changeset
589 cat( '<h1>QDNAseq Results (', outputName,')</h1>', "\n", sep="")
d4d58887f008 Uploaded
stef
parents:
diff changeset
590 cat( '<p>Explore <a href="', htmlOutputName, '" class="button">the results</a> directly within galaxy</p>', "\n", sep="")
d4d58887f008 Uploaded
stef
parents:
diff changeset
591 cat( '<p>Or download a <a href="', gzipOutputName, '" class="button">zipfile</a> with all output (', zippedSize, ')</p>', "\n", sep="" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
592
d4d58887f008 Uploaded
stef
parents:
diff changeset
593 sink()
d4d58887f008 Uploaded
stef
parents:
diff changeset
594 }
d4d58887f008 Uploaded
stef
parents:
diff changeset
595
d4d58887f008 Uploaded
stef
parents:
diff changeset
596 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
597 ## create final zip and quit with status 0 to tell galaxy all was fine
d4d58887f008 Uploaded
stef
parents:
diff changeset
598 ## ------------------------
d4d58887f008 Uploaded
stef
parents:
diff changeset
599 catMsg( "zipping all output")
d4d58887f008 Uploaded
stef
parents:
diff changeset
600 system( paste( "zip -j ", gzipOutputPath, paste(outputPath,'/', htmlOutputName, sep='') ) )
d4d58887f008 Uploaded
stef
parents:
diff changeset
601 catMsg( "done" )
d4d58887f008 Uploaded
stef
parents:
diff changeset
602 q(status=0)