annotate cluster.tools/order.by.cl.R @ 2:b442996b66ae draft

Uploaded
author peter-waltman
date Wed, 27 Feb 2013 20:17:04 -0500
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
2
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
1 #!/usr/bin/env Rscript
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
## Usage text, written to stderr when the script is invoked with --help.
argspec <- c("order.by.cl.R reorders the rows or columns of a data matrix by cluster assignment

Usage:
    order.by.cl.R -d <data.file> -c <cluster.assignment.file>
Optional:
    -g                 drop features whose names contain complex, abstract or family
    -w                 order the members within each cluster by hierarchical clustering
    -o <output_file>   defaults to the data file name with its tab/csv suffix replaced by cdt
\n\n")
args <- commandArgs(TRUE)
## a lone --help is handled here, before any option parsing takes place
if ( length( args ) == 1 && args == "--help" ) {
  write( argspec, stderr() )
  q()
}
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
14
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
## Attach a package while silencing its startup messages.
##
## package: the package to attach, written either as a bare name or as a
##          string; the argument is captured with substitute() and is never
##          evaluated.
lib.load.quiet <- function( package ) {
  pkg.name <- as.character( substitute( package ) )
  suppressPackageStartupMessages( library( pkg.name, character.only=TRUE ) )
}
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
lib.load.quiet( getopt )
lib.load.quiet( gplots )
## Optionally attach flashClust or, failing that, fastcluster (presumably so
## that a faster hclust() masks the stats one -- confirm).  Neither package is
## required.  requireNamespace() tests for a single package directly rather
## than scanning the whole installed.packages() matrix.
if ( requireNamespace( "flashClust", quietly=TRUE ) ) {
  lib.load.quiet( flashClust )
} else if ( requireNamespace( "fastcluster", quietly=TRUE ) ) {
  lib.load.quiet( fastcluster )
}
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
30
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
31
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
## getopt specification, one row per option:
## long name, short flag, argument mask, type.
spec <- matrix( c( "data.fname",    "d", 1, "character",
                   "class.select",  "c", 1, "character",
                   "genes.only",    "g", 0, "logical",
                   "within.cl.srt", "w", 0, "logical",
                   "output.fname",  "o", 2, "character"
                   ),
                ncol=4,
                byrow=TRUE
               )


opt <- getopt( spec=spec )

## both input files are read unconditionally later on, so fail early and
## clearly when either one is missing
if ( is.null( opt$data.fname ) ) {
  stop( "no data file given (use -d <data.file>)", call.=FALSE )
}
if ( is.null( opt$class.select ) ) {
  stop( "no cluster assignment file given (use -c <file>)", call.=FALSE )
}

if ( is.null( opt$output.fname ) ) {
  opt$output.fname <- sub( "tab$|csv$", "cdt", opt$data.fname )
  ## when the data file name ends in neither tab nor csv the substitution is
  ## a no-op; append the suffix instead so the input file is never overwritten
  if ( identical( opt$output.fname, opt$data.fname ) ) {
    opt$output.fname <- paste0( opt$data.fname, ".cdt" )
  }
}
if ( is.null( opt$genes.only ) ) opt$genes.only <- FALSE
if ( is.null( opt$within.cl.srt ) ) opt$within.cl.srt <- FALSE
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
47
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
## Read the tab-delimited data matrix.  The first column supplies the row
## names; column names are kept exactly as written (check.names=FALSE).
data <- as.matrix( read.delim( opt$data.fname, row.names=1, check.names=FALSE ) )

if ( opt$genes.only ) {
  ## discard every feature whose name contains complex, abstract or family
  feats <- rownames( data )
  gene.feats <- feats[ ! grepl( "complex|abstract|family", feats ) ]
  ## drop=FALSE keeps data a matrix even if only one feature survives
  data <- data[ gene.feats, , drop=FALSE ]
}
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
55
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
56
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
## Read the cluster assignments: the row names are the clustered items and
## the first column is used as the cluster label.  Rows are sorted by label.
cls <- as.matrix( read.delim( opt$class.select, row.names=1 ) )
cls <- cls[ order( cls[,1] ), , drop=FALSE ]

row.cluster <- FALSE
## we assume this is a row-wise clustering if any clustered item is a row
## name of the data; the data is then transposed so that the clustered items
## are always the columns from here on
if ( any( rownames( cls ) %in% rownames( data ) ) ) {
  row.cluster <- TRUE
  data <- t( data )
}

## restrict the assignments to the items that are present in the data
if ( ! all( rownames( cls ) %in% colnames( data ) ) ) {

  ovp <- rownames( cls )
  ovp <- ovp[ ovp %in% colnames( data ) ]
  if ( length( ovp ) > 0 ) {
    ## drop=FALSE keeps cls a matrix (with its row names) even when it has a
    ## single column or only one item overlaps
    cls <- cls[ ovp, , drop=FALSE ]
  }
  else {
    stop( "no samples in cluster are found in data file\n" )
  }
}
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
78
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
## Optionally re-order the members inside each cluster: clusters are visited
## in increasing label order and the members of each one are arranged in the
## leaf order of a hierarchical clustering of their data columns.
if ( opt$within.cl.srt ) {

  ## label of every item, named by item (names set explicitly so that they
  ## survive even when cls has a single row)
  cls.vect <- setNames( cls[,1], rownames( cls ) )
  cl.ids <- sort( unique( as.numeric( cls.vect ) ) )

  ordered.elts <- unlist( lapply( cl.ids,
                                  function(i) {
                                    elts <- names( cls.vect[ cls.vect %in% i ] )
                                    ## a cluster with fewer than two members has
                                    ## nothing to order, and hclust() needs at
                                    ## least two objects
                                    if ( length( elts ) < 2 ) return( elts )
                                    sub.mat <- data[, elts, drop=FALSE ]
                                    ## distances between the cluster's members
                                    ## (the columns of sub.mat)
                                    sub.dist <- dist( t( sub.mat ) )
                                    elts[ hclust( sub.dist )$order ]
                                  }
                                 )
                         )
  cls <- cls[ ordered.elts, , drop=FALSE ]
}
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
97
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
98
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
## re-order the columns to follow the cluster assignments and tag each column
## name with its zero-padded cluster number (<name>-cl<NN>)
## drop=FALSE keeps data a matrix even when only one item is left
data <- data[, rownames(cls), drop=FALSE ]
colnames( data ) <- paste( rownames(cls), paste0( "cl", sprintf( "%02d", cls[,1] ) ), sep="-" )

## now re-transpose, so the output has the same orientation as the input
if ( row.cluster ) {
  data <- t( data )
}
## col.names=NA writes an empty header cell above the row names
write.table( data, opt$output.fname, sep="\t", col.names=NA, quote=FALSE )
b442996b66ae Uploaded
peter-waltman
parents:
diff changeset
108