Mercurial > repos > peter-waltman > ucsc_cluster_tools2
diff cluster.tools/impute.knn.R @ 0:0decf3fd54bc draft
Uploaded
author | peter-waltman |
---|---|
date | Thu, 28 Feb 2013 01:45:39 -0500 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/cluster.tools/impute.knn.R Thu Feb 28 01:45:39 2013 -0500 @@ -0,0 +1,44 @@ +#!/usr/bin/env Rscript +argspec <- c("impute.knn.R replaces missing values, using the impute.knn function from the impute package + + Usage: + impute.knn.R -d <data.file> + Optional: + -o <output_file> + \n\n") +args <- commandArgs(TRUE) +if ( length( args ) == 1 && args =="--help") { + write(argspec, stderr()) + q(); +} + +lib.load.quiet <- function( package ) { + package <- as.character(substitute(package)) + suppressPackageStartupMessages( do.call( "library", list( package=package ) ) ) +} +lib.load.quiet(getopt) +lib.load.quiet( impute ) + +spec <- matrix( c( "data.fname", "d", 1, "character", + "output.fname", "o", 2, "character" + ), + nc=4, + byrow=TRUE + ) + +opt <- getopt( spec=spec ) + +data <- as.matrix( read.delim( opt$data.fname, row.names=1, check.names=FALSE ) ) +if ( is.null( opt$replacement.val ) ) { opt$replacement.val <- NA } +if ( is.null( opt$output.fname ) ) { opt$output.fname <- paste( "impute.knn", basename( opt$data.fname ), sep="." ) } + + ## Set any NA, NAN or Inf entries to 0 +if ( is.nan(data) ) { + data[ is.nan( data ) ] <- NA +} +if ( is.infinite(data) ) { + data[ is.infinite( data ) ] <- NA +} + +data <- impute.knn( data )$data +write.table( data, opt$output.fname, sep="\t", quote=FALSE, col.names=NA )