annotate naive_output.r @ 57:16c7fc1c4bf8 draft

Uploaded
author davidvanzessen
date Fri, 18 Mar 2016 07:50:34 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
57
16c7fc1c4bf8 Uploaded
davidvanzessen
parents:
diff changeset
# Merge a "naive" table with the best-match assignments from an SHM table
# and write the combined table to disk.
#
# Usage: Rscript naive_output.r <naive.file> <shm.file> <output.file>
#   naive.file   tab-separated table with a header row and an "ID" column
#   shm.file     tab-separated table with a header row and the columns
#                "Sequence.ID" and "best_match"
#   output.file  path the resulting tab-separated table is written to
#
# The output contains every merged row twice: once with the original
# `best_match` value in the `Sample` column and once with all digits removed
# from it. A constant `Replicate` column (1) is appended.

args <- commandArgs(trailingOnly = TRUE)
if (length(args) < 3) {
  stop(
    "usage: naive_output.r <naive.file> <shm.file> <output.file>",
    call. = FALSE
  )
}

naive.file <- args[1]
shm.file <- args[2]
output.file <- args[3]

naive <- read.table(
  naive.file, sep = "\t", header = TRUE, quote = "", fill = TRUE
)
shm.merge <- read.table(
  shm.file, sep = "\t", header = TRUE, quote = "", fill = TRUE
)

# Fail early with a readable message instead of "undefined columns selected".
if (!"ID" %in% names(naive)) {
  stop("naive file has no 'ID' column: ", naive.file, call. = FALSE)
}
missing.cols <- setdiff(c("Sequence.ID", "best_match"), names(shm.merge))
if (length(missing.cols) > 0) {
  stop(
    "shm file is missing column(s): ", paste(missing.cols, collapse = ", "),
    call. = FALSE
  )
}

# Inner join: only IDs present in both tables are kept.
final <- merge(
  naive,
  shm.merge[, c("Sequence.ID", "best_match")],
  by.x = "ID",
  by.y = "Sequence.ID"
)
print(paste("nrow final:", nrow(final)))
names(final)[names(final) == "best_match"] <- "Sample"

# Replace NA with 0 in every numeric column. The mask is computed once with
# vapply (type-stable), and drop = FALSE keeps a data.frame even when only a
# single column is numeric.
is.num <- vapply(final, is.numeric, logical(1))
if (any(is.num)) {
  final.numeric <- final[, is.num, drop = FALSE]
  final.numeric[is.na(final.numeric)] <- 0
  final[, is.num] <- final.numeric
}
print(paste("nrow final:", nrow(final)))

# Append a copy of all rows whose Sample has its digits stripped.
final2 <- final
final2$Sample <- gsub("[0-9]", "", final2$Sample)
final <- rbind(final, final2)
final$Replicate <- 1

write.table(
  final, output.file,
  quote = FALSE, sep = "\t", row.names = FALSE, col.names = TRUE
)