# HG changeset patch # User davidvanzessen # Date 1421058942 18000 # Node ID 7dbc9ebcefce7fa6f6b59060e3d84786eded5aa9 # Parent 043fd6613fd976c687bb13395ee8397879d794b0 Uploaded diff -r 043fd6613fd9 -r 7dbc9ebcefce RScript.r --- a/RScript.r Mon Jan 12 04:32:40 2015 -0500 +++ b/RScript.r Mon Jan 12 05:35:42 2015 -0500 @@ -50,11 +50,14 @@ inputdata$Top.J.Gene = gsub("[*]([0-9]+)", "", inputdata$Top.J.Gene) inputdata$clonaltype = 1:nrow(inputdata) PRODF = inputdata +UNPROD = inputdata if(filterproductive){ if("Functionality" %in% colnames(inputdata)) { # "Functionality" is an IMGT column PRODF = inputdata[inputdata$Functionality == "productive" | inputdata$Functionality == "productive (see comment)", ] + UNPROD = inputdata[!(inputdata$Functionality == "productive" | inputdata$Functionality == "productive (see comment)"), ] } else { PRODF = inputdata[inputdata$VDJ.Frame != "In-frame with stop codon" & inputdata$VDJ.Frame != "Out-of-frame" & inputdata$CDR3.Found.How != "NOT_FOUND" , ] + UNPROD = inputdata[!(inputdata$VDJ.Frame != "In-frame with stop codon" & inputdata$VDJ.Frame != "Out-of-frame" & inputdata$CDR3.Found.How != "NOT_FOUND" ), ] } } @@ -62,6 +65,8 @@ if(clonaltype != "none"){ PRODF$clonaltype = do.call(paste, c(PRODF[unlist(strsplit(clonaltype, ","))], sep = ":")) PRODF = PRODF[!duplicated(PRODF$clonaltype), ] + UNPROD$clonaltype = do.call(paste, c(UNPROD[unlist(strsplit(clonaltype, ","))], sep = ":")) + UNPROD = UNPROD[!duplicated(UNPROD$clonaltype), ] } PRODF$freq = 1 @@ -576,5 +581,31 @@ mean(P3D.nt.nb, na.rm=T) + mean(P5J.nt.nb, na.rm=T))), by=c("Sample")]) - write.table(newData, "junctionAnalysis.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) + write.table(newData, "junctionAnalysisProd.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) + + newData = data.frame(data.table(UNPROD)[,list(unique=.N, + VH.DEL=mean(X3V.REGION.trimmed.nt.nb, na.rm=T), + P1=mean(P3V.nt.nb, na.rm=T), + N1=mean(N1.REGION.nt.nb, na.rm=T), + P2=mean(P5D.nt.nb, na.rm=T), + DEL.DH=mean(X5D.REGION.trimmed.nt.nb, na.rm=T), + DH.DEL=mean(X3D.REGION.trimmed.nt.nb, na.rm=T), + P3=mean(P3D.nt.nb, na.rm=T), + N2=mean(N2.REGION.nt.nb, na.rm=T), + P4=mean(P5J.nt.nb, na.rm=T), + DEL.JH=mean(X5J.REGION.trimmed.nt.nb, na.rm=T), + Total.Del=( mean(X3V.REGION.trimmed.nt.nb, na.rm=T) + + mean(X5D.REGION.trimmed.nt.nb, na.rm=T) + + mean(X3D.REGION.trimmed.nt.nb, na.rm=T) + + mean(X5J.REGION.trimmed.nt.nb, na.rm=T)), + + Total.N=( mean(N1.REGION.nt.nb, na.rm=T) + + mean(N2.REGION.nt.nb, na.rm=T)), + + Total.P=( mean(P3V.nt.nb, na.rm=T) + + mean(P5D.nt.nb, na.rm=T) + + mean(P3D.nt.nb, na.rm=T) + + mean(P5J.nt.nb, na.rm=T))), + by=c("Sample")]) + write.table(newData, "junctionAnalysisUnProd.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) } diff -r 043fd6613fd9 -r 7dbc9ebcefce r_wrapper.sh --- a/r_wrapper.sh Mon Jan 12 04:32:40 2015 -0500 +++ b/r_wrapper.sh Mon Jan 12 05:35:42 2015 -0500 @@ -112,12 +112,22 @@ hasJunctionData="$(if head -n 1 $inputFile | grep -q '3V-REGION trimmed-nt nb'; then echo 'Yes'; else echo 'No'; fi)" if [[ "$hasJunctionData" == "Yes" ]] ; then - echo "
" >> $outputFile + echo "
" >> $outputFile + echo "
SamplecountVH.DELP1N1P2DEL.DHDH.DELP3N2P4DEL.JHTotal.DelTotal.NTotal.P
" >> $outputFile while IFS=, read Sample unique VHDEL P1 N1 P2 DELDH DHDEL P3 N2 P4 DELJH TotalDel TotalN TotalP do echo "" >> $outputFile - done < $outputDir/junctionAnalysis.csv - echo "
Productive
SamplecountVH.DELP1N1P2DEL.DHDH.DELP3N2P4DEL.JHTotal.DelTotal.NTotal.P
$Sample$unique$VHDEL$P1$N1$P2$DELDH$DHDEL$P3$N2$P4$DELJH$TotalDel$TotalN$TotalP
" >> $outputFile + done < $outputDir/junctionAnalysisProd.csv + echo "" >> $outputFile + + echo "" >> $outputFile + while IFS=, read Sample unique VHDEL P1 N1 P2 DELDH DHDEL P3 N2 P4 DELJH TotalDel TotalN TotalP + do + echo "" >> $outputFile + done < $outputDir/junctionAnalysisUnProd.csv + echo "
Unproductive
SamplecountVH.DELP1N1P2DEL.DHDH.DELP3N2P4DEL.JHTotal.DelTotal.NTotal.P
$Sample$unique$VHDEL$P1$N1$P2$DELDH$DHDEL$P3$N2$P4$DELJH$TotalDel$TotalN$TotalP
" >> $outputFile + + echo "" >> $outputFile fi echo "
" >> $outputFile
IDInclude