Mercurial > repos > davidvanzessen > argalaxy_tools
comparison report_clonality/RScript.r @ 55:67627d77d63b draft
Uploaded
author | davidvanzessen |
---|---|
date | Wed, 16 Mar 2016 11:17:49 -0400 |
parents | 5ba0377b7737 |
children |
comparison
equal
deleted
inserted
replaced
54:5ba0377b7737 | 55:67627d77d63b |
---|---|
644 print(names(PRODF)) | 644 print(names(PRODF)) |
645 print(head(PRODF$N.REGION.nt.nb, 30)) | 645 print(head(PRODF$N.REGION.nt.nb, 30)) |
646 PRODF$N1.REGION.nt.nb = PRODF$N.REGION.nt.nb | 646 PRODF$N1.REGION.nt.nb = PRODF$N.REGION.nt.nb |
647 } | 647 } |
648 | 648 |
649 num_median = function(x, na.rm) { as.numeric(median(x, na.rm=na.rm)) } | |
650 | |
649 newData = data.frame(data.table(PRODF)[,list(unique=.N, | 651 newData = data.frame(data.table(PRODF)[,list(unique=.N, |
650 VH.DEL=mean(.SD$X3V.REGION.trimmed.nt.nb, na.rm=T), | 652 VH.DEL=mean(.SD$X3V.REGION.trimmed.nt.nb, na.rm=T), |
651 P1=mean(.SD$P3V.nt.nb, na.rm=T), | 653 P1=mean(.SD$P3V.nt.nb, na.rm=T), |
652 N1=mean(.SD$N1.REGION.nt.nb, na.rm=T), | 654 N1=mean(.SD$N1.REGION.nt.nb, na.rm=T), |
653 P2=mean(.SD$P5D.nt.nb, na.rm=T), | 655 P2=mean(.SD$P5D.nt.nb, na.rm=T), |
669 mean(.SD$P5D.nt.nb, na.rm=T) + | 671 mean(.SD$P5D.nt.nb, na.rm=T) + |
670 mean(.SD$P3D.nt.nb, na.rm=T) + | 672 mean(.SD$P3D.nt.nb, na.rm=T) + |
671 mean(.SD$P5J.nt.nb, na.rm=T))), | 673 mean(.SD$P5J.nt.nb, na.rm=T))), |
672 by=c("Sample")]) | 674 by=c("Sample")]) |
673 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) | 675 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) |
674 write.table(newData, "junctionAnalysisProd.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) | 676 write.table(newData, "junctionAnalysisProd_mean.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) |
677 | |
678 newData = data.frame(data.table(PRODF)[,list(unique=.N, | |
679 VH.DEL=num_median(.SD$X3V.REGION.trimmed.nt.nb, na.rm=T), | |
680 P1=num_median(.SD$P3V.nt.nb, na.rm=T), | |
681 N1=num_median(.SD$N1.REGION.nt.nb, na.rm=T), | |
682 P2=num_median(.SD$P5D.nt.nb, na.rm=T), | |
683 DEL.DH=num_median(.SD$X5D.REGION.trimmed.nt.nb, na.rm=T), | |
684 DH.DEL=num_median(.SD$X3D.REGION.trimmed.nt.nb, na.rm=T), | |
685 P3=num_median(.SD$P3D.nt.nb, na.rm=T), | |
686 N2=num_median(.SD$N2.REGION.nt.nb, na.rm=T), | |
687 P4=num_median(.SD$P5J.nt.nb, na.rm=T), | |
688 DEL.JH=num_median(.SD$X5J.REGION.trimmed.nt.nb, na.rm=T), | |
689 Total.Del=num_median(c(.SD$X3V.REGION.trimmed.nt.nb, | |
690 .SD$X5D.REGION.trimmed.nt.nb, | |
691 .SD$X3D.REGION.trimmed.nt.nb, | |
692 .SD$X5J.REGION.trimmed.nt.nb), na.rm=T), | |
693 Total.N=num_median( c(.SD$N1.REGION.nt.nb, | |
694 .SD$N2.REGION.nt.nb), na.rm=T), | |
695 Total.P=num_median(c(.SD$P3V.nt.nb, | |
696 .SD$P5D.nt.nb, | |
697 .SD$P3D.nt.nb, | |
698 .SD$P5J.nt.nb), na.rm=T)), | |
699 by=c("Sample")]) | |
700 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) | |
701 write.table(newData, "junctionAnalysisProd_median.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) | |
675 | 702 |
676 newData = data.frame(data.table(UNPROD)[,list(unique=.N, | 703 newData = data.frame(data.table(UNPROD)[,list(unique=.N, |
677 VH.DEL=mean(.SD$X3V.REGION.trimmed.nt.nb, na.rm=T), | 704 VH.DEL=mean(.SD$X3V.REGION.trimmed.nt.nb, na.rm=T), |
678 P1=mean(.SD$P3V.nt.nb, na.rm=T), | 705 P1=mean(.SD$P3V.nt.nb, na.rm=T), |
679 N1=mean(.SD$N1.REGION.nt.nb, na.rm=T), | 706 N1=mean(.SD$N1.REGION.nt.nb, na.rm=T), |
694 mean(.SD$P5D.nt.nb, na.rm=T) + | 721 mean(.SD$P5D.nt.nb, na.rm=T) + |
695 mean(.SD$P3D.nt.nb, na.rm=T) + | 722 mean(.SD$P3D.nt.nb, na.rm=T) + |
696 mean(.SD$P5J.nt.nb, na.rm=T))), | 723 mean(.SD$P5J.nt.nb, na.rm=T))), |
697 by=c("Sample")]) | 724 by=c("Sample")]) |
698 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) | 725 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) |
699 write.table(newData, "junctionAnalysisUnProd.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) | 726 write.table(newData, "junctionAnalysisUnProd_mean.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) |
727 | |
728 newData = data.frame(data.table(UNPROD)[,list(unique=.N, | |
729 VH.DEL=num_median(.SD$X3V.REGION.trimmed.nt.nb, na.rm=T), | |
730 P1=num_median(.SD$P3V.nt.nb, na.rm=T), | |
731 N1=num_median(.SD$N1.REGION.nt.nb, na.rm=T), | |
732 P2=num_median(.SD$P5D.nt.nb, na.rm=T), | |
733 DEL.DH=num_median(.SD$X5D.REGION.trimmed.nt.nb, na.rm=T), | |
734 DH.DEL=num_median(.SD$X3D.REGION.trimmed.nt.nb, na.rm=T), | |
735 P3=num_median(.SD$P3D.nt.nb, na.rm=T), | |
736 N2=num_median(.SD$N2.REGION.nt.nb, na.rm=T), | |
737 P4=num_median(.SD$P5J.nt.nb, na.rm=T), | |
738 DEL.JH=num_median(.SD$X5J.REGION.trimmed.nt.nb, na.rm=T), | |
739 Total.Del=num_median(c(.SD$X3V.REGION.trimmed.nt.nb, | |
740 .SD$X5D.REGION.trimmed.nt.nb, | |
741 .SD$X3D.REGION.trimmed.nt.nb, | |
742 .SD$X5J.REGION.trimmed.nt.nb), na.rm=T), | |
743 Total.N=num_median( c(.SD$N1.REGION.nt.nb, | |
744 .SD$N2.REGION.nt.nb), na.rm=T), | |
745 Total.P=num_median(c(.SD$P3V.nt.nb, | |
746 .SD$P5D.nt.nb, | |
747 .SD$P3D.nt.nb, | |
748 .SD$P5J.nt.nb), na.rm=T)), | |
749 by=c("Sample")]) | |
750 | |
751 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) | |
752 write.table(newData, "junctionAnalysisUnProd_median.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) | |
700 } | 753 } |
701 | 754 |
702 # ---------------------- AA composition in CDR3 ---------------------- | 755 # ---------------------- AA composition in CDR3 ---------------------- |
703 | 756 |
704 AACDR3 = PRODF[,c("Sample", "CDR3.Seq")] | 757 AACDR3 = PRODF[,c("Sample", "CDR3.Seq")] |