Mercurial > repos > davidvanzessen > argalaxy_tools
comparison report_clonality/RScript.r @ 3:beaa487ecf43 draft
Uploaded
| author | davidvanzessen |
|---|---|
| date | Wed, 07 Dec 2016 08:36:23 -0500 |
| parents | 90a05ff900db |
| children |
comparison
equal
deleted
inserted
replaced
| 2:4f8a1d121384 | 3:beaa487ecf43 |
|---|---|
| 8 install.packages("ggplot2", repos="http://cran.xl-mirror.nl/") | 8 install.packages("ggplot2", repos="http://cran.xl-mirror.nl/") |
| 9 } | 9 } |
| 10 library(ggplot2) | 10 library(ggplot2) |
| 11 if (!("plyr" %in% rownames(installed.packages()))) { | 11 if (!("plyr" %in% rownames(installed.packages()))) { |
| 12 install.packages("plyr", repos="http://cran.xl-mirror.nl/") | 12 install.packages("plyr", repos="http://cran.xl-mirror.nl/") |
| 13 } | 13 } |
| 14 library(plyr) | 14 library(plyr) |
| 15 | 15 |
| 16 if (!("data.table" %in% rownames(installed.packages()))) { | 16 if (!("data.table" %in% rownames(installed.packages()))) { |
| 17 install.packages("data.table", repos="http://cran.xl-mirror.nl/") | 17 install.packages("data.table", repos="http://cran.xl-mirror.nl/") |
| 18 } | 18 } |
| 715 N2=mean(rowSums(.SD[,c("N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), | 715 N2=mean(rowSums(.SD[,c("N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), |
| 716 P4=mean(.SD$P5J.nt.nb, na.rm=T), | 716 P4=mean(.SD$P5J.nt.nb, na.rm=T), |
| 717 DEL.JH=mean(.SD$X5J.REGION.trimmed.nt.nb, na.rm=T), | 717 DEL.JH=mean(.SD$X5J.REGION.trimmed.nt.nb, na.rm=T), |
| 718 Total.Del=mean(rowSums(.SD[,c("X3V.REGION.trimmed.nt.nb", "X5D.REGION.trimmed.nt.nb", "X3D.REGION.trimmed.nt.nb", "X5J.REGION.trimmed.nt.nb"), with=F], na.rm=T)), | 718 Total.Del=mean(rowSums(.SD[,c("X3V.REGION.trimmed.nt.nb", "X5D.REGION.trimmed.nt.nb", "X3D.REGION.trimmed.nt.nb", "X5J.REGION.trimmed.nt.nb"), with=F], na.rm=T)), |
| 719 Total.N=mean(rowSums(.SD[,c("N.REGION.nt.nb", "N1.REGION.nt.nb", "N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), | 719 Total.N=mean(rowSums(.SD[,c("N.REGION.nt.nb", "N1.REGION.nt.nb", "N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), |
| 720 Total.P=mean(rowSums(.SD[,c("P3V.nt.nb", "P5D.nt.nb", "P3D.nt.nb", "P5J.nt.nb"), with=F], na.rm=T))), | 720 Total.P=mean(rowSums(.SD[,c("P3V.nt.nb", "P5D.nt.nb", "P3D.nt.nb", "P5J.nt.nb"), with=F], na.rm=T)), |
| | 721 Median.CDR3.l=median(.SD$CDR3.Length.DNA)), |
| 721 by=c("Sample")]) | 722 by=c("Sample")]) |
| 722 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) | 723 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) |
| 723 write.table(newData, "junctionAnalysisProd_mean.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) | 724 write.table(newData, "junctionAnalysisProd_mean.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) |
| 724 | 725 |
| 725 newData = data.frame(data.table(PRODF)[,list(unique=.N, | 726 newData = data.frame(data.table(PRODF)[,list(unique=.N, |
| 733 N2=num_median(rowSums(.SD[,c("N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), | 734 N2=num_median(rowSums(.SD[,c("N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), |
| 734 P4=num_median(.SD$P5J.nt.nb, na.rm=T), | 735 P4=num_median(.SD$P5J.nt.nb, na.rm=T), |
| 735 DEL.JH=num_median(.SD$X5J.REGION.trimmed.nt.nb, na.rm=T), | 736 DEL.JH=num_median(.SD$X5J.REGION.trimmed.nt.nb, na.rm=T), |
| 736 Total.Del=num_median(rowSums(.SD[,c("X3V.REGION.trimmed.nt.nb", "X5D.REGION.trimmed.nt.nb", "X3D.REGION.trimmed.nt.nb", "X5J.REGION.trimmed.nt.nb"), with=F], na.rm=T)), | 737 Total.Del=num_median(rowSums(.SD[,c("X3V.REGION.trimmed.nt.nb", "X5D.REGION.trimmed.nt.nb", "X3D.REGION.trimmed.nt.nb", "X5J.REGION.trimmed.nt.nb"), with=F], na.rm=T)), |
| 737 Total.N=num_median(rowSums(.SD[,c("N.REGION.nt.nb", "N1.REGION.nt.nb", "N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), | 738 Total.N=num_median(rowSums(.SD[,c("N.REGION.nt.nb", "N1.REGION.nt.nb", "N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), |
| 738 Total.P=num_median(rowSums(.SD[,c("P3V.nt.nb", "P5D.nt.nb", "P3D.nt.nb", "P5J.nt.nb"), with=F], na.rm=T))), | 739 Total.P=num_median(rowSums(.SD[,c("P3V.nt.nb", "P5D.nt.nb", "P3D.nt.nb", "P5J.nt.nb"), with=F], na.rm=T)), |
| | 740 Median.CDR3.l=median(.SD$CDR3.Length.DNA)), |
| 739 by=c("Sample")]) | 741 by=c("Sample")]) |
| 740 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) | 742 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) |
| 741 write.table(newData, "junctionAnalysisProd_median.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) | 743 write.table(newData, "junctionAnalysisProd_median.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) |
| 742 | 744 |
| 743 newData = data.frame(data.table(UNPROD)[,list(unique=.N, | 745 newData = data.frame(data.table(UNPROD)[,list(unique=.N, |
| 751 N2=mean(rowSums(.SD[,c("N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), | 753 N2=mean(rowSums(.SD[,c("N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), |
| 752 P4=mean(.SD$P5J.nt.nb, na.rm=T), | 754 P4=mean(.SD$P5J.nt.nb, na.rm=T), |
| 753 DEL.JH=mean(.SD$X5J.REGION.trimmed.nt.nb, na.rm=T), | 755 DEL.JH=mean(.SD$X5J.REGION.trimmed.nt.nb, na.rm=T), |
| 754 Total.Del=mean(rowSums(.SD[,c("X3V.REGION.trimmed.nt.nb", "X5D.REGION.trimmed.nt.nb", "X3D.REGION.trimmed.nt.nb", "X5J.REGION.trimmed.nt.nb"), with=F], na.rm=T)), | 756 Total.Del=mean(rowSums(.SD[,c("X3V.REGION.trimmed.nt.nb", "X5D.REGION.trimmed.nt.nb", "X3D.REGION.trimmed.nt.nb", "X5J.REGION.trimmed.nt.nb"), with=F], na.rm=T)), |
| 755 Total.N=mean(rowSums(.SD[,c("N.REGION.nt.nb", "N1.REGION.nt.nb", "N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), | 757 Total.N=mean(rowSums(.SD[,c("N.REGION.nt.nb", "N1.REGION.nt.nb", "N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), |
| 756 Total.P=mean(rowSums(.SD[,c("P3V.nt.nb", "P5D.nt.nb", "P3D.nt.nb", "P5J.nt.nb"), with=F], na.rm=T))), | 758 Total.P=mean(rowSums(.SD[,c("P3V.nt.nb", "P5D.nt.nb", "P3D.nt.nb", "P5J.nt.nb"), with=F], na.rm=T)), |
| | 759 Median.CDR3.l=median(.SD$CDR3.Length.DNA)), |
| 757 by=c("Sample")]) | 760 by=c("Sample")]) |
| 758 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) | 761 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) |
| 759 write.table(newData, "junctionAnalysisUnProd_mean.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) | 762 write.table(newData, "junctionAnalysisUnProd_mean.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) |
| 760 | 763 |
| 761 newData = data.frame(data.table(UNPROD)[,list(unique=.N, | 764 newData = data.frame(data.table(UNPROD)[,list(unique=.N, |
| 769 N2=num_median(rowSums(.SD[,c("N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), | 772 N2=num_median(rowSums(.SD[,c("N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), |
| 770 P4=num_median(.SD$P5J.nt.nb, na.rm=T), | 773 P4=num_median(.SD$P5J.nt.nb, na.rm=T), |
| 771 DEL.JH=num_median(.SD$X5J.REGION.trimmed.nt.nb, na.rm=T), | 774 DEL.JH=num_median(.SD$X5J.REGION.trimmed.nt.nb, na.rm=T), |
| 772 Total.Del=num_median(rowSums(.SD[,c("X3V.REGION.trimmed.nt.nb", "X5D.REGION.trimmed.nt.nb", "X3D.REGION.trimmed.nt.nb", "X5J.REGION.trimmed.nt.nb"), with=F], na.rm=T)), | 775 Total.Del=num_median(rowSums(.SD[,c("X3V.REGION.trimmed.nt.nb", "X5D.REGION.trimmed.nt.nb", "X3D.REGION.trimmed.nt.nb", "X5J.REGION.trimmed.nt.nb"), with=F], na.rm=T)), |
| 773 Total.N=num_median(rowSums(.SD[,c("N.REGION.nt.nb", "N1.REGION.nt.nb", "N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), | 776 Total.N=num_median(rowSums(.SD[,c("N.REGION.nt.nb", "N1.REGION.nt.nb", "N2.REGION.nt.nb", "N3.REGION.nt.nb", "N4.REGION.nt.nb"), with=F], na.rm=T)), |
| 774 Total.P=num_median(rowSums(.SD[,c("P3V.nt.nb", "P5D.nt.nb", "P3D.nt.nb", "P5J.nt.nb"), with=F], na.rm=T))), | 777 Total.P=num_median(rowSums(.SD[,c("P3V.nt.nb", "P5D.nt.nb", "P3D.nt.nb", "P5J.nt.nb"), with=F], na.rm=T)), |
| | 778 Median.CDR3.l=median(.SD$CDR3.Length.DNA)), |
| 775 by=c("Sample")]) | 779 by=c("Sample")]) |
| 776 | 780 |
| 777 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) | 781 newData[,sapply(newData, is.numeric)] = round(newData[,sapply(newData, is.numeric)],1) |
| 778 write.table(newData, "junctionAnalysisUnProd_median.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) | 782 write.table(newData, "junctionAnalysisUnProd_median.csv" , sep=",",quote=F,na="-",row.names=F,col.names=F) |
| 779 } | 783 } |
