Mercurial > repos > qfabrepo > metadegalaxy_phyloseq_deseq2
diff phyloseq_2_deseq2.r @ 0:1f0569e94be4 draft
"planemo upload for repository https://github.com/QFAB-Bioinformatics/metaDEGalaxy/tree/master/phyloseq_2_deseq2 commit 8bd68662b72404f6291e9628327dcb109b5fa55e"
author | qfabrepo |
---|---|
date | Mon, 14 Sep 2020 08:20:41 +0000 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/phyloseq_2_deseq2.r Mon Sep 14 08:20:41 2020 +0000 @@ -0,0 +1,86 @@ +library('getopt') +suppressPackageStartupMessages(library('phyloseq')) +suppressPackageStartupMessages(library('DESeq2')) + +options(warn= -1) + +option_specification = matrix(c( + 'biomfile','b',2,'character', + 'metafile','m',2,'character', + 'factor','f',2,'numeric', + 'test','t',2,'character', + 'fitType','T',2,'character', + 'cutoff','c','2','double', + 'outdir','o',2,'character', + 'result','r',2,'character', + 'normalisedResult','n','2','character' +),byrow=TRUE,ncol=4); + + +options <- getopt(option_specification); +options(bitmapType="cairo") + + +if (!is.null(options$outdir)) { + # Create the directory + dir.create(options$outdir,FALSE) +} + + +galaxy_biom <- import_biom(options$biomfile) +galaxy_map <- import_qiime_sample_data(options$metafile) +tax_col_norm <- c("Kingdom","Phylum","Class","Order","Family","Genus","Species") +tax_col_extra <- c("None","Kingdom","Phylum","Class","Order","Family","Genus","Species") + +number.of.tax.rank<-length(colnames(tax_table(galaxy_biom))) + +if( number.of.tax.rank == 7){ +colnames(tax_table(galaxy_biom)) <- tax_col_norm +}else{ +colnames(tax_table(galaxy_biom)) <- tax_col_extra +} + + +AIP_galaxy <- merge_phyloseq(galaxy_biom,galaxy_map) + + +Infactor<-colnames(galaxy_map)[options$factor] +method<-options$test +Type<-options$fitType +cutoff<-options$cutoff + + + +suppressMessages(deseq2_obj<-phyloseq_to_deseq2(AIP_galaxy,as.formula(paste('~',Infactor,sep="")))) +gm_mean = function(x, na.rm=TRUE){ + exp(sum(log(x[x > 0]), na.rm=na.rm) / length(x)) +} +geoMeans = apply(counts(deseq2_obj), 1, gm_mean) +deseq2_obj = estimateSizeFactors(deseq2_obj, geoMeans = geoMeans) + + + +### Normalisation +deseq2_obj_norm<-counts(deseq2_obj,normalized=T) +deseq2_obj_norm.out<-as.data.frame(cbind("OTUID"=rownames(deseq2_obj_norm),deseq2_obj_norm)) +write.table(deseq2_obj_norm.out,file=options$normalisedResult,col.names=T,row.names=F,quote=F,sep="\t") + + +### Normalisation and DE analysis +suppressMessages(deseq2_obj_DE<-DESeq(deseq2_obj,test=method,fitType=Type)) +res = results(deseq2_obj_DE,cooksCutoff = FALSE) + +significant.table <-res[which(res$padj < cutoff),] + +if(nrow(significant.table) == 0){ + out_message <-"no significant result found!" + write(out_message,file=options$result,sep="\t") + quit("yes") +} + +significant.table <- cbind(as(significant.table,"data.frame"), as(tax_table(AIP_galaxy)[rownames(significant.table),],"matrix")) + +significant.table.out<-as.data.frame(cbind("OTUID"=rownames(significant.table),significant.table)) + +write.table(format(significant.table.out, digits=4, scientific=F),file=options$result,col.names=T,row.names=F,quote=F,sep="\t") +