Mercurial > repos > workflow4metabolomics > mixmodel4repeated_measures
view mixmodel_wrapper.R @ 0:a4d89d47646f draft default tip
planemo upload for repository https://github.com/workflow4metabolomics/tools-metabolomics commit 8d2ca678d973501b60479a8dc3f212eecd56eab8
author | workflow4metabolomics |
---|---|
date | Mon, 16 May 2022 09:25:01 +0000 |
parents | |
children |
line wrap: on
line source
#!/usr/bin/env Rscript library(lme4) ## mixed model computing library(Matrix) library(MASS) library(lmerTest) ## computing pvalue and lsmeans from results of lme4 package library(multtest) ## multiple testing library(ggplot2) library(gridExtra) library(grid) source_local <- function(fname) { argv <- commandArgs(trailingOnly = FALSE) base_dir <- dirname(substring(argv[grep("--file=", argv)], 8)) source(paste(base_dir, fname, sep = "/")) } source_local("mixmodel_script.R") source_local("diagmfl.R") parse_args <- function() { args <- commandArgs() start <- which(args == "--args")[1] + 1 if (is.na(start)) { return(list()) } seq_by2 <- seq(start, length(args), by = 2) result <- as.list(args[seq_by2 + 1]) names(result) <- args[seq_by2] return(result) } argVc <- unlist(parse_args()) ##------------------------------ ## Initializing ##------------------------------ ## options ##-------- strAsFacL <- options()$stringsAsFactors options(stringsAsFactors = FALSE) ## constants ##---------- modNamC <- "mixmodel" ## module name topEnvC <- environment() flagC <- "\n" ## functions ##---------- flgF <- function(tesC, envC = topEnvC, txtC = NA) { ## management of warning and error messages tesL <- eval(parse(text = tesC), envir = envC) if (!tesL) { sink(NULL) stpTxtC <- ifelse(is.na(txtC), paste0(tesC, " is FALSE"), txtC) stop(stpTxtC, call. = FALSE) } } ## flgF ## log file ##--------- sink(argVc["information"]) cat("\nStart of the '", modNamC, "' Galaxy module call: ", format(Sys.time(), "%a %d %b %Y %X"), "\n", sep = "") cat("\nParameters used:\n\n") print(argVc) cat("\n\n") ## loading ##-------- datMN <- t(as.matrix(read.table(argVc["dataMatrix_in"], check.names = FALSE, header = TRUE, row.names = 1, sep = "\t"))) samDF <- read.table(argVc["sampleMetadata_in"], check.names = FALSE, header = TRUE, row.names = 1, sep = "\t") varDF <- read.table(argVc["variableMetadata_in"], check.names = FALSE, header = TRUE, row.names = 1, sep = "\t") ## checking ##--------- flgF("identical(rownames(datMN), rownames(samDF))", txtC = "Column names of the dataMatrix are not identical to the row names of the sampleMetadata; check your data with the 'Check Format' module in the 'Quality Control' section") flgF("identical(colnames(datMN), rownames(varDF))", txtC = "Row names of the dataMatrix are not identical to the row names of the variableMetadata; check your data with the 'Check Format' module in the 'Quality Control' section") flgF("argVc['time'] %in% colnames(samDF)", txtC = paste0("Required time factor '", argVc["time"], "' could not be found in the column names of the sampleMetadata")) flgF("argVc['subject'] %in% colnames(samDF)", txtC = paste0("Required subject factor '", argVc["subject"], "' could not be found in the column names of the sampleMetadata")) flgF("mode(samDF[, argVc['time']]) %in% c('character', 'numeric')", txtC = paste0("The '", argVc["time"], "' column of the sampleMetadata should contain either number only, or character only")) flgF("mode(samDF[, argVc['subject']]) %in% c('character', 'numeric')", txtC = paste0("The '", argVc["subject"], "' column of the sampleMetadata should contain either number only, or character only")) flgF("argVc['adjC'] %in% c('holm', 'hochberg', 'hommel', 'bonferroni', 'BH', 'BY', 'fdr', 'none')") flgF("argVc['trf'] %in% c('none', 'log10', 'log2')") flgF("0 <= as.numeric(argVc['thrN']) && as.numeric(argVc['thrN']) <= 1", txtC = "(corrected) p-value threshold must be between 0 and 1") flgF("argVc['diaR'] %in% c('no', 'yes')") ##------------------------------ ## Formating ##------------------------------ if (argVc["dff"] == "Satt") { dffmeth <- "Satterthwaite" } else { dffmeth <- "Kenward-Roger" } ##------------------------------ ## Computation ##------------------------------ varDFout <- lmixedm(datMN = datMN, samDF = samDF, varDF = varDF, fixfact = argVc["fixfact"], time = argVc["time"], subject = argVc["subject"], logtr = argVc["trf"], pvalCutof = argVc["thrN"], pvalcorMeth = argVc["adjC"], dffOption = dffmeth, visu = argVc["diaR"], least.confounded = FALSE, outlier.limit = 3, pdfC = argVc["out_graph_pdf"], pdfE = argVc["out_estim_pdf"] ) ##------------------------------ ## Rounding ##------------------------------ if (argVc["rounding"] == "yes") { varDFout[, which(!(colnames(varDFout) %in% colnames(varDF)))] <- apply(varDFout[, which(!(colnames(varDFout) %in% colnames(varDF)))], 2, round, digits = as.numeric(argVc["decplaces"])) } ##------------------------------ ## Ending ##------------------------------ ## saving ##-------- varDFout <- cbind.data.frame(variableMetadata = rownames(varDFout), varDFout) write.table(varDFout, file = argVc["variableMetadata_out"], quote = FALSE, row.names = FALSE, sep = "\t") ## closing ##-------- cat("\n\nEnd of '", modNamC, "' Galaxy module call: ", as.character(Sys.time()), "\n", sep = "") cat("\nInformation about R (version, Operating System, attached or loaded packages):\n\n") sessionInfo() sink() options(stringsAsFactors = strAsFacL) rm(list = ls())