Galaxy |

Changeset 3:f439ed7a8f03 (2018-09-18)

Previous changeset 2:3a5204f14fff (2018-02-13) Next changeset 4:4c25647cd4df (2018-09-19)

Commit message:
planemo upload for repository https://github.com/workflow4metabolomics/xcms commit 9f72e947d9c241d11221cad561f3525d27231857

modified:
README.rst
macros.xml
static/images/xcms_merge_workflow.png
test-data/ko15-xset.RData
test-data/ko16-xset.RData
test-data/wt15-xset.RData
test-data/wt16-xset.RData
xcms_merge.xml

added:
lib-xcms3.x.x.r
lib.r
macros_xcms.xml
test-data/ko15.CDF
test-data/ko16.CDF
test-data/noclass.merged.sampleMetadata.tsv
test-data/wt15.CDF
test-data/wt16.CDF
xcms_merge.r

removed:
test-data/MM14-xset.RData
test-data/MM8-xset.RData

diff -r 3a5204f14fff -r f439ed7a8f03 README.rst
--- a/README.rst Tue Feb 13 04:48:41 2018 -0500
+++ b/README.rst Tue Sep 18 16:09:25 2018 -0400

@@ -2,6 +2,14 @@
Changelog/News
--------------

+**Version 3.0.0.0 - 08/03/2018**
+
+- UPGRADE: upgrade the xcms version from 1.46.0 to 3.0.0. So refactoring of a lot of underlining codes and methods
+
+- IMPROVMENT: a new dedicated tool "xcms plot chromatogram" will allow you to get TIC and BPI of your raw data.
+
+- IMPROVMENT: the tool will now generate a sampleMetadata file if any was provided. It will be useful to add some further information for the normalization and statistics steps.
+
**Version 1.0.1 - 13/02/2017**

- IMPROVMENT: the tool will now raise an error if a sample isn't describe in the sampleMetadata file
@@ -10,4 +18,3 @@
**Version 1.0.0 - 03/02/2017**

- NEW: a new tool to merge individual xcmsSet outputs to be used by xcms.group
-

diff -r 3a5204f14fff -r f439ed7a8f03 lib-xcms3.x.x.r
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/lib-xcms3.x.x.r Tue Sep 18 16:09:25 2018 -0400

[

@@ -0,0 +1,152 @@
+
+
+#@TODO: remove this function as soon as we can use xcms 3.x.x from Bioconductor 3.7
+# https://github.com/sneumann/xcms/issues/250
+groupnamesW4M <- function(xdata, mzdec = 0, rtdec = 0) {
+    mzfmt <- paste("%.", mzdec, "f", sep = "")
+    rtfmt <- paste("%.", rtdec, "f", sep = "")
+
+    gnames <- paste("M", sprintf(mzfmt, featureDefinitions(xdata)[,"mzmed"]), "T",
+                    sprintf(rtfmt, featureDefinitions(xdata)[,"rtmed"]), sep = "")
+
+    if (any(dup <- duplicated(gnames)))
+        for (dupname in unique(gnames[dup])) {
+            dupidx <- which(gnames == dupname)
+            gnames[dupidx] <- paste(gnames[dupidx], seq(along = dupidx), sep = "_")
+        }
+
+    return (gnames)
+}
+
+#@TODO: remove this function as soon as we can use xcms 3.x.x from Bioconductor 3.7
+# https://github.com/sneumann/xcms/issues/247
+.concatenate_XCMSnExp <- function(...) {
+    x <- list(...)
+    if (length(x) == 0)
+        return(NULL)
+    if (length(x) == 1)
+        return(x[[1]])
+    ## Check that all are XCMSnExp objects.
+    if (!all(unlist(lapply(x, function(z) is(z, "XCMSnExp")))))
+        stop("All passed objects should be 'XCMSnExp' objects")
+    new_x <- as(.concatenate_OnDiskMSnExp(...), "XCMSnExp")
+    ## If any of the XCMSnExp has alignment results or detected features drop
+    ## them!
+    x <- lapply(x, function(z) {
+        if (hasAdjustedRtime(z)) {
+            z <- dropAdjustedRtime(z)
+            warning("Adjusted retention times found, had to drop them.")
+        }
+        if (hasFeatures(z)) {
+            z <- dropFeatureDefinitions(z)
+            warning("Feature definitions found, had to drop them.")
+        }
+        z
+    })
+    ## Combine peaks
+    fls <- lapply(x, fileNames)
+    startidx <- cumsum(lengths(fls))
+    pks <- lapply(x, chromPeaks)
+    procH <- lapply(x, processHistory)
+    for (i in 2:length(fls)) {
+        pks[[i]][, "sample"] <- pks[[i]][, "sample"] + startidx[i - 1]
+        procH[[i]] <- lapply(procH[[i]], function(z) {
+            z@fileIndex <- as.integer(z@fileIndex + startidx[i - 1])
+            z
+            })
+    }
+    pks <- do.call(rbind, pks)
+    new_x@.processHistory <- unlist(procH)
+    chromPeaks(new_x) <- pks
+    if (validObject(new_x))
+        new_x
+}
+
+#@TODO: remove this function as soon as we can use xcms 3.x.x from Bioconductor 3.7
+# https://github.com/sneumann/xcms/issues/247
+.concatenate_OnDiskMSnExp <- function(...) {
+    x <- list(...)
+    if (length(x) == 0)
+        return(NULL)
+    if (length(x) == 1)
+        return(x[[1]])
+    ## Check that all are XCMSnExp objects.
+    if (!all(unlist(lapply(x, function(z) is(z, "OnDiskMSnExp")))))
+        stop("All passed objects should be 'OnDiskMSnExp' objects")
+    ## Check processingQueue
+    procQ <- lapply(x, function(z) z@spectraProcessingQueue)
+    new_procQ <- procQ[[1]]
+    is_ok <- unlist(lapply(procQ, function(z)
+        !is.character(all.equal(new_procQ, z))
+        ))
+    if (any(!is_ok)) {
+        warning("Processing queues from the submitted objects differ! ",
+                "Dropping the processing queue.")
+        new_procQ <- list()
+    }
+    ## processingData
+    fls <- lapply(x, function(z) z@processingData@files)
+    startidx <- cumsum(lengths(fls))
+    ## featureData
+    featd <- lapply(x, fData)
+    ## Have to update the file index and the spectrum names.
+    for (i in 2:length(featd)) {
+        featd[[i]]$fileIdx <- featd[[i]]$fileIdx + startidx[i - 1]
+        rownames(featd[[i]]) <- MSnbase:::formatFileSpectrumNames(
+                                              fileIds = featd[[i]]$fileIdx,
+                                              spectrumIds = featd[[i]]$spIdx,
+                                              nSpectra = nrow(featd[[i]]),
+                                              nFiles = length(unlist(fls))
+                                          )
+    }
+    featd <- do.call(rbind, featd)
+    featd$spectrum <- 1:nrow(featd)
+    ## experimentData
+    expdata <- lapply(x, function(z) {
+        ed <- z@experimentData
+        data.frame(instrumentManufacturer = ed@instrumentManufacturer,
+                   instrumentModel = ed@instrumentModel,
+                   ionSource = ed@ionSource,
+                   analyser = ed@analyser,
+                   detectorType = ed@detectorType,
+                   stringsAsFactors = FALSE)
+    })
+    expdata <- do.call(rbind, expdata)
+    expdata <- new("MIAPE",
+                   instrumentManufacturer = expdata$instrumentManufacturer,
+                   instrumentModel = expdata$instrumentModel,
+                   ionSource = expdata$ionSource,
+                   analyser = expdata$analyser,
+                   detectorType = expdata$detectorType)
+
+    ## protocolData
+    protodata <- lapply(x, function(z) z@protocolData)
+    if (any(unlist(lapply(protodata, nrow)) > 0))
+        warning("Found non-empty protocol data, but merging protocol data is",
+                " currently not supported. Skipped.")
+    ## phenoData
+    pdata <- do.call(rbind, lapply(x, pData))
+    res <- new(
+        "OnDiskMSnExp",
+        phenoData = new("NAnnotatedDataFrame", data = pdata),
+        featureData = new("AnnotatedDataFrame", featd),
+        processingData = new("MSnProcess",
+                             processing = paste0("Concatenated [", date(), "]"),
+                             files = unlist(fls), smoothed = NA),
+        experimentData = expdata,
+        spectraProcessingQueue = new_procQ)
+    if (validObject(res))
+        res
+}
+
+#@TODO: remove this function as soon as we can use xcms 3.x.x from Bioconductor 3.7
+# https://github.com/sneumann/xcms/issues/247
+c.XCMSnExp <- function(...) {
+    .concatenate_XCMSnExp(...)
+}
+
+#@TODO: remove this function as soon as we can use xcms 3.x.x from Bioconductor 3.7
+# https://github.com/sneumann/xcms/issues/247
+c.MSnbase <- function(...) {
+    .concatenate_OnDiskMSnExp(...)
+}

diff -r 3a5204f14fff -r f439ed7a8f03 lib.r
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/lib.r Tue Sep 18 16:09:25 2018 -0400

[

b'@@ -0,0 +1,510 @@\n+#@authors ABiMS TEAM, Y. Guitton\n+# lib.r for Galaxy Workflow4Metabolomics xcms tools\n+\n+#@author G. Le Corguille\n+# solve an issue with batch if arguments are logical TRUE/FALSE\n+parseCommandArgs <- function(...) {\n+ args <- batch::parseCommandArgs(...)\n+ for (key in names(args)) {\n+ if (args[key] %in% c("TRUE","FALSE"))\n+ args[key] = as.logical(args[key])\n+ }\n+ return(args)\n+}\n+\n+#@author G. Le Corguille\n+# This function will\n+# - load the packages\n+# - display the sessionInfo\n+loadAndDisplayPackages <- function(pkgs) {\n+ for(pkg in pkgs) suppressPackageStartupMessages( stopifnot( library(pkg, quietly=TRUE, logical.return=TRUE, character.only=TRUE)))\n+\n+ sessioninfo = sessionInfo()\n+ cat(sessioninfo$R.version$version.string,"\\n")\n+ cat("Main packages:\\n")\n+ for (pkg in names(sessioninfo$otherPkgs)) { cat(paste(pkg,packageVersion(pkg)),"\\t") }; cat("\\n")\n+ cat("Other loaded packages:\\n")\n+ for (pkg in names(sessioninfo$loadedOnly)) { cat(paste(pkg,packageVersion(pkg)),"\\t") }; cat("\\n")\n+}\n+\n+#@author G. Le Corguille\n+# This function merge several chromBPI or chromTIC into one.\n+mergeChrom <- function(chrom_merged, chrom) {\n+ if (is.null(chrom_merged)) return(NULL)\n+ chrom_merged@.Data <- cbind(chrom_merged@.Data, chrom@.Data)\n+ return(chrom_merged)\n+}\n+\n+#@author G. Le Corguille\n+# This function merge several xdata into one.\n+mergeXData <- function(args) {\n+ chromTIC <- NULL\n+ chromBPI <- NULL\n+ chromTIC_adjusted <- NULL\n+ chromBPI_adjusted <- NULL\n+ for(image in args$images) {\n+\n+ load(image)\n+ # Handle infiles\n+ if (!exists("singlefile")) singlefile <- NULL\n+ if (!exists("zipfile")) zipfile <- NULL\n+ rawFilePath <- getRawfilePathFromArguments(singlefile, zipfile, args)\n+ zipfile <- rawFilePath$zipfile\n+ singlefile <- rawFilePath$singlefile\n+ retrieveRawfileInTheWorkingDirectory(singlefile, zipfile)\n+\n+ if (exists("raw_data")) xdata <- raw_data\n+ if (!exists("xdata")) stop("\\n\\nERROR: The RData doesn\'t contain any object called \'xdata\'. This RData should have been created by an old version of XMCS 2.*")\n+\n+ cat(sampleNamesList$sampleNamesOrigin,"\\n")\n+\n+ if (!exists("xdata_merged")) {\n+ xdata_merged <- xdata\n+ singlefile_merged <- singlefile\n+ md5sumList_merged <- md5sumList\n+ sampleNamesList_merged <- sampleNamesList\n+ chromTIC_merged <- chromTIC\n+ chromBPI_merged <- chromBPI\n+ chromTIC_adjusted_merged <- chromTIC_adjusted\n+ chromBPI_adjusted_merged <- chromBPI_adjusted\n+ } else {\n+ if (is(xdata, "XCMSnExp")) xdata_merged <- c(xdata_merged,xdata)\n+ else if (is(xdata, "OnDiskMSnExp")) xdata_merged <- .concatenate_OnDiskMSnExp(xdata_merged,xdata)\n+ else stop("\\n\\nERROR: The RData either a OnDiskMSnExp object called raw_data or a XCMSnExp object called xdata")\n+\n+ singlefile_merged <- c(singlefile_merged,singlefile)\n+ md5sumList_merged$origin <- rbind(md5sumList_merged$origin,md5sumList$origin)\n+ sampleNamesList_merged$sampleNamesOrigin <- c(sampleNamesList_merged$sampleNamesOrigin,sampleNamesList$sampleNamesOrigin)\n+ sampleNamesList_merged$sampleNamesMakeNames <- c(sampleNamesList_merged$sampleNamesMakeNames,sampleNamesList$sampleNamesMakeNames)\n+ chromTIC_merged <- mergeChrom(chromTIC_merged, chromTIC)\n+ chromBPI_merged <- mergeChrom(chromBPI_merged, chromBPI)\n+ chromTIC_adjusted_merged <- mergeChrom(chromTIC_adjusted_merged, chromTIC_adjusted)\n+ chromBPI_adjusted_merged <- mergeChrom(chromBPI_adjusted_merged, chromBPI_adjusted)\n+ }\n+ }\n+ rm(image)\n+ xdata <- xdata_merged; rm(xdata_merged)\n+ singlefile <- singlefile_merged; rm(singlefile_merged)\n+ md5sumList <- md5sumList_merged; rm(md5sumList_merged)\n+ sampleNa'..b'(files)))\n+}\n+\n+\n+# This function get the raw file path from the arguments\n+#@author Gildas Le Corguille lecorguille@sb-roscoff.fr\n+getRawfilePathFromArguments <- function(singlefile, zipfile, args, prefix="") {\n+ if (!(prefix %in% c("","Positive","Negative","MS1","MS2"))) stop("prefix must be either \'\', \'Positive\', \'Negative\', \'MS1\' or \'MS2\'")\n+\n+ if (!is.null(args[[paste0("zipfile",prefix)]])) zipfile <- args[[paste0("zipfile",prefix)]]\n+\n+ if (!is.null(args[[paste0("singlefile_galaxyPath",prefix)]])) {\n+ singlefile_galaxyPaths <- args[[paste0("singlefile_galaxyPath",prefix)]]\n+ singlefile_sampleNames <- args[[paste0("singlefile_sampleName",prefix)]]\n+ }\n+ if (exists("singlefile_galaxyPaths")){\n+ singlefile_galaxyPaths <- unlist(strsplit(singlefile_galaxyPaths,"\\\\|"))\n+ singlefile_sampleNames <- unlist(strsplit(singlefile_sampleNames,"\\\\|"))\n+\n+ singlefile <- NULL\n+ for (singlefile_galaxyPath_i in seq(1:length(singlefile_galaxyPaths))) {\n+ singlefile_galaxyPath <- singlefile_galaxyPaths[singlefile_galaxyPath_i]\n+ singlefile_sampleName <- singlefile_sampleNames[singlefile_galaxyPath_i]\n+ # In case, an url is used to import data within Galaxy\n+ singlefile_sampleName <- tail(unlist(strsplit(singlefile_sampleName,"/")), n=1)\n+ singlefile[[singlefile_sampleName]] <- singlefile_galaxyPath\n+ }\n+ }\n+ return(list(zipfile=zipfile, singlefile=singlefile))\n+}\n+\n+# This function retrieve the raw file in the working directory\n+# - if zipfile: unzip the file with its directory tree\n+# - if singlefiles: set symlink with the good filename\n+#@author Gildas Le Corguille lecorguille@sb-roscoff.fr\n+retrieveRawfileInTheWorkingDirectory <- function(singlefile, zipfile) {\n+ if(!is.null(singlefile) && (length("singlefile")>0)) {\n+ for (singlefile_sampleName in names(singlefile)) {\n+ singlefile_galaxyPath <- singlefile[[singlefile_sampleName]]\n+ if(!file.exists(singlefile_galaxyPath)){\n+ error_message <- paste("Cannot access the sample:",singlefile_sampleName,"located:",singlefile_galaxyPath,". Please, contact your administrator ... if you have one!")\n+ print(error_message); stop(error_message)\n+ }\n+\n+ if (!suppressWarnings( try (file.link(singlefile_galaxyPath, singlefile_sampleName), silent=T)))\n+ file.copy(singlefile_galaxyPath, singlefile_sampleName)\n+\n+ }\n+ directory <- "."\n+\n+ }\n+ if(!is.null(zipfile) && (zipfile != "")) {\n+ if(!file.exists(zipfile)){\n+ error_message <- paste("Cannot access the Zip file:",zipfile,". Please, contact your administrator ... if you have one!")\n+ print(error_message)\n+ stop(error_message)\n+ }\n+\n+ #list all file in the zip file\n+ #zip_files <- unzip(zipfile,list=T)[,"Name"]\n+\n+ #unzip\n+ suppressWarnings(unzip(zipfile, unzip="unzip"))\n+\n+ #get the directory name\n+ suppressWarnings(filesInZip <- unzip(zipfile, list=T))\n+ directories <- unique(unlist(lapply(strsplit(filesInZip$Name,"/"), function(x) x[1])))\n+ directories <- directories[!(directories %in% c("__MACOSX")) & file.info(directories)$isdir]\n+ directory <- "."\n+ if (length(directories) == 1) directory <- directories\n+\n+ cat("files_root_directory\\t",directory,"\\n")\n+\n+ }\n+ return (directory)\n+}\n+\n+\n+# This function retrieve a xset like object\n+#@author Gildas Le Corguille lecorguille@sb-roscoff.fr\n+getxcmsSetObject <- function(xobject) {\n+ # XCMS 1.x\n+ if (class(xobject) == "xcmsSet")\n+ return (xobject)\n+ # XCMS 3.x\n+ if (class(xobject) == "XCMSnExp") {\n+ # Get the legacy xcmsSet object\n+ suppressWarnings(xset <- as(xobject, \'xcmsSet\'))\n+ if (!is.null(xset@phenoData$sample_group))\n+ sampclass(xset) <- xset@phenoData$sample_group\n+ else\n+ sampclass(xset) <- "."\n+ return (xset)\n+ }\n+}\n'

diff -r 3a5204f14fff -r f439ed7a8f03 macros.xml
--- a/macros.xml Tue Feb 13 04:48:41 2018 -0500
+++ b/macros.xml Tue Sep 18 16:09:25 2018 -0400

[

@@ -1,141 +1,52 @@
<?xml version="1.0"?>
<macros>
-    <xml name="requirements">
-        <requirements>
-            <requirement type="package" version="0.4_1">r-snow</requirement>
-            <requirement type="package" version="1.46.0">bioconductor-xcms</requirement>
-            <requirement type="package" version="1.1_4">r-batch</requirement>
-        </requirements>
-    </xml>
-    <xml name="requirements_light">
-        <requirements>
-            <requirement type="package" version="1.46.0">bioconductor-xcms</requirement>
-        </requirements>
-    </xml>
     <xml name="stdio">
         <stdio>
             <exit_code range="1" level="fatal" />
         </stdio>
     </xml>

-    <token name="@COMMAND_XCMS_SCRIPT@">
-        LC_ALL=C Rscript $__tool_directory__/xcms.r
-    </token>
+    
+    <token name="@COMMAND_RSCRIPT@">LC_ALL=C Rscript $__tool_directory__/</token>

     <token name="@COMMAND_LOG_EXIT@">
         ;
         return=\$?;
-        mv log.txt '$log';
-        cat '$log';
+        cat 'log.txt';
         sh -c "exit \$return"
     </token>

-    
-
-    <token name="@COMMAND_FILE_LOAD@">
-        #if $file_load_section.file_load_conditional.file_load_select == "yes":
-            #if $file_load_section.file_load_conditional.input[0].is_of_type("mzxml") or $file_load_section.file_load_conditional.input[0].is_of_type("mzml") or $file_load_section.file_load_conditional.input[0].is_of_type("mzdata") or $file_load_section.file_load_conditional.input[0].is_of_type("netcdf"):
-                #set singlefile_galaxyPath = ','.join( [ str( $single_file ) for $single_file in $file_load_section.file_load_conditional.input ] )
-                #set singlefile_sampleName = ','.join( [ str( $single_file.name ) for $single_file in $file_load_section.file_load_conditional.input ] )
-
-                singlefile_galaxyPath '$singlefile_galaxyPath' singlefile_sampleName '$singlefile_sampleName'
-            #else
-                zipfile '$file_load_section.file_load_conditional.input'
-            #end if
-        #end if
-    </token>
-
-    <xml name="input_file_load">
-        <section name="file_load_section" title="Resubmit your raw dataset or your zip file">
-            <conditional name="file_load_conditional">
-                <param name="file_load_select" type="select" label="Resubmit your dataset or your zip file" help="Use only if you get a message which say that your original dataset or zip file have been deleted on the server." >
-                    <option value="no" >no need</option>
-                    <option value="yes" >yes</option>
-                </param>
-                <when value="no">
-                </when>
-                <when value="yes">
-                    <param name="input" type="data" format="mzxml,mzml,mzdata,netcdf,no_unzip.zip,zip" multiple="true" label="File(s) from your history containing your chromatograms" help="Single file mode for the format: mzxml, mzml, mzdata and netcdf. Zip file mode for the format: no_unzip.zip, zip. See the help section below." />
-                </when>
-            </conditional>
-        </section>
+    
+    <xml name="input_validator_range_integer">
+        <validator type="regex" message="The format is 'min,max'" >[0-9]+ *, *[0-9]+</validator>
     </xml>

-    <xml name="test_file_load_zip">
-        <section name="file_load_section">
-            <conditional name="file_load_conditional">
-                <param name="file_load_select" value="yes" />
-                <param name="input" value="faahKO_reduce.zip" ftype="zip" />
-            </conditional>
-        </section>
+    <xml name="input_validator_range_float">
+        <validator type="regex" message="The format is 'min,max'" >[0-9]+\.?[0-9]* *, *[0-9]+\.?[0-9]*</validator>
     </xml>

-    <xml name="test_file_load_single">
-        <section name="file_load_section">
-            <conditional name="file_load_conditional">
-                <param name="file_load_select" value="yes" />
-                <param name="input" value="wt15.CDF,ko16.CDF,ko15.CDF,wt16.CDF" ftype="netcdf" />
-            </conditional>
-        </section>
+    <xml name="input_validator_list_integer">
+        <validator type="regex" message="The format is '1,2,4,6'" >[0-9, ]+</validator>
     </xml>

-    <token name="@COMMAND_PEAKLIST@">
-        #if $peaklist.peaklistBool
-            variableMetadataOutput '$variableMetadata'
-            dataMatrixOutput '$dataMatrix'
-            convertRTMinute $peaklist.convertRTMinute
-            numDigitsMZ $peaklist.numDigitsMZ
-            numDigitsRT $peaklist.numDigitsRT
-            intval $peaklist.intval
-        #end if
-    </token>
+
+    <token name="@INPUT_IMAGE_LABEL@">RData file</token>
+    <token name="@INPUT_IMAGE_HELP@">It contains a xcms3::XCMSnExp object (named xdata)</token>

-    <xml name="input_peaklist">
-        <conditional name="peaklist">
-            <param name="peaklistBool" type="boolean" label="Get a Peak List" />
-            <when value="true">
-              <param name="convertRTMinute" type="boolean" checked="false" truevalue="TRUE" falsevalue="FALSE" label="Convert retention time (seconds) into minutes" help="Convert the columns rtmed, rtmin and rtmax into minutes"/>
-              <param name="numDigitsMZ" type="integer" value="4" label="Number of decimal places for mass values reported in ions' identifiers." help="A minimum of 4 decimal places is recommended. Useful to avoid duplicates within identifiers" />
-              <param name="numDigitsRT" type="integer" value="0" label="Number of decimal places for retention time values reported in ions' identifiers." help="Useful to avoid duplicates within identifiers" />
-              <param name="intval" type="select" label="Reported intensity values" help="[intval] See the help section below">
-                  <option value="into" selected="true">into</option>
-                  <option value="maxo">maxo</option>
-                  <option value="intb">intb</option>
-              </param>
-            </when>
-            <when value="false" />
-        </conditional>
-    </xml>

-    <xml name="output_peaklist"  token_function="">
-        <data name="variableMetadata" format="tabular" label="${image.name[:-6]}.@FUNCTION@.variableMetadata.tsv">
-            <filter>(peaklist['peaklistBool'])</filter>
-        </data>
-        <data name="dataMatrix" format="tabular" label="${image.name[:-6]}.@FUNCTION@.dataMatrix.tsv" >
-            <filter>(peaklist['peaklistBool'])</filter>
-        </data>
-    </xml>
-
-    <token name="@HELP_AUTHORS@">
-.. class:: infomark
-
-**Authors**  Colin A. Smith csmith@scripps.edu, Ralf Tautenhahn rtautenh@gmail.com, Steffen Neumann sneumann@ipb-halle.de, Paul Benton hpaul.benton08@imperial.ac.uk and Christopher Conley cjconley@ucdavis.edu
+    
+    <token name="@HELP_AUTHORS_WRAPPERS@">

.. class:: infomark

-**Galaxy integration** ABiMS TEAM - UPMC/CNRS - Station biologique de Roscoff and Yann Guitton yann.guitton@oniris-nantes.fr - part of Workflow4Metabolomics.org [W4M]
+**Galaxy integration** ABiMS TEAM - SU/CNRS - Station biologique de Roscoff and Yann Guitton - LABERCA
+Part of Workflow4Metabolomics.org [W4M]

  | Contact support@workflow4metabolomics.org for any questions or concerns about the Galaxy implementation of this tool.

----------------------------------------------------
-
     </token>

-
-    <xml name="citation">
-        <citations>
-            <citation type="doi">10.1021/ac051437y</citation>
+    <xml name="citation_w4m">
             <citation type="doi">10.1093/bioinformatics/btu813</citation>
-        </citations>
     </xml>
</macros>

diff -r 3a5204f14fff -r f439ed7a8f03 macros_xcms.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros_xcms.xml Tue Sep 18 16:09:25 2018 -0400

[

b'@@ -0,0 +1,244 @@\n+<?xml version="1.0"?>\n+<macros>\n+\n+ <token name="@WRAPPER_VERSION@">3.0.0</token>\n+ <xml name="requirements">\n+ <requirements>\n+ <requirement type="package" version="@WRAPPER_VERSION@">bioconductor-xcms</requirement>\n+ <requirement type="package" version="1.1_4">r-batch</requirement>\n+ <requirement type="package" version="1.1_2">r-rcolorbrewer</requirement>\n+ <requirement type="package" version="6.0">unzip</requirement>\n+ <yield />\n+ </requirements>\n+ </xml>\n+\n+ \n+ <token name="@COMMAND_FILE_LOAD@">\n+ #if $file_load_section.file_load_conditional.file_load_select == "yes":\n+ #if $file_load_section.file_load_conditional.input[0].is_of_type("mzxml") or $file_load_section.file_load_conditional.input[0].is_of_type("mzml") or $file_load_section.file_load_conditional.input[0].is_of_type("mzdata") or $file_load_section.file_load_conditional.input[0].is_of_type("netcdf"):\n+ #set singlefile_galaxyPath = \'|\'.join( [ str( $single_file ) for $single_file in $file_load_section.file_load_conditional.input ] )\n+ #set singlefile_sampleName = \'|\'.join( [ str( $single_file.name ) for $single_file in $file_load_section.file_load_conditional.input ] )\n+\n+ singlefile_galaxyPath \'$singlefile_galaxyPath\' singlefile_sampleName \'$singlefile_sampleName\'\n+ #else\n+ zipfile \'$file_load_section.file_load_conditional.input\'\n+ #end if\n+ #end if\n+ </token>\n+\n+ <xml name="input_file_load">\n+ <section name="file_load_section" title="Resubmit your raw dataset or your zip file">\n+ <conditional name="file_load_conditional">\n+ <param name="file_load_select" type="select" label="Resubmit your dataset or your zip file" help="Use only if you get a message saying that your original dataset or zip file have been deleted on the server." >\n+ <option value="no" >no need</option>\n+ <option value="yes" >yes</option>\n+ </param>\n+ <when value="no">\n+ </when>\n+ <when value="yes">\n+ <param name="input" type="data" format="mzxml,mzml,mzdata,netcdf,no_unzip.zip,zip" multiple="true" label="File(s) from your history containing your chromatograms" help="Single file mode for the format: mzxml, mzml, mzdata and netcdf. Zip file mode for the format: no_unzip.zip, zip. See the help section below." />\n+ </when>\n+ </conditional>\n+ </section>\n+ </xml>\n+\n+ <xml name="test_file_load_zip">\n+ <section name="file_load_section">\n+ <conditional name="file_load_conditional">\n+ <param name="file_load_select" value="yes" />\n+ <param name="input" value="faahKO_reduce.zip" ftype="zip" />\n+ </conditional>\n+ </section>\n+ </xml>\n+\n+ <xml name="test_file_load_zip_sacuri">\n+ <section name="file_load_section">\n+ <conditional name="file_load_conditional">\n+ <param name="file_load_select" value="yes" />\n+ <param name="input" value="sacuri_dir_root.zip" ftype="zip" />\n+ </conditional>\n+ </section>\n+ </xml>\n+\n+ <xml name="test_file_load_single">\n+ <section name="file_load_section">\n+ <conditional name="file_load_conditional">\n+ <param name="file_load_select" value="yes" />\n+ <param name="input" value="wt15.CDF,ko16.CDF,ko15.CDF,wt16.CDF" ftype="netcdf" />\n+ </conditional>\n+ </section>\n+ </xml>\n+\n+ <xml name="test_file_load_single_ko15">\n+ <section name="file_load_section">\n+ <conditional name="file_load_conditional">\n+ <param name="file_load_select" value="yes" />\n+ <param name="input" value="ko15.CDF" ftype="netcdf" />\n+'..b'the m/z value at the peak apex and the m/z values left and right of it</option>\n+ <option value="meanApex3">mean of the m/z value of the peak apex and the m/z values left and right of it</option>\n+ </param>\n+ <param argument="integrate" type="select" label="Integration method" >\n+ <option value="1">peak limits are found through descent on the mexican hat filtered data (more robust, but less exact)</option>\n+ <option value="2">peak limits based on real data (more accurate but prone to noise)</option>\n+ </param>\n+ <param argument="mzdiff" type="float" value="-0.001" label="Minimum difference in m/z for peaks with overlapping retention times" help="can be negative to allow overlap" />\n+ <param argument="fitgauss" type="boolean" checked="false" truevalue="TRUE" falsevalue="FALSE" label="fitgauss" help="whether or not a Gaussian should be fitted to each peak" />\n+ <param argument="noise" type="integer" value="0" label="Noise filter" help="allowing to set a minimum intensity required for centroids to be considered in the first analysis step (centroids with intensity lower than \xe2\x80\x98noise\xe2\x80\x99 are omitted from ROI detection)." />\n+ <param argument="verboseColumns" type="boolean" checked="false" truevalue="TRUE" falsevalue="FALSE" label="verbose Columns" help="whether additional peak meta data columns should be returned" />\n+ </xml>\n+\n+ <token name="@COMMAND_CENTWAVEADVROI@">\n+ #if $sectionROI.roiList:\n+ roiList \'$sectionROI.roiList\'\n+ firstBaselineCheck $sectionROI.firstBaselineCheck\n+ #if $sectionROI.roiScales != "":\n+ roiScales "c($sectionROI.roiScales)"\n+ #end if\n+ #end if\n+ </token>\n+\n+ <xml name="input_centwaveAdvROI" token_optional="true">\n+ <param argument="roiList" type="data" format="tabular" optional="@OPTIONAL@" label="List of regions-of-interest (ROI) representing detected mass traces" help="If ROIs are submitted the first analysis step is omitted and chromatographic peak detection is performed on the submitted ROIs. Each ROI is expected to have the following elements specified: \xe2\x80\x98scmin\xe2\x80\x99 (start scan index), \xe2\x80\x98scmax\xe2\x80\x99 (end scan index), \xe2\x80\x98mzmin\xe2\x80\x99 (minimum m/z), \xe2\x80\x98mzmax\xe2\x80\x99 (maximum m/z), \xe2\x80\x98length\xe2\x80\x99 (number of scans), \xe2\x80\x98intensity\xe2\x80\x99 (summed intensity)." />\n+ <param argument="firstBaselineCheck" type="boolean" checked="true" truevalue="TRUE" falsevalue="FALSE" label="Is continuous data within regions of interest is checked to be above the first baseline." />\n+ <param argument="roiScales" type="text" value="" optional="true" label="Numeric vector defining the scale for each region of interest in \xe2\x80\x98roiList\xe2\x80\x99" help="Length equal to \xe2\x80\x98roiList\xe2\x80\x99 - Should be used for the centWave-wavelets (format 0.9,1,0.2)">\n+ <expand macro="input_validator_range_float"/>\n+ </param>\n+ </xml>\n+\n+ \n+ <token name="@HELP_AUTHORS@">\n+.. class:: infomark\n+\n+**Authors** Colin A. Smith csmith@scripps.edu, Ralf Tautenhahn rtautenh@gmail.com, Steffen Neumann sneumann@ipb-halle.de, Paul Benton hpaul.benton08@imperial.ac.uk and Christopher Conley cjconley@ucdavis.edu\n+\n+@HELP_AUTHORS_WRAPPERS@\n+\n+---------------------------------------------------\n+\n+ </token>\n+\n+ <token name="@HELP_XCMS_MANUAL@">\n+\n+For details and explanations concerning all the parameters and workflow of xcms_ package, see its manual_ and this example_\n+\n+.. _xcms: https://bioconductor.org/packages/release/bioc/html/xcms.html\n+.. _manual: http://www.bioconductor.org/packages/release/bioc/manuals/xcms/man/xcms.pdf\n+.. _example: https://bioconductor.org/packages/release/bioc/vignettes/xcms/inst/doc/xcms.html\n+\n+ </token>\n+\n+ <xml name="citation">\n+ <citations>\n+ <citation type="doi">10.1021/ac051437y</citation>\n+ <expand macro="citation_w4m"/>\n+ </citations>\n+ </xml>\n+</macros>\n'

diff -r 3a5204f14fff -r f439ed7a8f03 static/images/xcms_merge_workflow.png

Binary file static/images/xcms_merge_workflow.png has changed

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/MM14-xset.RData

Binary file test-data/MM14-xset.RData has changed

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/MM8-xset.RData

Binary file test-data/MM8-xset.RData has changed

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/ko15-xset.RData

Binary file test-data/ko15-xset.RData has changed

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/ko15.CDF

Binary file test-data/ko15.CDF has changed

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/ko16-xset.RData

Binary file test-data/ko16-xset.RData has changed

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/ko16.CDF

Binary file test-data/ko16.CDF has changed

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/noclass.merged.sampleMetadata.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/noclass.merged.sampleMetadata.tsv Tue Sep 18 16:09:25 2018 -0400

@@ -0,0 +1,5 @@
+sampleMetadata class
+ko15 .
+ko16 .
+wt15 .
+wt16 .

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/wt15-xset.RData

Binary file test-data/wt15-xset.RData has changed

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/wt15.CDF

Binary file test-data/wt15.CDF has changed

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/wt16-xset.RData

Binary file test-data/wt16-xset.RData has changed

diff -r 3a5204f14fff -r f439ed7a8f03 test-data/wt16.CDF

Binary file test-data/wt16.CDF has changed

diff -r 3a5204f14fff -r f439ed7a8f03 xcms_merge.r
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/xcms_merge.r Tue Sep 18 16:09:25 2018 -0400

[

@@ -0,0 +1,45 @@
+#!/usr/bin/env Rscript
+
+#Import the different functions
+source_local <- function(fname){ argv <- commandArgs(trailingOnly=FALSE); base_dir <- dirname(substring(argv[grep("--file=", argv)], 8)); source(paste(base_dir, fname, sep="/")) }
+source_local("lib.r")
+source_local("lib-xcms3.x.x.r")
+
+pkgs <- c("xcms","batch")
+loadAndDisplayPackages(pkgs)
+cat("\n\n");
+
+args <- parseCommandArgs(evaluate=FALSE) #interpretation of arguments given in command line as an R list of objects
+
+
+cat("\tXSET MERGING...\n")
+
+mergeXDataReturn <- mergeXData(args)
+xdata <- mergeXDataReturn$xdata
+singlefile <- mergeXDataReturn$singlefile
+md5sumList <- mergeXDataReturn$md5sumList
+sampleNamesList <- mergeXDataReturn$sampleNamesList
+chromTIC <- mergeXDataReturn$chromTIC
+chromBPI <- mergeXDataReturn$chromBPI
+
+# Create a sampleMetada file
+sampleNamesList <- getSampleMetadata(xdata=xdata, sampleMetadataOutput="sampleMetadata.tsv")
+
+cat("\n\n")
+
+cat("\tXCMSnExp OBJECT INFO\n")
+print(pData(xdata))
+print(xdata)
+cat("\n\n")
+
+cat("\txcmsSet OBJECT INFO\n")
+# Get the legacy xcmsSet object
+xset <- getxcmsSetObject(xdata)
+print(xset@phenoData)
+print(xset)
+cat("\n\n")
+
+cat("\tSAVE RData\n")
+#saving R data in .Rdata file to save the variables used in the present tool
+objects2save <- c("xdata", "zipfile", "singlefile", "md5sumList", "sampleNamesList", "chromTIC", "chromBPI")
+save(list=objects2save[objects2save %in% ls()], file="merged.RData")

diff -r 3a5204f14fff -r f439ed7a8f03 xcms_merge.xml
--- a/xcms_merge.xml Tue Feb 13 04:48:41 2018 -0500
+++ b/xcms_merge.xml Tue Sep 18 16:09:25 2018 -0400

[

b'@@ -1,99 +1,45 @@\n-<tool id="xcms_merge" name="xcms.xcmsSet Merger" version="1.1.0">\n- <description>Merge xcms.xcmsSet xset in one to be used by group</description>\n+<tool id="xcms_merge" name="xcms findChromPeaks Merger" version="@WRAPPER_VERSION@.0">\n+ <description>Merge xcms findChromPeaks RData into a unique file to be used by group</description>\n \n <macros>\n <import>macros.xml</import>\n+ <import>macros_xcms.xml</import>\n </macros>\n \n- <expand macro="requirements_light"/>\n+ <expand macro="requirements"/>\n <expand macro="stdio"/>\n \n <command><![CDATA[\n- Rscript $script_file\n+ @COMMAND_RSCRIPT@/xcms_merge.r\n+\n+ images \'c("${"\\",\\"".join(map(str, $images))}")\'\n+\n+ #if str($sampleMetadata) != \'None\':\n+ sampleMetadata \'$sampleMetadata\'\n+ #end if\n+\n+ @COMMAND_FILE_LOAD@\n ]]></command>\n \n- <configfiles>\n- <configfile name="script_file"><![CDATA[\n-suppressPackageStartupMessages(library(xcms, quietly=TRUE))\n-\n-images=c(\n-"${"\\",\\"".join(map(str, $images))}"\n-)\n-\n-\n-cat("\\tXSET MERGING...\\n")\n-\n-for(image in images) {\n- load(image)\n- cat(sampleNamesList\\$sampleNamesOrigin,"\\n")\n- if (!exists("xset_merged")) {\n- xset_merged=xset\n- singlefile_merged=singlefile\n- listOFlistArguments_merged=listOFlistArguments\n- md5sumList_merged=md5sumList\n- sampleNamesList_merged=sampleNamesList\n- } else {\n- xset_merged=c(xset_merged,xset)\n- singlefile_merged=c(singlefile_merged,singlefile)\n- listOFlistArguments_merged=c(listOFlistArguments_merged,listOFlistArguments)\n- md5sumList_merged\\$origin=rbind(md5sumList_merged\\$origin,md5sumList\\$origin)\n- sampleNamesList_merged\\$sampleNamesOrigin=c(sampleNamesList_merged\\$sampleNamesOrigin,sampleNamesList\\$sampleNamesOrigin)\n- sampleNamesList_merged\\$sampleNamesMakeNames=c(sampleNamesList_merged\\$sampleNamesMakeNames,sampleNamesList\\$sampleNamesMakeNames)\n- }\n-}\n-rm(image)\n-xset=xset_merged; rm(xset_merged)\n-singlefile=singlefile_merged; rm(singlefile_merged)\n-listOFlistArguments=listOFlistArguments_merged; rm(listOFlistArguments_merged)\n-md5sumList=md5sumList_merged; rm(md5sumList_merged)\n-sampleNamesList=sampleNamesList_merged; rm(sampleNamesList_merged)\n+ <inputs>\n+ <param name="images" type="data" format="rdata.xcms.findchrompeaks,rdata" label="@INPUT_IMAGE_LABEL@" help="@INPUT_IMAGE_HELP@ from multiple findChromPeaks" multiple="true" />\n+ <param name="sampleMetadata" label="Sample metadata file " format="tabular" type="data" optional="true" help="must contain at least one column with the sample id and one column with the sample class"/>\n \n-#if str($sampleMetadata) != \'None\':\n- cat("\\tXSET PHENODATA SETTING...\\n")\n- sampleMetadata=read.table("$sampleMetadata", h=F, sep=";", stringsAsFactors=F)\n- if (ncol(sampleMetadata) < 2) sampleMetadata=read.table("$sampleMetadata", h=F, sep="\\t", stringsAsFactors=F)\n- if (ncol(sampleMetadata) < 2) sampleMetadata=read.table("$sampleMetadata", h=F, sep=",", stringsAsFactors=F)\n- if (ncol(sampleMetadata) < 2) {\n- error_message="Your sampleMetadata file seems not well formatted. The column separators accepted are ; , and tabulation"\n- print(error_message)\n- stop(error_message)\n- }\n-\n- sampclass(xset)=sampleMetadata\\$V2[match(rownames(xset@phenoData),sampleMetadata\\$V1)]\n-\n- if (any(is.na(sampclass(xset)))) {\n- sample_missing <- rownames(phenoData(xset))[is.na(sampclass(xset))]\n- error_message <- paste("Those samples are missing in your sampleMetadata:", paste(sample_missing, collapse=" "))\n- print(error_message)\n- stop(error_message)\n- }\n-#end if\n-\n-\n-\n-cat("\\tXSET OBJECT INFO\\n")\n-\n-print(xset@phenoData)\n-print(xset)\n-\n-cat("\\tSAVE RData\\n")\n-save.image("$xsetRData")\n-\n- ]]></configfile>\n- </configfiles>\n-\n- <inputs>\n- <param name="images" type="data" format="'..b'===============+=================+\n-|xcms.group | xset.RData | rdata.xcms.raw |\n-+---------------------------+--------------------+-----------------+\n+=========================== ==================== ============================\n+Name Output file Format\n+=========================== ==================== ============================\n+xcms.groupChromPeaks xset.merged.RData rdata.xcms.findchrompeaks\n+=========================== ==================== ============================\n \n .. image:: xcms_merge_workflow.png\n \n@@ -191,50 +131,60 @@\n Input files\n -----------\n \n-+---------------------------+-----------------------+\n-| Parameter : num + label | Format |\n-+===========================+=======================+\n-| 1 : RData file | rdata.xcms.raw |\n-+---------------------------+-----------------------+\n-| 2 : RData file | rdata.xcms.raw |\n-+---------------------------+-----------------------+\n-| N : RData file | rdata.xcms.raw |\n-+---------------------------+-----------------------+\n-| Optional : sampleMetadata | tsv or csv |\n-+---------------------------+-----------------------+\n+=========================== ==================================\n+Parameter : num + label Format\n+=========================== ==================================\n+1 : RData file rdata.xcms.findchrompeaks\n+--------------------------- ----------------------------------\n+2 : RData file rdata.xcms.findchrompeaks\n+--------------------------- ----------------------------------\n+N : RData file rdata.xcms.findchrompeaks\n+--------------------------- ----------------------------------\n+Optional : sampleMetadata tsv or csv\n+=========================== ==================================\n \n Example of a sampleMetadata:\n \n-+---------------------------+------------+\n-|HU_neg_028 | bio |\n-+---------------------------+------------+\n-|HU_neg_034 | bio |\n-+---------------------------+------------+\n-|Blanc04 | blank |\n-+---------------------------+------------+\n-|Blanc06 | blank |\n-+---------------------------+------------+\n-|Blanc09 | blank |\n-+---------------------------+------------+\n+=========================== ============\n+Samples class\n+=========================== ============\n+HU_neg_028 bio\n+--------------------------- ------------\n+HU_neg_034 bio\n+--------------------------- ------------\n+Blanc04 blank\n+--------------------------- ------------\n+Blanc06 blank\n+--------------------------- ------------\n+Blanc09 blank\n+=========================== ============\n+\n \n ------------\n Output files\n ------------\n \n-xset.merged.RData: rdata.xcms.raw format\n+xset.merged.RData: rdata.xcms.findchrompeaks format\n \n- | Rdata file that is necessary in the next step of the workflow "xcms.group".\n+ | Rdata file that is necessary in the next step of the workflow "xcms.groupChromPeaks".\n \n ---------------------------------------------------\n \n Changelog/News\n --------------\n \n+**Version 3.0.0.0 - 08/03/2018**\n+\n+- UPGRADE: upgrade the xcms version from 1.46.0 to 3.0.0. So refactoring of a lot of underlining codes and methods\n+\n+- IMPROVMENT: a new dedicated tool "xcms plot chromatogram" will allow you to get TIC and BPI of your raw data.\n+\n+- IMPROVMENT: the tool will now generate a sampleMetadata file if any was provided. It will be useful to add some further information for the normalization and statistics steps.\n+\n **Version 1.0.1 - 13/02/2017**\n \n - IMPROVMENT: the tool will now raise an error if a sample isn\'t describe in the sampleMetadata file\n \n-\n **Version 1.0.0 - 03/02/2017**\n \n - NEW: a new tool to merge individual xcmsSet outputs to be used by xcms.group\n'