changeset 0:f3f97841564f draft

Uploaded
author lecorguille
date Fri, 07 Aug 2015 11:02:28 -0400
parents
children e51ff83e4d94
files abims_xcms_group.xml repository_dependencies.xml static/images/xcms_group.png static/images/xcms_group_workflow.png test-data/xset.RData test-data/xset.group.RData test-data/xset.group.Rplots.pdf tool_dependencies.xml
diffstat 8 files changed, 282 insertions(+), 0 deletions(-) [+]
line wrap: on
line diff
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/abims_xcms_group.xml	Fri Aug 07 11:02:28 2015 -0400
@@ -0,0 +1,266 @@
+<tool id="abims_xcms_group" name="xcms.group" version="2.0.2">
+
+    <description>Group peaks together across samples using overlapping m/z bins and calculation of smoothed peak distributions in chromatographic time.</description>
+
+    <requirements>
+        <requirement type="package" version="3.1.2">R</requirement>
+        <requirement type="binary">Rscript</requirement>
+        <requirement type="package" version="1.44.0">xcms</requirement>
+        <requirement type="package" version="2.1">xcms_w4m_script</requirement>
+    </requirements>
+
+    <stdio>
+        <exit_code range="1:" level="fatal" />
+    </stdio>
+
+    <command>
+        xcms.r 
+        xfunction group image $image method $methods.method sleep 0.001 
+        #if $methods.method == "density":
+            ## minsamp $methods.minsamp 
+            minfrac $methods.minfrac 
+            bw $methods.bw 
+            mzwid $methods.mzwid
+        #if $methods.density_options.option == "show":
+            max $methods.density_options.max
+        #end if 
+        #elif $methods.method == "mzClust":
+            mzppm $methods.mzppm
+            mzabs $methods.mzabs
+            minfrac $methods.minfrac
+            ## minsamp $methods.minsamp
+        #else:
+            mzVsRTbalance $methods.mzVsRTbalance
+            mzCheck $methods.mzCheck
+            rtCheck $methods.rtCheck
+            kNN $methods.kNN
+        #end if
+        &amp;&amp; (
+        mv group.RData $xsetRData;
+        mv Rplots.pdf $rplotsPdf
+        );
+        cat xset.log
+   </command> 
+
+    <inputs>
+        <param name="image" type="data" format="rdata.xcms.raw,rdata.xcms.group,rdata.xcms.retcor,rdata" label="xset RData file" help="output file from another function xcms (xcmsSet, retcor etc.)" />
+        <conditional name="methods">
+            <param name="method" type="select" label="Method to use for grouping" help="[method] See the help section below">
+                <option value="density" selected="true">density</option>
+                <option value="mzClust" >mzClust</option>
+                <option value="nearest" >nearest</option>
+            </param>
+            <when value="density">
+                <param name="bw" type="integer" value="30" label="Bandwidth" help="[bw] bandwidth (standard deviation or half width at half maximum) of gaussian smoothing kernel to apply to the peak density chromatogram" />
+                <param name="minfrac" type="float" value="0.5" label="Minimum fraction of samples necessary" help="[minfrac] in at least one of the sample groups for it to be a valid group" />
+                <param name="mzwid" type="float" value="0.25" label="Width of overlapping m/z slices" help="[mzwid] to use for creating peak density chromatograms and grouping peaks across samples " />
+<!--
+                <param name="minsamp" type="hidden" value="1" label="minsamp" help="minimum number of samples necessary in at least one of the sample groups for it to be a valid group " /> 
+-->
+            <conditional name="density_options">
+            <param name="option" type="select" label="Advanced options">
+                <option value="show">show</option>
+                <option value="hide" selected="true">hide</option>
+            </param>
+            <when value="show">
+                <param name="max" type="integer" value="5" label="Maximum number of groups to identify in a single m/z slice" help="[max]" />
+            </when>
+            <when value="hide">
+            </when>
+        </conditional>
+
+            </when>
+            <when value="mzClust">
+                <param name="mzppm" type="integer" value="20 " label="Relative error used for clustering/grouping in ppm" help="[mzppm]" />
+                <param name="mzabs" type="float" value="0" label="Absolute error used for clustering/grouping" help="[mzabs]" />
+                <param name="minfrac" type="float" value="0" label="Minimum fraction of each class in one bin" help="[minfrac] minimum fraction of samples necessary in at least one of the sample groups for it to be a valid group" />
+<!--
+                <param name="minsamp" type="hidden" value="1" label="minsamp" help="minimum number of samples necessary in at least one of the sample groups for it to be a valid group " />   
+-->
+            </when>
+            <when value="nearest">
+                <param name="mzVsRTbalance" type="integer" value="10 " label="Multiplicator for mz value before calculating the (euclidean) distance between two peaks." help="[mzVsRTbalance]" />
+                <param name="mzCheck" type="float" value="0.2" label="Maximum tolerated distance for mz" help="[mzCheck]" />
+                <param name="rtCheck" type="integer" value="15" label="Maximum tolerated distance for RT" help="[rtCheck]" />
+                <param name="kNN" type="integer" value="10" label="Number of nearest Neighbours to check" help="[kNN]" />    
+            </when>
+        </conditional>
+<!--
+        <param name="sleepy" type="float" value="0.001" label="sleep" help="seconds to pause between plotting successive steps of the peak grouping algorithm. peaks are plotted as points showing relative intensity. identified groups are flanked by dotted vertical lines"> 
+            <validator type="in_range" message="Must be more than 0" min="0.001" max="inf"/>
+        </param>
+-->
+
+    </inputs>
+
+    <outputs>
+        <data name="xsetRData" format="rdata.xcms.group" label="${image.name[:-6]}.group.RData"/>
+        <data name="rplotsPdf" format="pdf" label="${image.name[:-6]}.group.Rplots.pdf"/>
+    </outputs>
+
+    <tests>
+        <test>
+            <param name="image" value="xset.RData"/>
+            <param name="methods.method" value="density"/>
+            <param name="methods.bw" value="5"/>
+            <param name="methods.minfrac" value="0.3"/>
+            <param name="methods.mzwid" value="0.01"/>
+            <param name="methods.density_options.option" value="show"/>
+            <param name="methods.density_options.max" value="50"/>
+            <output name="xsetRData" file="xset.group.RData" />
+            <output name="rplotsPdf" file="xset.group.Rplots.pdf" />
+         
+        </test>
+    </tests>
+
+    <help>
+        
+.. class:: infomark
+
+**Authors**  Colin A. Smith csmith@scripps.edu, Ralf Tautenhahn rtautenh@gmail.com, Steffen Neumann sneumann@ipb-halle.de, Paul Benton hpaul.benton08@imperial.ac.uk and Christopher Conley cjconley@ucdavis.edu 
+
+**Galaxy integration** ABiMS TEAM - UPMC/CNRS - Station biologique de Roscoff and Yann Guitton yann.guitton@univ-nantes.fr - part of Workflow4Metabolomics.org [W4M]
+
+ | Contact support@workflow4metabolomics.org for any questions or concerns about the Galaxy implementation of this tool.
+
+
+
+---------------------------------------------------
+
+==========
+Xcms.Group
+==========
+
+-----------
+Description
+-----------
+
+After peak identification with xcmsSet, this tool groups the peaks which represent the same analyte across samples using overlapping m/z bins and calculation of smoothed peak distributions in chromatographic time. Allows rejection of features, which are only partially detected within the replicates of a sample class.
+
+
+
+-----------------
+Workflow position
+-----------------
+
+**Upstream tools**
+
+========================= ================= =================== ==========
+Name                      output file       format              parameter
+========================= ================= =================== ==========
+xcms.xcmsSet              xset.RData        rdata.xcms.raw      RData file
+------------------------- ----------------- ------------------- ----------
+xcms.retcor               xset.RData        rdata.xcms.retcor   RData file
+========================= ================= =================== ==========
+
+
+**Downstream tools**
+
++---------------------------+--------------------------------------+
+| Name                      | Output file     | Format             |
++===========================+=================+====================+
+|xcms.retcor                | xset.RData      | rdata.xcms.group   |
++---------------------------+--------------------------------------+
+|xcms.fillPeaks             | xset.RData      | rdata.xcms.group   |
++---------------------------+--------------------------------------+
+
+The output file is an xcmsSet.RData file. You can continue your analysis using it in **xcms.retcor** tool as an next step and then **xcms.fillPeaks**.
+
+**General schema of the metabolomic workflow**
+
+.. image:: xcms_group_workflow.png
+
+
+-----------
+Input files
+-----------
+
++---------------------------+-----------------------+
+| Parameter : num + label   |   Format              |
++===========================+=======================+
+| 1 : RData file            |   rdata.xcms.group    |
++---------------------------+-----------------------+
+
+
+----------
+Parameters
+----------
+
+Method to use for grouping
+--------------------------
+
+**mzClust**
+
+    | Runs high resolution alignment on single spectra samples stored in the RData file generated by the **xcmsSet tool**.
+
+**density**
+
+    | Groups peaks together across samples using overlapping m/z bins and calculation of smoothed peak distributions in chromatographic time.
+
+**nearest**
+
+    | Groups peaks together across samples by creating a master peak list and assigning corresponding peaks from all samples. It is inspired by the alignment algorithm of mzMine.
+
+
+------------
+Output files
+------------
+
+xset.group.Rplots.pdf
+
+xset.group.RData: rdata.xcms.group format
+
+    | Rdata file that will be necessary in the third and fourth step of the workflow (xcms.retcor and xcms.fillpeaks).
+    
+
+------
+
+.. class:: infomark 
+
+The output file is an xset.group.RData file. You can continue your analysis using it in **xcms.retcor** tool.
+
+    
+---------------------------------------------------
+
+
+---------------
+Working example
+---------------
+
+Input files
+-----------
+
+    | RData file -> **xset.RData**
+
+Parameters
+----------
+
+    | Method -> **density**
+    | bw     -> **5**
+    | minfrac -> **0.3**
+    | mzwid    -> **0.01**
+    | Advanced options: **show**
+    | max -> **50**
+
+
+Output files
+------------
+
+    | **1) xset.RData: RData file**
+
+    | **2) Example of an xset.group.Rplots pdf file**
+
+.. image:: xcms_group.png
+        :width: 700
+
+
+    </help>
+
+
+    <citations>
+        <citation type="doi">10.1021/ac051437y</citation>
+        <citation type="doi">10.1093/bioinformatics/btu813</citation>
+    </citations>
+
+
+</tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/repository_dependencies.xml	Fri Aug 07 11:02:28 2015 -0400
@@ -0,0 +1,4 @@
+<?xml version="1.0"?>
+<repositories>
+    <repository changeset_revision="d64562a4ebb3" name="rdata_xcms_datatypes" owner="lecorguille" toolshed="https://toolshed.g2.bx.psu.edu" />
+</repositories>
Binary file static/images/xcms_group.png has changed
Binary file static/images/xcms_group_workflow.png has changed
Binary file test-data/xset.RData has changed
Binary file test-data/xset.group.RData has changed
Binary file test-data/xset.group.Rplots.pdf has changed
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_dependencies.xml	Fri Aug 07 11:02:28 2015 -0400
@@ -0,0 +1,12 @@
+<?xml version="1.0"?>
+<tool_dependency>
+    <package name="R" version="3.1.2">
+        <repository changeset_revision="9f2fddb9d6e2" name="package_r_3_1_2" owner="iuc" toolshed="https://toolshed.g2.bx.psu.edu" />
+    </package>
+    <package name="xcms" version="1.44.0">
+        <repository changeset_revision="a1c3fc774157" name="package_r_xcms_1_44_0" owner="lecorguille" toolshed="https://toolshed.g2.bx.psu.edu" />
+    </package>
+    <package name="xcms_w4m_script" version="2.1">
+        <repository changeset_revision="c94c8ef520c8" name="package_xcms_w4m_script_2_1" owner="lecorguille" toolshed="https://toolshed.g2.bx.psu.edu" />
+    </package>
+</tool_dependency>