annotate batchcorrection-57edfd3943ab/batch_correction.xml @ 3:73892ef177e3 draft

Uploaded
author melpetera
date Tue, 02 May 2017 09:47:22 -0400
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
3
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
1 <tool id="Batch_correction" name="Batch_correction" version="2.1.2">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
2 <description>Corrects intensities for signal drift and batch-effects</description>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
3
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
4 <requirements>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
5 <requirement type="package">r-batch</requirement>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
6 <requirement type="package">r-ade4</requirement>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
7 <requirement type="package">bioconductor-pcamethods</requirement>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
8 <requirement type="package">bioconductor-ropls</requirement>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
9 </requirements>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
10
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
11 <stdio>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
12 <exit_code range="1:" level="fatal" />
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
13 </stdio>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
14
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
15 <command><![CDATA[
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
16 #if str($span_condition.method) == 'all_loess_pool':
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
17 Rscript '$__tool_directory__/batch_correction_all_loess_wrapper.R'
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
18 dataMatrix "$dataMatrix"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
19 sampleMetadata "$sampleMetadata"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
20 variableMetadata "$variableMetadata"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
21 method "all_loess_pool"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
22 span "${span_condition.span}"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
23
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
24 #elif str($span_condition.method) == 'all_loess_sample':
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
25 Rscript '$__tool_directory__/batch_correction_all_loess_wrapper.R'
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
26 dataMatrix "$dataMatrix"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
27 sampleMetadata "$sampleMetadata"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
28 variableMetadata "$variableMetadata"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
29 method "all_loess_sample"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
30 span "${span_condition.span}"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
31 #else:
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
32 Rscript '$__tool_directory__/batch_correction_wrapper.R'
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
33 analyse "batch_correction"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
34 dataMatrix "$dataMatrix"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
35 sampleMetadata "$sampleMetadata"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
36 variableMetadata "$variableMetadata"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
37 method "${span_condition.method}"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
38 #if str($span_condition.method) == 'linear':
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
39 span "none"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
40 #else:
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
41 span "${span_condition.span}"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
42 #end if
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
43 valnull "${span_condition.valnull}"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
44 ref_factor "${span_condition.ref_factor}"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
45 detail "${span_condition.detail}"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
46 #end if
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
47 dataMatrix_out "$dataMatrix_out" variableMetadata_out "$variableMetadata_out"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
48 graph_output "$graph_output" rdata_output "$rdata_output"
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
49 ]]></command>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
50
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
51 <inputs>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
52 <param name="dataMatrix" label="Data Matrix file " format="tabular" type="data" />
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
53 <param name="sampleMetadata" label="Sample metadata file " format="tabular" type="data" help="must contain at least the three following columns: 'batch' + 'injectionOrder' + 'sampleType'"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
54 <param name="variableMetadata" label="Variable metadata file " format="tabular" type="data" />
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
55
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
56 <conditional name="span_condition">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
57 <param name="method" label="Type of regression model " type="select" help="To select between linear or non-linear (lowess or loess) methods to be used in Van der Kloet algorithm ; when using loess, you can choose to use pools or samples to model batch effect.">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
58 <option value="linear">linear</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
59 <option value="lowess">lowess</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
60 <option value="loess">loess</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
61 <option value="all_loess_pool">all loess pool</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
62 <option value="all_loess_sample">all loess sample</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
63 </param>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
64 <when value="linear">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
65 <param name="valnull" label="Null values" type="select" display="radio" help="What to do with generated negative or infinite values">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
66 <option value="0">consider it as a null intensity</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
67 <option value="NA">consider it as a missing value</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
68 </param>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
69 <param name="ref_factor" label="Factor of interest " type="text" value="batch" help="column name of factor of interest (often a biological factor); if none, leave 'batch'" />
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
70 <param name="detail" label="Level of details for plots " type="select" help="Amount of plots in the pdf file output. See Help section for more details.">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
71 <option value="no">basic</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
72 <option value="plot">standard</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
73 <option value="reg">complete</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
74 </param>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
75 </when>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
76 <when value="lowess">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
77 <param name="span" type="float" value="0.85" min="0" max="1" label="span" help="it is an advanced option. Must be less than or equal to 1"/> <!-- min/max are inclusive bounds, so out-of-range spans are refused by the tool form instead of reaching the R script -->
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
78 <param name="valnull" label="Null values" type="select" display="radio" help="What to do with generated negative or infinite values">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
79 <option value="0">consider it as a null intensity</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
80 <option value="NA">consider it as a missing value</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
81 </param>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
82 <param name="ref_factor" label="Factor of interest " type="text" value="batch" help="column name of factor of interest (often a biological factor); if none, leave 'batch'" />
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
83 <param name="detail" label="Level of details for plots " type="select" help="Amount of plots in the pdf file output. See Help section for more details.">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
84 <option value="no">basic</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
85 <option value="plot">standard</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
86 <option value="reg">complete</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
87 </param>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
88 </when>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
89 <when value="loess">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
90 <param name="span" type="float" value="1" min="0" label="span" help="it is an advanced option. Must be strictly greater than 0"/> <!-- min is an inclusive bound: negative spans are refused by the tool form, 0 itself is not -->
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
91 <param name="valnull" label="Null values" type="select" display="radio" help="What to do with generated negative or infinite values">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
92 <option value="0">consider it as a null intensity</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
93 <option value="NA">consider it as a missing value</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
94 </param>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
95 <param name="ref_factor" label="Factor of interest " type="text" value="batch" help="column name of factor of interest (often a biological factor); if none, leave 'batch'" />
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
96 <param name="detail" label="Level of details for plots " type="select" help="Amount of plots in the pdf file output. See Help section for more details.">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
97 <option value="no">basic</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
98 <option value="plot">standard</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
99 <option value="reg">complete</option>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
100 </param>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
101 </when>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
102 <when value="all_loess_pool">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
103 <param name="span" type="float" value="1" min="0" label="span" help="smoothing parameter; must be > 0"/> <!-- min is an inclusive bound: negative spans are refused by the tool form, 0 itself is not -->
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
104 </when>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
105 <when value="all_loess_sample">
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
106 <param name="span" type="float" value="1" min="0" label="span" help="smoothing parameter; must be > 0"/> <!-- min is an inclusive bound: negative spans are refused by the tool form, 0 itself is not -->
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
107 </when>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
108 </conditional>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
109 </inputs>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
110
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
111 <outputs>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
112 <data name="dataMatrix_out" label="${tool.name}_${span_condition.method}_${dataMatrix.name}" format="tabular"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
113 <data name="variableMetadata_out" label="${tool.name}_${span_condition.method}_${variableMetadata.name}" format="tabular"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
114 <data name="graph_output" label="${tool.name}_${span_condition.method}_graph" format="pdf"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
115 <data name="rdata_output" label="${tool.name}_${span_condition.method}_rdata" format="rdata"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
116 </outputs>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
117
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
118 <tests>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
119 <test>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
120 <param name="dataMatrix" value="input-batchcorrection-dataMatrix.tsv"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
121 <param name="sampleMetadata" value="input-batchcorrection-sampleMetadata.tsv"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
122 <param name="variableMetadata" value="input-batchcorrection-variableMetadata.tsv"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
123 <param name="method" value="all_loess_pool"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
124 <param name="span" value="1"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
125 <output name="dataMatrix_out" file="output-batchcorrection-dataMatrix.tsv"/>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
126 </test>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
127 </tests>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
128
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
129
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
130 <help>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
131
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
132 .. class:: infomark
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
133
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
134 **Authors**
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
135 | Jean-Francois Martin - PF MetaToul-AXIOM ; INRA ; MetaboHUB (for original version of this tool and overall development of the R script)
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
136 | Melanie Petera - PFEM ; INRA ; MetaboHUB (for R wrapper and R script improvement)
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
137 | Marion Landi - FLAME ; PFEM ; INRA ; MetaboHUB (for xml interface and R wrapper)
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
138 | Franck Giacomoni - PFEM ; INRA ; MetaboHUB (for xml interface and R wrapper)
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
139 | Etienne Thevenot - LIST/LADIS ; CEA ; MetaboHUB (for R script and wrapper regarding "all loess pool" and "all loess sample" methods)
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
140
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
141 ---------------------------------------------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
142
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
143 .. class:: infomark
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
144
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
145 **Please cite** If you use this tool, please cite:
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
146
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
147 when using the **linear**, **lowess** or **loess** methods:
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
148 | `F.M. Van Der Kloet, I. Bobeldijk, E.R. Verheij, R.H. Jellema. (2009). "Analytical error reduction using single point calibration for accurate and precise metabolomic phenotyping." Journal of Proteome Research p5132-5141 &lt;http://www.ncbi.nlm.nih.gov/pubmed/19754161&gt;`_
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
149
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
150 when using the **all loess pool** or **all loess sample** method:
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
151 | `Dunn et al (2011). Procedures for large-scale metabolic profiling of serum and plasma using gas chromatography and liquid chromatography coupled to mass spectrometry. Nature Protocols, 6:1060-1083 &lt;http://dx.doi.org/10.1038/nprot.2011.335&gt;`_
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
152 | Cleveland et al (1997). In Statistical Models in S; Chambers JM. and Hastie TJ. Ed.; Chapman and Hall: London; pp. 309-376
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
153 | Etienne A. Thevenot, Aurelie Roux, Ying Xu, Eric Ezan, and Christophe Junot (2015). Analysis of the human adult urinary metabolome variations with age, body mass index and gender by implementing a comprehensive workflow for univariate and OPLS statistical analyses. *Journal of Proteome Research*, **14**:3322-3335 (http://dx.doi.org/10.1021/acs.jproteome.5b00354).
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
154
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
155 ---------------------------------------------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
156
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
157 .. class:: infomark
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
158
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
159 **Tool updates**
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
160
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
161 See the **NEWS** section at the bottom of this page
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
162
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
163 ---------------------------------------------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
164
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
165 ================
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
166 Batch_correction
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
167 ================
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
168
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
169 -----------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
170 Description
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
171 -----------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
172
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
173 | **Instrumental drift** and **offset differences** between batches have been described in **LC-MS** experiments when the number of samples is large and/or multiple batches of acquisition are needed.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
174 | Recently a normalization strategy relying on the measurements of a **pooled** (or QC) sample injected periodically has been described: for each variable, a **regression model** is fitted to the values of the **pool** and subsequently used to adjust the intensities of the samples of interest (van der Kloet et al, 2009; Dunn et al, 2011).
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
175 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
176 | The current tool implements **two strategies** which differ in the way the regression model is applied to the variables (either depending on variable quality metrics, or 'loess' model for all variables) and also in the generated figure.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
177 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
178
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
179
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
180 -----------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
181 Workflow position
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
182 -----------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
183
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
184 .. image:: batch_correction.png
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
185 :width: 800
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
186
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
187
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
188 -----------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
189 Input files
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
190 -----------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
191
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
192 +----------------------------+------------+
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
193 | Parameter : num + label | Format |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
194 +============================+============+
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
195 | 1 : Data Matrix file | tabular |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
196 +----------------------------+------------+
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
197 | 2 : Sample metadata file | tabular |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
198 +----------------------------+------------+
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
199 | 3 : Variable metadata file | tabular |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
200 +----------------------------+------------+
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
201
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
202
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
203 Data Matrix file must contain the intensity values of variables.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
204 | First line must contain all the samples' names
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
205 | First column must contain all the variables' ID
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
206 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
207
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
208 Sample metadata file must contain at least the three following columns:
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
209 | "batch" to identify the batches of analyses
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
210 | "injectionOrder" (integers) defining the injection order of all samples (QC-pools as well as analysed samples)
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
211 | "sampleType" indicating whether the injection is a sample ("sample") or a QC-pool ("pool"); each batch needs
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
212 | at least 3 QC-pools for intra-batch linear adjustment and 8 for lo(w)ess adjustment (5 for **all loess** methods)
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
213
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
214
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
215 .. class:: warningmark
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
216
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
217 MISSING DATA are allowed only with the **all loess** methods
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
218
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
219
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
220 ----------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
221 Parameters
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
222 ----------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
223
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
224 Type of regression model
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
225 | To choose between *linear*, *lowess*, *loess*, *all loess pool*, and *all loess sample* strategies
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
226 | **- Option 1** (**linear**, **lowess**, and **loess** methods): before the normalisation of each variable, some quality metrics are computed (see the "Determine Batch Correction" module); depending on the result, the variable can be normalized or not, with either the **linear**, **lowess** or **loess** model.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
227 | **- Option 2** (**all loess pool** and **all loess sample**): each variable is normalized by using the 'loess' model;
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
228 | in the case **all loess pool** is chosen and the number of pool observations is below 5, the linear method is used (for all variables) and a warning is generated;
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
229 | if the pool intensities are not representative of the samples (which can be viewed on the figure where both trends are shown), the case **all loess sample** enables using the sample intensities (instead of the pool intensities) as the reference for the loess curve.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
230 | In all "option 2" cases: the **median intensity of the reference observations** (either 'pool' or 'sample') is used as the scaling factor after the initial intensities have been divided by the loess predictions.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
231 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
232
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
233 Span
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
234 | Smoothing parameter, advanced option for *lo(w)ess* and *all loess* methods
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
235 | In case of a loess fit, the **span** parameter (between 0 and 1) controls the smoothing
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
236 | (the higher the smoother; higher values are preferred to avoid overfitting; Cleveland et al, 1997).
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
237 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
238
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
239 Null values
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
240 | available for regression model *linear*, *lowess* and *loess*
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
241 | Controls what is done regarding negative or infinite values that can be generated during regression estimation.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
242 | *consider it as a missing value* will switch concerned intensities to NA;
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
243 | this option implies that concerned ions will not be considered in PCA display.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
244 | *consider it as a null intensity* will switch concerned intensities to 0 for lo(w)ess
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
245 | or correct them by the batch mean instead of regression estimate for linear.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
246 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
247
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
248 Factor of interest
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
249 | available for regression model *linear*, *lowess* and *loess*
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
250 | Name of the factor (column header) in Sample metadata file that will be used as a categorical variable for plots and PCA.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
251 | (often a biological factor ; if none, leave "batch")
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
252 | This factor does not affect correction calculation.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
253 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
254
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
255 Level of details for plots
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
256 | available for regression model *linear*, *lowess* and *loess*
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
257 | *basic*: PCA + CV boxplot (before and after correction)
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
258 | *standard*: 'basic' plots + before/after-correction plots of intensities over injection order, and design effects for each ion
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
259 | *complete*: 'standard' plots + QC-pool regression plots per batch with samples' intensities over injection order
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
260 | This parameter is not used by the *all loess* methods where a single figure is generated showing the sum of intensities along injection order, and the first 4 PCA scores.
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
261 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
262
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
263
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
264 ------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
265 Output files
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
266 ------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
267
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
268 Batch_correction_$method_rdata.rdata
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
269 | binary data
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
270 | Download, open R and use the 'load' function; objects are in the 'res' list
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
271 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
272
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
273 Batch_correction_$method_graph.pdf
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
274 | graphical output
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
275 | For the *linear* and *lo(w)ess* methods, content depends on level of details chosen
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
276 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
277
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
278 Batch_correction_$method_variableMetadata.tabular
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
279 | tsv output
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
280 | Identical to the Variable metadata input file, with x more columns (where x is the number of batches) in case of *linear*, *lowess* and *loess* methods
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
281 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
282
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
283 Batch_correction_$method_dataMatrix.tabular
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
284 | tsv output (tabulated)
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
285 | Same formatting as Data Matrix file; contains corrected intensities
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
286 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
287
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
288
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
289 ---------------------------------------------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
290
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
291 ---------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
292 Working example
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
293 ---------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
294
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
295 .. class:: infomark
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
296
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
297 Refer to the corresponding "W4M HowTo" page:
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
298 | `MS data processing - Filters and normalisation &lt;http://workflow4metabolomics.org/sites/workflow4metabolomics.org/files/files/w4e-2016-data_processing.pdf&gt;`_
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
299 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
300 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
301
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
302 See also the reference history:
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
303 | `W4M00001_Sacurine-statistics (DOI:10.15454/1.4811121736910142E12) &lt;http://dx.doi.org/10.15454/1.4811121736910142E12&gt;`_
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
304 |
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
305
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
306 ---------------------------------------------------
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
307
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
308 ----
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
309 NEWS
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
310 ----
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
311
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
312 CHANGES IN VERSION 2.1.2
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
313 ========================
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
314
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
315 INTERNAL MODIFICATIONS
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
316
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
317 Minor modifications in config file
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
318
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
319 CHANGES IN VERSION 2.1.0
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
320 ========================
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
321
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
322 INTERNAL MODIFICATIONS
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
323
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
324 For PCA figure display only (**all_loess** options): missing values are set to the minimum value before PCA computation is performed (with svd)
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
325
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
326 Additional running and installation tests added with planemo, conda, and travis
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
327
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
328 BUG FIX
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
329
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
330 Variables with NA or 0 values in all reference samples are discarded before applying the **all_loess** normalization
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
331
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
332 INTERNAL MODIFICATIONS
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
333
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
334 Modifications of the **all_loess_wrapper** file to handle the recent **ropls** package versions (i.e. 1.3.15 and above) which use S4 classes
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
335
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
336 </help>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
337 <!-- [RECOMMENDED] All citations associated with this tool (main citation given above and other references). Can be extracted from the history panel -->
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
338 <citations>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
339 <!-- [HELP] As DOI or BibTex entry -->
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
340 <citation type="doi">10.1021/pr900499r</citation>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
341 <citation type="doi">10.1038/nprot.2011.335</citation>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
342 <citation type="bibtex">@ARTICLE{Cleveland91,
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
343 author = {Cleveland et al},
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
344 year = {1991},
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
345 journal = {Statistical Models in S, Chambers JM. and Hastie TJ. Ed., Chapman et Hall: London},
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
346 title = {Local Regression Models},
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
347 pages = {309-376},
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
348 editor = {Chambers JM. and Hastie TJ. Ed.},
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
349 publisher = {Chapman et Hall: London},
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
350 chapter = {8}
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
351 }</citation>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
352 <citation type="doi">10.1021/acs.jproteome.5b00354</citation>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
353 </citations>
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
354
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
355
73892ef177e3 Uploaded
melpetera
parents:
diff changeset
356 </tool>