annotate BC/batch_correction.xml @ 4:23314e1192d4 draft default tip

Uploaded
author melpetera
date Thu, 14 Jan 2021 09:56:58 +0000
parents
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
4
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
1 <tool id="Batch_correction" name="Batch_correction" version="3.0.0">
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
2 <description>Corrects intensities for signal drift and batch-effects</description>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
3
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
4 <macros>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
5 <import>macros.xml</import>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
6 </macros>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
7
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
8 <requirements>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
9 <requirement type="package" version="1.1_4">r-batch</requirement>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
10 <requirement type="package" version="1.7_8">r-ade4</requirement>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
11 <requirement type="package" version="1.70.0">bioconductor-pcamethods</requirement>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
12 <requirement type="package" version="1.10.0">bioconductor-ropls</requirement>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
13 </requirements>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
14
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
15 <stdio>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
16 <exit_code range="1:" level="fatal" />
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
17 </stdio>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
18
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
19 <command><![CDATA[
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
20 #if str($span_condition.method) == 'all_loess_pool':
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
21 Rscript $__tool_directory__/batch_correction_all_loess_wrapper.R
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
22 dataMatrix "$dataMatrix"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
23 sampleMetadata "$sampleMetadata"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
24 variableMetadata "$variableMetadata"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
25 method "all_loess_pool"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
26 span "${span_condition.span}"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
27
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
28 #elif str($span_condition.method) == 'all_loess_sample':
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
29 Rscript $__tool_directory__/batch_correction_all_loess_wrapper.R
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
30 dataMatrix "$dataMatrix"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
31 sampleMetadata "$sampleMetadata"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
32 variableMetadata "$variableMetadata"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
33 method "all_loess_sample"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
34 span "${span_condition.span}"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
35 #else:
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
36 Rscript $__tool_directory__/batch_correction_3Lwrapper.R
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
37 analyse "batch_correction"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
38 dataMatrix "$dataMatrix"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
39 sampleMetadata "$sampleMetadata"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
40 variableMetadata "$variableMetadata"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
41 method "${span_condition.method}"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
42 #if str($span_condition.method) == 'linear':
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
43 span "none"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
44 #else:
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
45 span "${span_condition.span}"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
46 #end if
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
47 valnull "${span_condition.valnull}"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
48 ref_factor "${span_condition.ref_factor}"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
49 detail "${span_condition.detail}"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
50 #end if
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
51 dataMatrix_out "$dataMatrix_out" variableMetadata_out "$variableMetadata_out"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
52 graph_output "$graph_output" rdata_output "$rdata_output"
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
53 @SM_CUSTOM@
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
54 ]]></command>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
55
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
56 <inputs>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
57 <param name="dataMatrix" label="Data matrix file " format="tabular" type="data" />
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
58 <param name="sampleMetadata" label="Sample metadata file " format="tabular" type="data" help="must contain at least the three following columns: 'batch' + 'injectionOrder' + 'sampleType'"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
59 <param name="variableMetadata" label="Variable metadata file " format="tabular" type="data" />
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
60
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
61 <expand macro="sm_customisation"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
62
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
63 <conditional name="span_condition">
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
64 <param name="method" label="Type of regression model " type="select" help="To select between linear or non-linear (lowess or loess) methods to be used in Van der Kloet algorithm ; when using loess, you can choose to use pools or samples to model batch effect.">
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
65 <option value="linear">linear</option>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
66 <option value="lowess">lowess</option>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
67 <option value="loess">loess</option>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
68 <option value="all_loess_pool">all loess pool</option>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
69 <option value="all_loess_sample">all loess sample</option>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
70 </param>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
71 <when value="linear">
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
72 <expand macro="lll_options"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
73 </when>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
74 <when value="lowess">
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
75 <expand macro="lll_span"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
76 <expand macro="lll_options"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
77 </when>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
78 <when value="loess">
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
79 <expand macro="lll_span"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
80 <expand macro="lll_options"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
81 </when>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
82 <when value="all_loess_pool">
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
83 <param name="span" type="float" value="1" label="span" help="smoothing parameter; must be > 0"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
84 </when>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
85 <when value="all_loess_sample">
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
86 <param name="span" type="float" value="1" label="span" help="smoothing parameter; must be > 0"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
87 </when>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
88 </conditional>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
89 </inputs>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
90
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
91 <outputs>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
92 <data name="dataMatrix_out" label="BC_${span_condition.method}_${dataMatrix.name}" format="tabular"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
93 <data name="variableMetadata_out" label="BC_${span_condition.method}_${variableMetadata.name}" format="tabular"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
94 <data name="graph_output" label="${tool.name}_${span_condition.method}_graph" format="pdf"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
95 <data name="rdata_output" label="${tool.name}_${span_condition.method}_rdata" format="rdata">
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
96 <filter>span_condition['method'] == 'all_loess_pool' or span_condition['method'] == 'all_loess_sample'</filter>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
97 </data>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
98 </outputs>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
99
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
100 <tests>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
101 <test>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
102 <param name="dataMatrix" value="input-batchcorrection-dataMatrix.tsv"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
103 <param name="sampleMetadata" value="input-batchcorrection-sampleMetadata.tsv"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
104 <param name="variableMetadata" value="input-batchcorrection-variableMetadata.tsv"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
105 <param name="method" value="all_loess_pool"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
106 <param name="span" value="1"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
107 <output name="dataMatrix_out" file="output-batchcorrection-dataMatrix.tsv"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
108 </test>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
109 <test>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
110 <param name="dataMatrix" value="input-batchcorrection-dataMatrix.tsv"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
111 <param name="sampleMetadata" value="input-batchcorrection-sampleMetadata-customSampleType.tsv"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
112 <param name="variableMetadata" value="input-batchcorrection-variableMetadata.tsv"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
113 <param name="method" value="loess"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
114 <param name="span" value="1"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
115 <param name="sample_type_col_name" value="MySampType"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
116 <param name="sampleTypeTagPool" value="lot"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
117 <param name="sampleTypeTagBlank" value="blanc"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
118 <param name="sampleTypeTagSample" value="echant"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
119 <output name="dataMatrix_out" file="output-batchcorrection-dataMatrix-3L.tsv"/>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
120 </test>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
121 </tests>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
122
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
123 <help>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
124
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
125 .. class:: infomark
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
126
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
127 **Authors**
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
128 | Jean-Francois Martin - PF MetaToul-AXIOM ; INRAE ; MetaboHUB (for original version of this tool and overall development of the R script)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
129 | Melanie Petera - PFEM ; INRAE ; MetaboHUB (for R wrapper and R script improvement regarding "linear/lowess/loess" methods)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
130 | Marion Landi - FLAME ; PFEM (for original xml interface and R wrapper)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
131 | Franck Giacomoni - PFEM ; INRAE ; MetaboHUB (for original xml interface and R wrapper)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
132 | Etienne Thevenot - LIST/LADIS ; CEA ; MetaboHUB (for R script and wrapper regarding "all loess pool" and "all loess sample" methods)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
133
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
134 ---------------------------------------------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
135
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
136 .. class:: infomark
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
137
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
138 **Please cite** If you use this tool, please cite:
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
139
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
140 when using the **linear**, **lowess** or **loess** methods:
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
141 | `F.M. Van Der Kloet, I. Bobeldijk, E.R. Verheij, R.H. Jellema. (2009). "Analytical error reduction using single point calibration for accurate and precise metabolomic phenotyping." Journal of Proteome Research p5132-5141 &lt;http://www.ncbi.nlm.nih.gov/pubmed/19754161&gt;`_
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
142
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
143 when using the **all loess pool** or **all loess sample** method:
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
144 | `Dunn et al (2011). Procedures for large-scale metabolic profiling of serum and plasma using gas chromatography and liquid chromatography coupled to mass spectrometry. Nature Protocols, 6:1060-1083 &lt;http://dx.doi.org/10.1038/nprot.2011.335&gt;`_
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
145 | Cleveland et al (1997). In Statistical Models in S; Chambers JM. and Hastie TJ. Ed.; Chapman et Hall: London; pp. 309-376
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
146 | Etienne A. Thevenot, Aurelie Roux, Ying Xu, Eric Ezan, and Christophe Junot (2015). Analysis of the human adult urinary metabolome variations with age, body mass index and gender by implementing a comprehensive workflow for univariate and OPLS statistical analyses. *Journal of Proteome Research*, **14**:3322-3335 (http://dx.doi.org/10.1021/acs.jproteome.5b00354).
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
147
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
148 ---------------------------------------------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
149
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
150 .. class:: infomark
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
151
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
152 **Tool updates**
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
153
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
154 See the **NEWS** section at the bottom of this page
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
155
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
156 ---------------------------------------------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
157
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
158 ================
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
159 Batch_correction
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
160 ================
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
161
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
162 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
163
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
164 -----------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
165 Description
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
166 -----------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
167
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
168 | **Instrumental drift** and **offset differences** between batches have been described in **LC-MS** experiments when the number of samples is large and/or multiple batches of acquisition are needed.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
169 | Recently a normalization strategy relying on the measurements of a **pooled** (or QC) sample injected periodically has been described: for each variable, a **regression model** is fitted to the values of the **pool** and subsequently used to adjust the intensities of the samples of interest (van der Kloet et al, 2009; Dunn et al, 2011).
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
170 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
171 | The current tool implements **two strategies** which differ in the way the regression model is applied to the variables (either depending on variable quality metrics, or 'loess' model for all variables) and also in the generated figure.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
172 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
173
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
174
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
175 -----------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
176 Workflow position
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
177 -----------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
178
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
179 .. image:: batch_correction.png
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
180 :width: 800
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
181
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
182
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
183 -----------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
184 Input files
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
185 -----------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
186
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
187 +----------------------------+------------+
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
188 | Parameter : num + label | Format |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
189 +============================+============+
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
190 | 1 : Data Matrix file | tabular |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
191 +----------------------------+------------+
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
192 | 2 : Sample metadata file | tabular |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
193 +----------------------------+------------+
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
194 | 3 : Variable metadata file | tabular |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
195 +----------------------------+------------+
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
196
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
197 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
198
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
199 Data Matrix file must contain the intensity values of variables.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
200 | First line must contain all the samples' names
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
201 | First column must contain all the variables' ID
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
202
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
203
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
204 Sample metadata file must contain at least the three following columns:
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
205 | - a batch column (default to "*batch*") to identify the batches of analyses
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
206 | - an injection order column (default to "*injectionOrder*") composed of integers defining the injection order of samples
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
207 | - a sample type column (default to "*sampleType*") indicating if a sample is a biological one ("*sample*"), a QC-pool ("*pool*") or a blank ("*blank*")
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
208 | *Default values* can be changed according to your data coding using the customisation parameters in the "**Sample metadata file coding parameters**" section.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
209
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
210
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
211 **Notes concerning your design:**
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
212 | - the 3 mandatory columns must not contain NA
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
213 | - your data should contain at least 3 QC-pools in each batch for intra-batch **linear** adjustment and 8 for **lo(w)ess** adjustment (minimum of 5 for **all loess** methods)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
214
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
215
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
216
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
217 ----------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
218 Parameters
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
219 ----------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
220
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
221
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
222 Sample metadata file coding parameters
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
223 | Enables to give the names of columns in the sample metadata table that contain the injection order, the batches and the sample types.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
224 | Also enables to specify the sample type coding used in the sampletype column.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
225 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
226
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
227 Type of regression model
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
228 | To choose between *linear*, *lowess*, *loess*, *all loess pool*, and *all loess sample* strategies
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
229 | **- Option 1** (**linear**, **lowess**, and **loess** methods): before the normalisation of each variable, some quality metrics are computed (see the "Determine Batch Correction" module); depending on the result, the variable can be normalized or not, with either the **linear**, **lowess** or **loess** model.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
230 | **- Option 2** (**all loess pool** and **all loess sample**): each variable is normalized by using the 'loess' model;
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
231 | in the case **all loess pool** is chosen and the number of pool observations is below 5, the linear method is used (for all variables) and a warning is generated;
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
232 | if the pool intensities are not representative of the samples (which can be viewed on the figure where both trends are shown), the case **all loess sample** enables using the sample intensities (instead of the pool intensities) as the reference for the loess curve.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
233 | In all "option 2" cases: the **median intensity of the reference observations** (either 'pool' or 'sample') is used as the scaling factor after the initial intensities have been divided by the loess predictions.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
234 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
235
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
236 Span
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
237 | Smoothing parameter, advanced option for *lo(w)ess* and *all loess* methods
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
238 | In case of a loess fit, the **span** parameter (between 0 and 1) controls the smoothing
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
239 | (the higher the smoother; higher values are prefered to avoid overfitting; Cleveland et al, 1997).
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
240 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
241
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
242 Unconsistant values
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
243 | available for regression model *linear*, *lowess* and *loess*
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
244 | Controls what is done regarding negative or infinite values that can be generated during regression estimation.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
245 | *Prevent it* will change the normalisation term leading to an unconsistant value to prevent it:
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
246 | when intra batch denominator term is below 1, it is turned to the minimum >1 one obtained in the concerned batch.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
247 | *Consider it as a missing value* will switch concerned intensities to NA;
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
248 | this option implies that concerned ions will not be considered in PCA display.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
249 | *Consider it as a null intensity* will switch concerned intensities to 0.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
250 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
251
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
252 Factor of interest
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
253 | available for regression model *linear*, *lowess* and *loess*
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
254 | Name of the factor (column header) that will be used as a categorical variable for design plots (often a biological factor ; if none, put the batch column name).
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
255 | This factor does not affect correction calculation.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
256 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
257
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
258 Level of details for plots
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
259 | available for regression model *linear*, *lowess* and *loess*
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
260 | *basic*: Sum of intensities + PCA + CV boxplot (before and after correction)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
261 | *standard*: 'basic' plots + before/after-correction plots of intensities over injection order, and design effects for each ion
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
262 | *complete*: 'standard' plots + QC-pool regression plots per batch with samples' intensities over injection order
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
263 | This factor is not used by the *all loess* methods where a unique figure is generated showing the sum of intensities along injection order, and the first 4 PCA scores.
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
264 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
265
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
266
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
267 ------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
268 Output files
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
269 ------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
270
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
271 Batch_correction_$method_rdata.rdata ('all_loess' methods only)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
272 | binary data
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
273 | Download, open R and use the 'load' function; objects are in the 'res' list
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
274 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
275
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
276 Batch_correction_$method_graph.pdf
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
277 | graphical output
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
278 | For the *linear* and *lo(w)ess* methods, content depends on level of details chosen
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
279 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
280
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
281 Batch_correction_$method_variableMetadata.tabular
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
282 | tsv output
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
283 | Identical to the variable metadata input file, with x more columns (where x is the number of batches) in case of *linear*, *lowess* and *loess* methods
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
284 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
285
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
286 Batch_correction_$method_dataMatrix.tabular
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
287 | tsv output (tabulated)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
288 | Same formatting as the data matrix file; contains corrected intensities
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
289 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
290
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
291
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
292 ---------------------------------------------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
293
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
294 ----------------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
295 Additional information
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
296 ----------------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
297
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
298 .. class:: infomark
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
299
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
300 Refer to the corresponding "W4M HowTo" page:
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
301 | `MS data processing - Filters and normalisation &lt;https://download.workflow4metabolomics.org/docs/w4e2018/2018-10_EC_W4E%20-%20Dataprocessing_Filter_and_normalisation.pdf&gt;`_
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
302 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
303
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
304 See also the reference history:
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
305 | `W4M00001_Sacurine-statistics (DOI:10.15454/1.4811121736910142E12) &lt;http://dx.doi.org/10.15454/1.4811121736910142E12&gt;`_
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
306
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
307
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
308 ---------------------------------------------------
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
309
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
310 ----
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
311 NEWS
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
312 ----
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
313
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
314 CHANGES IN VERSION 3.0.0
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
315 ========================
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
316
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
317 NEW FEATURES
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
318
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
319 | - Specific names for the 'sampleType', 'injectionOrder', and 'batch' from sampleMetadata are now available in a dedicated parameter section
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
320 | - Addition of a sum of ions before/after plot for linear/lowess/loess methods
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
321 | - Addition of a third option in "Null values" parameter (renamed "unconsistant values") in linear/lowess/loess methods
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
322 | - linear/lowess/loess methods now handle NA in intensities and allow "blank" samples in the dataset
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
323 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
324
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
325 INTERNAL MODIFICATIONS
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
326
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
327 | - XML optimisation using macros
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
328 | - Output name changes
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
329 | - linear/lowess/loess methods: disabling of RData output
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
330 | - linear/lowess/loess methods: split of tool-linked code and script-linked one
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
331 | - linear/lowess/loess methods: adjustments in the normalisation process to match matters linked to NA acceptance
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
332 | - linear/lowess/loess methods: better handling of special characters in IDs and column names
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
333 |
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
334
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
335 CHANGES IN VERSION 2.2.4
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
336 ========================
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
337
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
338 INTERNAL MODIFICATIONS
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
339
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
340 Fixed bug for pool selection ("all_loess" methods)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
341
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
342 CHANGES IN VERSION 2.2.2
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
343 ========================
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
344
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
345 INTERNAL MODIFICATIONS
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
346
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
347 Fixed bug for color plot ("all_loess" methods)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
348
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
349 CHANGES IN VERSION 2.2.0
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
350 ========================
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
351
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
352 NEW FEATURE
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
353
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
354 Specific names for the 'sampleType', 'injectionOrder', and 'batch' from sampleMetadata can be selected by the user (for compatibility with the MTBLS downloader)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
355
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
356 CHANGES IN VERSION 2.1.2
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
357 ========================
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
358
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
359 INTERNAL MODIFICATIONS
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
360
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
361 Minor modifications in config file
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
362
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
363 CHANGES IN VERSION 2.1.0
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
364 ========================
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
365
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
366 INTERNAL MODIFICATIONS
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
367
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
368 For PCA figure display only (**all_loess** options): missing values are set to the minimum value before PCA computation is performed (with svd)
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
369
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
370 Additional running and installation tests added with planemo, conda, and travis
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
371
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
372 BUG FIX
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
373
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
374 Variables with NA or 0 values in all reference samples are discarded before applying the **all_loess** normalization
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
375
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
376 INTERNAL MODIFICATIONS
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
377
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
378 Modifications of the **all_loess_wrapper** file to handle the recent **ropls** package versions (i.e. 1.3.15 and above) which use S4 classes
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
379
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
380 </help>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
381 <!-- [RECOMMANDED] All citations associated to this tool (main citation given above and other references). Can be extracted from the history panel -->
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
382 <citations>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
383 <!-- [HELP] As DOI or BibTex entry -->
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
384 <citation type="doi">10.1021/pr900499r</citation>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
385 <citation type="doi">10.1038/nprot.2011.335</citation>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
386 <citation type="bibtex">@ARTICLE{Cleveland91,
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
387 author = {Cleveland et al},
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
388 year = {1991},
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
389 journal = {Statistical Models in S, Chambers JM. and Hastie TJ. Ed., Chapman et Hall: London},
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
390 title = {Local Regression Models},
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
391 pages = {309-376},
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
392 editor = {Chambers JM. and Hastie TJ. Ed.},
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
393 publisher = {Chapman et Hall: London},
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
394 chapter = {8}
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
395 }</citation>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
396 <citation type="doi">10.1021/acs.jproteome.5b00354</citation>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
397 </citations>
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
398
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
399
23314e1192d4 Uploaded
melpetera
parents:
diff changeset
400 </tool>