comparison macros.xml @ 0:afc9136ab094 draft

"planemo upload for repository https://github.com/computational-metabolomics/dimspy-galaxy commit 6321871098b2c4bc9e321d20b7e66fff3d641839"
author computational-metabolomics
date Sat, 11 Apr 2020 16:47:41 -0400
parents
children 657c7f8f26b5
comparison
equal deleted inserted replaced
-1:000000000000 0:afc9136ab094
1 <macros>
2 <token name="@TOOL_VERSION@">1.4.0</token> <!-- used below as the version of the dimspy package requirement -->
3 <token name="@GALAXY_TOOL_VERSION@">0</token> <!-- not referenced in this file; presumably the wrapper revision used by the importing tool XMLs (confirm there) -->
4 <!-- Shared requirements block: requests the dimspy package at the version given by @TOOL_VERSION@. -->
5 <xml name="requirements">
6 <requirements>
7 <requirement type="package" version="@TOOL_VERSION@">dimspy</requirement>
8 </requirements>
9 </xml>
10 <!-- Command fragment: runs "dimspy hdf5-pm-to-txt" on $hdf5_file_out and writes $matrix_file_out, using the delimiter and the hdf5_to_txt section settings. -->
11 <token name="@HDF5_PM_TO_TXT@">
12 dimspy hdf5-pm-to-txt
13 --input '$hdf5_file_out'
14 --output '$matrix_file_out'
15 --delimiter $delimiter
16 --attribute_name $hdf5_to_txt.matrix_attr
17 --representation-samples $hdf5_to_txt.representation_samples
18 </token>
19 <!-- Command fragment: same conversion as @HDF5_PM_TO_TXT@, but with the comprehensive flag set and written to $matrix_comprehensive_file_out. -->
20 <token name="@HDF5_PM_TO_TXT_COMPREHENSIVE@">
21 dimspy hdf5-pm-to-txt
22 --input '$hdf5_file_out'
23 --output '$matrix_comprehensive_file_out'
24 --delimiter $delimiter
25 --comprehensive
26 --attribute_name $hdf5_to_txt.matrix_attr
27 --representation-samples $hdf5_to_txt.representation_samples
28 </token>
29 <!-- Parameter section "hdf5_to_txt": switches the optional text outputs on or off and selects the matrix orientation and the attribute written to its cells. -->
30 <xml name="hdf5_pm_to_txt">
31 <section name="hdf5_to_txt" title="Show options for additional output (*.tsv files)" expanded="false">
32 <param name="standard" type="boolean" checked="false" truevalue="true" falsevalue="false" label="Standard output?" help="Set to &quot;yes&quot; to produce a &quot;standard&quot; Peak Matrix (i.e. m/z and intensity)."/>
33 <param name="comprehensive" type="boolean" checked="false" truevalue="true" falsevalue="false" label="Comprehensive output?" help="Set to &quot;yes&quot; to produce a Peak Matrix with additional information (e.g. m/z and intensity, rsd, missing values)."/>
34 <param name="representation_samples" type="select" label="Should the rows or columns represent the samples?" help="">
35 <option value="rows" selected="true">Rows</option>
36 <option value="columns">Columns</option>
37 </param>
38 <param name="matrix_attr" type="select" label="The Peak Matrix should contain ... values" help="">
39 <option value="intensity" selected="true">Intensity</option>
40 <option value="mz">m/z</option>
41 <option value="snr">Signal-to-noise ratio (SNR)</option>
42 </param>
43 </section>
44 </xml>
45 <!-- Outputs: the HDF5 matrix has no filter; each text matrix is kept only when its boolean in the hdf5_to_txt section is true. -->
46 <xml name="outputs_peak_intensity_matrix">
47 <data name="hdf5_file_out" format="h5" label="${tool.name} on ${on_string}: Peak Intensity Matrix (HDF5 file)"/>
48 <data name="matrix_file_out" format="tsv" label="${tool.name} on ${on_string}: Peak Intensity Matrix">
49 <filter>hdf5_to_txt["standard"] is True</filter>
50 </data>
51 <data name="matrix_comprehensive_file_out" format="tsv" label="${tool.name} on ${on_string}: Peak Intensity Matrix (comprehensive)" >
52 <filter>hdf5_to_txt["comprehensive"] is True</filter>
53 </data>
54 </xml>
55 <!-- Shared DOI citations; the yield element marks where child elements supplied by the expanding tool are inserted. -->
56 <xml name="citations">
57 <citations>
58 <citation type="doi">10.1038/nprot.2016.156</citation>
59 <citation type="doi">10.1038/sdata.2014.12</citation>
60 <citation type="doi">10.1021/ac062446p</citation>
61 <citation type="doi">10.1021/ac2001803</citation>
62 <yield />
63 </citations>
64 </xml>
65
66 <token name="@example_filelist@"><![CDATA[
67
68 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
69 | **filename** | **classLabel** | **replicate** | **batch** | **injectionOrder** | **[...]** |
70 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
71 | sample_rep1.raw | sample | 1 | 1 | 1 | [...] |
72 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
73 | sample_rep2.raw | sample | 2 | 1 | 2 | [...] |
74 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
75 | sample_rep3.raw | sample | 3 | 1 | 3 | [...] |
76 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
77 | sample_rep4.raw | sample | 4 | 1 | 4 | [...] |
78 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
79 | blank_rep1.raw | blank | 1 | 1 | 5 | [...] |
80 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
81 | blank_rep2.raw | blank | 2 | 1 | 6 | [...] |
82 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
83 | blank_rep3.raw | blank | 3 | 1 | 7 | [...] |
84 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
85 | blank_rep4.raw | blank | 4 | 1 | 8 | [...] |
86 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
87 | ... | ... | ... | ... | ... | [...] |
88 +-------------------------+----------------+---------------+-----------+--------------------+-----------+
89
90 ]]></token>
91
92
93 <token name="@help_columns_peaklist@">
94
95 - **mz** - the mass-to-charge ratio of the extracted mass spectral peak
96
97 - **intensity** - the intensity of the extracted mass spectral peak
98
99 - **snr** - the signal-to-noise ratio of the extracted peak, which is defined as the ratio of the peak’s intensity value to that of the background noise intensity value
100
101 - **present** - a numeric value greater than 0 that indicates the total number of scans in which at least one peak was detected in a given file
102
103 - **fraction** - a proportion ranging from 0 to 1 that indicates the total number of times a peak was detected in a given scan event type, divided by the total number of occurrences of that scan event type recorded in a given file.
104
105 - **purity** - a numeric value ranging from 0 to 1 that indicates the proportion of scans, for a given scan event type, that contained a single mass spectral peak following hierarchical clustering. A purity score less-than 1 indicates that in some proportion of scans, multiple peaks within a single scan were grouped together during the hierarchical clustering process.
106
107 - **occurrence** - a numeric value greater than 0 that indicates the total number of peaks that were observed across scans within the user-defined ppm error tolerance.
108
109 - **snr_flag** - a boolean value indicating whether to keep (“1”) or discard (“0”) a peak according to its signal-to-noise ratio value.
110
111 - **fraction_flag** - a boolean value indicating whether a peak should be kept or discarded according to the ratio of the number of scans in which it was detected, to the number of scans in which it was not detected.
112
113 - **flags** - a boolean value indicating whether a peak should be retained or discarded based upon both its ‘snr_flag’ and ‘fraction_flag’ boolean values (if either is set to ‘0’ i.e. discard peak, then the ‘flags’ boolean should also be 0).
114
115 </token>
116
117 <token name="@example_peaklist@">
118
119
120 **Example of a processed and filtered peaklist**:
121
122
123 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
124 | mz | intensity | snr | present | fraction | rsd | occurrence | purity | snr_flag | fraction_flag | flags |
125 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
126 | 90.44000 | 4744.0 | 3.06 | 1 | 0.063 | nan | 1 | 1 | 1 | 0 | 0 |
127 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
128 | 97.07380 | 5423.6 | 3.52 | 1 | 0.063 | nan | 1 | 1 | 1 | 0 | 0 |
129 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
130 | 99.04180 | 4105.8 | 3.60 | 1 | 0.063 | nan | 1 | 1 | 1 | 0 | 0 |
131 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
132 | 99.49800 | 4775.7 | 3.05 | 1 | 0.063 | nan | 1 | 1 | 1 | 0 | 0 |
133 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
134 | 99.95020 | 5657.8 | 3.63 | 1 | 0.063 | nan | 1 | 1 | 1 | 0 | 0 |
135 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
136 | 100.40660 | 5489.5 | 3.57 | 3 | 0.188 | 14.51 | 3 | 1 | 1 | 0 | 0 |
137 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
138 | 100.8672 | 4841.18 | 3.27 | 7 | 0.4375 | 16.36 | 7 | 1 | 1 | 0 | 0 |
139 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
140 | 101.0027 | 9047.79 | 5.99 | 16 | 1 | 21.53 | 19 | 0.8125 | 1 | 1 | 1 |
141 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
142 | 101.0033 | 271893.9 | 182 | 16 | 1 | 4.17 | 16 | 1 | 1 | 1 | 1 |
143 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
144 | 101.0038 | 8738.03 | 5.9 | 14 | 0.875 | 9.71 | 14 | 1 | 1 | 1 | 1 |
145 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
146 | 101.004 | 5166.67 | 3.5 | 5 | 0.3125 | 18.02 | 6 | 0.8 | 1 | 0 | 0 |
147 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
148 | 101.0599 | 5894.69 | 3.88 | 2 | 0.125 | 15.06 | 2 | 1 | 1 | 0 | 0 |
149 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
150 | 101.2728 | 6846.28 | 4.44 | 1 | 0.0625 | nan | 1 | 1 | 1 | 0 | 0 |
151 +-----------+-----------+------+---------+----------+-------+------------+--------+----------+---------------+-------+
152
153 </token>
154
155 <token name="@help_options_addtional_output@">
156
157 **Show options for additional output(s)** (OPTIONAL):
158
159 - **Standard output** (default = **No**) - boolean toggle where selection of:
160
161 - **No** - prevent the export of a .txt formatted peak matrix to the active Galaxy history.
162
163 - **Yes** - export a .txt formatted peak matrix to the active Galaxy history that includes only those peaks from the input peak intensity matrix that passed the filtering procedure.
164
165 - **Comprehensive output** (default = **No**) - boolean toggle where selection of:
166
167 - **No** - prevents export of a .txt formatted comprehensive peak matrix.
168
169 - **Yes** - exports a .txt formatted comprehensive peak matrix to the active Galaxy history that contains the m/z, missing values and other metrics associated with all peaks included in the input peak intensity matrix, including the metric defined by the "The peak matrix should contain intensity | m/z | SNR values" parameter.
170
171 - **Should rows or columns represent the samples?** (default = **rows**) - binary toggle where selection of:
172
173 - **rows** - sample information is presented in the rows and m/z values (for aligned mass spectral peaks) in the columns of any output peak matrix.
174
175 - **columns** - sample information is presented in the columns and m/z values (for aligned mass spectral peaks) in the rows of any output peak matrix.
176
177 - **The peak matrix should contain intensity | m/z | SNR values** - use this option to define which peak metric is inserted into the cells of any optionally-output peak matrix:
178
179 - **Intensity** - writes the absolute peak intensity to the cells of the peak matrix
180
181 - **m/z** - writes the mass-to-charge ratio to the cells of the peak matrix
182
183 - **signal-to-noise ratio (SNR)** - writes the signal-to-noise ratio to the cells of the peak matrix
184
185 </token>
186
187 <token name="@help_outputs_matrix@">
188
189 **Default output** - a HDF5 file containing the aligned peak intensity matrix.
190
191 |
192
193 **Optional outputs** - the metric recorded in any optionally output peak matrix/matrices is defined using the parameter "The peak matrix should contain intensity | m/z | SNR values". By default, study samples are listed row-wise, while mass-to-charge ratios of the aligned mass spectral peaks are presented in columns (to adjust, users must adjust the "Should rows or columns represent samples" toggle to “columns”).
194
195
196 - **Standard output** - an aligned peak matrix in tab-delimited format (“.” as decimal and NA for missing values).
197
198 **Example of a standard peak intensity matrix**:
199
200 +------------+----------+----------+----------+----------+---------+
201 | mz | 96.04216 | 99.08062 | 100.0759 | 100.8672 | ... |
202 +------------+----------+----------+----------+----------+---------+
203 | QC_1 | 0 | 0 | 0 | 0 | ... |
204 +------------+----------+----------+----------+----------+---------+
205 | Blank_1 | 3342.626 | 0 | 0 | 0 | ... |
206 +------------+----------+----------+----------+----------+---------+
207 | Control_10 | 0 | 0 | 45432.2 | 0 | ... |
208 +------------+----------+----------+----------+----------+---------+
209 | Sample_2 | 0 | 3423.3 | 0 | 0 | ... |
210 +------------+----------+----------+----------+----------+---------+
211 | Control_5 | 0 | 0 | 49759 | 0 | ... |
212 +------------+----------+----------+----------+----------+---------+
213 | Control_10 | 0 | | 39890.5 | 0 | ... |
214 +------------+----------+----------+----------+----------+---------+
215 | Sample_20 | 0 | 14563.7 | 0 | 0 | ... |
216 +------------+----------+----------+----------+----------+---------+
217 | Sample_2 | 0 | 34676.4 | 0 | 0 | ... |
218 +------------+----------+----------+----------+----------+---------+
219 | Sample_14 | 0 | 13134.9 | 0 | 521.4 | ... |
220 +------------+----------+----------+----------+----------+---------+
221 | ... | ... | ... | ... | ... | ... |
222 +------------+----------+----------+----------+----------+---------+
223
224 |
225
226 - **Comprehensive output** - an aligned peak matrix, as described for the "standard output" (above), including all metadata from the "Process Scans" Filelist/samplelist and the following additional mass spectral peak metrics:
227
228 - **present** - a positive integer value (0 <![CDATA[ < ]]> value <![CDATA[ < ]]> total number of study samples in the filelist / samplelist) that indicates the total number of study samples in which a peak was detected with the specified mass-to-charge ratio, plus or minus the user-defined ppm error tolerance.
229
230 - **occurrence** - a positive integer value indicating the number of peaks that were grouped together during the alignment procedure and thus, that were used to calculate the average mass-to-charge ratio indicated for the aligned peak. A value greater than that given in the “present” metric indicates that one or more peaklists contained more-than one mass spectral peak with the specified mass-to-charge, plus or minus the user-defined ppm error tolerance.
231
232 - **purity** - a proportion ranging from 0 to 1 that indicates the number of scans in which only a single peak was detected during the peaklist alignment process. If the value in the “occurrence” metric is greater than the “present” metric, purity will be <![CDATA[ < ]]> 1. A purity <![CDATA[ < ]]> 1 means that in at least one peaklist there was more-than one mass spectral peak with the specified mass-to-charge, plus or minus the user-defined ppm error tolerance.
233
234 - **rsd_all** - a numeric value indicating the percent relative standard deviation (otherwise termed the percent coefficient of variation) of peak intensities for peaks aligned together using the Align Samples tool. If fewer than 2 peaks were aligned across samples, then the rsd_all column will be filled in with ‘nan’
235
236 - **blank_flag** (may be absent if the "Blank filter" tool was not applied) - a boolean value where 0 = reject peak, 1 = accept peak. A peak is accepted during blank filtering if a user-defined minimum proportion of study samples had peak intensity values greater-than the product of the average of “reference” sample peak intensities and the “min_fold_change” parameter.
237
238 - **fraction_flag** (may be absent if the "Sample filter" tool was not applied) - a boolean value where 0 = reject peak, 1 = accept peak. If greater-than a user-defined minimum fraction of samples (whether checked across ALL experimental classes, or within ANY of the individual experimental classes) had recorded intensity values for a given peak, then this peak is accepted, i.e. it is considered in downstream processing procedures, while rejected peaks are not.
239
240 - **flags** - a boolean value indicating whether a peak should be included (“1”) or excluded (“0”) from downstream processing procedures. Exclusion of a peak occurs if the thresholds for “relative standard deviation” and/or “minimum number of technical replicates a peak has to be present in” were not met.
241
242 |
243
244 **Example of a comprehensive peak intensity matrix**:
245
246 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
247 | mz | missing values | tags_batch | tags_replicates | tags_replicate | tags_injectionOrder | tags_classLabel | tags_untyped | 96.04216 | 99.08062 | 100.0759 | 100.8672 | ... |
248 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
249 | present* | | | | | | | | 1 | 4 | 3 | 1 | ... |
250 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
251 | occurrence* | | | | | | | | 1 | 4 | 4 | 1 | ... |
252 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
253 | purity* | | | | | | | | 1 | 1 | 1 | 1 | ... |
254 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
255 | rsd_all* | | | | | | | | nan | nan | 10.98 | nan | ... |
256 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
257 | flags* | | | | | | | | 1 | 1 | 1 | 1 | ... |
258 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
259 | QC_1 | 2901 | 1 | 2_3_4 | 2 | 2 | QC | | 0 | 0 | 0 | 0 | ... |
260 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
261 | Blank_1 | 2948 | 1 | 1_2_4 | 1 | 5 | Blank | | 3342.626 | 0 | 0 | 0 | ... |
262 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
263 | Control_10 | 2921 | 1 | 2_3_4 | 2 | 10 | Control | | 0 | 0 | 45432.2 | 0 | ... |
264 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
265 | Sample_2 | 2819 | 1 | 1_2_4 | 1 | 13 | Exposed | | 0 | 3423.3 | 0 | 0 | ... |
266 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
267 | Control_5 | 2877 | 1 | 2_3_4 | 2 | 18 | Control | | 0 | 0 | 49759 | 0 | ... |
268 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
269 | Control_10 | 2856 | 1 | 1_2_3 | 1 | 21 | Control | | 0 | | 39890.5 | 0 | ... |
270 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
271 | Sample_20 | 2855 | 1 | 1_2_4 | 1 | 25 | Exposed | | 0 | 14563.7 | 0 | 0 | ... |
272 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
273 | Sample_2 | 2814 | 1 | 1_2_4 | 1 | 29 | Exposed | | 0 | 34676.4 | 0 | 0 | ... |
274 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
275 | Sample_14 | 2870 | 1 | 1_2_3 | 1 | 33 | Exposed | | 0 | 13134.9 | 0 | 521.4 | ... |
276 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
277 | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... | ... |
278 +-------------+----------------+------------+-----------------+----------------+---------------------+-----------------+--------------+----------+----------+----------+----------+---------+
279
280 </token>
281
282
283 <token name="@github_developers_contributors@">
284 GitHub repository (source code)
285 --------------------------------
286
287 Galaxy Tool Wrappers: https://github.com/computational-metabolomics/dimspy-galaxy/
288 DIMSpy package: https://github.com/computational-metabolomics/dimspy/
289
290
291 Developers and contributors
292 ---------------------------
293
294 - Ralf Weber (r.j.weber@bham.ac.uk) - University of Birmingham (UK)
295 - Martin R. Jones (m.r.jones.1@bham.ac.uk) - University of Birmingham (UK)
296 - Thomas Lawson (tnl495@bham.ac.uk) - University of Birmingham (UK)
297
298 </token>
299
300 <token name="@license@">
301 License
302 -------
303 DIMSpy is released under the GNU General Public License v3.0 (see `LICENSE file`_)
304
305 .. _`LICENSE file`: https://github.com/computational-metabolomics/dimspy-galaxy/blob/master/LICENSE
306
307 </token>
308
309
310 </macros>