comparison vkmz.xml @ 6:35b984684450 draft

planemo upload for repository https://github.com/HegemanLab/VKMZ commit 5ef8d2b36eb35ff5aad5d5e9b78c38405fc95c1a
author eslerm
date Tue, 10 Jul 2018 17:58:35 -0400
parents 04079c34452a
children b0ce669ce794
comparison
equal deleted inserted replaced
5:04079c34452a 6:35b984684450
1 <tool id="VKMZ" name="VKMZ" version="1.1.1"> 1 <tool id="VKMZ" name="VKMZ" version="1.2.0">
2 2
3 <description>metabolomics formula prediction and van Krevelen diagram generation</description> 3 <description>metabolomics formula prediction and van Krevelen diagram generation</description>
4 4
5 <requirements> 5 <requirements>
6 <requirement type="package" version="2.7">python</requirement> 6 <requirement type="package" version="2.7">python</requirement>
7 <requirement type="package">pandas</requirement>
8 <requirement type="package">plotly</requirement>
9 </requirements> 7 </requirements>
10 8
11 <stdio> 9 <stdio>
12 <exit_code range="1:" level="fatal" /> 10 <exit_code range="1:" level="fatal" />
13 </stdio> 11 </stdio>
35 --error $prediction.error 33 --error $prediction.error
36 --database $prediction.database_type.database 34 --database $prediction.database_type.database
37 #if $prediction.unique=="True": 35 #if $prediction.unique=="True":
38 --unique 36 --unique
39 #end if 37 #end if
40 --size $diagram.size
41 --size-algorithm $diagram.sizealgorithm
42 --directory $__tool_directory__/ 38 --directory $__tool_directory__/
43 ]]></command> 39 ]]></command>
44 40
45 <inputs> 41 <inputs>
46 <conditional name="mode"> 42 <conditional name="mode">
56 <when value="tsv"> 52 <when value="tsv">
57 <param name="input" label="Tabular input" type="data" format="tabular" help="Select tabular data" /> 53 <param name="input" label="Tabular input" type="data" format="tabular" help="Select tabular data" />
58 </when> 54 </when>
59 </conditional> 55 </conditional>
60 <section name="advanced_input" title="Advanced Input Options" expanded="false"> 56 <section name="advanced_input" title="Advanced Input Options" expanded="false">
61 <param name="polarity" label="Override polarity" type="select" help="Set polarity for all samples ignoring input files"> 57 <param name="polarity" label="Override polarity" type="select" help="Force the polarity of all samples">
62 <option value="NA">No override</option> 58 <option value="NA">No override</option>
63 <option value="negative">Negative</option> 59 <option value="negative">Negative</option>
64 <option value="positive">Positive</option> 60 <option value="positive">Positive</option>
65 </param> 61 </param>
66 <param name="no_adjustment" label="Disable polarity based mass adjustment" type="boolean" truevalue="True" help="Use this option if data contains neutral masses." /> 62 <param name="no_adjustment" label="Disable polarity based mass adjustment" type="boolean" truevalue="True" help="Use this option if data contains neutral masses." />
67 </section> 63 </section>
68 <section name="prediction" title="Prediction Options" expanded="true"> 64 <section name="prediction" title="Prediction Options" expanded="true">
69 <param name="error" label="Mass Error (PPM)" type="float" value="3.0" min="0" help="Set according to mass spectrometer's mass error in parts-per-million" /> 65 <param name="error" label="Mass Error (PPM)" type="float" value="10.0" min="0" help="Set according to expected mass error in parts-per-million" />
70 <conditional name="database_type"> 66 <conditional name="database_type">
71 <param name="database_type_selector" type="select" label="Database Type"> 67 <param name="database_type_selector" type="select" label="Database Type">
72 <option value="heuristic">Heuristically Generated</option> 68 <option value="heuristic">Heuristically Generated</option>
73 <option value="custom">Custom</option> 69 <option value="custom">Custom</option>
74 </param> 70 </param>
84 <param name="database" label="Database" type="data" format="tabular" help="Select a custom tabular database" /> 80 <param name="database" label="Database" type="data" format="tabular" help="Select a custom tabular database" />
85 </when> 81 </when>
86 </conditional> 82 </conditional>
87 <param name="unique" label="Unique matches" type="boolean" truevalue="True" help="Only output features with a single prediction" /> 83 <param name="unique" label="Unique matches" type="boolean" truevalue="True" help="Only output features with a single prediction" />
88 </section> 84 </section>
89 <section name="diagram" title="Diagram Options" expanded="true">
90 <param name="size" label="Minimum Maker Size" type="integer" value="5" min="0" help="Set the base size of diagram's markers" />
91 <param name="sizealgorithm" label="Marker Size Algorithm" type="select" help="Select algorithm to change marker sizes. 1.) Set all markers to the base size, 2.) Marker sizes are relative to feature's log intensity">
92 <option value="0">Uniform</option>
93 <option value="1">Relative Log Intensity</option>
94 </param>
95 </section>
96 </inputs> 85 </inputs>
97
98 <outputs> 86 <outputs>
99 <data format="tabular" name="output" from_work_dir="vkmz.tsv" label="${tool.name}_${mode.mode_selector}_tabular" /> 87 <data format="tabular" name="output" from_work_dir="vkmz.tsv" label="${tool.name}_${mode.mode_selector}_tabular" />
100 <data format="html" name="output_html" from_work_dir="vkmz.html" label="${tool.name}_${mode.mode_selector}_html" /> 88 <data format="html" name="output_html" from_work_dir="vkmz.html" label="${tool.name}_${mode.mode_selector}_html" />
101 </outputs> 89 </outputs>
102 90
106 <param name="mode_selector" value="xcms" /> 94 <param name="mode_selector" value="xcms" />
107 <param name="datamatrix" value="datamatrix.tabular" /> 95 <param name="datamatrix" value="datamatrix.tabular" />
108 <param name="samplemetadata" value="sampleMetadata.tabular" /> 96 <param name="samplemetadata" value="sampleMetadata.tabular" />
109 <param name="variablemetadata" value="variableMetadata.tabular" /> 97 <param name="variablemetadata" value="variableMetadata.tabular" />
110 </conditional> 98 </conditional>
111 <param name="error" value="3" /> 99 <param name="error" value="10" />
112 <param name="database" value="databases/bmrb-light.tsv" /> 100 <param name="database" value="databases/bmrb-light.tsv" />
113 <output name="output"> 101 <output name="output">
114 <assert_contents> 102 <assert_contents>
115 <has_text text="0.00016357" /> 103 <has_text text="0.00016357" />
116 </assert_contents> 104 </assert_contents>
119 <test> 107 <test>
120 <conditional name="mode"> 108 <conditional name="mode">
121 <param name="mode_selector" value="tsv" /> 109 <param name="mode_selector" value="tsv" />
122 <param name="input" value="tabular.tabular" /> 110 <param name="input" value="tabular.tabular" />
123 </conditional> 111 </conditional>
124 <param name="error" value="3" /> 112 <param name="error" value="10" />
125 <conditional name="database_type"> 113 <conditional name="database_type">
126 <param name="database" value="databases/bmrb-light.tsv" /> 114 <param name="database" value="databases/bmrb-light.tsv" />
127 </conditional> 115 </conditional>
128 <output name="output"> 116 <output name="output">
129 <assert_contents> 117 <assert_contents>
133 </test> 121 </test>
134 122
135 </tests> 123 </tests>
136 124
137 <help><![CDATA[ 125 <help><![CDATA[
138 ======== 126 ==========
139 VKMZ 1.0 127 VKMZ 1.2.0
140 ======== 128 ==========
141 129
142 VKMZ is a metabolomics prediction and vizualization tool which creates van Krevelen diagrams from mass spectrometry data. A van Krevelen diagram (VKD) plots a molecule on a scatterplot by the molecules oxygen to carbon ratio (O:C) against it's hydrogen to carbon ratio (H:C). Classes of metabolites cluster together on a VKD [0]. Plotting a complex mixture of metabolites on a VKD briefly conveys untargeted metabolomics data. 130 VKMZ is a metabolomics prediction and vizualization tool which creates van Krevelen diagrams from mass spectrometry data. A van Krevelen diagram (VKD) plots a molecule on a scatterplot by the molecules oxygen to carbon ratio (O:C) against it's hydrogen to carbon ratio (H:C). Classes of metabolites cluster together on a VKD [0]. Plotting a complex mixture of metabolites on a VKD briefly conveys untargeted metabolomics data.
143 131
144 ============= 132 =============
145 Documentation 133 Documentation
146 ============= 134 =============
147 135
148 **Input Data** 136 **Input Data**
149 137
150 VKMZ is designed to use XCMS [1] data as input. Tabular data can also be used as input. 138 VKMZ is designed to use XCMS [1] or tabular data as input.
151 139
152 *XCMS* mode requires three files which XCMS generates: the data matrix, sample metadata, and variable metadata files. 140 *XCMS* mode requires three files which XCMS generates: the data matrix, sample metadata, and variable metadata files.
153 141
154 *Tabular* mode requires a tab delimited file with the first five columns being: sample_id, polarity, mz, retention_time, and intensity. 142 *Tabular* mode requires a tab delimited file with the first five columns being: sample_id, polarity, mz, retention_time, and intensity.
155 143
156 **Advanced Input Options** 144 **Advanced Input Options**
157 145
158 *Override polarity* allows users to set the polarity of all features to either positive or negative. This option should not be used if data contains both polarity types. 146 *Override polarity* allows users to set the polarity of all features to either *Positive* or *Negative*. Set this if input does not contain the correct polarity information. This option should not be used if data contains both positive and negative polarity.
159 147
160 *Disable mass adjustment* prevents converting charged masses to neutral masses. If you are using neutral mass data this option should be used. 148 *Disable mass adjustment* prevents converting charged masses to neutral masses.
161 149
162 **Prediction Options** 150 **Prediction Options**
163 151
164 For each feature in the data VKMZ attempts to predict a molecular formula by comparing the feature's mass to a database of known formula masses. A prediction is made when a known mass is within a mass error of the observed mass. VKMZ finds all predictions for an observed mass within the mass error. The prediction with the lowest delta, absolute difference between observed and known mass, is plotted. Features without predictions are discarded. Using low resolution data may result in finding too many predictions per feature to be useful, especially for large mass metabolites. 152 For each feature VKMZ attempts to predict a molecular formula by comparing the feature's uncharged mass to a database of known formula masses. A prediction is made when a known mass is within a mass error of observed, uncharged, mass. VKMZ finds all predictions for an observed mass within a specified mass error. The prediction with the lowest delta (absolute difference between observed and known mass) is plotted. Features without predictions are discarded. Using low resolution data may result in finding too many predictions per feature to be useful, especially for large mass metabolites.
165 153
166 Set *Mass error* to the mass error, in parts per million, of the mass spectrometer which collected the data. 154 *Mass error* sets the mass error in parts per million. Mass error will be specific to your mass spectrometer, calibration and other methods. Mass error can be approximated by running similar methods with targeted standards with a range in mass.
167 155
168 *Database* can be set to heuristically generated databases for unlabeled and labeled chemcials [2] or to a custom database. 156 *Database* can be set to the provided heuristically generated databases for unlabeled and labeled molecules [2] or to a custom database.
169 157
170 *Unique matches* removes features from the output which have multiple predictions. Low mass molecules are less affected by this filter than high mass molecules. 158 *Unique matches* removes features from the output which have multiple predictions. High mass molecules are affected by this filter more than low mass molecules. This is due to the increased number of possible elemental combinations at a higher mass.
171 159
172 **Diagram Options** 160 **Tabular Output**
173 161
174 Predicted features are plotted as markers. The size of each marker is determined by the minimum marker size and a marker size algorithm. The marker size algorithms use minimum marker size as a variable. 162 Tabular output contians the columns: sample_id, polarity, mz, rt (retentnion time), intensity, predictions (list of list-elements which contains: predicted mz, predicted formula, and predicted delta), hc (hydrogen to carbon ratio), oc, nc.
163
164 **HTML Output**
165
166 The HTML web page is an interactive van Krevelen diagram for exploring data.
167
168 Predicted features are plotted as circle symbols.
169
170 *Min Size* and *Max Size* sets the minimal and maximum area of symbols (absolute scaling).
171
172 The *Sizer* dropdown sets the algorithm to size each symbol.
173
174 * *Uniform* sets the symbols of all features to the *Max Size*.
175 * *Relative Intensity* sets the symbol size of each feature by the feature's intensity divided by the maxium intensity in the dataset mutiplied by the *Maxium Symbol Size*.
176 * *Relative Log Intensity* sets the symbol size of each feature by the feature's log intensity divided by the maxium log intensity in the dataset mutiplied by the *Maxium Symbol Size*.
177
178 *Threshold* is a slider which removes low-intensity features. The slider exponentially scales.
179
180 * Setting the slider to 50% removes features with intensities lower than 25% of the maximum inensity.
181 * Setting the slider to 75% removes features with intensities lower than 50% of the maximum inensity.
182
183 *x-axis* and *y-axis* allow setting axis to alternate elemental ratios.
184
185 *Opacity* sets the opacity of feature symbols.
186
187 *Visible Samples* sets the visibility of features from given sample IDs. Checked samples are visible. By default all samples are visible.
188
175 ]]></help> 189 ]]></help>
176 190
177 <citations> 191 <citations>
178 <citation type="doi">10.1007/s11306-018-1343-y</citation> 192 <citation type="doi">10.1007/s11306-018-1343-y</citation>
179 <citation type="doi">10.1021/ac051437y</citation> 193 <citation type="doi">10.1021/ac051437y</citation>