Mercurial > repos > prog > lcmsmatching
comparison lcmsmatching.xml @ 5:fb9c0409d85c draft
planemo upload for repository https://github.com/workflow4metabolomics/lcmsmatching.git commit 608d9e59a0d2dcf85a037968ddb2c61137fb9bce
author | prog |
---|---|
date | Wed, 19 Apr 2017 10:00:05 -0400 |
parents | b34c14151f25 |
children | f86fec07f392 |
comparison
equal
deleted
inserted
replaced
4:b34c14151f25 | 5:fb9c0409d85c |
---|---|
1 <tool id="lcmsmatching" name="LC/MS matching" version="3.2.0" profile="16.01"> | 1 <tool id="lcmsmatching" name="LC/MS matching" version="3.3.1" profile="16.01"> |
2 | 2 |
3 <description>Annotation of MS peaks using matching on a spectra database.</description> | 3 <description>Annotation of MS peaks using matching on a spectra database.</description> |
4 | 4 |
5 <requirements> | 5 <requirements> |
6 <!--<requirement type="package" version="3.3.3">r</requirement>--> | |
7 <requirement type="package" version="7.0">readline</requirement> <!-- Try readline 7.0 --> | |
6 <requirement type="package" version="1.20.0">r-getopt</requirement> | 8 <requirement type="package" version="1.20.0">r-getopt</requirement> |
7 <requirement type="package" version="1.0.0">r-stringr</requirement> | 9 <requirement type="package" version="1.0.0">r-stringr</requirement> |
8 <requirement type="package" version="1.8.3">r-plyr</requirement> | 10 <requirement type="package" version="1.8.3">r-plyr</requirement> |
9 <requirement type="package" version="3.98">r-xml</requirement> | 11 <requirement type="package" version="3.98">r-xml</requirement> |
10 <requirement type="package" version="1.0_6">r-bitops</requirement> | 12 <requirement type="package" version="1.0_6">r-bitops</requirement> |
11 <requirement type="package" version="1.95">r-rcurl</requirement> | 13 <requirement type="package" version="1.95">r-rcurl</requirement> |
12 <requirement type="package" version="1.3">r-rjsonio</requirement> | 14 <requirement type="package" version="1.1">r-jsonlite</requirement> |
13 </requirements> | 15 </requirements> |
14 | 16 |
15 <code file="list-chrom-cols.py"/> | 17 <code file="list-chrom-cols.py"/> |
16 | 18 <code file="list-file-cols.py"/> |
17 <!--~~~~~~~ | 19 <code file="list-ms-mode-values.py"/> |
18 ~ COMMAND ~ | 20 |
19 ~~~~~~~~--> | 21 <!--======= |
22 = COMMAND = | |
23 ========--> | |
20 | 24 |
21 <command> | 25 <command> |
22 <![CDATA[ | 26 <![CDATA[ |
23 ## @@@BEGIN_CHEETAH@@@ | 27 ## @@@BEGIN_CHEETAH@@@ |
24 $__tool_directory__/search-mz -i "$mzrtinput" | 28 $__tool_directory__/search-mz |
29 | |
30 ## Input file | |
31 -i "$mzrtinput" | |
32 --input-col-names "mz=$inputmzfield,rt=$inputrtfield" | |
33 --rtunit "$inputrtunit" | |
25 | 34 |
26 ## Database | 35 ## Database |
27 #if $db.dbtype == "inhouse" | 36 #if $db.dbtype == "inhouse" |
28 -d file | 37 -d file |
29 --db-fields "$db.dbfields" | 38 --db-fields "mztheo=$db.dbmzreffield,chromcolrt=$db.dbchromcolrtfield,compoundid=$db.dbspectrumidfield,chromcol=$db.dbchromcolfield,msmode=$db.dbmsmodefield,peakattr=$db.dbpeakattrfield,pubchemcompid=$db.dbpubchemcompidfield,chebiid=$db.dbchebiidfield,hmdbid=$db.dbhmdbidfield,keggid=$db.dbkeggidfield" |
30 --db-ms-modes "$db.dbmsmodes" | 39 --db-ms-modes "pos=$db.dbmsposmode,neg=$db.dbmsnegmode" |
40 --db-rt-unit $db.dbrtunit | |
31 #end if | 41 #end if |
32 #if $db.dbtype == "peakforest" | 42 #if $db.dbtype == "peakforest" |
33 -d peakforest | 43 -d peakforest |
34 --db-token "$db.dbtoken" | 44 --db-token "$db.dbtoken" |
35 #end if | 45 #end if |
55 -o "$mainoutput" --peak-output-file "$peaksoutput" --same-rows --same-cols | 65 -o "$mainoutput" --peak-output-file "$peaksoutput" --same-rows --same-cols |
56 | 66 |
57 ## HTML output | 67 ## HTML output |
58 --html-output-file "$htmloutput" --no-main-table-in-html-output | 68 --html-output-file "$htmloutput" --no-main-table-in-html-output |
59 | 69 |
60 ## Fields of input file | |
61 --input-col-names "$inputfields" | |
62 | |
63 ## Ouput setting | 70 ## Ouput setting |
64 #if $out.enabled == "true" | 71 --molids-sep "$molidssep" |
65 --output-col-names "$out.outputfields" | |
66 --molids-sep "$out.molidssep" | |
67 #else | |
68 --molids-sep "|" | |
69 #end if | |
70 ## @@@END_CHEETAH@@@ | 72 ## @@@END_CHEETAH@@@ |
71 ]]></command> | 73 ]]></command> |
72 | 74 |
73 <!--~~~~~~ | 75 <!--====== |
74 ~ INPUTS ~ | 76 = INPUTS = |
75 ~~~~~~~--> | 77 =======--> |
76 | 78 |
77 <inputs> | 79 <inputs> |
78 | 80 |
79 <!-- DATABASE --> | 81 <!-- DATABASE --> |
80 | 82 |
88 <when value="inhouse"> | 90 <when value="inhouse"> |
89 <!-- Database file --> | 91 <!-- Database file --> |
90 <param name="dburl" label="Database file" type="data" format="tabular,tsv" refresh_on_change="true" help="Decimal: '.', missing: NA, mode: character and numerical, sep: tabular. Retention time values must be in seconds."/> | 92 <param name="dburl" label="Database file" type="data" format="tabular,tsv" refresh_on_change="true" help="Decimal: '.', missing: NA, mode: character and numerical, sep: tabular. Retention time values must be in seconds."/> |
91 | 93 |
92 <!-- File database field names --> | 94 <!-- File database field names --> |
93 <param name="dbfields" label="File database column names" type="text" size="256" value="mztheo=mztheo,chromcolrt=chromcolrt,compoundid=compoundid,chromcol=chromcol,msmode=msmode,peakattr=peakattr,peakcomp=peakcomp,fullnames=fullnames,compoundmass=compoundmass,compoundcomp=compoundcomp,inchi=inchi,inchikey=inchikey,pubchemcompid=pubchemcompid,chebiid=chebiid,hmdbid=hmdbid,keggid=keggid" refresh_on_change="true" help=""/> | 95 <param name="dbspectrumidfield" type="select" label="Database file Spectrum ID column name" dynamic_options="get_file_cols(file = db['dburl'], preferred = 'spectrumid,accession,compoundid,molid')" help="Select the Spectrum ID column of the database file."/> |
96 <param name="dbmzreffield" type="select" label="Database file Reference MZ column name" dynamic_options="get_file_cols(file = db['dburl'], preferred = 'mztheo,mzexp,mz')" help="Select the Reference MZ column of the database file."/> | |
97 <param name="dbchromcolfield" type="select" label="Database file Chromatographic Column Name column name" dynamic_options="get_file_cols(file = db['dburl'], preferred = 'chromcol,col')" help="Select the Chromatographic Column Name column of the database file." refresh_on_change="true"/> | |
98 <param name="dbchromcolrtfield" type="select" label="Database file Chromatographic Column Retention Time column name" dynamic_options="get_file_cols(file = db['dburl'], preferred = 'chromcolrt,colrt,rt')" help="Select the Chromatographic Column Retention Time column of the database file."/> | |
99 <param name="dbmsmodefield" type="select" label="Database file MS Mode column name" dynamic_options="get_file_cols(file = db['dburl'], preferred = 'msmode,mode')" help="Select the MS Mode column of the database file." refresh_on_change="true"/> | |
100 <param name="dbpeakattrfield" type="select" label="Database file Peak Attribution column name" dynamic_options="get_file_cols(file = db['dburl'], preferred = 'peakattr,attr')" help="Select the Peak Attribution column of the database file."/> | |
101 <param name="dbpubchemcompidfield" type="select" label="Database file PubChem Compound ID column name" dynamic_options="get_file_cols(file = db['dburl'], preferred = 'pubchemcompid,pubchemid,pubchemcomp,pubchem')" help="Select the PubChem Compound ID column of the database file."/> | |
102 <param name="dbchebiidfield" type="select" label="Database file ChEBI ID column name" dynamic_options="get_file_cols(file = db['dburl'], preferred = 'chebiid,chebi')" help="Select the ChEBI ID column of the database file."/> | |
103 <param name="dbhmdbidfield" type="select" label="Database file HMDB Metabolite ID column name" dynamic_options="get_file_cols(file = db['dburl'], preferred = 'hmdbid,hmdb')" help="Select the HMDB Metabolite ID column of the database file."/> | |
104 <param name="dbkeggidfield" type="select" label="Database file KEGG Compound ID column name" dynamic_options="get_file_cols(file = db['dburl'], preferred = 'keggid,kegg')" help="Select the KEGG Compound ID column of the database file."/> | |
94 | 105 |
95 <!-- File database MS modes --> | 106 <!-- File database MS modes --> |
96 <param name="dbmsmodes" label="File database MS modes" type="text" size="32" value="pos=POS,neg=NEG" help=""/> | 107 <param name="dbmsposmode" label="File database MS Positive mode" type="select" dynamic_options="get_ms_mode_value(file = db['dburl'], col = db['dbmsmodefield'], preferred = 'POS,pos,+')" help="Select the value used to identify the positive MS mode."/> |
108 <param name="dbmsnegmode" label="File database MS Negative mode" type="select" dynamic_options="get_ms_mode_value(file = db['dburl'], col = db['dbmsmodefield'], preferred = 'NEG,neg,-')" help="Select the value used to identify the negitive MS mode."/> | |
109 | |
110 <!-- File database RT unit --> | |
111 <param name="dbrtunit" label="Retention time unit" type="select" display="radio" multiple="false" help=""> | |
112 <option value="sec">Seconds</option> | |
113 <option value="min">Minutes</option> | |
114 </param> | |
97 | 115 |
98 <param name="dbtoken" type="text" size="32" value="" hidden="true"/> | 116 <param name="dbtoken" type="text" size="32" value="" hidden="true"/> |
99 </when> | 117 </when> |
100 | 118 |
101 <when value="peakforest"> | 119 <when value="peakforest"> |
102 <param name="dburl" type="text" size="128" value="https://peakforest-alpha.inra.fr/rest" refresh_on_change="true"/> | 120 <param name="dburl" type="text" size="128" value="https://peakforest-alpha.inra.fr/rest" refresh_on_change="true"/> |
103 | 121 |
104 <param name="dbtoken" label="Peakforest security token" type="text" size="32" value="" refresh_on_change="true" help="If you do not have yet a Peakforest token, go to Peakforest website and request one from your account."/> | 122 <param name="dbtoken" label="Peakforest security token" type="text" size="32" value="" refresh_on_change="true" help="If you do not have yet a Peakforest token, go to Peakforest website and request one from your account."/> |
105 | 123 |
106 <param name="dbfields" type="text" size="32" value="" hidden="true"/> | 124 <param name="dbchromcolfield" type="text" size="32" value="" hidden="true"/> |
107 </when> | 125 </when> |
108 </conditional> | 126 </conditional> |
109 | 127 |
110 <!-- INPUT --> | 128 <!-- INPUT --> |
111 | 129 |
112 <!-- Input file --> | 130 <!-- Input file --> |
113 <param name="mzrtinput" label="Input file - MZ(/RT) values" type="data" format="tabular,tsv" help="Decimal: '.', missing: NA, mode: character and numerical, sep: tabular. RT values must be in seconds."/> | 131 <param name="mzrtinput" label="Input file - MZ(/RT) values" type="data" format="tabular,tsv" refresh_on_change="true" help="Decimal: '.', missing: NA, mode: character and numerical, sep: tabular. RT values must be in seconds."/> |
114 | 132 |
115 <!-- Input field names --> | 133 <!-- Input field field names --> |
116 <param name="inputfields" label="Input file column names" type="text" size="32" value="mz=mzmed,rt=rtmed" help=""/> | 134 <param name="inputmzfield" type="select" label="Input file MZ column name" dynamic_options="get_file_cols(file = mzrtinput, preferred = 'mzmed,mz')" help="Select the MZ column of the input file."/> |
135 <param name="inputrtfield" type="select" label="Input file RT column name" dynamic_options="get_file_cols(file = mzrtinput, preferred = 'rtmed,rt')" help="Select the RT column of the input file."/> | |
136 | |
137 <!-- Input file RT unit --> | |
138 <param name="inputrtunit" label="Retention time unit" type="select" display="radio" multiple="false" help=""> | |
139 <option value="sec">Seconds</option> | |
140 <option value="min">Minutes</option> | |
141 </param> | |
117 | 142 |
118 <!-- M/Z MATCHING --> | 143 <!-- M/Z MATCHING --> |
119 | 144 |
120 <!-- Mode --> | 145 <!-- Mode --> |
121 <param name="mzmode" label="MS mode" type="select" display="radio" multiple="false" help=""> | 146 <param name="mzmode" label="MS mode" type="select" display="radio" multiple="false" help=""> |
128 <param name="mzshift" label="M/Z shift (in ppm)" type="float" help="" value="0"/> | 153 <param name="mzshift" label="M/Z shift (in ppm)" type="float" help="" value="0"/> |
129 | 154 |
130 <!-- RETENTION TIME PARAMETERS --> | 155 <!-- RETENTION TIME PARAMETERS --> |
131 | 156 |
132 <!-- List of chromatographic columns --> | 157 <!-- List of chromatographic columns --> |
133 <param name="chromcols" type="select" label="Chromatographic columns" multiple="true" dynamic_options="get_chrom_cols(dbtype = db['dbtype'], dburl = db['dburl'], dbtoken = db['dbtoken'], dbfields = db['dbfields'])" help="Select here the set of chromatographic columns against which the retention time matching will be run."/> | 158 <param name="chromcols" type="select" label="Chromatographic columns" multiple="true" dynamic_options="get_chrom_cols(dbtype = db['dbtype'], dburl = db['dburl'], dbtoken = db['dbtoken'], col_field = db['dbchromcolfield'])" help="Select here the set of chromatographic columns against which the retention time matching will be run."/> |
134 | 159 |
135 <!-- Tolerances --> | 160 <!-- Tolerances --> |
136 <param name="tolx" label="RTX retention time tolerance, parameter x (in seconds)" type="float" help="" value="5"/> | 161 <param name="tolx" label="RTX retention time tolerance, parameter x (in seconds)" type="float" help="" value="5"/> |
137 <param name="toly" label="RTY retention time tolerance, parameter y" type="float" help="" value="0.8"/> | 162 <param name="toly" label="RTY retention time tolerance, parameter y" type="float" help="" value="0.8"/> |
138 <param name="tolz" label="RTZ retention time tolerance, used when precursor matching is enabled." type="float" help="" value="5"/> | 163 <param name="tolz" label="RTZ retention time tolerance, used when precursor matching is enabled." type="float" help="" value="5"/> |
172 </param> | 197 </param> |
173 </when> | 198 </when> |
174 </conditional> | 199 </conditional> |
175 | 200 |
176 <!-- OUTPUT --> | 201 <!-- OUTPUT --> |
177 <conditional name="out"> | 202 <!-- Molecule IDs separator character --> |
178 | 203 <param name="molidssep" label="Molecule IDs separator character" type="text" size="3" value="|" help=""> |
179 <param name="enabled" label="Output settings" type="select"> | 204 <sanitizer> |
180 <option value="false">Default</option> | 205 <valid initial="string.printable"> |
181 <option value="true">Customized</option> | 206 <remove value='"'/> |
182 </param> | 207 </valid> |
183 | 208 <mapping initial="none"> |
184 <when value="false"></when> | 209 <add source='"' target='\"'/> |
185 <when value="true"> | 210 </mapping> |
186 | 211 </sanitizer> |
187 <!-- Output field names --> | 212 </param> |
188 <param name="outputfields" label="Output column names" type="text" size="256" value="mz=mz,rt=rt,chromcol=chromcol,chromcolrt=chromcolrt,compoundid=compoundid,peakattr=peakattr,peakcomp=peakcomp,intensity=intensity,relative.intensity=relative.intensity,mzexp=mzexp,mztheo=mztheo,fullnames=fullnames,compoundmass=compoundmass,compoundcomp=compoundcomp,inchi=inchi,inchikey=inchikey,pubchemcompid=pubchemcompid,chebiid=chebiid,hmdbid=hmdbid,keggid=keggid" help=""/> | |
189 | |
190 <!-- Molecule IDs separator character --> | |
191 <param name="molidssep" label="Molecule IDs separator character" type="text" size="3" value="|" help=""> | |
192 <sanitizer> | |
193 <valid initial="string.printable"> | |
194 <remove value='"'/> | |
195 </valid> | |
196 <mapping initial="none"> | |
197 <add source='"' target='\"'/> | |
198 </mapping> | |
199 </sanitizer> | |
200 </param> | |
201 </when> | |
202 </conditional> | |
203 | 213 |
204 </inputs> | 214 </inputs> |
205 | 215 |
206 <!--~~~~~~~ | 216 <!--======= |
207 ~ OUTPUTS ~ | 217 = OUTPUTS = |
208 ~~~~~~~~--> | 218 ========--> |
209 | 219 |
210 <outputs> | 220 <outputs> |
211 | 221 |
212 <!-- Output file --> | 222 <!-- Output file --> |
213 <data name="mainoutput" label="lcmsmatch_${mzrtinput.name}" format="tabular"/> | 223 <data name="mainoutput" label="lcmsmatch_${mzrtinput.name}" format="tabular"/> |
214 <data name="peaksoutput" label="lcmsmatch_${mzrtinput.name}_peaks" format="tabular"/> | 224 <data name="peaksoutput" label="lcmsmatch_${mzrtinput.name}_peaks" format="tabular"/> |
215 <data name="htmloutput" label="lcmsmatch_${mzrtinput.name}.html" format="html"/> | 225 <data name="htmloutput" label="lcmsmatch_${mzrtinput.name}.html" format="html"/> |
216 | 226 |
217 </outputs> | 227 </outputs> |
218 | 228 |
219 <!--~~~~~ | 229 <!--===== |
220 ~ TESTS ~ | 230 = TESTS = |
221 ~~~~~~--> | 231 ======--> |
222 | 232 |
223 <tests> | 233 <tests> |
224 | 234 |
225 <!-- File database test --> | 235 <!-- File database test --> |
226 <test> | 236 <test> |
227 <param name="dbtype" value="inhouse"/> | 237 <param name="dbtype" value="inhouse"/> |
228 <param name="dburl" value="filedb.tsv"/> | 238 <param name="dburl" value="filedb.tsv"/> |
229 <param name="dbfields" value=""/> | 239 <param name="dbfields" value=""/> |
230 <param name="dbmsmodes" value=""/> | 240 <param name="dbmsmodes" value=""/> |
231 <param name="mzrtinput" value="mz-input-small.tsv"/> | 241 <param name="mzrtinput" value="mz-input-small.tsv"/> |
232 <param name="inputfields" value=""/> | 242 <param name="inputmzfield" value="mzmed"/> |
243 <param name="inputrtfield" value="rtmed"/> | |
233 <param name="mzmode" value="pos"/> | 244 <param name="mzmode" value="pos"/> |
234 <output name="mainoutput" file="filedb-small-mz-match-output.tsv"/> | 245 <output name="mainoutput" file="filedb-small-mz-match-output.tsv"/> |
235 <output name="peaksoutput" file="filedb-small-mz-match-peaks-output.tsv"/> | 246 <output name="peaksoutput" file="filedb-small-mz-match-peaks-output.tsv"/> |
236 <output name="htmloutput" file="filedb-small-mz-match-html-output.html"/> | 247 <output name="htmloutput" file="filedb-small-mz-match-html-output.html"/> |
237 </test> | 248 </test> |
251 </output> | 262 </output> |
252 </test> | 263 </test> |
253 --> | 264 --> |
254 </tests> | 265 </tests> |
255 | 266 |
256 <!--~~~~ | 267 <!--==== |
257 ~ HELP ~ | 268 = HELP = |
258 ~~~~~--> | 269 =====--> |
259 | 270 |
260 <help> | 271 <help> |
261 <!-- @@@BEGIN_RST@@@ --> | 272 <!-- @@@BEGIN_RST@@@ --> |
262 | 273 |
263 ============== | 274 ============== |
270 Database | 281 Database |
271 -------- | 282 -------- |
272 | 283 |
273 When selecting the database, you have the choice between a Peakforest database or an in-house file. | 284 When selecting the database, you have the choice between a Peakforest database or an in-house file. |
274 | 285 |
275 For the Peakforest database, a default REST web base address is already provided. But you can change it of you want to use a custom database. A field is also available for setting a token key in case the access to the Peakforest database you want to use is restricted. This is the case of the default database. | 286 For the Peakforest database, a default REST web base address is already provided. But you can change it to use a custom database. A field is also available for setting a token key in case the access to the Peakforest database you want to use is restricted. This is the case of the default database URL. |
276 | 287 |
277 For the in-house file, please refer to the paragraph "Single file database" below. | 288 For the in-house file, please refer to the paragraph "Single file database" below. |
278 | 289 |
279 ----------- | 290 ----------- |
280 Input files | 291 Input files |
283 Be careful to always provide UTF-8 encoded files, unless you do not use special characters at all. For instance, greek letters in molecule names give errors if the file is in latin1 (ISO 8859-1) or Windows 1252 (not distinguishable from latin1) encoding. | 294 Be careful to always provide UTF-8 encoded files, unless you do not use special characters at all. For instance, greek letters in molecule names give errors if the file is in latin1 (ISO 8859-1) or Windows 1252 (not distinguishable from latin1) encoding. |
284 | 295 |
285 Single file database | 296 Single file database |
286 ==================== | 297 ==================== |
287 | 298 |
288 The database used is provided as a single file, in tabular format, through the *Database file* field. This file contains a list of MS peaks, with retention times. | 299 The database used is provided as a single file, in tabular format, through the *Database file* field. This file must contain a list of MS peaks, with possibly retention times. |
289 Peaks are "duplicated" as much as necessary. For instance if 3 retention times are available on a compound with 10 peaks in positive mode, then there will be 30 lines for this compounds in positive mode. | 300 Peaks are "duplicated" as much as necessary. For instance if 3 retention times are available on a compound with 10 peaks in positive mode, then there will be 30 lines for this compound in positive mode. |
290 | 301 |
291 The file must contain a header with the column names. The names are free, but must be provided through the *File database column names* field. | 302 The file must contain a header with the column names. The names are free, but must be provided through the different fields named *Database file ... column name*. |
292 In this field, each column is identified with a tag, and the columns names are listed as a comma separated list of tag/name couples (separated by character `=`). The allowed tags are the following ones: | 303 Then you must provide the values used to identify the MS modes (positive and negative). |
293 | 304 |
294 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | 305 A last information about the single file database is the unit of the retention times, either in seconds or in minutes. |
295 | Column tag | Compulsory | Values | | |
296 +==============+============+============================================================================================================+ | |
297 | mztheo | Yes | The m/z values. | | |
298 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
299 | mode | Yes | The MS mode. | | |
300 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
301 | molid | Yes | This is the identifier of your compound. | | |
302 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
303 | colrt | No | The retention time values in seconds. | | |
304 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
305 | col | No | The chromatographic column associated with the retention time. Compulsory if retention times are provided. | | |
306 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
307 | attr | No | The attribution of the peak (e.g.: ``[(M+H)-(H2O)-(NH3)]+``). | | |
308 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
309 | comp | No | The composition of the peak (e.g.: ``C6 H10 N O``). | | |
310 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
311 | molcomp | No | The composition of the molecule. (e.g.: ``C6H14N2O2``). | | |
312 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
313 | molmass | No | The mass of the molecule. | | |
314 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
315 | molnames | No | The names of the molecule, as a semicolon separated list. | | |
316 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
317 | inchi | No | The InChI of the molecule. | | |
318 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
319 | inchikey | No | The InChI key of the molecule. | | |
320 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
321 | pubchem | No | The PubChem ID of the molecule. | | |
322 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
323 | chebi | No | The ChEBI ID of the molecule. | | |
324 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
325 | hmdb | No | The HMDB ID of the molecule. | | |
326 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
327 | kegg | No | The KEGG ID of the molecule. | | |
328 +--------------+------------+------------------------------------------------------------------------------------------------------------+ | |
329 | |
330 The field *File database MS modes* allows you to personalize the MS mode identifiers. The value of the field is a comma separated list of mode/name couples (separated by character `=`).. | |
331 For instance, if in your database file you use characters '+' and '-' to identify the modes, then you must set the field to `pos=+,neg=-`. | |
332 | 306 |
333 Example of database file (totally fake, no meaning): | 307 Example of database file (totally fake, no meaning): |
334 | 308 |
335 +-------+-------+------------+--------------------+-------------------------+-----------+-------+---------------+-----------+--------------+ | 309 +-------+-------+------------+--------------------+-------------------------+-----------+-------+---------------+-----------+--------------+ |
336 | molid | mode | mz | composition | attribution | col | rt | molcomp | molmass | molnames | | 310 | molid | mode | mz | composition | attribution | col | rt | molcomp | molmass | molnames | |
359 +-------+-------+------------+--------------------+-------------------------+-----------+-------+---------------+-----------+--------------+ | 333 +-------+-------+------------+--------------------+-------------------------+-----------+-------+---------------+-----------+--------------+ |
360 | 334 |
361 MZ/RT input file | 335 MZ/RT input file |
362 ================ | 336 ================ |
363 | 337 |
364 The input to provide is a file, in a tabular format (or TSV: Tab Seperated Values), containing the list of MZ/RT values. | 338 The input to provide is a file, in a tabular format (or TSV: Tab Seperated Values), containing the list of M/Z values, with possibly also RT values. |
365 | 339 |
366 The following columns will be used: | 340 The column names for the M/Z and RT values must be provided through the fields *Input file MZ column name* and *Input file RT column name*. |
367 | 341 As a consequence, the file must contain a header line. |
368 +--------------+------------+---------------------------------------+ | 342 |
369 | Column tag | Compulsory | Values | | 343 The unit of the retention time has to be provided with the field *Retention time unit*. |
370 +==============+============+=======================================+ | |
371 | mz | Yes | The m/z values. | | |
372 +--------------+------------+---------------------------------------+ | |
373 | rt | No | The retention time values in seconds. | | |
374 +--------------+------------+---------------------------------------+ | |
375 | |
376 The file may contain a header line, in which case you have to provide the column names through the *Input file column names* field, which consists in a comma separated list of tag/name couples (separated by character `=`). If your file does not contain a header line, then you must provide the column numbers. Examples: | |
377 | |
378 * With a header line having name MASS for mz column and RET for rt column: `mz=MASS,rt=RET`. | |
379 * With no header line: `mz=1,rt=2`. | |
380 | |
381 Since the MS spectrum mode can not be known from the file, an *MS mode* radio button field is provided for setting the mode. | |
382 | 344 |
383 Example of file input: | 345 Example of file input: |
384 | 346 |
385 +-------------+-------------+ | 347 +-------------+-------------+ |
386 | mz | rt | | 348 | mz | rt | |
406 | 368 |
407 The first parameter is the MS mode, specified through the *MS mode* parameter. | 369 The first parameter is the MS mode, specified through the *MS mode* parameter. |
408 | 370 |
409 The parameters *M/Z precision* and *M/Z shift* are used by the algorithm in the following formula in order to match an *m/z* value: | 371 The parameters *M/Z precision* and *M/Z shift* are used by the algorithm in the following formula in order to match an *m/z* value: |
410 | 372 |
411 mz (1 + (- shift - precision) / 10^6) < mztheo < mz (1 + (- shift - precision) / 10^6) | 373 mz (1 + (- shift - precision) / 10^6) < mzref < mz (1 + (- shift - precision) / 10^6) |
412 | 374 |
413 Where *mztheo* is the theoretical mass of the database peak that is tested. If this double inequality is true, then the *m/z* value is matched with this peak. | 375 Where *mzref* is the M/Z of reference from the database peak that is tested. If this double inequality is true, then the *m/z* value is matched with this peak. |
414 | 376 |
415 -------------------- | 377 -------------------- |
416 Retention time match | 378 Retention time match |
417 -------------------- | 379 -------------------- |
418 | 380 |
419 If at least one column is checked inside the *Columns* parameter section, then retention time is also matched, in addition to the *m/z* value, according to the following formula: | 381 If at least one column is selected inside the *Chromatographic columns* parameter section, then retention time is also matched, in addition to the *m/z* value, according to the following formula: |
420 | 382 |
421 rt - x - rt^y < colrt < rt + x + rt^y | 383 rt - x - rt^y < colrt < rt + x + rt^y |
422 | 384 |
423 Where *x* is the value of the parameter *RTX* and *y* the value of the parameter *RTY*. | 385 Where *x* is the value of the parameter *RTX* and *y* the value of the parameter *RTY*. |
424 | 386 |
449 3. For each input couple (m/z,rt), we look at all peaks inside the molecules taken from step 2, whose matched retention time between *rt - z* and *rt + z*, where *z* is the value of parameter *RTZ*. | 411 3. For each input couple (m/z,rt), we look at all peaks inside the molecules taken from step 2, whose matched retention time between *rt - z* and *rt + z*, where *z* is the value of parameter *RTZ*. |
450 | 412 |
451 --------------- | 413 --------------- |
452 Output settings | 414 Output settings |
453 --------------- | 415 --------------- |
454 | |
455 The *Output column names* parameter is used to customize the columns of the output files. As with the *File database column names* parameter, each column is identified with a tag, and the columns names are listed as a comma separated list of tag/name couples (separated by character `=`). The allowed tags are the following ones: | |
456 | |
457 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
458 | Column tag | Values | | |
459 +==============+=================================================================================================================================+ | |
460 | mz | The m/z values from the input file. | | |
461 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
462 | mztheo | The m/z values from the database. | | |
463 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
464 | molid | This is the identifier of your compound. | | |
465 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
466 | rt | The retention time values in seconds from the input file. | | |
467 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
468 | col | The chromatographic column associated with the retention time. | | |
469 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
470 | colrt | The retention time associated with the matched chromatographic column. | | |
471 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
472 | msmatching | The list IDs of matched molecules. IDs are separated by the character specified in the *Molecule IDs separator character* field | | |
473 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
474 | attr | The attribution of the peak (e.g.: ``[(M+H)-(H2O)-(NH3)]+``). | | |
475 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
476 | comp | The composition of the peak (e.g.: ``C6 H10 N O``). | | |
477 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
478 | molcomp | The composition of the molecule. (e.g.: ``C6H14N2O2``). | | |
479 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
480 | molmass | The mass of the molecule. | | |
481 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
482 | molnames | The names of the molecule, as a semicolon separated list. | | |
483 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
484 | inchi | The InChI of the molecule. | | |
485 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
486 | inchikey | The InChI key of the molecule. | | |
487 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
488 | pubchem | The PubChem ID of the molecule. | | |
489 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
490 | chebi | The ChEBI ID of the molecule. | | |
491 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
492 | hmdb | The HMDB ID of the molecule. | | |
493 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
494 | kegg | The KEGG ID of the molecule. | | |
495 +--------------+---------------------------------------------------------------------------------------------------------------------------------+ | |
496 | 416 |
497 The *Molecule IDs separator character* is used to customize the character used to separate the molecule IDs of the **molid** column inside the *main* output file. | 417 The *Molecule IDs separator character* is used to customize the character used to separate the molecule IDs of the **molid** column inside the *main* output file. |
498 | 418 |
499 Output files | 419 Output files |
500 ============ | 420 ============ |
538 R Core Team (2013). R: A language and Environment for Statistical Computing. http://www.r-project.org | 458 R Core Team (2013). R: A language and Environment for Statistical Computing. http://www.r-project.org |
539 | 459 |
540 <!-- @@@END_RST@@@ --> | 460 <!-- @@@END_RST@@@ --> |
541 </help> | 461 </help> |
542 | 462 |
543 <!--~~~~~~~~~ | 463 <!--========= |
544 ~ CITATIONS ~ | 464 = CITATIONS = |
545 ~~~~~~~~~~--> | 465 ==========--> |
546 | 466 |
547 <citations/> | 467 <citations/> |
548 | 468 |
549 </tool> | 469 </tool> |