annotate spec2vec_training.xml @ 1:9d917de87cca draft default tip

planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit f79a5b51599254817727bc9028b9797ea994cb4e
author recetox
date Tue, 27 Jun 2023 14:29:59 +0000
parents e1e22ada831e
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
1
9d917de87cca planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents: 0
diff changeset
1 <tool id="spec2vec_training" name="spec2vec model training" version="@TOOL_VERSION@+galaxy0" profile="21.09">
0
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
2 <description>Train a Spec2Vec model for mass spectra similarity scoring</description>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
3
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
4 <macros>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
5 <import>macros.xml</import>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
6 </macros>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
7 <expand macro="creator"/>
1
9d917de87cca planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents: 0
diff changeset
8 <expand macro="edam" />
0
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
9
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
10 <requirements>
1
9d917de87cca planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents: 0
diff changeset
11 <requirement type="package" version="@TOOL_VERSION@">spec2vec</requirement>
0
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
12 </requirements>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
13
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
14 <command detect_errors="exit_code"><![CDATA[
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
15 ln -fs '${weights_filename}' '${weights_filename}.npy' &&
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
16 sh '${spec2vec_python_cli}'
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
17 ]]></command>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
18
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
19 <configfiles>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
20 <configfile name="spec2vec_python_cli">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
21 python3 '${__tool_directory__}/spec2vec_training_wrapper.py' \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
22 --spectra_filename '$spectra_filename' \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
23 --spectra_fileformat '$spectra_filename.ext' \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
24 #if $output_parameters.model_checkpoints.save_checkpoints == 'TRUE'
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
25 --checkpoints '$output_parameters.model_checkpoints.checkpoints' \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
26 #else
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
27 --epochs $output_parameters.model_checkpoints.epochs \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
28 #end if
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
29 --vector_size $training_parameters.vector_size \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
30 --alpha $training_parameters.alpha \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
31 --min_alpha $training_parameters.min_alpha \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
32 --window $training_parameters.window \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
33 --min_count $training_parameters.min_count \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
34 --sample $training_parameters.sample \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
35 --seed $training_parameters.seed \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
36 --sg $training_parameters.sg_param.sg \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
37 #if str($training_parameters.sg_param.sg) == '0'
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
38 --cbow_mean $training_parameters.sg_param.cbow_mean \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
39 #end if
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
40 --hs $training_parameters.hs_param.hs \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
41 #if str($training_parameters.hs_param.hs) == '0'
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
42 --negative $training_parameters.hs_param.negative \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
43 --ns_exponent $training_parameters.hs_param.ns_exponent \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
44 #end if
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
45 --sorted_vocab $training_parameters.sorted_vocab \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
46 --batch_words $training_parameters.batch_words \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
47 --shrink_windows $training_parameters.shrink_windows \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
48 #if $training_parameters.trim_vocab.max_vocab_size_bool == 'TRUE'
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
49 --max_vocab_size $training_parameters.trim_vocab.max_vocab_size \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
50 #end if
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
51 --n_decimals $training_parameters.n_decimals \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
52 --n_workers \${GALAXY_SLOTS:-1} \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
53 #if $output_parameters.as_pickle
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
54 --model_filename_pickle '$model_filename_pickle' \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
55 #end if
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
56 --model_filename '$model_filename' \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
57 --weights_filename '$weights_filename' \
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
58 </configfile>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
59 </configfiles>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
60
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
61 <inputs>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
62 <param label="Training spectra" name="spectra_filename" type="data" format="msp,mgf"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
63 help="Spectra file to train a Spec2Vec model."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
64
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
65 <section title="Output parameters" name="output_parameters" expanded="true">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
66 <param label="Save model as Pickle file" name="as_pickle" type="boolean" checked="false" truevalue="TRUE" falsevalue="FALSE"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
67 help="Add a Pickle output besides default JSON."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
68 <conditional name="model_checkpoints">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
69 <param label="Model checkpoints" name="save_checkpoints" type="select" display="radio"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
70 help="Epochs after which to save a model.">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
71 <option value="TRUE">Yes</option>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
72 <option value="FALSE" selected="true">No</option>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
73 </param>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
74 <when value="TRUE">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
75 <param label="Number of training epochs with checkpoints" name="checkpoints" type="text" value="10,20,50"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
76 help="Comma-separated epoch numbers after which to save a model. The highest number will be used as a total number of epochs for training.">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
77 <validator type="empty_field"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
78 <validator type="regex"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
79 message="The input has to be a comma-separated sequence of integers without trailing commas. For example: 10,20,50">^[0-9]+(,[0-9]+)*$</validator>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
80 </param>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
81 </when>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
82 <when value="FALSE">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
83 <param label="Number of training epochs" name="epochs" type="integer" value="10"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
84 help="Number of epochs to train the model."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
85 </when>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
86 </conditional>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
87 </section>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
88
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
89 <section title="Training hyperparameters" name="training_parameters" expanded="true">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
90 <param label="Vector size" name="vector_size" type="integer" value="300"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
91 min="1" help="Dimensionality of the feature vectors (i.e., into how many dimensions to encode each m/z and neutral loss peak)."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
92 <param label="Alpha" name="alpha" type="float" value="0.025"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
93 min="0" help="The initial learning rate."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
94 <param label="Minimum Alpha" name="min_alpha" type="float" value="0.00025"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
95 min="0" help="Learning rate will linearly drop to this value as training progresses."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
96 <param label="Window" name="window" type="integer" value="500"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
97 help="Maximum distance between the current and predicted peak within a spectrum."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
98 <param label="Minimum peak count" name="min_count" type="integer" value="1"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
99 min="0" help="Ignores all peaks with absolute frequency lower than this."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
100 <param label="Sample" name="sample" type="float" value="0.001"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
101 help="The threshold for configuring which higher-frequency peaks are randomly downsampled."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
102 <param label="Seed" name="seed" type="integer" value="1"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
103 help="Seed of random number generator for model reproducibility."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
104 <conditional name="sg_param">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
105 <param label="Word-Embedding type" name="sg" type="select"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
106 help="Embedding type: Skip-gram or Continuous Bag of Words">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
107 <option value="0">CBOW</option>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
108 <option value="1">Skip-gram</option>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
109 </param>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
110 <when value="0">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
111 <param label="CBOW mean" name="cbow_mean" type="select"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
112 help="Whether to use the sum of the context word vectors or their mean.">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
113 <option value="0">Sum</option>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
114 <option value="1" selected="true">Mean</option>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
115 </param>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
116 </when>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
117 </conditional>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
118 <conditional name="hs_param">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
119 <param label="Last Layer Activation" name="hs" type="select"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
120 help="Activation function of the last layer of the neural network. Negative sampling is more computationally efficient.">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
121 <option value="0">Negative Sampling</option>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
122 <option value="1">Hierarchical Softmax</option>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
123 </param>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
124 <when value="0">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
125 <param label="Negative Samples" name="negative" type="integer" value="5"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
126 min="1" help="Specify how many 'negative' examples should be drawn for each peak and neutral loss (usually between 5-20).">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
127 <validator type="in_range" min="1" message="The value must be larger than 0."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
128 </param>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
129 <param label="Negative Sample Exponent" name="ns_exponent" type="float" value="0.75"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
130 help="The exponent used to shape the negative sampling distribution. A value of 1.0 samples exactly in proportion to the frequencies,
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
131 0.0 samples all peaks and neutral losses equally, while a negative value samples low-frequency peaks more often than high-frequency peaks.">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
132 <validator type="in_range" min="-1.0" max="1.0" message="The value must be within -1.0 and 1.0 range."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
133 </param>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
134 </when>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
135 </conditional>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
136 <param label="Sort the vocabulary of spectra" name="sorted_vocab" type="boolean" checked="true" truevalue="TRUE" falsevalue="FALSE"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
137 help="If true, sort the vocabulary by descending frequency before assigning peak and neutral loss indices."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
138 <param label="Batch size" name="batch_words" type="integer" value="10000"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
139 help="Target size (in peaks and neutral losses) for batches of examples passed to worker threads (and thus cython routines).
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
140 Larger batches will be passed if individual peak sequences are longer than 10000 words, but the standard cython code truncates to that maximum."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
141 <param label="Shrink windows" name="shrink_windows" type="boolean" checked="true" truevalue="TRUE" falsevalue="FALSE"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
142 help="EXPERIMENTAL. If true, the effective window size is uniformly sampled in range [1,Window] for each target peak during training."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
143 <conditional name="trim_vocab">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
144 <param label="Limit unique peaks and neutral losses in the spectral vocabulary" name="max_vocab_size_bool" type="select" display="radio"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
145 help="Limits the RAM during vocabulary building; if there are more unique peaks and neutral losses than this, then prune the infrequent ones. Disable for no limit (default).">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
146 <option value="FALSE">No limit</option>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
147 <option value="TRUE">Limit</option>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
148 </param>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
149 <when value="TRUE">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
150 <param label="Maximum unique peaks and neutral losses" name="max_vocab_size" type="integer" value="100000" min="1"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
151 </when>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
152 </conditional>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
153 <param label="Number of decimals to round m/z values" name="n_decimals" type="integer" value="2"
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
154 min="0" max="5" help="Rounds peak position to this number of decimals."/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
155 </section>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
156 </inputs>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
157
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
158 <outputs>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
159 <data label="Spec2Vec model on ${on_string}" name="model_filename" format="json"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
160 <data label="Spec2Vec weights on ${on_string}" name="weights_filename" format="binary"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
161 <data label="Spec2Vec pickle model on ${on_string}" name="model_filename_pickle" format="binary">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
162 <filter>output_parameters['as_pickle']</filter>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
163 </data>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
164 <collection name="model_checkpoints" type="list" label="Spec2Vec model checkpoints on ${on_string}">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
165 <discover_datasets pattern="__name_and_ext__" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
166 <filter>output_parameters['model_checkpoints']['save_checkpoints'] == 'TRUE'</filter>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
167 </collection>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
168 </outputs>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
169
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
170 <tests>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
171 <test expect_num_outputs="2"> <!-- Test 1: with default parameters -->
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
172 <param name="spectra_filename" value="RECETOX_Exposome_pesticides_HR_MS_normalized_20220323.msp" ftype="msp"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
173 <output name="model_filename" file="model.json" ftype="json"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
174 <output name="weights_filename" ftype="binary">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
175 <assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
176 <has_size value="1708000" delta="1000"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
177 <has_text text="'shape': (1423, 300)" n="1"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
178 </assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
179 </output>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
180 </test>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
181 <test expect_num_outputs="3"> <!-- Test 2: pickle output -->
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
182 <param name="spectra_filename" value="RECETOX_Exposome_pesticides_HR_MS_normalized_20220323.msp" ftype="msp"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
183 <param name="as_pickle" value="TRUE"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
184 <output name="model_filename" file="model.json" ftype="json"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
185 <output name="weights_filename" ftype="binary">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
186 <assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
187 <has_size value="1708000" delta="1000"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
188 <has_text text="'shape': (1423, 300)" n="1"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
189 </assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
190 </output>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
191 <output name="model_filename_pickle" ftype="binary">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
192 <assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
193 <has_size value="3468000" delta="1000" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
194 <has_text text="gensim.models.word2vec"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
195 <has_text text="peak@" n="1423"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
196 </assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
197 </output>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
198 </test>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
199 <test expect_num_outputs="3"> <!-- Test 3: model checkpoints -->
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
200 <param name="spectra_filename" value="RECETOX_Exposome_pesticides_HR_MS_normalized_20220323.msp" ftype="msp"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
201 <conditional name="model_checkpoints">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
202 <param name="save_checkpoints" value="TRUE"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
203 <param name="checkpoints" value="1,5,8,10"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
204 </conditional>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
205 <output name="model_filename" file="model.json" ftype="json"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
206 <output name="weights_filename" ftype="binary">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
207 <assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
208 <has_size value="1708000" delta="1000"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
209 <has_text text="'shape': (1423, 300)" n="1"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
210 </assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
211 </output>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
212 <output_collection name="model_checkpoints" type="list" count="3">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
213 <element name="spec2vec_iter_1">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
214 <assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
215 <has_size value="3468000" delta="1000" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
216 <has_text text="gensim.models.word2vec" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
217 <has_text text="peak@" n="1423" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
218 </assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
219 </element>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
220 <element name="spec2vec_iter_5">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
221 <assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
222 <has_size value="3468000" delta="1000" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
223 <has_text text="gensim.models.word2vec" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
224 <has_text text="peak@" n="1423" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
225 </assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
226 </element>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
227 <element name="spec2vec_iter_8">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
228 <assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
229 <has_size value="3468000" delta="1000" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
230 <has_text text="gensim.models.word2vec" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
231 <has_text text="peak@" n="1423" />
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
232 </assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
233 </element>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
234 </output_collection>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
235 </test>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
236 <test> <!-- Test 4: embeddings size in output corresponds to `vector_size` param -->
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
237 <param name="spectra_filename" value="RECETOX_Exposome_pesticides_HR_MS_normalized_20220323.msp" ftype="msp"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
238 <param name="vector_size" value="100"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
239 <output name="model_filename" file="model_vector_size_100.json" ftype="json"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
240 <output name="weights_filename" ftype="binary">
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
241 <assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
242 <has_size value="569000" delta="1000"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
243 <has_text text="'shape': (1423, 100)" n="1"/>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
244 </assert_contents>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
245 </output>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
246 </test>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
247 </tests>
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
248
1
9d917de87cca planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents: 0
diff changeset
249 <help>
0
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
250 **Spec2vec** is a spectral similarity score inspired by a natural language processing algorithm – Word2Vec.
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
251 Where Word2Vec learns relationships between words in sentences, spec2vec does so for mass fragments and neutral losses in MS/MS spectra.
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
252 The spectral similarity score is based on spectral embeddings learnt from the fragmental relationships within a large set of spectral data.
1
9d917de87cca planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents: 0
diff changeset
253 </help>
0
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
254
1
9d917de87cca planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents: 0
diff changeset
255 <expand macro="citations"/>
9d917de87cca planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents: 0
diff changeset
256
0
e1e22ada831e planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/spec2vec commit 2e4bdc2fd94445aa5a8d1882a3d092cca727e4b6
recetox
parents:
diff changeset
257 </tool>