Mercurial > repos > recetox > matchms_similarity
annotate matchms_similarity_wrapper.py @ 1:872d8040f713 draft default tip
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit b1cc1aebf796f170d93e3dd46ffcdefdc7b8018a
author | recetox |
---|---|
date | Thu, 12 Oct 2023 13:25:30 +0000 |
parents | e5010b19d64d |
children |
rev | line source |
---|---|
0
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
1 import argparse |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
2 import json |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
3 import sys |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
4 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
5 from matchms import calculate_scores |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
6 from matchms.importing import load_from_mgf, load_from_msp |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
7 from matchms.similarity import (CosineGreedy, CosineHungarian, MetadataMatch, |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
8 ModifiedCosine, NeutralLossesCosine) |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
9 from spec2vec import Spec2Vec |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
10 from spec2vec.serialization.model_importing import load_weights, Word2VecLight |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
11 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
12 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
def convert_precursor_mz(spectrum):
    """
    Ensure the spectrum carries a numeric precursor m/z.

    The precursor m/z is needed by the precursor-aware similarity metrics
    (e.g. ModifiedCosine). The value is converted to float if needed and an
    error is raised if it is missing or unusable.

    Parameters
    ----------
    spectrum:
        Object exposing a readable and assignable ``metadata`` mapping.

    Returns
    -------
    The same ``spectrum`` object, with ``metadata["precursor_mz"]`` stored as a float.

    Raises
    ------
    ValueError
        If ``precursor_mz`` is absent, is ``None``, or cannot be converted to float.
    """
    metadata = spectrum.metadata

    # A key that is present but empty is as unusable as a missing key, so both
    # cases are reported with the same actionable message.
    if "precursor_mz" not in metadata or metadata["precursor_mz"] is None:
        raise ValueError("Precursor_mz missing. Apply 'add_precursor_mz' filter first.")

    raw_value = metadata["precursor_mz"]
    try:
        metadata["precursor_mz"] = float(raw_value)
    except (TypeError, ValueError) as err:
        raise ValueError(f"Precursor_mz value {raw_value!r} cannot be converted to float.") from err

    # Assign the mapping back in case ``metadata`` handed out a copy.
    spectrum.metadata = metadata
    return spectrum
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
26 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
27 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
def load_model(model_file, weights_file) -> Word2VecLight:
    """
    Read a lightweight version of a :class:`~gensim.models.Word2Vec` model from disk.

    Parameters
    ----------
    model_file:
        A path of json file to load the model.
    weights_file:
        A path of `.npy` file to load the model's weights.

    Returns
    -------
    :class:`~spec2vec.serialization.model_importing.Word2VecLight` – a lightweight version of a
    :class:`~gensim.models.Word2Vec`

    Raises
    ------
    KeyError
        If the model json has no ``__weights_format`` entry.
    """
    with open(model_file, "r", encoding="utf-8") as f:
        model: dict = json.load(f)

    # "mapfile_path" is stripped before the dict is handed to Word2VecLight
    # (presumably because it is not part of the expected model keys - verify
    # against spec2vec). Use pop() so a model file exported without that entry
    # still loads instead of failing with KeyError.
    model.pop("mapfile_path", None)

    weights = load_weights(weights_file, model["__weights_format"])
    return Word2VecLight(model, weights)
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
50 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
51 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
def _load_spectra(filename, file_format, description):
    """Load every spectrum from an ``msp`` or ``mgf`` file into a list.

    ``description`` only names the input in the error message raised for an
    unsupported ``file_format``.
    """
    if file_format == 'msp':
        return list(load_from_msp(filename))
    if file_format == 'mgf':
        return list(load_from_mgf(filename))
    raise ValueError(f'File format {file_format} not supported for {description}.')


def main(argv):
    """
    Compute similarity scores between query and reference spectra and store them as json.

    Parameters
    ----------
    argv:
        Command line arguments without the program name. ``None`` makes
        argparse fall back to ``sys.argv[1:]``.

    Returns
    -------
    ``0`` on success, ``-1`` if the requested similarity metric is not supported.

    Raises
    ------
    ValueError
        If the query or reference file format is neither ``msp`` nor ``mgf``.
    """
    parser = argparse.ArgumentParser(description="Compute MSP similarity scores")
    parser.add_argument("-r", dest="ri_tolerance", type=float, help="Use RI filtering with given tolerance.")
    parser.add_argument("-s", dest="symmetric", action='store_true', help="Computation is symmetric.")
    parser.add_argument("--array_type", type=str, help="Type of array to use for storing scores (numpy or sparse).")
    parser.add_argument("--ref", dest="references_filename", type=str, help="Path to reference spectra library.")
    parser.add_argument("--ref_format", dest="references_format", type=str, help="Reference spectra library file format.")
    parser.add_argument("--spec2vec_model", dest="spec2vec_model", type=str, help="Path to spec2vec model.")
    parser.add_argument("--spec2vec_weights", dest="spec2vec_weights", type=str, help="Path to spec2vec weights.")
    parser.add_argument("--allow_missing_percentage", dest="allowed_missing_percentage", type=lambda x: float(x) * 100.0, help="Maximum percentage of missing peaks in model corpus.")
    parser.add_argument("queries_filename", type=str, help="Path to query spectra.")
    parser.add_argument("queries_format", type=str, help="Query spectra file format.")
    parser.add_argument("similarity_metric", type=str, help='Metric to use for matching.')
    parser.add_argument("tolerance", type=float, help="Tolerance to use for peak matching.")
    parser.add_argument("mz_power", type=float, help="The power to raise mz to in the cosine function.")
    parser.add_argument("intensity_power", type=float, help="The power to raise intensity to in the cosine function.")
    parser.add_argument("output_filename_scores", type=str, help="Path where to store the output .json scores.")
    # Parse the arguments that were actually handed in, so that main() can be
    # driven programmatically and not only through the process command line.
    args = parser.parse_args(argv)

    queries_spectra = _load_spectra(args.queries_filename, args.queries_format, 'query spectra')

    if args.symmetric:
        # Symmetric mode scores the query spectra against themselves.
        reference_spectra = queries_spectra.copy()
    else:
        reference_spectra = _load_spectra(args.references_filename, args.references_format, 'reference spectra library')

    # Metrics that read the precursor m/z and therefore need it validated and
    # converted to float on both sides before scoring.
    needs_precursor_mz = False
    if args.similarity_metric == 'CosineGreedy':
        similarity_metric = CosineGreedy(args.tolerance, args.mz_power, args.intensity_power)
    elif args.similarity_metric == 'CosineHungarian':
        similarity_metric = CosineHungarian(args.tolerance, args.mz_power, args.intensity_power)
    elif args.similarity_metric == 'ModifiedCosine':
        similarity_metric = ModifiedCosine(args.tolerance, args.mz_power, args.intensity_power)
        needs_precursor_mz = True
    elif args.similarity_metric == 'NeutralLossesCosine':
        similarity_metric = NeutralLossesCosine(args.tolerance, args.mz_power, args.intensity_power)
        needs_precursor_mz = True
    elif args.similarity_metric == 'Spec2Vec':
        model = load_model(args.spec2vec_model, args.spec2vec_weights)
        similarity_metric = Spec2Vec(model, intensity_weighting_power=args.intensity_power, allowed_missing_percentage=args.allowed_missing_percentage)
    else:
        # Keep the historical -1 return value, but say why nothing was computed.
        print(f"Similarity metric {args.similarity_metric} not supported.", file=sys.stderr)
        return -1

    if needs_precursor_mz:
        reference_spectra = list(map(convert_precursor_mz, reference_spectra))
        queries_spectra = list(map(convert_precursor_mz, queries_spectra))

    print("Calculating scores...")
    scores = calculate_scores(
        references=reference_spectra,
        queries=queries_spectra,
        array_type=args.array_type,
        similarity_function=similarity_metric,
        is_symmetric=args.symmetric
    )

    if args.ri_tolerance is not None:
        print("RI filtering with tolerance ", args.ri_tolerance)
        ri_matches = calculate_scores(references=reference_spectra,
                                      queries=queries_spectra,
                                      similarity_function=MetadataMatch("retention_index", "difference", args.ri_tolerance),
                                      array_type="numpy",
                                      is_symmetric=args.symmetric).scores
        # Inner join: only pairs present in both the similarity scores and the
        # retention index matches are kept.
        scores.scores.add_coo_matrix(ri_matches, "MetadataMatch", join_type="inner")

    write_outputs(args, scores)
    return 0
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
126 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
127 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
def write_outputs(args, scores):
    """Serialise the computed scores to the json file named by the arguments.

    Parameters
    ----------
    args:
        Parsed arguments; only ``output_filename_scores`` is read.
    scores:
        Scores object; its ``to_json`` method is called with the output path.
    """
    print("Storing outputs...")
    output_path = args.output_filename_scores
    scores.to_json(output_path)
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
132 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
133 |
e5010b19d64d
planemo upload for repository https://github.com/RECETOX/galaxytools/tree/master/tools/matchms commit f79a5b51599254817727bc9028b9797ea994cb4e
recetox
parents:
diff
changeset
|
if __name__ == "__main__":
    # Hand main()'s status code to the interpreter so that a failed run
    # (e.g. an unsupported similarity metric) exits non-zero instead of
    # always reporting success.
    sys.exit(main(argv=sys.argv[1:]))