Mercurial > repos > tduigou > retropath2
changeset 5:d31587621543 draft
planemo upload commit f40274f6b9f6a15eb4022aab21286d4c96cd8475-dirty
author | tduigou |
---|---|
date | Wed, 21 Sep 2022 12:49:42 +0000 (2022-09-21) |
parents | 9c8ac9980bd6 |
children | 8d76e8616839 |
files | retropath2.xml |
diffstat | 1 files changed, 56 insertions(+), 52 deletions(-) [+] |
line wrap: on
line diff
--- a/retropath2.xml Tue Feb 08 11:09:41 2022 +0000 +++ b/retropath2.xml Wed Sep 21 12:49:42 2022 +0000 @@ -1,24 +1,26 @@ -<tool id="retropath2" name="RetroPath2.0" version="@TOOL_VERSION@" profile="19.09"> +<tool id="retropath2_wrapper" name="RetroPath2.0" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="21.09"> <description>Build a reaction network from a set of source compounds to a set of sink compounds</description> <macros> - <token name="@TOOL_VERSION@">2.3.0</token> + <token name="@VERSION_SUFFIX@">0</token> + <token name="@TOOL_VERSION@">2.3.1</token> </macros> <requirements> <requirement type="package" version="@TOOL_VERSION@">retropath2_wrapper</requirement> </requirements> <stdio> - <exit_code range="1" level="fatal" description="Source has been found in the sink" /> - <exit_code range="2" level="fatal" description="Cannot find source-in-sink file" /> - <exit_code range="3" level="fatal" description="Running the RetroPath2.0 Knime program produced an OSError" /> - <exit_code range="4" level="warning" description="RetroPath2.0 has found no solution" /> - <exit_code range="5" level="warning" description="Time limit reached" /> - </stdio> + <exit_code range="1" level="fatal" description="Cannot find source-in-sink file" /> + <exit_code range="2" level="fatal" description="Running the RetroPath2.0 Knime program produced an OSError" /> + <exit_code range="3" level="fatal" description="The InChI string is malformed" /> + <exit_code range="-1" level="warning" description="Source has been found in the sink" /> + <exit_code range="-2" level="warning" description="RetroPath2.0 has found no solution" /> + <exit_code range="-3" level="warning" description="Time limit reached" /> + </stdio> <command detect_errors="exit_code"><![CDATA[ python -m retropath2_wrapper '$sinkfile' '$rulesfile' out - --source_inchi '$source_inchi_type.source_inchi' + --source_inchi '$source_inchi' --source_name '$source_name' --rp2_version '$adv.version' --max_steps '$max_steps' @@ 
-34,84 +36,86 @@ fi ]]></command> <inputs> - <param name="rulesfile" type="data" format="csv,tar" label="Rules File"/> - <param name="sinkfile" type="data" format="csv" label="Sink File"/> - <conditional name="source_inchi_type"> - <param name="inchi_type" type="select" label="InChI type"> - <!-- <option value="name" selected="true">By name</option> --> - <option value="string">By string</option> - </param> - <when value="string"> - <param name="source_inchi" type="text" label="Source InChI" optional="false"> - <validator type="empty_field" message="You must provide the InChI string"/> - </param> - </when> - </conditional> - <param name="max_steps" type="integer" value="3" min="1" max="10" label="Maximal Pathway length" /> - <param name="source_name" type="text" value="target" optional="true" label="Source name"> - <validator type="empty_field" message="Source name is required"/> + <param name="rulesfile" type="data" format="csv,tar" label="Rules File" help="File containing reaction rules which reflect the enzymatic potential of the chassis organism."/> + <param name="sinkfile" type="data" format="csv" label="Sink File" help=" Sink file which comprises all compounds that are considered as granted in your system."/> + <param name="source_inchi" type="text" label="Source InChI" optional="false" help="InChI of compound to produce."> + <validator type="empty_field" message="You must provide the InChI string"/> + </param> + <param name="max_steps" type="integer" value="3" min="1" max="10" label="Maximal Pathway length" help="The maximal number of metabolic steps (i.e. 
reactions) for exploring around the target."/> + <param name="source_name" type="text" value="target" optional="true" label="Source name" help="Name of compound to produce."> + <validator type="empty_field" message="Source name is required."/> </param> <section name="adv" title="Advanced Options" expanded="false"> - <param name="version" type="select" label="Workflow version"> + <param name="version" type="select" label="Workflow version" help="Retropath2.0 Workflow versions, formatted as 'r{year}{month}{day}' (the latest version 'r20220104' is used by default)."> <option value="v9">v9</option> <option value="r20210127">r20210127</option> <option value="r20220104" selected="true">r20220104</option> </param> - <param name="topx" type="integer" value="100" min="1" max="1000" label="TopX" /> - <param name="dmin" type="integer" value="0" min="0" max="1000" label="Minimum rule diameter" /> - <param name="dmax" type="integer" value="1000" min="0" max="1000" label="Maximum rule diameter" /> - <param name="mwmax_source" type="integer" value="1000" min="0" max="2000" label="Molecular weight of source (Da)" /> - <param name="timeout" type="integer" value="60" min="30" max="600" label="Timeout (min)" /> + <param name="topx" type="integer" value="100" min="1" max="1000" label="TopX" help="The maximal number of intermediate compounds to use as new starting points for a next iteration of the retrosynthesis algorithm." /> + <param name="dmin" type="integer" value="0" min="0" max="1000" label="Minimum rule diameter" help="Minimum rule diameter of the sphere including the atoms around the reacting center. The higher is the diameter, the more specific are the rules." /> + <param name="dmax" type="integer" value="1000" min="0" max="1000" label="Maximum rule diameter" help="Maximum rule diameter of the sphere including the atoms around the reacting center. 
The higher is the diameter, the more specific are the rules."/> + <param name="mwmax_source" type="integer" value="1000" min="0" max="2000" label="Molecular weight of source (Da)" help="The molecular weight cutoff (in Da), above which initial source (ie target) and intermediate compounds will be filtered out." /> + <param name="timeout" type="integer" value="60" min="30" max="600" label="Timeout (min)" help="Maximal time of RetroPath2.0 execution (60 minutes by default)." /> </section> </inputs> <outputs> - <data name="Reaction_Network" format="csv" label="${tool.name}" /> + <data name="Reaction_Network" format="csv" label="${tool.name}" > + <actions> + <action name="column_names" type="metadata" default="Initial source,Transformation ID,Reaction SMILES,Substrate SMILES,Substrate InChI,Product SMILES,Product InChI,In Sink,Sink name,Diameter,Rule ID,EC number,Score,Starting Source SMILES,Iteration" /> + </actions> + </data> </outputs> <tests> <test> <!-- test 1: check if identical outputs are produced with default parameters --> <param name="rulesfile" value="rules.csv" /> <param name="sinkfile" value="sink.csv" /> - <param name="source_inchi" value="InChI=1S/C6H6O4/c7-5(8)3-1-2-4-6(9)10/h1-4H,(H,7,8)(H,9,10)/p-2" /> + <param name="source_inchi" value="InChI=1S/C40H56/c1-33(2)19-13-23-37(7)27-17-31-39(9)29-15-25-35(5)21-11-12-22-36(6)26-16-30-40(10)32-18-28-38(8)24-14-20-34(3)4/h11-12,15-22,25-32H,13-14,23-24H2,1-10H3/b12-11+,25-15+,26-16+,31-17+,32-18+,35-21+,36-22+,37-27+,38-28+,39-29+,40-30+" /> <output name="Reaction_Network" file="results_retropath2.csv" ftype="csv" compare="diff"/> </test> - </tests> + </tests> <help><![CDATA[ Retropath2.0 wrapper ==================== -Perform retrosynthesis search of possible metabolic routes between a source molecule and a collection of sink molecules. Docker implementation of the KNIME retropath2.0 workflow. 
Takes for input the minimal (dmin) and maximal (dmax) diameter for the reaction rules and the maximal path length (maxSteps). The docker mounts a local folder and expects the following files: rules.csv, sink.csv and source.csv. We only support a single source molecule at this time. +Perform retrosynthesis search of possible metabolic routes between a source molecule and a collection of sink molecules. This tool is an implementation of the `KNIME retropath2.0 workflow <https://www.myexperiment.org/workflows/4987.html>`_. It takes as input the minimal (dmin) and maximal (dmax) diameter for the reaction rules and the maximal path length (maxSteps). The tool expects the following files: rules.csv, sink.csv and source.csv, and produces a retrosynthesis network as a CSV file providing reactions in the reaction SMILES format and chemicals in both SMILES and InChI formats along with other information like the score for each reaction. Only a single source molecule is processed at this time. Input ----- Required: -* **-sinkfile**\ : (string) Path to the sink file -* **-sourcefile**\ : (string) Path to the source file -* **-max_steps**\ : (integer) Maximal number of steps -* **-rulesfile**\ : (string) Path to the rules file -* **-rulesfile_format**\ : (string) Valid Options: tar, csv. Format of the rules file +* **Sink File**\ : (string) Sink file which comprises all compounds that are considered as granted in your system. +* **Source InChI**\ : (string) InChI of compound to produce. +* **Source name**\ : (string) Name of compound to produce. +* **Maximal Pathway length**\ : (integer) The maximal number of metabolic steps (i.e. reactions) for exploring around the target. +* **Rules File**\ : (string) File containing reaction rules which reflect the enzymatic potential of the chassis organism.
-The InChI source DB entries are obtained by the following command: - -`cat chem_prop.tsv | awk -F'\\t' '{print "\\t\\t\\t\\t\\t<option value=\\""$6"\\"\\>" "["$1"]\\t " $2 "</option>"}' | sed 's/\\&/\\&/g'` - -where `chem_prop.tsv` has been downloaded on MetaNetX. Advanced options: -* **-topx**\ : (integer, default: 100) For each iteration, number of rules -* **-dmin**\ : (integer, default: 0) -* **-dmax**\ : (integer, default: 1000) -* **-mwmax_source**\ : (integer, default: 1000) -* **-timeout**\ : (integer, default: 30) Timeout in minutes +* **TopX**\ : (integer, default: 100) The maximal number of intermediate compounds to use as new starting points for a next iteration of the retrosynthesis algorithm. +* **Minimum rule diameter**\ : (integer, default: 0) Minimum rule diameter of the sphere including the atoms around the reacting center. The higher is the diameter, the more specific are the rules. +* **Maximum rule diameter**\ : (integer, default: 1000) Maximum rule diameter of the sphere including the atoms around the reacting center. The higher is the diameter, the more specific are the rules. +* **Molecular weight of source (Da)**\ : (integer, default: 1000) The molecular weight cutoff (in Da), above which initial source (ie target) and intermediate compounds will be filtered out. +* **Timeout (min)**\ : (integer, default: 60) Maximal time of RetroPath2.0 execution (60 minutes by default) +* **Workflow version**\ : Retropath2.0 Workflow versions, formatted as r{year}{month}{day} (the latest version r20220104 is used by default) Output ------ -* **-scope_csv**\ : (string) Path to the output scope csv file +* **Reaction Network**\ : CSV file containing retrosynthesis network which provides reactions in the reaction SMILES format and chemicals in both SMILES and InChI formats along with other information like the score for each reaction. 
+ +Project Links +--------------------- + +* `GitHub <https://github.com/brsynth/RetroPath2-wrapper>`_ + +Version +---------- + +2.3.1 Authors ------- @@ -122,7 +126,7 @@ License ------- -This project is licensed under the MIT License. +This project is licensed under the `MIT <https://github.com/brsynth/RetroPath2-wrapper/blob/master/LICENSE>`_ License. Acknowledgments ---------------