changeset 1:41e31a198b34 draft

planemo upload for repository https://github.com/CS76/NP-Likeness commit 63130752ef267b8239e39562b6d0d7bcf4d6d80a
author bgruening
date Tue, 23 May 2017 03:09:35 -0400
parents b2cad51889ea
children 40d181cc8c19
files natural_product_likeness_calculator.xml repository_dependencies.xml test-data/CID_3037.sdf test-data/Score.sdf tool_dependencies.xml
diffstat 5 files changed, 415 insertions(+), 91 deletions(-) [+]
line wrap: on
line diff
--- a/natural_product_likeness_calculator.xml	Thu Aug 15 03:38:29 2013 -0400
+++ b/natural_product_likeness_calculator.xml	Tue May 23 03:09:35 2017 -0400
@@ -1,70 +1,56 @@
-<tool id="ctb_np-likeness-calculator" name="Natural Product" version="0.2.1">
-    <description>likeness calculator</description>
-    <!--<parallelism method="multi" split_inputs="infile" split_mode="to_size" split_size="100" shared_inputs="" merge_outputs="outfile,outfragments"></parallelism>-->
-    <requirements>
-        <requirement type="package" version="2.0">np-likeness-scorer</requirement>
-    </requirements>
-    <command>
-        ## NPLC is really picky with file extensions. We need to specify every datatype as file extension
-        ## A workaround is to create a symlink with a proper file-extension.
-        #import tempfile
-        #set $temp_file = tempfile.NamedTemporaryFile()
-        #set $temp_link = "%s.%s" % ($temp_file.name, $infile.ext)
-        $temp_file.close()
-        ln -s $infile $temp_link;
-
-        java -jar \$NPLS_JAR_PATH/NP-Likeness-2.0.jar
-            -in "${temp_link}"
-            -out "${outfile}"
-            #if $reconstruct_fragments:
-                -reconstructFragments true
-                -outFragments $outfragments
-            #end if
-        ;
-        rm $temp_link
-    </command>
-    <stdio>
-        <exit_code range="1:" />
-        <exit_code range=":-1" />
-    </stdio>
-    <inputs>
-        <param format="smi,sdf" name="infile" type="data" label="Molecule file" help="Dataset missing? See TIP below"/>
-        <param name='reconstruct_fragments' type='boolean' label='Fragments-scores are written out in SMILES format' truevalue='' falsevalue='' />
-    </inputs>
-    <outputs>
-        <data format_source="infile" name="outfile" />
-        <data format="tabular" name="outfragments">
-            <filter>reconstruct_fragments is True</filter>
-        </data>
-    </outputs>
-    <tests>
-    </tests>
-    <help>
-
-
-.. class:: infomark
-
-**What this tool does**
-
-The `Natural-Product-Likeness Scorer`_ calculates the Natural Product(NP)-likeness of a molecule, i.e. the similarity of the molecule to the structure space covered by known natural products. The more positive the score, the higher is the NP-likeness and vice versa.
-
-.. _Natural-Product-Likeness Scorer: http://sourceforge.net/projects/np-likeness/
-
-.. image:: $PATH_TO_IMAGES/score_distribution.png
-
-
------
-
-.. class:: infomark
-
-**Cite**
-
-| KV Jayaseelan, C Steinbeck, P Moreno, A Truszkowski, P Ertl - `Natural product-likeness score revisited: an open-source, open-data implementation`_
-| 
-| P Ertl, S Roggo, and A Schuffenhauer - `Natural product-likeness score and its application for prioritization of compound libraries`_
-
-.. _`Natural product-likeness score revisited: an open-source, open-data implementation`: http://www.biomedcentral.com/1471-2105/13/106/abstract
-.. _`Natural product-likeness score and its application for prioritization of compound libraries`: http://www.ncbi.nlm.nih.gov/pubmed/18034468
-
-    </help>
-</tool>
+<tool id="ctb_np-likeness-calculator" name="Natural Product" version="2.1">
+    <description>likeness calculator</description>
+    <requirements>
+        <requirement type="package" version="2.1">np-likeness-scorer</requirement>
+    </requirements>
+    <command detect_errors="aggressive">
+    <![CDATA[
+        np-likeness
+            -in '$infile'
+            -intype $infile.ext
+            -out '$outfile'
+            -outtype $infile.ext
+            #if $reconstruct_fragments:
+                -reconstructFragments true
+                -outFragments $outfragments
+            #end if
+    ]]>
+    </command>
+    <inputs>
+        <param format="smi,sdf" name="infile" type="data"
+            label="Molecule file" help="Dataset missing? See TIP below"/>
+        <param name='reconstruct_fragments' type='boolean'
+            truevalue='' falsevalue=''
+            label='Fragments and scores are written out in SMILES format' />
+    </inputs>
+    <outputs>
+        <data format_source="infile" name="outfile" />
+        <data format="tabular" name="outfragments">
+            <filter>reconstruct_fragments is True</filter>
+        </data>
+    </outputs>
+     <tests>
+        <test>
+            <param name="infile" value="CID_3037.sdf"/>
+            <output name="outfile" file="Score.sdf" ftype="sdf" lines_diff="4"/>
+        </test>
+    </tests>
+    <help>
+<![CDATA[
+
+**What this tool does**
+
+The `Natural-Product-Likeness Scorer`_ calculates the Natural Product(NP)-likeness of
+a molecule, i.e. the similarity of the molecule to the structure space covered by known
+natural products. The more positive the score, the higher is the NP-likeness and vice versa.
+
+.. _Natural-Product-Likeness Scorer: http://sourceforge.net/projects/np-likeness/
+.. image:: $PATH_TO_IMAGES/score_distribution.png
+
+]]>
+    </help>
+    <citations>
+        <citation type="doi">10.1186/1471-2105-13-106</citation>
+        <citation type="doi">10.1021/ci700286x</citation>
+    </citations>
+</tool>
--- a/repository_dependencies.xml	Thu Aug 15 03:38:29 2013 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,4 +0,0 @@
-<?xml version="1.0"?>
-<repositories description="This requires the Molecule datatype definitions (e.g. SMILES, InChI, SD-format).">
-    <repository changeset_revision="85eca06eefc6" name="molecule_datatypes" owner="iuc" toolshed="http://toolshed.g2.bx.psu.edu" />
-</repositories>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/CID_3037.sdf	Tue May 23 03:09:35 2017 -0400
@@ -0,0 +1,220 @@
+3037
+  -OEChem-08231108593D
+
+ 27 28  0     0  0  0  0  0  0999 V2000
+   -4.8550    1.3401    0.2120 Cl  0  0  0  0  0  0  0  0  0  0  0  0
+    4.8529   -1.3406    0.2121 Cl  0  0  0  0  0  0  0  0  0  0  0  0
+   -0.1809   -2.1668   -0.3789 O   0  0  0  0  0  0  0  0  0  0  0  0
+    0.1788    2.1664   -0.3787 O   0  0  0  0  0  0  0  0  0  0  0  0
+   -0.0011   -0.0002    1.4744 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -1.2222   -0.2738    0.6597 C   0  0  0  0  0  0  0  0  0  0  0  0
+    1.2377    0.2772    0.6480 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -1.2586   -1.3462   -0.2316 C   0  0  0  0  0  0  0  0  0  0  0  0
+    1.2565    1.3457   -0.2314 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -2.3343    0.5568    0.7972 C   0  0  0  0  0  0  0  0  0  0  0  0
+    2.3322   -0.5574    0.7972 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -2.4069   -1.5879   -0.9855 C   0  0  0  0  0  0  0  0  0  0  0  0
+    2.4048    1.5875   -0.9852 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -3.4827    0.3152    0.0433 C   0  0  0  0  0  0  0  0  0  0  0  0
+    3.4807   -0.3156    0.0435 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -3.5190   -0.7571   -0.8481 C   0  0  0  0  0  0  0  0  0  0  0  0
+    3.5170    0.7568   -0.8478 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -0.1548    0.8649    2.1342 H   0  0  0  0  0  0  0  0  0  0  0  0
+    0.1601   -0.8435    2.1593 H   0  0  0  0  0  0  0  0  0  0  0  0
+   -2.3089    1.3938    1.4913 H   0  0  0  0  0  0  0  0  0  0  0  0
+    2.3053   -1.3909    1.4943 H   0  0  0  0  0  0  0  0  0  0  0  0
+   -2.4415   -2.4213   -1.6818 H   0  0  0  0  0  0  0  0  0  0  0  0
+    2.4469    2.4191   -1.6835 H   0  0  0  0  0  0  0  0  0  0  0  0
+   -4.4070   -0.9574   -1.4422 H   0  0  0  0  0  0  0  0  0  0  0  0
+    4.4050    0.9570   -1.4418 H   0  0  0  0  0  0  0  0  0  0  0  0
+    0.2961   -2.2262    0.4641 H   0  0  0  0  0  0  0  0  0  0  0  0
+    0.3872    2.8487   -1.0397 H   0  0  0  0  0  0  0  0  0  0  0  0
+  1 14  1  0  0  0  0
+  2 15  1  0  0  0  0
+  3  8  1  0  0  0  0
+  3 26  1  0  0  0  0
+  4  9  1  0  0  0  0
+  4 27  1  0  0  0  0
+  5  6  1  0  0  0  0
+  5  7  1  0  0  0  0
+  5 18  1  0  0  0  0
+  5 19  1  0  0  0  0
+  6  8  2  0  0  0  0
+  6 10  1  0  0  0  0
+  7  9  2  0  0  0  0
+  7 11  1  0  0  0  0
+  8 12  1  0  0  0  0
+  9 13  1  0  0  0  0
+ 10 14  2  0  0  0  0
+ 10 20  1  0  0  0  0
+ 11 15  2  0  0  0  0
+ 11 21  1  0  0  0  0
+ 12 16  2  0  0  0  0
+ 12 22  1  0  0  0  0
+ 13 17  2  0  0  0  0
+ 13 23  1  0  0  0  0
+ 14 16  1  0  0  0  0
+ 15 17  1  0  0  0  0
+ 16 24  1  0  0  0  0
+ 17 25  1  0  0  0  0
+M  END
+> <PUBCHEM_COMPOUND_CID>
+3037
+
+> <PUBCHEM_CONFORMER_RMSD>
+0.6
+
+> <PUBCHEM_CONFORMER_DIVERSEORDER>
+8
+10
+12
+1
+7
+5
+11
+3
+6
+9
+4
+2
+
+> <PUBCHEM_MMFF94_PARTIAL_CHARGES>
+25
+1 -0.18
+10 -0.15
+11 -0.15
+12 -0.15
+13 -0.15
+14 0.18
+15 0.18
+16 -0.15
+17 -0.15
+2 -0.18
+20 0.15
+21 0.15
+22 0.15
+23 0.15
+24 0.15
+25 0.15
+26 0.45
+27 0.45
+3 -0.53
+4 -0.53
+5 0.29
+6 -0.14
+7 -0.14
+8 0.08
+9 0.08
+
+> <PUBCHEM_EFFECTIVE_ROTOR_COUNT>
+2
+
+> <PUBCHEM_PHARMACOPHORE_FEATURES>
+4
+1 3 donor
+1 4 donor
+6 6 8 10 12 14 16 rings
+6 7 9 11 13 15 17 rings
+
+> <PUBCHEM_HEAVY_ATOM_COUNT>
+17
+
+> <PUBCHEM_ATOM_DEF_STEREO_COUNT>
+0
+
+> <PUBCHEM_ATOM_UDEF_STEREO_COUNT>
+0
+
+> <PUBCHEM_BOND_DEF_STEREO_COUNT>
+0
+
+> <PUBCHEM_BOND_UDEF_STEREO_COUNT>
+0
+
+> <PUBCHEM_ISOTOPIC_ATOM_COUNT>
+0
+
+> <PUBCHEM_COMPONENT_COUNT>
+1
+
+> <PUBCHEM_CACTVS_TAUTO_COUNT>
+5
+
+> <PUBCHEM_CONFORMER_ID>
+00000BDD00000008
+
+> <PUBCHEM_MMFF94_ENERGY>
+44.6858
+
+> <PUBCHEM_FEATURE_SELFOVERLAP>
+20.297
+
+> <PUBCHEM_SHAPE_FINGERPRINT>
+10062212 137 18261117369936506423
+104564 63 17986963035811110412
+11458722 120 18339359768245870841
+11471102 22 5472872458301843344
+11578080 2 18190204380446433792
+116883 192 18265608969609498196
+12236239 1 18410856576819659107
+12592029 89 18338223951597366363
+13549 16 18410575084668353682
+13693222 15 6555421915516066822
+13764800 53 14189033175566991199
+14115302 16 18186237320680093898
+14341114 328 10087642619424135543
+14787075 74 9511159855286719151
+14993402 34 18410855451538227223
+15099037 51 18340768233908588503
+15207287 21 15719111361650760302
+15375358 24 15647053767618106914
+15775835 57 18272650117329930317
+16945 1 17906452130063974618
+17834072 14 15936410035134206066
+18186145 218 17132117918276567720
+19422 9 18271525295227750719
+20279233 1 15719389529571237654
+20645476 183 18339080393619327415
+23402539 116 18186809105365620101
+23402655 69 18342736308283284156
+23559900 14 17603590712323212176
+25 1 17561083592297532664
+26918003 58 6266902359448424189
+296302 2 15213020427345972082
+3082319 5 18338798905472319583
+34934 24 18341891845236497020
+633830 44 17703790310130762689
+74978 22 18266740181857992718
+7832392 63 18340206284835898173
+81228 2 15720767252053392762
+9981440 41 17403743242177431832
+
+> <PUBCHEM_SHAPE_MULTIPOLES>
+341.85
+8.38
+1.9
+1.1
+0.02
+0
+-1.15
+1.94
+-0.01
+0
+-0.39
+-4.15
+0.01
+0
+
+> <PUBCHEM_SHAPE_SELFOVERLAP>
+722.787
+
+> <PUBCHEM_SHAPE_VOLUME>
+193
+
+> <PUBCHEM_COORDINATE_TYPE>
+2
+5
+255
+
+$$$$
+
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/Score.sdf	Tue May 23 03:09:35 2017 -0400
@@ -0,0 +1,139 @@
+3037
+  CDK     0523170409
+
+ 27 28  0  0  0  0  0  0  0  0999 V2000
+   -4.8550    1.3401    0.2120 Cl  0  0  0  0  0  0  0  0  0  0  0  0
+    4.8529   -1.3406    0.2121 Cl  0  0  0  0  0  0  0  0  0  0  0  0
+   -0.1809   -2.1668   -0.3789 O   0  0  0  0  0  0  0  0  0  0  0  0
+    0.1788    2.1664   -0.3787 O   0  0  0  0  0  0  0  0  0  0  0  0
+   -0.0011   -0.0002    1.4744 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -1.2222   -0.2738    0.6597 C   0  0  0  0  0  0  0  0  0  0  0  0
+    1.2377    0.2772    0.6480 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -1.2586   -1.3462   -0.2316 C   0  0  0  0  0  0  0  0  0  0  0  0
+    1.2565    1.3457   -0.2314 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -2.3343    0.5568    0.7972 C   0  0  0  0  0  0  0  0  0  0  0  0
+    2.3322   -0.5574    0.7972 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -2.4069   -1.5879   -0.9855 C   0  0  0  0  0  0  0  0  0  0  0  0
+    2.4048    1.5875   -0.9852 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -3.4827    0.3152    0.0433 C   0  0  0  0  0  0  0  0  0  0  0  0
+    3.4807   -0.3156    0.0435 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -3.5190   -0.7571   -0.8481 C   0  0  0  0  0  0  0  0  0  0  0  0
+    3.5170    0.7568   -0.8478 C   0  0  0  0  0  0  0  0  0  0  0  0
+   -0.1548    0.8649    2.1342 H   0  0  0  0  0  0  0  0  0  0  0  0
+    0.1601   -0.8435    2.1593 H   0  0  0  0  0  0  0  0  0  0  0  0
+   -2.3089    1.3938    1.4913 H   0  0  0  0  0  0  0  0  0  0  0  0
+    2.3053   -1.3909    1.4943 H   0  0  0  0  0  0  0  0  0  0  0  0
+   -2.4415   -2.4213   -1.6818 H   0  0  0  0  0  0  0  0  0  0  0  0
+    2.4469    2.4191   -1.6835 H   0  0  0  0  0  0  0  0  0  0  0  0
+   -4.4070   -0.9574   -1.4422 H   0  0  0  0  0  0  0  0  0  0  0  0
+    4.4050    0.9570   -1.4418 H   0  0  0  0  0  0  0  0  0  0  0  0
+    0.2961   -2.2262    0.4641 H   0  0  0  0  0  0  0  0  0  0  0  0
+    0.3872    2.8487   -1.0397 H   0  0  0  0  0  0  0  0  0  0  0  0
+  1 14  1  0  0  0  0 
+  2 15  1  0  0  0  0 
+  3  8  1  0  0  0  0 
+  3 26  1  0  0  0  0 
+  4  9  1  0  0  0  0 
+  4 27  1  0  0  0  0 
+  5  6  1  0  0  0  0 
+  5  7  1  0  0  0  0 
+  5 18  1  0  0  0  0 
+  5 19  1  0  0  0  0 
+  6  8  2  0  0  0  0 
+  6 10  1  0  0  0  0 
+  7  9  2  0  0  0  0 
+  7 11  1  0  0  0  0 
+  8 12  1  0  0  0  0 
+  9 13  1  0  0  0  0 
+ 10 14  2  0  0  0  0 
+ 10 20  1  0  0  0  0 
+ 11 15  2  0  0  0  0 
+ 11 21  1  0  0  0  0 
+ 12 16  2  0  0  0  0 
+ 12 22  1  0  0  0  0 
+ 13 17  2  0  0  0  0 
+ 13 23  1  0  0  0  0 
+ 14 16  1  0  0  0  0 
+ 15 17  1  0  0  0  0 
+ 16 24  1  0  0  0  0 
+ 17 25  1  0  0  0  0 
+M  END
+> <cdk:Title>
+3037
+
+> <cdk:Remark>
+null
+
+> <PUBCHEM_COMPOUND_CID>
+3037
+
+> <PUBCHEM_CONFORMER_RMSD>
+0.6
+
+> <PUBCHEM_CONFORMER_DIVERSEORDER>
+810121751136942
+
+> <PUBCHEM_MMFF94_PARTIAL_CHARGES>
+251 -0.1810 -0.1511 -0.1512 -0.1513 -0.1514 0.1815 0.1816 -0.1517 -0.152 -0.1820 0.1521 0.1522 0.1523 0.1524 0.1525 0.1526 0.4527 0.453 -0.534 -0.535 0.296 -0.147 -0.148 0.089 0.08
+
+> <PUBCHEM_EFFECTIVE_ROTOR_COUNT>
+2
+
+> <PUBCHEM_PHARMACOPHORE_FEATURES>
+41 3 donor1 4 donor6 6 8 10 12 14 16 rings6 7 9 11 13 15 17 rings
+
+> <PUBCHEM_HEAVY_ATOM_COUNT>
+17
+
+> <PUBCHEM_ATOM_DEF_STEREO_COUNT>
+0
+
+> <PUBCHEM_ATOM_UDEF_STEREO_COUNT>
+0
+
+> <PUBCHEM_BOND_DEF_STEREO_COUNT>
+0
+
+> <PUBCHEM_BOND_UDEF_STEREO_COUNT>
+0
+
+> <PUBCHEM_ISOTOPIC_ATOM_COUNT>
+0
+
+> <PUBCHEM_COMPONENT_COUNT>
+1
+
+> <PUBCHEM_CACTVS_TAUTO_COUNT>
+5
+
+> <PUBCHEM_CONFORMER_ID>
+00000BDD00000008
+
+> <PUBCHEM_MMFF94_ENERGY>
+44.6858
+
+> <PUBCHEM_FEATURE_SELFOVERLAP>
+20.297
+
+> <PUBCHEM_SHAPE_FINGERPRINT>
+10062212 137 18261117369936506423104564 63 1798696303581111041211458722 120 1833935976824587084111471102 22 547287245830184334411578080 2 18190204380446433792116883 192 1826560896960949819612236239 1 1841085657681965910712592029 89 1833822395159736636313549 16 1841057508466835368213693222 15 655542191551606682213764800 53 1418903317556699119914115302 16 1818623732068009389814341114 328 1008764261942413554314787075 74 951115985528671915114993402 34 1841085545153822722315099037 51 1834076823390858850315207287 21 1571911136165076030215375358 24 1564705376761810691415775835 57 1827265011732993031716945 1 1790645213006397461817834072 14 1593641003513420606618186145 218 1713211791827656772019422 9 1827152529522775071920279233 1 1571938952957123765420645476 183 1833908039361932741523402539 116 1818680910536562010123402655 69 1834273630828328415623559900 14 1760359071232321217625 1 1756108359229753266426918003 58 6266902359448424189296302 2 152130204273459720823082319 5 1833879890547231958334934 24 18341891845236497020633830 44 1770379031013076268974978 22 182667401818579927187832392 63 1834020628483589817381228 2 157207672520533927629981440 41 17403743242177431832
+
+> <PUBCHEM_SHAPE_MULTIPOLES>
+341.858.381.91.10.020-1.151.94-0.010-0.39-4.150.010
+
+> <PUBCHEM_SHAPE_SELFOVERLAP>
+722.787
+
+> <PUBCHEM_SHAPE_VOLUME>
+193
+
+> <PUBCHEM_COORDINATE_TYPE>
+25255
+
+> <NATURAL_PRODUCT_LIKENESS_SCORE>
+-00.1511
+
+> <UNIQUE_MOLECULE_ID>
+eb878dfc-1074-456a-ab86-c7fc4f84bf2a
+
+$$$$
--- a/tool_dependencies.xml	Thu Aug 15 03:38:29 2013 -0400
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,17 +0,0 @@
-<tool_dependency>
-    <package name="np-likeness-scorer" version="2.0">
-        <install version="1.0">
-            <actions>
-                <action type="download_by_url">http://downloads.sourceforge.net/project/np-likeness/Natural_Product_Likeness_calculator_2.0.zip</action>
-               <action type="move_file">
-                    <source>Natural_Product_Likeness_calculator_2.0/NP-Likeness-2.0.jar</source>
-                    <destination>$INSTALL_DIR</destination>
-                </action>
-                <action type="set_environment">
-                    <environment_variable name="NPLS_JAR_PATH" action="set_to">$INSTALL_DIR</environment_variable>
-                </action>
-            </actions>
-        </install>
-        <readme>Opsin requires a JAVA (1.5+) runtime evironment.</readme>
-    </package>
-</tool_dependency>