diff silicos_qed.xml @ 1:ab73abead7fa draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/chemicaltoolbox/silicos-it/qed commit ed9b6859de648aa5f7cde483732f5df20aaff90e
author bgruening
date Tue, 07 May 2019 13:41:23 -0400
parents 5ccd3a432785
children fc45bf8b6e01
line wrap: on
line diff
--- a/silicos_qed.xml	Tue May 23 03:57:14 2017 -0400
+++ b/silicos_qed.xml	Tue May 07 13:41:23 2019 -0400
@@ -1,8 +1,8 @@
-<tool id="ctb_silicos_qed" name="Drug-likeness" version="0.1">
+<tool id="ctb_silicos_qed" name="Drug-likeness" version="0.2">
     <description>quantitative estimation (QED)</description>
     <!--parallelism method="multi" split_inputs="infile" split_mode="to_size" split_size="10000" shared_inputs="" merge_outputs="outfile"></parallelism-->
     <requirements>
-        <requirement type="package" version="2015.09.2">rdkit</requirement>
+        <requirement type="package" version="2019.03.1">rdkit</requirement>
     </requirements>
     <command detect_errors="aggressive">
 <![CDATA[
@@ -15,13 +15,13 @@
 ]]>
     </command>
     <inputs>
-        <param format="smi,sdf" name="infile" type="data" label="Molecule data in SD- or SMILES-format" help="Dataset missing? See TIP below"/>
-        <param name="method" type="select" label="Method">
+        <param format="smi,sdf" name="infile" type="data" label="Molecule data in SDF or SMILES format" help="Dataset missing? See TIP below"/>
+        <param name="method" type="select" label="Method" help="Method for weighting features">
             <option value="max">Max weight (QEDw,max)</option>
             <option value="mean">Mean weight (QEDw,mo)</option>
-            <option value="unweighted">unweighted (QEDw,u)</option>
+            <option value="unweighted">Unweighted (QEDw,u)</option>
         </param>
-        <param name="header" type="boolean" label="Include the descriptor name as header" truevalue="--header" falsevalue="" checked="false" />
+        <param name="header" type="boolean" label="Include the descriptor names as header" truevalue="--header" falsevalue="" checked="false" />
     </inputs>
     <outputs>
         <data format="tabular" name="outfile" />
@@ -56,21 +56,37 @@
 
 **What this tool does**
 
-Estimates the drug-likeness of molecules and reports a score. Comes with three applicable varieties (QED\ :sub:`w,mo`\ , QED\ :sub:`w,max`\ , QED\ :sub:`w,u` ).
+Estimates the drug-likeness of molecules, based on eight commonly used molecular
+properties, and reports a score between 0 (all properties unfavourable) to 1 (all
+properties favourable). Two possible methods to weight the features are available
+(QED\ :sub:`w,mo`\ , QED\ :sub:`w,max`\), as well as an option to leave features
+unweighted (QED\ :sub:`w,u`).
+
+The eight properties used are: molecular weight (MW), octanol–water partition 
+coefficient (ALOGP), number of hydrogen bond donors (HBDs), number of hydrogen
+bond acceptors (HBAs), molecular polar surface area (PSA), number of rotatable
+bonds (ROTBs), number of aromatic rings (AROMs) and number of structural alerts
+(ALERTS).
 
 -----
 
 .. class:: warningmark
 
-**HINT**
+**Hint**
 
-- All invalid, blank and comment lines are skipped when performing computations. The number of skipped lines is displayed in the resulting history item.
+All invalid, blank and comment lines are skipped when performing computations. The
+number of skipped lines is displayed in the resulting history item. The method refers
+to a set of weights that can be applied to the features. These are derived in the
+`original paper`_ describing QED.
+
 
 - QED\ :sub:`w,max` using the set of weights that give maximal information content
 
 - QED\ :sub:`w,mo` using the mean weights of the optimal 1,000 weight combinations that give the highest information content
 
-- QED\ :sub:`w,u` with all weights as unity, hence unweighted.
+- QED\ :sub:`w,u` with all weights as unity i.e. unweighted.
+
+.. _original paper: https://www.nature.com/articles/nchem.1243
 
 -----
 
@@ -79,11 +95,11 @@
 **Input**
 
 
-| - `SD-Format`_
-| - `SMILES Format`_
+| - `SDF format`_
+| - `SMILES format`_
 
-.. _SD-Format: http://en.wikipedia.org/wiki/Chemical_table_file
-.. _SMILES Format: http://en.wikipedia.org/wiki/Simplified_molecular_input_line_entry_specification
+.. _SDF format: http://en.wikipedia.org/wiki/Chemical_table_file
+.. _SMILES format: http://en.wikipedia.org/wiki/Simplified_molecular_input_line_entry_specification
 
 -----
 
@@ -91,6 +107,9 @@
 
 **Output**
 
+A table listing the values of the eight features, the QED score, the name of the
+molecule, and the number of Lipinski rules which the molecule obeys. 
+
 +--------+-------+-----+-----+--------+------+------+--------+-------+----------------+-----+
 |   MW   | ALOGP | HBA | HBD |   PSA  | ROTB | AROM | ALERTS |  QED  |      NAME      | Ro5 |
 +========+=======+=====+=====+========+======+======+========+=======+================+=====+