Mercurial > repos > bgruening > chemfp
diff nxn_clustering.xml @ 7:0d88631bb7de draft
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/chemicaltoolbox/chemfp commit ed9b6859de648aa5f7cde483732f5df20aaff90e
author | bgruening |
---|---|
date | Tue, 07 May 2019 13:32:50 -0400 |
parents | 70b071de9bee |
children | 198b1e30c739 |
line wrap: on
line diff
--- a/nxn_clustering.xml Fri Mar 23 03:26:33 2018 -0400 +++ b/nxn_clustering.xml Tue May 07 13:32:50 2019 -0400 @@ -1,10 +1,9 @@ -<tool id="ctb_chemfp_nxn_clustering" name="NxN Clustering" version="0.4"> +<tool id="ctb_chemfp_nxn_clustering" name="NxN clustering" version="1.5"> <description>of molecular fingerprints</description> <requirements> - <requirement type="package" version="1.1p1">chemfp</requirement> - <requirement type="package" version="2">python</requirement> - <requirement type="package" version="2.0.2">matplotlib</requirement> - <requirement type="package" version="0.19.0">scipy</requirement> + <requirement type="package" version="1.5">chemfp</requirement> + <requirement type="package" version="2.2.3">matplotlib</requirement> + <requirement type="package" version="1.2.1">scipy</requirement> <requirement type="package" version="2.4.1">openbabel</requirement> </requirements> <command detect_errors="exit_code"> @@ -16,43 +15,44 @@ --cluster '$image' #end if #if str($output_files) in ['both', 'matrix']: - --smatrix '$smilarity_matrix' + --smatrix '$similarity_matrix' #end if --oformat '$oformat' ]]> </command> <inputs> - <param name="infile" type="data" format="fps" label="Finperprint dataset" help="Dataset missing? See TIP below"/> - <param name='threshold' type='float' value='0.0' /> + <param name="infile" type="data" format="fps" label="Fingerprint dataset" help="Dataset missing? See TIP below"/> + <param name='threshold' label='Threshold' type='float' value='0.0' /> <param name='oformat' type='select' format='text' label="Format of the resulting picture"> <option value='png'>PNG</option> <option value='svg'>SVG</option> </param> <param name='output_files' type='select' format='text' label="Output options"> - <option value='both'>NxN matrix and Image</option> + <option value='both'>NxN matrix and image</option> <option value='image'>Image</option> - <option value='matrix'>NxN Matrix</option> + <option value='matrix'>NxN ḿatrix</option> </param> </inputs> <outputs> - <data name="image" format="svg" label="${tool.name} on ${on_string} - Cluster Image"> + <data name="image" format="svg" label="${tool.name} on ${on_string} - Dendrogram Image"> <filter>output_files == "both" or output_files == "image"</filter> <change_format> <when input="oformat" value="png" format="png"/> </change_format> </data> - <data name="smilarity_matrix" format="binary" label="${tool.name} on ${on_string} - Similarity Matrix"> + <data name="similarity_matrix" format="txt" label="${tool.name} on ${on_string} - Similarity Matrix"> <filter>output_files == "both" or output_files == "matrix"</filter> </data> </outputs> <tests> <test> <param name="infile" ftype="fps" value="targets.fps" /> - <param name='treshold' value='0.75' /> + <param name='threshold' value='0.75' /> <param name='oformat' value='svg' /> - <param name='output_files' value='image' /> - <output name="image" file='NxN_Clustering_on_q.svg' ftype="svg" compare="sim_size"/> + <param name='output_files' value='both' /> + <output name="image" file='NxN_Clustering_on_q.svg' ftype="svg"/> + <output name="similarity_matrix" file='NxN_Clustering_on_q.txt' ftype="txt"/> </test> </tests> <help> @@ -62,8 +62,7 @@ **What this tool does** -Generating hierarchical clusters and visualizing clusters with dendrograms. -For the clustering and the fingerprint handling the chemfp_ project is used. +Based on a set of fingerprints, generates a square self-similarity (NxN) matrix, as well as a dendrogram visualizing the clusters derived from it using hierarchical clustering. For the clustering and the fingerprint handling the chemfp_ project is used. .. _chemfp: http://chemfp.com/ @@ -73,7 +72,7 @@ **Hint** -The plotting of the cluster image is sensible only with a small dataset. +The plotting of the dendrogram is sensible only with a small dataset - if more than around 20 fingerprints are used the plot will be unreadable. -----