comparison galaxy_stubs/FingerprintSimilaritySearch.xml @ 2:605370bc1def draft default tip

Uploaded
author luis
date Tue, 12 Jul 2016 12:33:33 -0400
parents
children
comparison
equal deleted inserted replaced
1:31013b5cd066 2:605370bc1def
1 <?xml version='1.0' encoding='UTF-8'?>
2 <!--This is a configuration file for the integration of a tools into Galaxy (https://galaxyproject.org/). This file was automatically generated using CTD2Galaxy.-->
3 <!--Proposed Tool Section: [Chemoinformatics]-->
4 <tool id="FingerprintSimilaritySearch" name="FingerprintSimilaritySearch" version="1.1.0">
5 <description>calculate similar molecules in a library</description>
6 <macros>
7 <token name="@EXECUTABLE@">FingerprintSimilaritySearch</token>
8 <import>macros.xml</import>
9 </macros>
10 <expand macro="stdio"/>
11 <expand macro="requirements"/>
12 <command>FingerprintSimilaritySearch
13
14 #if $param_t:
15 -t $param_t
16 #end if
17 #if $param_q:
18 -q $param_q
19 #end if
20 #if $param_o:
21 -o $param_o
22 #end if
23 #if $param_f:
24 -f $param_f
25 #end if
26 #if $param_fp_col:
27 -fp_col $param_fp_col
28 #end if
29 #if $param_id_col:
30 -id_col $param_id_col
31 #end if
32 #if $param_fp_tag:
33 -fp_tag "$param_fp_tag"
34 #end if
35 #if $param_id_tag:
36 -id_tag "$param_id_tag"
37 #end if
38 #if $param_tc:
39 -tc $param_tc
40 #end if
41 #if $param_nt:
42 -nt "$param_nt"
43 #end if
44 #if $param_bs:
45 -bs $param_bs
46 #end if
47 #if $param_sdf_out:
48 -sdf_out $param_sdf_out
49 #end if
50 </command>
51 <inputs>
52 <param name="param_t" type="data" format="smi.gz,csv,sdf.gz,sdf,txt.gz,smi,txt,csv.gz" optional="False" value="&lt;class 'CTDopts.CTDopts._Null'&gt;" label="Target library input file" help="(-t) "/>
53 <param name="param_q" type="data" format="smi.gz,csv,sdf.gz,sdf,txt.gz,smi,txt,csv.gz" optional="False" value="&lt;class 'CTDopts.CTDopts._Null'&gt;" label="Query library input file" help="(-q) "/>
54 <param name="param_f" type="integer" min="1" max="2" optional="False" value="0" label="Fingerprint format [1 = binary bitstring, 2 = comma separated feature list]" help="(-f) "/>
55 <param name="param_fp_col" type="integer" value="-1" label="Column number for comma separated smiles input which contains the fingerprint" help="(-fp_col) "/>
56 <param name="param_id_col" type="integer" value="-1" label="Column number for comma separated smiles input which contains the molecule identifie" help="(-id_col) "/>
57 <param name="param_fp_tag" type="text" size="30" value=" " label="Tag name for SDF input which contains the fingerprint" help="(-fp_tag) ">
58 <sanitizer>
59 <valid initial="string.printable">
60 <remove value="'"/>
61 <remove value="&quot;"/>
62 </valid>
63 </sanitizer>
64 </param>
65 <param name="param_id_tag" type="text" size="30" value=" " label="Tag name for SDF input which contains the molecule identifie" help="(-id_tag) ">
66 <sanitizer>
67 <valid initial="string.printable">
68 <remove value="'"/>
69 <remove value="&quot;"/>
70 </valid>
71 </sanitizer>
72 </param>
73 <param name="param_tc" type="float" value="0.7" label="Tanimoto cutoff [default: 0.7]" help="(-tc) "/>
74 <param name="param_nt" type="text" size="30" value="1" label="Number of parallel threads to use" help="(-nt) To use all possible threads enter &lt;max&gt; [default: 1]">
75 <sanitizer>
76 <valid initial="string.printable">
77 <remove value="'"/>
78 <remove value="&quot;"/>
79 </valid>
80 </sanitizer>
81 </param>
82 <param name="param_bs" type="integer" value="500" label="Block size [default: 500]" help="(-bs) "/>
83 <param name="param_sdf_out" type="integer" min="0" max="1" optional="True" value="0" label="If query file has SD format, this flag activates writing of nearest neighbours as a new CSV tag in a copy of the query SD file" help="(-sdf_out) "/>
84 </inputs>
85 <expand macro="advanced_options"/>
86 <outputs>
87 <data name="param_o" metadata_source="param_t" format="input"/>
88 </outputs>
89 <help>This tool calculates all nearest neighbours above a similarity cutoff for given query molecules in a compound library on the basis of 2D binary fingerprints.
90 The first library to specify (i1) is the compound library to be searched, the second library (i2) is conseiderd as the query compounds.
91 Both files have to be comma separated values (csv) files and the binary fingerprints have to be encoded as feature lists or as binary bit strings.
92
93 WARNING: If similarity cutoff is chosen to be 0.0, the output will be the entire similarity matrix and has a size of n*m with n=|i1| and m=|i2|.
94
95 ======================================================================================================================================================
96
97 Examples:
98
99 $ FingerprintSimilaritySearch -t target.sdf -q query.sdf -o results -fp_tag FPRINT -f 1 -id_tag NAME
100 tries to extract fingerprints as binary bitstrings (-f 1) from tag &lt;FPRINT&gt; and compound IDs from tag &lt;NAME&gt; of target.sdf and query.sdf.
101 A similarity search is performed for all query molecules against all target molecules and pairs with similarity above Tanimoto cutoff 0.7 are written to outfile (results).
102
103 $ FingerprintSimilaritySearch -t target.sdf -q query.sdf -o results -fp_tag FPRINT -f 1 -id_tag NAME -sdf_out
104 tries to extract fingerprints as binary bitstrings (-f 1) from tag &lt;FPRINT&gt; and compound IDs from tag &lt;NAME&gt; of target.sdf and query.sdf.
105 A similarity search is performed for all query molecules against all target molecules and pairs with similarity above Tanimoto cutoff 0.7
106 are added as a new SD tag to output file 'NN_TAGGED_query.sdf' as a list of TargetID:Similarity pairs.
107
108 $ FingerprintSimilaritySearch -t target.sdf -q query.smi -o results -fp_tag FPRINT -f 1 -id_tag NAME -fp_col 2
109 tries to extract fingerprints as binary bitstrings (-f 1) from tag &lt;FPRINT&gt; and compound IDs from tag &lt;NAME&gt; of target.sdf
110 and fingerprints as binary bitstrings of space separated query file from column 2 (-fp_col 2).
111 A similarity search is performed for all query molecules against all target molecules and pairs with similarity above Tanimoto cutoff 0.7 are written to outfile (results).
112
113 </help>
114 </tool>