annotate osra.xml @ 0:34ae5f2ae450 draft

Uploaded
author bgruening
date Thu, 15 Aug 2013 03:30:25 -0400
parents
children d2490712b67d
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
1 <tool id="ctb_osra" name="Molecule recognition" version="0.3">
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
2 <description>in Images or PDF documents (OSRA)</description>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
3 <requirements>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
4 <requirement type="package" version="2.0.0">osra</requirement>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
5 <requirement type="package" version="2.3.2">openbabel</requirement>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
6 <requirement type="package" version="1.3.18">graphicsmagick</requirement>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
7 </requirements>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
8 <command interpreter='python'>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
9 ## OSRA_DATA_FILES is set during the toolshed Installation
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
10 ## if it is not set, use the standard configuration and hope the best
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
11 osra.py -f $oformat $infile
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
12 -l \$OSRA_DATA_FILES/spelling.txt -a \$OSRA_DATA_FILES/superatom.txt
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
13
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
14 ## further additions of OSRA parameter should go after -l and -a
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
15 ## because -l and -a can be removed by the python wrapper
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
16
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
17 $confidence
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
18 $adaptive
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
19 $thinning
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
20
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
21 > $outfile
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
22 </command>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
23 <inputs>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
24 <param name="infile" type="data" format="png,pdf" label="Image or PDF with molecules"/>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
25 <param name="oformat" type="select" label="Output molecule format">
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
26 <option value="can">SMILES</option>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
27 <option value="sdf">SDF</option>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
28 </param>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
29 <param name="confidence" type="boolean" label="Print out confidence estimate (-p)" truevalue="-p" falsevalue="" checked="true" />
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
30 <param name="adaptive" type="boolean" label="Adaptive thresholding pre-processing, useful for low light/low contrast images (-i)" truevalue="-i" falsevalue="" checked="false" />
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
31 <param name="thinning" type="boolean" label="Additional thinning/scaling down of low quality documents (-j)" truevalue="-j" falsevalue="" checked="false" />
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
32
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
33 </inputs>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
34 <outputs>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
35 <data name="outfile" type="data" format="sdf">
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
36 <change_format>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
37 <when input="oformat" value="can" format="smi"/>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
38 </change_format>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
39 </data>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
40 </outputs>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
41 <tests>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
42 <test>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
43 <param name="infile" ftype="png" value="CID_2244.png"/>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
44 <param name="oformat" value="sdf"/>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
45 <output name="outfile" ftype="sdf" file="osra_on_CID2244.sdf"/>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
46 </test>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
47 <test>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
48 <param name="infile" ftype="png" value="2008001635_153_chem.png"/>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
49 <param name="oformat" value="can"/>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
50 <output name="outfile" ftype="smi" file="2008001635_153_chem.smi"/> <!-- oformat="can" switches the output datatype to smi via change_format, so the expected ftype is smi, not sdf -->
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
51 </test>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
52
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
53 </tests>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
54 <help>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
55
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
56 .. class:: infomark
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
57
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
58 **What this tool does**
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
59
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
60 OSRA_ (Optical Structure Recognition Application) is a utility designed to convert graphical representations of chemical structures into SMILES or SDF. It generates the SMILES or SDF representation of any molecular structure image within a document which is parseable by GraphicMagick.
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
61
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
62 .. _OSRA: http://cactus.nci.nih.gov/osra/
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
63
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
64 -----
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
65
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
66 .. class:: infomark
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
67
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
68 **Cite**
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
69
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
70 Igor V Filippov and Marc C Nicklaus - `Optical Structure Recognition Software To Recover Chemical Information: OSRA, An Open Source Solution`_
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
71
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
72 .. _`Optical Structure Recognition Software To Recover Chemical Information: OSRA, An Open Source Solution`: http://pubs.acs.org/doi/abs/10.1021/ci800067r
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
73 </help>
34ae5f2ae450 Uploaded
bgruening
parents:
diff changeset
74 </tool>