view osra.xml @ 4:aeb1f7daa7c2 draft

planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/chemicaltoolbox/osra commit 74daed54894d9769a251a2ca6a46d96b7a27e461
author bgruening
date Thu, 09 Nov 2017 03:41:42 -0500
parents d2490712b67d
children b2edf498e8fb
line wrap: on
line source

<tool id="ctb_osra" name="Molecule recognition" version="2.1.0">
    <description>in Images or PDF documents (OSRA)</description>
    <!-- Runtime dependency: the osra package, requested with the same version string as the tool's own version attribute. -->
    <requirements>
        <requirement type="package" version="2.1.0">osra</requirement>
    </requirements>
    <command detect_errors="aggressive">
<![CDATA[
## Resolve the share directory that sits next to the directory holding the
## osra executable. It is looked up once and kept in a quoted shell variable
## so that an installation path containing whitespace is not word-split.
OSRA_SHARE="\$(dirname "\$(which osra)")/../share" &&

## Run the recognition; osra writes its result to stdout, which is redirected
## into the output dataset. The three boolean parameters expand either to
## their flag or to an empty string.
osra
  -f '$oformat'
  '$infile'
  -l "\$OSRA_SHARE/spelling.txt"
  -a "\$OSRA_SHARE/superatom.txt"
  $confidence
  $adaptive
  $thinning
  > '$outfile'
]]>
    </command>
    <inputs>
        <!-- Source document, passed to osra as its positional argument. -->
        <param name="infile" type="data" format="pdf" label="PDF with molecules"/>
        <!-- Value is handed to osra through -f and also selects the output datatype. -->
        <param name="oformat" type="select" label="Output molecule format">
            <option value="can">SMILES</option>
            <option value="sdf">SDF</option>
        </param>
        <!-- Optional switches: each boolean expands to its flag when checked and to an empty string otherwise. -->
        <param name="confidence" type="boolean"
            label="Print out confidence estimate"
            help="(-p)"
            truevalue="-p" falsevalue="" checked="true"/>
        <param name="adaptive" type="boolean"
            label="Adaptive thresholding pre-processing, useful for low light/low contrast images"
            help="(-i)"
            truevalue="-i" falsevalue="" checked="false"/>
        <param name="thinning" type="boolean"
            label="Additional thinning/scaling down of low quality documents"
            help="(-j)"
            truevalue="-j" falsevalue="" checked="false"/>
    </inputs>
    <outputs>
        <!-- Single result dataset. Its datatype defaults to sdf and is switched
             to smi when the oformat parameter is set to "can". -->
        <data name="outfile" format="sdf">
            <change_format>
                <when input="oformat" value="can" format="smi"/>
            </change_format>
        </data>
    </outputs>
    <tests>
        <!-- SDF output for CID_2244.pdf, compared against osra_on_CID2244.sdf. -->
        <test>
            <param name="infile" value="CID_2244.pdf" ftype="pdf"/>
            <param name="oformat" value="sdf"/>
            <output name="outfile" ftype="sdf" file="osra_on_CID2244.sdf"/>
        </test>
        <!-- Disabled test: SMILES output from a PNG input. It is kept commented
             out for the reason recorded inside the block below.
             NOTE(review): the infile parameter currently declares format="pdf"
             only, so re-enabling this would presumably also need PNG accepted
             as an input format. TODO confirm. -->
        <!--test>
            PNGs producing a core-dump in osra
            <param name="infile" value="2008001635_153_chem.png"/>
            <param name="oformat" value="can"/>
            <output name="outfile" ftype="smi" file="2008001635_153_chem.smi"/>
        </test-->
    </tests>
    <help>
<![CDATA[

.. class:: infomark

**What this tool does**

OSRA_ (Optical Structure Recognition Application) is a utility designed to convert graphical representations of chemical structures into SMILES or SDF. It generates a SMILES or SDF representation of every molecular structure image found in a document that GraphicsMagick can parse.

.. _OSRA: http://cactus.nci.nih.gov/osra/

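**Reference**

`Optical Structure Recognition Software To Recover Chemical Information: OSRA, An Open Source Solution`_

.. _`Optical Structure Recognition Software To Recover Chemical Information: OSRA, An Open Source Solution`: http://pubs.acs.org/doi/abs/10.1021/ci800067r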
]]>
    </help>
    <citations>
        <!-- Journal article whose URL appears in the help text, cited by DOI so
             Galaxy can resolve the full reference. -->
        <citation type="doi">10.1021/ci800067r</citation>
        <!-- Workshop paper, supplied as a literal BibTeX entry. -->
        <citation type="bibtex">
            @inproceedings{filippov2010improvements,
            title={Improvements in Optical Structure Recognition Application},
            author={Filippov, Igor V and Nicklaus, Marc C and Kinney, John},
            booktitle={Document Analysis Systems Workshop},
            year={2010}
            }
        </citation>
    </citations>
</tool>