Mercurial > repos > bgruening > ctb_im_max_min_picker
diff max_min_picker.xml @ 0:2d9ca306538d draft
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/chemicaltoolbox/im-pipelines commit 598dd288a384481b7602a0f6322c5081dc8da5d9"
author | bgruening |
---|---|
date | Tue, 21 Jul 2020 05:23:34 -0400 |
parents | |
children |
line wrap: on
line diff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000 +++ b/max_min_picker.xml Tue Jul 21 05:23:34 2020 -0400 @@ -0,0 +1,98 @@ +<tool id="ctb_im_max_min_picker" name="Pick" version="@TOOL_VERSION@+galaxy@GALAXY_VERSION@"> + <description>diverse compounds from a library with Butina clustering</description> + <macros> + <import>macros.xml</import> + <token name="@GALAXY_VERSION@">0</token> + </macros> + <expand macro="requirements" /> + <command detect_errors="exit_code"><![CDATA[ + max_min_picker + -i '$infile' + -if sdf + -t '$threshold' + -d '$descriptor_opts' + #if $number != '' + -n $number + #end if + --fragment-method '$fragment_opts' + #if $seedfile + -s '$seedfile' + #end if + $out_fragment + --meta + -o outp + -of sdf &>> $logfile && + cat outp_metrics.txt &>> $logfile && + gzip -d outp.sdf.gz + ]]></command> + <inputs> + <param name="infile" type="data" format="sdf" label="Input file" help="Input file in SDF or JSON format"/> + <param name="threshold" type="float" label="Similarity threshold" value="0.7" min="0" max="1" help="1.0 means identical"/> + <param name="descriptor_opts" type="select" label="Type of descriptor or fingerprint" help="Default is morgan2"> + <option value="maccs">maccs</option> + <option value="morgan2" selected="true">morgan2</option> + <option value="morgan3">morgan3</option> + </param> + <param name="number" type="integer" optional="true" label="Maximum number to pick for diverse subset selection" help="ABC"/> + <param name="fragment_opts" type="select" label="Fragment" help="Approach to find biggest fragment, if more than one is found"> + <option value="hac" selected="true">Biggest by heavy atom count</option> + <option value="mw">Biggest by molecular weight</option> + </param> + <param name="seedfile" type="data" format="sdf" optional="true" label="Seed file" help="Optional file containing any seed molecules that have already been picked"/> + <param name="out_fragment" type="boolean" label="Output fragment" truevalue="--output-fragment" falsevalue="" help="Output the biggest fragment rather than the original molecule"/> + </inputs> + + <expand macro="outputs" /> + + <tests> + <test> + <param name="infile" value="Kinase_inhibs.sdf" ftype="sdf"/> + <param name="threshold" value="0.5"/> + <param name="descriptor_opts" value="morgan2" /> + <param name="fragment_opts" value="hac" /> + <output name="outfile" ftype='sdf'> + <assert_contents> + <has_text_matching expression="^([^\$]+?\$\$\$\$){33}?$"/> + </assert_contents> + </output> + <output name="logfile"> + <assert_contents> + <has_text text="36 candidates 36 total"/> + <has_text text="Output 33 molecules"/> + </assert_contents> + </output> + </test> + </tests> + <help> +<![CDATA[ + +.. class:: infomark + +**What this tool does** + +This molecule selects a subset from a library, ensuring the subset reflects the diversity of the library overall by applying Butina clustering. + + +----- + +.. class:: infomark + +**Input** + +| - Compounds in `SDF Format`_ +| - Various options: similarity threshold, type of fingerprint, seem molecule. + +.. _SDF Format: http://en.wikipedia.org/wiki/Chemical_table_file + + +----- + +.. class:: infomark + + **Output** + +SD-file containing picked compounds. + +]]></help> + <expand macro="citations" /> +</tool> \ No newline at end of file