view fast5_subset.xml @ 0:eb1f4aa80c72 draft

"planemo upload for repository https://github.com/nanoporetech/ont_fast5_api/ commit 84504d6786e9edf00367739210d6bae78cb42cc8"
author iuc
date Mon, 08 Jun 2020 15:57:10 -0400
parents
children 3bdd8fa109b1
line wrap: on
line source

<?xml version="1.0"?>
<tool id="ont_fast5_api_fast5_subset" name="Fast5 subset" version="@TOOL_VERSION@+galaxy0" profile="18.01">
    <description>of multi read file</description>
    <macros>
        <import>macros.xml</import>
    </macros>
    <expand macro="requirements"/>
    <version_command></version_command>
    <command detect_errors="exit_code"><![CDATA[
## initialize
mkdir data &&
#for $num, $current in enumerate($input):
    ln -s '$current' './data/batch${num}.fast5' &&
#end for

## run
fast5_subset
## required
--input ./data
-s ./results
--read_id_list '$read_id_list'
## optional
--batch_size $batch_size
-t \${GALAXY_SLOTS:-4}
    ]]></command>
    <inputs>
        <param argument="--input" type="data" format="fast5" multiple="true"
            label="Select multi read input file(s)"/>
        <param argument="--read_id_list" type="data" format="tabular"
            label="Select file with read_ids" help="Either containing 1 read_id per line or a tabular file with a column named read_id."/>
        <param argument="--batch_size" type="integer" value="4000" min="1"
            label="Set batch size" help="Number of single reads to include in each multi read file"/>
    </inputs>
    <outputs>
        <data name="out_results" format="fast5">
            <discover_datasets pattern="(?P&lt;designation&gt;.+)\.fast5" format="fast5" directory="results" assign_primary_output="true" visible="true"/>
        </data>
    </outputs>
    <tests>
        <test expect_num_outputs="1">
            <param name="input" value="batch.fast5"/>
            <param name="read_id_list" value="list.txt"/>
            <param name="batch_size" value="2"/>
            <output name="out_results">
                <assert_contents>
                    <has_size value="23304"/>
                </assert_contents>
                <!-- batch0 is represented by out_results -->
                <discovered_dataset designation="batch1" ftype="fast5">
                    <assert_contents>
                        <has_size value="17328"/>
                    </assert_contents>
                </discovered_dataset>
            </output>
        </test>
    </tests>
    <help><![CDATA[
.. class:: infomark

**What it does**

@WID@

fast5_subset extracts reads from multi_read_fast5_file(s) based on a list of read IDs.

**Input**

A multi read file in FAST5 format and a list of read IDs that should be extracted.

**Output**

A multi read file in FAST5 format containing a subset of the input file.

.. class:: infomark

**References**

@REFERENCES@
    ]]></help>
    <expand macro="citations"/>
</tool>