view summarize_assembly.xml @ 1:cd86d5f93b4a draft default tip

planemo upload for repository https://github.com/jvolkening/galaxy-tools/tree/master/tools/b2b_utils commit 9260aa02a5f703bce63d2db5b69003df9be371ac
author jvolkening
date Fri, 08 Mar 2024 00:45:00 +0000
parents 1995630ef409
children
line wrap: on
line source

<tool id="b2b_summarize_assembly" name="Summarize assembly"
    version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" license="MIT" profile="21.01">

    <description>Calculate and print basic assembly summary stats</description>
    <macros>
        <token name="@TOOL_NAME@">summarize_assembly</token>
        <token name="@TOOL_VERSION@">0.02</token>
        <token name="@VERSION_SUFFIX@">1</token>
        <import>macros.xml</import>
    </macros>
    <edam_topics>
        <edam_topic>topic_0080</edam_topic> <!-- Sequence analysis -->
    </edam_topics>
    <expand macro="requirements" />
    <expand macro="version_command" />

    <!-- ***************************************************************** -->

    <command detect_errors="aggressive">
    <![CDATA[

    summarize_assembly
    --fasta $input1
    --cutoffs $cutoffs
    #if $split_N:
	--split_N
    #end if
    #if $strip_N:
	--strip_N
    #end if

    > $report
    ;

    ]]>
    </command>

    <!-- ***************************************************************** -->

    <inputs>
	    <param format="fasta" name="input1" type="data" label="Assembly in FASTA format" />
	    <param name="cutoffs" type="text" size="60" value="50 90" label="Nx cutoffs to calculate (space-separated)">
		   <sanitizer invalid_char="">
		      <valid initial="string.digits"><add value=" " /></valid>
		   </sanitizer>
	    </param>
	    <param name="strip_N" type="boolean" label="Strip Ns prior to calculations" />
	    <param name="split_N" type="boolean" label="Split scaffolds on Ns (e.g. report contig-level summary)" />
    </inputs>

    <!-- ***************************************************************** -->

    <outputs>
       <data format="txt" name="report" label="${tool.name} on ${on_string}" />
    </outputs>

    <!-- ***************************************************************** -->

    <tests>
        <test>
            <param name="input1" value="assembly.fa" ftype="fasta" />
            <param name="cutoffs" value="50 90 95" />
            <output name="report" file="summarize.txt" compare="diff" />
        </test>
        <test>
            <param name="input1" value="assembly.fa" ftype="fasta" />
            <param name="cutoffs" value="50 90 95" />
            <param name="strip_N" value="True" />
            <output name="report" file="summarize.strip.txt" compare="diff" />
        </test>
        <test>
            <param name="input1" value="assembly.fa" ftype="fasta" />
            <param name="cutoffs" value="50 90 95" />
            <param name="split_N" value="True" />
            <output name="report" file="summarize.split.txt" compare="diff" />
        </test>
    </tests>

    <!-- ***************************************************************** -->

    <help>

    summarize_assembly is a utility from b2b-utils. It takes a FASTA file and
    optionally a list of cutoff values as input and prints out summary
    information about the contigs/scaffolds contained in the file. You can, of
    course, supply a FASTA file of any sort of nucleic acid sequences, but the
    summary information makes most sense for contigs from genomic sequencing
    assemblies.

    </help>

    <!-- ***************************************************************** -->

    <citations>
    </citations>

</tool>