view dante_ltr_search.xml @ 5:0c3111ab729b draft

"planemo upload commit 5a81f1734493a3acf5ff24a573fa2887d92b58a8"
author petr-novak
date Mon, 16 May 2022 07:50:41 +0000
parents 6ae4a341d1f3
children b91ca438a1cb
line wrap: on
line source

<tool id="dante_ltr_search" name="DANTE_LTR transposable element identification" version="0.1.5" python_template_version="3.5">
    <requirements>
        <requirement type="package">blast</requirement>
        <requirement type="package">r-optparse</requirement>
        <requirement type="package">bioconductor-bsgenome</requirement>
        <requirement type="package">bioconductor-biostrings</requirement>
        <requirement type="package">bioconductor-rtracklayer</requirement>

    </requirements>
    <command detect_errors="exit_code"><![CDATA[
        Rscript ${__tool_directory__}/extract_putative_ltr.R --gff3 '$dante' --reference_sequence '$reference' --output output --cpu 32
        &&
        mv output.gff3 $te_ltr_gff
    ]]></command>
    <inputs>
        <param type="data" name="dante" format="gff3" label="Filtered gff3 output from DANTE pipeline"/>
        <param type="data" name="reference" format="fasta" label="Reference sequence matching DANTE output" />
    </inputs>
    <outputs>
        <data name="te_ltr_gff" format="gff3" label="Annotation of detected LTR transposable elements
         based on the annotation $dante.hid and reference $reference.hid" />
    </outputs>
    <help><![CDATA[
        This tool uses output from DANTE annotation pipeline to identify full length LTR
        transposable elements. Output is in the GFF3 format and include annotation of
        5' and 3' Longe Terminal Repeats, Target Site Duplication (TSD) and primer binding site (PBS).

        All identified elements contains complete set of protein domains as defined in
        REXdb_. Based on the results detection  structural feature,
        elements falls into four categories:

        - elements with domains, 5'LTR, 3'LTR, TSD and PBS
        - elements with domains, 5'LTR, 3'LTR and PBS (TSD was not found)
        - elements with domains, 5' LTR, 3'LTR, TSD (PBS was not found)
        - elements with protein domains, 5'LTR and 3'LTR (PBS and LDS were not found)

       .. _REXdb: https://doi.org/10.1186/s13100-018-0144-1

    ]]></help>
</tool>