Mercurial > repos > iuc > presto_collapseseq
view presto_collapseseq.xml @ 2:3364fd7073ca draft
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/presto commit 19e832988729a92be5426131fc6114e1f7237982"
author | iuc |
---|---|
date | Fri, 02 Jul 2021 15:33:36 +0000 |
parents | dc7cb4efc998 |
children | c60bd515e46d |
line wrap: on
line source
<tool id="presto_collapseseq" name="pRESTO CollapseSeq" version="@TOOL_VERSION@"> <description>Remove/collapse duplicate sequences</description> <macros> <import>presto_macros.xml</import> </macros> <expand macro="requirements"/> <version_command>CollapseSeq.py --version</version_command> <command detect_errors="exit_code"><![CDATA[ ln -s '$fastq_in' in.fastq && CollapseSeq.py -s in.fastq -n '$n' --uf $uf --cf $cf --act $act $inner $keepmiss #if $representative.select_by == "by_min" --minf '$minf' #end if #if $representative.select_by == "by_max" --maxf '$maxf' #end if --outname=tmp #if $capture_log --log '$log_out' #end if ]]></command> <inputs> <param argument="-s" name="fastq_in" type="data" format="fastq" label="Input FASTQ file" help="FASTQ file of sequences."/> <param argument="-n" type="integer" value="0" label="Max Missing" help="Maximum number of missing nucleotides to consider for collapsing sequences. A sequence will be considered undetermined if it contains too many missing nucleotides."/> <param argument="--uf" type="text" value="" label="Unique Field(s)" help="Space-separated list of fields to match reads by."/> <param argument="--cf" type="text" value="" label="Copy Field(s)" help="Space-separated list of fields to copy into the target sequence headers."> <expand macro="text-regex-validator"/> </param> <param argument="--act" type="text" value="" label="Action(s)" help="Space-separated list of actions to take on Copy Field(s)."> <expand macro="text-regex-validator"/> </param> <param argument="--inner" type="boolean" value="false" truevalue="--inner" falsevalue="" label="Inner" help="If true, trim off any missing/undetermined bases from the ends of reads after collapsing."/> <param argument="--keepmiss" type="boolean" value="false" truevalue="--keepmiss" falsevalue="" label="Keep Missing" help="If specified, sequences with more missing characters than the threshold set by the -n parameter will be written to the unique sequence output file with a DUPCOUNT=1 annotation. If not specified, such sequences will be written to a separate file."/> <conditional name="representative"> <param name="select_by" type="select"> <option value="first">First Sequence</option> <option value="by_min">By field minimum value</option> <option value="by_max">By field maximum value</option> </param> <when value="first"></when> <when value="by_min"> <param argument="--minf" type="text" value="" label="Field Name" help="Specifies the field whose minimum value determines the retained sequence."/> </when> <when value="by_max"> <param argument="--maxf" type="text" value="" label="Field Name" help="Specifies the field whose maximum value determines the retained sequence."/> </when> </conditional> <expand macro="presto-log-param"/> </inputs> <outputs> <data name="fastq_out" format="fastq" from_work_dir="tmp_collapse-unique.fastq"/> <expand macro="presto-log-output"/> </outputs> <tests> <test> <param name="fastq_in" value="presto_collapseseq_test_in.fastq"/> <param name="n" value="0"/> <param name="uf" value="PRCONS CREGION"/> <param name="cf" value="CONSCOUNT"/> <param name="act" value="sum"/> <param name="inner" value="true"/> <param name="keepmiss" value="true"/> <output name="fastq_out" file="presto_collapseseq_test_output.fastq" sort="true"/> </test> </tests> <help><![CDATA[ Removes/collapses duplicate sequences from FASTQ files. See the `pRESTO online help <@PRESTO_BASE_URL@/en/stable>`_ for more information. @HELP_NOTE@ ]]></help> <expand macro="citations" /> </tool>