bioext_bealign: bealign.xml comparison

comparison bealign.xml @ 3:fb4975b507c6 draft

"planemo upload for repository https://github.com/davebx/bioext-gx/ commit af3bfbbd3f1236bf96a25bcb8483f2889295ec0c"

author	iuc
date	Fri, 20 Aug 2021 21:04:17 +0000
parents	d8b6f0adaa79
children	a287431cdf4f

comparison

equal deleted inserted replaced

-:d8b6f0adaa79
+:fb4975b507c6
 <?xml version="1.0"?>
 <tool id="bioext_bealign" name="Align sequences" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
 <description>to a reference using a codon alignment algorithm</description>
 <macros>
 <import>macros.xml</import>
 <!-- VERSION_SUFFIX is the part after "+galaxy" in the tool version attribute; this revision moves it from 0 to 1. -->
-<token name="@VERSION_SUFFIX@">0</token>
+<token name="@VERSION_SUFFIX@">1</token>
 </macros>
 <!-- gawk 5.1.0 is now passed as a child of the expanded requirements macro.
      NOTE(review): presumably required because the sanitizing awk script relies on gensub, a GNU awk extension; confirm against the SANITIZE token in macros.xml. -->
-<expand macro="requirements" />
+<expand macro="requirements">
+<requirement type="package" version="5.1.0">gawk</requirement>
+</expand>
 <version_command>bealign --version</version_command>
 <!-- Command outline for the new revision:
      1. Pipe the input reads through the SANITIZE token (defined in macros.xml, not shown here) into reads.fa.
      2. Run bealign on reads.fa and write directly to the output dataset; the old intermediate alignment.bam is no longer used.
      3. If a background is selected (a history dataset, or the path field of a data table entry), sanitize it into background.fa and align it to the same reference. The keep-reference flag is always passed for this run.
      4. For a preset reference with save_reference set, call copy_reference.py with the reference name and the saved_reference dataset path.
         NOTE(review): presumably this copies the bundled reference FASTA into that dataset; confirm in copy_reference.py. -->
 <command detect_errors="exit_code">
 <![CDATA[
 ## Some downstream tools, such as the TN-93 clustering tool and RAxML, might
 ## break if there are non-standard characters in the sequences or text other
 ## than alphanumerics in the sequence names, so we run the input dataset
 ## through a simple awk script to remove any non-IUPAC-standard nucleotides
 ## and replace any unwanted characters in the sequence names with underscores.
 ## This should not affect the actual alignment, since any non-standard character
 ## in the sequences is already ignored, but the possibility remains.
-cat '$input' | awk '{ if (\$0 ~ "^[^>]") {a = gensub(/[^ACGTURYKMSWBDHVNacgturykmswbdhvn?-]/, "", "g"); } else {a=gensub(/[^>A-Za-z0-9_]/, "_", "g"); }; print a } ' |
+cat '$input' @SANITIZE@ reads.fa &&
-sed 's,_\\+,_,g' > reads.fa &&
 bealign --reference '$select_reference.reference' --alphabet $advanced.alphabet
 #if $advanced.expected_identity:
 --expected-identity $advanced.expected_identity
 #end if
---score-matrix $advanced.score_matrix $advanced.reverse_complement $advanced.keep_reference
 #if $advanced.discard:
 $advanced.discard '$advanced.discarded_reads'
 #end if
-reads.fa alignment.bam
+--score-matrix $advanced.score_matrix
+$advanced.reverse_complement
+$advanced.keep_reference
+reads.fa '$output'
+#set $input_background = False
+#if $background_source.selection == 'history':
+#if $background_source.sequences:
+#set $input_background = $background_source.sequences
+#end if
+#else:
+#if $background_source.sequences:
+#set $input_background = $background_source.sequences.fields.path
+#end if
+#end if
+#if $input_background:
+&& cat '$input_background' @SANITIZE@ background.fa &&
+bealign --reference '$select_reference.reference' --alphabet $advanced.alphabet
+#if $advanced.expected_identity:
+--expected-identity $advanced.expected_identity
+#end if
+--keep-reference --score-matrix $advanced.score_matrix $advanced.reverse_complement
+background.fa '$background'
+#end if
+#set $reference_name = str($select_reference.reference)
+#if $select_reference.reference_type == 'preset' and $select_reference.save_reference:
+&& python '$__tool_directory__/copy_reference.py' --reference '$reference_name' --dataset '$saved_reference'
+#end if
 ]]>
 </command>
 <inputs>
 <param name="input" type="data" format="fasta" label="Input reads" help="For the benefit of certain tools that depend on this aligner, such as the TN-93 clustering tool, this dataset's sequence names will have non-alphanumeric characters replaced with underscores, and the sequences will be restricted to the set of IUPAC nucleotide characters." />
 <conditional name="select_reference">
 <option value="CoV2-ORF7b">SARS-CoV-2: ORF7b</option>
 <option value="CoV2-ORF8">SARS-CoV-2: ORF8</option>
 <option value="CoV2-ORF10">SARS-CoV-2: ORF10</option>
 <option value="CoV2-RdRp">SARS-CoV-2: RNA-dependent RNA polymerase</option>
 </param>
+<param name="save_reference" type="boolean" display="radio" label="Save this reference to your history" />
 </when>
 <when value="dataset">
 <param argument="--reference" type="data" format="fasta" label="Reference sequences" />
 </when>
 </conditional>
+<conditional name="background_source">
 <!-- Optional background sequences. Both branches name their parameter "sequences" and mark it optional:
      the command template uses the history dataset directly, or the "path" field of the chosen data table entry.
      When nothing is selected the template skips the background alignment, and the "background" output filter
      (which tests background_source['sequences']) is falsy. -->
+<param name="selection" type="select" label="Source for the background" help="You can use a predefined background cached on this Galaxy server or select a dataset from your history">
+<option value="data_table">Use a predefined background</option>
+<option value="history">Select a dataset from your history</option>
+</param>
+<when value="data_table">
+<param name="sequences" type="select" optional="true" label="Select sequences from data table">
+<options from_data_table="bealign_selection" />
+</param>
+</when>
+<when value="history">
+<param name="sequences" type="data" format="fasta" optional="true" label="Select dataset with sequences" />
+</when>
+</conditional>
 <section name="advanced" title="Advanced options" expanded="False">
 <!-- The explicit name attribute is dropped in this revision, yet the command template still reads
      $advanced.expected_identity, so the parameter name must now come from the argument attribute
      (Galaxy derives it by stripping the leading dashes and turning the remaining dashes into underscores). -->
-<param name="expected_identity" argument="--expected-identity" type="float" min="0" max="1" optional="True" label="Discard sequences that are insufficiently identical to the reference" />
+<param argument="--expected-identity" type="float" min="0" max="1" optional="True" label="Discard sequences that are insufficiently identical to the reference" />
 <param argument="--alphabet" type="select" label="Alphabet to use for alignment">
 <option value="codon" selected="True">Codon</option>
 <option value="dna">DNA</option>
 <option value="amino">Amino acids</option>
 </param>
 <!-- Each boolean below expands to its command-line flag when checked and to an empty string otherwise. -->
 <param name="reverse_complement" argument="--reverse-complement" type="boolean" checked="False" truevalue="--reverse-complement" falsevalue="" label="Also try to align against reverse complement of reference" />
 <param name="keep_reference" argument="--keep-reference" type="boolean" checked="False" truevalue="--keep-reference" falsevalue="" label="Include reference as first sequence in aligned BAM" />
 </section>
 </inputs>
 <outputs>
 <!-- Output datasets. "output" is always produced; the others are created only when their filter is true.
      The command template writes directly to each dataset path, so no from_work_dir mapping is needed. -->
-<data name="output" format="bam" from_work_dir="alignment.bam" />
+<data name="output" format="bam" label="${tool.name} on ${on_string} - Aligned Sequences" />
 <!-- "sequences" exists in both branches of background_source, so this lookup is safe in either branch. -->
+<data name="background" format="bam" label="${tool.name} on ${on_string} - Background" >
+<filter>background_source['sequences']</filter>
+</data>
 <!-- save_reference is only defined in the preset branch of select_reference. Check reference_type first so the
      filter never looks up a missing key when a history dataset is used as the reference; a filter that raises
      does not suppress its output, which would leave an empty dataset that the command never writes. -->
+<data name="saved_reference" format="fasta" label="${tool.name} on ${on_string} - Reference" >
+<filter>select_reference['reference_type'] == 'preset' and select_reference['save_reference']</filter>
+</data>
 <data name="discarded_reads" format="fasta">
 <filter>advanced['discard']</filter>
 </data>
 </outputs>
 <tests>
 <!-- Test parameters must match names declared under inputs. The background conditional is driven by its
      "selection" parameter (data_table or history); the inputs shown in this revision define no "add_background" parameter,
      and leaving "sequences" unset is what disables the background run. -->
 <test>
-<param name="input" ftype="fasta" value="bealign-in1.fa" />
+<param name="input" ftype="fasta" value="query.fa" />
 <param name="reference_type" value="dataset" />
 <param name="score_matrix" value="HIV_BETWEEN_F" />
-<param name="reference" ftype="fasta" value="bealign-in-ref-1.fa" />
+<param name="reference" ftype="fasta" value="reference.fa" />
 <output name="output" file="bealign-out1.bam" ftype="bam" lines_diff="2" />
 </test>
 <test>
-<param name="input" ftype="fasta" value="bealign-in2.fa" />
+<param name="input" ftype="fasta" value="query.fa" />
-<param name="reference_type" value="dataset" />
+<param name="reference_type" value="preset" />
-<param name="score_matrix" value="BLOSUM62" />
+<param name="reference" value="CoV2-nsp8" />
-<param name="reference" ftype="fasta" value="bealign-in-ref-2.fa" />
+<param name="score_matrix" value="HIV_BETWEEN_F" />
 <output name="output" file="bealign-out2.bam" ftype="bam" lines_diff="2"/>
 </test>
 <!-- Aligned reads plus a background taken from the data table: two outputs expected. -->
-<test>
+<test expect_num_outputs="2">
-<param name="input" ftype="fasta" value="bealign-in2.fa" />
+<param name="input" ftype="fasta" value="query.fa" />
-<param name="reference_type" value="dataset" />
+<param name="reference_type" value="preset" />
-<param name="expected_identity" value="0.9" />
+<param name="reference" value="CoV2-nsp8" />
-<param name="score_matrix" value="BLOSUM62" />
+<param name="selection" value="data_table" />
-<param name="reference" ftype="fasta" value="bealign-in-ref-2.fa" />
+<param name="sequences" value="CoV2-nsp8" />
+<param name="alphabet" value="codon" />
+<param name="score_matrix" value="HIV_BETWEEN_F" />
 <output name="output" file="bealign-out3.bam" ftype="bam" lines_diff="2"/>
+<output name="background" file="bealign-out3-background.bam" ftype="bam" lines_diff="2"/>
+</test>
 <!-- Aligned reads plus the saved preset reference; no background is selected, so two outputs are expected. -->
+<test expect_num_outputs="2">
+<param name="input" ftype="fasta" value="query.fa" />
+<param name="reference_type" value="preset" />
+<param name="reference" value="CoV2-nsp8" />
+<param name="save_reference" value="true" />
+<param name="alphabet" value="codon" />
+<param name="score_matrix" value="HIV_BETWEEN_F" />
+<output name="output" file="bealign-out4.bam" ftype="bam" lines_diff="2"/>
+<output name="saved_reference" file="reference.fa" ftype="fasta"/>
 </test>
 </tests>
 <help>
 <![CDATA[
 bealign

Mercurial > repos > iuc > bioext_bealign

comparison bealign.xml @ 3:fb4975b507c6 draft