comparison fasta-stats.xml @ 4:0dbb995c7d35 draft default tip

"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fasta_stats/ commit 50f5cce5a8c11001e2c59600a2b99a4243b6d06f"
author iuc
date Thu, 18 Nov 2021 20:56:57 +0000
parents 56022eb50bbd
children
comparison
equal deleted inserted replaced
3:56022eb50bbd 4:0dbb995c7d35
1 <tool id="fasta-stats" name="Fasta Statistics" version="1.0.3"> 1 <tool id="fasta-stats" name="Fasta Statistics" version="2.0" profile="20.05">
2 <description>Display summary statistics for a fasta file.</description> 2 <description>display summary statistics for a FASTA file</description>
3 <requirements> 3 <requirements>
4 <requirement type="package" version="5.26">perl</requirement> 4 <requirement type="package" version="1.21.4">numpy</requirement>
5 <requirement type="package" version="1.79">biopython</requirement>
5 </requirements> 6 </requirements>
6 <command detect_errors="exit_code"><![CDATA[ 7 <command detect_errors="exit_code"><![CDATA[
7 perl '${__tool_directory__}/fasta-stats.pl' 8 python '${__tool_directory__}/fasta-stats.py'
8 '$dataset' 9 --fasta '$fasta'
9 #if $genome_size: 10 --stats_output '$stats_output'
10 $genome_size 11 #if $gaps_option
12 --gaps_output '$gaps_output'
11 #end if 13 #end if
12 > '$stats' 14 #if $genome_size
15 --genome_size $genome_size
16 #end if
13 ]]> 17 ]]>
14 </command> 18 </command>
15 <inputs> 19 <inputs>
16 <param name="dataset" type="data" format="fasta" label="fasta or multifasta file" help="fasta dataset to get statistics for."/> 20 <param argument="--fasta" type="data" format="fasta" label="FASTA or Multi-FASTA file" help="FASTA dataset to get statistics."/>
17 <param name="genome_size" type="float" optional="True" label="Genome size estimate (optional)" help="Estimate of the genome size in bases. If specified, NG50 and LG50 will be calculated."/> 21 <param argument="--genome_size" type="integer" min="0" optional="true" label="Estimated genome size" help="This parameter is optional. If provided, it will be used for calculating the NG50 statistic." />
22 <param argument="--gaps_option" type="boolean" truevalue="true" falsevalue="false" label="Generate gap stats"/>
18 </inputs> 23 </inputs>
19 <outputs> 24 <outputs>
20 <data name="stats" format="tabular" label="${tool.name} on ${on_string}: Fasta summary stats"/> 25 <data name="stats_output" format="tabular" label="${tool.name} on ${on_string}: summary stats"/>
26 <data name="gaps_output" format="bed" label="${tool.name} on ${on_string}: Gap stats">
27 <filter>gaps_option</filter>
28 </data>
21 </outputs> 29 </outputs>
22 <tests> 30 <tests>
23 <test> 31 <test expect_num_outputs="1">
24 <param name="dataset" value="test.fasta"/> 32 <param name="fasta" value="test.fasta" ftype="fasta"/>
25 <output name="stats" file="test_out.txt"/> 33 <output name="stats_output" file="test_01.tab" ftype="tabular"/>
26 </test> 34 </test>
27 <test> 35 <!--Test gap options and NG50-->
28 <param name="dataset" value="ng50_input.fasta"/> 36 <test expect_num_outputs="2">
37 <param name="fasta" value="ng50_input.fasta" ftype="fasta"/>
38 <param name="gaps_option" value="true"/>
29 <param name="genome_size" value="4000"/> 39 <param name="genome_size" value="4000"/>
30 <output name="stats" file="ng50_out.txt"/> 40 <output name="stats_output" file="test_02.tab" ftype="tabular"/>
41 <output name="gaps_output" file="test_02.bed" ftype="bed"/>
42 </test>
43 <!--Compare outputs with QUAST-->
44 <test expect_num_outputs="1">
45 <param name="fasta" value="test_long_sequence.fasta" ftype="fasta"/>
46 <output name="stats_output" ftype="tabular">
47 <assert_contents>
48 <has_text text="8353"/>
49 <has_text text="303889"/>
50 <has_text text="22107"/>
51 </assert_contents>
52 </output>
31 </test> 53 </test>
32 </tests> 54 </tests>
33 <help> 55 <help><![CDATA[
34 **Fasta Stats** 56
35 Displays the summary statistics for a fasta file. 57 .. class:: infomark
58
59 **Purpose**
60
61 Displays the summary statistics for a FASTA file.
36 62
37 ------ 63 ------
38 64
39 Outputs in tabular form: 65 .. class:: infomark
40 Lengths: n50, min, max, median and average
41 66
42 Number of base pairs: A, C, G, T, N, Total and Total_not_N 67 **Outputs**
43 68
44 Number of sequences 69 This tool generates two outputs: a general summary and an optional gap stats file.
45 70
46 GC content in % 71 The general summary includes the following information:
47 72
48 If an optional genome size estimate is specified, then the NG50 length will also be calculated. 73 - Lengths: n50, min, max, median and average
74 - Number of base pairs: A, C, G, T, N, Total and Total_not_N
75 - Number of sequences
76 - GC content
49 77
50 ------ 78 In addition the optional gap stats BED file includes the information about gaps localization.
51 79 ]]>
52 Inputs:
53
54 Fasta dataset
55 </help> 80 </help>
56 <citations> 81 <citations>
57 <citation type="bibtex"> 82 <citation type="bibtex">
58 @UNPUBLISHED{Seemann_Gladman2012, 83 @UNPUBLISHED{Anmol_Kyran2021,
59 author = {Torsten Seemann and Simon Gladman}, 84 author = {Anmol Kyran},
60 title = {Fasta Statistics: Display summary statistics for a fasta file.}, 85 title = {Fasta Statistics: Display summary statistics for a fasta file.},
61 year = {2012}, 86 year = {2021},
62 url = {https://github.com/galaxyproject/tools-iuc}, 87 url = {https://github.com/galaxyproject/tools-iuc},
63 } 88 }
64 </citation> 89 </citation>
65 </citations> 90 </citations>
66 </tool> 91 </tool>