Mercurial > repos > iuc > fasta_stats
comparison fasta-stats.xml @ 4:0dbb995c7d35 draft default tip
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fasta_stats/ commit 50f5cce5a8c11001e2c59600a2b99a4243b6d06f"
author | iuc |
---|---|
date | Thu, 18 Nov 2021 20:56:57 +0000 |
parents | 56022eb50bbd |
children |
comparison
equal
deleted
inserted
replaced
3:56022eb50bbd | 4:0dbb995c7d35 |
---|---|
1 <tool id="fasta-stats" name="Fasta Statistics" version="1.0.3"> | 1 <tool id="fasta-stats" name="Fasta Statistics" version="2.0" profile="20.05"> |
2 <description>Display summary statistics for a fasta file.</description> | 2 <description>display summary statistics for a FASTA file</description> |
3 <requirements> | 3 <requirements> |
4 <requirement type="package" version="5.26">perl</requirement> | 4 <requirement type="package" version="1.21.4">numpy</requirement> |
5 <requirement type="package" version="1.79">biopython</requirement> | |
5 </requirements> | 6 </requirements> |
6 <command detect_errors="exit_code"><![CDATA[ | 7 <command detect_errors="exit_code"><![CDATA[ |
7 perl '${__tool_directory__}/fasta-stats.pl' | 8 python '${__tool_directory__}/fasta-stats.py' |
8 '$dataset' | 9 --fasta '$fasta' |
9 #if $genome_size: | 10 --stats_output '$stats_output' |
10 $genome_size | 11 #if $gaps_option |
12 --gaps_output '$gaps_output' | |
11 #end if | 13 #end if |
12 > '$stats' | 14 #if $genome_size |
15 --genome_size $genome_size | |
16 #end if | |
13 ]]> | 17 ]]> |
14 </command> | 18 </command> |
15 <inputs> | 19 <inputs> |
16 <param name="dataset" type="data" format="fasta" label="fasta or multifasta file" help="fasta dataset to get statistics for."/> | 20 <param argument="--fasta" type="data" format="fasta" label="FASTA or Multi-FASTA file" help="FASTA dataset to get statistics."/> |
17 <param name="genome_size" type="float" optional="True" label="Genome size estimate (optional)" help="Estimate of the genome size in bases. If specified, NG50 and LG50 will be calculated."/> | 21 <param argument="--genome_size" type="integer" min="0" optional="true" label="Estimated genome size" help="This parameter is optional. If provided, it will be used for calculating the NG50 statistic." /> |
22 <param argument="--gaps_option" type="boolean" truevalue="true" falsevalue="false" label="Generate gap stats"/> | |
18 </inputs> | 23 </inputs> |
19 <outputs> | 24 <outputs> |
20 <data name="stats" format="tabular" label="${tool.name} on ${on_string}: Fasta summary stats"/> | 25 <data name="stats_output" format="tabular" label="${tool.name} on ${on_string}: summary stats"/> |
26 <data name="gaps_output" format="bed" label="${tool.name} on ${on_string}: Gap stats"> | |
27 <filter>gaps_option</filter> | |
28 </data> | |
21 </outputs> | 29 </outputs> |
22 <tests> | 30 <tests> |
23 <test> | 31 <test expect_num_outputs="1"> |
24 <param name="dataset" value="test.fasta"/> | 32 <param name="fasta" value="test.fasta" ftype="fasta"/> |
25 <output name="stats" file="test_out.txt"/> | 33 <output name="stats_output" file="test_01.tab" ftype="tabular"/> |
26 </test> | 34 </test> |
27 <test> | 35 <!--Test gap options and NG50--> |
28 <param name="dataset" value="ng50_input.fasta"/> | 36 <test expect_num_outputs="2"> |
37 <param name="fasta" value="ng50_input.fasta" ftype="fasta"/> | |
38 <param name="gaps_option" value="true"/> | |
29 <param name="genome_size" value="4000"/> | 39 <param name="genome_size" value="4000"/> |
30 <output name="stats" file="ng50_out.txt"/> | 40 <output name="stats_output" file="test_02.tab" ftype="tabular"/> |
41 <output name="gaps_output" file="test_02.bed" ftype="bed"/> | |
42 </test> | |
43 <!--Compare outputs with QUAST--> | |
44 <test expect_num_outputs="1"> | |
45 <param name="fasta" value="test_long_sequence.fasta" ftype="fasta"/> | |
46 <output name="stats_output" ftype="tabular"> | |
47 <assert_contents> | |
48 <has_text text="8353"/> | |
49 <has_text text="303889"/> | |
50 <has_text text="22107"/> | |
51 </assert_contents> | |
52 </output> | |
31 </test> | 53 </test> |
32 </tests> | 54 </tests> |
33 <help> | 55 <help><![CDATA[ |
34 **Fasta Stats** | 56 |
35 Displays the summary statistics for a fasta file. | 57 .. class:: infomark |
58 | |
59 **Purpose** | |
60 | |
61 Displays the summary statistics for a FASTA file. | |
36 | 62 |
37 ------ | 63 ------ |
38 | 64 |
39 Outputs in tabular form: | 65 .. class:: infomark |
40 Lengths: n50, min, max, median and average | |
41 | 66 |
42 Number of base pairs: A, C, G, T, N, Total and Total_not_N | 67 **Outputs** |
43 | 68 |
44 Number of sequences | 69 This tool generates two outputs: a general summary and an optional gap stats file. |
45 | 70 |
46 GC content in % | 71 The general summary includes the following information: |
47 | 72 |
48 If an optional genome size estimate is specified, then the NG50 length will also be calculated. | 73 - Lengths: n50, min, max, median and average |
74 - Number of base pairs: A, C, G, T, N, Total and Total_not_N | |
75 - Number of sequences | |
76 - GC content | |
49 | 77 |
50 ------ | 78 In addition the optional gap stats BED file includes the information about gaps localization. |
51 | 79 ]]> |
52 Inputs: | |
53 | |
54 Fasta dataset | |
55 </help> | 80 </help> |
56 <citations> | 81 <citations> |
57 <citation type="bibtex"> | 82 <citation type="bibtex"> |
58 @UNPUBLISHED{Seemann_Gladman2012, | 83 @UNPUBLISHED{Anmol_Kyran2021, |
59 author = {Torsten Seemann and Simon Gladman}, | 84 author = {Anmol Kyran}, |
60 title = {Fasta Statistics: Display summary statistics for a fasta file.}, | 85 title = {Fasta Statistics: Display summary statistics for a fasta file.}, |
61 year = {2012}, | 86 year = {2021}, |
62 url = {https://github.com/galaxyproject/tools-iuc}, | 87 url = {https://github.com/galaxyproject/tools-iuc}, |
63 } | 88 } |
64 </citation> | 89 </citation> |
65 </citations> | 90 </citations> |
66 </tool> | 91 </tool> |