annotate fastani.xml @ 1:3c6e0e8df873 draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastani commit 2510af3d8a6e812e211ea9fa1ebf42259b7c27f0
author iuc
date Sat, 18 May 2024 15:26:00 +0000
parents 2c7ac12ad75a
children
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
1 <tool id="fastani" name="FastANI" version="@VERSION@">
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
2 <description> fast alignment-free computation of whole-genome Average Nucleotide Identity</description>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
3 <macros>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
4 <import>macros.xml</import>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
5 </macros>
1
3c6e0e8df873 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/fastani commit 2510af3d8a6e812e211ea9fa1ebf42259b7c27f0
iuc
parents: 0
diff changeset
6 <expand macro="xrefs"/>
0
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
7 <expand macro="requirements" />
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
8 <version_command>fastANI --version</version_command>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
9 <command detect_errors="exit_code">
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
10 <![CDATA[
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
11 #import re
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
12
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
13 ### SET UP INPUTS ###
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
14 #for $input_q in $query:
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
15 #set $file_name = re.sub('[^\w_]', '_', $input_q.element_identifier)
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
16 ln -fs '$input_q' '${file_name}_query' &&
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
17 echo '${file_name}_query' >> query.lst &&
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
18 #end for
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
19
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
20 #for $input_r in $reference:
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
21 #set $file_name = re.sub('[^\w_]', '_', $input_r.element_identifier)
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
22 ln -fs '$input_r' '${file_name}_ref' &&
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
23 echo '${file_name}_ref' >> ref.lst &&
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
24 #end for
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
25
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
26
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
27 ### COMMAND ###
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
28
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
29 fastANI --ql query.lst --rl ref.lst -o output -t "\${GALAXY_SLOTS:-1}"
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
30
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
31 ]]></command>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
32 <inputs>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
33 <param name="query" type="data" format="fasta" multiple="true" label="Query Sequence(s)"
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
34 help="Specify any number of query sequences in fasta format as input." />
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
35 <param name="reference" type="data" format="fasta" multiple="true" label="Reference Sequence(s)"
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
36 help="Specify any number of reference sequences in fasta format as input." />
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
37 </inputs>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
38 <outputs>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
39 <data name="output" format="tabular" from_work_dir="output" label="${tool.name} on ${on_string} Output"/>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
40 </outputs>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
41 <tests>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
42 <test>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
43 <param name="query" value="E.coli_1.fasta" />
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
44 <param name="reference" value="S.flexneri_1.fasta" />
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
45 <output name="output" file="single.out" compare="sim_size" />
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
46 </test>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
47 <test>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
48 <param name="query" value="E.coli_1.fasta,E.coli_2.fasta" />
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
49 <param name="reference" value="S.flexneri_1.fasta,S.flexneri_2.fasta" />
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
50 <output name="output" file="multi.out" compare="sim_size" />
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
51 </test>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
52 </tests>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
53 <help><![CDATA[
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
54
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
55 FastANI
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
56 =======
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
57
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
58 FastANI is developed for fast alignment-free computation of whole-genome
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
59 Average Nucleotide Identity (ANI). ANI is defined as mean nucleotide
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
60 identity of orthologous gene pairs shared between two microbial genomes.
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
61 FastANI supports pairwise comparison of both complete and draft genome
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
62 assemblies. Its underlying procedure follows a workflow similar to the one described
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
63 by `Goris et al. 2007 <https://doi.org/10.1099/ijs.0.64483-0>`_. However, it avoids expensive sequence alignments and
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
64 uses `Mashmap <https://github.com/marbl/MashMap>`_ as its MinHash based sequence mapping engine to compute the
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
65 orthologous mappings and alignment identity estimates. Based on our
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
66 experiments with complete and draft genomes, its accuracy is on par with
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
67 the `BLAST-based ANI solver <http://enve-omics.ce.gatech.edu/ani/>`_ and it achieves two to three orders of magnitude
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
68 speedup. Therefore, it is useful for pairwise ANI computation of a large
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
69 number of genome pairs. More details about its speed, accuracy and potential
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
70 applications are described here: `"High Throughput ANI Analysis of 90K
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
71 Prokaryotic Genomes Reveals Clear Species Boundaries" <https://doi.org/10.1038/s41467-018-07641-9>`_.
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
72
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
73 Please visit the authors at: https://github.com/ParBLiSS/FastANI
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
74
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
75
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
76 Inputs
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
77 ------
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
78
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
79 **Query Sequence(s):**
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
80 Input one or more query genomes in fasta format
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
81
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
82 **Reference Sequence(s):**
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
83 Input one or more reference genomes to be compared to the query genomes
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
84
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
85
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
86 Output
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
87 ------
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
88
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
89 Tabular output with columns: Query Genome, Reference Genome, ANI Value, Count of Bidirectional Fragment Mappings, and Total Query Fragments.
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
90
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
91 The output table looks like this:
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
92
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
93 +------------+------------+-----------+--------+--------+
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
94 | Genome A | Genome C | 97.5883 | 1405 | 1594 |
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
95 +------------+------------+-----------+--------+--------+
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
96 | Genome A | Genome D | 95.6663 | 1405 | 1594 |
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
97 +------------+------------+-----------+--------+--------+
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
98 | Genome B | Genome C | 92.4281 | 1409 | 1553 |
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
99 +------------+------------+-----------+--------+--------+
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
100 | Genome B | Genome D | 99.9242 | 1396 | 1553 |
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
101 +------------+------------+-----------+--------+--------+
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
102
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
103 |
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
104 | Thanks to Thanh Lê for building the initial Galaxy wrapper.
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
105 ]]></help>
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
106 <expand macro="citations" />
2c7ac12ad75a "planemo upload commit 01a4c6cb401a89acddd991825fcaa304052d275f"
iuc
parents:
diff changeset
107 </tool>