annotate gtdbtk_classify_wf.xml @ 6:a09c8c901603 draft

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 85683b4edaf9ec44550ff0de861023f794bf35f2
author iuc
date Fri, 13 Sep 2024 11:15:36 +0000
parents a68b985913ab
children b907a3c0434f
Ignore whitespace changes - Everywhere: Within whitespace: At end of lines:
rev   line source
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
1 <tool id="gtdbtk_classify_wf" name="GTDB-Tk Classify genomes" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
2 <description>by placement in GTDB reference tree</description>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
3 <macros>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
4 <import>macros.xml</import>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
5 </macros>
3
f8f56dd6449f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 883bfde016c4d8e76ae9600008b0e451eedcb1f2
iuc
parents: 2
diff changeset
6 <xrefs>
f8f56dd6449f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 883bfde016c4d8e76ae9600008b0e451eedcb1f2
iuc
parents: 2
diff changeset
7 <xref type="bio.tools">GTDB-Tk</xref>
f8f56dd6449f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 883bfde016c4d8e76ae9600008b0e451eedcb1f2
iuc
parents: 2
diff changeset
8 </xrefs>
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
9 <expand macro="requirements"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
10 <command detect_errors="exit_code"><![CDATA[
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
11 #import re
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
12
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
13 mkdir input_dir &&
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
14 mkdir output_dir &&
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
15 #for $i in $input:
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
16 ## gtdbtk uses the file extension to determine the input format.
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
17 #set ext = "." + $i.ext
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
18 #set input_identifier = re.sub('[^\s\w\-]', '_', str($i.element_identifier)) + $ext
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
19 ln -s '${i}' input_dir/'${input_identifier}' &&
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
20 #end for
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
21 export GTDBTK_DATA_PATH='$gtdbtk_db.fields.path' &&
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
22 gtdbtk classify_wf
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
23 --genome_dir input_dir
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
24 --extension '$ext'
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
25 --out_dir output_dir
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
26 --cpus \${GALAXY_SLOTS:-4}
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
27 --min_perc_aa $advanced.min_perc_aa
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
28 $advanced.force
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
29 --min_af $advanced.min_af
1
dbf1798c0dcc planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 1dddd355fe97cb9d6bb37f93b98f3402184b4320
iuc
parents: 0
diff changeset
30
dbf1798c0dcc planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 1dddd355fe97cb9d6bb37f93b98f3402184b4320
iuc
parents: 0
diff changeset
31 ## Required unless mash_db is available:
dbf1798c0dcc planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 1dddd355fe97cb9d6bb37f93b98f3402184b4320
iuc
parents: 0
diff changeset
32 --skip_ani_screen
dbf1798c0dcc planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 1dddd355fe97cb9d6bb37f93b98f3402184b4320
iuc
parents: 0
diff changeset
33
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
34 #if str($advanced.output_process_log) == 'yes':
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
35 && cat output_dir/gtdbtk.warnings.log output_dir/gtdbtk.log > '$process_log'
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
36 #end if
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
37 ]]></command>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
38 <inputs>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
39 <param name="input" type="data" format="fasta,fasta.gz" multiple="true" label="Fasta (Genome) files"/>
1
dbf1798c0dcc planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 1dddd355fe97cb9d6bb37f93b98f3402184b4320
iuc
parents: 0
diff changeset
40 <param name="gtdbtk_db" type="select" label="GTDB-Tk database" help="Only GTDB reference data releases 207 and 214 can be selected with this version of GTDB-Tk. Please contact your service administrator if no suitable release is available to select."> <!-- help text must stay in sync with the release filter on the options below -->
6
a09c8c901603 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 85683b4edaf9ec44550ff0de861023f794bf35f2
iuc
parents: 5
diff changeset
41 <options from_data_table="gtdbtk_database_versioned">
a09c8c901603 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 85683b4edaf9ec44550ff0de861023f794bf35f2
iuc
parents: 5
diff changeset
42 <filter type="regexp" column="3" value="^v2(07|14)$"/>
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
43 <validator type="no_options" message="No locally cached GTDB-Tk database is available"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
44 </options>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
45 </param>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
46 <section name="advanced" title="Advanced options">
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
47 <param argument="--min_perc_aa" type="integer" min="0" max="100" value="10" label="Exclude genomes that do not have at least this percentage of AA in the MSA" help="Inclusive bound"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
48 <param argument="--force" type="boolean" truevalue="--force" falsevalue="" checked="false" label="Continue processing if an error occurs on a single genome?"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
49 <param argument="--min_af" type="float" min="0" max="1" value="0.65" label="Minimum alignment fraction to consider closest genome"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
50 <param name="output_process_log" type="boolean" truevalue="yes" falsevalue="no" checked="false" label="Output process log file?"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
51 </section>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
52 </inputs>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
53 <outputs>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
54 <data name="process_log" format="txt" label="${tool.name} on ${on_string} (process log)">
5
a68b985913ab planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fe7c6bb90ca130ec69711445a605bfb1d0ef8bae
iuc
parents: 4
diff changeset
55 <filter>advanced['output_process_log']</filter>
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
56 </data>
2
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
57 <collection name="output_align" type="list" format="fasta.gz" label="${tool.name} on ${on_string} (align)">
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
58 <discover_datasets pattern="(?P&lt;designation&gt;.+)\.fasta\.gz" ext="fasta.gz" directory="output_dir/align"/> <!-- both dots escaped so only a literal ".fasta.gz" suffix is matched -->
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
59 </collection>
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
60 <collection name="output_identfy" type="list" format="tsv" label="${tool.name} on ${on_string} (identify)">
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
61 <discover_datasets pattern="(?P&lt;designation&gt;.+)\.tsv" ext="tsv" directory="output_dir/identify"/>
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
62 </collection>
2
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
63 <collection name="output_classify" type="list" format="newick" label="${tool.name} on ${on_string} (classify)">
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
64 <discover_datasets pattern="(?P&lt;designation&gt;.+)\.tree" ext="newick" directory="output_dir/classify"/>
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
65 </collection>
2
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
66 <collection name="output_summary" type="list" format="tsv" label="${tool.name} on ${on_string} (summary)">
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
67 <discover_datasets pattern="(?P&lt;designation&gt;.+)\.tsv" ext="tsv" directory="output_dir"/>
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
68 </collection>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
69 </outputs>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
70 <tests>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
71 <!-- The commented-out test below would be valid if the GTDB-Tk database could be stored for testing -->
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
72 <!--
2
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
73 <test expect_num_outputs="4">
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
74 <param name="input" value="genome_1.fna.gz" ftype="fasta.gz"/>
4
65d52c693b8e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 94a1996b09d7597793f823307cbac6208e20f1d1
iuc
parents: 3
diff changeset
75 <param name="gtdbtk_db" value="gtdbtk214"/>
2
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
76 <output_collection name="output_summary" type="list" count="1">
4
65d52c693b8e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 94a1996b09d7597793f823307cbac6208e20f1d1
iuc
parents: 3
diff changeset
77 <element name="gtdbtk.ar53.summary" ftype="tsv">
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
78 <assert_contents>
2
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
79 <has_text text="user_genome"/>
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
80 </assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
81 </element>
2
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
82 </output_collection>
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
83 <output_collection name="output_identfy" type="list" count="4">
4
65d52c693b8e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 94a1996b09d7597793f823307cbac6208e20f1d1
iuc
parents: 3
diff changeset
84 <element name="gtdbtk.ar53.markers_summary" ftype="tsv">
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
85 <assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
86 <has_text text="number_unique_genes"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
87 </assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
88 </element>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
89 <element name="gtdbtk.bac120.markers_summary" ftype="tsv">
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
90 <assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
91 <has_text text="genome_1_fna_gz"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
92 </assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
93 </element>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
94 <element name="gtdbtk.failed_genomes" ftype="tsv">
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
95 <assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
96 <has_size value="0"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
97 </assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
98 </element>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
99 <element name="gtdbtk.translation_table_summary" ftype="tsv">
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
100 <assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
101 <has_text text="genome_1_fna_gz"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
102 </assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
103 </element>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
104 </output_collection>
4
65d52c693b8e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 94a1996b09d7597793f823307cbac6208e20f1d1
iuc
parents: 3
diff changeset
105 <output_collection name="output_classify" type="list" count="1">
65d52c693b8e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 94a1996b09d7597793f823307cbac6208e20f1d1
iuc
parents: 3
diff changeset
106 <element name="gtdbtk.ar53.classify" ftype="newick">
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
107 <assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
108 <has_text text="GB_GCA_"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
109 </assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
110 </element>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
111 </output_collection>
2
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
112 <output_collection name="output_align" type="list" count="2">
4
65d52c693b8e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 94a1996b09d7597793f823307cbac6208e20f1d1
iuc
parents: 3
diff changeset
113 <element name="gtdbtk.ar53.msa" ftype="fasta.gz" decompress="true">
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
114 <assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
115 <has_text text="GB_GCA_000008085"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
116 </assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
117 </element>
4
65d52c693b8e planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 94a1996b09d7597793f823307cbac6208e20f1d1
iuc
parents: 3
diff changeset
118 <element name="gtdbtk.ar53.user_msa" ftype="fasta.gz" decompress="true">
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
119 <assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
120 <has_text text="genome_1_fna_gz"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
121 </assert_contents>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
122 </element>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
123 </output_collection>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
124 </test>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
125 -->
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
126 <!-- GTDB-Tk databases are far too large to test currently -->
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
127 <test expect_failure="true">
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
128 <param name="input" value="genome_1.fna.gz" ftype="fasta.gz"/>
6
a09c8c901603 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 85683b4edaf9ec44550ff0de861023f794bf35f2
iuc
parents: 5
diff changeset
129 <param name="gtdbtk_db" value="gtdbtk214"/>
0
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
130 <assert_stderr>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
131 <has_text text="Fatal error: Exit code 1"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
132 </assert_stderr>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
133 </test>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
134 </tests>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
135 <help><![CDATA[
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
136 **What it does**
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
137
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
138 GTDB-Tk is a software toolkit for assigning objective taxonomic classifications to bacterial and archaeal genomes
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
139 based on the Genome Taxonomy Database (GTDB). It is designed to work with recent advances that allow hundreds or
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
140 thousands of metagenome-assembled genomes (MAGs) to be obtained directly from environmental samples. It can also
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
141 be applied to isolate and single-cell genomes.
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
142
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
143 This tool accepts one or more FASTA (genome) files and determines the taxonomic classification of genomes by
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
144 maximum-likelihood (ML) placement. The classification workflow consists of three steps: identify, align, and
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
145 classify.
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
146
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
147 The identify step calls genes using Prodigal, and uses HMM models and the HMMER package to identify the 120 bacterial
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
148 and 53 archaeal marker genes used for phylogenetic inference. Multiple sequence alignments (MSA) are obtained by
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
149 aligning marker genes to their respective HMM model.
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
150
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
151 The align step concatenates the aligned marker genes and filters the concatenated MSA to approximately 5,000
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
152 amino acids.
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
153
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
154 Finally, the classify step uses pplacer to find the maximum-likelihood placement of each genome in the GTDB-Tk
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
155 reference tree. GTDB-Tk classifies each genome based on its placement in the reference tree, its relative evolutionary
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
156 divergence, and/or average nucleotide identity (ANI) to reference genomes.
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
157
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
158 Results can be impacted by a lack of marker genes or contamination.
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
159 ]]></help>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
160 <expand macro="citations"/>
c4db8c4de66f planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit 8487d2c73793be0afa5b34388b122e686ac8a094
iuc
parents:
diff changeset
161 </tool>
2
6501b5b33988 planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/gtdbtk commit fab39612473d91e048868d9c122d7dd61a2bd9d4
iuc
parents: 1
diff changeset
162