changeset 4:2e0af1e2d487 draft default tip

planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/amber/ commit 09a7f1234811e6104671c0fbb51a515e13815041
author iuc
date Sat, 08 Feb 2025 11:33:03 +0000
parents 8d0b2def5e65
children
files biobox_add_taxid.xml test-data/binid2taxid.tsv test-data/biobox_file.tsv test-data/kraken2.tsv test-data/modified_biobox_file_bin.tsv test-data/modified_biobox_file_contig.tsv test-data/test_bat_file.tsv test-data/test_biobox_file.tsv test-data/test_biobox_file_add_taxid_bat.tsv test-data/test_biobox_file_add_taxid_gtdb.tsv test-data/test_gtdb_file.tsv test-data/test_gtdb_to_taxdump_file.tsv test-data/test_taxonkit_file_1.tsv test-data/test_taxonkit_file_2.tsv
diffstat 14 files changed, 1391 insertions(+), 245 deletions(-) [+]
line wrap: on
line diff
--- a/biobox_add_taxid.xml	Sun Sep 08 14:37:41 2024 +0000
+++ b/biobox_add_taxid.xml	Sat Feb 08 11:33:03 2025 +0000
@@ -1,68 +1,59 @@
-<tool id="biobox_add_taxid" name="Biobox add taxid" version="@SCRIPT_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
+<tool id="biobox_add_taxid" name="Biobox add taxid" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">
     <description>Add taxid output from BAT or GTDB to biobox binning data</description>
     <macros>
-        <import>macros.xml</import>
-        <token name="@SCRIPT_VERSION@">0.6</token>
+        <token name="@TOOL_VERSION@">1.2</token>
+        <token name="@VERSION_SUFFIX@">0</token>
+        <token name="@PROFILE@">24.1</token>
     </macros>
     <requirements>
-        <requirement type="package" version="@SCRIPT_VERSION@">biobox_add_taxid</requirement>
+        <requirement type="package" version="@TOOL_VERSION@">biobox_add_taxid</requirement>
     </requirements>
     <command detect_errors="exit_code">
     <![CDATA[
 
-        mkdir -p input taxonkit gtdb_to_taxdump &&
-
-        ln -s '${biobox_file}' '$biobox_file.element_identifier' &&
-
-        #for $i, $f in enumerate($tool_type.input):
-            ln -s '$f' 'input/${i}.tsv' &&
-        #end for
+    ln -s '$biobox_file' 'biobox.tsv' &&
 
-        #if $tool_type.is_select == 'GTDB':
-            #for $i, $f in enumerate($gtdb_to_taxdump):
-                ln -s '$f' 'gtdb_to_taxdump/gtdb_to_taxdump_${i}.tsv' &&
-            #end for
-            #for $i, $f in enumerate($taxonkit):
-                ln -s '$f' 'taxonkit/taxonkit_${i}.tsv' &&
-            #end for
-        #end if
+    #if $input.is_select == 'contig':
+        ln -s '$contig2taxid' 'contig.tsv' &&
+    #else:
+        ln -s '$binid2taxid' 'bin.tsv' &&
+    #end if
 
-        biobox_add_taxid.py
-        '$biobox_file.element_identifier'
-        '$tool_type.is_select'
-        'input'
-        #if $tool_type.is_select == 'GTDB':
-            -g 'gtdb_to_taxdump'
-            -t 'taxonkit'
-            -c $column
-        #end if
-        &&
+    biobox_add_taxid.py
+    'biobox.tsv'
+    #if $input.is_select == 'contig':
+        -c 'contig.tsv'
+    #else:
+        -b 'bin.tsv'
+    #end if
+    -k_c ${key_col}
+    -t_c ${taxid_col}
 
-        #if $tool_type.is_select == 'GTDB':
-            cp *_add_taxid_GTDB* $output
-        #else:
-            cp *_add_taxid_BAT* $output
-        #end if
+    &&
+
+    cp 'modified_biobox_file.tsv' '$output'
 
     ]]>
     </command>
     <inputs>
-        <param name="biobox_file" type="data" format="tabular" label="CAMI amber biobox file input" help="Input the CAMI amber biobox file here which are corespond with the biner and the BAT/GTDB output which did used the biner as input! "/>
-        <conditional name="tool_type">
-            <param name="is_select" type="select" label="Select the tool which output should be used here" help="Select BAT when you use the bin2classifier file(s) or select GTDB when using the summary file(s)">
-                <option value="BAT">BAT</option>
-                <option value="GTDB">GTDB</option>
+        <param name="biobox_file" type="data" format="tabular" label="Input biobox file"
+            help="This file can be generated with the utility tool from CAMI AMBER named convert to biobox"/>
+        <conditional name="input">
+            <param name="is_select" type="select" label="Select typ of input">
+                <option value="contig">ContigID2TaxID</option>
+                <option value="bin">BinID2TaxID</option>
             </param>
-            <when value="GTDB">
-                <param argument="--gtdb_to_taxdump" type="data" multiple="true" format="tabular" label="Input the output from gtdb_to_taxdump here" help="Use the output from gtdb_to_taxdump here since we need the mapped names from GTDB to NCBI to get the arcoding taxids from NCBI"/>
-                <param argument="--taxonkit" type="data" format="tabular" multiple="true" label="Input the output from Taxonkit here" help="Use the output from Taxonkit here since the need the mapped NCBI names to the arcording taxids"/>
-                <param argument="--column" type="data_column" data_ref="taxonkit" label="Input the colum with the NCBI names"/>
-                <param name="input" type="data" multiple="true" format="tabular" label="Input the GTDB-Tk summary file(s) here"
-                    help="Use the GTDB-Tk file(s) which are coresponding with the binning file!"/>
+            <when value="contig">
+                <param argument="--contig2taxid" type="data" format="tabular" label="Input ConitgID2TaxID file"
+                    help="This input comes from Kraken2"/>
+                <param argument="--key_col" type="data_column" data_ref="contig2taxid" label="Select the column where the ContigID are stated"/>
+                <param argument="--taxid_col" type="data_column" data_ref="contig2taxid" label="Select the column where the TaxID are stated"/>
             </when>
-            <when value="BAT">
-                <param name="input" type="data" multiple="true" format="tabular" label="Input bin2classifier file(s) from BAT here"
-                    help="Use the BAT file(s) which are coresponding with the binning file!"/>
+            <when value="bin">
+                <param argument="--binid2taxid" type="data" format="tabular" label="Input BinID2TaxID file"
+                    help="This input comes from Kraken2"/>
+                <param argument="--key_col" type="data_column" data_ref="binid2taxid" label="Select the column where the BinID are stated"/>
+                <param argument="--taxid_col" type="data_column" data_ref="binid2taxid" label="Select the column where the TaxID are stated"/>
             </when>
         </conditional>
     </inputs>
@@ -70,48 +61,52 @@
         <data name="output" format="tabular" label="${tool.name}: BIOBOX ADD TAXID COLUMN"/>
     </outputs>
     <tests>
-        <test expect_num_outputs="1">
-            <param name="biobox_file" ftype="tabular" value="test_biobox_file.tsv"/>
-            <conditional name="tool_type">
-                <param name="is_select" value="BAT"/>
-                <param name="input" ftype="tabular" value="test_bat_file.tsv"/>
+        <test>
+            <param name="biobox_file" value="biobox_file.tsv" ftype="tabular"/>
+            <conditional name="input">
+                <param name="is_select" value="bin"/>
+                <param name="binid2taxid" value="binid2taxid.tsv" ftype="tabular"/>
+                <param name="key_col" value="1"/>
+                <param name="taxid_col" value="2"/>
             </conditional>
-            <output name="output" file="test_biobox_file_add_taxid_bat.tsv"/>
+            <output name="output" file="modified_biobox_file_bin.tsv"/>
         </test>
-        <test expect_num_outputs="1">
-            <param name="biobox_file" ftype="tabular" value="test_biobox_file.tsv"/>
-            <conditional name="tool_type">
-                <param name="is_select" value="GTDB"/>
-                <param name="gtdb_to_taxdump" ftype="tabular" value="test_gtdb_to_taxdump_file.tsv"/>
-                <param name="taxonkit" ftype="tabular" value="test_taxonkit_file_1.tsv,test_taxonkit_file_2.tsv"/>
-                <param name="column" value="1"/>
-                <param name="input" ftype="tabular" value="test_gtdb_file.tsv"/>
+        <test>
+            <param name="biobox_file" value="biobox_file.tsv" ftype="tabular"/>
+            <conditional name="input">
+                <param name="is_select" value="contig"/>
+                <param name="contig2taxid" value="kraken2.tsv" ftype="tabular"/>
+                <param name="key_col" value="2"/>
+                <param name="taxid_col" value="3"/>
             </conditional>
-            <output name="output" file="test_biobox_file_add_taxid_gtdb.tsv"/>
+            <output name="output" file="modified_biobox_file_contig.tsv"/>
         </test>
     </tests>
     <help>
     <![CDATA[
         
         **USAGE OF THIS TOOL**
-
-        This tool was desgin for using the BAT/GTDB-Tk output to expand the CAMI amber biobox file with the taxid column to access taxa evaluation with amber!
-
-        **IMPORTAND NOTE WHEN USING GTDB OUTPUT**
-
-        Befor using GTDB-Tk output you have to use 2 other tools to map the GTDB names to the NCBI names and then map the NCBI names to there taxids.
-        To map the GTDB names to the NCBI names you extract the GTDB names from the summary file and with them you can now use the gtdb_to_taxdum tool!
-        After using the gtdb_to_taxdum tool you have the extract the NCBI names here and then use the tool Taxonkit[name2taxid] to finaly get the taxids.
+        
+        This tool can be used to add the TaxID column to a biobox file.
 
         **INPUTS**
-        - The CAMI amber biobox file
-        - BAT[bin2classifier] file(s) OR GTDB-Tk[Summary] file(s)
-        - The gtdb_to_taxdum output[WHEN USING GTDB-Tk]
-        - The Taxonkit[name2taxid] output[WHEN USING GTDB-Tk]
+        
+        - A biobox file. This file can be generated with the CAMI AMBER utility Tool named 'convert to biobox'
+        - Either a Contig2TaxID file which is generated from Kraken2 (the classification file from Kraken2) or a BinID2TaxID which has to be done manualy
+
+        Example for a BinID2TaxID file 
+
+        ::
+        
+            #BinID   TaxID
+            test1   11056
+            test2   444944
+            ABC 888
 
         **OUTPUT**
 
-        A CAMI amber biobox file with a taxid colum
+        - A CAMI AMBER biobox file with a taxid column
+
     ]]> 
     </help>
     <citations>
@@ -121,8 +116,7 @@
             journal = {GitHub},
             year = {2024},
             month = aug,
-            note = {[Online; accessed 22. Aug. 2024]},
-            url = {https://github.com/SantaMcCloud/biobox_add_taxid/tree/release-0.3}
+            url = {https://github.com/SantaMcCloud/biobox_add_taxid/tree/release-1.0}
         }</citation>
     </citations>
 </tool>
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/binid2taxid.tsv	Sat Feb 08 11:33:03 2025 +0000
@@ -0,0 +1,39 @@
+#BinID	NCBI_TaxID
+SemiBin_SemiBin_234	12908
+SemiBin_SemiBin_78_sub	12908
+SemiBin_SemiBin_79	12908
+SemiBin_SemiBin_54	226
+SemiBin_SemiBin_56	226
+MetaBAT2_69	2234
+SemiBin_SemiBin_80	191412
+SemiBin_SemiBin_448	100716
+CONCOCT_117	1485
+CONCOCT_136_sub	897
+CONCOCT_73_sub	1263979
+SemiBin_SemiBin_1072	1263979
+CONCOCT_45_sub	39960
+CONCOCT_170	1188228
+MetaBAT2_13_sub	2745
+CONCOCT_60	54248
+MetaBAT2_42	12908
+CONCOCT_87	467094
+CONCOCT_2_sub	1124597
+CONCOCT_93	186192
+CONCOCT_8	936476
+SemiBin_SemiBin_50	2198
+CONCOCT_192	38027
+SemiBin_SemiBin_159	168695
+CONCOCT_62	133539
+CONCOCT_198	1229
+CONCOCT_17	971279
+SemiBin_SemiBin_93	497
+CONCOCT_166_sub	1335757
+MetaBAT2_7	1335746
+CONCOCT_27	1292
+CONCOCT_214	265570
+MetaBAT2_46	1129
+SemiBin_SemiBin_374	80679
+MetaBAT2_9_sub	171436
+SemiBin_SemiBin_19	662
+SemiBin_SemiBin_75	662
+MetaBAT2_24	29497
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/biobox_file.tsv	Sat Feb 08 11:33:03 2025 +0000
@@ -0,0 +1,321 @@
+#CAMI Format for Binning
+@Version:0.9.0
+@SampleID:_SAMPLEID_
+@@SEQUENCEID	BINID
+S0C67443	CONCOCT_117
+S0C145665	CONCOCT_117
+S0C179008	CONCOCT_117
+S0C285214	CONCOCT_117
+S0C309108	CONCOCT_117
+S0C310129	CONCOCT_117
+S0C336019	CONCOCT_117
+S0C388550	CONCOCT_117
+S0C495394	CONCOCT_117
+S0C511360	CONCOCT_117
+S0C577842	CONCOCT_117
+S0C596918	CONCOCT_117
+S0C603398	CONCOCT_117
+S0C754713	CONCOCT_117
+S0C938786	CONCOCT_117
+S0C967914	CONCOCT_117
+S0C974893	CONCOCT_117
+S0C1006901	CONCOCT_117
+S0C1018235	CONCOCT_117
+S0C1018552	CONCOCT_117
+S0C1049501	CONCOCT_117
+S0C1067275	CONCOCT_117
+S0C1069633	CONCOCT_117
+S0C1089023	CONCOCT_117
+S0C1146406	CONCOCT_117
+S0C1154753	CONCOCT_117
+S0C1194005	CONCOCT_117
+S0C1226618	CONCOCT_117
+S0C1282023	CONCOCT_117
+S0C1332000	CONCOCT_117
+S0C1359995	CONCOCT_117
+S0C1396765	CONCOCT_117
+S0C1472996	CONCOCT_117
+S0C1475640	CONCOCT_117
+S0C2285	CONCOCT_136_sub
+S0C12513	CONCOCT_136_sub
+S0C13841	CONCOCT_136_sub
+S0C15954	CONCOCT_136_sub
+S0C33046	CONCOCT_136_sub
+S0C38240	CONCOCT_136_sub
+S0C40714	CONCOCT_136_sub
+S0C67745	CONCOCT_136_sub
+S0C96249	CONCOCT_136_sub
+S0C105628	CONCOCT_136_sub
+S0C121147	CONCOCT_136_sub
+S0C123278	CONCOCT_136_sub
+S0C128492	CONCOCT_136_sub
+S0C142447	CONCOCT_136_sub
+S0C143656	CONCOCT_136_sub
+S0C146090	CONCOCT_136_sub
+S0C146468	CONCOCT_136_sub
+S0C148477	CONCOCT_136_sub
+S0C154116	CONCOCT_136_sub
+S0C154853	CONCOCT_136_sub
+S0C183450	CONCOCT_136_sub
+S0C206740	CONCOCT_136_sub
+S0C217759	CONCOCT_136_sub
+S0C218807	CONCOCT_136_sub
+S0C232692	CONCOCT_136_sub
+S0C241720	CONCOCT_136_sub
+S0C254412	CONCOCT_136_sub
+S0C255416	CONCOCT_136_sub
+S0C257539	CONCOCT_136_sub
+S0C271698	CONCOCT_136_sub
+S0C273417	CONCOCT_136_sub
+S0C277828	CONCOCT_136_sub
+S0C292193	CONCOCT_136_sub
+S0C317783	CONCOCT_136_sub
+S0C325310	CONCOCT_136_sub
+S0C328828	CONCOCT_136_sub
+S0C329977	CONCOCT_136_sub
+S0C333294	CONCOCT_136_sub
+S0C368301	CONCOCT_136_sub
+S0C383465	CONCOCT_136_sub
+S0C394511	CONCOCT_136_sub
+S0C398856	CONCOCT_136_sub
+S0C403250	CONCOCT_136_sub
+S0C425442	CONCOCT_136_sub
+S0C452562	CONCOCT_136_sub
+S0C456710	CONCOCT_136_sub
+S0C463745	CONCOCT_136_sub
+S0C528906	CONCOCT_136_sub
+S0C537221	CONCOCT_136_sub
+S0C544925	CONCOCT_136_sub
+S0C561693	CONCOCT_136_sub
+S0C600277	CONCOCT_136_sub
+S0C604275	CONCOCT_136_sub
+S0C605807	CONCOCT_136_sub
+S0C637735	CONCOCT_136_sub
+S0C638781	CONCOCT_136_sub
+S0C649134	CONCOCT_136_sub
+S0C652655	CONCOCT_136_sub
+S0C660528	CONCOCT_136_sub
+S0C677873	CONCOCT_136_sub
+S0C680313	CONCOCT_136_sub
+S0C687459	CONCOCT_136_sub
+S0C692321	CONCOCT_136_sub
+S0C713693	CONCOCT_136_sub
+S0C714168	CONCOCT_136_sub
+S0C733252	CONCOCT_136_sub
+S0C776530	CONCOCT_136_sub
+S0C783755	CONCOCT_136_sub
+S0C795045	CONCOCT_136_sub
+S0C800057	CONCOCT_136_sub
+S0C813055	CONCOCT_136_sub
+S0C899262	CONCOCT_136_sub
+S0C913746	CONCOCT_136_sub
+S0C918289	CONCOCT_136_sub
+S0C938734	CONCOCT_136_sub
+S0C975726	CONCOCT_136_sub
+S0C979641	CONCOCT_136_sub
+S0C983123	CONCOCT_136_sub
+S0C997065	CONCOCT_136_sub
+S0C1002112	CONCOCT_136_sub
+S0C1021820	CONCOCT_136_sub
+S0C1025488	CONCOCT_136_sub
+S0C1065828	CONCOCT_136_sub
+S0C1070236	CONCOCT_136_sub
+S0C1073934	CONCOCT_136_sub
+S0C1113098	CONCOCT_136_sub
+S0C1114754	CONCOCT_136_sub
+S0C1114940	CONCOCT_136_sub
+S0C1147832	CONCOCT_136_sub
+S0C1152832	CONCOCT_136_sub
+S0C1163944	CONCOCT_136_sub
+S0C1165074	CONCOCT_136_sub
+S0C1169186	CONCOCT_136_sub
+S0C1169264	CONCOCT_136_sub
+S0C1171688	CONCOCT_136_sub
+S0C1176365	CONCOCT_136_sub
+S0C1185051	CONCOCT_136_sub
+S0C1186809	CONCOCT_136_sub
+S0C1210700	CONCOCT_136_sub
+S0C1214131	CONCOCT_136_sub
+S0C1221620	CONCOCT_136_sub
+S0C1234807	CONCOCT_136_sub
+S0C1239526	CONCOCT_136_sub
+S0C1254841	CONCOCT_136_sub
+S0C1285320	CONCOCT_136_sub
+S0C1293224	CONCOCT_136_sub
+S0C1295836	CONCOCT_136_sub
+S0C1304758	CONCOCT_136_sub
+S0C1304844	CONCOCT_136_sub
+S0C1325299	CONCOCT_136_sub
+S0C1352093	CONCOCT_136_sub
+S0C1379815	CONCOCT_136_sub
+S0C1383473	CONCOCT_136_sub
+S0C1392056	CONCOCT_136_sub
+S0C1393578	CONCOCT_136_sub
+S0C1393787	CONCOCT_136_sub
+S0C1463756	CONCOCT_136_sub
+S0C1473393	CONCOCT_136_sub
+S0C105857	CONCOCT_166_sub
+S0C388714	CONCOCT_17
+S0C813	CONCOCT_170
+S0C3376	CONCOCT_170
+S0C3946	CONCOCT_170
+S0C4598	CONCOCT_170
+S0C5801	CONCOCT_170
+S0C6129	CONCOCT_170
+S0C6683	CONCOCT_170
+S0C7348	CONCOCT_170
+S0C8735	CONCOCT_170
+S0C9580	CONCOCT_170
+S0C9975	CONCOCT_170
+S0C13152	CONCOCT_170
+S0C13440	CONCOCT_170
+S0C17036	CONCOCT_170
+S0C18177	CONCOCT_170
+S0C19017	CONCOCT_170
+S0C23506	CONCOCT_170
+S0C26465	CONCOCT_170
+S0C26897	CONCOCT_170
+S0C27778	CONCOCT_170
+S0C29092	CONCOCT_170
+S0C29873	CONCOCT_170
+S0C31104	CONCOCT_170
+S0C32058	CONCOCT_170
+S0C33000	CONCOCT_170
+S0C36793	CONCOCT_170
+S0C38649	CONCOCT_170
+S0C42734	CONCOCT_170
+S0C43766	CONCOCT_170
+S0C43907	CONCOCT_170
+S0C46070	CONCOCT_170
+S0C48380	CONCOCT_170
+S0C52799	CONCOCT_170
+S0C53306	CONCOCT_170
+S0C56322	CONCOCT_170
+S0C56380	CONCOCT_170
+S0C57389	CONCOCT_170
+S0C58396	CONCOCT_170
+S0C60056	CONCOCT_170
+S0C61727	CONCOCT_170
+S0C68023	CONCOCT_170
+S0C74410	CONCOCT_170
+S0C74790	CONCOCT_170
+S0C74939	CONCOCT_170
+S0C75897	CONCOCT_170
+S0C78941	CONCOCT_170
+S0C85952	CONCOCT_170
+S0C87085	CONCOCT_170
+S0C87881	CONCOCT_170
+S0C88932	CONCOCT_170
+S0C89448	CONCOCT_170
+S0C89868	CONCOCT_170
+S0C90415	CONCOCT_170
+S0C90716	CONCOCT_170
+S0C93293	CONCOCT_170
+S0C102816	CONCOCT_170
+S0C103662	CONCOCT_170
+S0C104694	CONCOCT_170
+S0C107175	CONCOCT_170
+S0C107697	CONCOCT_170
+S0C107933	CONCOCT_170
+S0C111037	CONCOCT_170
+S0C114385	CONCOCT_170
+S0C117906	CONCOCT_170
+S0C123235	CONCOCT_170
+S0C124089	CONCOCT_170
+S0C129769	CONCOCT_170
+S0C131077	CONCOCT_170
+S0C131919	CONCOCT_170
+S0C136538	CONCOCT_170
+S0C137113	CONCOCT_170
+S0C139193	CONCOCT_170
+S0C140030	CONCOCT_170
+S0C143099	CONCOCT_170
+S0C143812	CONCOCT_170
+S0C146859	CONCOCT_170
+S0C148933	CONCOCT_170
+S0C152340	CONCOCT_170
+S0C152505	CONCOCT_170
+S0C152600	CONCOCT_170
+S0C153465	CONCOCT_170
+S0C153977	CONCOCT_170
+S0C156191	CONCOCT_170
+S0C163440	CONCOCT_170
+S0C164900	CONCOCT_170
+S0C165431	CONCOCT_170
+S0C165600	CONCOCT_170
+S0C167514	CONCOCT_170
+S0C170731	CONCOCT_170
+S0C171275	CONCOCT_170
+S0C172053	CONCOCT_170
+S0C172143	CONCOCT_170
+S0C173871	CONCOCT_170
+S0C176168	CONCOCT_170
+S0C176457	CONCOCT_170
+S0C177012	CONCOCT_170
+S0C177016	CONCOCT_170
+S0C180505	CONCOCT_170
+S0C184052	CONCOCT_170
+S0C187627	CONCOCT_170
+S0C189589	CONCOCT_170
+S0C190286	CONCOCT_170
+S0C190997	CONCOCT_170
+S0C192169	CONCOCT_170
+S0C192913	CONCOCT_170
+S0C193235	CONCOCT_170
+S0C197282	CONCOCT_170
+S0C199440	CONCOCT_170
+S0C200742	CONCOCT_170
+S0C202327	CONCOCT_170
+S0C203916	CONCOCT_170
+S0C207418	CONCOCT_170
+S0C214076	CONCOCT_170
+S0C214145	CONCOCT_170
+S0C214674	CONCOCT_170
+S0C215796	CONCOCT_170
+S0C218011	CONCOCT_170
+S0C223793	CONCOCT_170
+S0C224911	CONCOCT_170
+S0C226616	CONCOCT_170
+S0C226964	CONCOCT_170
+S0C232179	CONCOCT_170
+S0C233703	CONCOCT_170
+S0C235269	CONCOCT_170
+S0C244843	CONCOCT_170
+S0C245988	CONCOCT_170
+S0C247775	CONCOCT_170
+S0C248142	CONCOCT_170
+S0C248525	CONCOCT_170
+S0C250249	CONCOCT_170
+S0C250769	CONCOCT_170
+S0C261957	CONCOCT_170
+S0C267920	CONCOCT_170
+S0C268515	CONCOCT_170
+S0C271398	CONCOCT_170
+S0C273474	CONCOCT_170
+S0C273642	CONCOCT_170
+S0C273909	CONCOCT_170
+S0C282614	CONCOCT_170
+S0C284421	CONCOCT_170
+S0C284529	CONCOCT_170
+S0C286800	CONCOCT_170
+S0C289235	CONCOCT_170
+S0C290438	CONCOCT_170
+S0C291627	CONCOCT_170
+S0C296643	CONCOCT_170
+S0C297219	CONCOCT_170
+S0C302272	CONCOCT_170
+S0C303794	CONCOCT_170
+S0C307970	CONCOCT_170
+S0C310701	CONCOCT_170
+S0C310818	CONCOCT_170
+S0C313722	CONCOCT_170
+S0C313791	CONCOCT_170
+S0C315247	CONCOCT_170
+S0C316931	CONCOCT_170
+S0C317968	CONCOCT_170
+S0C319375	CONCOCT_170
+S0C320040	CONCOCT_170
+S0C320442	CONCOCT_170
+S0C328161	CONCOCT_170
+S0C328842	CONCOCT_170
+S0C329759	CONCOCT_170
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/kraken2.tsv	Sat Feb 08 11:33:03 2025 +0000
@@ -0,0 +1,317 @@
+C	S0C67443	1415774
+U	S0C145665	0
+U	S0C179008	0
+U	S0C285214	0
+C	S0C309108	1415774
+U	S0C310129	0
+C	S0C336019	1415774
+U	S0C388550	0
+C	S0C495394	1415774
+C	S0C511360	1415774
+C	S0C577842	1415774
+C	S0C596918	1415774
+U	S0C603398	0
+U	S0C754713	0
+U	S0C938786	0
+C	S0C967914	1415774
+C	S0C974893	1415774
+U	S0C1006901	0
+U	S0C1018235	0
+U	S0C1018552	0
+C	S0C1049501	1415774
+C	S0C1067275	1415774
+U	S0C1069633	0
+U	S0C1089023	0
+U	S0C1146406	0
+U	S0C1154753	0
+U	S0C1194005	0
+U	S0C1226618	0
+C	S0C1282023	1415774
+C	S0C1332000	1415774
+C	S0C1359995	1415774
+U	S0C1396765	0
+U	S0C1472996	0
+U	S0C1475640	0
+C	S0C2285	897
+C	S0C12513	897
+C	S0C13841	897
+C	S0C15954	897
+C	S0C33046	897
+C	S0C38240	897
+C	S0C40714	897
+C	S0C67745	897
+C	S0C96249	897
+C	S0C105628	897
+C	S0C121147	897
+C	S0C123278	897
+C	S0C128492	897
+C	S0C142447	897
+C	S0C143656	897
+C	S0C146090	897
+C	S0C146468	897
+C	S0C148477	897
+C	S0C154116	897
+C	S0C154853	897
+C	S0C183450	897
+C	S0C206740	897
+C	S0C217759	897
+C	S0C218807	897
+C	S0C232692	897
+C	S0C241720	897
+C	S0C254412	897
+C	S0C255416	897
+C	S0C257539	897
+C	S0C271698	897
+C	S0C273417	897
+C	S0C277828	897
+C	S0C292193	897
+C	S0C317783	897
+C	S0C325310	897
+C	S0C328828	897
+C	S0C329977	897
+C	S0C333294	897
+C	S0C368301	897
+C	S0C383465	897
+C	S0C394511	897
+C	S0C398856	897
+C	S0C403250	897
+C	S0C425442	897
+C	S0C452562	897
+C	S0C456710	897
+C	S0C463745	897
+C	S0C528906	897
+C	S0C537221	897
+C	S0C544925	897
+C	S0C561693	897
+C	S0C600277	897
+C	S0C604275	897
+C	S0C605807	897
+C	S0C637735	897
+C	S0C638781	897
+C	S0C649134	897
+C	S0C652655	897
+C	S0C660528	897
+C	S0C677873	897
+C	S0C680313	897
+C	S0C687459	897
+C	S0C692321	897
+C	S0C713693	897
+C	S0C714168	897
+C	S0C733252	897
+C	S0C776530	897
+C	S0C783755	881
+C	S0C795045	897
+C	S0C800057	897
+C	S0C813055	897
+C	S0C899262	897
+C	S0C913746	897
+C	S0C918289	897
+C	S0C938734	897
+C	S0C975726	897
+C	S0C979641	897
+C	S0C983123	897
+C	S0C997065	897
+C	S0C1002112	897
+C	S0C1021820	897
+C	S0C1025488	897
+C	S0C1065828	897
+C	S0C1070236	897
+C	S0C1073934	897
+C	S0C1113098	897
+C	S0C1114754	897
+C	S0C1114940	897
+C	S0C1147832	897
+C	S0C1152832	897
+C	S0C1163944	897
+C	S0C1165074	897
+C	S0C1169186	897
+C	S0C1169264	897
+C	S0C1171688	897
+C	S0C1176365	897
+C	S0C1185051	897
+C	S0C1186809	897
+C	S0C1210700	897
+C	S0C1214131	897
+C	S0C1221620	897
+C	S0C1234807	897
+C	S0C1239526	897
+C	S0C1254841	562
+C	S0C1285320	897
+C	S0C1293224	897
+C	S0C1295836	897
+C	S0C1304758	897
+C	S0C1304844	897
+C	S0C1325299	897
+C	S0C1352093	897
+C	S0C1379815	897
+C	S0C1383473	897
+C	S0C1392056	897
+C	S0C1393578	897
+C	S0C1393787	897
+C	S0C1463756	897
+C	S0C1473393	897
+C	S0C105857	1335757
+C	S0C388714	1343739
+C	S0C813	1188229
+C	S0C3376	1188229
+C	S0C3946	1188229
+C	S0C4598	1188229
+C	S0C5801	1188229
+C	S0C6129	1188229
+C	S0C6683	1188229
+C	S0C7348	1188229
+C	S0C8735	1188229
+C	S0C9580	1188229
+C	S0C9975	1188229
+C	S0C13152	1188229
+C	S0C13440	1188229
+C	S0C17036	1188229
+C	S0C18177	1188229
+C	S0C19017	1188229
+C	S0C23506	1188229
+C	S0C26465	1188229
+C	S0C26897	1188229
+C	S0C27778	1188229
+C	S0C29092	1188229
+C	S0C29873	1188229
+C	S0C31104	1188229
+C	S0C32058	1188229
+C	S0C33000	1188229
+C	S0C36793	1188229
+C	S0C38649	1188229
+C	S0C42734	1188229
+C	S0C43766	1188229
+C	S0C43907	1188229
+C	S0C46070	1188229
+C	S0C48380	1188229
+C	S0C52799	1188229
+C	S0C53306	1188229
+C	S0C56322	1188229
+C	S0C56380	1188229
+C	S0C57389	1188229
+C	S0C58396	1188229
+C	S0C60056	1188229
+C	S0C61727	1188229
+C	S0C68023	1188229
+C	S0C74410	1188229
+C	S0C74790	1188229
+C	S0C74939	1188229
+C	S0C75897	1188229
+C	S0C78941	1188229
+C	S0C85952	1188229
+C	S0C87085	1188229
+C	S0C87881	1188229
+C	S0C88932	1188229
+C	S0C89448	1188229
+C	S0C89868	1188229
+C	S0C90415	1188229
+C	S0C90716	1188229
+C	S0C93293	1188229
+C	S0C102816	1188229
+C	S0C103662	1188229
+C	S0C104694	1188229
+C	S0C107175	1188229
+C	S0C107697	1188229
+C	S0C107933	1188229
+C	S0C111037	1188229
+C	S0C114385	1188229
+C	S0C117906	1188229
+C	S0C123235	1188229
+C	S0C124089	1188229
+C	S0C129769	1188229
+C	S0C131077	1188229
+C	S0C131919	1188229
+C	S0C136538	1188229
+C	S0C137113	1188229
+C	S0C139193	1188229
+C	S0C140030	1188229
+C	S0C143099	1188229
+C	S0C143812	1188229
+C	S0C146859	1188229
+C	S0C148933	1188229
+C	S0C152340	1188229
+C	S0C152505	1188229
+C	S0C152600	1188229
+C	S0C153465	1188229
+C	S0C153977	1188229
+C	S0C156191	1188229
+C	S0C163440	1188229
+C	S0C164900	1188229
+C	S0C165431	1188229
+C	S0C165600	1188229
+C	S0C167514	1188229
+C	S0C170731	1188229
+C	S0C171275	1188229
+C	S0C172053	1188229
+C	S0C172143	1188229
+C	S0C173871	1188229
+C	S0C176168	1188229
+C	S0C176457	1188229
+C	S0C177012	1188229
+C	S0C177016	1188229
+C	S0C180505	1188229
+C	S0C184052	1188229
+C	S0C187627	1188229
+C	S0C189589	1188229
+C	S0C190286	1188229
+C	S0C190997	1188229
+C	S0C192169	1188229
+C	S0C192913	1188229
+C	S0C193235	1188229
+C	S0C197282	1188229
+C	S0C199440	1188229
+C	S0C200742	1188229
+C	S0C202327	1188229
+C	S0C203916	1188229
+C	S0C207418	1188229
+C	S0C214076	1188229
+C	S0C214145	1188229
+C	S0C214674	1188229
+C	S0C215796	1188229
+C	S0C218011	1188229
+C	S0C223793	1188229
+C	S0C224911	1188229
+C	S0C226616	1188229
+C	S0C226964	1188229
+C	S0C232179	1188229
+C	S0C233703	1188229
+C	S0C235269	1188229
+C	S0C244843	1188229
+C	S0C245988	1188229
+C	S0C247775	1188229
+C	S0C248142	1188229
+C	S0C248525	1188229
+C	S0C250249	1188229
+C	S0C250769	1188229
+C	S0C261957	1188229
+C	S0C267920	1188229
+C	S0C268515	1188229
+C	S0C271398	1188229
+C	S0C273474	1188229
+C	S0C273642	1188229
+C	S0C273909	1188229
+C	S0C282614	1188229
+C	S0C284421	1188229
+C	S0C284529	1188229
+C	S0C286800	1188229
+C	S0C289235	1188229
+C	S0C290438	1188229
+C	S0C291627	1188229
+C	S0C296643	1188229
+C	S0C297219	1188229
+C	S0C302272	1188229
+C	S0C303794	1188229
+C	S0C307970	1188229
+C	S0C310701	1188229
+C	S0C310818	1188229
+C	S0C313722	1188229
+C	S0C313791	1188229
+C	S0C315247	1188229
+C	S0C316931	1188229
+C	S0C317968	1188229
+C	S0C319375	1188229
+C	S0C320040	1188229
+C	S0C320442	1188229
+C	S0C328161	1188229
+C	S0C328842	1188229
+C	S0C329759	1188229
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/modified_biobox_file_bin.tsv	Sat Feb 08 11:33:03 2025 +0000
@@ -0,0 +1,321 @@
+#CAMI Format for Binning
+@Version:0.9.0
+@SampleID:_SAMPLEID_
+@@SEQUENCEID	BINID	TAXID
+S0C67443	CONCOCT_117	1485
+S0C145665	CONCOCT_117	1485
+S0C179008	CONCOCT_117	1485
+S0C285214	CONCOCT_117	1485
+S0C309108	CONCOCT_117	1485
+S0C310129	CONCOCT_117	1485
+S0C336019	CONCOCT_117	1485
+S0C388550	CONCOCT_117	1485
+S0C495394	CONCOCT_117	1485
+S0C511360	CONCOCT_117	1485
+S0C577842	CONCOCT_117	1485
+S0C596918	CONCOCT_117	1485
+S0C603398	CONCOCT_117	1485
+S0C754713	CONCOCT_117	1485
+S0C938786	CONCOCT_117	1485
+S0C967914	CONCOCT_117	1485
+S0C974893	CONCOCT_117	1485
+S0C1006901	CONCOCT_117	1485
+S0C1018235	CONCOCT_117	1485
+S0C1018552	CONCOCT_117	1485
+S0C1049501	CONCOCT_117	1485
+S0C1067275	CONCOCT_117	1485
+S0C1069633	CONCOCT_117	1485
+S0C1089023	CONCOCT_117	1485
+S0C1146406	CONCOCT_117	1485
+S0C1154753	CONCOCT_117	1485
+S0C1194005	CONCOCT_117	1485
+S0C1226618	CONCOCT_117	1485
+S0C1282023	CONCOCT_117	1485
+S0C1332000	CONCOCT_117	1485
+S0C1359995	CONCOCT_117	1485
+S0C1396765	CONCOCT_117	1485
+S0C1472996	CONCOCT_117	1485
+S0C1475640	CONCOCT_117	1485
+S0C2285	CONCOCT_136_sub	897
+S0C12513	CONCOCT_136_sub	897
+S0C13841	CONCOCT_136_sub	897
+S0C15954	CONCOCT_136_sub	897
+S0C33046	CONCOCT_136_sub	897
+S0C38240	CONCOCT_136_sub	897
+S0C40714	CONCOCT_136_sub	897
+S0C67745	CONCOCT_136_sub	897
+S0C96249	CONCOCT_136_sub	897
+S0C105628	CONCOCT_136_sub	897
+S0C121147	CONCOCT_136_sub	897
+S0C123278	CONCOCT_136_sub	897
+S0C128492	CONCOCT_136_sub	897
+S0C142447	CONCOCT_136_sub	897
+S0C143656	CONCOCT_136_sub	897
+S0C146090	CONCOCT_136_sub	897
+S0C146468	CONCOCT_136_sub	897
+S0C148477	CONCOCT_136_sub	897
+S0C154116	CONCOCT_136_sub	897
+S0C154853	CONCOCT_136_sub	897
+S0C183450	CONCOCT_136_sub	897
+S0C206740	CONCOCT_136_sub	897
+S0C217759	CONCOCT_136_sub	897
+S0C218807	CONCOCT_136_sub	897
+S0C232692	CONCOCT_136_sub	897
+S0C241720	CONCOCT_136_sub	897
+S0C254412	CONCOCT_136_sub	897
+S0C255416	CONCOCT_136_sub	897
+S0C257539	CONCOCT_136_sub	897
+S0C271698	CONCOCT_136_sub	897
+S0C273417	CONCOCT_136_sub	897
+S0C277828	CONCOCT_136_sub	897
+S0C292193	CONCOCT_136_sub	897
+S0C317783	CONCOCT_136_sub	897
+S0C325310	CONCOCT_136_sub	897
+S0C328828	CONCOCT_136_sub	897
+S0C329977	CONCOCT_136_sub	897
+S0C333294	CONCOCT_136_sub	897
+S0C368301	CONCOCT_136_sub	897
+S0C383465	CONCOCT_136_sub	897
+S0C394511	CONCOCT_136_sub	897
+S0C398856	CONCOCT_136_sub	897
+S0C403250	CONCOCT_136_sub	897
+S0C425442	CONCOCT_136_sub	897
+S0C452562	CONCOCT_136_sub	897
+S0C456710	CONCOCT_136_sub	897
+S0C463745	CONCOCT_136_sub	897
+S0C528906	CONCOCT_136_sub	897
+S0C537221	CONCOCT_136_sub	897
+S0C544925	CONCOCT_136_sub	897
+S0C561693	CONCOCT_136_sub	897
+S0C600277	CONCOCT_136_sub	897
+S0C604275	CONCOCT_136_sub	897
+S0C605807	CONCOCT_136_sub	897
+S0C637735	CONCOCT_136_sub	897
+S0C638781	CONCOCT_136_sub	897
+S0C649134	CONCOCT_136_sub	897
+S0C652655	CONCOCT_136_sub	897
+S0C660528	CONCOCT_136_sub	897
+S0C677873	CONCOCT_136_sub	897
+S0C680313	CONCOCT_136_sub	897
+S0C687459	CONCOCT_136_sub	897
+S0C692321	CONCOCT_136_sub	897
+S0C713693	CONCOCT_136_sub	897
+S0C714168	CONCOCT_136_sub	897
+S0C733252	CONCOCT_136_sub	897
+S0C776530	CONCOCT_136_sub	897
+S0C783755	CONCOCT_136_sub	897
+S0C795045	CONCOCT_136_sub	897
+S0C800057	CONCOCT_136_sub	897
+S0C813055	CONCOCT_136_sub	897
+S0C899262	CONCOCT_136_sub	897
+S0C913746	CONCOCT_136_sub	897
+S0C918289	CONCOCT_136_sub	897
+S0C938734	CONCOCT_136_sub	897
+S0C975726	CONCOCT_136_sub	897
+S0C979641	CONCOCT_136_sub	897
+S0C983123	CONCOCT_136_sub	897
+S0C997065	CONCOCT_136_sub	897
+S0C1002112	CONCOCT_136_sub	897
+S0C1021820	CONCOCT_136_sub	897
+S0C1025488	CONCOCT_136_sub	897
+S0C1065828	CONCOCT_136_sub	897
+S0C1070236	CONCOCT_136_sub	897
+S0C1073934	CONCOCT_136_sub	897
+S0C1113098	CONCOCT_136_sub	897
+S0C1114754	CONCOCT_136_sub	897
+S0C1114940	CONCOCT_136_sub	897
+S0C1147832	CONCOCT_136_sub	897
+S0C1152832	CONCOCT_136_sub	897
+S0C1163944	CONCOCT_136_sub	897
+S0C1165074	CONCOCT_136_sub	897
+S0C1169186	CONCOCT_136_sub	897
+S0C1169264	CONCOCT_136_sub	897
+S0C1171688	CONCOCT_136_sub	897
+S0C1176365	CONCOCT_136_sub	897
+S0C1185051	CONCOCT_136_sub	897
+S0C1186809	CONCOCT_136_sub	897
+S0C1210700	CONCOCT_136_sub	897
+S0C1214131	CONCOCT_136_sub	897
+S0C1221620	CONCOCT_136_sub	897
+S0C1234807	CONCOCT_136_sub	897
+S0C1239526	CONCOCT_136_sub	897
+S0C1254841	CONCOCT_136_sub	897
+S0C1285320	CONCOCT_136_sub	897
+S0C1293224	CONCOCT_136_sub	897
+S0C1295836	CONCOCT_136_sub	897
+S0C1304758	CONCOCT_136_sub	897
+S0C1304844	CONCOCT_136_sub	897
+S0C1325299	CONCOCT_136_sub	897
+S0C1352093	CONCOCT_136_sub	897
+S0C1379815	CONCOCT_136_sub	897
+S0C1383473	CONCOCT_136_sub	897
+S0C1392056	CONCOCT_136_sub	897
+S0C1393578	CONCOCT_136_sub	897
+S0C1393787	CONCOCT_136_sub	897
+S0C1463756	CONCOCT_136_sub	897
+S0C1473393	CONCOCT_136_sub	897
+S0C105857	CONCOCT_166_sub	1335757
+S0C388714	CONCOCT_17	971279
+S0C813	CONCOCT_170	1188228
+S0C3376	CONCOCT_170	1188228
+S0C3946	CONCOCT_170	1188228
+S0C4598	CONCOCT_170	1188228
+S0C5801	CONCOCT_170	1188228
+S0C6129	CONCOCT_170	1188228
+S0C6683	CONCOCT_170	1188228
+S0C7348	CONCOCT_170	1188228
+S0C8735	CONCOCT_170	1188228
+S0C9580	CONCOCT_170	1188228
+S0C9975	CONCOCT_170	1188228
+S0C13152	CONCOCT_170	1188228
+S0C13440	CONCOCT_170	1188228
+S0C17036	CONCOCT_170	1188228
+S0C18177	CONCOCT_170	1188228
+S0C19017	CONCOCT_170	1188228
+S0C23506	CONCOCT_170	1188228
+S0C26465	CONCOCT_170	1188228
+S0C26897	CONCOCT_170	1188228
+S0C27778	CONCOCT_170	1188228
+S0C29092	CONCOCT_170	1188228
+S0C29873	CONCOCT_170	1188228
+S0C31104	CONCOCT_170	1188228
+S0C32058	CONCOCT_170	1188228
+S0C33000	CONCOCT_170	1188228
+S0C36793	CONCOCT_170	1188228
+S0C38649	CONCOCT_170	1188228
+S0C42734	CONCOCT_170	1188228
+S0C43766	CONCOCT_170	1188228
+S0C43907	CONCOCT_170	1188228
+S0C46070	CONCOCT_170	1188228
+S0C48380	CONCOCT_170	1188228
+S0C52799	CONCOCT_170	1188228
+S0C53306	CONCOCT_170	1188228
+S0C56322	CONCOCT_170	1188228
+S0C56380	CONCOCT_170	1188228
+S0C57389	CONCOCT_170	1188228
+S0C58396	CONCOCT_170	1188228
+S0C60056	CONCOCT_170	1188228
+S0C61727	CONCOCT_170	1188228
+S0C68023	CONCOCT_170	1188228
+S0C74410	CONCOCT_170	1188228
+S0C74790	CONCOCT_170	1188228
+S0C74939	CONCOCT_170	1188228
+S0C75897	CONCOCT_170	1188228
+S0C78941	CONCOCT_170	1188228
+S0C85952	CONCOCT_170	1188228
+S0C87085	CONCOCT_170	1188228
+S0C87881	CONCOCT_170	1188228
+S0C88932	CONCOCT_170	1188228
+S0C89448	CONCOCT_170	1188228
+S0C89868	CONCOCT_170	1188228
+S0C90415	CONCOCT_170	1188228
+S0C90716	CONCOCT_170	1188228
+S0C93293	CONCOCT_170	1188228
+S0C102816	CONCOCT_170	1188228
+S0C103662	CONCOCT_170	1188228
+S0C104694	CONCOCT_170	1188228
+S0C107175	CONCOCT_170	1188228
+S0C107697	CONCOCT_170	1188228
+S0C107933	CONCOCT_170	1188228
+S0C111037	CONCOCT_170	1188228
+S0C114385	CONCOCT_170	1188228
+S0C117906	CONCOCT_170	1188228
+S0C123235	CONCOCT_170	1188228
+S0C124089	CONCOCT_170	1188228
+S0C129769	CONCOCT_170	1188228
+S0C131077	CONCOCT_170	1188228
+S0C131919	CONCOCT_170	1188228
+S0C136538	CONCOCT_170	1188228
+S0C137113	CONCOCT_170	1188228
+S0C139193	CONCOCT_170	1188228
+S0C140030	CONCOCT_170	1188228
+S0C143099	CONCOCT_170	1188228
+S0C143812	CONCOCT_170	1188228
+S0C146859	CONCOCT_170	1188228
+S0C148933	CONCOCT_170	1188228
+S0C152340	CONCOCT_170	1188228
+S0C152505	CONCOCT_170	1188228
+S0C152600	CONCOCT_170	1188228
+S0C153465	CONCOCT_170	1188228
+S0C153977	CONCOCT_170	1188228
+S0C156191	CONCOCT_170	1188228
+S0C163440	CONCOCT_170	1188228
+S0C164900	CONCOCT_170	1188228
+S0C165431	CONCOCT_170	1188228
+S0C165600	CONCOCT_170	1188228
+S0C167514	CONCOCT_170	1188228
+S0C170731	CONCOCT_170	1188228
+S0C171275	CONCOCT_170	1188228
+S0C172053	CONCOCT_170	1188228
+S0C172143	CONCOCT_170	1188228
+S0C173871	CONCOCT_170	1188228
+S0C176168	CONCOCT_170	1188228
+S0C176457	CONCOCT_170	1188228
+S0C177012	CONCOCT_170	1188228
+S0C177016	CONCOCT_170	1188228
+S0C180505	CONCOCT_170	1188228
+S0C184052	CONCOCT_170	1188228
+S0C187627	CONCOCT_170	1188228
+S0C189589	CONCOCT_170	1188228
+S0C190286	CONCOCT_170	1188228
+S0C190997	CONCOCT_170	1188228
+S0C192169	CONCOCT_170	1188228
+S0C192913	CONCOCT_170	1188228
+S0C193235	CONCOCT_170	1188228
+S0C197282	CONCOCT_170	1188228
+S0C199440	CONCOCT_170	1188228
+S0C200742	CONCOCT_170	1188228
+S0C202327	CONCOCT_170	1188228
+S0C203916	CONCOCT_170	1188228
+S0C207418	CONCOCT_170	1188228
+S0C214076	CONCOCT_170	1188228
+S0C214145	CONCOCT_170	1188228
+S0C214674	CONCOCT_170	1188228
+S0C215796	CONCOCT_170	1188228
+S0C218011	CONCOCT_170	1188228
+S0C223793	CONCOCT_170	1188228
+S0C224911	CONCOCT_170	1188228
+S0C226616	CONCOCT_170	1188228
+S0C226964	CONCOCT_170	1188228
+S0C232179	CONCOCT_170	1188228
+S0C233703	CONCOCT_170	1188228
+S0C235269	CONCOCT_170	1188228
+S0C244843	CONCOCT_170	1188228
+S0C245988	CONCOCT_170	1188228
+S0C247775	CONCOCT_170	1188228
+S0C248142	CONCOCT_170	1188228
+S0C248525	CONCOCT_170	1188228
+S0C250249	CONCOCT_170	1188228
+S0C250769	CONCOCT_170	1188228
+S0C261957	CONCOCT_170	1188228
+S0C267920	CONCOCT_170	1188228
+S0C268515	CONCOCT_170	1188228
+S0C271398	CONCOCT_170	1188228
+S0C273474	CONCOCT_170	1188228
+S0C273642	CONCOCT_170	1188228
+S0C273909	CONCOCT_170	1188228
+S0C282614	CONCOCT_170	1188228
+S0C284421	CONCOCT_170	1188228
+S0C284529	CONCOCT_170	1188228
+S0C286800	CONCOCT_170	1188228
+S0C289235	CONCOCT_170	1188228
+S0C290438	CONCOCT_170	1188228
+S0C291627	CONCOCT_170	1188228
+S0C296643	CONCOCT_170	1188228
+S0C297219	CONCOCT_170	1188228
+S0C302272	CONCOCT_170	1188228
+S0C303794	CONCOCT_170	1188228
+S0C307970	CONCOCT_170	1188228
+S0C310701	CONCOCT_170	1188228
+S0C310818	CONCOCT_170	1188228
+S0C313722	CONCOCT_170	1188228
+S0C313791	CONCOCT_170	1188228
+S0C315247	CONCOCT_170	1188228
+S0C316931	CONCOCT_170	1188228
+S0C317968	CONCOCT_170	1188228
+S0C319375	CONCOCT_170	1188228
+S0C320040	CONCOCT_170	1188228
+S0C320442	CONCOCT_170	1188228
+S0C328161	CONCOCT_170	1188228
+S0C328842	CONCOCT_170	1188228
+S0C329759	CONCOCT_170	1188228
--- /dev/null	Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/modified_biobox_file_contig.tsv	Sat Feb 08 11:33:03 2025 +0000
@@ -0,0 +1,321 @@
+#CAMI Format for Binning
+@Version:0.9.0
+@SampleID:_SAMPLEID_
+@@SEQUENCEID	BINID	TAXID
+S0C67443	CONCOCT_117	1415774
+S0C145665	CONCOCT_117	0
+S0C179008	CONCOCT_117	0
+S0C285214	CONCOCT_117	0
+S0C309108	CONCOCT_117	1415774
+S0C310129	CONCOCT_117	0
+S0C336019	CONCOCT_117	1415774
+S0C388550	CONCOCT_117	0
+S0C495394	CONCOCT_117	1415774
+S0C511360	CONCOCT_117	1415774
+S0C577842	CONCOCT_117	1415774
+S0C596918	CONCOCT_117	1415774
+S0C603398	CONCOCT_117	0
+S0C754713	CONCOCT_117	0
+S0C938786	CONCOCT_117	0
+S0C967914	CONCOCT_117	1415774
+S0C974893	CONCOCT_117	1415774
+S0C1006901	CONCOCT_117	0
+S0C1018235	CONCOCT_117	0
+S0C1018552	CONCOCT_117	0
+S0C1049501	CONCOCT_117	1415774
+S0C1067275	CONCOCT_117	1415774
+S0C1069633	CONCOCT_117	0
+S0C1089023	CONCOCT_117	0
+S0C1146406	CONCOCT_117	0
+S0C1154753	CONCOCT_117	0
+S0C1194005	CONCOCT_117	0
+S0C1226618	CONCOCT_117	0
+S0C1282023	CONCOCT_117	1415774
+S0C1332000	CONCOCT_117	1415774
+S0C1359995	CONCOCT_117	1415774
+S0C1396765	CONCOCT_117	0
+S0C1472996	CONCOCT_117	0
+S0C1475640	CONCOCT_117	0
+S0C2285	CONCOCT_136_sub	897
+S0C12513	CONCOCT_136_sub	897
+S0C13841	CONCOCT_136_sub	897
+S0C15954	CONCOCT_136_sub	897
+S0C33046	CONCOCT_136_sub	897
+S0C38240	CONCOCT_136_sub	897
+S0C40714	CONCOCT_136_sub	897
+S0C67745	CONCOCT_136_sub	897
+S0C96249	CONCOCT_136_sub	897
+S0C105628	CONCOCT_136_sub	897
+S0C121147	CONCOCT_136_sub	897
+S0C123278	CONCOCT_136_sub	897
+S0C128492	CONCOCT_136_sub	897
+S0C142447	CONCOCT_136_sub	897
+S0C143656	CONCOCT_136_sub	897
+S0C146090	CONCOCT_136_sub	897
+S0C146468	CONCOCT_136_sub	897
+S0C148477	CONCOCT_136_sub	897
+S0C154116	CONCOCT_136_sub	897
+S0C154853	CONCOCT_136_sub	897
+S0C183450	CONCOCT_136_sub	897
+S0C206740	CONCOCT_136_sub	897
+S0C217759	CONCOCT_136_sub	897
+S0C218807	CONCOCT_136_sub	897
+S0C232692	CONCOCT_136_sub	897
+S0C241720	CONCOCT_136_sub	897
+S0C254412	CONCOCT_136_sub	897
+S0C255416	CONCOCT_136_sub	897
+S0C257539	CONCOCT_136_sub	897
+S0C271698	CONCOCT_136_sub	897
+S0C273417	CONCOCT_136_sub	897
+S0C277828	CONCOCT_136_sub	897
+S0C292193	CONCOCT_136_sub	897
+S0C317783	CONCOCT_136_sub	897
+S0C325310	CONCOCT_136_sub	897
+S0C328828	CONCOCT_136_sub	897
+S0C329977	CONCOCT_136_sub	897
+S0C333294	CONCOCT_136_sub	897
+S0C368301	CONCOCT_136_sub	897
+S0C383465	CONCOCT_136_sub	897
+S0C394511	CONCOCT_136_sub	897
+S0C398856	CONCOCT_136_sub	897
+S0C403250	CONCOCT_136_sub	897
+S0C425442	CONCOCT_136_sub	897
+S0C452562	CONCOCT_136_sub	897
+S0C456710	CONCOCT_136_sub	897
+S0C463745	CONCOCT_136_sub	897
+S0C528906	CONCOCT_136_sub	897
+S0C537221	CONCOCT_136_sub	897
+S0C544925	CONCOCT_136_sub	897
+S0C561693	CONCOCT_136_sub	897
+S0C600277	CONCOCT_136_sub	897
+S0C604275	CONCOCT_136_sub	897
+S0C605807	CONCOCT_136_sub	897
+S0C637735	CONCOCT_136_sub	897
+S0C638781	CONCOCT_136_sub	897
+S0C649134	CONCOCT_136_sub	897
+S0C652655	CONCOCT_136_sub	897
+S0C660528	CONCOCT_136_sub	897
+S0C677873	CONCOCT_136_sub	897
+S0C680313	CONCOCT_136_sub	897
+S0C687459	CONCOCT_136_sub	897
+S0C692321	CONCOCT_136_sub	897
+S0C713693	CONCOCT_136_sub	897
+S0C714168	CONCOCT_136_sub	897
+S0C733252	CONCOCT_136_sub	897
+S0C776530	CONCOCT_136_sub	897
+S0C783755	CONCOCT_136_sub	881
+S0C795045	CONCOCT_136_sub	897
+S0C800057	CONCOCT_136_sub	897
+S0C813055	CONCOCT_136_sub	897
+S0C899262	CONCOCT_136_sub	897
+S0C913746	CONCOCT_136_sub	897
+S0C918289	CONCOCT_136_sub	897
+S0C938734	CONCOCT_136_sub	897
+S0C975726	CONCOCT_136_sub	897
+S0C979641	CONCOCT_136_sub	897
+S0C983123	CONCOCT_136_sub	897
+S0C997065	CONCOCT_136_sub	897
+S0C1002112	CONCOCT_136_sub	897
+S0C1021820	CONCOCT_136_sub	897
+S0C1025488	CONCOCT_136_sub	897
+S0C1065828	CONCOCT_136_sub	897
+S0C1070236	CONCOCT_136_sub	897
+S0C1073934	CONCOCT_136_sub	897
+S0C1113098	CONCOCT_136_sub	897
+S0C1114754	CONCOCT_136_sub	897
+S0C1114940	CONCOCT_136_sub	897
+S0C1147832	CONCOCT_136_sub	897
+S0C1152832	CONCOCT_136_sub	897
+S0C1163944	CONCOCT_136_sub	897
+S0C1165074	CONCOCT_136_sub	897
+S0C1169186	CONCOCT_136_sub	897
+S0C1169264	CONCOCT_136_sub	897
+S0C1171688	CONCOCT_136_sub	897
+S0C1176365	CONCOCT_136_sub	897
+S0C1185051	CONCOCT_136_sub	897
+S0C1186809	CONCOCT_136_sub	897
+S0C1210700	CONCOCT_136_sub	897
+S0C1214131	CONCOCT_136_sub	897
+S0C1221620	CONCOCT_136_sub	897
+S0C1234807	CONCOCT_136_sub	897
+S0C1239526	CONCOCT_136_sub	897
+S0C1254841	CONCOCT_136_sub	562
+S0C1285320	CONCOCT_136_sub	897
+S0C1293224	CONCOCT_136_sub	897
+S0C1295836	CONCOCT_136_sub	897
+S0C1304758	CONCOCT_136_sub	897
+S0C1304844	CONCOCT_136_sub	897
+S0C1325299	CONCOCT_136_sub	897
+S0C1352093	CONCOCT_136_sub	897
+S0C1379815	CONCOCT_136_sub	897
+S0C1383473	CONCOCT_136_sub	897
+S0C1392056	CONCOCT_136_sub	897
+S0C1393578	CONCOCT_136_sub	897
+S0C1393787	CONCOCT_136_sub	897
+S0C1463756	CONCOCT_136_sub	897
+S0C1473393	CONCOCT_136_sub	897
+S0C105857	CONCOCT_166_sub	1335757
+S0C388714	CONCOCT_17	1343739
+S0C813	CONCOCT_170	1188229
+S0C3376	CONCOCT_170	1188229
+S0C3946	CONCOCT_170	1188229
+S0C4598	CONCOCT_170	1188229
+S0C5801	CONCOCT_170	1188229
+S0C6129	CONCOCT_170	1188229
+S0C6683	CONCOCT_170	1188229
+S0C7348	CONCOCT_170	1188229
+S0C8735	CONCOCT_170	1188229
+S0C9580	CONCOCT_170	1188229
+S0C9975	CONCOCT_170	1188229
+S0C13152	CONCOCT_170	1188229
+S0C13440	CONCOCT_170	1188229
+S0C17036	CONCOCT_170	1188229
+S0C18177	CONCOCT_170	1188229
+S0C19017	CONCOCT_170	1188229
+S0C23506	CONCOCT_170	1188229
+S0C26465	CONCOCT_170	1188229
+S0C26897	CONCOCT_170	1188229
+S0C27778	CONCOCT_170	1188229
+S0C29092	CONCOCT_170	1188229
+S0C29873	CONCOCT_170	1188229
+S0C31104	CONCOCT_170	1188229
+S0C32058	CONCOCT_170	1188229
+S0C33000	CONCOCT_170	1188229
+S0C36793	CONCOCT_170	1188229
+S0C38649	CONCOCT_170	1188229
+S0C42734	CONCOCT_170	1188229
+S0C43766	CONCOCT_170	1188229
+S0C43907	CONCOCT_170	1188229
+S0C46070	CONCOCT_170	1188229
+S0C48380	CONCOCT_170	1188229
+S0C52799	CONCOCT_170	1188229
+S0C53306	CONCOCT_170	1188229
+S0C56322	CONCOCT_170	1188229
+S0C56380	CONCOCT_170	1188229
+S0C57389	CONCOCT_170	1188229
+S0C58396	CONCOCT_170	1188229
+S0C60056	CONCOCT_170	1188229
+S0C61727	CONCOCT_170	1188229
+S0C68023	CONCOCT_170	1188229
+S0C74410	CONCOCT_170	1188229
+S0C74790	CONCOCT_170	1188229
+S0C74939	CONCOCT_170	1188229
+S0C75897	CONCOCT_170	1188229
+S0C78941	CONCOCT_170	1188229
+S0C85952	CONCOCT_170	1188229
+S0C87085	CONCOCT_170	1188229
+S0C87881	CONCOCT_170	1188229
+S0C88932	CONCOCT_170	1188229
+S0C89448	CONCOCT_170	1188229
+S0C89868	CONCOCT_170	1188229
+S0C90415	CONCOCT_170	1188229
+S0C90716	CONCOCT_170	1188229
+S0C93293	CONCOCT_170	1188229
+S0C102816	CONCOCT_170	1188229
+S0C103662	CONCOCT_170	1188229
+S0C104694	CONCOCT_170	1188229
+S0C107175	CONCOCT_170	1188229
+S0C107697	CONCOCT_170	1188229
+S0C107933	CONCOCT_170	1188229
+S0C111037	CONCOCT_170	1188229
+S0C114385	CONCOCT_170	1188229
+S0C117906	CONCOCT_170	1188229
+S0C123235	CONCOCT_170	1188229
+S0C124089	CONCOCT_170	1188229
+S0C129769	CONCOCT_170	1188229
+S0C131077	CONCOCT_170	1188229
+S0C131919	CONCOCT_170	1188229
+S0C136538	CONCOCT_170	1188229
+S0C137113	CONCOCT_170	1188229
+S0C139193	CONCOCT_170	1188229
+S0C140030	CONCOCT_170	1188229
+S0C143099	CONCOCT_170	1188229
+S0C143812	CONCOCT_170	1188229
+S0C146859	CONCOCT_170	1188229
+S0C148933	CONCOCT_170	1188229
+S0C152340	CONCOCT_170	1188229
+S0C152505	CONCOCT_170	1188229
+S0C152600	CONCOCT_170	1188229
+S0C153465	CONCOCT_170	1188229
+S0C153977	CONCOCT_170	1188229
+S0C156191	CONCOCT_170	1188229
+S0C163440	CONCOCT_170	1188229
+S0C164900	CONCOCT_170	1188229
+S0C165431	CONCOCT_170	1188229
+S0C165600	CONCOCT_170	1188229
+S0C167514	CONCOCT_170	1188229
+S0C170731	CONCOCT_170	1188229
+S0C171275	CONCOCT_170	1188229
+S0C172053	CONCOCT_170	1188229
+S0C172143	CONCOCT_170	1188229
+S0C173871	CONCOCT_170	1188229
+S0C176168	CONCOCT_170	1188229
+S0C176457	CONCOCT_170	1188229
+S0C177012	CONCOCT_170	1188229
+S0C177016	CONCOCT_170	1188229
+S0C180505	CONCOCT_170	1188229
+S0C184052	CONCOCT_170	1188229
+S0C187627	CONCOCT_170	1188229
+S0C189589	CONCOCT_170	1188229
+S0C190286	CONCOCT_170	1188229
+S0C190997	CONCOCT_170	1188229
+S0C192169	CONCOCT_170	1188229
+S0C192913	CONCOCT_170	1188229
+S0C193235	CONCOCT_170	1188229
+S0C197282	CONCOCT_170	1188229
+S0C199440	CONCOCT_170	1188229
+S0C200742	CONCOCT_170	1188229
+S0C202327	CONCOCT_170	1188229
+S0C203916	CONCOCT_170	1188229
+S0C207418	CONCOCT_170	1188229
+S0C214076	CONCOCT_170	1188229
+S0C214145	CONCOCT_170	1188229
+S0C214674	CONCOCT_170	1188229
+S0C215796	CONCOCT_170	1188229
+S0C218011	CONCOCT_170	1188229
+S0C223793	CONCOCT_170	1188229
+S0C224911	CONCOCT_170	1188229
+S0C226616	CONCOCT_170	1188229
+S0C226964	CONCOCT_170	1188229
+S0C232179	CONCOCT_170	1188229
+S0C233703	CONCOCT_170	1188229
+S0C235269	CONCOCT_170	1188229
+S0C244843	CONCOCT_170	1188229
+S0C245988	CONCOCT_170	1188229
+S0C247775	CONCOCT_170	1188229
+S0C248142	CONCOCT_170	1188229
+S0C248525	CONCOCT_170	1188229
+S0C250249	CONCOCT_170	1188229
+S0C250769	CONCOCT_170	1188229
+S0C261957	CONCOCT_170	1188229
+S0C267920	CONCOCT_170	1188229
+S0C268515	CONCOCT_170	1188229
+S0C271398	CONCOCT_170	1188229
+S0C273474	CONCOCT_170	1188229
+S0C273642	CONCOCT_170	1188229
+S0C273909	CONCOCT_170	1188229
+S0C282614	CONCOCT_170	1188229
+S0C284421	CONCOCT_170	1188229
+S0C284529	CONCOCT_170	1188229
+S0C286800	CONCOCT_170	1188229
+S0C289235	CONCOCT_170	1188229
+S0C290438	CONCOCT_170	1188229
+S0C291627	CONCOCT_170	1188229
+S0C296643	CONCOCT_170	1188229
+S0C297219	CONCOCT_170	1188229
+S0C302272	CONCOCT_170	1188229
+S0C303794	CONCOCT_170	1188229
+S0C307970	CONCOCT_170	1188229
+S0C310701	CONCOCT_170	1188229
+S0C310818	CONCOCT_170	1188229
+S0C313722	CONCOCT_170	1188229
+S0C313791	CONCOCT_170	1188229
+S0C315247	CONCOCT_170	1188229
+S0C316931	CONCOCT_170	1188229
+S0C317968	CONCOCT_170	1188229
+S0C319375	CONCOCT_170	1188229
+S0C320040	CONCOCT_170	1188229
+S0C320442	CONCOCT_170	1188229
+S0C328161	CONCOCT_170	1188229
+S0C328842	CONCOCT_170	1188229
+S0C329759	CONCOCT_170	1188229
--- a/test-data/test_bat_file.tsv	Sun Sep 08 14:37:41 2024 +0000
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,39 +0,0 @@
-# bin	classification	reason	lineage	lineage scores
-1.FASTA	taxid assigned	based on 4161/4187 ORFs	1;131567;2;1783272;201174;1760;85007;182102;85043;1736349	1.00;1.00;1.00;1.00;1.00;1.00;0.99;0.99;0.99;0.31
-10.FASTA	taxid assigned	based on 1895/1915 ORFs	1;131567;2;1224;1236;135614;32033;2370;2371	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;0.94
-11.FASTA	taxid assigned	based on 4793/4923 ORFs	1;131567;2;1783272;1239;186801;186802;31979;1884934;191027*	1.00;1.00;1.00;0.99;0.99;0.98;0.98;0.83;0.81;0.81
-12.FASTA	taxid assigned	based on 4056/4136 ORFs	1;131567;2;1783270;68336;976;1853228;1853229;563835;398041;462367	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;0.99;0.99
-13.FASTA	taxid assigned	based on 3575/3644 ORFs	1;131567;2;1783272;544448;31969;186332;186333;2086;2088	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00
-14.FASTA	taxid assigned	based on 245/248 ORFs	1;131567;2;1224;28216;80840;75682;149698;1736522	1.00;1.00;1.00;0.99;0.91;0.91;0.91;0.89;0.35
-15.FASTA	taxid assigned	based on 3834/3853 ORFs	1;131567;2;1224;28211;204455;31989;1097466;404881	1.00;1.00;1.00;1.00;1.00;0.99;0.97;0.96;0.96
-16.FASTA	taxid assigned	based on 2824/2869 ORFs	1;131567;2;1783272;544448;31969;186332;186333;2086;2088	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00
-17.FASTA	taxid assigned	based on 2646/2678 ORFs	1;131567;2;1783272;1239;186801;186802;186804;214904;227138	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;0.90
-18.FASTA	taxid assigned	based on 6183/6302 ORFs	1;131567;2;1783272;200795;388447;388448;768649;768650*	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00
-19.FASTA	taxid assigned	based on 8855/8930 ORFs	1;131567;2;1783272;1239;91061;1385;539002;539742;33986*	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00
-2.FASTA	taxid assigned	based on 3440/3461 ORFs	1;131567;2;1783272;1239;91061;1385;539002;539742;33986*	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00
-20.FASTA	taxid assigned	based on 4264/4287 ORFs	1;131567;2;1224;28216;206351;1499392;397275;1121000	1.00;1.00;1.00;1.00;1.00;1.00;0.99;0.99;0.97
-21.FASTA	taxid assigned	based on 5835/5867 ORFs	1;131567;2;1224;28216;80840;75682;149698;1736522	1.00;1.00;1.00;1.00;0.98;0.98;0.98;0.97;0.59
-22.FASTA	taxid assigned	based on 2576/2598 ORFs	1;131567;2;1783270;68336;976;117743;200644;49546;363408;328515	1.00;1.00;1.00;1.00;1.00;1.00;1.00;0.97;0.97;0.96;0.89
-23.FASTA	taxid assigned	based on 5759/5763 ORFs	1;131567;2	1.00;0.74;0.73
-24.FASTA	taxid assigned	based on 6458/6478 ORFs	1;131567;2;1224;28211;204455;31989;265;266	1.00;1.00;1.00;1.00;1.00;0.99;0.99;0.95;0.46
-25.FASTA	taxid assigned	based on 4145/4341 ORFs	1;131567;2;1783270;68336;976;1853228;1853229;563835;398041;462367	1.00;1.00;1.00;0.99;0.99;0.99;0.93;0.93;0.93;0.89;0.88
-26.FASTA	taxid assigned	based on 2208/2231 ORFs	1;131567;2;1783272;1239;186801;186802;1491775;42447;182411	1.00;1.00;1.00;1.00;1.00;1.00;1.00;0.97;0.97;0.72
-27.FASTA	taxid assigned	based on 4557/4633 ORFs	1;131567;2;1783270;68336;976;1853228;1853229;563835;1004300;1004304	1.00;1.00;1.00;1.00;1.00;1.00;0.89;0.89;0.89;0.89;0.88
-28.FASTA	taxid assigned	based on 1856/1860 ORFs	1;131567;2;1783272;1239;91061;1385;539002;539742;33986*	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00
-29.FASTA	taxid assigned	based on 3780/3817 ORFs	1;131567;2;1783272;1239;91061;1385;539002;539742;33986*	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00
-3.FASTA	taxid assigned	based on 205/207 ORFs	1;131567;2;1783272;1239;909932;909929;1843491;55506;55507*	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;0.99;0.99
-30.FASTA	taxid assigned	based on 6218/6259 ORFs	1;131567;2;1224;28216;80840;75682;149698;1736532	1.00;1.00;1.00;1.00;0.98;0.98;0.98;0.97;0.57
-31.FASTA	taxid assigned	based on 2720/2744 ORFs	1;131567;2;1224;28216;80840;80864;198705;198706	1.00;1.00;1.00;1.00;0.99;0.99;0.98;0.97;0.97
-32.FASTA	taxid assigned	based on 3222/3245 ORFs	1;131567;2;1783272;201174;1760;85006;85021;99479;1736399	1.00;1.00;1.00;1.00;1.00;1.00;1.00;0.99;0.96;0.53
-33.FASTA	taxid assigned	based on 292/297 ORFs	1;131567;2;1224;28211;204455;31989	1.00;1.00;0.99;0.89;0.84;0.50;0.49
-34.FASTA	taxid assigned	based on 3557/3604 ORFs	1;131567;2;1783272;1239;186801;186802;186803;653683;264463*	1.00;1.00;1.00;1.00;1.00;1.00;1.00;0.99;0.99;0.99
-35.FASTA	taxid assigned	based on 2175/2205 ORFs	1;131567;2;1783272;1239;909932;909929;1843491;55506;55507*	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;0.99;0.99
-36.FASTA	taxid assigned	based on 3370/3422 ORFs	1;131567;2;1783270;68336;976;1853228;1853229;563835;1004300;1004304	1.00;1.00;1.00;1.00;1.00;1.00;0.89;0.89;0.89;0.89;0.87
-37.FASTA	taxid assigned	based on 4212/4264 ORFs	1;131567;2;1783270;68336;976;1853228;1853229;563835;1004300;1004304	1.00;1.00;1.00;1.00;1.00;1.00;0.92;0.92;0.92;0.92;0.91
-38.FASTA	taxid assigned	based on 8008/8038 ORFs	1;131567;2;1224;28211;204455;31989;265;266	1.00;1.00;1.00;1.00;1.00;0.99;0.99;0.98;0.40
-4.FASTA	taxid assigned	based on 8568/8682 ORFs	1;131567;2;1783270;68336;976;1853228;1853229;563835;1004300;1004304	1.00;1.00;1.00;1.00;1.00;1.00;0.92;0.92;0.92;0.92;0.90
-5.FASTA	taxid assigned	based on 2948/2952 ORFs	1;131567;2;1224;28211;204455;31989;205889;990712	1.00;1.00;1.00;1.00;1.00;0.87;0.87;0.86;0.86
-6.FASTA	taxid assigned	based on 2846/2901 ORFs	1;131567;2;1224;1236;135614;32033;68;1736549	1.00;1.00;1.00;0.96;0.94;0.92;0.85;0.65;0.52
-7.FASTA	taxid assigned	based on 5030/5081 ORFs	1;131567;2;1224;68525;28221;213118;213119;218207;259354	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;0.38
-8.FASTA	taxid assigned	based on 2537/2579 ORFs	1;131567;2;1783272;544448;31969;186332;186333;2086;2088	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00
-9.FASTA	taxid assigned	based on 1648/1673 ORFs	1;131567;2;1783272;544448;31969;186332;186333;2086;2088	1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00;1.00
\ No newline at end of file
--- a/test-data/test_biobox_file.tsv	Sun Sep 08 14:37:41 2024 +0000
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,13 +0,0 @@
-#CAMI Format for Binning
-@Version:0.9.0
-@SampleID:gsa
-@@SEQUENCEID	BINID
-RL|S1|C1198	1
-RL|S1|C3912	1
-RL|S1|C131	10
-RL|S1|C1410	10
-RL|S1|C2929	10
-RL|S1|C3754	10
-RL|S1|C1335	11
-RL|S1|C1344	11
-RL|S1|C1352	11
\ No newline at end of file
--- a/test-data/test_biobox_file_add_taxid_bat.tsv	Sun Sep 08 14:37:41 2024 +0000
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,13 +0,0 @@
-#CAMI Format for Binning
-@Version:0.9.0
-@SampleID:_SAMPLEID_
-@@SEQUENCEID	BINID	TAXID
-RL|S1|C1198	1	1736349
-RL|S1|C3912	1	1736349
-RL|S1|C131	10	2371
-RL|S1|C1410	10	2371
-RL|S1|C2929	10	2371
-RL|S1|C3754	10	2371
-RL|S1|C1335	11	191027
-RL|S1|C1344	11	191027
-RL|S1|C1352	11	191027
--- a/test-data/test_biobox_file_add_taxid_gtdb.tsv	Sun Sep 08 14:37:41 2024 +0000
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,13 +0,0 @@
-#CAMI Format for Binning
-@Version:0.9.0
-@SampleID:_SAMPLEID_
-@@SEQUENCEID	BINID	TAXID
-RL|S1|C1198	1	12908
-RL|S1|C3912	1	12908
-RL|S1|C131	10	2371
-RL|S1|C1410	10	2371
-RL|S1|C2929	10	2371
-RL|S1|C3754	10	2371
-RL|S1|C1335	11	191027
-RL|S1|C1344	11	191027
-RL|S1|C1352	11	191027
--- a/test-data/test_gtdb_file.tsv	Sun Sep 08 14:37:41 2024 +0000
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,39 +0,0 @@
-user_genome	classification	fastani_reference	fastani_reference_radius	fastani_taxonomy	fastani_ani	fastani_af	closest_placement_reference	closest_placement_radius	closest_placement_taxonomy	closest_placement_ani	closest_placement_af	pplacer_taxonomy	classification_method	note	other_related_references(genome_id,species_name,radius,ANI,AF)	msa_percent	translation_table	red_value	warnings
-1	d__Bacteria;p__Actinobacteriota;c__Actinomycetia;o__Mycobacteriales;f__Mycobacteriaceae;g__Williamsia_A;s__Williamsia_A herbipolensis	GCF_000964005.1	95.0	d__Bacteria;p__Actinobacteriota;c__Actinomycetia;o__Mycobacteriales;f__Mycobacteriaceae;g__Williamsia_A;s__Williamsia_A herbipolensis	95.01	0.891	GCF_000964005.1	95.0	d__Bacteria;p__Actinobacteriota;c__Actinomycetia;o__Mycobacteriales;f__Mycobacteriaceae;g__Williamsia_A;s__Williamsia_A herbipolensis	95.01	0.891	d__Bacteria;p__Actinobacteriota;c__Actinomycetia;o__Mycobacteriales;f__Mycobacteriaceae;g__Williamsia_A;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_014635305.1, s__Williamsia_A phyllosphaerae, 95.0, 82.43, 0.702; GCA_016462415.1, s__Williamsia_A sp016462415, 95.0, 82.15, 0.649; GCF_018474015.1, s__Williamsia_A sp018474015, 95.0, 80.23, 0.523	96.49	11	N/A	N/A
-10	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Xanthomonadales;f__Xanthomonadaceae;g__Xylella;s__Xylella fastidiosa	GCF_011801475.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Xanthomonadales;f__Xanthomonadaceae;g__Xylella;s__Xylella fastidiosa	99.99	1.0	GCF_011801475.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Xanthomonadales;f__Xanthomonadaceae;g__Xylella;s__Xylella fastidiosa	99.99	1.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Xanthomonadales;f__Xanthomonadaceae;g__Xylella;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_013177435.1, s__Xylella taiwanensis, 95.0, 82.85, 0.849	85.13	11	N/A	N/A
-11	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Peptostreptococcales;f__Caminicellaceae;g__Paramaledivibacter;s__Paramaledivibacter caminithermalis	GCF_900142245.1	95.0	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Peptostreptococcales;f__Caminicellaceae;g__Paramaledivibacter;s__Paramaledivibacter caminithermalis	99.97	0.872	GCF_900142245.1	95.0	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Peptostreptococcales;f__Caminicellaceae;g__Paramaledivibacter;s__Paramaledivibacter caminithermalis	99.97	0.872	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Peptostreptococcales;f__Caminicellaceae;g__;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	N/A	78.49	11	N/A	Genome has more than 10.0% of markers with multiple hits
-12	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Flavisolibacter;s__Flavisolibacter ginsengisoli	GCF_900129295.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Flavisolibacter;s__Flavisolibacter ginsengisoli	100.0	0.999	GCF_900129295.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Flavisolibacter;s__Flavisolibacter ginsengisoli	100.0	0.999	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Flavisolibacter;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_017745135.1, s__Flavisolibacter sp017745135, 95.0, 77.32, 0.1; GCA_013327885.1, s__Flavisolibacter sp013327885, 95.0, 77.25, 0.081; GCF_007970805.1, s__Flavisolibacter ginsenosidimutans, 95.0, 76.92, 0.056; GCF_003628535.1, s__Flavisolibacter nicotianae, 95.0, 76.88, 0.08; GCA_014163555.1, s__Flavisolibacter sp014163555, 95.0, 76.86, 0.077; GCA_002050435.1, s__Flavisolibacter sp002050435, 95.0, 76.62, 0.139	97.8	11	N/A	N/A
-13	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	GCF_003550015.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	97.96	0.859	GCF_003550015.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	97.96	0.859	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_017388605.1, s__Anaeroplasma sp017388605, 95.0, 83.32, 0.715; GCA_016280975.1, s__Anaeroplasma sp016280975, 95.0, 78.46, 0.241; GCA_017449215.1, s__Anaeroplasma sp017449215, 95.0, 77.98, 0.251; GCA_002449755.1, s__Anaeroplasma sp002449755, 95.0, 77.78, 0.249; GCA_017441525.1, s__Anaeroplasma sp017441525, 95.0, 77.67, 0.269; GCA_016282815.1, s__Anaeroplasma sp016282815, 95.0, 77.61, 0.204; GCA_017524905.1, s__Anaeroplasma sp017524905, 95.0, 77.59, 0.242; GCA_900770055.1, s__Anaeroplasma sp900770055, 95.0, 77.45, 0.176; GCA_015059145.1, s__Anaeroplasma sp015059145, 95.0, 77.44, 0.194; GCA_017542485.1, s__Anaeroplasma sp017542485, 95.0, 77.44, 0.199; GCA_017462645.1, s__Anaeroplasma sp017462645, 95.0, 77.4, 0.236; GCA_016288855.1, s__Anaeroplasma sp016288855, 95.0, 77.33, 0.203; GCA_017444645.1, s__Anaeroplasma sp017444645, 95.0, 77.24, 0.231; GCA_017454375.1, s__Anaeroplasma sp017454375, 95.0, 77.07, 0.14; GCA_902783745.1, s__Anaeroplasma sp902783745, 95.0, 77.01, 0.214; GCA_018715825.1, s__Anaeroplasma faecigallinarum, 95.0, 76.96, 0.115; GCA_900767915.1, s__Anaeroplasma sp900767915, 95.0, 76.92, 0.173; GCA_902796895.1, s__Anaeroplasma sp902796895, 95.0, 76.82, 0.227; GCA_905236105.1, s__Anaeroplasma sp905236105, 95.0, 76.14, 0.118; GCA_905236965.1, s__Anaeroplasma sp905236965, 95.0, 75.89, 0.176	55.08	11	N/A	Genome has more than 19.2% of markers with multiple hits
-14	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__Pseudoduganella sp001425045	GCF_001425045.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__Pseudoduganella sp001425045	100.0	1.0	GCF_001425045.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__Pseudoduganella sp001425045	100.0	1.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_001425265.1, s__Pseudoduganella sp001425265, 95.0, 92.95, 0.957; GCF_003053665.1, s__Pseudoduganella sp003053665, 95.0, 91.93, 0.891; GCF_009857595.1, s__Pseudoduganella aquatica_A, 95.0, 91.22, 0.978; GCF_900116645.1, s__Pseudoduganella namucuonensis, 95.0, 87.85, 0.913; GCF_014191875.1, s__Pseudoduganella violacea, 95.0, 84.06, 0.761; GCF_013369485.1, s__Pseudoduganella sp013369485, 95.0, 84.01, 0.804; GCF_009674485.1, s__Pseudoduganella sp009674485, 95.0, 83.86, 0.804; GCF_000425385.1, s__Pseudoduganella violaceinigra, 95.0, 83.6, 0.804; GCF_001191005.1, s__Pseudoduganella sp001191005, 95.0, 83.48, 0.848; GCF_004421005.1, s__Pseudoduganella plicata, 95.0, 83.23, 0.717; GCF_003028855.1, s__Pseudoduganella armeniaca, 95.0, 83.18, 0.804; GCA_008011715.1, s__Pseudoduganella haloabium, 95.0, 83.0, 0.848; GCF_007830455.1, s__Pseudoduganella lurida, 95.0, 82.99, 0.761; GCF_009720865.1, s__Pseudoduganella ginsengisoli, 95.0, 82.96, 0.848; GCF_001427305.1, s__Pseudoduganella sp001427305, 95.0, 82.81, 0.761; GCF_004322755.1, s__Pseudoduganella albidiflava, 95.0, 82.76, 0.826; GCF_009720835.1, s__Pseudoduganella buxea, 95.0, 82.6, 0.804; GCF_009857475.1, s__Pseudoduganella guangdongensis, 95.0, 82.56, 0.783; GCF_004217275.1, s__Pseudoduganella sp004217275, 95.0, 82.55, 0.761; GCF_900113115.1, s__Pseudoduganella sp900113115, 95.0, 82.37, 0.739; GCA_002454505.1, s__Pseudoduganella sp002454505, 95.0, 82.35, 0.783; GCF_009727155.1, s__Pseudoduganella dura, 95.0, 82.31, 0.848; GCF_014192225.1, s__Pseudoduganella umbonata, 95.0, 82.27, 0.826; GCF_001425005.1, s__Pseudoduganella sp001425005, 95.0, 82.22, 0.783; GCF_004209755.1, s__Pseudoduganella lutea, 95.0, 82.18, 0.826; GCF_007830495.1, s__Pseudoduganella flava, 95.0, 82.17, 0.804; GCF_009720745.1, s__Pseudoduganella eburnea, 95.0, 81.81, 0.848	12.39	11	N/A	N/A
-15	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Albidovulum;s__Albidovulum denitrificans	GCF_002973535.1	95.0	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Albidovulum;s__Albidovulum denitrificans	100.0	0.998	GCF_002973535.1	95.0	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Albidovulum;s__Albidovulum denitrificans	100.0	0.998	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Albidovulum;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_002440625.1, s__Albidovulum sp002440625, 95.0, 81.59, 0.611; GCA_002280515.1, s__Albidovulum sp002280515, 95.0, 81.47, 0.618; GCA_011620265.1, s__Albidovulum sp011620265, 95.0, 81.18, 0.602; GCA_008933605.1, s__Albidovulum sp008933605, 95.0, 80.63, 0.571; GCA_002841115.1, s__Albidovulum sp002841115, 95.0, 80.51, 0.565; GCF_900302475.1, s__Albidovulum aquaemixtae, 95.0, 79.33, 0.459; GCF_002927635.1, s__Albidovulum inexpectatum, 95.0, 79.06, 0.482	89.91	11	N/A	N/A
-16	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	GCF_003550015.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	98.99	0.916	GCF_003550015.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	98.99	0.916	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_017388605.1, s__Anaeroplasma sp017388605, 95.0, 83.71, 0.719; GCA_017449215.1, s__Anaeroplasma sp017449215, 95.0, 78.26, 0.268; GCA_017441525.1, s__Anaeroplasma sp017441525, 95.0, 78.17, 0.276; GCA_017524905.1, s__Anaeroplasma sp017524905, 95.0, 77.95, 0.238; GCA_002449755.1, s__Anaeroplasma sp002449755, 95.0, 77.9, 0.268; GCA_016280975.1, s__Anaeroplasma sp016280975, 95.0, 77.81, 0.257; GCA_017462645.1, s__Anaeroplasma sp017462645, 95.0, 77.8, 0.236; GCA_017542485.1, s__Anaeroplasma sp017542485, 95.0, 77.55, 0.195; GCA_017444645.1, s__Anaeroplasma sp017444645, 95.0, 77.47, 0.262; GCA_900770055.1, s__Anaeroplasma sp900770055, 95.0, 77.41, 0.184; GCA_902783745.1, s__Anaeroplasma sp902783745, 95.0, 77.4, 0.217; GCA_016288855.1, s__Anaeroplasma sp016288855, 95.0, 77.38, 0.218; GCA_016282815.1, s__Anaeroplasma sp016282815, 95.0, 77.33, 0.221; GCA_015059145.1, s__Anaeroplasma sp015059145, 95.0, 77.32, 0.197; GCA_017454375.1, s__Anaeroplasma sp017454375, 95.0, 77.22, 0.13; GCA_900767915.1, s__Anaeroplasma sp900767915, 95.0, 77.2, 0.183; GCA_018715825.1, s__Anaeroplasma faecigallinarum, 95.0, 76.96, 0.111; GCA_902796895.1, s__Anaeroplasma sp902796895, 95.0, 76.93, 0.242; GCA_905236965.1, s__Anaeroplasma sp905236965, 95.0, 76.16, 0.185; GCA_905236105.1, s__Anaeroplasma sp905236105, 95.0, 76.08, 0.131	50.77	11	N/A	Genome has more than 15.8% of markers with multiple hits
-17	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Peptostreptococcales;f__Peptostreptococcaceae;g__Tepidibacter;s__Tepidibacter formicigenes	GCF_900142235.1	95.0	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Peptostreptococcales;f__Peptostreptococcaceae;g__Tepidibacter;s__Tepidibacter formicigenes	100.0	0.999	GCF_900142235.1	95.0	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Peptostreptococcales;f__Peptostreptococcaceae;g__Tepidibacter;s__Tepidibacter formicigenes	100.0	0.999	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Peptostreptococcales;f__Peptostreptococcaceae;g__Tepidibacter;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_900129915.1, s__Tepidibacter thalassicus, 95.0, 86.9, 0.78	77.03	11	N/A	N/A
-18	d__Bacteria;p__Chloroflexota;c__Ktedonobacteria;o__Ktedonobacterales;f__Ktedonobacteraceae;g__Thermosporothrix;s__Thermosporothrix hazakensis	GCF_003253565.1	95.0	d__Bacteria;p__Chloroflexota;c__Ktedonobacteria;o__Ktedonobacterales;f__Ktedonobacteraceae;g__Thermosporothrix;s__Thermosporothrix hazakensis	100.0	0.999	GCF_003253565.1	95.0	d__Bacteria;p__Chloroflexota;c__Ktedonobacteria;o__Ktedonobacterales;f__Ktedonobacteraceae;g__Thermosporothrix;s__Thermosporothrix hazakensis	100.0	0.999	d__Bacteria;p__Chloroflexota;c__Ktedonobacteria;o__Ktedonobacterales;f__Ktedonobacteraceae;g__;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	N/A	84.41	11	N/A	Genome has more than 11.7% of markers with multiple hits
-19	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	GCF_001423965.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	99.76	0.989	GCF_001423965.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	99.76	0.989	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_000702605.1, s__Exiguobacterium_A acetylicum, 95.0, 90.87, 0.853; GCF_001939065.1, s__Exiguobacterium_A indicum, 95.0, 90.72, 0.833; GCF_001275385.1, s__Exiguobacterium_A sp001275385, 95.0, 89.22, 0.814; GCF_018618755.1, s__Exiguobacterium_A sp018618755, 95.0, 80.92, 0.543; GCF_000702625.1, s__Exiguobacterium_A oxidotolerans, 95.0, 80.85, 0.548; GCF_000019905.1, s__Exiguobacterium_A sibiricum, 95.0, 80.84, 0.552; GCF_000620865.1, s__Exiguobacterium_A sibiricum_A, 95.0, 80.82, 0.534; GCA_902363455.1, s__Exiguobacterium_A sp902363455, 95.0, 80.8, 0.51; GCF_003339585.1, s__Exiguobacterium_A sp003339585, 95.0, 80.75, 0.542; GCF_000620805.1, s__Exiguobacterium_A undae, 95.0, 80.72, 0.516; GCF_000685865.1, s__Exiguobacterium_A antarcticum, 95.0, 80.66, 0.512; GCF_014524545.1, s__Exiguobacterium_A sp004339505, 95.0, 80.64, 0.522; GCF_001870785.1, s__Exiguobacterium_A sp001870785, 95.0, 80.58, 0.531; GCF_003344535.1, s__Exiguobacterium_A flavidum, 95.0, 79.37, 0.3	16.18	11	N/A	Genome has more than 82.5% of markers with multiple hits
-2	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	GCF_001423965.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	99.23	0.971	GCF_001423965.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	99.23	0.971	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_000702605.1, s__Exiguobacterium_A acetylicum, 95.0, 90.41, 0.883; GCF_001939065.1, s__Exiguobacterium_A indicum, 95.0, 90.37, 0.852; GCF_001275385.1, s__Exiguobacterium_A sp001275385, 95.0, 88.8, 0.834; GCF_018618755.1, s__Exiguobacterium_A sp018618755, 95.0, 80.82, 0.518; GCA_902363455.1, s__Exiguobacterium_A sp902363455, 95.0, 80.82, 0.478; GCF_000702625.1, s__Exiguobacterium_A oxidotolerans, 95.0, 80.81, 0.511; GCF_000620865.1, s__Exiguobacterium_A sibiricum_A, 95.0, 80.77, 0.523; GCF_000620805.1, s__Exiguobacterium_A undae, 95.0, 80.74, 0.5; GCF_003339585.1, s__Exiguobacterium_A sp003339585, 95.0, 80.63, 0.504; GCF_000019905.1, s__Exiguobacterium_A sibiricum, 95.0, 80.61, 0.502; GCF_000685865.1, s__Exiguobacterium_A antarcticum, 95.0, 80.57, 0.501; GCF_014524545.1, s__Exiguobacterium_A sp004339505, 95.0, 80.55, 0.514; GCF_001870785.1, s__Exiguobacterium_A sp001870785, 95.0, 80.52, 0.514; GCF_003344535.1, s__Exiguobacterium_A flavidum, 95.0, 79.14, 0.277	86.16	11	N/A	N/A
-20	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Chitinibacteraceae;g__Andreprevotia;s__Andreprevotia lacus	GCF_900176275.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Chitinibacteraceae;g__Andreprevotia;s__Andreprevotia lacus	100.0	1.0	GCF_900176275.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Chitinibacteraceae;g__Andreprevotia;s__Andreprevotia lacus	100.0	1.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Chitinibacteraceae;g__Andreprevotia;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_009848685.1, s__Andreprevotia sp009848685, 95.0, 82.66, 0.616; GCF_000711875.1, s__Andreprevotia chitinilytica, 95.0, 80.35, 0.45	92.83	11	N/A	N/A
-21	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__Pseudoduganella sp001425045	GCF_001425045.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__Pseudoduganella sp001425045	100.0	1.0	GCF_001425045.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__Pseudoduganella sp001425045	100.0	1.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_001425265.1, s__Pseudoduganella sp001425265, 95.0, 90.09, 0.928; GCF_003053665.1, s__Pseudoduganella sp003053665, 95.0, 89.99, 0.888; GCF_009857595.1, s__Pseudoduganella aquatica_A, 95.0, 88.9, 0.843; GCF_900116645.1, s__Pseudoduganella namucuonensis, 95.0, 85.3, 0.781; GCF_014191875.1, s__Pseudoduganella violacea, 95.0, 82.17, 0.604; GCF_001191005.1, s__Pseudoduganella sp001191005, 95.0, 82.07, 0.612; GCF_013369485.1, s__Pseudoduganella sp013369485, 95.0, 82.03, 0.605; GCA_008011715.1, s__Pseudoduganella haloabium, 95.0, 81.49, 0.621; GCF_009674485.1, s__Pseudoduganella sp009674485, 95.0, 81.47, 0.689; GCF_009720835.1, s__Pseudoduganella buxea, 95.0, 81.41, 0.6; GCF_009857475.1, s__Pseudoduganella guangdongensis, 95.0, 81.4, 0.581; GCF_003028855.1, s__Pseudoduganella armeniaca, 95.0, 81.39, 0.619; GCF_000425385.1, s__Pseudoduganella violaceinigra, 95.0, 81.23, 0.526; GCF_007830455.1, s__Pseudoduganella lurida, 95.0, 81.11, 0.574; GCF_900113115.1, s__Pseudoduganella sp900113115, 95.0, 81.1, 0.541; GCF_004217275.1, s__Pseudoduganella sp004217275, 95.0, 81.1, 0.555; GCF_009720745.1, s__Pseudoduganella eburnea, 95.0, 81.0, 0.551; GCA_002454505.1, s__Pseudoduganella sp002454505, 95.0, 81.0, 0.579; GCF_001425005.1, s__Pseudoduganella sp001425005, 95.0, 80.95, 0.557; GCF_014192225.1, s__Pseudoduganella umbonata, 95.0, 80.88, 0.602; GCF_009727155.1, s__Pseudoduganella dura, 95.0, 80.84, 0.597; GCF_004322755.1, s__Pseudoduganella albidiflava, 95.0, 80.82, 0.628; GCF_001427305.1, s__Pseudoduganella sp001427305, 95.0, 80.8, 0.562; GCF_004421005.1, s__Pseudoduganella plicata, 95.0, 80.7, 0.553; GCF_004209755.1, s__Pseudoduganella lutea, 95.0, 80.57, 0.569; GCF_007830495.1, s__Pseudoduganella flava, 95.0, 80.5, 0.617; GCF_009720865.1, s__Pseudoduganella ginsengisoli, 95.0, 80.45, 0.545	43.37	11	N/A	N/A
-22	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Flavobacteriales;f__Flavobacteriaceae;g__Nonlabens;s__Nonlabens dokdonensis	GCF_000332115.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Flavobacteriales;f__Flavobacteriaceae;g__Nonlabens;s__Nonlabens dokdonensis	100.0	1.0	GCF_000332115.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Flavobacteriales;f__Flavobacteriaceae;g__Nonlabens;s__Nonlabens dokdonensis	100.0	1.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Flavobacteriales;f__Flavobacteriaceae;g__Nonlabens;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_002162835.1, s__Nonlabens dokdonensis_B, 95.0, 86.47, 0.762; GCF_000732625.1, s__Nonlabens ulvanivorans, 95.0, 79.63, 0.287; GCF_002934445.1, s__Nonlabens xylanidelens, 95.0, 79.33, 0.543; GCF_002831625.1, s__Nonlabens sp002831625, 95.0, 79.02, 0.461; GCF_012974865.1, s__Nonlabens sp012974865, 95.0, 78.76, 0.472; GCA_000153385.1, s__Nonlabens sp000153385, 95.0, 78.67, 0.259; GCF_000755285.1, s__Nonlabens ulvanivorans_A, 95.0, 78.48, 0.316; GCF_002954765.1, s__Nonlabens arenilitoris, 95.0, 78.4, 0.305; GCA_018401815.1, s__Nonlabens sp018401815, 95.0, 78.16, 0.397; GCF_003966335.1, s__Nonlabens ponticola, 95.0, 77.67, 0.152; GCF_900101765.1, s__Nonlabens sp900101765, 95.0, 77.65, 0.156; GCF_000831385.1, s__Nonlabens marinus, 95.0, 77.49, 0.16; GCF_002994045.1, s__Nonlabens agnitus, 95.0, 77.34, 0.184; GCF_001413925.1, s__Nonlabens sp001413925, 95.0, 76.88, 0.17; GCF_002954355.1, s__Nonlabens tegetincola, 95.0, 76.75, 0.152; GCF_002117125.1, s__Nonlabens spongiae, 95.0, 76.63, 0.121; GCF_003865345.1, s__Nonlabens xiamenensis, 95.0, 76.61, 0.138; GCF_015356755.1, s__Nonlabens antarcticus, 95.0, 76.38, 0.163	47.56	11	N/A	N/A
-23	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Pseudomonas;s__Pseudomonas aeruginosa	GCF_001457615.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Pseudomonas;s__Pseudomonas aeruginosa	100.0	1.0	GCF_001457615.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Pseudomonas;s__Pseudomonas aeruginosa	100.0	1.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Pseudomonadales;f__Pseudomonadaceae;g__Pseudomonas;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_000017205.1, s__Pseudomonas aeruginosa_A, 95.0, 94.08, 0.898; GCF_900187975.1, s__Pseudomonas delhiensis, 95.078, 84.72, 0.657; GCF_900103845.1, s__Pseudomonas jinjuensis, 95.0, 84.68, 0.586; GCF_900112375.1, s__Pseudomonas citronellolis, 95.078, 84.65, 0.657; GCF_017589465.1, s__Pseudomonas sp017589465, 95.0, 84.16, 0.606; GCF_000349845.1, s__Pseudomonas sp000349845, 95.0, 83.98, 0.654; GCF_017491605.1, s__Pseudomonas sp017491605, 95.0, 83.93, 0.609; GCF_014204515.1, s__Pseudomonas nitritireducens_A, 95.0, 83.89, 0.64; GCA_002452115.1, s__Pseudomonas nitroreducens_B, 95.0, 83.87, 0.623; GCF_000689415.1, s__Pseudomonas knackmussii, 95.0, 83.83, 0.579; GCF_900099785.1, s__Pseudomonas panipatensis, 95.0, 83.79, 0.609; GCF_000955805.1, s__Pseudomonas sp000955805, 95.0, 83.72, 0.626; GCF_008807415.1, s__Pseudomonas sp002079985, 95.0, 83.68, 0.631; GCF_009189165.1, s__Pseudomonas sp009189165, 95.0, 83.63, 0.584; GCF_002091755.1, s__Pseudomonas nitroreducens, 95.0, 83.55, 0.618; GCA_002796985.1, s__Pseudomonas sp002796985, 95.0, 83.47, 0.604; GCF_014852585.1, s__Pseudomonas sp014852585, 95.0, 83.39, 0.608; GCF_000313755.1, s__Pseudomonas nitroreducens_A, 95.0, 83.37, 0.611; GCF_016919445.1, s__Pseudomonas sp016919445, 95.0, 83.35, 0.614; GCF_005877905.1, s__Pseudomonas nicosulfuronedens, 95.0, 83.35, 0.613	90.35	11	N/A	N/A
-24	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Paracoccus;s__Paracoccus denitrificans	GCF_900100045.1	95.0	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Paracoccus;s__Paracoccus denitrificans	100.0	0.85	GCF_900100045.1	95.0	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Paracoccus;s__Paracoccus denitrificans	100.0	0.85	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Paracoccus;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_001447385.1, s__Paracoccus sp001447385, 95.0, 91.66, 0.582; GCF_008824185.1, s__Paracoccus pantotrophus, 95.0, 91.28, 0.634; GCF_000518925.1, s__Paracoccus sp000518925, 95.0, 90.94, 0.62; GCF_000763885.1, s__Paracoccus versutus, 95.0, 90.85, 0.57; GCF_016446475.1, s__Paracoccus binzhouensis, 95.0, 88.9, 0.547; GCF_900156255.1, s__Paracoccus thiocyanatus, 95.0, 88.81, 0.661; GCF_016919705.1, s__Paracoccus sp002359815, 95.0, 87.13, 0.614; GCF_001546115.1, s__Paracoccus aminovorans_B, 95.0, 86.89, 0.534; GCF_900005615.1, s__Paracoccus aminovorans, 95.0, 86.71, 0.557; GCF_000622145.1, s__Paracoccus yeei, 96.0533, 84.29, 0.492; GCF_009301415.1, s__Paracoccus kondratievae, 95.0, 84.29, 0.567; GCF_003285265.1, s__Paracoccus mutanolyticus, 96.0533, 84.23, 0.54; GCF_003337565.1, s__Paracoccus lutimaris, 95.0, 84.16, 0.5; GCF_000763905.1, s__Paracoccus halophilus, 95.0, 84.01, 0.499; GCA_018056045.1, s__Paracoccus sp018056045, 95.0, 83.99, 0.546; GCF_009711185.1, s__Paracoccus limosus, 95.0, 83.56, 0.528; GCF_009696685.1, s__Paracoccus sp009696685, 95.0, 83.34, 0.592; GCF_003709565.1, s__Paracoccus siganidrum, 95.0, 83.3, 0.476; GCF_009711205.1, s__Paracoccus litorisediminis, 95.0, 82.54, 0.387; GCF_009711265.1, s__Paracoccus sp009711265, 95.0, 82.45, 0.476; GCF_004522175.1, s__Paracoccus ravus, 95.0, 82.05, 0.419; GCF_900142875.1, s__Paracoccus solventivorans, 95.0, 81.92, 0.487; GCF_018860165.1, s__Paracoccus sp018860165, 95.0, 81.79, 0.441; GCF_007830335.1, s__Paracoccus sulfuroxidans, 95.0, 81.77, 0.452; GCF_900182695.1, s__Paracoccus laeviglucosivorans, 95.0, 81.62, 0.457; GCF_900631945.1, s__Paracoccus haematequi, 95.0, 81.4, 0.457; GCF_017356265.1, s__Paracoccus fontiphilus, 95.0, 81.21, 0.448; GCF_000763805.1, s__Paracoccus sphaerophysae, 95.0, 81.21, 0.486; GCF_017315735.1, s__Paracoccus sp017315735, 95.0, 81.15, 0.457; GCF_900110285.1, s__Paracoccus alcaliphilus, 95.0, 81.14, 0.422; GCF_009711225.1, s__Paracoccus aestuariivivens, 95.0, 81.1, 0.383; GCF_900108405.1, s__Paracoccus alkenifer, 95.0, 81.07, 0.499; GCF_009708075.1, s__Paracoccus lichenicola, 95.0, 81.07, 0.444; GCF_014642735.1, s__Paracoccus acridae, 95.0, 80.96, 0.429; GCF_003594815.1, s__Paracoccus aestuarii, 95.0, 80.95, 0.461; GCF_002287065.1, s__Paracoccus salipaludis, 95.0, 80.84, 0.451; GCF_900102885.1, s__Paracoccus chinensis, 95.0, 80.73, 0.442; GCF_004683865.2, s__Paracoccus liaowanqingii, 95.0, 80.72, 0.332; GCF_014656455.1, s__Paracoccus aerius, 95.0, 80.7, 0.405; GCF_002847445.1, s__Paracoccus zhejiangensis, 95.0, 80.7, 0.402; GCF_005048225.1, s__Paracoccus gahaiensis, 95.0, 80.69, 0.401; GCF_019061185.1, s__Paracoccus sp019061185, 95.0, 80.68, 0.461; GCF_004522155.1, s__Paracoccus luteus, 95.0, 80.66, 0.494; GCF_016617715.1, s__Paracoccus sp014164625, 95.0, 80.62, 0.431; GCF_003286075.1, s__Paracoccus endophyticus, 95.0, 80.58, 0.488; GCF_900106665.1, s__Paracoccus sanguinis, 95.0, 80.52, 0.462; GCF_000420145.1, s__Paracoccus zeaxanthinifaciens, 95.0, 80.43, 0.469; GCF_900102505.1, s__Paracoccus tibetensis, 95.0, 80.39, 0.408; GCF_006151785.1, s__Paracoccus marcusii, 95.0, 80.38, 0.404; GCF_900188295.1, s__Paracoccus sediminis, 95.0, 80.37, 0.423; GCF_003007735.2, s__Paracoccus marinus_A, 95.0, 80.34, 0.35; GCF_005048265.1, s__Paracoccus hibiscisoli, 95.0, 80.26, 0.425; GCF_002865605.1, s__Paracoccus jeotgali, 95.0, 80.23, 0.449; GCA_002294185.1, s__Paracoccus sp002294185, 95.0, 80.16, 0.432; GCF_013868135.1, s__Paracoccus sp013868135, 95.0, 80.14, 0.412; GCF_002105555.1, s__Paracoccus contaminans, 95.0, 80.12, 0.474; GCF_000444995.1, s__Paracoccus aminophilus, 95.0, 80.1, 0.334; GCF_004310345.1, s__Paracoccus subflavus, 95.0, 80.08, 0.465; GCF_004923205.2, s__Paracoccus aeridis, 95.0, 80.04, 0.421; GCF_000787695.1, s__Paracoccus sp000787695, 95.0, 80.03, 0.366; GCF_007096355.1, s__Paracoccus sp007096355, 95.0, 79.99, 0.371; GCF_007018965.1, s__Paracoccus marinus, 95.0, 79.94, 0.448; GCF_011308835.1, s__Paracoccus xiamenensis, 95.0, 79.84, 0.416; GCF_016629665.1, s__Paracoccus caeni, 95.0, 79.83, 0.368; GCF_018860625.1, s__Paracoccus sp018860625, 95.0, 79.83, 0.403; GCA_003255745.1, s__Paracoccus saliphilus_A, 95.0, 79.82, 0.388; GCF_003697785.1, s__Paracoccus alkanivorans, 95.0, 79.77, 0.339; GCF_003056335.1, s__Paracoccus indicus, 95.0, 79.77, 0.412; GCF_009674885.1, s__Paracoccus sp009674885, 95.0, 79.76, 0.378; GCF_017744015.1, s__Paracoccus sp002732665, 95.0, 79.74, 0.365; GCF_003259195.1, s__Paracoccus sediminilitoris, 95.0, 79.7, 0.398; GCA_900156835.1, s__Paracoccus saliphilus, 95.0, 79.65, 0.301; GCF_900101865.1, s__Paracoccus isoporae, 95.0, 79.64, 0.403; GCF_900111675.1, s__Paracoccus homiensis, 95.0, 79.63, 0.369; GCA_016869875.1, s__Paracoccus sp016869875, 95.0, 79.53, 0.311; GCF_004335005.1, s__Paracoccus sp004335005, 95.0, 79.5, 0.361; GCF_003324675.1, s__Paracoccus suum, 95.0, 79.1, 0.398; GCF_007993065.1, s__Paracoccus aurantiacus, 95.0, 78.95, 0.298; GCA_005768755.1, s__Paracoccus denitrificans_B, 95.0, 78.88, 0.289; GCF_002847305.1, s__Paracoccus sp002847305, 95.0, 78.88, 0.311; GCF_900199195.1, s__Paracoccus seriniphilus, 95.0, 78.66, 0.294; GCF_014490725.1, s__Paracoccus amoyensis, 95.0, 78.59, 0.301; GCA_003240735.1, s__Paracoccus denitrificans_A, 95.0, 78.52, 0.338; GCF_003591515.1, s__Paracoccus sp003591515, 95.0, 78.33, 0.268; GCF_003590715.1, s__Paracoccus sp003590715, 95.0, 77.93, 0.247	65.41	11	N/A	N/A
-25	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Flavisolibacter;s__	N/A	N/A	N/A	N/A	N/A	GCF_900129295.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Flavisolibacter;s__Flavisolibacter ginsengisoli	84.4	0.777	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Flavisolibacter;s__	taxonomic classification defined by topology and ANI	classification based on placement in class-level tree	GCA_002050435.1, s__Flavisolibacter sp002050435, 95.0, 77.03, 0.153; GCA_017745135.1, s__Flavisolibacter sp017745135, 95.0, 76.9, 0.111; GCF_003628535.1, s__Flavisolibacter nicotianae, 95.0, 76.85, 0.074; GCA_013327885.1, s__Flavisolibacter sp013327885, 95.0, 76.81, 0.084; GCA_014163555.1, s__Flavisolibacter sp014163555, 95.0, 76.57, 0.096; GCF_007970805.1, s__Flavisolibacter ginsenosidimutans, 95.0, 76.56, 0.057	98.29	11	0.98734	Genome not assigned to closest species as it falls outside its pre-defined ANI radius
-26	d__Bacteria;p__Firmicutes_D;c__Proteinivoracia;o__Proteinivoracales;f__Proteinivoraceae;g__Anaerobranca;s__Anaerobranca californiensis	GCF_900142275.1	95.0	d__Bacteria;p__Firmicutes_D;c__Proteinivoracia;o__Proteinivoracales;f__Proteinivoraceae;g__Anaerobranca;s__Anaerobranca californiensis	100.0	0.977	GCF_900142275.1	95.0	d__Bacteria;p__Firmicutes_D;c__Proteinivoracia;o__Proteinivoracales;f__Proteinivoraceae;g__Anaerobranca;s__Anaerobranca californiensis	100.0	0.977	d__Bacteria;p__Firmicutes_D;c__Proteinivoracia;o__Proteinivoracales;f__Proteinivoraceae;g__Anaerobranca;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_900111575.1, s__Anaerobranca gottschalkii, 95.0, 86.04, 0.802	87.59	11	N/A	N/A
-27	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	GCF_003254115.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	97.48	0.867	GCF_003254115.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	97.48	0.867	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_011362875.1, s__Hydrotalea flava_A, 95.0, 92.3, 0.83; GCA_001623405.1, s__Hydrotalea flava, 95.0, 78.35, 0.428	49.05	11	N/A	Genome has more than 13.3% of markers with multiple hits
-28	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	GCF_001423965.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	100.0	0.993	GCF_001423965.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	100.0	0.993	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_000702605.1, s__Exiguobacterium_A acetylicum, 95.0, 91.58, 0.944; GCF_001939065.1, s__Exiguobacterium_A indicum, 95.0, 91.28, 0.89; GCF_001275385.1, s__Exiguobacterium_A sp001275385, 95.0, 90.06, 0.899; GCA_902363455.1, s__Exiguobacterium_A sp902363455, 95.0, 81.7, 0.601; GCF_000620865.1, s__Exiguobacterium_A sibiricum_A, 95.0, 81.66, 0.637; GCF_014524545.1, s__Exiguobacterium_A sp004339505, 95.0, 81.61, 0.661; GCF_000702625.1, s__Exiguobacterium_A oxidotolerans, 95.0, 81.6, 0.65; GCF_018618755.1, s__Exiguobacterium_A sp018618755, 95.0, 81.59, 0.643; GCF_000019905.1, s__Exiguobacterium_A sibiricum, 95.0, 81.56, 0.64; GCF_003339585.1, s__Exiguobacterium_A sp003339585, 95.0, 81.55, 0.64; GCF_000620805.1, s__Exiguobacterium_A undae, 95.0, 81.4, 0.653; GCF_001870785.1, s__Exiguobacterium_A sp001870785, 95.0, 81.31, 0.624; GCF_000685865.1, s__Exiguobacterium_A antarcticum, 95.0, 81.27, 0.633; GCF_003344535.1, s__Exiguobacterium_A flavidum, 95.0, 79.69, 0.349	84.09	11	N/A	N/A
-29	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	GCF_001423965.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	98.66	0.951	GCF_001423965.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__Exiguobacterium_A sp001423965	98.66	0.951	d__Bacteria;p__Firmicutes;c__Bacilli;o__Exiguobacterales;f__Exiguobacteraceae;g__Exiguobacterium_A;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_000702605.1, s__Exiguobacterium_A acetylicum, 95.0, 89.97, 0.827; GCF_001939065.1, s__Exiguobacterium_A indicum, 95.0, 89.81, 0.795; GCF_001275385.1, s__Exiguobacterium_A sp001275385, 95.0, 88.32, 0.779; GCF_018618755.1, s__Exiguobacterium_A sp018618755, 95.0, 80.5, 0.481; GCF_000702625.1, s__Exiguobacterium_A oxidotolerans, 95.0, 80.47, 0.469; GCF_000620865.1, s__Exiguobacterium_A sibiricum_A, 95.0, 80.45, 0.467; GCF_000620805.1, s__Exiguobacterium_A undae, 95.0, 80.4, 0.466; GCA_902363455.1, s__Exiguobacterium_A sp902363455, 95.0, 80.39, 0.45; GCF_000685865.1, s__Exiguobacterium_A antarcticum, 95.0, 80.33, 0.451; GCF_000019905.1, s__Exiguobacterium_A sibiricum, 95.0, 80.31, 0.484; GCF_003339585.1, s__Exiguobacterium_A sp003339585, 95.0, 80.29, 0.477; GCF_014524545.1, s__Exiguobacterium_A sp004339505, 95.0, 80.22, 0.47; GCF_001870785.1, s__Exiguobacterium_A sp001870785, 95.0, 80.18, 0.481; GCF_003344535.1, s__Exiguobacterium_A flavidum, 95.0, 79.0, 0.248	73.13	11	N/A	Genome has more than 13.3% of markers with multiple hits
-3	d__Bacteria;p__Firmicutes_C;c__Negativicutes;o__Selenomonadales;f__Selenomonadaceae;g__Schwartzia;s__Schwartzia succinivorans	GCF_900129225.1	95.0	d__Bacteria;p__Firmicutes_C;c__Negativicutes;o__Selenomonadales;f__Selenomonadaceae;g__Schwartzia;s__Schwartzia succinivorans	100.0	1.0	GCF_900129225.1	95.0	d__Bacteria;p__Firmicutes_C;c__Negativicutes;o__Selenomonadales;f__Selenomonadaceae;g__Schwartzia;s__Schwartzia succinivorans	100.0	1.0	d__Bacteria;p__Firmicutes_C;c__Negativicutes;o__Selenomonadales;f__Selenomonadaceae;g__;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	N/A	16.46	11	N/A	N/A
-30	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__Pseudoduganella sp001425265	GCF_001425265.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__Pseudoduganella sp001425265	100.0	1.0	GCF_001425265.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__Pseudoduganella sp001425265	100.0	1.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Pseudoduganella;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_003053665.1, s__Pseudoduganella sp003053665, 95.0, 90.85, 0.868; GCF_001425045.1, s__Pseudoduganella sp001425045, 95.0, 90.63, 0.861; GCF_009857595.1, s__Pseudoduganella aquatica_A, 95.0, 89.77, 0.815; GCF_900116645.1, s__Pseudoduganella namucuonensis, 95.0, 85.71, 0.688; GCF_001191005.1, s__Pseudoduganella sp001191005, 95.0, 82.78, 0.593; GCF_014191875.1, s__Pseudoduganella violacea, 95.0, 82.72, 0.596; GCF_013369485.1, s__Pseudoduganella sp013369485, 95.0, 82.69, 0.586; GCA_008011715.1, s__Pseudoduganella haloabium, 95.0, 82.2, 0.58; GCF_009720835.1, s__Pseudoduganella buxea, 95.0, 82.11, 0.6; GCF_009857475.1, s__Pseudoduganella guangdongensis, 95.0, 82.09, 0.636; GCF_003028855.1, s__Pseudoduganella armeniaca, 95.0, 82.05, 0.601; GCF_009674485.1, s__Pseudoduganella sp009674485, 95.0, 81.97, 0.595; GCF_000425385.1, s__Pseudoduganella violaceinigra, 95.0, 81.81, 0.554; GCF_007830455.1, s__Pseudoduganella lurida, 95.0, 81.78, 0.586; GCF_004217275.1, s__Pseudoduganella sp004217275, 95.0, 81.75, 0.549; GCA_002454505.1, s__Pseudoduganella sp002454505, 95.0, 81.72, 0.592; GCF_009720745.1, s__Pseudoduganella eburnea, 95.0, 81.62, 0.569; GCF_001425005.1, s__Pseudoduganella sp001425005, 95.0, 81.59, 0.543; GCF_900113115.1, s__Pseudoduganella sp900113115, 95.0, 81.54, 0.555; GCF_001427305.1, s__Pseudoduganella sp001427305, 95.0, 81.37, 0.543; GCF_004322755.1, s__Pseudoduganella albidiflava, 95.0, 81.34, 0.549; GCF_014192225.1, s__Pseudoduganella umbonata, 95.0, 81.26, 0.528; GCF_009727155.1, s__Pseudoduganella dura, 95.0, 81.26, 0.541; GCF_004421005.1, s__Pseudoduganella plicata, 95.0, 81.21, 0.58; GCF_007830495.1, s__Pseudoduganella flava, 95.0, 81.1, 0.559; GCF_004209755.1, s__Pseudoduganella lutea, 95.0, 80.92, 0.516; GCF_009720865.1, s__Pseudoduganella ginsengisoli, 95.0, 80.7, 0.521	97.2	11	N/A	N/A
-31	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Lampropedia;s__Lampropedia hyalina	GCF_900129055.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Lampropedia;s__Lampropedia hyalina	100.0	1.0	GCF_900129055.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Lampropedia;s__Lampropedia hyalina	100.0	1.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Burkholderiales;f__Burkholderiaceae;g__Lampropedia;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_004217315.1, s__Lampropedia populi, 95.0, 79.06, 0.425; GCA_002285265.1, s__Lampropedia sp002285265, 95.0, 79.05, 0.389; GCA_002285285.1, s__Lampropedia sp002285285, 95.0, 78.85, 0.367; GCA_003703475.1, s__Lampropedia sp003703475, 95.0, 78.75, 0.327; GCF_001005215.1, s__Lampropedia cohaerens, 95.0, 78.15, 0.303; GCF_004803635.1, s__Lampropedia aestuarii, 95.0, 77.37, 0.192; GCF_004833285.1, s__Lampropedia puyangensis, 95.0, 76.97, 0.131	97.26	11	N/A	N/A
-32	d__Bacteria;p__Actinobacteriota;c__Actinomycetia;o__Actinomycetales;f__Dermatophilaceae;g__Phycicoccus;s__Phycicoccus sp001428065	GCF_001428065.1	95.0	d__Bacteria;p__Actinobacteriota;c__Actinomycetia;o__Actinomycetales;f__Dermatophilaceae;g__Phycicoccus;s__Phycicoccus sp001428065	99.99	0.997	GCF_001428065.1	95.0	d__Bacteria;p__Actinobacteriota;c__Actinomycetia;o__Actinomycetales;f__Dermatophilaceae;g__Phycicoccus;s__Phycicoccus sp001428065	99.99	0.997	d__Bacteria;p__Actinobacteriota;c__Actinomycetia;o__Actinomycetales;f__Dermatophilaceae;g__Phycicoccus;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_002846495.1, s__Phycicoccus duodecadis, 95.0, 92.25, 0.859; GCF_011383005.1, s__Phycicoccus sp011383005, 95.0, 84.56, 0.741; GCF_016887965.1, s__Phycicoccus sp016887965, 95.0, 84.46, 0.714; GCF_000720925.1, s__Phycicoccus jejuensis, 95.0, 84.36, 0.722; GCF_013201035.1, s__Phycicoccus sp013201035, 95.0, 84.23, 0.736; GCA_014763705.1, s__Phycicoccus sp014763705, 95.0, 84.07, 0.661; GCF_004025965.2, s__Phycicoccus flavus, 95.0, 83.51, 0.697; GCF_011326735.1, s__Phycicoccus endophyticus, 95.0, 82.86, 0.667; GCF_016888005.1, s__Phycicoccus sp016888005, 95.0, 82.78, 0.656; GCF_018139485.1, s__Phycicoccus sp018139485, 95.0, 82.55, 0.623	96.03	11	N/A	N/A
-33	Unclassified Bacteria	N/A	N/A	N/A	N/A	N/A	N/A	N/A	N/A	N/A	N/A	N/A	N/A	N/A	N/A	N/A	N/A	N/A	Insufficient number of amino acids in MSA (6.6%)
-34	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Lachnospirales;f__Lachnospiraceae;g__Anaerosporobacter;s__Anaerosporobacter mobilis	GCF_900142955.1	95.0	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Lachnospirales;f__Lachnospiraceae;g__Anaerosporobacter;s__Anaerosporobacter mobilis	100.0	0.997	GCF_900142955.1	95.0	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Lachnospirales;f__Lachnospiraceae;g__Anaerosporobacter;s__Anaerosporobacter mobilis	100.0	0.997	d__Bacteria;p__Firmicutes_A;c__Clostridia;o__Lachnospirales;f__Lachnospiraceae;g__Anaerosporobacter;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_018372435.1, s__Anaerosporobacter sp018372435, 95.0, 94.7, 0.913; GCF_012070565.1, s__Anaerosporobacter sp012070565, 95.0, 79.12, 0.355	54.65	11	N/A	Genome has more than 11.7% of markers with multiple hits
-35	d__Bacteria;p__Firmicutes_C;c__Negativicutes;o__Selenomonadales;f__Selenomonadaceae;g__Schwartzia;s__Schwartzia succinivorans	GCF_900129225.1	95.0	d__Bacteria;p__Firmicutes_C;c__Negativicutes;o__Selenomonadales;f__Selenomonadaceae;g__Schwartzia;s__Schwartzia succinivorans	100.0	1.0	GCF_900129225.1	95.0	d__Bacteria;p__Firmicutes_C;c__Negativicutes;o__Selenomonadales;f__Selenomonadaceae;g__Schwartzia;s__Schwartzia succinivorans	100.0	1.0	d__Bacteria;p__Firmicutes_C;c__Negativicutes;o__Selenomonadales;f__Selenomonadaceae;g__;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	N/A	81.67	11	N/A	N/A
-36	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	GCF_003254115.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	97.73	0.846	GCF_003254115.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	97.73	0.846	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_011362875.1, s__Hydrotalea flava_A, 95.0, 92.52, 0.741; GCA_001623405.1, s__Hydrotalea flava, 95.0, 78.56, 0.446	38.4	11	N/A	Genome has more than 12.5% of markers with multiple hits
-37	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	GCF_003254115.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	99.13	0.933	GCF_003254115.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	99.13	0.933	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_011362875.1, s__Hydrotalea flava_A, 95.0, 93.75, 0.894; GCA_001623405.1, s__Hydrotalea flava, 95.0, 78.83, 0.519	68.78	11	N/A	Genome has more than 15.0% of markers with multiple hits
-38	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Paracoccus;s__Paracoccus denitrificans	GCF_900100045.1	95.0	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Paracoccus;s__Paracoccus denitrificans	99.47	0.878	GCF_900100045.1	95.0	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Paracoccus;s__Paracoccus denitrificans	99.47	0.878	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Paracoccus;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_001447385.1, s__Paracoccus sp001447385, 95.0, 92.4, 0.686; GCF_008824185.1, s__Paracoccus pantotrophus, 95.0, 91.75, 0.773; GCF_000518925.1, s__Paracoccus sp000518925, 95.0, 91.5, 0.76; GCF_000763885.1, s__Paracoccus versutus, 95.0, 91.37, 0.686; GCF_016446475.1, s__Paracoccus binzhouensis, 95.0, 89.81, 0.692; GCF_900156255.1, s__Paracoccus thiocyanatus, 95.0, 89.57, 0.812; GCF_016919705.1, s__Paracoccus sp002359815, 95.0, 87.44, 0.75; GCF_900005615.1, s__Paracoccus aminovorans, 95.0, 87.41, 0.693; GCF_001546115.1, s__Paracoccus aminovorans_B, 95.0, 87.27, 0.674; GCF_000622145.1, s__Paracoccus yeei, 96.0533, 84.9, 0.628; GCF_003337565.1, s__Paracoccus lutimaris, 95.0, 84.81, 0.638; GCF_003285265.1, s__Paracoccus mutanolyticus, 96.0533, 84.8, 0.689; GCF_009301415.1, s__Paracoccus kondratievae, 95.0, 84.68, 0.698; GCA_018056045.1, s__Paracoccus sp018056045, 95.0, 84.65, 0.696; GCF_000763905.1, s__Paracoccus halophilus, 95.0, 84.44, 0.631; GCF_009711185.1, s__Paracoccus limosus, 95.0, 84.27, 0.672; GCF_009696685.1, s__Paracoccus sp009696685, 95.0, 83.89, 0.751; GCF_003709565.1, s__Paracoccus siganidrum, 95.0, 83.61, 0.588; GCF_009711265.1, s__Paracoccus sp009711265, 95.0, 83.19, 0.594; GCF_009711205.1, s__Paracoccus litorisediminis, 95.0, 83.06, 0.496; GCF_004522175.1, s__Paracoccus ravus, 95.0, 82.44, 0.549; GCF_007830335.1, s__Paracoccus sulfuroxidans, 95.0, 82.23, 0.59; GCF_900182695.1, s__Paracoccus laeviglucosivorans, 95.0, 82.18, 0.589; GCF_900142875.1, s__Paracoccus solventivorans, 95.0, 82.17, 0.628; GCF_018860165.1, s__Paracoccus sp018860165, 95.0, 82.15, 0.554; GCF_900631945.1, s__Paracoccus haematequi, 95.0, 81.7, 0.572; GCF_000763805.1, s__Paracoccus sphaerophysae, 95.0, 81.61, 0.647; GCF_009708075.1, s__Paracoccus lichenicola, 95.0, 81.58, 0.568; GCF_017356265.1, s__Paracoccus fontiphilus, 95.0, 81.57, 0.555; GCF_017315735.1, s__Paracoccus sp017315735, 95.0, 81.56, 0.582; GCF_014642735.1, s__Paracoccus acridae, 95.0, 81.46, 0.531; GCF_009711225.1, s__Paracoccus aestuariivivens, 95.0, 81.45, 0.501; GCF_900110285.1, s__Paracoccus alcaliphilus, 95.0, 81.35, 0.518; GCF_900108405.1, s__Paracoccus alkenifer, 95.0, 81.32, 0.632; GCF_002847445.1, s__Paracoccus zhejiangensis, 95.0, 81.31, 0.521; GCF_014656455.1, s__Paracoccus aerius, 95.0, 81.25, 0.5; GCF_002287065.1, s__Paracoccus salipaludis, 95.0, 81.24, 0.59; GCF_003286075.1, s__Paracoccus endophyticus, 95.0, 81.19, 0.633; GCF_004522155.1, s__Paracoccus luteus, 95.0, 81.14, 0.64; GCF_019061185.1, s__Paracoccus sp019061185, 95.0, 81.1, 0.59; GCF_003594815.1, s__Paracoccus aestuarii, 95.0, 81.02, 0.562; GCF_005048225.1, s__Paracoccus gahaiensis, 95.0, 80.97, 0.51; GCF_900102885.1, s__Paracoccus chinensis, 95.0, 80.96, 0.568; GCF_016617715.1, s__Paracoccus sp014164625, 95.0, 80.89, 0.535; GCF_004683865.2, s__Paracoccus liaowanqingii, 95.0, 80.86, 0.427; GCF_900106665.1, s__Paracoccus sanguinis, 95.0, 80.78, 0.592; GCF_002865605.1, s__Paracoccus jeotgali, 95.0, 80.75, 0.541; GCF_900102505.1, s__Paracoccus tibetensis, 95.0, 80.74, 0.513; GCF_900188295.1, s__Paracoccus sediminis, 95.0, 80.67, 0.55; GCF_013868135.1, s__Paracoccus sp013868135, 95.0, 80.63, 0.53; GCF_000420145.1, s__Paracoccus zeaxanthinifaciens, 95.0, 80.6, 0.599; GCF_004310345.1, s__Paracoccus subflavus, 95.0, 80.57, 0.568; GCF_003007735.2, s__Paracoccus marinus_A, 95.0, 80.54, 0.46; GCF_005048265.1, s__Paracoccus hibiscisoli, 95.0, 80.54, 0.525; GCF_006151785.1, s__Paracoccus marcusii, 95.0, 80.51, 0.535; GCF_002105555.1, s__Paracoccus contaminans, 95.0, 80.5, 0.591; GCA_002294185.1, s__Paracoccus sp002294185, 95.0, 80.4, 0.553; GCF_000787695.1, s__Paracoccus sp000787695, 95.0, 80.39, 0.477; GCF_004923205.2, s__Paracoccus aeridis, 95.0, 80.31, 0.542; GCF_018860625.1, s__Paracoccus sp018860625, 95.0, 80.27, 0.506; GCF_007096355.1, s__Paracoccus sp007096355, 95.0, 80.26, 0.484; GCF_000444995.1, s__Paracoccus aminophilus, 95.0, 80.24, 0.428; GCF_007018965.1, s__Paracoccus marinus, 95.0, 80.24, 0.573; GCF_003056335.1, s__Paracoccus indicus, 95.0, 80.18, 0.534; GCF_011308835.1, s__Paracoccus xiamenensis, 95.0, 80.14, 0.509; GCF_900111675.1, s__Paracoccus homiensis, 95.0, 80.1, 0.465; GCF_017744015.1, s__Paracoccus sp002732665, 95.0, 80.09, 0.47; GCF_009674885.1, s__Paracoccus sp009674885, 95.0, 80.06, 0.484; GCF_900101865.1, s__Paracoccus isoporae, 95.0, 80.06, 0.506; GCA_003255745.1, s__Paracoccus saliphilus_A, 95.0, 80.05, 0.49; GCF_003697785.1, s__Paracoccus alkanivorans, 95.0, 80.0, 0.421; GCF_016629665.1, s__Paracoccus caeni, 95.0, 79.96, 0.482; GCF_003259195.1, s__Paracoccus sediminilitoris, 95.0, 79.92, 0.502; GCA_016869875.1, s__Paracoccus sp016869875, 95.0, 79.86, 0.406; GCF_004335005.1, s__Paracoccus sp004335005, 95.0, 79.84, 0.456; GCA_900156835.1, s__Paracoccus saliphilus, 95.0, 79.58, 0.378; GCF_003324675.1, s__Paracoccus suum, 95.0, 79.37, 0.5; GCF_002847305.1, s__Paracoccus sp002847305, 95.0, 79.07, 0.407; GCA_005768755.1, s__Paracoccus denitrificans_B, 95.0, 78.95, 0.364; GCF_900199195.1, s__Paracoccus seriniphilus, 95.0, 78.94, 0.373; GCF_007993065.1, s__Paracoccus aurantiacus, 95.0, 78.87, 0.377; GCF_014490725.1, s__Paracoccus amoyensis, 95.0, 78.85, 0.391; GCA_003240735.1, s__Paracoccus denitrificans_A, 95.0, 78.69, 0.439; GCF_003591515.1, s__Paracoccus sp003591515, 95.0, 78.33, 0.332; GCF_003590715.1, s__Paracoccus sp003590715, 95.0, 78.23, 0.32	65.59	11	N/A	Genome has more than 33.3% of markers with multiple hits
-4	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	GCF_003254115.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	99.99	0.99	GCF_003254115.1	95.0	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__Hydrotalea sandarakina	99.99	0.99	d__Bacteria;p__Bacteroidota;c__Bacteroidia;o__Chitinophagales;f__Chitinophagaceae;g__Hydrotalea;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_011362875.1, s__Hydrotalea flava_A, 95.0, 94.51, 0.932; GCA_001623405.1, s__Hydrotalea flava, 95.0, 79.19, 0.591	26.13	11	N/A	Genome has more than 73.3% of markers with multiple hits
-5	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Meinhardsimonia;s__Meinhardsimonia xiamenensis	GCF_900102905.1	95.0	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Meinhardsimonia;s__Meinhardsimonia xiamenensis	100.0	0.999	GCF_900102905.1	95.0	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__Meinhardsimonia;s__Meinhardsimonia xiamenensis	100.0	0.999	d__Bacteria;p__Proteobacteria;c__Alphaproteobacteria;o__Rhodobacterales;f__Rhodobacteraceae;g__;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	N/A	91.46	11	N/A	N/A
-6	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Xanthomonadales;f__Xanthomonadaceae;g__Lysobacter;s__	N/A	N/A	N/A	N/A	N/A	GCF_014489475.1	95.0	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Xanthomonadales;f__Xanthomonadaceae;g__Lysobacter;s__Lysobacter solisilvae	87.17	0.796	d__Bacteria;p__Proteobacteria;c__Gammaproteobacteria;o__Xanthomonadales;f__Xanthomonadaceae;g__Lysobacter;s__	taxonomic classification defined by topology and ANI	classification based on placement in class-level tree	GCF_001427225.1, s__Lysobacter sp001427225, 95.0, 84.08, 0.726; GCF_016613535.2, s__Lysobacter solisilvae_A, 95.0, 82.93, 0.69; GCF_003814555.1, s__Lysobacter tengchongensis, 95.0, 82.62, 0.619; GCF_009765165.1, s__Lysobacter panacisoli, 95.0, 82.36, 0.64; GCF_003586305.1, s__Lysobacter tabacisoli, 95.0, 82.33, 0.649; GCF_016613475.2, s__Lysobacter arenosi, 95.0, 82.23, 0.643; GCF_009765215.1, s__Lysobacter prati, 95.0, 82.11, 0.618; GCF_017308985.1, s__Lysobacter sp017308985, 95.0, 82.08, 0.634; GCF_003382365.1, s__Lysobacter silvisoli, 95.0, 82.05, 0.664; GCF_900114355.1, s__Lysobacter sp900114355, 95.0, 82.04, 0.665; GCF_015453285.1, s__Lysobacter niastensis, 95.0, 82.04, 0.658; GCF_016735495.2, s__Lysobacter sp016735495, 95.0, 82.01, 0.647; GCA_013361435.1, s__Lysobacter sp013361435, 95.0, 81.93, 0.591; GCF_000768335.1, s__Lysobacter arseniciresistens, 95.0, 81.92, 0.555; GCF_003382285.1, s__Lysobacter soli, 95.0, 81.87, 0.642; GCF_001428685.1, s__Lysobacter sp001428685, 95.0, 81.87, 0.682; GCF_001429785.1, s__Lysobacter sp001429785, 95.0, 81.8, 0.669; GCF_900107375.1, s__Lysobacter sp900107375, 95.0, 81.79, 0.691; GCF_007923255.1, s__Lysobacter thermophilus, 95.0, 81.78, 0.578; GCF_001442515.1, s__Lysobacter enzymogenes_B, 95.0, 81.68, 0.712; GCF_017355525.1, s__Lysobacter enzymogenes_C, 95.0, 81.68, 0.672; GCF_000336385.2, s__Lysobacter antibioticus_A, 95.0, 81.66, 0.632; GCA_005503055.1, s__Lysobacter sp005503055, 95.0, 81.61, 0.628; GCF_000768355.1, s__Lysobacter daejeonensis, 95.0, 81.58, 0.548; GCF_018847975.1, s__Lysobacter sp018847975, 95.0, 81.55, 0.673; GCF_007830115.1, s__Lysobacter ruishenii, 95.0, 81.54, 0.556; GCF_900106525.1, s__Lysobacter enzymogenes, 95.0, 81.48, 0.687; GCF_001442535.1, s__Lysobacter antibioticus, 95.0, 81.4, 0.632; GCF_000731095.1, s__Lysobacter antibioticus_B, 95.0, 81.36, 0.618; GCF_003719825.1, s__Lysobacter psychrotolerans, 95.0, 81.34, 0.604; GCF_006546735.2, s__Lysobacter maris, 95.0, 81.34, 0.541; GCF_014651995.1, s__Lysobacter xinjiangensis, 95.0, 81.28, 0.546; GCF_014779555.1, s__Lysobacter capsici, 95.0, 81.21, 0.638; GCF_907164845.1, s__Lysobacter sp907164845, 95.0, 81.17, 0.576; GCF_001442805.1, s__Lysobacter gummosus, 95.0, 81.17, 0.642; GCF_018612875.1, s__Lysobacter sp018612875, 95.0, 81.13, 0.619; GCF_018732085.1, s__Lysobacter capsici_A, 95.0, 81.1, 0.67; GCA_001830245.1, s__Lysobacter sp001830245, 95.0, 81.08, 0.56; GCF_001427785.1, s__Lysobacter sp001427785, 95.0, 81.08, 0.623; GCF_014145325.1, s__Lysobacter spongiae, 95.0, 81.05, 0.553; GCF_004359965.1, s__Lysobacter segetis, 95.0, 81.01, 0.575; GCF_006546775.1, s__Lysobacter aestuarii, 95.0, 80.97, 0.546; GCF_006547045.1, s__Lysobacter alkalisoli, 95.0, 80.94, 0.566; GCF_000768345.1, s__Lysobacter concretionis, 95.0, 80.78, 0.518; GCF_014145395.1, s__Lysobacter penaei, 95.0, 80.76, 0.502; GCF_004361065.1, s__Lysobacter terrigena, 95.0, 80.55, 0.508; GCF_003367355.1, s__Lysobacter sp003367355, 95.0, 80.54, 0.516; GCF_000423325.1, s__Lysobacter defluvii, 95.0, 80.42, 0.515; GCF_000426005.1, s__Lysobacter sp000426005, 95.0, 80.4, 0.515; GCF_015209725.1, s__Lysobacter sp015209725, 95.0, 80.29, 0.481; GCF_900167055.1, s__Lysobacter spongiicola, 95.0, 80.25, 0.489; GCF_014652095.1, s__Lysobacter bugurensis, 95.0, 80.25, 0.522; GCF_008274655.1, s__Lysobacter lacus, 95.0, 80.01, 0.52; GCF_015209765.1, s__Lysobacter sp015209765, 95.0, 79.97, 0.484; GCA_004322525.1, s__Lysobacter sp004322525, 95.0, 79.81, 0.529; GCA_902805755.1, s__Lysobacter sp902805755, 95.0, 79.81, 0.544; GCF_000855665.1, s__Lysobacter sp000855665, 95.0, 79.58, 0.461	72.88	11	0.98425	Genome not assigned to closest species as it falls outside its pre-defined ANI radius
-7	d__Bacteria;p__Desulfobacterota;c__Desulfobacteria;o__Desulfobacterales;f__Desulfatibacillaceae;g__Desulfatibacillum;s__Desulfatibacillum alkenivorans	GCF_900142135.1	95.0	d__Bacteria;p__Desulfobacterota;c__Desulfobacteria;o__Desulfobacterales;f__Desulfatibacillaceae;g__Desulfatibacillum;s__Desulfatibacillum alkenivorans	100.0	1.0	GCF_900142135.1	95.0	d__Bacteria;p__Desulfobacterota;c__Desulfobacteria;o__Desulfobacterales;f__Desulfatibacillaceae;g__Desulfatibacillum;s__Desulfatibacillum alkenivorans	100.0	1.0	d__Bacteria;p__Desulfobacterota;c__Desulfobacteria;o__Desulfobacterales;f__Desulfatibacillaceae;g__Desulfatibacillum;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCF_000429905.1, s__Desulfatibacillum aliphaticivorans, 95.0, 93.06, 0.876; GCA_016342355.1, s__Desulfatibacillum sp016342355, 95.0, 79.44, 0.52	85.86	11	N/A	N/A
-8	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	GCF_003550015.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	99.22	0.892	GCF_003550015.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	99.22	0.892	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_017388605.1, s__Anaeroplasma sp017388605, 95.0, 83.89, 0.71; GCA_017449215.1, s__Anaeroplasma sp017449215, 95.0, 78.37, 0.262; GCA_017441525.1, s__Anaeroplasma sp017441525, 95.0, 78.17, 0.272; GCA_002449755.1, s__Anaeroplasma sp002449755, 95.0, 78.14, 0.275; GCA_017462645.1, s__Anaeroplasma sp017462645, 95.0, 78.0, 0.236; GCA_017524905.1, s__Anaeroplasma sp017524905, 95.0, 77.92, 0.242; GCA_016280975.1, s__Anaeroplasma sp016280975, 95.0, 77.86, 0.273; GCA_017444645.1, s__Anaeroplasma sp017444645, 95.0, 77.57, 0.26; GCA_900770055.1, s__Anaeroplasma sp900770055, 95.0, 77.54, 0.192; GCA_902783745.1, s__Anaeroplasma sp902783745, 95.0, 77.5, 0.231; GCA_016282815.1, s__Anaeroplasma sp016282815, 95.0, 77.44, 0.216; GCA_017542485.1, s__Anaeroplasma sp017542485, 95.0, 77.43, 0.189; GCA_016288855.1, s__Anaeroplasma sp016288855, 95.0, 77.42, 0.212; GCA_015059145.1, s__Anaeroplasma sp015059145, 95.0, 77.4, 0.199; GCA_900767915.1, s__Anaeroplasma sp900767915, 95.0, 77.38, 0.187; GCA_017454375.1, s__Anaeroplasma sp017454375, 95.0, 77.11, 0.128; GCA_902796895.1, s__Anaeroplasma sp902796895, 95.0, 76.99, 0.242; GCA_018715825.1, s__Anaeroplasma faecigallinarum, 95.0, 76.73, 0.118; GCA_905236965.1, s__Anaeroplasma sp905236965, 95.0, 76.07, 0.2; GCA_905236105.1, s__Anaeroplasma sp905236105, 95.0, 76.05, 0.133	57.15	11	N/A	Genome has more than 10.0% of markers with multiple hits
-9	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	GCF_003550015.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	100.0	1.0	GCF_003550015.1	95.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__Anaeroplasma bactoclasticum	100.0	1.0	d__Bacteria;p__Firmicutes;c__Bacilli;o__Acholeplasmatales;f__Anaeroplasmataceae;g__Anaeroplasma;s__	taxonomic classification defined by topology and ANI	topological placement and ANI have congruent species assignments	GCA_017388605.1, s__Anaeroplasma sp017388605, 95.0, 84.15, 0.658; GCA_002449755.1, s__Anaeroplasma sp002449755, 95.0, 78.65, 0.256; GCA_017441525.1, s__Anaeroplasma sp017441525, 95.0, 78.34, 0.265; GCA_017449215.1, s__Anaeroplasma sp017449215, 95.0, 78.33, 0.263; GCA_017524905.1, s__Anaeroplasma sp017524905, 95.0, 78.01, 0.244; GCA_017462645.1, s__Anaeroplasma sp017462645, 95.0, 78.0, 0.23; GCA_016280975.1, s__Anaeroplasma sp016280975, 95.0, 77.96, 0.23; GCA_017542485.1, s__Anaeroplasma sp017542485, 95.0, 77.74, 0.195; GCA_017444645.1, s__Anaeroplasma sp017444645, 95.0, 77.7, 0.258; GCA_900767915.1, s__Anaeroplasma sp900767915, 95.0, 77.52, 0.172; GCA_016288855.1, s__Anaeroplasma sp016288855, 95.0, 77.51, 0.196; GCA_902783745.1, s__Anaeroplasma sp902783745, 95.0, 77.5, 0.209; GCA_016282815.1, s__Anaeroplasma sp016282815, 95.0, 77.5, 0.201; GCA_900770055.1, s__Anaeroplasma sp900770055, 95.0, 77.43, 0.184; GCA_015059145.1, s__Anaeroplasma sp015059145, 95.0, 77.28, 0.183; GCA_902796895.1, s__Anaeroplasma sp902796895, 95.0, 77.2, 0.221; GCA_017454375.1, s__Anaeroplasma sp017454375, 95.0, 77.19, 0.129; GCA_018715825.1, s__Anaeroplasma faecigallinarum, 95.0, 76.79, 0.111; GCA_905236965.1, s__Anaeroplasma sp905236965, 95.0, 76.42, 0.19; GCA_905236105.1, s__Anaeroplasma sp905236105, 95.0, 76.12, 0.118	66.58	11	N/A	N/A
\ No newline at end of file
--- a/test-data/test_gtdb_to_taxdump_file.tsv	Sun Sep 08 14:37:41 2024 +0000
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,25 +0,0 @@
-ncbi_taxonomy	gtdb_taxonomy	lca_frac	target_tax_level	lineage
-s__Williamsia_A herbipolensis	unclassified	NA	NA	NA
-s__Xylella fastidiosa	s__Xylella fastidiosa	1.0	species	d__bacteria;p__pseudomonadota;c__gammaproteobacteria;o__xanthomonadales;f__xanthomonadaceae;g__xylella;s__xylella fastidiosa
-s__Paramaledivibacter caminithermalis	s__Paramaledivibacter caminithermalis	1.0	species	d__bacteria;p__bacillota_a;c__clostridia;o__peptostreptococcales;f__caminicellaceae;g__paramaledivibacter;s__paramaledivibacter caminithermalis
-s__Flavisolibacter ginsengisoli	s__Flavisolibacter ginsengisoli	1.0	species	d__bacteria;p__bacteroidota;c__bacteroidia;o__chitinophagales;f__chitinophagaceae;g__flavisolibacter;s__flavisolibacter ginsengisoli
-s__Anaeroplasma bactoclasticum	c__Bacilli	1.0	class	d__bacteria;p__bacillota;c__bacilli
-s__Pseudoduganella sp001425045	unclassified	NA	NA	NA
-s__Albidovulum denitrificans	unclassified	NA	NA	NA
-s__Tepidibacter formicigenes	s__Tepidibacter formicigenes	1.0	species	d__bacteria;p__bacillota_a;c__clostridia;o__peptostreptococcales;f__peptostreptococcaceae;g__tepidibacter;s__tepidibacter formicigenes
-s__Thermosporothrix hazakensis	unclassified	NA	NA	NA
-s__Exiguobacterium_A sp001423965	unclassified	NA	NA	NA
-s__Andreprevotia lacus	s__Andreprevotia lacus	1.0	species	d__bacteria;p__pseudomonadota;c__gammaproteobacteria;o__burkholderiales;f__chitinibacteraceae;g__andreprevotia;s__andreprevotia lacus
-s__Nonlabens dokdonensis	g__Nonlabens	1.0	genus	d__bacteria;p__bacteroidota;c__bacteroidia;o__flavobacteriales;f__flavobacteriaceae;g__nonlabens
-s__Pseudomonas aeruginosa	s__Pseudomonas aeruginosa	0.99	species	d__bacteria;p__pseudomonadota;c__gammaproteobacteria;o__pseudomonadales;f__pseudomonadaceae;g__pseudomonas;s__pseudomonas aeruginosa
-s__Paracoccus denitrificans	g__Paracoccus	1.0	genus	d__bacteria;p__pseudomonadota;c__alphaproteobacteria;o__rhodobacterales;f__rhodobacteraceae;g__paracoccus
-N/A	unclassified	NA	NA	NA
-s__Anaerobranca californiensis	s__Anaerobranca californiensis	1.0	species	d__bacteria;p__bacillota_d;c__proteinivoracia;o__proteinivoracales;f__proteinivoraceae;g__anaerobranca;s__anaerobranca californiensis
-s__Hydrotalea sandarakina	s__Hydrotalea sandarakina	1.0	species	d__bacteria;p__bacteroidota;c__bacteroidia;o__chitinophagales;f__chitinophagaceae;g__hydrotalea;s__hydrotalea sandarakina
-s__Schwartzia succinivorans	f__Selenomonadaceae	1.0	family	d__bacteria;p__bacillota_c;c__negativicutes;o__selenomonadales;f__selenomonadaceae
-s__Pseudoduganella sp001425265	unclassified	NA	NA	NA
-s__Lampropedia hyalina	s__Lampropedia hyalina	1.0	species	d__bacteria;p__pseudomonadota;c__gammaproteobacteria;o__burkholderiales;f__burkholderiaceae_b;g__lampropedia;s__lampropedia hyalina
-s__Phycicoccus sp001428065	unclassified	NA	NA	NA
-s__Anaerosporobacter mobilis	s__Anaerosporobacter mobilis	1.0	species	d__bacteria;p__bacillota_a;c__clostridia;o__lachnospirales;f__lachnospiraceae;g__anaerosporobacter;s__anaerosporobacter mobilis
-s__Meinhardsimonia xiamenensis	s__Meinhardsimonia xiamenensis	1.0	species	d__bacteria;p__pseudomonadota;c__alphaproteobacteria;o__rhodobacterales;f__rhodobacteraceae;g__meinhardsimonia;s__meinhardsimonia xiamenensis
-s__Desulfatibacillum alkenivorans	s__Desulfatibacillum alkenivorans	1.0	species	d__bacteria;p__desulfobacterota;c__desulfobacteria;o__desulfobacterales;f__desulfatibacillaceae;g__desulfatibacillum;s__desulfatibacillum alkenivorans
--- a/test-data/test_taxonkit_file_1.tsv	Sun Sep 08 14:37:41 2024 +0000
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,11 +0,0 @@
-unclassified	12908
-Xylella fastidiosa	2371
-Paramaledivibacter caminithermalis	191027
-Flavisolibacter ginsengisoli	462367
-Bacilli	91061
-unclassified	12908
-unclassified	12908
-Tepidibacter formicigenes	227138
-unclassified	12908
-unclassified	12908
-Andreprevotia lacus	1121000
--- a/test-data/test_taxonkit_file_2.tsv	Sun Sep 08 14:37:41 2024 +0000
+++ /dev/null	Thu Jan 01 00:00:00 1970 +0000
@@ -1,14 +0,0 @@
-Nonlabens	363408
-Pseudomonas aeruginosa	287
-Paracoccus	265
-Paracoccus	249411
-unclassified	12908
-Anaerobranca californiensis	182411
-Hydrotalea sandarakina	1004304
-Selenomonadaceae	1843491
-unclassified	12908
-Lampropedia hyalina	198706
-unclassified	12908
-Anaerosporobacter mobilis	264463
-Meinhardsimonia xiamenensis	990712
-Desulfatibacillum alkenivorans	259354