diff --git a/tools/phylophlan/.shed.yml b/tools/phylophlan/.shed.yml
new file mode 100644
index 0000000000..3177886007
--- /dev/null
+++ b/tools/phylophlan/.shed.yml
@@ -0,0 +1,10 @@
+name: phylophlan
+owner: bgruening
+description: Tool for high-resolution phylogenetic analysis and taxonomic classification of microbial genomes and MAGs.
+homepage_url: https://github.com/biobakery/phylophlan
+long_description: PhyloPhlAn is a comprehensive and scalable pipeline for phylogenetic profiling of microbial genomes and metagenomes. It supports accurate species- and strain-level classification, including for metagenome-assembled genomes (MAGs), and can reconstruct large-scale phylogenies using clade-specific informative markers.
+remote_repository_url: https://github.com/bgruening/galaxytools/tree/master/tools/phylophlan
+categories:
+ - Metagenomics
+ - Sequence Analysis
+ - Phylogenetics
\ No newline at end of file
diff --git a/tools/phylophlan/macros.xml b/tools/phylophlan/macros.xml
new file mode 100644
index 0000000000..8c8a67645d
--- /dev/null
+++ b/tools/phylophlan/macros.xml
@@ -0,0 +1,102 @@
+
+ 3.1.1
+ 0
+
+
+
+
+ phylophlan
+
+
+ python
+
+
+
+
+ diamond
+ blast
+ usearch
+ muscle
+ mafft
+ fasttree
+ raxml
+ iqtree
+ astral-tree
+
+
+
+
+ mash
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ PhyloPhlAn
+
+
+
+
+ 10.1038/s41467-020-16366-7
+
+
+
+
\ No newline at end of file
diff --git a/tools/phylophlan/phylophlan.xml b/tools/phylophlan/phylophlan.xml
new file mode 100644
index 0000000000..893dbe29a1
--- /dev/null
+++ b/tools/phylophlan/phylophlan.xml
@@ -0,0 +1,583 @@
+
+
+ microbial genome characterization and phylogenetic analysis
+
+
+ macros.xml
+
+
+
+
+
+
+
+ 'database/database.f${db_type}a' &&
+ #end if
+
+ phylophlan_write_config_file
+ -o config.cfg
+ -d $db_type
+ #if $trimming.trim != "None"
+ --trim trimal
+ #end if
+
+ #if $config.analysis == "supermatrix_nt"
+ --db_dna makeblastdb
+ --map_dna blastn
+ --msa mafft
+ --tree1 fasttree
+ --tree2 raxml
+ #else if $config.analysis == "supertree_nt"
+ --db_dna makeblastdb
+ --map_dna blastn
+ --msa mafft
+ --gene_tree1 fasttree
+ --gene_tree2 raxml
+ --tree1 astral
+ #else if $config.analysis == "supermatrix_aa"
+ --db_aa diamond
+ --map_dna diamond
+ --map_aa diamond
+ --msa mafft
+ --tree1 fasttree
+ --tree2 raxml
+ #else if $config.analysis == "supertree_aa"
+ --db_aa diamond
+ --map_dna diamond
+ --map_aa diamond
+ --msa mafft
+ --gene_tree1 fasttree
+ --gene_tree2 raxml
+ --tree1 astral
+ #else
+ #if $config.db.type == "n"
+ --db_dna $config.db.db_dna
+ --map_dna $config.db.map_dna
+ #else if $config.db.type == "a"
+ --db_aa $config.db.db_aa
+ --map_aa $config.db.map_aa
+ #if $config.db.map_dna
+ --map_dna $config.db.map_dna
+ #end if
+ #end if
+ --msa $config.msa
+
+ #if $config.analysis == "custom_supertree"
+ --gene_tree1 $config.gene_tree.gene_tree1
+ #if $config.gene_tree.gene_tree2
+ --gene_tree2 $config.gene_tree.gene_tree2
+ #end if
+ --tree1 $config.tree.tree1
+ #else
+ --tree1 $config.tree.tree1
+ #if $config.tree.tree2
+ --tree2 $config.tree.tree2
+ #end if
+ #end if
+ #end if
+
+ $force_nucleotides
+ --overwrite &&
+
+ ## Rewrite the astral program_name entry in config.cfg to the absolute path of the astral executable found on PATH
+ sed -i "\%program_name.*astral%s%=.*%= `which astral`%" config.cfg &&
+
+ #if "supertree" in $config.analysis.value
+ #if $config.maas.source == "history"
+ #set $maas_file = $config.maas.models
+ #else
+ #set $maas_file = $__tool_directory__ + '/test-data/phylophlan.tsv'
+ #end if
+ python '$__tool_directory__/validate_mapping_file.py' '$maas_file' &&
+ #end if
+
+ phylophlan
+ -i input
+ -o output
+ -d database
+ -f config.cfg
+
+ --diversity $diversity
+ $accuracy
+
+ #if "supertree" in $config.analysis.value
+ --maas '$maas_file'
+ #end if
+
+ --min_num_proteins $quality.min_num_proteins
+ --min_len_protein $quality.min_len_protein
+ #if $quality.min_num_markers
+ --min_num_markers $quality.min_num_markers
+ #end if
+ #if $quality.min_num_entries
+ --min_num_entries $quality.min_num_entries
+ #end if
+
+ $quality.remove_only_gaps_entries
+ #if not $quality.remove_only_gaps_entries
+ $quality.remove_fragmentary_entries
+ #if $quality.fragmentary_threshold
+ --fragmentary_threshold $quality.fragmentary_threshold
+ #end if
+ #end if
+
+ #if $trimming.trim != "None"
+ --trim $trimming.trim
+ #if $trimming.trim.value in {'gap_perc', 'greedy'}
+ --gap_perc_threshold $trimming.gap_perc_threshold
+ #end if
+ #if $trimming.trim.value in {'not_variant', 'greedy'}
+ --not_variant_threshold $trimming.not_variant_threshold
+ #end if
+ #end if
+
+ #if $sample.subsample != "default"
+ --subsample $sample.subsample
+ #end if
+ #if $sample.scoring_function
+ --scoring_function $sample.scoring_function
+ #end if
+ #if $sample.submat
+ --submat $sample.submat
+ #end if
+
+ --unknown_fraction $quality.unknown_fraction
+ $quality.convert_N2gap
+ $force_nucleotides
+ $sort
+ $mrate.mutation_rates
+
+ -t $db_type
+ --nproc \${GALAXY_SLOTS:-4}
+ --verbose
+ ]]>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ mrate['mutation_rates'] and not mrate['discard_individual_tables']
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/tools/phylophlan/phylophlan_assign_sgbs.xml b/tools/phylophlan/phylophlan_assign_sgbs.xml
new file mode 100644
index 0000000000..7adad0b9db
--- /dev/null
+++ b/tools/phylophlan/phylophlan_assign_sgbs.xml
@@ -0,0 +1,125 @@
+
+
+ to metagenome-assembled genomes.
+
+
+ macros.xml
+
+
+
+ '${database_name}.md5' &&
+ cd .. &&
+ #end if
+ #end if
+
+ phylophlan_assign_sgbs
+ -i input
+ -o output
+ --database_folder database
+ #if $analysis.type == "closest"
+ -d '$database_name'
+ #if $analysis.assign_all
+ -n all
+ #else
+ -n $analysis.n
+ #end if
+ #else if $analysis.type == "taxonomy"
+ -d '$database_name'
+ --add_ggb_fgb
+ #else if $analysis.type == "matrix"
+ --only_input
+ #end if
+
+ --overwrite
+ --nproc \${GALAXY_SLOTS:-4}
+ --verbose
+ ]]>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/tools/phylophlan/phylophlan_draw_metagenomic.xml b/tools/phylophlan/phylophlan_draw_metagenomic.xml
new file mode 100644
index 0000000000..fd40947d05
--- /dev/null
+++ b/tools/phylophlan/phylophlan_draw_metagenomic.xml
@@ -0,0 +1,55 @@
+
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
\ No newline at end of file
diff --git a/tools/phylophlan/test-data/CM_ethiopia__CM_A06_M0_18__bin.34.fna b/tools/phylophlan/test-data/CM_ethiopia__CM_A06_M0_18__bin.34.fna
new file mode 100644
index 0000000000..043c31360c
--- /dev/null
+++ b/tools/phylophlan/test-data/CM_ethiopia__CM_A06_M0_18__bin.34.fna
@@ -0,0 +1,99 @@
+>NODE_56_length_69222_cov_8.30568
+ATTTCTACACAACCTCAATATAGCTATTCTCAACAAGCTATAGATTTTATTTACGATGAA
+ATTAGGAAAAACCCAGATACAATTTTAGAGGATTTAAAAGAAAAAGTAAAAAAGTCAACC
+CCAGGAGCAAAGGATTCTAAGTGAAAAACACCTACTCCCATTCGGGAACCCAGCTTTATC
+CATCACAAGTTGACTAACTTTAGTATATGAAAAAAATGTTAAAAAGTCAAAAGTTTTTTA
+AATTAGTGAAAACAAAAAGGAGGCTCACCATATGAAATTACTGATCAAACAAAGAGTTTT
+TTCATGGACCGATTCTTATGACATATATGATGAATCCGGTAATGCAAAGTATTTTGTGAA
+AGCAGAATTCCTTACATTAGGACACCGGCTGCATATATATGATCAGGCGGGAAATGAACT
+GGGACTGATCAAAGAAAAGGTATTTTCCCTGCTTCCGGTGTTTGAGATCGAGCAGCATGG
+ACAGCTGAAGGGGAGAATCCAGAAACAATTTACATTTTTTAAGCCAAAGTATGAGATTGA
+TTATAATGGCTGGCGTGTGGAAGGTGATTTTCTGGGATGGGAATATGACGTGTATCATGG
+ATGCAGTTCGATCGTACATATTTCAAAGGAACTACTGCACTGGGGGGATACTTATGCGAT
+CAATATCAGTGATCCGTCCGATGAATTGGATGCTCTTATGCTGGTGATCGCAATCGACGC
+AGCAAACTGCTCAGATGGAAATTAGAAAGAAAGGTGTAATTATGGCAGGATATTTAATTA
+AGGATACAACAAAAGAAGAAAGAGAACAGATCGTAGCAGAGTCGCTTGGAAATATTGAGG
+CGAACTGTGATGGCTGTATGCGCGGACTTGCAGACATGTATCAGGATTACATCGATGGCA
+AAAAGGAATTGCGTGAGATCAACATGGAATTCAATACAAGATTTGTAAAAAGCGGTGATG
+ATATGCCGGGCAGACACAGCTGTGCGATGTATGGAGAATAATAAGATGAACATATTATTA
+ACACAGATTATGGAACCGCAGGCTGCAGCATTCACACATGGAGGGAAATTTCATGCGGAT
+GATGTATTCTCTGCGGCTTTATTGCGCTATTTGAACCCCGATATCACCATTGAGCGCGGA
+AACCGTGTGCCGGAAGAATATAAGGGAATCGTATTTGACATTGGAAGAGGCAGATATGAC
+CATCATCAGAGGGACAGCCGCATCCGGGAAAACGGAGTGCCATATGCGGCATTTGGGCTG
+CTCTGGGAGGAACTTGGAGTTGAGATACTTGGAGAAGATCTTACATTGAGGTTCGATGAA
+GATTTTGTGCAGCCGCTGGATCTCAATGACAATACCGGAGAGAAGAATGAGCTTGCGACA
+CTGATCGGACAGTTTAATCCGGTGTGGGACGATCACCGGGGAAGTGATGAGGGCTTCTTC
+CGTGCCGTTTCGGTCGCAGAGATGATCCTTAAAAATAAATTTGACCGGTATCTTGGAAAA
+GCCAGAGCAGACCAGCAGACGGAAGCGATTCTCGCAGAGCATGACAAAGCGGTTCATTCC
+GGCGATGCTGCGCCGGAGGATGCACGAATCTTAGTGCTTCCGGACTTTGTTCCATGTCAG
+AAACGGCTTGAGGAAACGGATATTGCATTTATCGTTTTTCCATCGAACCGTGGTGGATAT
+TGTATACAACCTTTGAAAAAGAAGCAGTCGATGAATTATAAATGCAGTTTCCCAGAGGAA
+TGGCTGGGACTGGAAAACGAGGAACTTGCGGCAGCAAGCGGACTGCAGAGTGCCACATTT
+TGCCATAAGGGCGGTTTCCTGATGTCTGTGGGAGATCTCGAGGATGCTGTGAAAGCCTGC
+AGGATCAGTCTTTTACAATATAAAGACCAGCCGGTGATCGTGAGACTTGGTGAAGATTCC
+GGAGCCGACGGGTTGTTGCTTCAGATTCCGGGAATGGAACATGCACAGGTGGTCTGGATG
+CCGCTTTTTTCAGCTCCGGAGCTTGAAATGCAGGGAAATTATGGCGAAATAGCCATGGAG
+AAGCCACAGTGGAAACAACTGGTCAAAGAGTATGTCAGAGAAATACTGCATTTTCATCCG
+GAAGCAGTATTTGTGAATGGAGAACTTCTGGAGGTTTATCCGGTTGTGCATGCACTCCGT
+AAAAAACATGTTCCGGTTCTGACGGTTTCAAAACAGAATGGAAGATCTGTGATCGTAAGG
+ATCCCGGCCGGTTCATAAAGTGCGGTTCACAAAGCAGATGCAGAAAATTCTTTTTTTTCA
+TAGGAAGAAATGCTAGAATTAAAGATTGTATCAGGATAAACGGAGGTTTATGATGGACAT
+TCTATTTGCAGGAAACACTAATTTTTTCTCTCCGGAATTTTATGAGGAGTTTGCAGTGGA
+GGATCGCTGCGCCGTAATTGGCAATGCAAAGCCCCGGAAGCAGATAAACAGGAAAGGCAT
+CAGATTTTTTCCGGAGACGAAGGACGCAGAGACGGAAAGGATATTCCAGAGCTATGATTT
+TGAGACGGTTCTGTTTCTTTCCAGGACGCTGGACTGTGAAAAAAAGGTTTTTGATGAGCT
+GGAGAACCTGGAGTATATTCTCTATCAGTGCAGAAAGAGAAATGTACCGGAGTTTATCTA
+CATTACAGAAAACCGTCATGTGAATGAGATTAAGGACGGTGAAGTAAGCAGAAAGATCCT
+TCTGGAAGCGTGCGACAAGCTGTGCAGGCATGCGGCAGAAAAGGACCATATCCGTGTTCT
+TGTCCTGCGCGTACCATATTTATATGGAGCAATGGGGGACAAGTGTGCTTCACAGGATCG
+CAGAGTGCTGGAAAAATGGATACAGGATACCGTAACAGAAAAGAGGCTTGAACTTCAGGG
+GGAACGGGATACGGAGATTGATTTTCTGCATACGGATGATCTGAAGGAGCTATTGAAAAG
+GATATTGGATGATCCGTGGAAAGAACCTTATTTTTCGGTCAGCGTGGGTGGAAAAAATAA
+CTGCACAATGGGGGAAGTTGAGGACTTTCTGAAGGCTGCAGAACCACAGCTTACAGTGCA
+TTACAGCGGAAAAACAGAGTATGTTCCGGCTGCAGGGGAGAACCAGTGGGCGAGAAGGGA
+GTATGGATTTATCCCCAAGGCAGATGTCTGGCAGGATGCTGCCCGTCAACTGGAACTGGA
+AAAGAAACAGCATGAAAAGTCAGCCGGGAAACGAAACCAATGGACGGGAAGATGGCTTCG
+TACCGGGATCGAACAGGCTGCCCTTTTTGCAGGAGCGGAATTTTTAAATGCGGTAACACA
+AAACAATGTTCTGGTCAATTTTCTTGATTTCAGATTTATTTATATTGCAATTATGGCGTG
+CGTGAATGGACTGGGTGCGGGTGTGTTTGCAGCACTGCTTGCCAGCGCAGGATATATTGT
+ATCGAAAGCAGGGGCAGTGAACTGGCAGGTTTTATTCTTCAATGTCGAGAACTGGCTGCC
+GTTCGCAAGTTATCTGCTGCTTGGATGTGTGATCGGATACACGATGGACCGTTCGGAAGA
+TGAACTGCAGAACAGTAGAGAGGAATATCAGATCCTGGATGAAAAATACAGCTTTCTCCA
+TGGACTATATATGGAAGTCCTTGAGGGAAAAGAGCGGTTTAACAGCCAGATTATCGGCTA
+CAGGGACAGCTTTGGACGGATGTATGCTGTCGTGAAAAAATTAAATACGACGCTGCCGGA
+ACAGGTATTTTATGAGGCTGTAGATGTGCTGGAGGAGATTTTGGACAATCCATATGTCGC
+AATCTATAATATACGCCCGAACAGCGTCTATGCGAGGTTAAATGTCTGCTCTAAACGGTG
+TATGGGGAATGTAAAAAAATCCTTGAAAATGACAGATTATCCGAAATTGTCAGAGTGTCT
+GTCTGCAAATGAGACATTCGTGAATATCGATGCGTTGGAGGATTATCCGGCATATGCGAC
+ACCGGTATTCAGAAATGACGTACTTGTGGGAATGATTCTTCTGATGCAGGCAGATTATCA
+GCAGATGAATATGGAGTTTTCCAATAAGTTCCGTATCATGACGGACATGATCCGTGATTC
+CCTGATCCGTGCCATGGATTTTTATGAGCAGAATGAGAATGCCGTGAAGAATACAAGGAT
+TCTTGAGAATGACAGGTTTGAAGAAATCCTGAAGGTGAAACAGGCAATGCGTAAGAAACA
+GTACTTAAATTACCGTATGCTTCATATTTTTCTGGATGGATCAGGTCTGGAGGAGATTAA
+TGAAAAGCTCTCCGGTCTGGTACGTGAAAATGATGTGCTAGGCCTTGGAGGAGATGGCGG
+GCTGTATCTGCTTTTGTCACAGACAAATGAGACGGATTTAAAGATCGTGGAAACCAGGCT
+GAAAACAAATCACATTCGGTACAAAGAGGTTATGGAATGAGAATTGCGATGATTTTTCTG
+TTGATCCATATTGCCGTCTGCATCGCAGTCGGGTATTTGTATAAGACGAAAAAACTAAAA
+ACGAGGAACCCGGTTCTTCTGGTCGTGATCTGCATTCCGGTGTGGGGGATAGGGATGCTT
+CTTGTGGAGGAGACCGCAGAACGGAGACATACTATGGGCAGAAGACCGGTCCGGATGTAT
+GAGACCATAGAAAAGAACGATCTGAATTACCGGACGATTCAGACAGGGACGCATGAGGAT
+ATTGTTCCGCTGGAGGAAGCAATGACCGTCAATGATACATCCGTAAGCCGCCGGCTTATG
+CTTGAAATTCTGCATAAAAATCCCGATGAATATATAGATCTTCTGAAGAAAGCGACTTCA
+TCAGATGATGTGGAACTGACACATTATGCGACGACAACAATGCTGGAGATCCAGAGCCGA
+TATGAGTGGAGGATCGAACAGAGTCTGGAAAGGCTGGAAGAGCAGCCGGAGAATCTGAAT
+ACGTTACGGAGAACAAAGAATTTACTGGAGAAATATCTTGAGAGCGGACTGATCTCCGGT
+GCGATTGCAGGACAATACAGAAAACGGCTGCAGGAGGTGCTGGAAACACTGCAGCGTCTA
+CAGCCGCAGACACACCGCTATGTATATGAAAGCCTGGAAAACAGGATTCTGGAGGGCAGC
+CTAAAAGGTGTAGAGAAGGAACTGCAAAAACTCCTGGAGCAATTCCCACAGGATGAGAAC
+GTGTACCGCTTGTCTGCACAATACTATTATATCCAGAAGGATGGCCAGAAACTCCGGGAA
+CTTTTCAGGCTTATGGAGCAGAGGCAGGTATACCTTGATAATGAAAGCCGGAAGTGGTAT
+GACTTCTGGACGCAAAAAGGATGAATAAATGAGAAGAAAAGCATTTGGAAAAATTATGGT
+GCCGGTTCTGGCACTGTTTCTGCTCAGTCTGCTTATTTTCCGGGAGAGGGCGGGAATCGA
+CTATGATCATACGGGTGACGGCAATAACGGATGGAATACAGCCTGCTATACGGATGCGGT
+AAGCCAGACACCATCCTGCCTGATTTTATCTTCTTCCGAAGCGGTCAGTACCCAGTACAC
+GGATATGATGCAGAAGGTCTTATCTGGCATGAAAATTGCATATGATATATGTGATGTGGA
+ACAGGGCTTTGATGCAGATATACTGGACAGATATGATACCGTCGTAGTGACCTTCCAGGA
+GTGGAGTGTGCTTGGGGATGAGATTTTTCCGGTATTTTCCTGGGTGGAATCCGGGGGATG
+CCTTCTGGATGCACTGACACCATCGGTGGATGGCTATTTTCAGGCAGTTTCGATGAAATT
+CGGAATTGAAATGATCGGATCTTCCTATCCTGCAGTATATGGGATAAGGTTTTTCAATGA
+CTGTATGCTCGGAGCATCGCAGGATGATGTATTCTGGTACGACAGAACCAAAGAAGAGGG
\ No newline at end of file
diff --git a/tools/phylophlan/test-data/GCA_000007905_truncated.fna b/tools/phylophlan/test-data/GCA_000007905_truncated.fna
new file mode 100644
index 0000000000..b057070083
--- /dev/null
+++ b/tools/phylophlan/test-data/GCA_000007905_truncated.fna
@@ -0,0 +1,36 @@
+>AE017125.1 Helicobacter hepaticus ATCC 51449, complete genome
+AGCAAATTAAATACCAAAAGGCATTTTATGGAATCCAAAGCACAAGAAAAGCAAGAGCAAAAAAAAGGCTATAATCCACA
+AGATATAGAATCTAGATTCTATGCTATATGTGAGAAACGAGGCTATTTTGAAATTGAGGGGAATAAATCTCTCTGGCAAG
+GTTGTGCGCCAAAATGCTTTAGCATTATGATGCCCCCACCTAATGTTACAGGAGTGCTTCACATAGGACACGCACTTACT
+TTTACTCTCCAAGATATTATCACAAGATTTAAACGAATGGAGGGCTTTAAAACACTCTATCAACCCGGTTTAGACCACGC
+AGGGATTGCTACTCAAAATGTCGTATTAAAACAGCTTTTAGCACAAGGTATAACTAAAGAATCTTTAGGAAGAGAAGCAT
+TTATAGCTAAAGTATGGGAATGGAAAGAGCAAAGTGGGGGGGAGATTCTCAATCAAATGCGTCATCTTGGCATCACACCT
+GCGTGGTCGCGTTTGCGTTTTACGATGGATAAAGGATTACAAAAAGCTGTAAAAAAAGCCTTTGTGCAATGGTATAATCA
+AGGGCTTATCGTGCAAGATAATTATATGGTAAATTGGTGCGTGAATGATGGTGCGCTTTCAGATATTGAGGTAGAGTATG
+AGCAAAATCACGGCAAGCTTTATTATTTGCGCTATCCTATTAAAGATTCTGCTCAATCCCTCATCGTAGCTACCACGCGT
+CCGGAAACATTTTTTGGCGATACTGGCGTAATGGTCAATCCAAATGATGAACGATATAAGCATCTCATTGGTAAAAGCGT
+GATTCTCCCATTATTGGGGAGAGAAATACCTATTATAGCAGATTCTCACGTTGATATGAGCTTTGGAAGTGGCTGTGTAA
+AAGTAACACCTGCCCACGATATGAATGACTACGAAGTAGGTAAAAGGCACAATCTCCCATTTATTACGATTTTTGACGAA
+AAGGGTATATTCAATAAAAATGCAGGAATCTTTCAGGGACAAGAACGTTTAGAATCTCGCCCTCTTATTGTCCAAAAATT
+ACAAGAAAATGGCTTTGTAGAAAAAATAGAAGATTATACAAATCAAGTTGGTAAATGTTATCGCTGCGGTAACATTGTAG
+AACCTTATATCTCCAAACAATGGTTTGTCAAAAAAGAAACAGCACATAATGCCATTCAACGTGTCAATAATGGCGAATTA
+CATTTTTACCCTGCACAATGGCTTAATAATTATAATGCGTGGATGAGAGAACTCAAAGATTGGTGTATTTCACGGCAGCT
+TTGGTGGGGACATAGAATCCCTGTATGGTATTGTGAATGCGGCAATAAAGTCGCTTCAGAATCTGATAATCCTATCTGCC
+CTCAATGTCAATCCACTATCACAAAGCAAGATGAAGATGTGCTTGATACTTGGTTTAGTTCTGGATTATGGGCTTTTAGC
+ACTTTGGGCTGGGGTAATGAGGATACAAATACTCAACCTCCCCTTTATCACGCAAATGATTTGGCAGAATTTTATCCTAA
+TTCATTGCTTATTACGGGTTTTGATATTTTATTCTTTTGGGTGGCACGTATGATTTTAAGTGGAGAATCCTTACTTGATT
+CACTGCCTTTTAAAGATGTTTATCTTCACGCACTTGTGCGCGATGAAAATGGGCAAAAAATGAGCAAAAGCAAAGGCAAT
+ATCATTGACCCTATGGAAATTATATCCTCTTATGGGGCAGACACACTCCGCTTCACTCTAGCAATTTTATGCGCACAAGG
+GCGCGATGTGAAACTCTCTACTCAATCTCTTGAAATTTCTAAAAATTTCACAAATAAGCTTTATAATGCTACAAATTTCC
+TTAATATGTATTTGGAACAACTCGGCGGTAAAGAGGCTTTAAAAAAAGGTTTTGGCGATATTAACCATATACACATAAAT
+ACACCACTTGGACAATATATGTTAGTAAGATTCTATACTGCTACAAACGAAGTAAGAGCAGCACTTGAGAACTATCGTTT
+TAATGATGGGGCAAGTATTCTTTATCGCTTCTTATGGGGAGAATTTTGCGATTGGGGTATTGAACTTGCAAAAGCAAGTA
+AAGATTCTATTTATGAGCTAGGAGCAATCTTTAAAGCTGCGCTTATACTGCTTCACCCTTATATGCCCTTTATCACAGAT
+GCGCTTTGGCATACGCTCAATGCAAGCGATATACAAACTTCCGATTCTATTATGATTCACTCTTATCCCAAAGCTATGGA
+AAAAAATGAGCAACACTCGCAGCTAGAGCGGACTTTTGAGGTTATTCAAGATGTCATTACTTCTATCCGCCGATTAAAAG
+CAATGCTTGAGCTTGGCTCTACAAATATTGAGTGTATTTTTGTCAAACTCAATGCACCATTTGAACACTCACTCCTTGAG
+CAGTTTGTTTGCAAGCTTGCTAAAGTCAAAACTCTTTGTATCACACAGCAAAAGCCTAAAGATTGCGTAGGGGATGTAAG
+CAAATATTGTGAATGCTACATACAACTTGGAGAGATTGATTTACAAGCTATTGGCACTCGTTTGCACAATCAACGTCAAA
+AACTTGAAAAAGAAATTACCAAACTTCAAGCTATGCTTGGAAATGAAAATTTTATAAAAAATGCCCCAAAGGCTGTAATG
+GAACAAAATCAAAGTGCATTACACAATGCGCAAGAAAAATTGGATAAAATTAACGCTGAACTTATCGCACTTGGATTGCA
+ATCTTAAAAATACAAAGGAGAACAAATGAAAAAAATACTCTTGCTCGTGCTGTGCTTTTATCTTAGTGGCTGTGGAGATT
diff --git a/tools/phylophlan/test-data/GCA_000008525_truncated.fna b/tools/phylophlan/test-data/GCA_000008525_truncated.fna
new file mode 100644
index 0000000000..5b0b8c088c
--- /dev/null
+++ b/tools/phylophlan/test-data/GCA_000008525_truncated.fna
@@ -0,0 +1,34 @@
+>AE000511.1 Helicobacter pylori 26695, complete genome
+TATTATGGTTGTTCTAACAAGTCCAATTCTTGCTTAATTTTACTTTCTTTTTCTAAAAGCGTTTTTAAACTCTCTTTAGC
+TTTTTCTAGCACGCTTTTAGGCGCGTTTTTGACAAAATTTTCATTGTGCAAATTGAGTTTTAATTTTTCTTTTTCCAATT
+TTTCCAACTGCTTTTTCAAACGCGCAACAAGCGGGCTTAAATCAAGATTTTCTAAATTCGCATAAGTCTGGCAAAATTCC
+CCCACATCGCTCACGCTTTTTAAAGGCTTAGAACTAATCACGCTGACTTTTTCCAACCTCGCTAATTTTTGGGCGTAAGT
+TTGCAAACGCTCTGTGTTTTCTATGGCTTCTCTTAATCCCACGCTCGCTTCTTTTAGAACAATCGGTGGGGTTTCTAGCA
+TGATTTTTAAACGCCTTAAAGACACAATGCAATCTTTAATCACTTCAAATTCATGCTCTAATTTTTCATCTTGCGCCAAA
+TCTTTAGGGTAAGGCATGACCATGATAGATTCAGTGTTTTCTAGTTCCGTATTGCTGAGCTTGTGGTATAAAGACTCGCT
+GATAAAGGGCATGAAAGGGTGCAAGAGTTTTAAAGCCTCTTTTAACACGCTCCCTAATTCGTCTATCGCTTCATTTTCCA
+CTTTAGAAAATTCAATGAACCAGTCGCAAAATTCCCCCCACAAAAAGCGGTATAACAAAGTCGTGGCGTCATTAAAACGA
+TAATTATCTAAAGCGTTACGCGCCTCTTTAGTCGCTGAATTCAAGCGCGATTTCGCATAACGCCCCAAAGGCGTTTGGTA
+TTCATTCAAACGCTCTTTATCTTTGAAAGATTCTTGTTTGAGCTTCAAGTAACTCGCCGCATTAAAAAGCTTGTTGGCGA
+AATTCTTGTTATTTTCTAAATGCGTAGTGGAAAGCTTAATGTCCCTACCCGTAGCGCACAAATTGGCTAAAGTGAAACGC
+AAGCTATCCGCGCCGTATTTTTCTATCATCTCTAAAGGATCGATCACATTACCCTTAGATTTGCTCATTTTTTCACCCTT
+TTCATCTCTCACTAAGGCGTGCAAGTAAATATCTTTAAAGGGCAATTCGCCTAAAAGCGATTCGCTGCAAAAAAGCATCC
+TAGCCACCCAAAAAAAGAGGATGTCAAACCCAGTAATGAGCGTTGTGTTAGGGTAGAAATCTTTCAAATCGCTTTCATTA
+AACAAACCGCTTTTTTCTTGCCCCCACCCTAGAGTGGAAAACGCCCATAGCCCTGAACTAAACCATGTGTCTAGCACATC
+CTTATCTTGCTCTAGTGTTTCGCTCTTACAAGTAGGGCAACTTAAGGGGGTGTCTAAGCTTACGAACTGGTGGTTATTCT
+CGCAAGTGAATACCGGTATTTGATGCCCCCAAAACAATTGCCTGCTGATACACCAAGGGCGTAATTCCCTCATCCAAGCG
+TTGTAATTATTGATCCAATTAGAAGGGTAGAATCGCGCCAAACCTTGTTGGATTTTTTCAATAGAACTTTGAGCGATTTC
+AGGCTTGACAAACCATTGCTTAGACACATAAGGTTCTACCACATTATGACAACGATAGCAATGCCCCACTTGATGCGTGT
+GTTCTTCTATTTTTTCCAATAGGGCGTTTTCTTTTAATCTTTCTACGACCTTATCTCTAGCTTCTAATCGTTCTAAATTT
+TCAAACTCCCCGCAATGCGCGTTTAAAATCCCCTTTTCATCAAAGATTTTAATCGTTTCCAAATGGTGGCGTTTGCCCAC
+TTCATAATCGTTAAAATCATGCCCAGGGGTTACTTTCACACACCCTGTGCCAAACTCCATTTCAACATGTTCATCAGCGA
+TAATAGGGATTGTGCGATGGATTAAAGGCAAGATCGCTTTTTGCCCCACCAAATGCTTGTATCTCTCATCGTTAGGATTG
+ACCATAAGCGCGCTATCGCCAAACAAGGTTTCAGGGCGTGTGGTAGCCACCACTAAATAATCTTTTTGATTTTCTAAATA
+ATATCTAATATAATACAACGCCCCCTTACGCTCTTCATACTCCACTTCAATATCGCTCAACGCCCCATCTTTAGTGCACC
+AATTCACCATGTAATTATCTTGAATAATGAGACCTTTTTCATACCATTTCAAAAACGCCAATTTGACCGCTCTTTGCAAG
+CCCTTATCCATCGTGAAACGAGTCCTAGAAAAGGCCGCGCTCACGCCTAAACGCTTCATTTGCTCTAAAATCGCTCCCCC
+GCTCTTTTCTTTCCATTCCCACACTTTTTTAATGAACTCTTCACGCCCTAAATCTTCTTTTTTAATCCCTTGACTTAAAA
+GCTGCTTTTCCACGACATTTTGCGTTGCAATGCCAGCGTGATCCAACCCGGGCTGATACAAAGTCTTATACCCATCCATG
+CGTTTGTAACGCGCTAAAATATCTTGCAAGCTTAAAGTCAGGGCATGCCCTATGTGCAACACACCGGTCACATTAGGAGG
+GGGCATCATCAAGCAAAATCGTTTGTTTTTTTCTTGGATCGCTTCATTGCCATCAATTTCAAAATACCCCCTATGAGAGC
+AAATTTCATAAATCTTTTTTTCTATCTCTTCTGGTTGGTAGGTGGTGGGTTCTTGTTTCATTATCATTATTATCCTAAAA
diff --git a/tools/phylophlan/test-data/GCA_000012345_truncated.fna b/tools/phylophlan/test-data/GCA_000012345_truncated.fna
new file mode 100644
index 0000000000..ab94cfc6cd
--- /dev/null
+++ b/tools/phylophlan/test-data/GCA_000012345_truncated.fna
@@ -0,0 +1,35 @@
+>CP000084.1 Candidatus Pelagibacter ubique HTCC1062, complete genome
+ATAAACTTATTATCACCTATGAGTAACGATAAATATATACATACAGACGTTGAAGATAAGATTTATTCTTATTGGGAAAA
+AAACAATTTATTTAAACCCACTAAAAATAAGAAACAATTTTCAGTGGTTATACCTCCGCCCAATGTAACTGGTAGCCTTC
+ATATGGGTCATGCTTTGAATAATTCAATTCAAGATCTTTTGGTTAGATACCACCGTATGAATAATTATGAAACCTTATGG
+CAACCTGGAACAGATCATGCAGGTATTGCCACACAGGCCTTAGTTGAGAAAAAATTAACCGCTGATGGTATTGATAAAAA
+TGAAATTGGAAGAGAAAAGTTCATAGAAAAGGTTTGGGAATGGAAGGAAGAACATGGTGATATCATTTTAAATCAACTAA
+AAAAACTAGGTTGCTCTTGTGATTGGTCAAGAAATGCTTTTACAATGGATGAAAACCTTTCAAAATCAGTTTTAAAAGTT
+TTTGTAGAGCTTCACAAAAAAGGTTTAATTTATAAAGATAAAAAACTAGTAAACTGGGATACGGTTTTAAAAACAGCAAT
+ATCTGATTTAGAAGTGGATCAAAGAGAAGTTAATTCTAAGATTTACTATATTCAATATCCTATAGAAGCTTCTAGTGATT
+TTATAACTATAGCAACAACAAGACCTGAAACCATGTTGGGTGATACAGCGATAGCTGTAAATCCAAAGGATGATCGATTT
+AAACATTTAGTTGGTAAGTTTGTAACAGTACCAATTGTTGGAAAAAAAATAAAAATTATTGAAGATGAATATGCTGATCC
+TGAGATGGGAACGGGTGCTTTAAAGATAACACCAGCACATGATTTTAATGACTATGAAGTGGGACAAAGAAATAATTTAG
+AAATCATAAATATTTTTACTGAAGGTGGCAAAGTAAACGAAAACGCTCCTAAAGAATATATTGGACTTGATAGATTTGAA
+GCTAGAAAAAGAATTATAAAAGAACTTAAAGAAAAAGAGTTTTTTGTTAAGGAAGAGAACATAAAGAATAAAGTTCCTTA
+TGGGGATAGGTCTAATTCAATAATTGAGCCTTTTTTAACAGAACAATGGTTTGTCGATGCAAAAAAATTATCAATTAAAG
+CTAAAGATATAGTTAACTCTAAAAAAACTAATTTTTTTCCTGCTAATTGGTCAAAAACTTATTTTCAATGGATGAACAAT
+ATTGAGCCATGGTGTATCTCAAGACAGCTTTGGTGGGGACATCAAATACCTGCTTGGTATGGACCAGATAAAAAAATCTT
+CGTTGCAATAAATGAAGAAGAAGCAAAATTGGATGCAAAAAAATTCTATAATAAAGATGTAGATTTAATTCGTGACCCAG
+ATGTATTGGATACTTGGTTTTCATCAGGTCTATGGCCTTTTGCTACATTGGGTTGGCCTGACAATAAAGAATATGTAGAT
+AAATTTTACCCGACATCAGTACTGGTTACAGGGTTTGACATTATATTTTTTTGGGTAGCACGCATGATCATGTTTGGAAT
+GGAGTTTCTAGACAAAGAGCCTTTTAAAGATGTTTACGTTCACGCCCTTGTTAAAGACGAGAAGGGACAAAAAATGTCTA
+AATCTAAAGGAAACGTAATTAATCCCTTAGACCTAATTGAAAAATATAGTGCAGATGCTTTAAGGTTTACTCTACTGTCA
+ATGGCGTCACCCGGAACAGATGTAAAACTTTCTGAAGATAGAGTTAAGGGTTATAGAAATTTTTTAAATAAATTATGGAA
+TGCAAACAATTTTTTAATTACCAATAATTGTGATTTTTCTAAAATTGATGAAAAACCAATTTTATCAATTAATATTAACA
+AATGGATCTATGCTGAACTTATAGAAACTAAAAATAAAATTGAAAAAAATCTAAAAGATTACAGGTTTGATGAAGCTGCA
+AAAAATGCCTATCAATTTACTTGGCACTCTTATTGTGATTGGTATTTAGAGCTATCTAAAACAATCCTATTTTCAGAAGA
+TGAAAAGGCAAAAGATGAAGTAAGACAGGTATCAGCTTACGTATTTAAACAGATATTAATATTATTACATCCATTTATTC
+CATTTGTGACTGAAGAAATTTGGCTAAATAATAAATTTGATAACACAGGTAAAGACTTTTTAATGTTAGCTAATTGGCCT
+TCTGGAGAGTTTGAAAGAGATACATCCATTAATCAAGTTGAAAAAATTATCAGTATAGTTTCTGAATTAAGATCATTTAA
+AAATGAATTAAGTGTAAGCCCTGGGTCATTTATAGATATTTCAATAGAGACAGTTAGTAAAAAAGAACAATCATTTTTTA
+CTGAAAATGAAATTATTCTAAAAAAACTTGGTCGTATCAAAAATTTATATAATAAAGATCTGGATAAACCAACTGCTACA
+TTGATGGTTTCTGGAGATTTATTCAAAGTGTATTTTGATGAAGATGTCGATTTAGAATTAATTAAAAAAAACTTAACTAC
+AAGGCAAAATAAATACCAAGAAGAAATGAATAAAATATCACAAAGATTAGCTAATAAAGGCTTTGTTGATAGAGCACCAA
+AAGATATTGTTGATCAGGAAAAAACTAATTATAATAATTTAAAAAATGATGTTGAGAGAATATCGATAACTATAAAGGGT
+TTATAATGGCAAAATTTAATAAAAAAAAATTACCAAGCAGACATACTTCATTAGGTGCTGATAGAGCTCCACATAGATCA
diff --git a/tools/phylophlan/test-data/GCA_000012965_truncated.fna b/tools/phylophlan/test-data/GCA_000012965_truncated.fna
new file mode 100644
index 0000000000..c724ed0942
--- /dev/null
+++ b/tools/phylophlan/test-data/GCA_000012965_truncated.fna
@@ -0,0 +1,35 @@
+>CP000153.1 Sulfurimonas denitrificans DSM 1251, complete genome
+TCTTAGCATTGTAAAGATTCTAATTGCTCTTTAACTTTGCTCTGCTTATCTGACGCATCCGCCAAAAGCTCTCTGTTTTT
+TACTAAAACATCCTCAGGAGCATTAGCAACGAAACGCTCATTATTTAACATTGAAGAGAGTTTGTCTATCTCTTTTTGTA
+GCTTTTCATCTTGCTTTGTAAGCTTTGAGATAATCGGAGTTAAATCAATACTCTGAGTCGGTATAAAAGTTTCACACATT
+TGGCTAATATCACTAACTGAGTCTGGGATTTTTTCATTTGTAAATTCAACTACATCAACCTTAGCAAGTCTAGCTATAAA
+AGGTCTCATCATCTCTTTTTCATCTTCACTTATGTTGTCTATCTTAACATAAGCTTTTTCTATCTTTTGGTTTGCCAAAT
+CAACCAAAACTTTAGCACGTCTAATAGAGATAATAGCATCCATGATTATCTCAAATCTCGCTTCATCTTTTGTGCGAACT
+TTTGTTTTGTAAGGGTACTTCATAATCATAATCGACTCTGAAGCTTCAAGTGTAGTACCGCTTAGCTCATGGTAGAGATA
+CTCTGTGATAAATGGCATAAATGGATGAAGAAGTTTCATCGACTCTTTAAAGATAGCTCCAAGCTCTACAATTGAGCCTT
+TGTCTGCTTTGCTTAGCTCGATTCCCCAGTCACAAAACTCATTCCATAAAAAGCGGTAAAGTACAGTTGCAGCGTCGTTA
+AATCTGTACTCATCCATACATGAGCGAACCTCTTGTGTTGCTACATTTAGGCGAGATAACATGTAACGTCCAAGTGGGCT
+CTCAACACAAAACCCTTTTAAATCAGGGAAAGTATCAACGTTCATCTGTAAGAATTTTGCGGCATTGTAGAGTTTATTTG
+TAAAGTTACGGTTTTGCTCGAGTTTGTCCGTACTCATTCTTATATCACGCCCTTGAGCAGCACTTATCGCAAGAGTAAAA
+CGAAGTATGTCGGCACTGTATTTTTCTACCATGTCAAGCGGGTCGATTACATTGCCTTTTGATTTAGACATCTTTTGTCC
+ATGCTCATCACGAACAAGTGCATGAAGGTAGATATGGTTAAATGGAAGTTCGCCTACAAAACTCTCACCCATCATCATCA
+TTCTAGCTACCCAGAAAAAGAGGATGTCAAAACCAGTTATTAGAAGCGAATTTGGATAAAAATCTTTCATATCCTGTGAA
+CTAAAGAGTTTGTCCATAGAAGCGTCGCCATTCCCCCAGCCTAAAGTTGAAAACGGCCAAAGAGCAGAGCTAAACCAAGT
+ATCTAGAACATCAGGGTCTTGAGAGATATTTTTTGAAGCACACTTTGGACATGTATGCTCTTCATCTTTGAGTGAAGCCC
+ATTCGTTGTCGCAATCCCCACAGTAAAATACAGGAATTTGATGTCCCCACCAAAGCTGACGAGAGATACACCAATCACGC
+AAATCACCCATCCAAGAGTTGTATGAGTTTATCCAGTGAGGAGGAAAAAATTTAGCTTCTCCGTTGTTTGTTTTCTCGAT
+AGATTTACGAGCAACTTCACTTCTTACAAACCACTGTTTTGAGATATAAGGCTCAACAATGTTTTTACATCTGTAACAGT
+GCCCTACTTGATGTTTATGCTCTTCAATTTTTACTACAAAACCTTCTTCATAAAGTCTTTTCATAATAATGTCACGAGCT
+TCTAAACGCTCTAAACCTTTGAATTCTCCAGCGTACTCATTTAAGATACCCTTTTCATCAAAAACAGTGATAAACTCTAA
+GTCATGACGCTTACCAACTTCATAGTCATTTTGGTCATGTGCAGGTGTAACTTTTACAACCCCCGTTCCAAAATCCATAG
+CTACATGTGAATCGGCGATGATAGAAACTTCTCTCTGAAGTAGTGGAAGTTTGATTTTTTTACCGATTAGATGCTTATAA
+CGCTCATCATCAGGATGAACCATAACCGCTGTATCGCCAAAGTATGTCTCAGGTCTTGTTGTTGCAACTTCAACAAATCC
+GCTTCCATCAGCAAAAGGGTACTTTATGTGGTAAAACTTTCCGTCATGGTCTTCATGTTCAACTTCTATATCGCTAAGTG
+CGCCATCATGTGTACACCAGTTTACCATGTAGTTTCCGCGAACTATCAGACCTTGATTGTAGAGATGAACAAAAGCCTCT
+TTTACAGATTTTTGAAGCCCGTCATCCATAGTAAAACGCTCACGCTTCCATGCAGGGCTAACTCCCATTTTGCGAAGTTG
+GCTTGTCATAATGCCAGCAGATTCTGCTTTCCACTCCCAAGCTCTCTTTAAAAACGCTTCTCTGCCAATCTCCTCTTTAG
+TCGTTCCCTCAGCAAGAAGTTGTTTCTCAACTACATTTTGAGTTGCGATTCCTGCATGGTCGGTTCCAGGTTGCCATAGA
+GTTTTATAACCGTCCATTCTCTTGTAACGGGTAATAATATCTTGAAGTGTAAATGTGAGTGCATGACCTATGTGAAGACG
+TCCAGTTACATTTGGAGGAGGCATCATGATAGAGAAGTTTTTTCCCTCTTCTTGAATACTCTTGTTAGAATCTACTTCAA
+AGTAGCCTCTCTCTTCCCAAATTTTGTAAAACTTATCTTCAGTAAGTTGTGGTTCGTAGCTGTTTGACATATTTATTACC
+TTGATTTTTGTAGTTTAAAAGTTTGAGATTATATCTAAAAAGATGTGAGGCTCTACTTATAATAAGTTCTATATTGCCTG
diff --git a/tools/phylophlan/test-data/GCA_000014865_truncated.fna b/tools/phylophlan/test-data/GCA_000014865_truncated.fna
new file mode 100644
index 0000000000..5aa9c8a23a
--- /dev/null
+++ b/tools/phylophlan/test-data/GCA_000014865_truncated.fna
@@ -0,0 +1,37 @@
+>CP000471.1 Magnetococcus marinus MC-1, complete genome
+GTCGAACTAGGTATCACCTACAGGGCCTATGCCCTTGCCAGAGAAGAGAAGATCCCATGCAGGAAACATCGTTGCCAAAA
+TCCTATGACCCCACCGGTGTGGAACAGCGCTGGTATCAAACCTGGGAAGAGCAGGGGTGTTTTAAACCCAGTGGTCTAAG
+TGCGGCCAACGCCTACTGCATCATGATCCCCCCCCCCAATGTGACCGGCAGCCTGCATATGGGGCACGCTTTTCAAGATA
+CCATCATGGATGCCCTGATCCGCTACAACCGCATGCAGGGGCATAATACCCTGTGGCAGTGTGGGACCGATCATGCCGGC
+ATCGCCACCCAAATGGTGGTGGAACGGCAACTCGAAGCCGAGGGTAAAAGCCGCCACGATCTTGGCCGCGATGCCTTTAT
+TGAACGGGTTTGGGAGTGGAAAGCCAGCAGTGGTAACACCATTACCAAACAGCTCCGCCGAATGGGGGCTTCCTGCGATT
+GGAGCCGTGAACGCTTTACCATGGATGACGGACTCTCCGAGGCGGTCAAAGAGGTGTTTGTTCGCCTCTATGAAGAAGAT
+TTAATCTACCGTGGTAAGCGCTTGGTCAACTGGGACCCGGTGTTGCACACGGCGGTTTCGGATCTGGAAGTAATCAGCGA
+GGAAGAGCAGGGCCACATGTGGCACATGCGCTACCCCATGGTCGAGGGCGATGGCTTTTTGGTGGTGGCAACCACTCGAC
+CAGAAACCATGCTGGGGGATAGCGCCGTGGCGGTGCATCCCGAAGACGCGCGCTACCAGCATCTGATCGGCAAGCAGGTG
+GTGTTGCCCTTGACGGGTCGCACCATTCCTGTGATCGGGGATGACTATGTTGATCCTGAGTTTGGTTCTGGCTGTGTCAA
+GATCACACCAGCCCACGATTTTAATGACTATGAGGTAGGCAAACGGCACAATCTGCCCCAAATGAGCATCTTTACCGTGG
+ATGCCTGCATCAATGAGGATGCCCCAGCCCGCTACCGGGGAATGGATCGCTACGAGGCGCGTAAACGCATTGTGGAGGAT
+CTGCAAGAGGCAGGTTTGCTGGAAAAAATAGTCGACCACAAACTCATGGTGCCCCGTGGTGACCGTACCAAGGCAGTCAT
+TGAGCCGTTGTTGACCGATCAATGGTTTGTGACCACCGCCCCCTTGGCCGCTGAGGCGATTAAGGTGGTGGAAGAGGGGC
+GCATTAAATTTGTACCGGAAAACTGGTCCAAAACCTATTTTGAATGGATGCGGAATATTCAAGATTGGTGCATCAGTCGC
+CAGATATGGTGGGGCCACCGCATTCCCGCTTGGTATGGTCCCGATGGTCAGGTGTTTGTCTGCCGCACCCAAGAGGAAGC
+GTCCCAAAAAGCCAGCCAGCACTACGGTAAGCCGGTGGCGCTAACCCAAGATAATGATGTGCTGGATACCTGGTTCTCAT
+CGGCACTATGGACCTTTTCGACCCTGGGTTGGCCAGAAAAAAGCCAAGAATTGGCCTCTTTTCACCCCACAAACGTGCTG
+GTTACAGGTTTTGACATTATCTTTTTTTGGGTAGCCCGCATGATTATGATGGGGCTGAAATTTACCGATGAAGTGCCCTT
+TCATACCGTCTATGTGCATGGTCTGGTGCGCGATGGCGAGGGGCATAAAATGAGCAAATCCAAGGGTAATGTCTTGGACC
+CGTTGGATCTGATCGACGGTATTAGCTTGGAGGATCTGGTGGCCAAGCGTACGCGGGATATGATGCAGCCCCATCTGGCC
+AAAAAGATTGAAAAACAGACCCGTAAAGAGTTCCCCGATGGCATCGCCGCCGCAGGTACGGATGCCTTGCGCTTTACCTT
+GGCATCGTTGGCGACCCAGGGGCGGGATATCAAGTTTGACCTGGGACGGATGGAGGGCTACCGTAATTTTTGCAATAAGT
+TATGGAATGCCTCGCGCTTTGTGCTCATGAATGCAGAGGGCCAGGATTGCGGGCTGGAACGGGTGGATCTGCCCCTATCG
+GTGACCGATCAGTGGATTGTGAGCAAATTTCAGCGCACCGCCCGGGATGTTACACAGGATATTGAAAATTATCGCTTTAG
+CGATGCGGCCAATACGCTCTATCAATTTTTGTGGGGCAGTTATTGCGACTGGTACTTAGAGATGGTGAAAACCACGCTCT
+ATGATGAGAACGCCGCAGAGGCGGCCAAAGCGGCGGTACGGCACACCATGGTTGGGGTGTTGGAGGCCTCCTTGCGGCTG
+CTCCATCCGTTGATGCCCTTTATTACCGAAGAGTTGTGGCAAAAGCTGGCCCCTCTGGCGGGCAAGCCCGCAGGTAGCAT
+TATGCTGGCCCCTTGGCCCGAGGCCGATGAAGGCCGTATTTTAGACCAAATTGAGAGCGAAATTGACTGGGTGCAGCGCT
+TTACCAGCACCATTCGTGGTATCCGTAGTGAAATGGATATCCCTCCCAGCAAAAAGATCCAGGTCTTGGTGCGTGGTGAC
+GACAGTGCGGTGGCCCGTCTGCGGCGCCATGTGAGTACCGTTACCGCCCTGGCCAAATTGGAGGGGTGGGCGGTGTTGCA
+GGATGAGGCTCCGCAAGGCTGCGCCACGGGGGTGTTGGAGGATATGCAGCTGTATATCCCCATGAAGGGCCTCATTGATG
+TGGCCGCCGAGAGCGCCCGTTTGCAAAAAAGCTTGGATAAGCTGGATGCCGATTGGCAGCAAGTCACAAGAAAACTGAGC
+AACGAAAATTTTATTGCCAAGGCCAATCCCGAAGTGGTTGCCAAAGAGCGGGATAAAGCCAATGAACTGATGGAAAAAAA
+GCGTGCCGTGCAGGAGGCTCTAACACGCATTCAGGCCATGGCATAGGGCGTGCTGTTTAAAGCAATTGCCCAGGGGCTAG
diff --git a/tools/phylophlan/test-data/GCA_000020825_truncated.fna b/tools/phylophlan/test-data/GCA_000020825_truncated.fna
new file mode 100644
index 0000000000..52a6218a65
--- /dev/null
+++ b/tools/phylophlan/test-data/GCA_000020825_truncated.fna
@@ -0,0 +1,37 @@
+>CP001132.1 Acidithiobacillus ferrooxidans ATCC 53993, complete genome
+GTCCTGCACGAAGGCCTGGACCAGATCAACGCCTCGGAAATCGAGAAAGATACCCTACCATGACTGACACTCTGGATCGC
+CCCTTTGCCCCCGCCGAGATCGAAACCCAATGCTACGCACGCTGGGAAACCCACGGCCTGTTCCAGCCGAAAGGCAGTGG
+AACCCCCTATTGCATCATGCTTCCGCCACCCAATGTCACCGGCACCCTGCATATGGGTCACGCCTTTCAGGATACCCTCA
+TGGATATCCTCACCCGCGTCCACCGGATGCGCGGCGAGCGCACCCTCTGGCAGCCGGGGACCGATCATGCCGGTATCGCC
+ACCCAGATGCTGGTGGAACGGCAACTGGTACAGGAAGGCGGCGATCGCCATCAGATGGGCCGCGGTGCCTTTCTGGAACG
+GGTCTGGCAGTGGCGTCGGGAATCCGGTGGCCATATCACCCGGCAGATGCGACGGCTGGGAGCATCCTGTGACTGGTCAC
+GCGAGCGTTTTACGCTGGACAGCGGGCTCTCCCATGCGGTCACCGAAGTCTTCGTCCGCCTCCATGACGAAGGGTTGATC
+TACCGCGGCAAACGGCTGGTCAACTGGGATCCGGTCCTGCGTACCGCAGTCTCCGATCTGGAGGTCATCAGCGAAGCGGA
+GCAAGGCTCGCTCTGGCACATCCGTTATCCCCTCAGCGATGGCACCGGCTTCCTCGTGGTCGCCACCACCCGTCCGGAAA
+CCCTGCTGGGCGACGTGGCGGTGGCGGTTCACCCCGACGATCCGCGCTACGCCGCCCTCGTCGGCAAGACCCTGCGCCTA
+CCGGTCATGAACCGTGAGATTCCCATCATCGCGGACGATTATGTCGATCCGGAATTCGGCTCCGGCTGCGTCAAAATCAC
+CCCGGCCCACGATTTCAACGACTATCAGGTGGGGCAACGGCACAACCTGGCCCTGCTCAACGTCTTTACCCCCGACGCGC
+ATATCCGGGACAGTATCGAGGTCTTCGGCGACGACGTCGTCGCCGGGGAGATTCCCGAGGCCCTACGCGGACTGGACCGT
+TATGCCGCCCGCCAGCAGATTCTCATCCTGCTGGCGGCGGAAAACCTGCTGGAACGCACCGACGAACACCAACTCATGGT
+GCCCCGCGGCGACCGCTCCCATGCCGTCATCGAGCCCTACCTAACGGACCAATGGTATGTGCGGGTCGCCCCCCTGGCGG
+AACCGGCCATCCGCGCGGTGGAAGAAGGCCGCATCCGCTTCGTGCCGGAAAACTGGAGCAAAACCTACTTCGACTGGATG
+CAGCGTATCGAGGACTGGTGCATCTCTCGCCAGCTCTGGTGGGGGCACCAGATTCCCGCCTGGTACGGCCCCGACGGCAA
+AATCTTTGTCGCTCGTCGTGAAGAGGAAGCGCAGTCGGAAGCCGTCCGCCATTACGGCATGCCGGTGGTCCTGGAACGCG
+ACCCGGACGTACTCGACACCTGGTTCAGTTCGGCGTTGTGGCCCTTCACCACTCTGGGCTGGCCGGAAAAAACATCGGAC
+CTTGCCCAGTTCTACCCCACCAGCGTGCTGGTCACCGGCTTCGACATCATTTTTTTCTGGGTGGCGCGAATGATCATGAT
+GGGTCTGCGCTTCATGGACGATGTGCCATTCCATGAAGTCTATGTCCACGGTCTGGTGCGCGATGCCGAGGGCCAGAAGA
+TGAGCAAGTCCAAGGGCAATGTCCTCGACCCCATCGACCTCATAGACGGCATCAGTCTGGAAGACCTCGTCGCCAAGCGT
+ACCCGGGGCCTCATGCAGCCGCAGATGGCGGCCAAAATCGAAAAGGCCACCCGTAAGGAGTTCGCTGACGGCATTCCCGC
+CTTCGGCACCGATGCCCTGCGCTTCACCTTCGCGGCACTGGCCACCCAGGGCCGGGACATCAAGTTTGACCTCAAGCGGG
+TGGAGGGGAATCGCAATTTCTGCAACAAGCTTTGGAACGCCTCGCGTTTCGCCCTGATGCAGACACCAACTCCGGCCGCT
+CTGGAAGGCGAGCGCGAGCTGCTGGCGCCGGAACGCTGGATCATCGGTCGCCTGCAACACTGCGAGGCGGCCGTCAACAG
+CGCCATCGACCAGTATCGCTTTGCCGACGCCGCCCATGCACTCTTCCAGTTTTTCTGGAATGACTACTGCGACTGGTATA
+TCGAACTGAGCAAACCGGTGCTGCGCGAGGGCGGCCCGTTCACCTCGGCACAACAGTGCGGCACCCGCAATACCCTGCTG
+CGGGTGCTGGAGGCCGGCCTGCGTCTGATGCACCCGGTGATGCCCTTCCTCACCGAGGAACTCTGGCAGCGGGTCGCACC
+GATGATCGGCAAGGCGGGGGACAGCATTGCCCTCGCCCCCTACCCGGTGGCCGATCTCGCCCGTGTGGACACCGATGCCG
+ATGCCGATACGGAATGGCTGATTGCCGTCATCCGCGCCATCCGCTCGGTGCGCGGCGAGATGGATATCCCACCGGGGAAA
+CCTCTGCCCCTGCTCCTGCAAGCCGGCGATACCCATGACCGGGAAAGGGTGGAACGCTACCGGTCCTGGCTCTTCGCCCT
+CAGCCGCCTCGCCAGTCTGGAATGGCTGGACGCCGAAGAGGAAGCGCCGCCCGCCGCCTTGCAACTGGTCGGCGATCTGC
+GCGTCCTCGTCCCTCTCGCGGGGGTGATCAACGTCGCTGCCGAACAGATCCGCCTCGCCAAGGAACAGCAACGCCTGGAA
+CAGGATCGCGCCAAAACCGTCGCCAAACTCGGGCAGGAAAGCTTTCGCAGCCGGGCGCCCGCAGAGGTGGTCGCCAAAGA
+AGAGGAACGCCTGCGGGAGGTGGATGCCGCATTACTGCAACTGGGGGAGCAGGCACGGCGGTTAGCCTTGTTGTGATCAA
diff --git a/tools/phylophlan/test-data/GCA_003236755_trunc.fna b/tools/phylophlan/test-data/GCA_003236755_trunc.fna
new file mode 100644
index 0000000000..d8a87550cd
--- /dev/null
+++ b/tools/phylophlan/test-data/GCA_003236755_trunc.fna
@@ -0,0 +1,116 @@
+>PZRR01000001.1 Staphylococcus aureus strain CM179 PROKKA_contig000001, whole genome shotgun sequence
+TCTCGTCCGTTCGCTCGACTTGCATGTATTAGGCACGCCGCCAGCGTTCATCCTGAGCCAGGATCAAACTCTCCATAAAA
+ATTATGATGTTTGATTAGCTCATAAATACTAAATAATGTTTGTAACTTATAGTTACGTTTTTGGAATTAACGTTGACATA
+TTGTCATTCAGTTTTCAATGTTCATTAATGTTCAATCTCTTTTATTGTACTTCATTAAATTATTGAAGTCAATAACTTTT
+TGAACGATTACTTTATTTATTTTATATTGTTTTTATAGTTATTTCAATGGTAAGTTTTACACTTTTGAAATTCTTCTTTA
+AAAACATCATCGCCGTTTTTGACGACTTTATTATCTTATCAACTTTATAATTTAAAGTCAATAACTTTTTTGAAAAATAT
+TCGTGTTTGCAAGTCGCTTCTTTTTTCAATGCGTTGATTGCTTAACACAAGAACTTATTTTACCAGCATTTTAAAACAAT
+TCAATATAAAAACGTACAAAATAAAAGTAATTTTGTACGTTTAGCATATATTATACCTATTTATTTGTCGCAGCTATAAC
+TTTTTGTGCAATCGAGCTATAAATTTTACCTAATCTGTCTTCAGCTTGATAAATTGAAGGTGCAAAGTCTTTTGGATTCC
+AAGACGGTTGCTCTAAAGGTAATTCCCCAAGTAATTGAGTATTAAGTTCATCAGCTAACTTAGTACCGCCACCTTTACCA
+AAAACATATTCTTTATTACCCGTCTCTTTACTTTCAAAATAACTCATGTTTTCAATTACTCCAAGAATAGAATGGTCCGT
+ATGTTTTGCCATCGCACCTGCGCGAGCTGCAACAAATGCTGCTGTAGGATGAGGTGTCGTTACAATAATTTCCTTACTTG
+AAGGTAACATCGTATGAACATCTAAAGCTACATCCCCTGTTCCAGGTGGAAGATCGAGTATTAAATATTCAATGTCTCCC
+CATTTAACTTCTGTAAAGAAATTCGTCAACATTTTACCTAACATTGGCCCTCTCCATATAACTGGCGCATTTTCTTCCAC
+AAAAAAGGCCATTGATATAACTTTAACGCCATGACGTTCAACTGGAATTACTTCCTTCCCTTTAATTCCAGGCTTTTCAT
+CAATACCCATCATATCTGGTACACTAAATCCATATATATCGGCATCTACTAATCCGACTTTTTTACCTTCACGGGCTAAG
+GCAACGGCTAAATTTACTGCAACAGTAGATTTACCGACGCCACCTTTACCTGAAGCAATAGCAATAAATTCAACTGGATT
+ATTTTGAGATAATAAGCCTTCTATCGTTTTAGGTTTATTTTCTTCTTTTGGTTTAAATTGATTTACTTTTTCTTCTGGTA
+ACGTTTCAAATCGTATACCCACAGTTTTTGCACCATTTTCTTTTAAAACATTAACAACTGCCATCTGTAAATCTAATTGC
+GGTGCGCCACCTAATTGTGCCATTGCCACTTTAACACTTACATGTTCTTTTTCTTCCTTAATAGAAACTTCTACAATACC
+TTCTGTTTCTTTTAAAGGTACATCTATAATAGGATCTTTAATTTCTCCTATTAGTTCTTTAACTTGATCTACCGTTAACA
+AAGCAAATCCCCCTTAATCAATTTAAAATATCTACATCATAGCAAATAACAATTTTTGCTTAGTCTATCAATAAAAGTAT
+AAAACTTTTCATTAAATAAAAAAAGAAGTTAGCCTATTATTTTCAATAGACCAACTACTATAATTATTTTAAAATTCCCT
+TCTATTACTTTCTATTACTTTAGGTTCTCTTATAAAAAGCGCTATCACATAAGCTGCCATAACAAGCACAGCTACAAAAG
+CAAATGAGATATCCACCCCTATAGCAATTGATTGCTGTTTAATTTCAGTTGCAGTTAAATGCGATGGCGATGTAGATGAG
+AATATTTTTGCGCCAAAACTCATCAAAGTAACCATTAATGCTGTTCCTAATGAGCCAGCCATTACACGACCAAAGTTCAT
+AATAGCCGTGCCATGTGAGATTTCTTCATTTCTCAAAGAATTAATTCCTGTAGTATTTATCGGCATCATGAGTAAAGAAA
+CTGAAAACATTCTAATTGCATATACGACTATTAAATACGTATAAGATGTGTCTGTATGCAAGAAACACAACATAATAGTA
+GTAATTGTTAAAATCGTAAAACCAGTATAAATCAGTGGTCTAGGACCATACTTATCATAAAATTTACCTGTAAAAACCGA
+CATAATACCATTTATGATTGCACCTGGCATGATAACAAGTCCAGACAATAATGCAGATAGAGCTAAGCTATTTTGAACAT
+AGAGCGGTATTAATAACGCTGGACCAACCATTGACATCATTATGATCATTGAGCTAATCGTACATAATGCAAATGTTCTA
+TTTTTAAAAACACTTAAATTTAAAAGTGCATTGCTTATATTGAATTGTCTACGAATAAATAAGTAGATGATAATAGAACT
+AATTATCATGGCACCAATGACTACCGGGCTAGTAAATCCTAGGTCGCCTGCACTACTGAATGCATATAACATTAATCCAA
+ATCCAATCGTTGAATACATTACAGAGCGCTTATCTAATTTAGTATATTTCACTTCATTATAGCTTGAAATTGAAATTAAA
+CCGAAGATGAATGCGACTAAAGCAATTCCTACAATTATAATAAATGGTACTCGCCAACTCGCTTGATCAATGATTAATCC
+AGTAACAGTAGGCCCGATTGCTGGTGCAAATTGAATAACTAAACCAGCTAATCCCATTGCAAATCCTCTATGTTCTTTAC
+TGAATAACGTAAACAATGTGAATTGCATTAAAGGCATGAGTACGCCTGCCCCCATAGCTTGGATGACACGCGCTACCATT
+AATACGCCAAAATTGGGTGCCATGGCTGCAACAATTGATCCTACTAAAAATGTCCCCATCGCTGCTAAGTATAAAGGTCT
+AGTTTTAATCCTGTCCATTAAGTATGCTGTTAGAGGTATCATGACGCCATTAACAAGCATAAACCCAGTAACTAGCCATT
+GCGATGTACTTTCATTAATATTTAATTCTCTCATTATACTAGGTAACGCTGTATTTAATAATGTTTGATTTAAAATAGCT
+ACAAACGCACTAATCAACATAACAGCAACTATGAAGTTTCGTCTCCGGGTTGTTAATTCAACTTTAGCCACCACAATTCC
+TCCTTTGTAACAAATTTACGTTTATTAGCATATATACTTAAAATATATTTCAGATTAAAGTACCAACTATTTATATCAAT
+GGTTATTATTAACCGTGATTAATTGAAGCAAAACAACTCATTTTCTACTATATGAATAAAAAGAAGTTGGAACACATCAT
+TGCCCCCAACTTCAAACCTCTATTTTCTATTGTTTAGATTTTTACTTTCAGGGTAAAACTGCAGCTTACAAACATATAAA
+AAGCCTATAATAACCATGATGACCCAAAAATCAATATTGATATACACATAGTTCAGATGAATAATAAAATAAAATAACGT
+TGTTGCAACCATATAAGAGATTAAATGAAAAGTTGCACCTCTAAAATAAGCATTTTCAGGTAACATTTTTCTAAAATAAT
+CCATCAAATTTTCAACTGCAAATACGATAAAGTAGCCAAATATAATATAACTACCATAATATAGCAAATTGTCGTACATA
+CTTCTGTTATATGTGAAGTCACCTAACCTAAAATAAATAAGAATTCTACTTAATCCATATAGTCCGAACCCTAAAAACGT
+TAAGAATATCGCACCAGAAAGCACAAAGATAAAGAGAACAATAATTGTTGTTAATAAATTATAAAACTTATGTTTAAGAT
+AATTCATAACTATTGTCCTCCTTACCAATAATAATTTATATTGCTTGTAATTTTAAGATAGTTGATTACACTTCAAACTT
+AGTAAAATGATTATTTGTTACTTTATTTACACTACATCAATTTTAATCATAATTCTATTCTTTTGTTTGTGACGCCGCTT
+CTCTATAAAATATGAGCCATACAACGATGAGCCCTACACTTATCAAGGATACAACGCCTAAAATATTATGCAAGTTTGCA
+CCAAACAATCCTGATTTTAATGCATAAAGGTATCCCATAATCGTCGAACCTATTGATGCGCCAAGGTTTTTTGTTAATCC
+ATAAAACGACATCATTTTCTTCATTTGTATTGGACTTGTTTCCTCTTGGACAATTACACTATCTTTTGTATAAATATATC
+CAAAGCTTAGTCCACTTAAAATTAAGACACATGCTATAAGAATTGGTAATTTTATACCAAACGCAATGATTATACTACTT
+AATAATAATAATGTAAAAGACGACAAATAGATAACTTTTCTTGATAACTTCGCTTCAATATGGTGCAAATTAAAATTCAA
+TGTAATCCACGCTACAGAAAGTGGAAAAATAACTAATCCACTTTGCAATGGCGATAACCCCAGTTGTTCTTGAAGATACA
+CAGGAATATATAAATTAAAGCCCATTAAACAAACAGCTGTAAGAAGATCTGTAATAAAGACCAAAGTAATCATTCGATTA
+AATTCTGCTACTGGTAAGAATGGGGATGAAACTTTTTTCTCAACATTAAATAATCGAAGTGCAACTAATATTGCTAAGAC
+AAAACCTATGATATTTAAATATAAATGTTGTTGGTTTAACAATGCAAACATAATTAAACCAATGAAAATATAAAACAGGG
+TGATACCTTTAGTATCGAATTTTGATTTAGCCACAGTTTTTTCTTCTGGAAAATGAAATGTCCAGACAACCAATATTATT
+GCAATAATCGCAATCGGTATATTTATGTAGAATAACCAATGCCATGTTGCAAATTCTAATATGCCACCACCTAGAAGTGG
+TCCAATGATACTCGAAATCCCCCAAACGCTACCAACGATACCCATAATTTTATAGCGTAATGGAATTTCAAACGCTAATT
+TAGGTACAATTTGTGACAAGGACATCATGACACCAGATCCAAACCCTTGAATTACACGTGATATAATCAACATACTAAAA
+TGTGTGCTTAAACCTGACATTAAACTACCAACCGTGAATAGTGTAAGACCTGCGATAGCAATATAAATAATTTTAAAACG
+AGTTAATAATTCACCTACTATTGGATTCGCAATCACTAATGCAATAAAGTAAGCCGTAAATATTAATGAAATTAAATTCC
+CTGCATTTAAATCTTGCTTAATTGTTGGTAACGCTAAAGAAATAATTGATGATTCGATTGCAGCCATAAACATGATTAGT
+ATTAAAGCTATTACAGTTACAATTGATTTTAAACGCATGCTATACCTCCTTTTATAATAATGATAGTGCTATGTAATTTC
+TAATTTTACTATTTCCTATCTTATCCTCTTTTAAATTCAAATTAGTTTTTTTAAAATCTATTTGTTACACCTACTAAAAA
+ATTCAAATAAACGTATCCATCAAATGTCTGATTAATACAAATTAAGTGCACTCCCAGCTTTAAAAATCATACCGATTTTA
+AAAAAGCAAAACAATCCTCTATTAGAATGAATTAAGTAATAAAAAAAGCGGAGTTTCCCCCACCTTCTGATAAACTATTA
+CATAAAATATAAAATAGCAATTAAATGCAATAATGATGCTATAACGATAAAAATATGCCATATCATATGAAAATATGGTC
+TGTTTTTTTGTGCATAAAACCAGGCACCAATTGTATATGACACACCACCTAAGAAAATGAATAATATGAATATCCATGAT
+GTGCGAATAAAAATAATTGGTAACAAGATAATACCTACCCAGCCCATCACTAAATAGACAATTAAACTTAACTTTTGATT
+AACTTTGACAGCTATGGATTTATATAAAATTCCCCAAAGAGTCGTTCCCCATAATAAAATAAATACTGTCCAACCTATCC
+AACCACCTACAATTGTTAACAAAATAGGAGTGTATGTACCTGAAATTGCTACGTAAATCATACTATGATCAATAATCCTT
+AAAATATATTTATGGGGTGTTTCATTTTGCATAGAGTGATAAATTGTTGATGAAATAAACATCATAAAGATAGAAATAAC
+ATAAATTGACATACTAACTGATGCAAGTGTGCCATTTGCAATATAACTATGTACAGCCGCATAAGGTAAGACTAATAGTG
+TTAACAGCGCTGCCAGACCATGAGATGCAGCATTGCCTATTTCTTCTCCAAATGACAATGGAATGATATCCTTAAATGTT
+TCTACAATTGTGTCATTACTTTTTTTACTTGATTTGGACATCATAGTCACCGCCTAACATTAAATTAAACCCATTCTACG
+TAAATCTTCAGTCGCTGTTGCAACACTATCTTTACCTTCTTTATTTTTTAGAGGTGAGAACTCTTCTTCTCTAGGAACTT
+GTAACGTGACAAAACTAGTTCCATAAGTAAATATGTCAAAATAGAACAATTCGAATTTTAAAGTTGGTTGTTCAATAACA
+CCAAAGTTCTCATCTAATTGCTTCAAATTCTTAATAGCTAAATGATAAGGTAATTCACGATTTACAGCATTTATAATAAA
+TCCAAGTTTAAATGCATGAATACCGATATTAGCATTGTTAAATTGATTTGCAACTTCTGGATCTAATTCTGAATACTCCA
+ATACTGTATCTTTACAATCGACATTAACTAATCGTCCAACACTTTCTCCTGGTTTTGGTTGAATCGTTTTAGAAGTAATA
+TCGTAATCATGTTCTACCGTAAATCCTGCAAATAGTGGATCCAACACTTTTACTAAAACATTGTCGATATTATTCAAGAA
+AATATACTTAACGCCATTATTAGACATTTCTTCTAAGTATCCTGACTTGTCTAAAGATTTAAACACGCCACCATTACCAT
+TTGGCGTTTCCATAATACGACCTTGTTGATTTAAAATTAACTTCCCTTCTTCACTAAGCGCCACAATATTATCTTGTTTA
+AAGAAATGTATTGCTTCTTGATCATAACCAAAGTAGTTATGCGATTCAAAATAAGCTAAAGTTTCTTCATGATTGATATC
+ACTTGTCATAATGTACCATTGAATTATATGACCAGTTTGTCGATGTAGTTCTTTTAATTGTTTTGCCTGAAGTTCAAATA
+AACTTACACCTTCAATTTCGAATGAACCTTTAGGTCCTTTATATCCAAGTCTTGTTCCTTGTCCACCTGCCATCAAAAGT
+ACTGCAAATTGTCCTTCTTTAATAGCTTGAAGTCCTTGTTCCTCTAAACGCTTAATCTCATCATCACTCATTTGTGATTT
+AATATCATATTTCACTTCAGAAACTGCAGATACATCATCTATTGTTTTCTTATTGATGTATAAATCGTTATATAATTTGG
+CAATAAAATCTAAATCTAATGACGCTACCTTCTCTTCAAGCGCTTCTTTTTCATTATTACTCATTATTTTTTCATATTCA
+CATAAATGATCTTGTTTATATTTAGCTAATTGATTTTTATCTAGCATTTTACGCCTCCTGCTGAGTTTGTAACCTTTAAT
+AATTTATTTTCTATAAAAACTTAGTATTCCAGTTGCTTATTATATCATTGATGAAAGGCTGAAATAAAACATAAACTGTT
+CCGACCATTAACGCAGTAGCTAAAGATAAGTCTACAAGTCCACCTGTTTTAAATTGAATCGGTGTCTTCACATTAAACGG
+TAACGGATAAAATAATTTCACGCCTTTTGGTGTTATCATATCTAGTATAACATGTGACACTAATCCAATTATAATTGCTG
+CCATATAATAATTAGGCGTCTGAATAATTTGCAATAAAAATGCTATGATTGCGATAAATAATATTGAATGCGTAAAGGTT
+>PZRR01000017.1 Staphylococcus aureus strain CM179 PROKKA_contig000017, whole genome shotgun sequence
+TGAATCGTCTACACTTAATTGGACAAATTCTATGAGAATAGATATTGTTAATTTAAGAAAGTAGGCGATTTTATTATGAC
+AAGAGAAAGAAGATCATTTAGTTCAGAGTTTAAGTTACAAATGGTTAGATTATATGAAAATGGTAAGCCTAGGAATGAAA
+TTATACGCGAGTATGATTTAACACCTTCGGCGTTAGGAAAATGGATAAAGCAACATCAAAACACGGGTACATTCAATCAC
+CAAGATAACTTATCAGATGAAGAAAAAGAGCTGATTAAATTACGTAAAGAAGTTCAACATTTAAAAATGGAGAACGATAT
+TTTAAAGCAAGCAGCGCTGATCATGGGACGAAAATAGAAGTCATTCAAAAGAATGCACATCAATATTCAGTATCAGCAAT
+GTGTAAAGTCCTAAAAATACCAAGAAGTACCTATTATGATTCTATAAAAAGAAAAGATAATAAAATCACTAAAGATGATT
+CAAACGTAGAACGTGCTGTCATAAATATTTTTAATTCTAATAGAAAAGTCTTTGGTACAAGACGAATTAAAAATAATTTA
+AATGATAAGGGTCTTACTGTATCAAGACGAAAGATAGGTCGTATCATGAAAAAACATAATCTAGTTTCTGTTTATACGAA
+AGCTAAATACAAAAATCATCCAAAAGAAACTAATAAAAAACGAATTAAAAATCATTTGAATCGCGCTTTTAATAGAGAAC
+AACCAATGGAGACATTAGTAAGTGATTTGACATATGTAAAAGTCGCAGGAACATGGCATTACATATGTTTATTTATAGAT
+CTATTTAATAGAGAAATTGTTGGTTACAGTGCAGGTAAAAATAAGGACGCAAATTTAGTATCAAAAGCAATCAGCAGAAT
+AAATCATAATCTTGAACAAATCAAACTATTCCACACTGATAGAGGCAAAGAATTTGATAATCATTTGATAGATGAAGTCC
+TAGAAACATTTAAAATCAAACGTTCATTAAGTACCAAAGGTTGTCCTTATGATAACGCAGTTGCGGAAGCAACGATGAAA
+GCAATGAAAACCGAATTTGTAAAACAAATGCAATTTGAAAACTTAGAACAGTTAGAAACAGAATTATTTGATTATGTAAA
+TTGGTACAACAATTTTAGACCACATTCTTCATTACAGTATTTGACGCCAGTGGCATTTAAAAATCTACACATGAAAACTG
+TCTAAAAAATTGTTGACATACCA
diff --git a/tools/phylophlan/test-data/GCA_003236765_trunc.fna b/tools/phylophlan/test-data/GCA_003236765_trunc.fna
new file mode 100644
index 0000000000..d9ea458369
--- /dev/null
+++ b/tools/phylophlan/test-data/GCA_003236765_trunc.fna
@@ -0,0 +1,114 @@
+>PZTC01000001.1 Staphylococcus aureus strain CM178 PROKKA_contig000001, whole genome shotgun sequence
+TAACAATACTAACAGCAATTATTATTATACTAGAGATTTTATTTAAAAATAATATATATTTACCTGTTCTATCTATAGAA
+CCTAAAACCTTACCTAATATTGCTAACAGAAAAAACCATAGCCAAGAAACCATAATTGTGGCAATACAAAAAAGTATCTT
+TTCTAAACCAGAATAGACAGATGCGCTTGATCCAATTACACCAACTGTATCCATAATTGCATGTGGATTTAACAACGAAA
+CAGATATAGCAAAACCTATTTGCTTTTTTGTACTCATCGGTTCATAGTTCTCTAGAGTGTTAGGCTTTTCTTTCCATAAA
+GACCAAGCCATGTACAATAGAAAAAACAAACCAACTATATAAATAAATAATTGTAGAACTGGTAATGACATTAATATTAG
+TGAAACACCCAGTACAGCAATTATTATTAAAAAAGTGTCACATAATCCAGCCGTTATAACAACCGGCAATGCGTTTATCA
+TTTTTTTTTGATTAGCACCTTGATTAAATACAAACACGTTTTGCGCTCCTAGGGGCAAAATAAGCCCCAATGCTAATAAA
+ATACCGTGTAAAACTGGTTGTATCAATTCGCATCCTCCCCCTTCCCAACAATGTTCGGTGTACAAATATCTTTTACTACA
+CTATAAAAACCCGGTAGTGTCGTCTTGAAGAACCCAGTACAATGGTGTGCTTCTCTATATTTTTGATCTTTCATTAATAT
+AATATGTGCTTTTTTCAAATTATAATGTGGAATTGCTGGGAATAAATGGTGAACTAAGTGAAAATTATCATGGTGAGGAT
+GAAATAAAAATATTGTCCAAGGCATACCAAAAGTATTCCGACTTGCTGTTAACTCACTATCATTATTCAATCCAGAGTGT
+TCAGCCATTTCTGCCCAATAACGAATAATCTGAAAAGTTGTTAAAAGTGGTATAAACCAATAAAGAATAACATATAACCA
+AAAATTAAACATAATTGATAACGTAATAATTGTTACCCAGAAAATATTTCTAGTCCATATTTCTGATTTAGGTGTATCCC
+TACTGTATAAGTTAGCTGAAACTGTACCTAAAACATATTTAGGCACATGGAATAAAAATAGTACCTTTACAATGTGATTA
+ATTATAAATTTTTTCACATCTTTTTGCGGCTTATCTAAACCTACAATGCGATATCGTTTAGTATCTGGGTCTTTTTCCTC
+ATCCCATAAATTTCTATGATGTTTAAAATGAGAATTACAATATGTAGTAAAGCTTGTAAATATAGGGAATGCTACTAAAA
+GACAAGCAATCCATTTATTATAAAACTTATTTGTAAATAATGAACGATGACATGCTTCGTGCATTAAGTTATCAAACGCC
+CTCATTCGACTTCCAATTAAAATAATACTTATAATATAAATAATGAGATTACTCATATAGATACTTATACATGCACTCCC
+GAGAATTACCAACCAGTCAAAAATCAAAGCGAAAATATTGTGGTAATTATCCTTTTTCATTAATAACTTCAAATCTTTTT
+TTATCTCCATTGAAAATACAGCTTTTTCTAATTTTAGTGTCAATTTAACCGCCTCCCTTATTTAATATGTTATAATAATC
+TGAAAATTAAAAAACCTACCAGATTCTAATAAAAATTCCAACCAGATTGAGGATGACATTTATGACTAAATTTCAATATA
+AAAAAATTATTGATGATATTATTAATAAAATTAACAACGGTATTTTATCTCCTGGAGATAAATTGTACTCGCAAAGAAAA
+TTAGCTAAGTACTATAATGTAAATAAATCCACAGTTATACAAGCTTTAGATATTCTAAAAAGCTATGGCATCTTAGATAC
+AATTGAAAAAAAAGGTATTTATGTATCCCAGTATAAATGGAATTCTTATATTACCAATAATATTCATTGGCAAGATTATA
+TAGGCAACAGCTTTTCTAAAAATAACCAGTATTATATTCAAAAAATTAATGAAATAGAATTTAATACTGATATCGTCCGA
+TTAGGTACTGGAGAACTATCACCAAAACTAATTCCAAACCATATATTTAAAAAAATATTAACTAATGATATTGAAGAATC
+TTTACAAACTAACTATGAAGAACCTAAAGGAAATCTAAAGTTAAGGATAGAAATAGTAAAGTATATGAAGCGAAGAGGAG
+TTGATTGTAATATCAATAATATATGTATTACATCCGGTGCTGTACAAGGTTTAAAACTAATTGCAGACGGACTGTTAATT
+CCACAATCTAAAATTATAATTGAAACACCATCATACATTAATTCCATACGTACTTGGCATAATATCAGAGCGAAAATTAT
+TCCTTTGTCCATCAATTACATCAAACAGAATATTAACAATATCTTTAAATTAAATAGTGATTATAGGCACAGTATTTTTT
+ACTGTATACCTACGCTGCATAACCCTACTCAAAATACTTATAGTAAAGAAGAGAAGCAAAAAATTATAGATCAATGTCAT
+AAAGAAGGTATTCCAATTGTGGAAGATAGTATATACTCTGATTTATGGTTCAGCCCTAACCAACAAATTTCTATGAAAGC
+TTTAAAAAATAGTGATAATGTTTTATATTTAGGTAGTTTATCTAAAACTGTAAGTCCCGGTTTACGTATTGGTTGGATTA
+TAGCAGATGAAAAAGTAATTCATCATTTAGCCGATTTAAAAATGCAAAATGATTATGGTGCAAGTTCTATATCACAGTAT
+ATTGCCACAACGTGGTTAAGTAATTATCATGAAGATCATTTATATAAATTAAAAATCGAACTAAAATTACGAAAATCTAT
+TTTTATAAAGTCATTAAAGAAACATCTATCTAAGTTTGGATATTGGAATGAACCCCAAGGCTCATTTTATATCTGGTTTA
+AGCTATCTGTTCCAGTAAATATAAAGCTCTTATTTAACGAAGCAATAAAAGAAAATATACTAATACACCCAGGAGAAATA
+TATGACATTAACTCTAAAAGCTATATCCGCTTTTCATACTCATATATCGACAAGGAAGAAATTGACCAAAGCTTAAAAAA
+ATTAAGTGAAATTATAAATAGAATACGAACTTAGTTAACATTTATCACCCTTTATATAATTCATTTTATACATGCGTGTT
+ATAATATTAAGCACAATACGCATTACATTTCATAAAAAACCTAAAATGCATTTTGTTATAAGATATTGGGATATTATACA
+CATTTACAAATATTGACAATATGATCTATATCATCAAATATTATTTCATTGTATGAATATAGAAGTTTTATTAAAAGATA
+ATAATGAGTACTATTAAAAAGGGAATTCCCCAAAAAATGTTTTGATTGGAAATTCCCTTTTTTAATTTTTATGTGGCGAA
+TTGTTGCACTTAATTTGACAACCTAAAACTTAAGAAAATATTCAGTCACACAACCTATCTTACTTATTACTTATTTAATT
+CCGTATACCCATCTCACAAATCCATCTATAATACAAACTATCATTTTATATAAGCAGAATTTACCCTGTCTTCCACACAA
+ACTGTTTTCGTCACTTTAATATGTCTTCTATTCAAAAAAGTCACTCATAACAAATTGCGCATTTTAATAAATTTAGCAAT
+GCCATTTGCATGCTGCAAAAATACTCATATTAATATTTATATTTTATATTATTTAAGTTTTTTAAATCCATATTTTTATA
+ACACTTGCTATGTGATAAAATTAATTTTATATATATAATCTTAAGATTCAGATTATTTAATAGCAAAGGAGATAGTGATA
+TGGATGTTTTAACAATAGAACATTTAACAAAGAAGATAGGTAATAAAACGATTCTCGACGATGTATCATTTAAGCTGAAA
+CGCGGACAAATAGTTGGTCTTGTTGGAGCGAATGGTGCAGGTAAAACAACTTTAATGAAAGTTATATTAGGTTACTCTAG
+TTTCCAAAGCGGGAATTTTAATGTTATTAACAGCAAGGATAGCAAAAGCAATATCGGTGCATTGATTGAAAATCCAGGAA
+TATATCCTTTTATGTCTGGATATGAAAACTTGAAGTTATTGAATGAATCAAAAAACACTCAAGATATCGATAAAATTGTC
+TCACAACTTCATATGGATGAATACATTCATAAAAAAGCTAAAACGTATTCTCTTGGTATGAAACAAAAATTAGGAATTGC
+TATAGCATTTTTAAATGAACCTCAATTTATTATCTTAGATGAACCAATGAATGGCTTAGATCCAAAAGCTGTGCGAGATG
+TACGTGAATTGATTGTCCAAAAAGCGCAAGAAGGTGTCACTTTCTTAATTTCGAGTCATATTTTAAGTGAATTAGTTAAA
+ATCACAAACTCTATCCTTATTATTAACAAAGGTAAAATTGTTACAGAAACATCGGAAGAAGAACTTAAACAATTTAAAGA
+TAATGATTTAGAAAATGTATTACTAGACATCATAGAAAGGGAGGATCAAGCATAAAATGGGAACTTTAATTAAACAAGAA
+TGTTTCAAATTATTTAAAAAGAAATCAACTTTTATCGCACCTATTGTCTTTATTCTACTAATGGTTGCTCAAGGTTATAT
+TGCTACAAAATACAATGAAATTTTTACACCACAGGAATCTTTTACATCTGCTTATAATGGTTTTTCATGGTTTGCATTTT
+TATTAATTATTCAAGCAAGTACAATCATTTCAATGGAATTTCATTACGGTACGATTAAAAATTTACTCTATCGTGAATAT
+TCAAGAACAACTATGATTGTTAGCAAAATCATCACATTATTTATTATTTCTTTAATTTATTTTGTTATTACAATTATTGC
+TTCAATTGTTATTGGGTCTTTATTCTTTAATGATTTAAATATATTTGAAAGTAGCGGTAATCAATTATCTTTATTGAATC
+AATTATTATTAGTTAGTTTAGGTACATTTGTTGGTGTTTGGTTAGTTTTAAGCTTAACGTTGCTATTATCATCTGCAACT
+AATTCAACGGGTGTAGCCATTGCTGTAGGTATTGTTTTTTATTTTGCAAGTTCTATTTTAGCAGTTATTCAAACGGCACT
+TTTAGAAAAAATAGACTGGCTAAAGTGGAATCCTATTAATATGATGAATATTATGCTTCAAACAGTTGAAAAAGGCTTTA
+GTAAGTCGACGAAATTAGAACTTCATGAATTGTTTATTGGTAATATTGCTTATATTTCTATTTTCTTAATACTTGTAGTA
+TTTATTTTCAAGAAGAAAAATATTTAGTAACTTAAAGTATTAGATGAATAAATACACACATATTTCATCGTAATTCAAAA
+TTATTTTCAAATCCCTTCACCCAAATAATGGTGCAGGGATTTTTGATATGTCAGCATGCCACTCATTCTATCTTTAATAT
+ATTTCAAAATCCCCCCACTTGTAATGTACAAAATATGCTCACTTAAACGATAATCGTATCTCTGCCAAGCTATTTCAACT
+CTGCTTTAATATAAAAATTATTCTCCCGGATGGGATGCTTATATCTCTATCATGATATTTCAACGCCGCTTCAACAACTT
+TATCACTTCATATTTATGCGGGTACACTTCAACGCTACTAATATGAATGATACAACCACAGATTCTCAACACTAAAATTC
+ACAATATGTTTACTCTATTTTTATCAATTCAAGCATACTTATTGAAAAATGTTAACGTTTTCTTGATAATCATTGTAAGC
+GTATTAATTTTACAAACCAATGATTGAAATATACTACAGGAGTGACACACAATGACTCAAATTACTGAAAGAGAATTAAA
+AAAGAAATATTTGGATTTATTATCTCAACATTTCGATACTCCAGAAAAGCTTGCGACTGAAATTATTAATTTAGAATCTA
+TTTTAGAATTGCCTAAAGGTACGGAGCATTTCGTCAGCGATTTACATGGTGAATATGAAGCTTTCCAACACGTATTACGC
+AACGGTTCTGGGAACGTGCGAGCGAAAATTAATGATATTTTCAAAGACAAGTTATCAACGAAAGAACTTAACGATTTGAC
+TGCCCTTGTTTACTATCCAGAAGACAAATTGCAACTTATTAAATGTGATTTTCAAAATTATGGACAATTAAATGTTTGGT
+ATATTACGACGATTGAACACCTCATTCAGCTAATTAAATATTGTTCTTCAAAATATACGCGTTCAAAACTTCGACGTGCC
+TTGCCGGAGCAATACGTTTTCATCGTAGAAGAGTTATTATATAAGAACAACGAATTTAAAAATAAAAAATCTTACTACGA
+AACACTTGTAAACCAAGTGATTGAGCTTAAGCAAGCGGATGATTTAATTATAGGGCTTGCGTATTCTGTACAACGCTTAG
+TCGTCGATCATTTACACGTTGTCGGCGATATTTATGATCGTGGCCCGCAACCAGATAAAATCATGGACACGCTGATTAAT
+TATCATTCTCTGGATATTCAATGGGGTAATCATGATGTGCTGTGGGTTGGTGCGTATGCAGGGTCTAAAGTATGTTTAGC
+TAATTTACTACGTATTTGTGCACGTTATGACAATCTAGATATCGTTGAAGATGCATACGGTATTAATTTAAGACCTTTGC
+TAACATTAGCCGAAAAATACTATGATGCAGATAATCCTGCTTTTAAACCTAAAAAAAGGCCTGACAAACATGAACGTTTA
+ACTCAACGCGAAGAAAGTCAGATTACTAAAATTCATCAAGCAATTGCGATGATTCAATTCAAACTGGAAATACCGGTTAT
+TAAGCGACGTCCAAACTTTGAAATGGACGAACGACTTGTACTTGAAAAAGTTAATTATGATACTAATGAAATAACAGTAT
+ACGGAAAAACATATCCATTAAAAGATACATGCTTCCAAACTGTTAACCGTGATAACCCAGCAAAGTTACTACCTGAAGAA
+GAAGAAGTCATGAACAAACTATTATTGTCATTCCAGCAATCTGAAAAATTACGTCGTCATATGTCTTTCTTGATGCGTAA
+AGGCTCACTTTACTTACCTTGTAATGGCAATTTACTCATTCATGGTTGTATTCCAGTTGATGAAAATGGTGAGATGGAAT
+CATTCGAAATTGATGGTCAGACATACAGTGGCCAAGAGTTATTAGATGTGTTTGAATATCATGTCCGTAAATCATTTGAT
+GAAAAAGAAAATACTGATGACTTATCCACTGATTTAGTTTGGTATTTATGGACTGGGAAATACTCTTCACTATTTGGTAA
+ACGTGCGATGACTACGTTTGAACGATACTTTATTGCAGATAAAGCTTCTCATAAAGAAGAAAAGAATCCGTACTATCATC
+TTCGTGAAGATGTGAATATGGTTCGTAAAATGCTCAGTGATTTCGGATTAAATCCAGATGAAGGACGCATTATTAATGGT
+CACACACCAGTGAAAGAAATTAATGGCGAAGATCCTATCAAAGCTGATGGAAAGATGCTTGTCATTGATGGCGGCTTTTC
+AAAAGCTTATCAGTCAACAACTGGCATTGCAGGCTATACATTGTTGTATAATTCATTCGGAATGCAACTCGTTGCACATC
+AACAATTTAACGCAAAAGAAAAAATTCTTTCCGAAGGTATCGACGAACTGTCAATTAAACGGATTGTTGATAAAGAATTA
+CAACGTAAAAAAATCCGCAATACAAATAAAGGTAAAGAGCTTCAGGCTCAAATAGATATTTTGAAAATGTTAATGCATGA
+TCGTTACTTAGACTAAAGACGACTTTTGATGCACGTGTCGTACACTTATTTAGAGGTGCTGTGTTTACGCATTGGCTACG
+CAAACGCGATGGTAAATAGGCGACCTAGCTACACCGAAAAAATCCCCTCACTATTACGAGTAGTGAGGGGATTGGTGTAT
+>PZTC01000055.1 Staphylococcus aureus strain CM178 PROKKA_contig000055, whole genome shotgun sequence
+ATTAAAACACTTCTTTCACAATCAATCTCTCATGCCATATCCACTCATTATGATTGTTCCAATAAATGCGACACCAACCA
+TCTATAATTTCAAACACATATATTAATGTTCCAGGCGCGTATACAGCCTGTCCAACATCGAATCTATAGTTAGTACGATT
+ATCACCGTATCTAGTGGCTGAAGTAGCACCTAAGCCGTCGATTTTCGCATTAAAATAAGCACCTTTTGACCATTTAAGGT
+TATAAGGCGCTTTACTTCCAACTGTTATTTTACTTGCAGATTTACCGACTGCTTTTTGAGCAGGTGGTTTAACTTTATTT
+GTGATCTTATTCATTAAGCCCTCACTTTTATACTTAGGTCTAATAAAGTGAGTACAGCCGTAATAATTATCCCAACGTAA
+CTTTGCAGGCGTATTTGCGTTACCGTCATAGTTCTGTTCCAAAATTAAAAATTGATTTGTATTACCACCATTAAACACTA
+AACCAATATGACCGTATTGTTTATATATTCCTTTGGTAAATACAGCCACATCACCTATTTGTGGAACAAACGATGGTGTG
+TTTTCATATACTGTTGCCATGTTTTTAAAATCGTTATTGATTGCATCTTTTGCATTTCCCCACATTCTAATTTCTAACAA
+CCAATAAATGTAATCAACTGCTAAATCTGCACATTGGTAACCATACCAACCGTCAAAATCAATATATCTACCTTGATACC
+AACGTAACCTTGCTCTTGCTTCACTGTATGTTTTCATTATTTTACCTCCTAGTATTTTCTTCTTGGTTCTTCATATTCTA
+AAGCTTGGTGGCTATCACCTATACCTTTAGTAGTCGGGTCTTGAATCACACCAGTTAATACTAAAAATCCTAATATAGCG
+TTTAAACCGTCTGTTAATTGCTCTGTATAAACTTGAATATCATACCCAATAGCTTTGGCGATGTTTTGAGCAAATAAAAA
+GATAGCTGACAATATCGCTACCCAAAATGATTTTTGTTTCATTCTAATTTTCCAATTAATCATATTCTTATCTCCTTTTA
+TCCAAAATAAAAAGACGACTAA
diff --git a/tools/phylophlan/test-data/GCA_003236795_trunc.fna b/tools/phylophlan/test-data/GCA_003236795_trunc.fna
new file mode 100644
index 0000000000..d5ab4745d9
--- /dev/null
+++ b/tools/phylophlan/test-data/GCA_003236795_trunc.fna
@@ -0,0 +1,119 @@
+>PZTE01000001.1 Staphylococcus aureus strain CM175 PROKKA_contig000001, whole genome shotgun sequence
+GTATTGACATTAATATCTAATTGTAATGTATCGATTAAGTATTGAAACGACACGCCTTTTTCATATTCTTGAAACATATA
+TAGCAGTACATCTATGTCTACTTTAGGTTTTATTGACATAAATAAAGGTCCCTTCAAAGTTTTCATTTTTTCAATGTCTA
+CTTTGAAGGGAGCATTTCAATATGCTTAAGTCCGAACTCATTGTTTATACTTATAAATTTTACGGGTTTAATATAATACT
+TATTTACCTGTAATATATGATAATTCTTCAGCGGCAGATGCGTTGATAGTTCTATGAGAAATGATACCTAATCCTTTAAC
+ATTGGATTCTGAAATAACGATAGAACCATCACTGTTAACTTTTTCAACAAATGCTACATGACCGTAATGTTGATCTGCAC
+CAAATTGTCCAGCCTCAAATACAACAGCAGCATGACGTTTTGGTGTATGACTTACTTGATAATCACGGTATTGAGCTCGA
+TTATTCCAATTATGTGCATCACCTAAATCACCTGAGATAGATGTACCAAATTGTTTCATACGGTTATATACGTACCAAGT
+ACATTGGCCATGTGGATATGGCATACTATCAGATACCTCGCGGAAAGGTTTGAATTCATCTGATGAATCATCATAATCCT
+TGATAGAACGTTCATATTTATCTAAATCTGGCATGCGTTCATCGTCAAACTGAGTTAATTGATAGTGTTTAATAATACTG
+TTTAATTTCTTAGCATAGTTTGGATCTGTAGCATATGTTTTAGATAAGTGTGATGTTGCATCTTTATAAGAATCGGCTTC
+CGATTTCCATGTTGGTTTATAAATTGTTCGATTGCCATCAATACCATTTTTAATAAGGTCAGAGTAATCTTTTAGTGATT
+CTTTCGTGCTTGGATATTTTCGGAATCCAGCATTAATACTATACAATTGATTACCATCAGCTTCTAATGTGTTAAAAGGA
+ACAGAATTCCCTTCAAAAGCACCTTTGATACCGAATAAATTATGGTTTGGTGACTTAGCTAAAGCACTACGACCTGAGTC
+AGATTCTAAGATTGCTTGGGCAATCATGACAGACGCATAAATATCGTTATCTTGACCAATGCGATGTGCATCTTTAGCAA
+TTGATTTTACAAATTGACGTGTATCTTTTGAGTCAACAACGTTAAATTGTCCACTATCATCATTGTTAGATATACTAGGA
+TCTGTTTCGAATAATGATGTTGCACGTGTATCCTTTTGATTAACATCGTTATTGAATGATTGAGCAGGTTTAGATTTATG
+TTTCAATTCATCTTGTGTTGGTAACTGTGGATTCTTTGTATTAGATTTTTCATTTTTGTCTTTTTTAGATTGAGATGCGT
+AATCTTTTTGTGTTTTCTTTGCATCTTCACTGTATTGATCCAAAATAGAGTCTAAAGCCGAATCTGACATTGATTGATTA
+CCTTTCGATGAAGATTTTTGATTTGCTTTATCGTCACTTGCTGGTTGACTATTTGATTGATTTGGTTGTGTTGGCTTTGG
+CGAATTTGGTTGCTTGTTAGATGTACTTGGTTTTGAATTGTTTGATTTAGGTGCTTTTTGATTGTCTGCTTTATCTTGTT
+TAGATGATTGCGTATCAGTGTCATTTTTGATGCTATTGTCACTGTTTTTATTCGAATCATTTGTTGACTTTTCACCATTA
+CGAGGTTGTTCGTAATCAGAAATATCCGAATTTAAATTGAATAAGTTTTGGATTAAAGTTGTTAATGAGTAATTATCATC
+GTATTTATTTTTGGTTAGCAATTGGTTTATATTGGTTTGTGGTAAATTCTTATAAATAAAATCAATGATATTGTTAGAGT
+CTGAAGTGCTGTCGTCTATAGTTTTAAATTTTTTGTCGTTATTGTCTTGGTTACTTGTATTATTGTTGTCTGCTTTATCA
+ATATCTTTACTTGTAGTATCCTTAGAAGTTTCATCGTCATTAGATTTTTTTGAATCATGAGATGTTGTCTTAGCTGTAGT
+ATCTTTTTGAGGTGTATCAGCATAAGCGGTAGGTGAAACTAAAGTAGGTAATACGAGCGTAGTTGATAGCAAATAAATTA
+AAATTTTATTTTTAGGCATATTTCGTATTCTCCCTTGAAAAATATAATAATTAAGTGTGATAATAAACTATGATTTGTTA
+TAATTTATCGTATGCTGAAAATAGTTGATAGGTATCAATCGACTAAATATCTTCCAGTAAATTGATTATACTAATTCACA
+ACGCAAAAATAAATTAATTTACAAAAAATATATAAAAAATATGAATAATTCCTACATAGGAGTGTGACAATGAAGAACGC
+ATTTAAATTATTTAAAATGGATCTGAAGAAAGTAGCTAAGACGCCAGCTGTGTGGATTATCTTAGCAGGCTTAGCTATTT
+TACCATCGTTCTACGCTTGGTTTAACTTATGGGCAATGTGGGATCCATATGGCAACACGGGACACATCAAGGTCGCAGTC
+GTTAATGAAGATAAAGGCGACACAATCAGAGGGAAAAAAGTTAATGTCGGTAATACGATGGTTAATACACTCAAGAAAAA
+TAAAAGCTTTGATTGGCAGTTTGTAAGTAGAGAGAAAGCTGATCATGAGATAAAAATGGGTAAATATTTTGCAGGTATTT
+ACATCCCATCTAAGTTTACACATGAAATTACTGGAACACTACGTAAGCAGCCTCAAAAAGCAGATGTAGAATTTAAGGTG
+AATCAGAAGATTAACGCTGTTGCGTCTAAGCTAACAGATACTGGTTCGTCAGTTGTCGTTGAAAAAGCGAATGAACAATT
+TAATAAAACAGTAACTCGAGCATTATTAGAAGAAGCTAACAAAGCAGGTTTAACTATTGAAGAAAATGTGCCGACAATTA
+ACAAGATAAAAAATGCGGTATATTCAGCAGATAAAGCTTTACCTAAGATTAATGACTTTGCGAATAAAATTGTATATTTG
+AATAACCACCAAGCGGATTTAGATAAATATGCGAATGATTTTAGAAAACTAGGAAATTATAAAGGTGATATTTTAGATGC
+TCAGAAAAAATTAAACGAAGTCAATGGTGCTATTCCGCAACTTAATGAAAAGGCTAAGTTGATATTAGCTTTAAATAATT
+ATATGCCGAAAATTGAAAAAGCGTTAAATTTTGCAGCTGATGACGTGCCAGCGCAGTTCCCTAAAATTAATCAAGGACTT
+AACATTGCGAGTCAAGGTATTGATCAAGCTAATGGACAGTTAAATGATGCCAAAGGCTTCGTCACACAAGTTAGAAGTAG
+AGTCGGTGATTATCAAGATGCAATTCGACGCGCGCAAGATTTAAATCGAAGAAATCAGCAACAGATTCCTCAAAATAGCG
+CGGCGAACAACGAAACATCAAATAGTGCACCTGCAGCTGGTAATGGTGTAGCACCAACGCCACCAAGTGCACCAAGTGGC
+GATACCGCACCAAATAATAATGTTACGCAAAATACCGCACCAAATAGTAATAATGCGCCTGTATCGACTACACCACAAAG
+TACAAGCGGGAAAAAAGATGGGCAAAGTTTTGCAGATATAACAACAACACAAGTCAGCACAGCTAACGAGAACACACAAA
+ACATTACAGATAAAGATGTTAAATCAATGGAAGCGGCATTAACGGGCTCTTTATTATCATTATCAAATAATTTAGATACC
+CAAGCGAAAGCCGCACAAAAAGATAGTCAGGCATTACGTAATATTTCGTATGGCATTTTAGCATCGGACAAGCCTTCTGA
+TTTTAGAGAGTCTTTAGATAATGTTAAGTCCGGTTTAGAATACACAACTCAATATAATCAACAATTTATCGATACATTAA
+AAGAGATTGAGAAGAATGAAAATGTTGATTTATCAAAAGAAATTGATAAGGTAAAGGCAGCTAATAATAGAATTAATGAA
+TCACTAAGGTTAGTTAATCAATTAAGCAATGCATTAAAGAATGGTAGTTCAGGAACTGCTGAAGCTACTAAATTACTAGA
+TCAACTGTCAAAACTAGATTCATCATTATCATCATTTAGAGATTATGTTAAAAAAGATATTAACAGCTCTTTAGTATCAA
+TATCACAACGTATTATGGATGAATTGAATAAAGGGCAAACGGCATTGTCTAATGTTCAGTCTAAGCTAAATACAATTGAT
+CAAGTCATTAACAGTGGACAAGCTATTTTAAAAAATGGTAAAACACGTATCGATCGTTTACAAACAGTATTACCAAGTAT
+TGAACAACAATACATTAGTGCTGTTAAAAATGCTCAAGCAAACTTCCCTAAAGTGAAAAGTGATGTAGCGAAAGCAGCTA
+ACTTTGTACGTAACGATTTACCACAGTTGGAGCAACGTTTAACCAATGCGACAGCAAGTGTGAATAAAAATTTACCAACG
+TTATTAAATGGTTATGATCAAGCGGTAGGATTACTAAATAAAAATCAGCCACAAGCGAAAAAGGCTTTATCAGATTTAGC
+TGATTTTTCTCAAAATAAATTGCCTGATGTTGAAAAAGATTTGAAAAAAGCGAATAAAATTTTCAAGAAATTAGACAAAG
+ATGATGCAGTCGATAAATTAATCGACACGCTTAAGAATGATTTGAAAAAGCAAGCGGGTATTATTGCAAATCCTATTAAT
+AAGAAGACTGTTGATGTTTTCCCAGTTAAGGATTATGGTTCAGGTATGACACCATTCTATACTGCACTGTCAGTATGGGT
+AGGTGCACTCTTGATGGTAAGTTTATTAACGGTTGATAATAAACATAAGAGTCTAGAGTCAGTGTTAACGACACGACAAG
+TGTTCTTAGGTAAGGCAGGATTCTTTATAATGCTTGGTATGTTGCAAGCACTCATTGTATCGGTTGGAGATTTGTTAATC
+CTAAAAGCAGGGGTTGAGTCACCTGTATTATTCGTACTTATAACGATTTTCTGTTCGATTATTTTCAACTCAATCGTATA
+CACGTGCGTTTCATTACTTGGTAACCCAGGTAAAGCCATTGCAATCGTATTGCTTGTATTACAAATTGCAGGTGGTGGAG
+GAACATTCCCAATTCAAACTACGCCACAATTTTTCCAAAACATTTCGCCATACTTACCATTTACGTATGCAATTGATTCA
+TTACGTGAAACAGTAGGCGGTATTGTTCCGGAAATCTTAATTACAAAATTAATTATATTAACGTTATTTGGCATAGGATT
+CTTCGTTGTAGGTTTAATTTTAAAACCTGTAACAGATCCATTGATGAAGCGCGTATCTGAAAAAGTTGACCAAAGTAACG
+TTACAGAATAAAAATTAAATCCACACATTAGGGTTATAGCTCCTTAATGTGTGGATTTTTATGTTTTTAGACAGAAGAGA
+TAGTAATTTCTGTCTTTTATGGGACGGGTGTTATCATTGCTATTATCCAGGATGACTTACTATAGCACTAATATTACCGA
+CAAAGTGAATATCCTCGTCTTCCGTAGTTAAAATAAAGCTAGAACCTTTTTGGATGTCATAGTGCTTATCGTTTACTGCT
+AAAGTGCCAGTACCATCGATAATTGTAACTAAGCAATAAGCATGTGGTTTATTGAATTTTAAATCTCCATGAATATCCCA
+TTTATATACTGCAAAATACTGATTATCTACAAATTGAGTTACAGTGTGTGTGTCGATGTGAGTTGTTATAGGAGTAGTAT
+TTGGTTCATGATTGCCTAATTCAATCACATCTTTACTTTGCTCTAAGTGCAAATCACGCAATTGACCATTTTGATCTCGT
+CTATCATAGTCATAAATACGGTATGTCGTATCGGATGATTGTTGTGTCTCTAAAATTAAAATACCCGAACCAATGGCATG
+GACAGTGCCAGCAGGAACATAATAAAAATCACCGGGCTTAACAGGTATACGTTTGAAAAGACTGTCAAATTCATGATTAT
+CAATCATGTCGATTAACGTCTGTTTATTATGTGCATGTACGCCATATATAATTTCAGCACCTGGGGCTGCATCTAAAATA
+TACCAACATTCTGTTTTACCTAGTTCGCCTTCGTGTTTTAAAGCGTAATCATCATCCGGATGAACTTGAACAGATAATTT
+ATCATTGGCATCTAATACTTTAGTTAGCAGAGGGAAACTATCTCGTGAATCATTATCGAATAATTCACGATGTTGTGACC
+AAAGTTGATCTAGGGTCATATCCTTGTATGGACCATTGATAATTGTATTAGGACCATTTGGATGTGCAGAAATTGCCCAG
+CATTCACCAGTTGTTTTATTAGGGATATCATAGTTAAATGCTTTTAATGCATGACCGCCCCAAATTCTGTCTTTAAAAAC
+GGGTTGTAAAAATAATGCCATAGTTAAAACTCCTCTATATTTTCATTAATAAGTTGTAAATTTCTGTAGTACTGTTTGCA
+TTAATTAGTGATTGGCGTGTCTCATCATTCATTAACGCTTTAGATAAGCGCTGAAGTATTTTTAAATGTGTATCCTGACT
+GTTGTTTGGTACGGCAATTAAGAATATCAATTGAGGTAGACTACCATCTAGGCTCTCCCATTTAACTCCATGATTATTTT
+TCATAACAGCTACAATCGGTTGTTTTACAACATCAGACTTTGCATGTGGAATGGCCACGTTCATGCCAATAGCCGTCGTA
+GACTCCATTTCACGTTCTAGGATTGCATTTTTTAAATGCGATGTGTGCTCAACATAACGGCAAATTTTAAGTTTATGAAT
+CAACATATCAATTGCTTCGTTTCGAGACATGTCGTGATCAGTAATTACCATAGTTTGTTGATCAAAAACATGAGAAGGTT
+TATTGAGATGTGAATGTTTCGCGGTGTTATCTACATTGTCAACCTCTGTATCATGTTGTGTTATATCTGTATCATGAAGT
+TGCGTGTGTTGCGCTGGTGCATCTACTGCTATAACTGGTGTATTGCGTTTTAATAATAGTACAGTAATCATTGTGACAAG
+ACTACCTACTATCACTGCAAAGGTAAACCATAATATATGATCAATACCACCTAATACAGCCACAATTGGACCTCCATGTG
+CGACTCTATCGCCGACACCACCAATGGCTGCAATGACTGATGCAATCATTGCACCAATGATGTTTGCAGGTATAATGCGC
+AATGGATCTTGCGCTGCGAAAGGAATAGCACCTTCAGTAATACCAAATAGTCCCATAGTGAAGGAAGCCTTACCCATTTC
+TCTTTCGGAATGATTGAATTTATACTTTTGAACAAACGTTGCTAAACCTAAACCGATTGGTGGTGTACATACAGCAACTG
+CGACCATACCCATAACGGCGTAATTACCTTCAGCAATAAGTGCTGAGCCAAATAAAAATGCTACTTTGTTTACTGGACCG
+CCCATATCGAAGGCGATCATCGCACCTATAATCATCGCAAGTATAATAATATTAGCACCTTGCATACTTTTTAACCAGGT
+TGTTAATGCCTCAAAAATATTAGAAATTGGTGCACCGATTAAAAATATAAATATCAATCCTACAACGACCGATGAAATAA
+TGGGAATAATAATGATAGGCATAATTGGTGCCATTGCTTTTGGAACTTTAATATCTTTAATCCACTTTGCGATATAACCT
+GCTAAGAAACCAGCAACAATACCACCTAAAAATCCTGCGCCTGCATCACTGCCATAAAAACTACCGTCAGCAGCGATAGC
+GCCGCCAATCATACCAGGAACGAGACCGGGCTTGTCAGCGATACTAACAGCGATATATCCAGCTAGTATTGGGACCATAA
+ATTTAAAGGCTAAACTACCAATGTTTTCAATGGATTTCCAAAATGAATCATCTGGGATGACTAATCCTTTTGATGTCGTT
+>PZTE01000044.1 Staphylococcus aureus strain CM175 PROKKA_contig000044, whole genome shotgun sequence
+GGTTCTCCACCAAATGTGGTGGGTATATAATTTAAAGAACTATTTTAAATTACAACTTTTAGAGTTTTTATTATTAGGCG
+GCCAGTCCATTATTGGGCTTGGTTGTCTTCTTTTTTTCTCCTTTGTACAAGCTGAAAATCATCATTATACGTGCTTTAAA
+GTTGTTGAAATTTCTGTAACCAAAAGAAATTCGCTTGATTAATTTTATCTTATTATTAATTCCTTCTATAGCACCATTAT
+TAAATGCTGGGTAATAAATTGTATTTCTTAACATCCTTTGATGTTTTCTATAATATTTAACCACTTTCCATACACCCTTA
+CTCACAGACTTTTTACTAACTGAATTTAAACGATTAATAAATTTAGGCCAATTACATAACCTTAGGTCTTTTCGTAATCC
+TTGGACAAGTTCGTAGGAGTGTCGTAGTATATCGTCTTTTGAAAGCATGAATTCTACAATGTCAGATGAGCGTTTATAAG
+CCTTAAAAGATTTATTCCATCTGTATTTACTAAATATGGTTTTACTAGTATCCATCAATAGAACTTTCCAGTTATTCTTA
+AAAATTGTATAATTAGGTCCTTTTTTATTACGGTATTCATTCATAACTTGTACACGATACTTATTAAGTTCTCTATTTAA
+ATGTTGAACGATATGGAATCTGTCAAAAATAATAGCCGCATTAGGAAATAGGTCGCGAAATAATCGGACATAGGGTTCAT
+ACATGTCAATAGTAACCGTCTTAACTTGTTGTCGATTTTTTAAATCGAATCGCTCGAAATAGGCACGCAAGAATCTTGTA
+GTTCTATTTTCTAAAATATCTATAACATCATGAGTATCATTATCTATAAAAATGAAACTCATTGACCCAGTTACATTTTT
+AACGCTTTTAAATTCATCCATAGCGATGTGTTCTGGCAAACAATTAAACGGTTTAATTCGCAATGAATTAGCCGCTTTAG
+TTCTAATACGACTTACAGTAGATGGAGAGATACAGTTGTCTTCTGCAGTATCAATCTCTGTTTTAACTTTAGTAGCTTCT
+TCTATAACTTTTTGAGTAACACATCTTGAGATAAAACACGACTCATCAACAATTGATGTTTTAGCAGTAAAAGTGCCATT
+GCATTCTAAGCATTTAAAACGTTGTTTAGCTAAGTTGAGGTATGTGTTATACCCTTGAGTTTTAAGTAAAGTAATACGAG
+AAACACGCTTACCATGTTTATGAATTTGTCCTTCATTTTTAACACCACAACAATAACAGGCCGAAGGCTTATACGTTAGT
+ACAGCATTAACCACTGTTGCTTTTTTTCCTTTGATAATGACGTCAATTTCTTGGTTTATATAATTTATATTTTCATCTTT
+TATTCTTAGTAATTCTAAGGTATCATTACACATAGGCGCACTTGTCTCCTTTAGTTTGGGTTTGGTCACTTTAAATTATA
+GAGGCAATTGCGCTTTTTGTGTATTAAAAAAAGCAGGAAGTTTTACCTTCCCACCATAAAAGATGAAGAACC
diff --git a/tools/phylophlan/test-data/GCA_003236805_trunc.fna b/tools/phylophlan/test-data/GCA_003236805_trunc.fna
new file mode 100644
index 0000000000..d827341e42
--- /dev/null
+++ b/tools/phylophlan/test-data/GCA_003236805_trunc.fna
@@ -0,0 +1,118 @@
+>PZRU01000001.1 Staphylococcus aureus strain CM173 PROKKA_contig000001, whole genome shotgun sequence
+TTTGTTTTCAAACCAATGTTATATTGGAATGGCCATCGCATAGCTTTAACATGATTAGTTTTTTTATAGTTGTAATATGT
+TGTTCTAGAGCTAATGAATCCTTGCATCTTTAATATCAAAGCATCTTTGTTATATTTTTTATCCTTCACAAAATCAAATT
+GAATATTTTGAGTCACGCCCCATTTATTACTAGTTTTATCTTCTGTCCTTTTGATAATTTCTATATCGCTTCCTTTACCG
+ATGTCTTCAGTATCGTTGGCAGCTTTAGCATTTTCTAATAACGGATTGGCAAGAGGGGCAAGTAAGCTCACAGATAAAGT
+TGTAGCTAATATTTTATTTCTAAGCATAAGTTTCACTTTCTTTCTATAATTTTATTTAACTTAATTAAATAATAATATAT
+TTTGAACGTTATTATAATTAACTGTTCATTAACAATTGACCATTATCAACTTTTTTTACAATTAAGTTAAAAATGCCATA
+ATTCCGTTCGATTTAACCTTTTTTGTTTGGAATGCTAAAATCTAATTTTGTGAGAAATATAGTTAATAAAACCTTGGTAT
+TGTTGACAGTTGTAAACAATTTAAGGTAACCGATTGCACGAATGTCTTGCTTTTATTTTTAATTAATGTTTGTAAAATAC
+AAATTGTTCTTTTTTAAGATTTTTGATGTATCCATCTAAAAGTTAATTATTTATTAACTTGAGAATATTTTATTTAAGCT
+TTCAAGTTAAATTGCTTCATTTGTATTATTTGTGTATCTACTATGGTGTGATATTTTGTTCTTATAAAAATCAGTTGTTA
+TTATTAAATTTAATGTACGATAAAATAATTTAATGTTATGAGACTGATTCAATATGTTAAAAAATCCTGAGACAAGTATG
+AAGTGTCCCAGGATTTTATAAAATGATTGAACTGTTTACTTAGGTGTGATGCTTTTAATTTTTACTTCATGTGTTTTCCA
+GTTCACTTCATATTTAACTGTAACGTTTCGGTTTTTAAAAGCATCATGTTTTCTATCAACGGCTAAACGATGTCTTGTCA
+CGTATGCATAAGTAGCATCCATGTTTCTGCCGTAAGTGATTTCAAACTCGCTTTTATCACCTTTACCTCTTTCGTGTGAC
+AATGTTGTAATAAATGATGGATTAAAGCCACTTTGAATTAAAGGAGGTAGTTGATTATCTGGGACGAAATAGTCTCTTGC
+TGCTGGACCAGTTGGGTCTTGTGCAAATAAGTATTGATCATATGCAGATACTTGACCATTCGGTGTAACGAATGAATTTG
+CTTTCACTCCCCATTTAACACCTTTAGAGTTCTGACTTTCTACTTCAGTAACATAGTTTTTTTGATTATAACTAATTGTT
+TTAGAGTAGTTGAATGAGCCACTGCCTCCGATTGATGGCGCTGATTGGAAGTTTCCGCCGATATTATAGCCTAATTTCTG
+ACTAACATCTGCTGAATCAATTTTATTTTTAGGAAGATAATTGATTAAATCAACATTAGAGTCTTTCGTTTTCAAACTGA
+TATTATATTGAAATGGCCATATCATTCTTTTAATATATGGATATTTTTTTAAGTCTGAATATGTTGTTCTAGAGCTGATG
+AAGCCTTGCATCTTAACAACTAGAGCATCTTTGTTATATTTTTTATCTTTTACAAAATCAAATTGAATGTTTTGAGTTAT
+AGCTAATCGTTTGCTAGTAATGTCTTGAGTTCTTTTGATGATTTCTGCACCTTGGCCGATATCTTCTATCTTATTTTCTG
+CTTTAGAAATTTCTATAAATGGATTGGCTAAAGGGGCTATTAAACCAACTGCTAAAGTTGCTGTTAATATTTTATTTTTA
+ATCATAGAAATCACTTTCTTTCTATTTAATTTTAAGTTCATATATATAATAATCTATTTGTAAGCGTTTTCGAATTAACT
+GTTCGTTAAAAGTTAATTACTATCAACATGTATTGAAGAGACATTTTAGCATTGTTAAATGATGTTTTTGCATTATGTTA
+TGTTTAAAAGATTTATTGGTCGTAGGCGTTTATATAGCTACATAACTATGTTTTGCAAGTCTTATTCTATTGAATTGTTG
+TTTAATTATGGTGCTTGTAGTGGAAGAGGAATGGATTGCGCAATAGTTTGTGAAAATTTGAAGTTAATAAAGTTGTGCTG
+ATTCAACTAAATGATGAACTATTCGTTAACGATGTAAGGATTATTTAACAAGTTGCAGGTAAAAAAGTAGGCTGACAAAT
+AGCGAAGAAACATTTAATTGATGGAAAATAAAAAAAGAACCGCAGATTCGATTGAGAATCAACGGTTCTTTTTAATCACG
+GTTTATTACGAAAATTATTTAAAAAATGATGTAAAACTAGAGAAGATATTTTTGATTGATGATGCTGTTTCAGCTGTAGT
+TATAGCAGCTTTAACTACTTTTGGATTTTGATAAAATGCATATAATACTTTACCTGTGTTTAAAGTTTCAGTTACATAGT
+TTCTTACTTGTGCATATGATTTAGATACATAATTTTTTTGATCTTCAACTTTTAATGGTTGGATGTATGATTTGTATCCA
+TTACCAAAAACTGATAGTACAGTTTTATCTATTGTACCTTTATATTTAAAATATTTATCAGTGTAGTACTTTGCTGTATC
+ATATTTTTCTTTATAGCTTTTATAAGTATCTGTTAAATATTTGTAACCATAGTTAAATGAATCTTTTAATGATTGGTAGT
+AACCTAATAATTTAGATTGAGGAACCTCAACTTTTGGTGATTGAATTTGAGGGACTTCAACTTTTGGTGATTCTGCTTTA
+GGTTTTTCAATTTGTGGTGATTGAATTTGAGGAGCCTCAACTTTTGGCGCCACTTTCTTTTCAGCATCTTTTTGAGCTAC
+TAATGCGTCTAATTGTTTCTGTAAATGCTTTTGTACATCCATAGGTGCTTTATTAACTTCACGTTGTGCTAAACGTCTGT
+TTTCAATTGAATCTTTTTCATTTAATTTTGAGATTGCATCATTTGCTGATTTCACACGCTCATCATGACGAACGATTGCT
+TTTTCAATTGAAACTTTTTCTACAAAGCGGTTATTTTTATCGCGTAAATCTTTAGGTAATTTTGAGTTAGCTTCATATGC
+TGCTGATTTATCGTGTGGTGCTTTGTTATCTTGGAAATCTTTAATTGCTTTATCCGCATTTTCAATATTTTGACGTTCTT
+TAGCTTTAGAAGATTGTACTGATTCTACCCAAACTTGTTGGCTTCTATCAGGGTTTTCTTTAATTTGTGCAATGTAATTA
+TTTTTTTCTTGTTCAGTTAAGTTATCATTTTTAAGAACATTGTAAAAAGCGTTTTGTTGTGCAACACGTCGGTCTGGGTT
+CTTGCTGTCTTTAAGTGATTCAGAGAATACTTCTTGTGCACGTTCTGGGTGTTCGCGTAATGTTTTGATGTATTGGTTAC
+GTTGTTCTTCTGTGATACCTTTTAGATGCAATACTTGATAAAAAGCTTTTTGTTGATCTGTTACGTAGTTGTTTTGAGTT
+GTTTGGTGCTTAGTTGAAGTTTGTTGCGTGTTTTCACTCGCTTTTGCTTCCCCATTTGAAATCATTGTAGCTAAAGTAAT
+TGTTGCTGCCCCAACTAGCAACTTCGAGATATATTTATTTTTCATGTGTATTCCCTTTCTTTTTACATATTAAATTTATT
+GTATGCTTTTAGAATTTATCACATGAGAATACAAATGGAAATTAACTAATTATTAACTAATGTTAACTAATAGATTAACT
+AGTGTTAACTATGTAAAAAAGCGTTTAATTCAGAACATTCAGCGTATTTTAAGTAAGGAAGTACTATATGGAGAAATGCA
+ATGGTTTGCTAATAAATAGAGGAGAAAATTGTCTTTCGAAGAGAGTTTGGTAGAGTAGAAATCACATTTGATTTGTCACT
+GATGCACTTTTTCTTCTATATAATTAGGTCACGACATTAGATAGCTTCGCAACTCATGCATAGGGTCCCAACATAGAAAC
+TTTCGAGGCGAAAGTTAACAAGTAGGAAGAGTTGGGCGCCTTTCTAACAAATAATTTCGCAGAAAATAAAGGAACGCAGT
+TGGACGTAAAACGTCAACTGCATAAGCCTTTCTAGCTCATAAAATTCGCAGAAAATAAAGGAACGCATTAGATAGCTTCG
+CTACTAATGCATAAGCCTTTCTAACAAATAAATTTGAAGAAAGGCTAAAAAATATTTTTAGGGGTTGCGAATGAATAAAT
+TAGTTTAATTTTATAAAAATTTATAAAAATTAAAAACGTTGTAAATTTAAAATAAATCATTCATAATATTGTTACTATAC
+TAATTCAAGGTGGTTCAACGCATGTCTCATAATGAAAATCTTAAATTGGCGCAACGCGGTGCTTATTTGAGTTTAATTGT
+ATATATAATCTTATCTATTGTTAAGTATGTCACGGGTTTTGTCTTTAACTCTGCAGCTGTAAGAGCCGACGCATTAAACA
+ATATGACAGATATTATCGTTTCTTTAGCTGTTATTATTGGATTGAAAATTTCAATTAAACCTGCCGATCGAAATCATCCT
+TATGGCCATTTGAAGTCTGAAAATATTTCTTCATTATTGGTGTCATTTGTCATTATGTTTGTAGGTATCCAAGTAGTTAT
+TCAAAATGCACTTCGTTTGTTCAAAGAAGATGACGTTGTACCTAACGCAATAACAATTATCGTCAGCTTAATCAGTGGTC
+TTGTAATGTTGATTGTATTTGCAGTCAATCAAAGACTAGCGAAAAGAACGAAAAGTAGTTCTTTAAATTCTGCTGCCAAA
+GATAATTTATCAGATAGTTTAGTCAGCATTGGAACGGCGATAGGATTAATTTTTACGCAAATCGGTTTCCCAATTGTCGA
+TATTATTTTAGCAACATTGCTAGGCTTACTAATCGTTTATACTGGTTTTGGTATTTTTAAAGAAGCAATTTTTATGTTGA
+GTGATGGTTTCAATGAAACTGAATTAGAAGCGTATCGCAATGATATTTTAGAAGTTGATGAAGTACAAGAAGTTAAAAGT
+ATTAAAGGGCGTTACCATGGAAGTAGTGTGTTTATTGATGTCACAATTGTTGTAGATGCTAACCTTTCCTTAGTAGAAGC
+CCATCAAATTTGTGACAATGTCGAACATCATTTGCACAAAAAAGGTATTTCCTCAGTATACGTTCACCCAGAACCAGACC
+ATCTATAATGTATTTAAACGTCTTCATAGATATATAAATATCTGAGGAGGCGTTTTTATTACATTTATTTTTAGGCGCGC
+CTAAAAATATTTTTTAAACCTTAGAAAAATAGCGGACAAAGGTGTATAATATGATTTATTATTAGGTGGTTATTGATTCA
+TTTATGAATTAAAAAATGAAAATGGGGAATAGGATTTATGTATTTAATGTCTAGTGATAATTGATTTAATCATTGAATTT
+TAAAACATATTGAAAAGAAAATTACTAAGATTAAATCATCTTAAAATATCCCTGAAATAACGTCCTAAAGATTAAAGGAA
+AGAGGTTATAAGTTATGCCAAAATTAATTTTATGTCGTCATGGACAAAGCGAGTGGAATGCTAAAAACTTATTTACTGGA
+TGGGAAGATGTTAATTTATCTGAACAAGGTATTAATGAAGCGACTAGAGCAGGTGAAAAAGTAAGAGAAAATAACATTGC
+CATCGATGTAGCTTTTACATCGTTATTAACACGTGCTTTAGATACAACGCATTATATTTTAACTGAATCTAAACAACAAT
+GGATTCCTGTATATAAAAGCTGGCGTTTAAATGAACGCCACTATGGTGGATTGCAAGGCTTAAATAAAGATGATGCTAGA
+AAAGAATTTGGAGAAGAACAAGTACATATTTGGCGTCGTTCTTATGATGTGAAACCACCTGCTGAAACTGAAGAACAACG
+TGAAGCTTACTTAGCTGATCGTCGATATAATCATTTAGATAAACGTATGATGCCTTATTCTGAAAGTCTGAAAGATACTT
+TAGTTCGAGTGATACCATTTTGGACAGATCATATTTCACAATATTTGCTAGATGGTCAAACGGTATTAGTTTCTGCACAC
+GGAAATTCAATTCGCGCATTGATTAAATATCTTGAAGATGTGTCAGATGAAGATATCATTAATTATGAAATTAAAACAGG
+TGCACCGCTTGTTTATGAATTAACGGATGATTTAGAAGTTATAGATAAATACTACTTATAAAAAAAGAGCTGAATGTACA
+CAAGGAGTGAGTGTATATGCAGCTCTTAAATATGTGAAGTAATGTAAGGAAATAGTTAAGTATAGAGTTTATATTAACGA
+GCTAGGGATACTCGAAAATATAGTTAGACATACAATATAGTCAAATTAAAACAATTATTTCGCTCTTTTATGTTGTTTAA
+TAATCTTTAAAGCACGCTTTCTTGTTTTAATGTTAGGGCTATTTAAATTACGACGAGCAGTCTGTAAATCTAATTTCATC
+TCTATCCCTCCTTGTAAATATATTATGACCGATAACTACTCATATGTAAATAGTAATGATTACGTTTTAAAGAAATTGTA
+ATAAAGTCGTGATAATTTTTTTGAAAATGGGTATAATTACCGGATATCTAAAAATGAGTGTCGTTTTTTAGATGATGAGG
+GGGAAGCTTTAAATGTCGAAGAAACAAAAATTAACGAGGATTATTACTATGCTGATGGGTGGATTTTTTGGATTATTAAA
+TGAAACACTATTAGTGACGGCTTTACCAAGTATTATGAAAGATTTTGAAATTTCATATACACAAGTTCAATGGCTGACAA
+CAGCTTTTTTATTGACTAATGGGATTGTTATTCCTTTGTCCGCGCTTGTTATACAACGTTATACAACAAGACAAGTGTTT
+TTAGTGGGTATTACTATCTTTTTCTTAGGTACATTACTCGGCGGTTTGAGTCCGCACTTTGCAACATTATTAGTTGCTAG
+AATTATTCAGGCGTTAGGTGTAGGTATTATGATGCCATTGATGATGACAACGATTTTGGATGTGTTCCAACCGCACGAAC
+GCGGTAAATATATGGGGATATTTGGTTTGGTAATTGGTTTAGCACCAGCTATTGGACCTACTCTTTCAGGTTACCTTGTT
+GAATATTTTAACTGGAGATCGCTTTTCCATGTTGTCGCTCCAATTGCAGCTGTAACATTTTTAATTGGATTTAAAACGAT
+AAAAAATGTTGGAACTACAATTAAAGTACCTATTGATTTTATTTCTGTCATTTTTTCTGTACTAGGTTTCGGTGGGTTAT
+TGTATGGAACGAGTTCAATTTCAGAAAAAGGTTTTGATAATCCTATCGTATTGGTATCTATGATTGGTGGTATTGCTTTA
+GTCGCATTATTTGTATTACGTCAATATCGACTATCAACACCATTATTAAATTTTGCTGTATTTAAAAATAAACAATTTAC
+AGTTGGTATCATTATTATGGGTGTCACAATGGTATCGATGATTGGTTCGGAAACGATTTTACCTATCTTTGTGCAAAATT
+TATTGCATCGTTCAGCTTTAGATTCTGGGTTAACTTTATTACCAGGAGCAATTGTTATGGCATTTATGTCGATGACTTCG
+GGTGCTTTATATGAAAAGTTTGGTCCTAGAAAGCTTGCTTTAGTAGGTATGGCGATTGTTGTTATTACTACGGCTTATTT
+TGTTGTAATGGATGAACAAACATCAACAATCATGTTGGCAACAGTTTATGCGATTCGAATGGTTGGTATCGCGTTAGGAT
+TAATTCCAGTAATGACCCATACGATGAATCAATTAAAGCCAGAAATGAATGCACACGGTTCATCTATGACAAACACAGTA
+>PZRU01000091.1 Staphylococcus aureus strain CM173 PROKKA_contig000091, whole genome shotgun sequence
+CAATTGCCTCTATAATTTAAAGTGACCAAACCCAAACTAAAGGAGACAAGTGCGCCTATGTGTAATGATACCTTAGAATT
+ACTAAGAATAAAAGATGAAAATATAAATTATATAAACCAAGAAATTGACGTCATTATCAAAGGAAAAAAAGCAACAGTGG
+TTAATGCTGTACTAACGTATAAGCCTTCGGCCTGTTATTGTTGTGGTGTTAAAAATGAAGGACAAATTCATAAACATGGT
+AAGCGTGTTTCTCGTATTACTTTACTTAAAACTCAAGGGTATAACACATACCTCAACTTAGCTAAACAACGTTTTAAATG
+CTTAGAATGCAATGGCACTTTTACTGCTAAAACATCAATTGTTGATGAGTCGTGTTTTATCTCAAGATGTGTTACTCAAA
+AAGTTATAGAAGAAGCTACTAAAGTTAAAACAGAGATTGATACTGCAGAAGACAACTGTATCTCTCCATCTACTGTAAGT
+CGTATTAGAACTAAAGCGGCTAATTCATTGCGAATTAAACCGTTTAATTGTTTGCCAGAACACATCGCTATGGATGAATT
+TAAAAGCGTTAAAAATGTAACTGGGTCAATGAGTTTCATTTTTATAGATAATGATACTCATGATGTTATAGATATTTTAG
+AAAATAGAACTACAAGATTCTTGCGTGCCTATTTCGAGCGATTCGATTTAAAAAATCGACAACAAGTTAAGACGGTTACT
+ATTGACATGTATGAACCCTATGTCCGATTATTTCGCGACCTATTTCCTAATGCGGCTATTATTTTTGACAGATTCCATAT
+CGTTCAACATTTAAATAGAGAACTTAATAAGTATCGTGTACAAGTTATGAATGAATACCGTAATAAAAAAGGACCTAATT
+ATACAATTTTTAAGAATAACTGGAAAGTTCTATTGATGGATACTAGTAAAACCATATTTAGTAAATACAGATGGAATAAA
+TCTTTTAAGGCTTATAAACGCTCATCTGACATTGTAGAATTCATGCTTTCAAAAGACGATATACTACGACACTCCTACGA
+ACTTGTCCAAGGATTACGAAAAGACCTAAGGTTATGTAATTGGCCTAAATTTATTAATCGTTTAAATTCAGTTAGTAAAA
+AGTCTGTGAGTAAGGGTGTATGGAAAGTGGTTAAATATTATAGAAAACATCAAAGGATGTTAAGAAATACAATTTATTAC
+CCAGCATTTAATAATGGTGCTATAGAAGGAATTAATAATAAGATAAAATTAATCAAGCGAATTTCTTTTGGTTACAGAAA
+TTTCAACAACTTTAAAGCACGTATAATGATGATTTTCAGCTTGTACAAAGGAGAAAAAAAGAAGACAACCAAGCCCAATA
+ATGGACTGGCCGCCTAATAATAAAAACTCTAAAAGTTGTAATTTAAAATAGTTCTTTAA
diff --git a/tools/phylophlan/test-data/bin2meta.tsv b/tools/phylophlan/test-data/bin2meta.tsv
new file mode 100644
index 0000000000..8a4b82c1da
--- /dev/null
+++ b/tools/phylophlan/test-data/bin2meta.tsv
@@ -0,0 +1,369 @@
+CM_ethiopia__CM_A01_I1_18__bin.19 A01_I1
+CM_ethiopia__CM_A01_I1_18__bin.31 A01_I1
+CM_ethiopia__CM_A01_I1_18__bin.42 A01_I1
+CM_ethiopia__CM_A01_I1_18__bin.51 A01_I1
+CM_ethiopia__CM_A01_I1_18__bin.52 A01_I1
+CM_ethiopia__CM_A01_I1_18__bin.5 A01_I1
+CM_ethiopia__CM_A01_I1_18__bin.73 A01_I1
+CM_ethiopia__CM_A01_M0_18__bin.21 A01_M0
+CM_ethiopia__CM_A01_M0_18__bin.30 A01_M0
+CM_ethiopia__CM_A01_M0_18__bin.31 A01_M0
+CM_ethiopia__CM_A01_M0_18__bin.43 A01_M0
+CM_ethiopia__CM_A01_M0_18__bin.56 A01_M0
+CM_ethiopia__CM_A01_M0_18__bin.59 A01_M0
+CM_ethiopia__CM_A01_M0_18__bin.60 A01_M0
+CM_ethiopia__CM_A01_M0_18__bin.62 A01_M0
+CM_ethiopia__CM_A01_M0_18__bin.63 A01_M0
+CM_ethiopia__CM_A04_I1_18__bin.1 A04_I1
+CM_ethiopia__CM_A04_I1_18__bin.2 A04_I1
+CM_ethiopia__CM_A04_I1_18__bin.42 A04_I1
+CM_ethiopia__CM_A04_M0_18__bin.15 A04_M0
+CM_ethiopia__CM_A04_M0_18__bin.16 A04_M0
+CM_ethiopia__CM_A04_M0_18__bin.8 A04_M0
+CM_ethiopia__CM_A06_I1_18__bin.31 A06_I1
+CM_ethiopia__CM_A06_I1_18__bin.32 A06_I1
+CM_ethiopia__CM_A06_I1_18__bin.34 A06_I1
+CM_ethiopia__CM_A06_I1_18__bin.37 A06_I1
+CM_ethiopia__CM_A06_I1_18__bin.46 A06_I1
+CM_ethiopia__CM_A06_I1_18__bin.54 A06_I1
+CM_ethiopia__CM_A06_M0_18__bin.19 A06_M0
+CM_ethiopia__CM_A06_M0_18__bin.24 A06_M0
+CM_ethiopia__CM_A06_M0_18__bin.2 A06_M0
+CM_ethiopia__CM_A06_M0_18__bin.31 A06_M0
+CM_ethiopia__CM_A06_M0_18__bin.34 A06_M0
+CM_ethiopia__CM_A06_M0_18__bin.36 A06_M0
+CM_ethiopia__CM_A06_M0_18__bin.39 A06_M0
+CM_ethiopia__CM_A06_M0_18__bin.9 A06_M0
+CM_ethiopia__CM_D02_I1_18__bin.21 D02_I1
+CM_ethiopia__CM_D02_I1_18__bin.24 D02_I1
+CM_ethiopia__CM_D02_I1_18__bin.2 D02_I1
+CM_ethiopia__CM_D02_I1_18__bin.31 D02_I1
+CM_ethiopia__CM_D02_I1_18__bin.46 D02_I1
+CM_ethiopia__CM_D02_I1_18__bin.49 D02_I1
+CM_ethiopia__CM_D02_M0_18__bin.17 D02_M0
+CM_ethiopia__CM_D02_M0_18__bin.21 D02_M0
+CM_ethiopia__CM_D02_M0_18__bin.23 D02_M0
+CM_ethiopia__CM_D02_M0_18__bin.25 D02_M0
+CM_ethiopia__CM_D02_M0_18__bin.3 D02_M0
+CM_ethiopia__CM_D02_M0_18__bin.49 D02_M0
+CM_ethiopia__CM_D02_M0_18__bin.4 D02_M0
+CM_ethiopia__CM_D02_M0_18__bin.61 D02_M0
+CM_ethiopia__CM_D02_M0_18__bin.62 D02_M0
+CM_ethiopia__CM_D03_I12_18__bin.27 D03_I12
+CM_ethiopia__CM_D03_I12_18__bin.33 D03_I12
+CM_ethiopia__CM_D03_I12_18__bin.34 D03_I12
+CM_ethiopia__CM_D03_I12_18__bin.5 D03_I12
+CM_ethiopia__CM_D03_M0_18__bin.30 D03_M0
+CM_ethiopia__CM_D03_M0_18__bin.44 D03_M0
+CM_ethiopia__CM_D03_M0_18__bin.45 D03_M0
+CM_ethiopia__CM_D03_M0_18__bin.62 D03_M0
+CM_ethiopia__CM_D03_M0_18__bin.63 D03_M0
+CM_ethiopia__CM_D03_M0_18__bin.64 D03_M0
+CM_ethiopia__CM_D03_M0_18__bin.65 D03_M0
+CM_ethiopia__CM_D03_M0_18__bin.67 D03_M0
+CM_ethiopia__CM_D03_M0_18__bin.69 D03_M0
+CM_ethiopia__CM_D04_I1_18__bin.12 D04_I1
+CM_ethiopia__CM_D04_I1_18__bin.1 D04_I1
+CM_ethiopia__CM_D04_I1_18__bin.26 D04_I1
+CM_ethiopia__CM_D04_I1_18__bin.33 D04_I1
+CM_ethiopia__CM_D04_I1_18__bin.35 D04_I1
+CM_ethiopia__CM_D04_I1_18__bin.36 D04_I1
+CM_ethiopia__CM_D04_I1_18__bin.39 D04_I1
+CM_ethiopia__CM_D04_I1_18__bin.44 D04_I1
+CM_ethiopia__CM_D04_I1_18__bin.47 D04_I1
+CM_ethiopia__CM_D04_I1_18__bin.8 D04_I1
+CM_ethiopia__CM_D04_M0_18__bin.42 D04_M0
+CM_ethiopia__CM_D04_M0_18__bin.47 D04_M0
+CM_ethiopia__CM_D04_M0_18__bin.76 D04_M0
+CM_ethiopia__CM_D05_I1_18__bin.27 D05_I1
+CM_ethiopia__CM_D05_I1_18__bin.37 D05_I1
+CM_ethiopia__CM_D05_I1_18__bin.7 D05_I1
+CM_ethiopia__CM_D05_M0_18__bin.24 D05_M0
+CM_ethiopia__CM_D05_M0_18__bin.27 D05_M0
+CM_ethiopia__CM_D05_M0_18__bin.42 D05_M0
+CM_ethiopia__CM_D05_M0_18__bin.4 D05_M0
+CM_ethiopia__CM_D05_M0_18__bin.50 D05_M0
+CM_ethiopia__CM_D05_M0_18__bin.52 D05_M0
+CM_ethiopia__CM_D05_M0_18__bin.54 D05_M0
+CM_ethiopia__CM_D05_M0_18__bin.57 D05_M0
+CM_ethiopia__CM_D05_M0_18__bin.59 D05_M0
+CM_ethiopia__CM_D05_M0_18__bin.93 D05_M0
+CM_ethiopia__CM_D06_I1_18__bin.21 D06_I1
+CM_ethiopia__CM_D06_I1_18__bin.42 D06_I1
+CM_ethiopia__CM_D06_I1_18__bin.43 D06_I1
+CM_ethiopia__CM_D06_M0_18__bin.10 D06_M0
+CM_ethiopia__CM_D06_M0_18__bin.22 D06_M0
+CM_ethiopia__CM_D06_M0_18__bin.39 D06_M0
+CM_ethiopia__CM_D06_M0_18__bin.40 D06_M0
+CM_ethiopia__CM_D06_M0_18__bin.41 D06_M0
+CM_ethiopia__CM_D06_M0_18__bin.42 D06_M0
+CM_ethiopia__CM_D06_M0_18__bin.7 D06_M0
+CM_ethiopia__CM_D07_I1_18__bin.13 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.1 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.23 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.30 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.32 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.38 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.44 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.48 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.49 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.4 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.53 D07_I1
+CM_ethiopia__CM_D07_I1_18__bin.9 D07_I1
+CM_ethiopia__CM_D07_M0_18__bin.18 D07_M0
+CM_ethiopia__CM_D07_M0_18__bin.19 D07_M0
+CM_ethiopia__CM_D07_M0_18__bin.23 D07_M0
+CM_ethiopia__CM_D07_M0_18__bin.40 D07_M0
+CM_ethiopia__CM_D07_M0_18__bin.44 D07_M0
+CM_ethiopia__CM_D07_M0_18__bin.73 D07_M0
+CM_ethiopia__CM_D07_M0_18__bin.78 D07_M0
+CM_ethiopia__CM_D07_M0_18__bin.80 D07_M0
+CM_ethiopia__CM_D07_M0_18__bin.81 D07_M0
+CM_ethiopia__CM_D08_I1_18__bin.1 D08_I1
+CM_ethiopia__CM_D08_I1_18__bin.21 D08_I1
+CM_ethiopia__CM_D08_I1_18__bin.22 D08_I1
+CM_ethiopia__CM_D08_I1_18__bin.24 D08_I1
+CM_ethiopia__CM_D08_I1_18__bin.5 D08_I1
+CM_ethiopia__CM_D08_M0_18__bin.14 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.17 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.18 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.1 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.21 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.24 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.29 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.31 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.34 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.3 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.41 D08_M0
+CM_ethiopia__CM_D08_M0_18__bin.43 D08_M0
+CM_ethiopia__CM_D09_I1_18__bin.17 D09_I1
+CM_ethiopia__CM_D09_I1_18__bin.19 D09_I1
+CM_ethiopia__CM_D09_I1_18__bin.39 D09_I1
+CM_ethiopia__CM_D09_I1_18__bin.50 D09_I1
+CM_ethiopia__CM_D09_M0_18__bin.11 D09_M0
+CM_ethiopia__CM_D09_M0_18__bin.22 D09_M0
+CM_ethiopia__CM_D09_M0_18__bin.25 D09_M0
+CM_ethiopia__CM_D09_M0_18__bin.28 D09_M0
+CM_ethiopia__CM_D09_M0_18__bin.37 D09_M0
+CM_ethiopia__CM_D09_M0_18__bin.39 D09_M0
+CM_ethiopia__CM_D09_M0_18__bin.40 D09_M0
+CM_ethiopia__CM_D09_M0_18__bin.9 D09_M0
+CM_ethiopia__CM_D10_I1_18__bin.10 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.13 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.1 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.26 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.29 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.2 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.31 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.32 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.41 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.43 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.4 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.50 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.55 D10_I1
+CM_ethiopia__CM_D10_I1_18__bin.9 D10_I1
+CM_ethiopia__CM_D10_M0_18__bin.109 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.120 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.129 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.136 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.140 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.141 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.145 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.20 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.26 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.31 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.50 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.53 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.57 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.59 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.60 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.62 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.67 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.6 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.73 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.74 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.76 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.77 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.79 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.82 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.8 D10_M0
+CM_ethiopia__CM_D10_M0_18__bin.97 D10_M0
+CM_ethiopia__CM_D11_I1_18__bin.16 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.19 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.23 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.32 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.38 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.41 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.43 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.47 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.57 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.58 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.67 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.69 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.71 D11_I1
+CM_ethiopia__CM_D11_I1_18__bin.73 D11_I1
+CM_ethiopia__CM_D11_M0_18__bin.11 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.14 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.29 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.36 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.39 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.49 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.52 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.55 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.61 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.64 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.67 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.68 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.70 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.8 D11_M0
+CM_ethiopia__CM_D11_M0_18__bin.9 D11_M0
+CM_ethiopia__CM_D13_I1_18__bin.17 D13_I1
+CM_ethiopia__CM_D13_I1_18__bin.25 D13_I1
+CM_ethiopia__CM_D13_I1_18__bin.36 D13_I1
+CM_ethiopia__CM_D13_I1_18__bin.6 D13_I1
+CM_ethiopia__CM_D13_M0_18__bin.11 D13_M0
+CM_ethiopia__CM_D13_M0_18__bin.18 D13_M0
+CM_ethiopia__CM_D13_M0_18__bin.19 D13_M0
+CM_ethiopia__CM_D13_M0_18__bin.22 D13_M0
+CM_ethiopia__CM_D13_M0_18__bin.23 D13_M0
+CM_ethiopia__CM_D13_M0_18__bin.2 D13_M0
+CM_ethiopia__CM_D13_M0_18__bin.4 D13_M0
+CM_ethiopia__CM_D15_I1_18__bin.32 D15_I1
+CM_ethiopia__CM_D15_M0_18__bin.54 D15_M0
+CM_ethiopia__CM_D15_M0_18__bin.5 D15_M0
+CM_ethiopia__CM_D15_M0_18__bin.65 D15_M0
+CM_ethiopia__CM_D15_M0_18__bin.6 D15_M0
+CM_ethiopia__CM_D21B_I12_18__bin.4 D21B_I12
+CM_ethiopia__CM_D21_I1_18__bin.10 D21_I1
+CM_ethiopia__CM_D21_I1_18__bin.21 D21_I1
+CM_ethiopia__CM_D21_I1_18__bin.26 D21_I1
+CM_ethiopia__CM_D21_I1_18__bin.2 D21_I1
+CM_ethiopia__CM_D21_I1_18__bin.31 D21_I1
+CM_ethiopia__CM_D21_I1_18__bin.32 D21_I1
+CM_ethiopia__CM_D21_I1_18__bin.39 D21_I1
+CM_ethiopia__CM_D21_I1_18__bin.44 D21_I1
+CM_ethiopia__CM_D21_M0_18__bin.14 D21_M0
+CM_ethiopia__CM_D21_M0_18__bin.30 D21_M0
+CM_ethiopia__CM_D21_M0_18__bin.36 D21_M0
+CM_ethiopia__CM_D21_M0_18__bin.42 D21_M0
+CM_ethiopia__CM_D21_M0_18__bin.48 D21_M0
+CM_ethiopia__CM_D21_M0_18__bin.58 D21_M0
+CM_ethiopia__CM_D21_M0_18__bin.59 D21_M0
+CM_ethiopia__CM_D21_M0_18__bin.7 D21_M0
+CM_ethiopia__CM_D24_I1_18__bin.16 D24_I1
+CM_ethiopia__CM_D24_I1_18__bin.21 D24_I1
+CM_ethiopia__CM_D24_I1_18__bin.33 D24_I1
+CM_ethiopia__CM_D24_I1_18__bin.52 D24_I1
+CM_ethiopia__CM_D24_I1_18__bin.57 D24_I1
+CM_ethiopia__CM_D24_I1_18__bin.59 D24_I1
+CM_ethiopia__CM_D24_I1_18__bin.71 D24_I1
+CM_ethiopia__CM_D24_I1_18__bin.77 D24_I1
+CM_ethiopia__CM_D24_I1_18__bin.82 D24_I1
+CM_ethiopia__CM_D24_M0_18__bin.18 D24_M0
+CM_ethiopia__CM_D24_M0_18__bin.26 D24_M0
+CM_ethiopia__CM_D24_M0_18__bin.36 D24_M0
+CM_ethiopia__CM_D24_M0_18__bin.58 D24_M0
+CM_ethiopia__CM_D24_M0_18__bin.72 D24_M0
+CM_ethiopia__CM_D24_M0_18__bin.9 D24_M0
+CM_ethiopia__CM_D26AB_I1_18__bin.20 D26AB_I1
+CM_ethiopia__CM_D26AB_I1_18__bin.22 D26AB_I1
+CM_ethiopia__CM_D26AB_I1_18__bin.25 D26AB_I1
+CM_ethiopia__CM_D26AB_I1_18__bin.38 D26AB_I1
+CM_ethiopia__CM_D26AB_I1_18__bin.44 D26AB_I1
+CM_ethiopia__CM_D26AB_I1_18__bin.8 D26AB_I1
+CM_ethiopia__CM_D26AB_I1_18__bin.9 D26AB_I1
+CM_ethiopia__CM_D26A_I13_18__bin.11 D26A_I13
+CM_ethiopia__CM_D26A_I13_18__bin.13 D26A_I13
+CM_ethiopia__CM_D26A_I13_18__bin.25 D26A_I13
+CM_ethiopia__CM_D26A_I13_18__bin.31 D26A_I13
+CM_ethiopia__CM_D26A_I13_18__bin.33 D26A_I13
+CM_ethiopia__CM_D26K_I12_18__bin.8 D26K_I12
+CM_ethiopia__CM_D26_M0_18__bin.18 D26_M0
+CM_ethiopia__CM_D26_M0_18__bin.25 D26_M0
+CM_ethiopia__CM_D26_M0_18__bin.26 D26_M0
+CM_ethiopia__CM_D26_M0_18__bin.38 D26_M0
+CM_ethiopia__CM_D26_M0_18__bin.57 D26_M0
+CM_ethiopia__CM_D26_M0_18__bin.64 D26_M0
+CM_ethiopia__CM_D33_I1_18__bin.10 D33_I1
+CM_ethiopia__CM_D33_I1_18__bin.13 D33_I1
+CM_ethiopia__CM_D33_M0_18__bin.11 D33_M0
+CM_ethiopia__CM_D33_M0_18__bin.12 D33_M0
+CM_ethiopia__CM_D33_M0_18__bin.19 D33_M0
+CM_ethiopia__CM_D33_M0_18__bin.20 D33_M0
+CM_ethiopia__CM_D33_M0_18__bin.31 D33_M0
+CM_ethiopia__CM_D33_M0_18__bin.34 D33_M0
+CM_ethiopia__CM_D33_M0_18__bin.3 D33_M0
+CM_ethiopia__CM_D39_I1_18__bin.13 D39_I1
+CM_ethiopia__CM_D39_I1_18__bin.15 D39_I1
+CM_ethiopia__CM_D39_I1_18__bin.22 D39_I1
+CM_ethiopia__CM_D39_I1_18__bin.29 D39_I1
+CM_ethiopia__CM_D39_I1_18__bin.9 D39_I1
+CM_ethiopia__CM_D39_M0_18__bin.15 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.23 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.32 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.33 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.35 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.36 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.40 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.44 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.45 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.46 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.52 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.64 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.65 D39_M0
+CM_ethiopia__CM_D39_M0_18__bin.66 D39_M0
+CM_ethiopia__CM_D40_I1_18__bin.11 D40_I1
+CM_ethiopia__CM_D40_I1_18__bin.16 D40_I1
+CM_ethiopia__CM_D40_I1_18__bin.19 D40_I1
+CM_ethiopia__CM_D40_I1_18__bin.23 D40_I1
+CM_ethiopia__CM_D40_I1_18__bin.27 D40_I1
+CM_ethiopia__CM_D40_M0_18__bin.10 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.20 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.21 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.28 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.34 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.35 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.36 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.62 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.63 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.66 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.71 D40_M0
+CM_ethiopia__CM_D40_M0_18__bin.76 D40_M0
+CM_ethiopia__CM_D43_I1_18__bin.13 D43_I1
+CM_ethiopia__CM_D43_I1_18__bin.18 D43_I1
+CM_ethiopia__CM_D43_I1_18__bin.20 D43_I1
+CM_ethiopia__CM_D43_I1_18__bin.30 D43_I1
+CM_ethiopia__CM_D43_I1_18__bin.36 D43_I1
+CM_ethiopia__CM_D43_I1_18__bin.37 D43_I1
+CM_ethiopia__CM_D43_I1_18__bin.42 D43_I1
+CM_ethiopia__CM_D43_I1_18__bin.49 D43_I1
+CM_ethiopia__CM_D43_I1_18__bin.8 D43_I1
+CM_ethiopia__CM_D43_M0_18__bin.12 D43_M0
+CM_ethiopia__CM_D43_M0_18__bin.16 D43_M0
+CM_ethiopia__CM_D43_M0_18__bin.28 D43_M0
+CM_ethiopia__CM_D48_M0_18__bin.11 D48_M0
+CM_ethiopia__CM_D48_M0_18__bin.19 D48_M0
+CM_ethiopia__CM_D48_M0_18__bin.23 D48_M0
+CM_ethiopia__CM_D48_M0_18__bin.24 D48_M0
+CM_ethiopia__CM_D48_M0_18__bin.46 D48_M0
+CM_ethiopia__CM_D50_I1_18__bin.10 D50_I1
+CM_ethiopia__CM_D50_I1_18__bin.23 D50_I1
+CM_ethiopia__CM_D50_I1_18__bin.27 D50_I1
+CM_ethiopia__CM_D50_I1_18__bin.2 D50_I1
+CM_ethiopia__CM_D50_I1_18__bin.3 D50_I1
+CM_ethiopia__CM_D50_I1_18__bin.4 D50_I1
+CM_ethiopia__CM_D50_I1_18__bin.8 D50_I1
+CM_ethiopia__CM_D50_M0_18__bin.12 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.36 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.39 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.42 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.43 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.46 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.49 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.58 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.59 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.60 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.63 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.64 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.67 D50_M0
+CM_ethiopia__CM_D50_M0_18__bin.72 D50_M0
diff --git a/tools/phylophlan/test-data/database_trunc.faa b/tools/phylophlan/test-data/database_trunc.faa
new file mode 100644
index 0000000000..9e9dce750e
--- /dev/null
+++ b/tools/phylophlan/test-data/database_trunc.faa
@@ -0,0 +1,78 @@
+>s--Staphylococcus-aureus_UniRef90-A0A2X2MCQ2_0
+MINWKIRMKQKSFWVAILSAIFLFAQNIAKAIGYDIQVYTEQLTDGLNAILGFLVLTGVI
+QDPTTKGIGDSHQALEYEEPRRNTRR
+>s--Staphylococcus-aureus_UniRef90-A0A380E267_0
+MKTYSEARARLRWYQGRYIDFDGWYGYQCADLAVDYIYWLLEIRMWGNAKDAINNDFKNM
+ATVYENTPSFVPQIGDVAVFTKGIYKQYGHIGLVFNGGNTNQFLILEQNYDGNANTPAKL
+RWDNYYGCTHFIRPKYKSEGLVNKITNKINPPVQKVVGKSASKITVGSKAPYNLKWSKGA
+YFNAKIDGLGATSATRYGDNRTNYRFDVGQAVYAPGTLIYVFEIIDGWCRIYWNNHNEWI
+WHERLIVKEVY
+>s--Staphylococcus-aureus_UniRef90-A0A7U7JQN2_0
+MLTVDQVKELVGEIKDPIIDVPLKETEGIVEVSIKEEKEHVSVKLAMAQLGGAPQLDLQM
+AVVNVLKENGAKTVGIRFETLPEDKVNQFKPKEENKPKTIEGLLSQNNPVEFIAIASGKG
+GVGKSTVAVNLAVALAREGKKVGLVDADIYGFSVPDMMGIDEKPGIKGKEVIPVERHGVK
+VISMAFFVEENAPVIWRGPMLGKMLTNFFTEVKWGDIEYLILDLPPGTGDVALDVHTMLP
+SSKEIIVTTPHPTAAFVAARAGAMAKHTEHSILGVIENMSYFESKETGNKEYVFGKGGGT
+KLADELNTQLLGELPLEQPSWNPKDFSPSIYQPDDRLGKIYSSIAQKVIASTNK
+>s--Staphylococcus-aureus_UniRef90-P31716_0
+MLKNKILATTLSVSLLAPLANPLLENAKAANDTEDIGKGSDIEIIKRTEDKTSNKWGVTQ
+NIQFDFVKDTKYNKDALILKMQGFISSRTTYYNYKKTNHVKAMRWPFQYNIGLKTNDKYV
+SLINYLPKNKIESTNVSQTLGYNIGGNFQSAPSLGGNGSFNYSKSISYTQQNYVSEVEQQ
+NSKSVLWGVKANSFATESGQKSAFDSDLFVGYKPHSKDPRDYFVPDSELPPLVQSGFNPS
+FIATVSHEKGSSDTSEFEITYGRNMDVTHAIKRSTHYGNSYLDGHRVHNAFVNRNYTVKY
+EVNWKTHEIKVKGQN
+>s--Staphylococcus-aureus_UniRef90-Q2FVK8_0
+MPKLILCRHGQSEWNAKNLFTGWEDVNLSEQGINEATRAGEKVRENNIAIDVAFTSLLTR
+ALDTTHYILTESKQQWIPVYKSWRLNERHYGGLQGLNKDDARKEFGEEQVHIWRRSYDVK
+PPAETEEQREAYLADRRYNHLDKRMMPYSESLKDTLVRVIPFWTDHISQYLLDGQTVLVS
+AHGNSIRALIKYLEDVSDEDIINYEIKTGAPLVYELTDDLEVIDKYYL
+>s--Staphylococcus-aureus_UniRef90-Q2FW81_0
+MLDKNQLAKYKQDHLCEYEKIMSNNEKEALEEKVASLDLDFIAKLYNDLYINKKTIDDVS
+AVSEVKYDIKSQMSDDEIKRLEEQGLQAIKEGQFAVLLMAGGQGTRLGYKGPKGSFEIEG
+VSLFELQANQLKTLNHQSGHTIQWYIMTSDINHEETLAYFEAHSYFGYDQEAIHFFKQDN
+IVALSEEGKLILNQQGRIMETPNGNGGVFKSLDKAGYLEEMSNNGVKYIFLNNIDNVLVR
+VLDPLFAGFTVEHDYDITSKTIQPKPGESVGRLVNVDCKDTVLEYSELDPEVANQFNNAN
+IGIHAFKLGFILNAVNRELPYHLAIKNLKQLDENFGVIEQPTLKFELFYFDIFTYGTSFV
+TLQVPREEEFSPLKNKEGKDSVATATEDLRRMGLI
+>s--Staphylococcus-aureus_UniRef90-Q2FW85_0
+MAKVELTTRRRNFIVAVMLISAFVAILNQTLLNTALPSIMRELNINESTSQWLVTGFMLV
+NGVMIPLTAYLMDRIKTRPLYLAAMGTFLLGSIVAALAPNFGVLMLARVIQAMGAGVLMP
+LMQFTLFTLFSKEHRGFAMGLAGLVIQFAPAIGPTVTGLIIDQASWRVPFIIIVGIAILA
+FVFGLVSISSYNEVKYTKLDKRSVMYSTIGFGLMLYAFSSAGDLGFTSPIVIGALILSMV
+IIYLFIRRQFNITNALLNLRVFKNRTFALCTISSMIIMMSMVGPALLIPLYVQNSLSLSA
+LLSGLVIMPGAIINGIMSVFTGKFYDKYGPRPLIYTGFTILTITTIMLCFLHTDTSYTYL
+IVVYAIRMFSVSLLMMPINTTGINSLRNEEISHGTAIMNFGRVMAGSLGTALMVTLMSFG
+AKIFLSTSPSHLTATEIKQQSIAIGVDISFAFVAVLVMAAYVIALFIREPKEIESNRRKF
+>s--Staphylococcus-aureus_UniRef90-Q2G1T0_0
+MVTAIIHGFILAIGLILPLGAQNVFIFNQGANQPKYRYVLPAIITAGLSDSLLIIIAVVG
+VSIIIMSLPVLQAIIYIVGLIFLMYMAWTIWHDKPSTDGETQIMSPMKQVSFALSVSLLN
+PHAILDTIGVIGSSAALYSGSNKIAFTIACISVSWLWFFLLAILGKMVGSIDKTGKLLTI
+INKISSIIIIIVALMILQKLIQLLF
+>s--Staphylococcus-aureus_UniRef90-Q2G222_0
+MPKNKILIYLLSTTLVLPTLVSPTAYADTPQKDTTAKTTSHDSKKSNDDETSKDTTSKDI
+DKADKNNTSNQDNNDKKFKTIDDSTSDSNNIIDFIYKNLPQTNINQLLTKNKYDDNYSLT
+TLIQNLFNLNSDISDYEQPRNGEKSTNDSNKNSDNSIKNDTDTQSSKQDKADNQKAPKSN
+NTKPSTSNKQPNSPKPTQPNQSNSQPASDDKANQKSSSKDNQSMSDSALDSILDQYSEDA
+KKTQKDYASQSKKDKNEKSNTKNPQLPTQDELKHKSKPAQSFNNDVNQKDTRATSLFETD
+PSISNNDDSGQFNVVDSKDTRQFVKSIAKDAHRIGQDNDIYASVMIAQAILESDSGRSAL
+AKSPNHNLFGIKGAFEGNSVPFNTLEADGNQLYSINAGFRKYPSTKESLKDYSDLIKNGI
+DGNRTIYKPTWKSEADSYKDATSHLSKTYATDPNYAKKLNSIIKHYQLTQFDDERMPDLD
+KYERSIKDYDDSSDEFKPFREVSDSMPYPHGQCTWYVYNRMKQFGTSISGDLGDAHNWNN
+RAQYRDYQVSHTPKRHAAVVFEAGQFGADQHYGHVAFVEKVNSDGSIVISESNVKGLGII
+SHRTINAAAAEELSYITGK
+>s--Staphylococcus-aureus_UniRef90-Q5HDD6_0
+MIKNKILTATLAVGLIAPLANPFIEISKAENKIEDIGQGAEIIKRTQDITSKRLAITQNI
+QFDFVKDKKYNKDALVVKMQGFISSRTTYSDLKKYPYIKRMIWPFQYNISLKTKDSNVDL
+INYLPKNKIDSADVSQKLGYNIGGNFQSAPSIGGSGSFNYSKTISYNQKNYVTEVESQNS
+KGVKWGVKANSFVTPNGQVSAYDQYLFAQDPTGPAARDYFVPDNQLPPLIQSGFNPSFIT
+TLSHERGKGDKSEFEITYGRNMDATYAYVTRHRLAVDRKHDAFKNRNVTVKYEVNWKTHE
+VKIKSITPK
+>s--Staphylococcus-aureus_UniRef90-Q931F4_0
+MKNKYISKLLVGAATITLATMISNGEAKASENTQQTSTKHQTTQNNYVTDQQKAFYQVLH
+LKGITEEQRNQYIKTLREHPERAQEVFSESLKDSKNPDRRVAQQNAFYNVLKNDNLTEQE
+KNNYIAQIKENPDRSQQVWVESVQSSKAKERQNIENADKAIKDFQDNKAPHDKSAAYEAN
+SKLPKDLRDKNNRFVEKVSIEKAIVRHDERVKSANDAISKLNEKDSIENRRLAQREVNKA
+PMDVKEHLQKQLDALVAQKDAEKKVAPKVEAPQIQSPQIEKPKAESPKVEVPQSKLLGYY
+QSLKDSFNYGYKYLTDTYKSYKEKYDTAKYYYNTYYKYKGAIDQTVLTVLGSGSKSYIQP
+LKVDDKNGYLAKSYAQVRNYVTESINTGKVLYTFYQNPTLVKTAIKAQETASSIKNTLSN
+LLSFWK
diff --git a/tools/phylophlan/test-data/output.tsv b/tools/phylophlan/test-data/output.tsv
new file mode 100644
index 0000000000..bfd7c8fa28
--- /dev/null
+++ b/tools/phylophlan/test-data/output.tsv
@@ -0,0 +1,2 @@
+#input_bin [u|k]_[S|G|F]GBid:taxa_level:taxonomy:avg_dist
+CM_ethiopia__CM_A06_M0_18__bin.34 is not close to any SGB present in the ethiopia_tutorial database
diff --git a/tools/phylophlan/test-data/output_heatmap_counts.png b/tools/phylophlan/test-data/output_heatmap_counts.png
new file mode 100644
index 0000000000..5320c97d7c
Binary files /dev/null and b/tools/phylophlan/test-data/output_heatmap_counts.png differ
diff --git a/tools/phylophlan/test-data/output_heatmap_pres_abs.png b/tools/phylophlan/test-data/output_heatmap_pres_abs.png
new file mode 100644
index 0000000000..2bb08926ff
Binary files /dev/null and b/tools/phylophlan/test-data/output_heatmap_pres_abs.png differ
diff --git a/tools/phylophlan/test-data/output_metagenomic.tsv b/tools/phylophlan/test-data/output_metagenomic.tsv
new file mode 100644
index 0000000000..cab88ef52b
--- /dev/null
+++ b/tools/phylophlan/test-data/output_metagenomic.tsv
@@ -0,0 +1,365 @@
+#input_bin [u|k]_[S|G|F]GBid:taxa_level:taxonomy:avg_dist
+CM_ethiopia__CM_A01_I1_18__bin.19 uSGB_4894:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Lachnospiraceae_unclassified_SGB4894|t__SGB4894:0.0321575902631579
+CM_ethiopia__CM_A01_I1_18__bin.31 kSGB_4350:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_bacterium|t__SGB4350:0.035591812592592594
+CM_ethiopia__CM_A01_I1_18__bin.42 kSGB_4563:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Mediterraneibacter|s__Ruminococcus_torques|t__SGB4563:0.037374750437317784
+CM_ethiopia__CM_A01_I1_18__bin.5 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.04053020105263159
+CM_ethiopia__CM_A01_I1_18__bin.51 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.03559054139475368
+CM_ethiopia__CM_A01_I1_18__bin.52 kSGB_4940:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Roseburia|s__Roseburia_inulinivorans|t__SGB4940:0.04562117861072903
+CM_ethiopia__CM_A01_I1_18__bin.73 uSGB_19436:Family:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__GGB12503|s__GGB12503_SGB19436|t__SGB19436:0.032458176190476196
+CM_ethiopia__CM_A01_M0_18__bin.21 kSGB_1333:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_bacterium|t__SGB1333:0.024229557692307693
+CM_ethiopia__CM_A01_M0_18__bin.30 uSGB_2230:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_unclassified_SGB2230|t__SGB2230:0.022375910814094777
+CM_ethiopia__CM_A01_M0_18__bin.31 kSGB_9209:Species:k__Bacteria|p__Lentisphaerae|c__Lentisphaeria|o__Lentisphaeria_unclassified|f__Lentisphaeria_unclassified|g__Lentisphaeria_unclassified|s__Lentisphaeria_bacterium|t__SGB9209:0.015718422018348624
+CM_ethiopia__CM_A01_M0_18__bin.43 kSGB_5765:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Acidaminococcales|f__Acidaminococcaceae|g__Phascolarctobacterium|s__Phascolarctobacterium_succinatutens|t__SGB5765:0.04064938601986249
+CM_ethiopia__CM_A01_M0_18__bin.56 kSGB_9203:Species:k__Bacteria|p__Lentisphaerae|c__Lentisphaeria|o__Lentisphaeria_unclassified|f__Lentisphaeria_unclassified|g__Lentisphaeria_unclassified|s__Lentisphaeria_bacterium|t__SGB9203:0.01644279676470588
+CM_ethiopia__CM_A01_M0_18__bin.59 uSGB_19976:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__GGB12851|s__GGB12851_SGB19976|t__SGB19976:0.030983433333333334
+CM_ethiopia__CM_A01_M0_18__bin.60 uSGB_2076:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_unclassified_SGB2076|t__SGB2076:0.024005437423312886
+CM_ethiopia__CM_A01_M0_18__bin.62 kSGB_5904:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__Mitsuokella|s__Mitsuokella_jalaludinii|t__SGB5904:0.021870221544715445
+CM_ethiopia__CM_A01_M0_18__bin.63 kSGB_15467:Species:k__Bacteria|p__Proteobacteria|c__Deltaproteobacteria|o__Desulfovibrionales|f__Desulfovibrionaceae|g__Desulfovibrio|s__Desulfovibrio_piger|t__SGB15467:0.023819577638888895
+CM_ethiopia__CM_A04_I1_18__bin.1 kSGB_4716:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lacrimispora|s__Lacrimispora_amygdalina|t__SGB4716:0.037654118810679614
+CM_ethiopia__CM_A04_I1_18__bin.2 uSGB_14439:Genus:k__Bacteria|p__Actinobacteria|c__Coriobacteriia|o__Coriobacteriales|f__Coriobacteriaceae|g__Collinsella|s__Collinsella_SGB14439|t__SGB14439:0.06418826730769231
+CM_ethiopia__CM_A04_I1_18__bin.42 kSGB_19444:Species:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__Campylobacter|s__Campylobacter_jejuni|t__SGB19444:0.01665842264392324
+CM_ethiopia__CM_A04_M0_18__bin.15 kSGB_5904:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__Mitsuokella|s__Mitsuokella_jalaludinii|t__SGB5904:0.022711207845528457
+CM_ethiopia__CM_A04_M0_18__bin.16 uSGB_2230:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_unclassified_SGB2230|t__SGB2230:0.022738580923450786
+CM_ethiopia__CM_A04_M0_18__bin.8 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.030365172766048203
+CM_ethiopia__CM_A06_I1_18__bin.31 uSGB_1437:Other:k__Bacteria|p__Bacteroidetes|c__CFGB544|o__OFGB544|f__FGB544|g__GGB1123|s__GGB1123_SGB1437|t__SGB1437:0.02269366791262136
+CM_ethiopia__CM_A06_I1_18__bin.32 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.0218392411299435
+CM_ethiopia__CM_A06_I1_18__bin.34 uSGB_2230:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_unclassified_SGB2230|t__SGB2230:0.024418974191980556
+CM_ethiopia__CM_A06_I1_18__bin.37 kSGB_19692:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19692:0.021414286354166662
+CM_ethiopia__CM_A06_I1_18__bin.46 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.033303842259543616
+CM_ethiopia__CM_A06_I1_18__bin.54 kSGB_2075:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_bacterium|t__SGB2075:0.019615276206896553
+CM_ethiopia__CM_A06_M0_18__bin.19 kSGB_19692:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19692:0.021415001979166667
+CM_ethiopia__CM_A06_M0_18__bin.2 uSGB_2230:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_unclassified_SGB2230|t__SGB2230:0.02487240189550425
+CM_ethiopia__CM_A06_M0_18__bin.24 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.02168037502824859
+CM_ethiopia__CM_A06_M0_18__bin.31 kSGB_4285:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcus|s__Ruminococcus_bromii|t__SGB4285:0.04570293804561542
+CM_ethiopia__CM_A06_M0_18__bin.34 kSGB_66053:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Roseburia|s__Roseburia_sp_MUC_MUC_530_WT_4D|t__SGB66053:0.059212150000000005
+CM_ethiopia__CM_A06_M0_18__bin.36 kSGB_2075:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_bacterium|t__SGB2075:0.0198921175862069
+CM_ethiopia__CM_A06_M0_18__bin.39 kSGB_7061:Species:k__Bacteria|p__Firmicutes|c__Bacilli|o__Lactobacillales|f__Lactobacillaceae|g__Ligilactobacillus|s__Ligilactobacillus_ruminis|t__SGB7061:0.02888113339517625
+CM_ethiopia__CM_A06_M0_18__bin.9 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.034505634763275755
+CM_ethiopia__CM_D02_I1_18__bin.2 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.037184771315789476
+CM_ethiopia__CM_D02_I1_18__bin.21 kSGB_4940:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Roseburia|s__Roseburia_inulinivorans|t__SGB4940:0.040451880055020636
+CM_ethiopia__CM_D02_I1_18__bin.24 kSGB_1475:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroidaceae_unclassified|s__Bacteroidaceae_bacterium|t__SGB1475:0.024409391818181816
+CM_ethiopia__CM_D02_I1_18__bin.31 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.03249809963744935
+CM_ethiopia__CM_D02_I1_18__bin.46 uSGB_6973:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__GGB4979|s__GGB4979_SGB6973|t__SGB6973:0.03509609662447257
+CM_ethiopia__CM_D02_I1_18__bin.49 kSGB_5765:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Acidaminococcales|f__Acidaminococcaceae|g__Phascolarctobacterium|s__Phascolarctobacterium_succinatutens|t__SGB5765:0.042205436287242167
+CM_ethiopia__CM_D02_M0_18__bin.17 kSGB_5904:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__Mitsuokella|s__Mitsuokella_jalaludinii|t__SGB5904:0.02257218024390244
+CM_ethiopia__CM_D02_M0_18__bin.21 kSGB_8595:Species:k__Bacteria|p__Candidatus_Melainabacteria|c__Candidatus_Melainabacteria_unclassified|o__Candidatus_Gastranaerophilales|f__Candidatus_Gastranaerophilales_unclassified|g__Candidatus_Gastranaerophilales_unclassified|s__Candidatus_Gastranaerophilales_bacterium|t__SGB8595:0.01280233394736842
+CM_ethiopia__CM_D02_M0_18__bin.23 uSGB_4890:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Lachnospiraceae_unclassified_SGB4890|t__SGB4890:0.02620155625
+CM_ethiopia__CM_D02_M0_18__bin.25 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.0300982457880145
+CM_ethiopia__CM_D02_M0_18__bin.3 kSGB_1853:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroides|s__Bacteroides_fragilis|t__SGB1853:0.021933116666666665
+CM_ethiopia__CM_D02_M0_18__bin.4 kSGB_714:Species:k__Archaea|p__Euryarchaeota|c__Methanobacteria|o__Methanobacteriales|f__Methanobacteriaceae|g__Methanobrevibacter|s__Methanobrevibacter_smithii|t__SGB714:0.022009852936910802
+CM_ethiopia__CM_D02_M0_18__bin.49 uSGB_1437:Other:k__Bacteria|p__Bacteroidetes|c__CFGB544|o__OFGB544|f__FGB544|g__GGB1123|s__GGB1123_SGB1437|t__SGB1437:0.0230746927184466
+CM_ethiopia__CM_D02_M0_18__bin.61 kSGB_9202:Species:k__Bacteria|p__Lentisphaerae|c__Lentisphaeria|o__Victivallales|f__Victivallaceae|g__Victivallis|s__Victivallis_vadensis|t__SGB9202:0.018689171962616824
+CM_ethiopia__CM_D02_M0_18__bin.62 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.02604421055900621
+CM_ethiopia__CM_D03_I12_18__bin.27 uSGB_14980:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Clostridiaceae|g__GGB9568|s__GGB9568_SGB14980|t__SGB14980:0.024585907200000003
+CM_ethiopia__CM_D03_I12_18__bin.33 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.02024565118644068
+CM_ethiopia__CM_D03_I12_18__bin.34 kSGB_3548:Species:k__Bacteria|p__Spirochaetes|c__Spirochaetia|o__Spirochaetia_unclassified|f__Spirochaetia_unclassified|g__Spirochaetia_unclassified|s__Spirochaetia_bacterium|t__SGB3548:0.02412463823529412
+CM_ethiopia__CM_D03_I12_18__bin.5 uSGB_1701:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__GGB1267|s__GGB1267_SGB1701|t__SGB1701:0.021216877375000002
+CM_ethiopia__CM_D03_M0_18__bin.30 uSGB_2076:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_unclassified_SGB2076|t__SGB2076:0.02347683251533742
+CM_ethiopia__CM_D03_M0_18__bin.44 kSGB_2021:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_bacterium|t__SGB2021:0.03222965960264901
+CM_ethiopia__CM_D03_M0_18__bin.45 uSGB_19436:Family:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__GGB12503|s__GGB12503_SGB19436|t__SGB19436:0.032545289285714284
+CM_ethiopia__CM_D03_M0_18__bin.62 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.021596757853107343
+CM_ethiopia__CM_D03_M0_18__bin.63 uSGB_1024:Other:k__Archaea|p__Euryarchaeota|c__CFGB343|o__OFGB343|f__FGB343|g__GGB781|s__GGB781_SGB1024|t__SGB1024:0.027763024661246614
+CM_ethiopia__CM_D03_M0_18__bin.64 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.028853236459627327
+CM_ethiopia__CM_D03_M0_18__bin.65 uSGB_2214:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1617|s__GGB1617_SGB2214|t__SGB2214:0.025928870909090913
+CM_ethiopia__CM_D03_M0_18__bin.67 kSGB_1404:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroidaceae_unclassified|s__Bacteroidaceae_bacterium|t__SGB1404:0.016574511313131316
+CM_ethiopia__CM_D03_M0_18__bin.69 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.037718670263157894
+CM_ethiopia__CM_D04_I1_18__bin.1 kSGB_5765:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Acidaminococcales|f__Acidaminococcaceae|g__Phascolarctobacterium|s__Phascolarctobacterium_succinatutens|t__SGB5765:0.04149574178762414
+CM_ethiopia__CM_D04_I1_18__bin.12 kSGB_4335:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_bacterium|t__SGB4335:0.022550591692307692
+CM_ethiopia__CM_D04_I1_18__bin.26 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.03944625904243975
+CM_ethiopia__CM_D04_I1_18__bin.33 uSGB_19436:Family:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__GGB12503|s__GGB12503_SGB19436|t__SGB19436:0.032972708333333337
+CM_ethiopia__CM_D04_I1_18__bin.35 kSGB_4540:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Anaerostipes|s__Anaerostipes_hadrus|t__SGB4540:0.03343807104123946
+CM_ethiopia__CM_D04_I1_18__bin.36 uSGB_2240:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1632|s__GGB1632_SGB2240|t__SGB2240:0.03582656050955414
+CM_ethiopia__CM_D04_I1_18__bin.39 kSGB_1475:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroidaceae_unclassified|s__Bacteroidaceae_bacterium|t__SGB1475:0.02569116299465241
+CM_ethiopia__CM_D04_I1_18__bin.44 kSGB_14993:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Agathobaculum|s__Agathobaculum_butyriciproducens|t__SGB14993:0.035852457205623904
+CM_ethiopia__CM_D04_I1_18__bin.47 kSGB_6754:Species:k__Bacteria|p__Firmicutes|c__Erysipelotrichia|o__Erysipelotrichales|f__Erysipelotrichaceae|g__Faecalibacillus|s__Faecalibacillus_intestinalis|t__SGB6754:0.031273649734395746
+CM_ethiopia__CM_D04_I1_18__bin.8 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.021270506700564976
+CM_ethiopia__CM_D04_M0_18__bin.42 kSGB_2075:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_bacterium|t__SGB2075:0.02010362379310345
+CM_ethiopia__CM_D04_M0_18__bin.47 kSGB_15447:Species:k__Bacteria|p__Proteobacteria|c__Deltaproteobacteria|o__Desulfovibrionales|f__Desulfovibrionaceae|g__Desulfovibrionaceae_unclassified|s__Desulfovibrionaceae_bacterium|t__SGB15447:0.022900349822064056
+CM_ethiopia__CM_D04_M0_18__bin.76 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.02028208033898305
+CM_ethiopia__CM_D05_I1_18__bin.27 kSGB_19434:Species:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__Campylobacteraceae_unclassified|s__Campylobacteraceae_bacterium|t__SGB19434:0.021683595806451614
+CM_ethiopia__CM_D05_I1_18__bin.37 uSGB_4664:Other:k__Bacteria|p__Firmicutes|c__CFGB1424|o__OFGB1424|f__FGB1424|g__GGB3490|s__GGB3490_SGB4664|t__SGB4664:0.026189018749999998
+CM_ethiopia__CM_D05_I1_18__bin.7 uSGB_4890:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Lachnospiraceae_unclassified_SGB4890|t__SGB4890:0.02281281875
+CM_ethiopia__CM_D05_M0_18__bin.24 uSGB_4372:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_unclassified_SGB4372|t__SGB4372:0.020020442857142856
+CM_ethiopia__CM_D05_M0_18__bin.27 uSGB_2237:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1629|s__GGB1629_SGB2237|t__SGB2237:0.03719957027027026
+CM_ethiopia__CM_D05_M0_18__bin.4 uSGB_13976:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__GGB9059|s__GGB9059_SGB13976|t__SGB13976:0.02635656379781421
+CM_ethiopia__CM_D05_M0_18__bin.42 kSGB_4262:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcus|s__Ruminococcus_bicirculans|t__SGB4262:0.03198925178845171
+CM_ethiopia__CM_D05_M0_18__bin.50 kSGB_1855:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroides|s__Bacteroides_fragilis|t__SGB1855:0.017717912779661015
+CM_ethiopia__CM_D05_M0_18__bin.52 uSGB_1701:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__GGB1267|s__GGB1267_SGB1701|t__SGB1701:0.020903162500000003
+CM_ethiopia__CM_D05_M0_18__bin.54 kSGB_4285:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcus|s__Ruminococcus_bromii|t__SGB4285:0.03201108596146284
+CM_ethiopia__CM_D05_M0_18__bin.57 kSGB_19434:Species:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__Campylobacteraceae_unclassified|s__Campylobacteraceae_bacterium|t__SGB19434:0.02145104725806451
+CM_ethiopia__CM_D05_M0_18__bin.59 kSGB_4938:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Roseburia|s__Roseburia_sp_AF02_12|t__SGB4938:0.02524454456780333
+CM_ethiopia__CM_D05_M0_18__bin.93 kSGB_9210:Species:k__Bacteria|p__Lentisphaerae|c__Lentisphaeria|o__Lentisphaeria_unclassified|f__Lentisphaeria_unclassified|g__Lentisphaeria_unclassified|s__Lentisphaeria_bacterium|t__SGB9210:0.019514726373626372
+CM_ethiopia__CM_D06_I1_18__bin.21 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03673517719298246
+CM_ethiopia__CM_D06_I1_18__bin.42 uSGB_4327:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__GGB3277|s__GGB3277_SGB4327|t__SGB4327:0.027861904666234606
+CM_ethiopia__CM_D06_I1_18__bin.43 uSGB_19436:Family:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__GGB12503|s__GGB12503_SGB19436|t__SGB19436:0.03363195357142858
+CM_ethiopia__CM_D06_M0_18__bin.10 uSGB_6973:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__GGB4979|s__GGB4979_SGB6973|t__SGB6973:0.03613631054852321
+CM_ethiopia__CM_D06_M0_18__bin.22 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.02828699814459373
+CM_ethiopia__CM_D06_M0_18__bin.39 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.021422726011299433
+CM_ethiopia__CM_D06_M0_18__bin.40 kSGB_3539:Species:k__Bacteria|p__Spirochaetes|c__Spirochaetia|o__Spirochaetia_unclassified|f__Spirochaetia_unclassified|g__Spirochaetia_unclassified|s__Spirochaetia_bacterium|t__SGB3539:0.015086198863636362
+CM_ethiopia__CM_D06_M0_18__bin.41 kSGB_714:Species:k__Archaea|p__Euryarchaeota|c__Methanobacteria|o__Methanobacteriales|f__Methanobacteriaceae|g__Methanobrevibacter|s__Methanobrevibacter_smithii|t__SGB714:0.017517191007976798
+CM_ethiopia__CM_D06_M0_18__bin.42 uSGB_26990:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB18271|s__GGB18271_SGB26990|t__SGB26990:0.01416074142857143
+CM_ethiopia__CM_D06_M0_18__bin.7 uSGB_1701:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__GGB1267|s__GGB1267_SGB1701|t__SGB1701:0.02138389541666667
+CM_ethiopia__CM_D07_I1_18__bin.1 kSGB_10068:Species:k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Enterobacterales|f__Enterobacteriaceae|g__Escherichia|s__Escherichia_coli|t__SGB10068:0.021332762789101605
+CM_ethiopia__CM_D07_I1_18__bin.13 uSGB_4303:Other:k__Bacteria|p__Firmicutes|c__CFGB1340|o__OFGB1340|f__FGB1340|g__GGB3256|s__GGB3256_SGB4303|t__SGB4303:0.02847675687530803
+CM_ethiopia__CM_D07_I1_18__bin.23 uSGB_2076:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_unclassified_SGB2076|t__SGB2076:0.02353445337423313
+CM_ethiopia__CM_D07_I1_18__bin.30 kSGB_1408:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroidaceae_unclassified|s__Bacteroidaceae_bacterium|t__SGB1408:0.025046275641025642
+CM_ethiopia__CM_D07_I1_18__bin.32 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.021253345423728812
+CM_ethiopia__CM_D07_I1_18__bin.38 kSGB_2295:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Alistipes|s__Alistipes_shahii|t__SGB2295:0.017644593427970555
+CM_ethiopia__CM_D07_I1_18__bin.4 kSGB_9226:Species:k__Bacteria|p__Verrucomicrobia|c__Verrucomicrobiae|o__Verrucomicrobiales|f__Akkermansiaceae|g__Akkermansia|s__Akkermansia_muciniphila|t__SGB9226:0.022643940591467356
+CM_ethiopia__CM_D07_I1_18__bin.44 kSGB_1949:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Tannerellaceae|g__Parabacteroides|s__Parabacteroides_merdae|t__SGB1949:0.01594793287222809
+CM_ethiopia__CM_D07_I1_18__bin.48 kSGB_4285:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcus|s__Ruminococcus_bromii|t__SGB4285:0.029072833326779395
+CM_ethiopia__CM_D07_I1_18__bin.49 uSGB_13976:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__GGB9059|s__GGB9059_SGB13976|t__SGB13976:0.02688394453551913
+CM_ethiopia__CM_D07_I1_18__bin.53 kSGB_1965:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Barnesiellaceae|g__Barnesiella|s__Barnesiella_intestinihominis|t__SGB1965:0.01897670766252955
+CM_ethiopia__CM_D07_I1_18__bin.9 kSGB_1836:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroides|s__Bacteroides_uniformis|t__SGB1836:0.023904933409807132
+CM_ethiopia__CM_D07_M0_18__bin.18 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.028727236024844716
+CM_ethiopia__CM_D07_M0_18__bin.19 uSGB_26990:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB18271|s__GGB18271_SGB26990|t__SGB26990:0.015226757142857145
+CM_ethiopia__CM_D07_M0_18__bin.23 kSGB_4272:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcus|s__Ruminococcus_sp_JE7A12|t__SGB4272:0.027610883665338645
+CM_ethiopia__CM_D07_M0_18__bin.40 kSGB_3546:Species:k__Bacteria|p__Spirochaetes|c__Spirochaetia|o__Spirochaetales|f__Spirochaetaceae|g__Treponema|s__Treponema_succinifaciens|t__SGB3546:0.02012432380952381
+CM_ethiopia__CM_D07_M0_18__bin.44 kSGB_2229:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_bacterium|t__SGB2229:0.024130417094017094
+CM_ethiopia__CM_D07_M0_18__bin.73 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.02030263152542373
+CM_ethiopia__CM_D07_M0_18__bin.78 kSGB_3548:Species:k__Bacteria|p__Spirochaetes|c__Spirochaetia|o__Spirochaetia_unclassified|f__Spirochaetia_unclassified|g__Spirochaetia_unclassified|s__Spirochaetia_bacterium|t__SGB3548:0.022464210294117645
+CM_ethiopia__CM_D07_M0_18__bin.80 uSGB_4328:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__GGB3278|s__GGB3278_SGB4328|t__SGB4328:0.021747616975308644
+CM_ethiopia__CM_D07_M0_18__bin.81 kSGB_4262:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcus|s__Ruminococcus_bicirculans|t__SGB4262:0.03087436561062851
+CM_ethiopia__CM_D08_I1_18__bin.1 kSGB_5115:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Coprococcus|s__Coprococcus_sp_OM04_5BH|t__SGB5115:0.017265259798994976
+CM_ethiopia__CM_D08_I1_18__bin.21 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.020066164745762713
+CM_ethiopia__CM_D08_I1_18__bin.22 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.03401490985284709
+CM_ethiopia__CM_D08_I1_18__bin.24 kSGB_5904:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__Mitsuokella|s__Mitsuokella_jalaludinii|t__SGB5904:0.024617650813008127
+CM_ethiopia__CM_D08_I1_18__bin.5 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03866051754385965
+CM_ethiopia__CM_D08_M0_18__bin.1 kSGB_19692:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19692:0.0199903340625
+CM_ethiopia__CM_D08_M0_18__bin.14 uSGB_2230:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_unclassified_SGB2230|t__SGB2230:0.02349544459295261
+CM_ethiopia__CM_D08_M0_18__bin.17 kSGB_19434:Species:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__Campylobacteraceae_unclassified|s__Campylobacteraceae_bacterium|t__SGB19434:0.023360407419354835
+CM_ethiopia__CM_D08_M0_18__bin.18 kSGB_714:Species:k__Archaea|p__Euryarchaeota|c__Methanobacteria|o__Methanobacteriales|f__Methanobacteriaceae|g__Methanobrevibacter|s__Methanobrevibacter_smithii|t__SGB714:0.016190648498912257
+CM_ethiopia__CM_D08_M0_18__bin.21 kSGB_3546:Species:k__Bacteria|p__Spirochaetes|c__Spirochaetia|o__Spirochaetales|f__Spirochaetaceae|g__Treponema|s__Treponema_succinifaciens|t__SGB3546:0.01888655894179894
+CM_ethiopia__CM_D08_M0_18__bin.24 kSGB_5065:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Butyrivibrio|s__Butyrivibrio_crossotus|t__SGB5065:0.028811107293666028
+CM_ethiopia__CM_D08_M0_18__bin.29 kSGB_1475:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroidaceae_unclassified|s__Bacteroidaceae_bacterium|t__SGB1475:0.024320632192513368
+CM_ethiopia__CM_D08_M0_18__bin.3 kSGB_4285:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcus|s__Ruminococcus_bromii|t__SGB4285:0.04425564889893826
+CM_ethiopia__CM_D08_M0_18__bin.31 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03719356475438597
+CM_ethiopia__CM_D08_M0_18__bin.34 uSGB_6973:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__GGB4979|s__GGB4979_SGB6973|t__SGB6973:0.0356452894514768
+CM_ethiopia__CM_D08_M0_18__bin.41 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.026033423512476006
+CM_ethiopia__CM_D08_M0_18__bin.43 kSGB_2075:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_bacterium|t__SGB2075:0.018980628620689655
+CM_ethiopia__CM_D09_I1_18__bin.17 kSGB_1473:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroidaceae_unclassified|s__Bacteroidaceae_bacterium|t__SGB1473:0.023315838333333335
+CM_ethiopia__CM_D09_I1_18__bin.19 kSGB_6783:Species:k__Bacteria|p__Firmicutes|c__Erysipelotrichia|o__Erysipelotrichales|f__Erysipelotrichaceae|g__Catenibacterium|s__Catenibacterium_sp_AM22_15|t__SGB6783:0.0383189283295711
+CM_ethiopia__CM_D09_I1_18__bin.39 uSGB_4886:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3614|s__GGB3614_SGB4886|t__SGB4886:0.022254304488778055
+CM_ethiopia__CM_D09_I1_18__bin.50 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03665488789473684
+CM_ethiopia__CM_D09_M0_18__bin.11 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03707280315789473
+CM_ethiopia__CM_D09_M0_18__bin.22 uSGB_1024:Other:k__Archaea|p__Euryarchaeota|c__CFGB343|o__OFGB343|f__FGB343|g__GGB781|s__GGB781_SGB1024|t__SGB1024:0.02888795149051491
+CM_ethiopia__CM_D09_M0_18__bin.25 kSGB_8021:Species:k__Bacteria|p__Firmicutes|c__Bacilli|o__Lactobacillales|f__Streptococcaceae|g__Streptococcus|s__Streptococcus_lutetiensis|t__SGB8021:0.01528407674033149
+CM_ethiopia__CM_D09_M0_18__bin.28 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.03013315607805502
+CM_ethiopia__CM_D09_M0_18__bin.37 kSGB_10068:Species:k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Enterobacterales|f__Enterobacteriaceae|g__Escherichia|s__Escherichia_coli|t__SGB10068:0.021090136451313277
+CM_ethiopia__CM_D09_M0_18__bin.39 uSGB_4303:Other:k__Bacteria|p__Firmicutes|c__CFGB1340|o__OFGB1340|f__FGB1340|g__GGB3256|s__GGB3256_SGB4303|t__SGB4303:0.028159944603252836
+CM_ethiopia__CM_D09_M0_18__bin.40 uSGB_1701:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__GGB1267|s__GGB1267_SGB1701|t__SGB1701:0.019142116249999997
+CM_ethiopia__CM_D09_M0_18__bin.9 kSGB_3546:Species:k__Bacteria|p__Spirochaetes|c__Spirochaetia|o__Spirochaetales|f__Spirochaetaceae|g__Treponema|s__Treponema_succinifaciens|t__SGB3546:0.020248204444444445
+CM_ethiopia__CM_D10_I1_18__bin.1 kSGB_2301:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Alistipes|s__Alistipes_finegoldii|t__SGB2301:0.02510436442105263
+CM_ethiopia__CM_D10_I1_18__bin.10 kSGB_1613:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__Prevotella|s__Prevotella_copri|t__SGB1613:0.02915100620689655
+CM_ethiopia__CM_D10_I1_18__bin.13 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.0385965949456174
+CM_ethiopia__CM_D10_I1_18__bin.2 kSGB_4837:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Blautia|s__Blautia_wexlerae|t__SGB4837:0.05107277361154691
+CM_ethiopia__CM_D10_I1_18__bin.26 kSGB_19692:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19692:0.020753195833333335
+CM_ethiopia__CM_D10_I1_18__bin.29 uSGB_4303:Other:k__Bacteria|p__Firmicutes|c__CFGB1340|o__OFGB1340|f__FGB1340|g__GGB3256|s__GGB3256_SGB4303|t__SGB4303:0.03003536934450468
+CM_ethiopia__CM_D10_I1_18__bin.31 kSGB_5190:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Anaerotignum|s__Anaerotignum_faecicola|t__SGB5190:0.0310274795256917
+CM_ethiopia__CM_D10_I1_18__bin.32 kSGB_15316:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Faecalibacterium|s__Faecalibacterium_prausnitzii|t__SGB15316:0.032510090447598256
+CM_ethiopia__CM_D10_I1_18__bin.4 uSGB_4939:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Roseburia|s__Roseburia_SGB4939|t__SGB4939:0.05174999090909091
+CM_ethiopia__CM_D10_I1_18__bin.41 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.036088981403508774
+CM_ethiopia__CM_D10_I1_18__bin.43 kSGB_4871:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Faecalicatena|s__Faecalicatena_fissicatena|t__SGB4871:0.025038668704663213
+CM_ethiopia__CM_D10_I1_18__bin.50 kSGB_6783:Species:k__Bacteria|p__Firmicutes|c__Erysipelotrichia|o__Erysipelotrichales|f__Erysipelotrichaceae|g__Catenibacterium|s__Catenibacterium_sp_AM22_15|t__SGB6783:0.03784759616252822
+CM_ethiopia__CM_D10_I1_18__bin.55 kSGB_9273:Species:k__Bacteria|p__Proteobacteria|c__Betaproteobacteria|o__Burkholderiales|f__Sutterellaceae|g__Duodenibacillus|s__Duodenibacillus_massiliensis|t__SGB9273:0.017259645991091314
+CM_ethiopia__CM_D10_I1_18__bin.9 uSGB_19436:Family:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__GGB12503|s__GGB12503_SGB19436|t__SGB19436:0.03400034404761905
+CM_ethiopia__CM_D10_M0_18__bin.109 kSGB_4368:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_bacterium|t__SGB4368:0.018531030952380952
+CM_ethiopia__CM_D10_M0_18__bin.120 uSGB_6973:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__GGB4979|s__GGB4979_SGB6973|t__SGB6973:0.03478694345991561
+CM_ethiopia__CM_D10_M0_18__bin.129 kSGB_4883:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Lachnospiraceae_bacterium|t__SGB4883:0.026223828205128204
+CM_ethiopia__CM_D10_M0_18__bin.140 uSGB_19436:Family:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__GGB12503|s__GGB12503_SGB19436|t__SGB19436:0.032568390773809526
+CM_ethiopia__CM_D10_M0_18__bin.141 kSGB_6970:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadales_unclassified|g__Selenomonadales_unclassified|s__Selenomonadales_bacterium|t__SGB6970:0.019997668421052633
+CM_ethiopia__CM_D10_M0_18__bin.145 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03629123457894737
+CM_ethiopia__CM_D10_M0_18__bin.20 kSGB_19694:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19694:0.024437433962264152
+CM_ethiopia__CM_D10_M0_18__bin.26 uSGB_5099:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3751|s__GGB3751_SGB5099|t__SGB5099:0.01863289090909091
+CM_ethiopia__CM_D10_M0_18__bin.31 uSGB_2214:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1617|s__GGB1617_SGB2214|t__SGB2214:0.025934238181818177
+CM_ethiopia__CM_D10_M0_18__bin.50 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.02179893775141243
+CM_ethiopia__CM_D10_M0_18__bin.53 kSGB_9203:Species:k__Bacteria|p__Lentisphaerae|c__Lentisphaeria|o__Lentisphaeria_unclassified|f__Lentisphaeria_unclassified|g__Lentisphaeria_unclassified|s__Lentisphaeria_bacterium|t__SGB9203:0.016550575686274507
+CM_ethiopia__CM_D10_M0_18__bin.57 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.027513782608695653
+CM_ethiopia__CM_D10_M0_18__bin.59 kSGB_3548:Species:k__Bacteria|p__Spirochaetes|c__Spirochaetia|o__Spirochaetia_unclassified|f__Spirochaetia_unclassified|g__Spirochaetia_unclassified|s__Spirochaetia_bacterium|t__SGB3548:0.02181751029411764
+CM_ethiopia__CM_D10_M0_18__bin.6 uSGB_4373:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_unclassified_SGB4373|t__SGB4373:0.11444471913580247
+CM_ethiopia__CM_D10_M0_18__bin.60 kSGB_9210:Species:k__Bacteria|p__Lentisphaerae|c__Lentisphaeria|o__Lentisphaeria_unclassified|f__Lentisphaeria_unclassified|g__Lentisphaeria_unclassified|s__Lentisphaeria_bacterium|t__SGB9210:0.019368654505494506
+CM_ethiopia__CM_D10_M0_18__bin.62 uSGB_4383:Other:k__Bacteria|p__Firmicutes|c__CFGB1358|o__OFGB1358|f__FGB1358|g__GGB3314|s__GGB3314_SGB4383|t__SGB4383:0.023548200000000002
+CM_ethiopia__CM_D10_M0_18__bin.67 kSGB_4200:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcaceae_unclassified|s__Ruminococcaceae_bacterium|t__SGB4200:0.019383474285714287
+CM_ethiopia__CM_D10_M0_18__bin.73 kSGB_2229:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_bacterium|t__SGB2229:0.024503928205128204
+CM_ethiopia__CM_D10_M0_18__bin.74 uSGB_1024:Other:k__Archaea|p__Euryarchaeota|c__CFGB343|o__OFGB343|f__FGB343|g__GGB781|s__GGB781_SGB1024|t__SGB1024:0.027872528997289973
+CM_ethiopia__CM_D10_M0_18__bin.76 kSGB_14205:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_bacterium|t__SGB14205:0.11534651428571428
+CM_ethiopia__CM_D10_M0_18__bin.77 kSGB_17244:Species:k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Bifidobacteriales|f__Bifidobacteriaceae|g__Bifidobacterium|s__Bifidobacterium_adolescentis|t__SGB17244:0.02472740579310345
+CM_ethiopia__CM_D10_M0_18__bin.8 kSGB_5904:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__Mitsuokella|s__Mitsuokella_jalaludinii|t__SGB5904:0.023576634024390246
+CM_ethiopia__CM_D10_M0_18__bin.82 uSGB_9243:Other:k__Bacteria|p__Proteobacteria|c__CFGB2394|o__OFGB2394|f__FGB2394|g__GGB6544|s__GGB6544_SGB9243|t__SGB9243:0.01981209159663866
+CM_ethiopia__CM_D10_M0_18__bin.97 uSGB_1701:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__GGB1267|s__GGB1267_SGB1701|t__SGB1701:0.021690822916666668
+CM_ethiopia__CM_D11_I1_18__bin.16 kSGB_6817:Species:k__Bacteria|p__Firmicutes|c__Firmicutes_unclassified|o__Firmicutes_unclassified|f__Firmicutes_unclassified|g__Firmicutes_unclassified|s__Firmicutes_bacterium_AM41_11|t__SGB6817:0.013849751061946905
+CM_ethiopia__CM_D11_I1_18__bin.19 kSGB_9273:Species:k__Bacteria|p__Proteobacteria|c__Betaproteobacteria|o__Burkholderiales|f__Sutterellaceae|g__Duodenibacillus|s__Duodenibacillus_massiliensis|t__SGB9273:0.016540447906458797
+CM_ethiopia__CM_D11_I1_18__bin.23 kSGB_4936:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Roseburia|s__Roseburia_hominis|t__SGB4936:0.024950490716180374
+CM_ethiopia__CM_D11_I1_18__bin.32 kSGB_1934:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Tannerellaceae|g__Parabacteroides|s__Parabacteroides_distasonis|t__SGB1934:0.022831115687096212
+CM_ethiopia__CM_D11_I1_18__bin.38 kSGB_1790:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Odoribacteraceae|g__Odoribacter|s__Odoribacter_splanchnicus|t__SGB1790:0.016398938586678055
+CM_ethiopia__CM_D11_I1_18__bin.41 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03819003903508771
+CM_ethiopia__CM_D11_I1_18__bin.43 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.02119712497175141
+CM_ethiopia__CM_D11_I1_18__bin.47 kSGB_7061:Species:k__Bacteria|p__Firmicutes|c__Bacilli|o__Lactobacillales|f__Lactobacillaceae|g__Ligilactobacillus|s__Ligilactobacillus_ruminis|t__SGB7061:0.028093501298701296
+CM_ethiopia__CM_D11_I1_18__bin.57 kSGB_10068:Species:k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Enterobacterales|f__Enterobacteriaceae|g__Escherichia|s__Escherichia_coli|t__SGB10068:0.020593590340574848
+CM_ethiopia__CM_D11_I1_18__bin.58 uSGB_6973:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__GGB4979|s__GGB4979_SGB6973|t__SGB6973:0.034769342278481004
+CM_ethiopia__CM_D11_I1_18__bin.67 kSGB_9283:Species:k__Bacteria|p__Proteobacteria|c__Betaproteobacteria|o__Burkholderiales|f__Sutterellaceae|g__Sutterella|s__Sutterella_wadsworthensis|t__SGB9283:0.0233507723542989
+CM_ethiopia__CM_D11_I1_18__bin.69 kSGB_15452:Species:k__Bacteria|p__Proteobacteria|c__Deltaproteobacteria|o__Desulfovibrionales|f__Desulfovibrionaceae|g__Bilophila|s__Bilophila_wadsworthia|t__SGB15452:0.023001601151761517
+CM_ethiopia__CM_D11_I1_18__bin.71 kSGB_5765:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Acidaminococcales|f__Acidaminococcaceae|g__Phascolarctobacterium|s__Phascolarctobacterium_succinatutens|t__SGB5765:0.042388908174178765
+CM_ethiopia__CM_D11_I1_18__bin.73 kSGB_5190:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Anaerotignum|s__Anaerotignum_faecicola|t__SGB5190:0.03145028529644269
+CM_ethiopia__CM_D11_M0_18__bin.11 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03706913798245614
+CM_ethiopia__CM_D11_M0_18__bin.14 uSGB_2240:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1632|s__GGB1632_SGB2240|t__SGB2240:0.033622282802547775
+CM_ethiopia__CM_D11_M0_18__bin.29 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.02071046485875706
+CM_ethiopia__CM_D11_M0_18__bin.39 uSGB_4372:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_unclassified_SGB4372|t__SGB4372:0.02026614761904762
+CM_ethiopia__CM_D11_M0_18__bin.52 uSGB_2230:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_unclassified_SGB2230|t__SGB2230:0.022798438821385176
+CM_ethiopia__CM_D11_M0_18__bin.55 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.030572115248453827
+CM_ethiopia__CM_D11_M0_18__bin.61 uSGB_1024:Other:k__Archaea|p__Euryarchaeota|c__CFGB343|o__OFGB343|f__FGB343|g__GGB781|s__GGB781_SGB1024|t__SGB1024:0.02766992466124661
+CM_ethiopia__CM_D11_M0_18__bin.64 uSGB_2076:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_unclassified_SGB2076|t__SGB2076:0.02182924643558282
+CM_ethiopia__CM_D11_M0_18__bin.67 uSGB_4348:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__GGB3293|s__GGB3293_SGB4348|t__SGB4348:0.023505065566391595
+CM_ethiopia__CM_D11_M0_18__bin.68 uSGB_19436:Family:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__GGB12503|s__GGB12503_SGB19436|t__SGB19436:0.033016548809523816
+CM_ethiopia__CM_D11_M0_18__bin.70 kSGB_17244:Species:k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Bifidobacteriales|f__Bifidobacteriaceae|g__Bifidobacterium|s__Bifidobacterium_adolescentis|t__SGB17244:0.023832747298850574
+CM_ethiopia__CM_D11_M0_18__bin.8 uSGB_4920:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3632|s__GGB3632_SGB4920|t__SGB4920:0.015620066666666666
+CM_ethiopia__CM_D11_M0_18__bin.9 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.030145264596273296
+CM_ethiopia__CM_D13_I1_18__bin.17 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.02767735608871828
+CM_ethiopia__CM_D13_I1_18__bin.25 kSGB_16955:Species:k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Propionibacteriales|f__Propionibacteriaceae|g__Cutibacterium|s__Cutibacterium_acnes|t__SGB16955:0.01086989962264151
+CM_ethiopia__CM_D13_I1_18__bin.36 kSGB_12308:Species:k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Pseudomonadales|f__Pseudomonadaceae|g__Pseudomonas|s__Pseudomonas_oryzihabitans|t__SGB12308:0.0245435984375
+CM_ethiopia__CM_D13_I1_18__bin.6 uSGB_6927:Other:k__Bacteria|p__Firmicutes|c__CFGB1872|o__OFGB1872|f__FGB1872|g__GGB4964|s__GGB4964_SGB6927|t__SGB6927:0.03409726279069768
+CM_ethiopia__CM_D13_M0_18__bin.11 kSGB_19434:Species:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__Campylobacteraceae_unclassified|s__Campylobacteraceae_bacterium|t__SGB19434:0.021231454838709682
+CM_ethiopia__CM_D13_M0_18__bin.18 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.019654927932203387
+CM_ethiopia__CM_D13_M0_18__bin.19 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03655025675438596
+CM_ethiopia__CM_D13_M0_18__bin.2 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.03231342654084026
+CM_ethiopia__CM_D13_M0_18__bin.22 uSGB_4303:Other:k__Bacteria|p__Firmicutes|c__CFGB1340|o__OFGB1340|f__FGB1340|g__GGB3256|s__GGB3256_SGB4303|t__SGB4303:0.02959525115820601
+CM_ethiopia__CM_D13_M0_18__bin.23 kSGB_5765:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Acidaminococcales|f__Acidaminococcaceae|g__Phascolarctobacterium|s__Phascolarctobacterium_succinatutens|t__SGB5765:0.04187566042780749
+CM_ethiopia__CM_D13_M0_18__bin.4 uSGB_4890:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Lachnospiraceae_unclassified_SGB4890|t__SGB4890:0.0210063125
+CM_ethiopia__CM_D15_I1_18__bin.32 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.0292009301863354
+CM_ethiopia__CM_D15_M0_18__bin.5 kSGB_17244:Species:k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Bifidobacteriales|f__Bifidobacteriaceae|g__Bifidobacterium|s__Bifidobacterium_adolescentis|t__SGB17244:0.02568076935057471
+CM_ethiopia__CM_D15_M0_18__bin.54 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.027952527777777778
+CM_ethiopia__CM_D15_M0_18__bin.6 uSGB_19436:Family:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__GGB12503|s__GGB12503_SGB19436|t__SGB19436:0.032447703154761906
+CM_ethiopia__CM_D15_M0_18__bin.65 kSGB_19692:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19692:0.020352729583333333
+CM_ethiopia__CM_D21B_I12_18__bin.4 kSGB_10068:Species:k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Enterobacterales|f__Enterobacteriaceae|g__Escherichia|s__Escherichia_coli|t__SGB10068:0.027357181168790958
+CM_ethiopia__CM_D21_I1_18__bin.10 uSGB_4303:Other:k__Bacteria|p__Firmicutes|c__CFGB1340|o__OFGB1340|f__FGB1340|g__GGB3256|s__GGB3256_SGB4303|t__SGB4303:0.027743261442582552
+CM_ethiopia__CM_D21_I1_18__bin.2 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.031152088774792065
+CM_ethiopia__CM_D21_I1_18__bin.21 kSGB_8768:Species:k__Bacteria|p__Verrucomicrobia|c__Opitutae|o__Opitutales|f__Opitutales_unclassified|g__Opitutales_unclassified|s__Opitutales_bacterium|t__SGB8768:0.020660228988764042
+CM_ethiopia__CM_D21_I1_18__bin.26 uSGB_2126:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__GGB1543|s__GGB1543_SGB2126|t__SGB2126:0.029611555686274507
+CM_ethiopia__CM_D21_I1_18__bin.31 kSGB_2318:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Alistipes|s__Alistipes_putredinis|t__SGB2318:0.016858436284490963
+CM_ethiopia__CM_D21_I1_18__bin.32 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.036264767517543865
+CM_ethiopia__CM_D21_I1_18__bin.39 uSGB_2214:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1617|s__GGB1617_SGB2214|t__SGB2214:0.026600874363636368
+CM_ethiopia__CM_D21_I1_18__bin.44 kSGB_19692:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19692:0.020716957916666667
+CM_ethiopia__CM_D21_M0_18__bin.14 uSGB_2214:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1617|s__GGB1617_SGB2214|t__SGB2214:0.02671283618181818
+CM_ethiopia__CM_D21_M0_18__bin.30 kSGB_4910:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Lachnospiraceae_bacterium_WCA3_601_WT_6H|t__SGB4910:0.028309220983015956
+CM_ethiopia__CM_D21_M0_18__bin.36 kSGB_8768:Species:k__Bacteria|p__Verrucomicrobia|c__Opitutae|o__Opitutales|f__Opitutales_unclassified|g__Opitutales_unclassified|s__Opitutales_bacterium|t__SGB8768:0.019424386292134832
+CM_ethiopia__CM_D21_M0_18__bin.42 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.03175504916080187
+CM_ethiopia__CM_D21_M0_18__bin.48 kSGB_2318:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Alistipes|s__Alistipes_putredinis|t__SGB2318:0.01525946214240406
+CM_ethiopia__CM_D21_M0_18__bin.58 uSGB_4303:Other:k__Bacteria|p__Firmicutes|c__CFGB1340|o__OFGB1340|f__FGB1340|g__GGB3256|s__GGB3256_SGB4303|t__SGB4303:0.027847230688516512
+CM_ethiopia__CM_D21_M0_18__bin.59 uSGB_20192:Other:k__Bacteria|p__Bacteroidetes|c__CFGB4422|o__OFGB4422|f__FGB4422|g__GGB13020|s__GGB13020_SGB20192|t__SGB20192:0.026230874761904766
+CM_ethiopia__CM_D21_M0_18__bin.7 kSGB_19692:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19692:0.02066290020833333
+CM_ethiopia__CM_D24_I1_18__bin.16 kSGB_3548:Species:k__Bacteria|p__Spirochaetes|c__Spirochaetia|o__Spirochaetia_unclassified|f__Spirochaetia_unclassified|g__Spirochaetia_unclassified|s__Spirochaetia_bacterium|t__SGB3548:0.022377923529411762
+CM_ethiopia__CM_D24_I1_18__bin.21 uSGB_1701:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__GGB1267|s__GGB1267_SGB1701|t__SGB1701:0.021716905416666665
+CM_ethiopia__CM_D24_I1_18__bin.33 uSGB_26990:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB18271|s__GGB18271_SGB26990|t__SGB26990:0.014240885714285712
+CM_ethiopia__CM_D24_I1_18__bin.52 kSGB_4368:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_bacterium|t__SGB4368:0.018302542857142858
+CM_ethiopia__CM_D24_I1_18__bin.57 kSGB_15084:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcaceae_unclassified|s__Ruminococcaceae_bacterium|t__SGB15084:0.035313026250000004
+CM_ethiopia__CM_D24_I1_18__bin.59 kSGB_9210:Species:k__Bacteria|p__Lentisphaerae|c__Lentisphaeria|o__Lentisphaeria_unclassified|f__Lentisphaeria_unclassified|g__Lentisphaeria_unclassified|s__Lentisphaeria_bacterium|t__SGB9210:0.019280890989010983
+CM_ethiopia__CM_D24_I1_18__bin.71 kSGB_1333:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_bacterium|t__SGB1333:0.02428298269230769
+CM_ethiopia__CM_D24_I1_18__bin.77 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.024894785093167702
+CM_ethiopia__CM_D24_I1_18__bin.82 kSGB_6970:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadales_unclassified|g__Selenomonadales_unclassified|s__Selenomonadales_bacterium|t__SGB6970:0.01973624035087719
+CM_ethiopia__CM_D24_M0_18__bin.18 kSGB_19692:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19692:0.021611797916666665
+CM_ethiopia__CM_D24_M0_18__bin.26 kSGB_5765:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Acidaminococcales|f__Acidaminococcaceae|g__Phascolarctobacterium|s__Phascolarctobacterium_succinatutens|t__SGB5765:0.04213284117647059
+CM_ethiopia__CM_D24_M0_18__bin.36 kSGB_3546:Species:k__Bacteria|p__Spirochaetes|c__Spirochaetia|o__Spirochaetales|f__Spirochaetaceae|g__Treponema|s__Treponema_succinifaciens|t__SGB3546:0.018794813227513227
+CM_ethiopia__CM_D24_M0_18__bin.58 kSGB_9210:Species:k__Bacteria|p__Lentisphaerae|c__Lentisphaeria|o__Lentisphaeria_unclassified|f__Lentisphaeria_unclassified|g__Lentisphaeria_unclassified|s__Lentisphaeria_bacterium|t__SGB9210:0.020020817582417583
+CM_ethiopia__CM_D24_M0_18__bin.72 uSGB_6973:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__GGB4979|s__GGB4979_SGB6973|t__SGB6973:0.037580156118143464
+CM_ethiopia__CM_D24_M0_18__bin.9 uSGB_19436:Family:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__GGB12503|s__GGB12503_SGB19436|t__SGB19436:0.03191376547619048
+CM_ethiopia__CM_D26AB_I1_18__bin.20 uSGB_4920:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3632|s__GGB3632_SGB4920|t__SGB4920:0.06605975
+CM_ethiopia__CM_D26AB_I1_18__bin.22 uSGB_6973:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__GGB4979|s__GGB4979_SGB6973|t__SGB6973:0.03655784101265823
+CM_ethiopia__CM_D26AB_I1_18__bin.25 kSGB_5765:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Acidaminococcales|f__Acidaminococcaceae|g__Phascolarctobacterium|s__Phascolarctobacterium_succinatutens|t__SGB5765:0.04199274713521772
+CM_ethiopia__CM_D26AB_I1_18__bin.38 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.021307665186440682
+CM_ethiopia__CM_D26AB_I1_18__bin.44 kSGB_5100:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Lachnospiraceae_bacterium|t__SGB5100:0.017473495
+CM_ethiopia__CM_D26AB_I1_18__bin.8 kSGB_19692:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19692:0.021568808020833333
+CM_ethiopia__CM_D26AB_I1_18__bin.9 uSGB_4930:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3637|s__GGB3637_SGB4930|t__SGB4930:0.03330005789473684
+CM_ethiopia__CM_D26A_I13_18__bin.11 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03706791665789474
+CM_ethiopia__CM_D26A_I13_18__bin.13 uSGB_1680:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__Prevotella|s__Prevotella_SGB1680|t__SGB1680:0.032731439077155824
+CM_ethiopia__CM_D26A_I13_18__bin.25 kSGB_4910:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Lachnospiraceae_bacterium_WCA3_601_WT_6H|t__SGB4910:0.02695052974781266
+CM_ethiopia__CM_D26A_I13_18__bin.31 kSGB_5904:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__Mitsuokella|s__Mitsuokella_jalaludinii|t__SGB5904:0.023625802845528458
+CM_ethiopia__CM_D26A_I13_18__bin.33 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.02041316615819209
+CM_ethiopia__CM_D26K_I12_18__bin.8 kSGB_10068:Species:k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Enterobacterales|f__Enterobacteriaceae|g__Escherichia|s__Escherichia_coli|t__SGB10068:0.02512904894886217
+CM_ethiopia__CM_D26_M0_18__bin.18 uSGB_4373:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_unclassified_SGB4373|t__SGB4373:0.024968250925925924
+CM_ethiopia__CM_D26_M0_18__bin.25 uSGB_1680:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__Prevotella|s__Prevotella_SGB1680|t__SGB1680:0.0326514602118003
+CM_ethiopia__CM_D26_M0_18__bin.26 uSGB_2214:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1617|s__GGB1617_SGB2214|t__SGB2214:0.026412663818181817
+CM_ethiopia__CM_D26_M0_18__bin.38 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.030845753081680527
+CM_ethiopia__CM_D26_M0_18__bin.57 kSGB_4910:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Lachnospiraceae_bacterium_WCA3_601_WT_6H|t__SGB4910:0.024341045548121464
+CM_ethiopia__CM_D26_M0_18__bin.64 kSGB_5117:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Coprococcus|s__Coprococcus_eutactus|t__SGB5117:0.02213430023277467
+CM_ethiopia__CM_D33_I1_18__bin.10 kSGB_7967:Species:k__Bacteria|p__Firmicutes|c__Bacilli|o__Lactobacillales|f__Enterococcaceae|g__Enterococcus|s__Enterococcus_faecium|t__SGB7967:0.013812849596293844
+CM_ethiopia__CM_D33_I1_18__bin.13 kSGB_10068:Species:k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Enterobacterales|f__Enterobacteriaceae|g__Escherichia|s__Escherichia_coli|t__SGB10068:0.020821249463852626
+CM_ethiopia__CM_D33_M0_18__bin.11 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03597226614035088
+CM_ethiopia__CM_D33_M0_18__bin.12 uSGB_4894:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Lachnospiraceae_unclassified_SGB4894|t__SGB4894:0.02622717157894737
+CM_ethiopia__CM_D33_M0_18__bin.19 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.029589739751552793
+CM_ethiopia__CM_D33_M0_18__bin.20 kSGB_714:Species:k__Archaea|p__Euryarchaeota|c__Methanobacteria|o__Methanobacteriales|f__Methanobacteriaceae|g__Methanobrevibacter|s__Methanobrevibacter_smithii|t__SGB714:0.018459912472806383
+CM_ethiopia__CM_D33_M0_18__bin.3 kSGB_4546:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Eubacteriaceae|g__Eubacteriaceae_unclassified|s__Eubacteriaceae_bacterium|t__SGB4546:0.08417412999999999
+CM_ethiopia__CM_D33_M0_18__bin.31 kSGB_1636:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__Prevotella|s__Prevotella_copri|t__SGB1636:0.0394016177631579
+CM_ethiopia__CM_D33_M0_18__bin.34 uSGB_2321:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1689|s__GGB1689_SGB2321|t__SGB2321:0.023868098969072167
+CM_ethiopia__CM_D39_I1_18__bin.13 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.04053677043859649
+CM_ethiopia__CM_D39_I1_18__bin.15 kSGB_10068:Species:k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Enterobacterales|f__Enterobacteriaceae|g__Escherichia|s__Escherichia_coli|t__SGB10068:0.02083194812890242
+CM_ethiopia__CM_D39_I1_18__bin.22 kSGB_14762:Species:k__Bacteria|p__Actinobacteria|c__Coriobacteriia|o__Coriobacteriales|f__Coriobacteriaceae|g__Collinsella|s__Collinsella_sp_AK_207A|t__SGB14762:0.019462590000000002
+CM_ethiopia__CM_D39_I1_18__bin.29 kSGB_5862:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__Megasphaera|s__Megasphaera_elsdenii|t__SGB5862:0.025090881273408243
+CM_ethiopia__CM_D39_I1_18__bin.9 kSGB_9273:Species:k__Bacteria|p__Proteobacteria|c__Betaproteobacteria|o__Burkholderiales|f__Sutterellaceae|g__Duodenibacillus|s__Duodenibacillus_massiliensis|t__SGB9273:0.015058685679287306
+CM_ethiopia__CM_D39_M0_18__bin.15 kSGB_3548:Species:k__Bacteria|p__Spirochaetes|c__Spirochaetia|o__Spirochaetia_unclassified|f__Spirochaetia_unclassified|g__Spirochaetia_unclassified|s__Spirochaetia_bacterium|t__SGB3548:0.0224373
+CM_ethiopia__CM_D39_M0_18__bin.23 uSGB_19976:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__GGB12851|s__GGB12851_SGB19976|t__SGB19976:0.08399291666666665
+CM_ethiopia__CM_D39_M0_18__bin.32 uSGB_14238:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__GGB9285|s__GGB9285_SGB14238|t__SGB14238:0.01312110188888889
+CM_ethiopia__CM_D39_M0_18__bin.35 uSGB_14980:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Clostridiaceae|g__GGB9568|s__GGB9568_SGB14980|t__SGB14980:0.027242376
+CM_ethiopia__CM_D39_M0_18__bin.36 uSGB_17345:Other:k__Bacteria|p__Firmicutes|c__CFGB3170|o__OFGB3170|f__FGB3170|g__GGB10690|s__GGB10690_SGB17345|t__SGB17345:0.024214035555555548
+CM_ethiopia__CM_D39_M0_18__bin.40 kSGB_4188:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcaceae_unclassified|s__Ruminococcaceae_bacterium|t__SGB4188:0.021926175000000003
+CM_ethiopia__CM_D39_M0_18__bin.44 uSGB_2076:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_unclassified_SGB2076|t__SGB2076:0.023842498159509205
+CM_ethiopia__CM_D39_M0_18__bin.45 uSGB_1437:Other:k__Bacteria|p__Bacteroidetes|c__CFGB544|o__OFGB544|f__FGB544|g__GGB1123|s__GGB1123_SGB1437|t__SGB1437:0.02291870339805825
+CM_ethiopia__CM_D39_M0_18__bin.46 kSGB_2215:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_bacterium|t__SGB2215:0.02294027358490566
+CM_ethiopia__CM_D39_M0_18__bin.52 uSGB_2230:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_unclassified_SGB2230|t__SGB2230:0.026268718712029158
+CM_ethiopia__CM_D39_M0_18__bin.64 uSGB_4373:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_unclassified_SGB4373|t__SGB4373:0.021488724074074074
+CM_ethiopia__CM_D39_M0_18__bin.65 uSGB_13976:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__GGB9059|s__GGB9059_SGB13976|t__SGB13976:0.02665185232240437
+CM_ethiopia__CM_D39_M0_18__bin.66 kSGB_1333:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_bacterium|t__SGB1333:0.024211184615384615
+CM_ethiopia__CM_D40_I1_18__bin.11 kSGB_1814:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Phocaeicola|s__Phocaeicola_vulgatus|t__SGB1814:0.020266540251533745
+CM_ethiopia__CM_D40_I1_18__bin.16 kSGB_4584:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Mediterraneibacter|s__Ruminococcus_gnavus|t__SGB4584:0.027413949829816202
+CM_ethiopia__CM_D40_I1_18__bin.19 kSGB_5862:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__Megasphaera|s__Megasphaera_elsdenii|t__SGB5862:0.023824916666666668
+CM_ethiopia__CM_D40_I1_18__bin.23 kSGB_17248:Species:k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Bifidobacteriales|f__Bifidobacteriaceae|g__Bifidobacterium|s__Bifidobacterium_longum|t__SGB17248:0.0501009919504644
+CM_ethiopia__CM_D40_I1_18__bin.27 kSGB_15316:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Faecalibacterium|s__Faecalibacterium_prausnitzii|t__SGB15316:0.03170473258733624
+CM_ethiopia__CM_D40_M0_18__bin.10 kSGB_2021:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_bacterium|t__SGB2021:0.03208925540838852
+CM_ethiopia__CM_D40_M0_18__bin.20 kSGB_5065:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Butyrivibrio|s__Butyrivibrio_crossotus|t__SGB5065:0.022000097792706334
+CM_ethiopia__CM_D40_M0_18__bin.21 kSGB_19694:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19694:0.02432507358490566
+CM_ethiopia__CM_D40_M0_18__bin.28 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.024695422360248447
+CM_ethiopia__CM_D40_M0_18__bin.34 uSGB_2214:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1617|s__GGB1617_SGB2214|t__SGB2214:0.026474718181818183
+CM_ethiopia__CM_D40_M0_18__bin.35 uSGB_19436:Family:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__GGB12503|s__GGB12503_SGB19436|t__SGB19436:0.03357034285714285
+CM_ethiopia__CM_D40_M0_18__bin.36 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.02195771367231639
+CM_ethiopia__CM_D40_M0_18__bin.62 uSGB_4372:Genus:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__Clostridia_unclassified|s__Clostridia_unclassified_SGB4372|t__SGB4372:0.02067538571428571
+CM_ethiopia__CM_D40_M0_18__bin.63 kSGB_2075:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_bacterium|t__SGB2075:0.019396263448275865
+CM_ethiopia__CM_D40_M0_18__bin.66 uSGB_1024:Other:k__Archaea|p__Euryarchaeota|c__CFGB343|o__OFGB343|f__FGB343|g__GGB781|s__GGB781_SGB1024|t__SGB1024:0.028231784281842812
+CM_ethiopia__CM_D40_M0_18__bin.71 uSGB_14238:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__GGB9285|s__GGB9285_SGB14238|t__SGB14238:0.013153862222222222
+CM_ethiopia__CM_D40_M0_18__bin.76 kSGB_9209:Species:k__Bacteria|p__Lentisphaerae|c__Lentisphaeria|o__Lentisphaeria_unclassified|f__Lentisphaeria_unclassified|g__Lentisphaeria_unclassified|s__Lentisphaeria_bacterium|t__SGB9209:0.015802699082568806
+CM_ethiopia__CM_D43_I1_18__bin.13 uSGB_3677:Other:k__Bacteria|p__Proteobacteria|c__CFGB1062|o__OFGB1062|f__FGB1062|g__GGB2734|s__GGB2734_SGB3677|t__SGB3677:0.020400869468926556
+CM_ethiopia__CM_D43_I1_18__bin.18 kSGB_4925:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Roseburia|s__Roseburia_faecis|t__SGB4925:0.026292968977243
+CM_ethiopia__CM_D43_I1_18__bin.20 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.02689805155279503
+CM_ethiopia__CM_D43_I1_18__bin.30 uSGB_4900:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3623|s__GGB3623_SGB4900|t__SGB4900:0.024630386046511632
+CM_ethiopia__CM_D43_I1_18__bin.36 uSGB_4920:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3632|s__GGB3632_SGB4920|t__SGB4920:0.020173433333333334
+CM_ethiopia__CM_D43_I1_18__bin.37 uSGB_2230:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_unclassified_SGB2230|t__SGB2230:0.02237896609963548
+CM_ethiopia__CM_D43_I1_18__bin.42 kSGB_10043:Species:k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Enterobacterales|f__Enterobacteriaceae|g__Shimwellia|s__Shimwellia_blattae|t__SGB10043:0.146706
+CM_ethiopia__CM_D43_I1_18__bin.49 uSGB_14238:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridia_unclassified|f__Clostridia_unclassified|g__GGB9285|s__GGB9285_SGB14238|t__SGB14238:0.014570531777777774
+CM_ethiopia__CM_D43_I1_18__bin.8 kSGB_9209:Species:k__Bacteria|p__Lentisphaerae|c__Lentisphaeria|o__Lentisphaeria_unclassified|f__Lentisphaeria_unclassified|g__Lentisphaeria_unclassified|s__Lentisphaeria_bacterium|t__SGB9209:0.01510988899082569
+CM_ethiopia__CM_D43_M0_18__bin.12 uSGB_5809:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__GGB4266|s__GGB4266_SGB5809|t__SGB5809:0.03525266333333333
+CM_ethiopia__CM_D43_M0_18__bin.16 kSGB_17256:Species:k__Bacteria|p__Actinobacteria|c__Actinobacteria|o__Bifidobacteriales|f__Bifidobacteriaceae|g__Bifidobacterium|s__Bifidobacterium_bifidum|t__SGB17256:0.020424639705882354
+CM_ethiopia__CM_D43_M0_18__bin.28 uSGB_2238:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1630|s__GGB1630_SGB2238|t__SGB2238:0.034011544444444444
+CM_ethiopia__CM_D48_M0_18__bin.11 kSGB_4285:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Ruminococcaceae|g__Ruminococcus|s__Ruminococcus_bromii|t__SGB4285:0.029795503912701533
+CM_ethiopia__CM_D48_M0_18__bin.19 kSGB_4938:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Roseburia|s__Roseburia_sp_AF02_12|t__SGB4938:0.028649695479777953
+CM_ethiopia__CM_D48_M0_18__bin.23 uSGB_4930:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3637|s__GGB3637_SGB4930|t__SGB4930:0.027672151754385962
+CM_ethiopia__CM_D48_M0_18__bin.24 uSGB_4303:Other:k__Bacteria|p__Firmicutes|c__CFGB1340|o__OFGB1340|f__FGB1340|g__GGB3256|s__GGB3256_SGB4303|t__SGB4303:0.028321308674223757
+CM_ethiopia__CM_D48_M0_18__bin.46 kSGB_1475:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroidaceae_unclassified|s__Bacteroidaceae_bacterium|t__SGB1475:0.026731281550802143
+CM_ethiopia__CM_D50_I1_18__bin.10 kSGB_1644:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__Prevotella|s__Prevotella_copri|t__SGB1644:0.046138954773869346
+CM_ethiopia__CM_D50_I1_18__bin.2 kSGB_6922:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Veillonellales|f__Veillonellaceae|g__Veillonella|s__Veillonella_ratti|t__SGB6922:0.008928070652173914
+CM_ethiopia__CM_D50_I1_18__bin.23 kSGB_1949:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Tannerellaceae|g__Parabacteroides|s__Parabacteroides_merdae|t__SGB1949:0.022577076673706443
+CM_ethiopia__CM_D50_I1_18__bin.27 kSGB_10068:Species:k__Bacteria|p__Proteobacteria|c__Gammaproteobacteria|o__Enterobacterales|f__Enterobacteriaceae|g__Escherichia|s__Escherichia_coli|t__SGB10068:0.028076913590484545
+CM_ethiopia__CM_D50_I1_18__bin.3 kSGB_19434:Species:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__Campylobacteraceae_unclassified|s__Campylobacteraceae_bacterium|t__SGB19434:0.02186850806451613
+CM_ethiopia__CM_D50_I1_18__bin.4 kSGB_5765:Species:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Acidaminococcales|f__Acidaminococcaceae|g__Phascolarctobacterium|s__Phascolarctobacterium_succinatutens|t__SGB5765:0.04288258372803667
+CM_ethiopia__CM_D50_I1_18__bin.8 uSGB_14439:Genus:k__Bacteria|p__Actinobacteria|c__Coriobacteriia|o__Coriobacteriales|f__Coriobacteriaceae|g__Collinsella|s__Collinsella_SGB14439|t__SGB14439:0.064952925
+CM_ethiopia__CM_D50_M0_18__bin.12 kSGB_4938:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Roseburia|s__Roseburia_sp_AF02_12|t__SGB4938:0.027289032910388582
+CM_ethiopia__CM_D50_M0_18__bin.36 uSGB_1699:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__GGB1266|s__GGB1266_SGB1699|t__SGB1699:0.024195238077969174
+CM_ethiopia__CM_D50_M0_18__bin.39 kSGB_19688:Species:k__Bacteria|p__Elusimicrobia|c__Elusimicrobia|o__Elusimicrobiales|f__Elusimicrobiales_unclassified|g__Elusimicrobiales_unclassified|s__Elusimicrobiales_bacterium|t__SGB19688:0.01242276923076923
+CM_ethiopia__CM_D50_M0_18__bin.42 kSGB_714:Species:k__Archaea|p__Euryarchaeota|c__Methanobacteria|o__Methanobacteriales|f__Methanobacteriaceae|g__Methanobrevibacter|s__Methanobrevibacter_smithii|t__SGB714:0.01796047839013778
+CM_ethiopia__CM_D50_M0_18__bin.43 kSGB_1855:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroides|s__Bacteroides_fragilis|t__SGB1855:0.017164711101694916
+CM_ethiopia__CM_D50_M0_18__bin.46 kSGB_1404:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidaceae|g__Bacteroidaceae_unclassified|s__Bacteroidaceae_bacterium|t__SGB1404:0.015718816464646464
+CM_ethiopia__CM_D50_M0_18__bin.49 uSGB_6973:Family:k__Bacteria|p__Firmicutes|c__Negativicutes|o__Selenomonadales|f__Selenomonadaceae|g__GGB4979|s__GGB4979_SGB6973|t__SGB6973:0.03582619113924051
+CM_ethiopia__CM_D50_M0_18__bin.58 uSGB_2214:Family:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__GGB1617|s__GGB1617_SGB2214|t__SGB2214:0.027074628181818182
+CM_ethiopia__CM_D50_M0_18__bin.59 kSGB_19434:Species:k__Bacteria|p__Proteobacteria|c__Epsilonproteobacteria|o__Campylobacterales|f__Campylobacteraceae|g__Campylobacteraceae_unclassified|s__Campylobacteraceae_bacterium|t__SGB19434:0.022509777580645162
+CM_ethiopia__CM_D50_M0_18__bin.60 kSGB_4933:Species:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__Lachnospiraceae_unclassified|s__Eubacterium_rectale|t__SGB4933:0.03287236667732992
+CM_ethiopia__CM_D50_M0_18__bin.63 uSGB_5239:Family:k__Bacteria|p__Firmicutes|c__Clostridia|o__Clostridiales|f__Lachnospiraceae|g__GGB3862|s__GGB3862_SGB5239|t__SGB5239:0.02704829732919254
+CM_ethiopia__CM_D50_M0_18__bin.64 kSGB_2229:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Rikenellaceae|g__Rikenellaceae_unclassified|s__Rikenellaceae_bacterium|t__SGB2229:0.023970951282051286
+CM_ethiopia__CM_D50_M0_18__bin.67 uSGB_2076:Genus:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Bacteroidales_unclassified|g__Bacteroidales_unclassified|s__Bacteroidales_unclassified_SGB2076|t__SGB2076:0.021426739687116562
+CM_ethiopia__CM_D50_M0_18__bin.72 kSGB_1676:Species:k__Bacteria|p__Bacteroidetes|c__Bacteroidia|o__Bacteroidales|f__Prevotellaceae|g__Prevotella|s__Prevotella_sp_Marseille_P4119|t__SGB1676:0.024065360540540537
\ No newline at end of file
diff --git a/tools/phylophlan/test-data/phylophlan.tsv b/tools/phylophlan/test-data/phylophlan.tsv
new file mode 100644
index 0000000000..622f9a69ad
--- /dev/null
+++ b/tools/phylophlan/test-data/phylophlan.tsv
@@ -0,0 +1,400 @@
+p0000 PROTCATLG
+p0001 PROTCATLG
+p0002 PROTCATLG
+p0003 PROTCATLG
+p0004 PROTCATLG
+p0005 PROTCATCPREVF
+p0006 PROTCATLG
+p0007 PROTCATLG
+p0008 PROTCATLG
+p0009 PROTCATLG
+p0010 PROTCATLG
+p0011 PROTCATRTREV
+p0012 PROTCATLG
+p0013 PROTCATLG
+p0014 PROTCATLG
+p0015 PROTCATLG
+p0016 PROTCATLG
+p0017 PROTCATLG
+p0018 PROTCATLG
+p0019 PROTCATLG
+p0020 PROTCATLG
+p0021 PROTCATLG
+p0022 PROTCATLG
+p0023 PROTCATLG
+p0024 PROTCATLG
+p0025 PROTCATLG
+p0026 PROTCATLG
+p0027 PROTCATLG
+p0028 PROTCATLG
+p0029 PROTCATLG
+p0030 PROTCATLG
+p0031 PROTCATLG
+p0032 PROTCATRTREV
+p0033 PROTCATLG
+p0034 PROTCATRTREV
+p0035 PROTCATLG
+p0036 PROTCATLG
+p0037 PROTCATLG
+p0038 PROTCATLG
+p0039 PROTCATLG
+p0040 PROTCATLG
+p0041 PROTCATLG
+p0042 PROTCATLG
+p0043 PROTCATRTREV
+p0044 PROTCATLG
+p0045 PROTCATLG
+p0046 PROTCATLG
+p0047 PROTCATLG
+p0048 PROTCATRTREV
+p0049 PROTCATLG
+p0050 PROTCATLG
+p0051 PROTCATLG
+p0052 PROTCATLG
+p0053 PROTCATCPREVF
+p0054 PROTCATLG
+p0055 PROTCATLG
+p0056 PROTCATLG
+p0057 PROTCATLG
+p0058 PROTCATLG
+p0059 PROTCATLG
+p0060 PROTCATLG
+p0061 PROTCATLG
+p0062 PROTCATLG
+p0063 PROTCATLG
+p0064 PROTCATLG
+p0065 PROTCATRTREV
+p0066 PROTCATLG
+p0067 PROTCATLG
+p0068 PROTCATLG
+p0069 PROTCATLG
+p0070 PROTCATLG
+p0071 PROTCATLG
+p0072 PROTCATLG
+p0073 PROTCATLG
+p0074 PROTCATLG
+p0075 PROTCATRTREV
+p0076 PROTCATLG
+p0077 PROTCATLG
+p0078 PROTCATLG
+p0079 PROTCATLG
+p0080 PROTCATLG
+p0081 PROTCATLG
+p0082 PROTCATLG
+p0083 PROTCATLG
+p0084 PROTCATLG
+p0085 PROTCATLG
+p0086 PROTCATLG
+p0087 PROTCATLG
+p0088 PROTCATLG
+p0089 PROTCATLG
+p0090 PROTCATRTREV
+p0091 PROTCATLG
+p0092 PROTCATLG
+p0093 PROTCATLG
+p0094 PROTCATRTREV
+p0095 PROTCATLG
+p0096 PROTCATLG
+p0097 PROTCATLG
+p0098 PROTCATLG
+p0099 PROTCATLG
+p0100 PROTCATRTREV
+p0101 PROTCATLG
+p0102 PROTCATLG
+p0103 PROTCATLG
+p0104 PROTCATRTREV
+p0105 PROTCATLG
+p0106 PROTCATLG
+p0107 PROTCATLG
+p0108 PROTCATLG
+p0109 PROTCATRTREV
+p0110 PROTCATLG
+p0111 PROTCATRTREV
+p0112 PROTCATLG
+p0113 PROTCATLG
+p0114 PROTCATLG
+p0115 PROTCATLG
+p0116 PROTCATLG
+p0117 PROTCATLG
+p0118 PROTCATRTREV
+p0119 PROTCATLG
+p0120 PROTCATLG
+p0121 PROTCATLG
+p0122 PROTCATLG
+p0123 PROTCATLG
+p0124 PROTCATLG
+p0125 PROTCATLG
+p0126 PROTCATLG
+p0127 PROTCATLG
+p0128 PROTCATLG
+p0129 PROTCATVT
+p0130 PROTCATLG
+p0131 PROTCATLG
+p0132 PROTCATLG
+p0133 PROTCATLG
+p0134 PROTCATLG
+p0135 PROTCATLG
+p0136 PROTCATRTREV
+p0137 PROTCATLG
+p0138 PROTCATLG
+p0139 PROTCATVT
+p0140 PROTCATLG
+p0141 PROTCATLG
+p0142 PROTCATLG
+p0143 PROTCATLG
+p0144 PROTCATVT
+p0145 PROTCATLG
+p0146 PROTCATLG
+p0147 PROTCATLG
+p0148 PROTCATLG
+p0149 PROTCATCPREVF
+p0150 PROTCATLG
+p0151 PROTCATCPREVF
+p0152 PROTCATLG
+p0153 PROTCATLG
+p0154 PROTCATLG
+p0155 PROTCATLG
+p0156 PROTCATLG
+p0157 PROTCATLG
+p0158 PROTCATLG
+p0159 PROTCATRTREV
+p0160 PROTCATVT
+p0161 PROTCATRTREV
+p0162 PROTCATLG
+p0163 PROTCATLG
+p0164 PROTCATLG
+p0165 PROTCATLG
+p0166 PROTCATLG
+p0167 PROTCATRTREV
+p0168 PROTCATLG
+p0169 PROTCATRTREV
+p0170 PROTCATLG
+p0171 PROTCATLG
+p0172 PROTCATLG
+p0173 PROTCATLG
+p0174 PROTCATLG
+p0175 PROTCATLG
+p0176 PROTCATLG
+p0177 PROTCATLG
+p0178 PROTCATLG
+p0179 PROTCATRTREV
+p0180 PROTCATLG
+p0181 PROTCATLG
+p0182 PROTCATLG
+p0183 PROTCATLG
+p0184 PROTCATLG
+p0185 PROTCATBLOSUM62
+p0186 PROTCATLG
+p0187 PROTCATLG
+p0188 PROTCATLG
+p0189 PROTCATLG
+p0190 PROTCATLG
+p0191 PROTCATLG
+p0192 PROTCATLG
+p0193 PROTCATLG
+p0194 PROTCATRTREV
+p0195 PROTCATLG
+p0196 PROTCATPMB
+p0197 PROTCATLG
+p0198 PROTCATLG
+p0199 PROTCATLG
+p0200 PROTCATLG
+p0201 PROTCATLG
+p0202 PROTCATLG
+p0203 PROTCATLG
+p0204 PROTCATRTREV
+p0205 PROTCATRTREV
+p0206 PROTCATLG
+p0207 PROTCATLG
+p0208 PROTCATLG
+p0209 PROTCATLG
+p0210 PROTCATLG
+p0211 PROTCATRTREV
+p0212 PROTCATRTREV
+p0213 PROTCATLG
+p0214 PROTCATLG
+p0215 PROTCATLG
+p0216 PROTCATCPREVF
+p0217 PROTCATLG
+p0218 PROTCATLG
+p0219 PROTCATCPREVF
+p0220 PROTCATCPREVF
+p0221 PROTCATLG
+p0222 PROTCATRTREV
+p0223 PROTCATLG
+p0224 PROTCATLG
+p0225 PROTCATCPREV
+p0226 PROTCATLG
+p0227 PROTCATLG
+p0228 PROTCATRTREV
+p0229 PROTCATLG
+p0230 PROTCATRTREV
+p0231 PROTCATLG
+p0232 PROTCATLG
+p0233 PROTCATCPREV
+p0234 PROTCATRTREV
+p0235 PROTCATLG
+p0236 PROTCATRTREV
+p0237 PROTCATLG
+p0238 PROTCATLG
+p0239 PROTCATLG
+p0240 PROTCATCPREV
+p0241 PROTCATLG
+p0242 PROTCATLG
+p0243 PROTCATVT
+p0244 PROTCATLG
+p0245 PROTCATRTREV
+p0246 PROTCATRTREV
+p0247 PROTCATLG
+p0248 PROTCATLG
+p0249 PROTCATRTREV
+p0250 PROTCATLG
+p0251 PROTCATVT
+p0252 PROTCATLG
+p0253 PROTCATLG
+p0254 PROTCATLG
+p0255 PROTCATVT
+p0256 PROTCATRTREV
+p0257 PROTCATLG
+p0258 PROTCATVT
+p0259 PROTCATLG
+p0260 PROTCATLG
+p0261 PROTCATLG
+p0262 PROTCATCPREVF
+p0263 PROTCATLG
+p0264 PROTCATRTREV
+p0265 PROTCATLG
+p0266 PROTCATLG
+p0267 PROTCATLG
+p0268 PROTCATCPREVF
+p0269 PROTCATLG
+p0270 PROTCATLG
+p0271 PROTCATLG
+p0272 PROTCATLG
+p0273 PROTCATCPREVF
+p0274 PROTCATLG
+p0275 PROTCATRTREV
+p0276 PROTCATRTREV
+p0277 PROTCATLG
+p0278 PROTCATLG
+p0279 PROTCATLG
+p0280 PROTCATLG
+p0281 PROTCATRTREV
+p0282 PROTCATLG
+p0283 PROTCATVT
+p0284 PROTCATLG
+p0285 PROTCATLG
+p0286 PROTCATBLOSUM62
+p0287 PROTCATLG
+p0288 PROTCATLG
+p0289 PROTCATLG
+p0290 PROTCATLG
+p0291 PROTCATCPREVF
+p0292 PROTCATLG
+p0293 PROTCATLG
+p0294 PROTCATLG
+p0295 PROTCATLG
+p0296 PROTCATRTREV
+p0297 PROTCATLG
+p0298 PROTCATLG
+p0299 PROTCATLG
+p0300 PROTCATLG
+p0301 PROTCATLG
+p0302 PROTCATLG
+p0303 PROTCATLG
+p0304 PROTCATLG
+p0305 PROTCATLG
+p0306 PROTCATLG
+p0307 PROTCATLG
+p0308 PROTCATRTREV
+p0309 PROTCATLG
+p0310 PROTCATLG
+p0311 PROTCATLG
+p0312 PROTCATLG
+p0313 PROTCATLG
+p0314 PROTCATLG
+p0315 PROTCATBLOSUM62
+p0316 PROTCATLG
+p0317 PROTCATLG
+p0318 PROTCATRTREV
+p0319 PROTCATLG
+p0320 PROTCATRTREV
+p0321 PROTCATLG
+p0322 PROTCATLG
+p0323 PROTCATLG
+p0324 PROTCATLG
+p0325 PROTCATLG
+p0326 PROTCATLG
+p0327 PROTCATLG
+p0328 PROTCATCPREVF
+p0329 PROTCATRTREV
+p0330 PROTCATLG
+p0331 PROTCATLG
+p0332 PROTCATLG
+p0333 PROTCATLG
+p0334 PROTCATLG
+p0335 PROTCATRTREV
+p0336 PROTCATRTREV
+p0337 PROTCATLG
+p0338 PROTCATLG
+p0339 PROTCATLG
+p0340 PROTCATLG
+p0341 PROTCATRTREV
+p0342 PROTCATLG
+p0343 PROTCATCPREVF
+p0344 PROTCATCPREVF
+p0345 PROTCATLG
+p0346 PROTCATPMB
+p0347 PROTCATLG
+p0348 PROTCATLG
+p0349 PROTCATRTREV
+p0350 PROTCATLG
+p0351 PROTCATLG
+p0352 PROTCATLG
+p0353 PROTCATRTREV
+p0354 PROTCATLG
+p0355 PROTCATLG
+p0356 PROTCATLG
+p0357 PROTCATCPREVF
+p0358 PROTCATVT
+p0359 PROTCATRTREV
+p0360 PROTCATBLOSUM62
+p0361 PROTCATRTREV
+p0362 PROTCATLG
+p0363 PROTCATLG
+p0364 PROTCATLG
+p0365 PROTCATLG
+p0366 PROTCATRTREV
+p0367 PROTCATLG
+p0368 PROTCATCPREV
+p0369 PROTCATLG
+p0370 PROTCATRTREV
+p0371 PROTCATLG
+p0372 PROTCATLG
+p0373 PROTCATLG
+p0374 PROTCATVT
+p0375 PROTCATLG
+p0376 PROTCATLG
+p0377 PROTCATLG
+p0378 PROTCATLG
+p0379 PROTCATLG
+p0380 PROTCATLG
+p0381 PROTCATLG
+p0382 PROTCATLG
+p0383 PROTCATLG
+p0384 PROTCATVT
+p0385 PROTCATLG
+p0386 PROTCATLG
+p0387 PROTCATCPREVF
+p0388 PROTCATLG
+p0389 PROTCATLG
+p0390 PROTCATRTREV
+p0391 PROTCATLG
+p0392 PROTCATLG
+p0393 PROTCATLG
+p0394 PROTCATLG
+p0395 PROTCATLG
+p0396 PROTCATVT
+p0397 PROTCATLG
+p0398 PROTCATLG
+p0399 PROTCATLG
diff --git a/tools/phylophlan/test-data/phylophlan_markers_filtered.faa.gz b/tools/phylophlan/test-data/phylophlan_markers_filtered.faa.gz
new file mode 100644
index 0000000000..6afb4e910b
Binary files /dev/null and b/tools/phylophlan/test-data/phylophlan_markers_filtered.faa.gz differ
diff --git a/tools/phylophlan/validate_mapping_file.py b/tools/phylophlan/validate_mapping_file.py
new file mode 100644
index 0000000000..496679d122
--- /dev/null
+++ b/tools/phylophlan/validate_mapping_file.py
@@ -0,0 +1,43 @@
+"""Validate the mapping file given to PhyloPhlAn's --maas option.
+
+Usage: python validate_mapping_file.py MAPPING_FILE
+
+Each line not starting with '#' is stripped and split on tabs; every resulting
+field may contain only ASCII letters, digits, '.', '_' and '-'.  The first
+offending line is reported on stdout and the script exits with status 1.
+"""
+import string
+import sys
+
+# Characters permitted in a tab-separated field.
+ALLOWED = frozenset(string.ascii_letters + string.digits + '._-')
+
+
+def find_invalid_line(path):
+    """Return the first non-comment line holding a disallowed character.
+
+    Returns None when every line of the file at *path* is valid.
+    """
+    # The context manager closes the handle even on the early return.
+    with open(path, 'r') as handle:
+        for line in handle:
+            if line.startswith('#'):
+                continue
+            fields = line.strip().split('\t')
+            if not all(ALLOWED.issuperset(field) for field in fields):
+                return line
+    return None
+
+
+def main():
+    """Validate the file named by the first command-line argument."""
+    print("Validating --maas mapping file ...")
+    bad_line = find_invalid_line(sys.argv[1])
+    if bad_line is not None:
+        # bad_line still carries its trailing newline when printed.
+        print(f"Invalid line in mapping file: {bad_line}")
+        sys.exit(1)
+
+
+if __name__ == "__main__":
+    main()