Repository 'tiara'
hg clone https://toolshed.g2.bx.psu.edu/repos/bgruening/tiara

Changeset 1:66058890173e (2024-10-18)
Previous changeset 0:3f33a8ac8891 (2024-05-30)
Commit message:
planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/tiara commit eb21d389502b053adf569eb53a0b4cc9e0864fbe
modified:
tiara.xml
added:
test-data/arc
test-data/bac
test-data/euk
test-data/main_result01.txt
test-data/main_result02.txt
test-data/main_result03.txt
test-data/pla
removed:
test-data/bacteria_fr.fasta
test-data/mitplas1.fasta
b
diff -r 3f33a8ac8891 -r 66058890173e test-data/arc
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/arc Fri Oct 18 11:50:31 2024 +0000
b
b'@@ -0,0 +1,20 @@\n+>archea_HG425166.1_0_15000 HG425166.1 Methanobacterium sp. MB1 complete sequence\n+TTGTTATTGGGTTTAAAACCCTGGATCCCAGCATTCGAATCGCTGGTGTTATTCTGAACATGGTTAAAAACAGGAAACACTACCTCAAAACCAAGGAAGCAGTGGAAAAACTGGCAGATCTACCGGTAATTGGAGGAATCCCCCGGGATGATTTCATCAAAGTTGAGCAACGACACCTGGGATTGGTTCCTGCTGTGGAAAGGGAAAACATTAAGAAAAACATTGATGACTGGGGTCTAGTCATGGGGGAGAATATAGACTTAGACGCCCTCACCAATATAATGAAGAGTTCTGGAAAGTTACCTGAAGGTAGGGAACCTCTTTTCCATGAGGAATACTGTGACCGGGTGAAGATTGGTATAGCCAGGGATGAAGTGTTTAACTTTTATTATCAAGATAATTTAGAAGCTTTGGAATCTAATAATGCTGATCTAATTTATTTCAGCCCGTTACATGATGAAGAAGTGCCGGATGTCGATGGTCTCTACATTGGTGGAGGTTATCCTGAGATATTTGCCCGAGAACTGGAGGCTAATCAATCCATGCGCCACTCCATGAAACAGTTTCACCAAGAGGAAAGACCAATCTATGCAGAATGTGGCGGGCTCATGTATTTAACTCGTTCCATAAACCAGCACCAGATGTGTGATGTTTTCCCCTATGATTCTCATATGACCAAAAAACCCCAAGCCCTAAGTTATGTTATTGCCCAGGCAACACAGGATAACATAATTATTCCGAAAGGGGAAATCTTCCATGGACATGAATTCCACTACTCCCGACTGGAACTGGAGGGGGCCCAACCAAAATTTGCCTTTGATATCCTGCGTGGTAGGGGAGTCACTGGTAACTGTGATGGGCTCATGAGTAAAAACACATTGGCCAGTTACGTGCATACCCATGTGGCAGCTTGCCCCTCCTTTGCCAGTAGAATGGTGAAGGCGGCTGCCCATGATCTTTAATGAGGATTGAGAAGGAAAAAACTTTTTCAATACTTTAATTTTTAAAAAAGCCCTTTTGCTACCTTTTAAAATATTTTCTACTGTAGAATTAAATCAACCAATAATTGGATTGAATAACCTCTTATGGTTAATTAACTCTAATTAATATTTCTACTGTAGACTAAATTACCTTGCATTTTCACTTCATGGTAGTCTACTGTAGAATAAATTTGGTACAACATTTACTACTCCTATGGCTCATTATTGGAAAAAATCAGTGATAAATCAGCGAAGCTAAAAAGTATATAAGCACGTGAAAGAAAGGAGTAGACATATAACACTTTAAATAAATTTTTAAAGCTCGCAAATTATTCCAAAATGAAAAAAAGATTGGAATATGCCCTTCTTGATTTATCCCCAAAAATTTTTTCAAGGTTTTATAGAAAATTAAATTTATTTCATGTATCCAAAGATATTAAGAGATTGTTCAGGAGACTGATTTATGAAATTTAAAAGCGTTGACCTTTTTTCACCTTATATCATGGTGGTAATAATAGCCATCTATGTGGGCCTGGCAGCCATAGCCTACCAGGAACATTTAAGGAATCTTCAATGGATTTCCAGCACCACATGGCTCTATGTATTAATGGGAACCCTGTTTTTTGTGGTTGGAGCATTCCTTCCCAAATTCATTTATAACCGCAGTGCGAAACTCAAATCCCTGTGGGGAGGGGCCAAAGTTACTCCGGAAAATTCAGCACCATGGTACAACAAACTCCTCATTCTACTGGATGAAAGGGTGGTATTAACCGTAGCCATCGTTGGTATCCTCCTACAGATTGTGAACCTCTACATACTGGGAGGAATACCCATCCTAAGCGGATACCTGAAATTCAAGGCCACCACCGATCTCTGGCGATTTGCTTATCCCCTATTTCTCCCAGCCATTACTATTCTTCTAGCTAAATACCCTCGAAAATTGACTTACGCACTTTTCATTATAGGTCTAGTAGTTTTCGCCATCAACGGGTACCGAACCACCACCATGGCCATACTCCTCAGTGGATTTATAACCATCTATTACACTCGGAAGATGAAAACCAGTCACATACTGATTGCTATTTTATTAATTGGATTAGTGGGAATAGCTGCTGGTTACATAGCGGTGATGTCCATCCAATGGCAACAGTGGTCCCTGAATCCTCTGCAACTAGTAGCCTACCGTGCCGGGTTCACCATGATGGTCTTTGACAAGGTCGTGCATATGGCTGGAGCTACTGCCGGAGATTTATTTTATCAGGCACTCTCTACCGGACATCCCCGGGTTACAGTGGGGCAAGTAGTTCTCAACTACCCAGTATCAGGTAGCACACCTACCACCAGTATAACCTCTACCATCTTCGGACCAGCCGTACTAGACTTTGGTTTTTACGCCATGGCCCTGCAGATGTTCATAATTGGAGCACTACTCAGAATAATATACGCTACACAGGTAAAGGCCAACGGGGCTTTAACTGCTCTCTACGCTATTGTTTTAACCCATACCATGATATGGGTAGAAACTGGGCCCACAGACAGTGTGGTTTACCTGTTTTACATCTTGGCATTGGTGGCCGTGGTTTTATACGCAACTCAACTGGGTAGAATCAAAAAAAGTTAATGATAAATAACTTCTATACTTTTCCATGGCCTTAAACCATATTTAATAAATCATGAGTTCGAATAAACCTCTTTTTTTATTTTTAAAATGAATTTTTTACACTTGAAATACACCTCTATTATTTCGGGTAAGGATTTCTCATTTTCCAAAATAGGCAAAAATATTTCAAAAAAAGTTGTGAAGAATATTTTGTAGGTTTAATTTAACGAATTATTTATCTTCAACGATTTAAAAAAAGTTCCAAGTTCTCTCTTCCCGGATAATCCAAAAAGATGTTAATAATAATGGAGTATGTGCTATTATTCTTACAAAGACATCTTATAACTCCTAATTAGATATCAATGCCTTTAAATAGGGCCTATGATGGGTATAATCATCTTATTCTCAATTTATTCAATGACATGTTTCCCCAACAGGATAAACAGAAGGCTCATGCCATAGGGGACTCTTGAAATTATTGTTTTAAATGGGATGTCTCTTTTTTACAAGCCGTCCCGGGAATCTCATATATAAATCTTCCCCTAAAAATTAAATGAAAAAATACTTAAACCGATCTTCCAAAATAGCAAATCGGTGATAATATGGTTGTAAAAATAGGAGTTATTAAAAGCGGTAATATTGGAACCTCTCCTGTCCTTGACTTAGTCTTAGACGAGAGGGCAGACCGACCTAACATCGACGTTAGAGGAGTGGGTTCCGGAGCAAAAATGAACCCAGAACAGGTTGAAGAAGTCGTACCAAAAATAATGGACTTCGACCCAGATTTCGTAATATTCATCAGCCCAAACCCTGGTGCTCCTGGTCCTGCTAAAGCCCGAGAACTATTATCTGAAATGGACATCCCAGCACTGATCATTGGTGACGCCCCTGGAATGGGTAAGAGGGAAGAAATGGATGAACAGGGCTTAGGATACATTGTCGTCCTCGGTGACCCAATGATCGGAGCTCGAAGAGAATTCCTCGACCCAACTGAAATGGCATCCTTCAACGCTGATGTAATAAAAGTACTGGCTGCTACTGGTGCATACCGAGTAGTTCAGGAAACAATCGATGAAATGATCGCAGCCTGCGAAGCAGGAAAAGACATTGAACTACCAAAAGTAGTCATTGATGCTGCTACCGCAACTGAAGCTGCTGGATTTGCTAACCCATACGCTAAAGCAAAAGCTATGGCTGCATACGAAATGGCTGCTAAAGTAGGTGACATAGACCTCAAAGGCTGTTTCATGGTTAAAGATATGGAAAAATACATACCAATCGTGGCTTCAGCCCACGAACTCATTGCTGCAGCTGCTCAA'..b'GGAATCCCTATCTTGCGTTTTTTAAATGTAGGGTAGATTGTGAAGGGATAAAAAGTGAATTTAAAGGGGAGGAAAATTGGCAGATAATCGGATGGATACTCGATGGTGGTATGAATCTCTGCCAACTTTTCCTACGTACCGACAGTATGTACCTATAGCTGAGGAGAGTGGACCTCTACCTTTATTATAGGTATCTTACAGGGAGTGGGTAAACTTCAGTGAATTTATATTTCTTTACAAATTTCCTGGTGGTTTCCCATTCCATCTCCCTATATGCGATATGAGTATATATACATTTCGATTTCCTGATCTGGGAATACATAAAATTGAAAAATTCAACGGGTAAAAATTTGAAAAAAGAATTAAAATTAAAAAAATAAAGGAGGAAAAGATAAAACTTACTTTCCAGCCATCAATCCCGAGAGTTTGTTCTGCCAGGACTTGGAACGGATATTTTCCAGATTCATCTTGTCCCGTTTTATAGTGATACATTTTTGCGGGCAGACATTACTACAGGCACCGCACAGAATGCAGAACTTCTCTTCAATGGATGATTTATCATCTACAATACTTGCTGCATTGCAGGGGCAGACATCCACACAGGCATGGCAGGATTCTCCCTTACATTCTTCGATGTTAACTGAAATTTCACCTTCAAATGGTTTGACGACATGGGCCGCATCTACCGGACAGATTTCCTGACACCAACCACAGTTCACACAGGAATCTTCCTGTAGGATGGCTCTACCGGTGATCTTTGCATCTTCAGGATTCAGTTCATACTCTCCATAGGAACAGGAAGTACAGGCTGCTTTTATGGCATCTACTGGACAGGCACGTTTGCATACCAGGCAATAAACACATTTATCCTCATCTACTTTAATATCCCGGTCCAGGGGCCTATCTCTGGTTATGGATATGGCCTGGGGTGGGCACATCTCTTCACAGATACCGCAGTAAATGCAGTCGTCCTTATTTATCTCGATTTCACCGATCACCAGGTTGGAACGCTTGGGTAATTCCCGTTTGATGGTTATGGCATCCTGGGGGCAAGCAGTTTCACAGGCTTTGCAGTACAGGCATTCTTCATTGTCAATGGAAGCAGAGTGTTTCCACTGGGGATAGGCATCAAGATCTTTGATGTTTTCATCGTTGATCTTAAACTGGAATGCCTCGAAGGGACATGCTGATGCGCACAAACCACATAAAACACAGCTATTTTTGTTGATACTCACGTAGTCCATGTCCACCAGTCCCCGGGCTATGGGTAGCACGGGCCCCAGCCTTAAGGATTCTGTGGGGCAGATACTGGTACATATACCGCATCCCACACATTTATCACTGATGTAATCCAGGGAGCGTTTGTCGTTCCCATCTCTTTCCACTGCACTCATAAATACCATTCCCCTGCATATTAAGATTTAAGCTTTGGATATAGCCTGGTTAGGGCAGTTTGTGATGCATAAATCACAGTCATCACATTTATCCGGATACAAAACGAGTTCGCCATCTTCTTCGACTAAAGCACCCTGTTCGCATAGTTTGATGCACAGTCCTTCTCCGGGGCAGTTAGCGATCTTTCCACATTTTTCTTCGTCTATGACTATTGGCATAATTATCACCCTAAGTAACTGATTGATGCTATAGATATGCGATATGAGTATATAAACATATCGAATTTCATGTGATTATAAAAATGCATTATCATGGCTAAAAAATTTAAAAAAACTGCTATAGTCTTTTAAAGAACGAGATGTTTGCTGATGACTATTTATGAAAATTTGTTAATTATAAAAATAGATATTTAAAAAAAAGATTAAAAGAGGTAATGGTGTTTATTCTTTGGCAACCATTACTTCTGTGGATTTTATAAGGGCTATTACTTCGTCTCCATCTTTAATGTCCAGATCTTTGACGGATTCTTTGGTTATTATTGCGGTAATGACATCTGGAGATTCTATTTTTATTTTAACATTGGCCATCACTGCTCCCACATCAACTCCGGTTACTTTTCCTTTGATCATATTTCTGGCACTTATTTTCATGTTATACCCTCTCCATTTTTTTTAATGTTCCTTACCTAAGCACACTATATTTTATATACTGGCTGATTAAAATAATTTTTTAATGTAAACTGATACATCTCGGTATTTCCACCCATTTTGTATTACGGTGATAAACAATGAACCCAGTACAGTACAATCCCATTGGAATAATACATTCTCCCTTCAAAGAACTCCACGGAATGCCTATACAGCCGGTTGGTGCCCGGGGAGTCAAGGGACAGATAGAACTCGATAAAAAATACGAATCTGGATTAAAAGATTTGGATGGGTTTTCCCACATTCTGCTCATCTATCACTTCCATCTCTGTAACGGCCATTCCCTGGAAGTAAAACCCTTTTTAGATAAGGTAAAACATGGAATATTTGCCACAAGAGCTCCTAAACGACCTAATCCTCTTGGTATTTCTGTGGTTCGCCTGGAAAAGATTGAGGGAACCACCATCCATATCAGTAATGTGGATGTGGTGGATGGAACACCTCTCCTGGACATAAAGCCTCACATTCCTCATTTTGACTGTGAGGAAGGTGAAAAAGTGGCCATAGGATGGTTTGAGGATAAATATCATCAAGCCAAGGATAAAAAATCAGATAAACGCTTTGTTGATTAACAAAGGAAGCAGATCAAACTAAAAACAATAAAATATCATTATCTTCTGGGTAATCTTAAAATAATTATTTAATAATAACGGATCAGGAGAAAAGAGAATAGGAGAGTTTAAAACTAAAACTCTTCCATCTCAGATATATCCATGAGAGTTTCCACGGCCTTAGCCTCCACAGGAATTCCTGCTTCTTTAATGGCGGCTATTGGATTTAAACCTCCTGGTGCAACTATACCTGCATGGTAACGGTCTACCTTGGCGTTGTAAATCAGTTCACTTGGTTTACCTACTTTCAAGATGGAGAAACCAGCTTCTTCGGTCTCATCTAAAATGTCTAGGGCTTCAGGTCGGGCAACGTAGGGTATCTCCCTTAAACTTGCTAAAATTCGACCTCCTTTCTTTAAAGATTTATTTACTGATGTTAATCCCTTGGCGACGTATATTTCGTGGGGATCAAGGGATGATCCACTATAGGCGGTGAGTTCTATGAACCGGGGGGATTTACCCTTGGTTTCCAGTATTCCTCCGTACTGGGGTGTGGAAGCAATACCTTTTTTGGTGAGTATCCCATCGATGGTTAGGCTGCACACTGTGGCTAGACCCTTCTTTCCGTGGGGTCCAGGAACTATCTGGAAGTATTTACTGGTACAATATTCAGGGCGAGAGGCCATAACCTCATCGAATACTTTGAGACCTTCTTCCACATTTTCCTCCTTTAGATAGGAAATGTTCACAATTACTTTTCCCTGTTGGGTTTCTGGATCAAAGTCTACTTCATTTATAAGATTCCAAGCTTTTGAAAGAAGGAATTTAACTTTTTTACCAGTTTTACTCCCACTCTTTTTGATTACATTTTTAGTACTGGTCAGTGATTCCATTTCTGAAAATTCCACCGTGTTTTCTGCCATTTTAATGTTAACATCATAACCAGCTTCTTTGGCAGCACAAAGGGGTGAAATTCCTCCAGTTATGGTAATACCCACCATATCTTTATCTATGGGGATGCCAAGAACAGATTCTCCAGGTTTACCTATCTTCAACAGTCCGCTAACTCCTATTTTTTGTAGGTTGGTGAATAATTTGAGGGCTTTTTCCCGGGCAGTGGCGGGTATCAAGCGGAAGTTAGCGGGAATATTTCCACTTCCTGATTCAATAACTTCCAGTACAGAAGTCATTTCTTGGTCAGTGAAGGCCTCTAAGGGGGTCATAGAAGTCTTTTTATAAGCAATAAGTTCGGTAAAGGTTTGGGGTATGTAATTTTTAATTTCCACTAACCCTCCGTATCGAGGTACAACGGGAATACCTGCTTTAAGTAACATACCATCTATGG\n'
b
diff -r 3f33a8ac8891 -r 66058890173e test-data/bac
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/bac Fri Oct 18 11:50:31 2024 +0000
b
b'@@ -0,0 +1,20 @@\n+>bacteria_AE015924.1_0_15000 AE015924.1 Porphyromonas gingivalis W83, complete genome\n+ATGAACTACCACTCGACCAATGTAAATGAAATATGGGACGCGTGTCTTCGCATCCTTCAGGATATTGTGGATGAGCGAGCATACCGTACATGGTTCTTGCCTATCATACCGGTATCTATCGAGGGCGATACGCTTACCTTACAAGTGCCGAGTCAGTTCTTCTGTGAGTTTTTGGAGGGCAATTTCGTAGAGCAGCTGCGTACGGTGTTGGGGCGTGTTATAGGTCCCAACGCATCATTACAGTATAATGCCCTTGTAGACAACAGTTCGCCCAAATATCCCGGCACGGTGACATTGGCCGGTTGTGCCGACGGTGGACAGGCAGCCGAACAGTTCGATGTCAATTTGCTACACAGGCACATGCCCAATGCAGCCACCCATAGCGAAGCACAGGATTTCGACACGCAGCTCAATAGCAGGCTCAATTTCCGCAACTTCTACCAGAGCGAATGCAACTATGTAGCTCGCTCAGTGGCTGAAGCCATCGCCGCCAGCCCGGGCAATACGCCGATGAATCCATTCTTTATATATGGAGCTTCCGGTGTGGGCAAGACGCACTTGTGCCATGCCTTGGGCCTTCGTGTCAGAGAGATGCACCCCCGGTTGAAAGTACTATACGTATCGAGTCATTTGTTCGAGATGCAGTTCACTACGGCAGCCCGTATGGGGACGATCAATGACTTCATCGCATTCTACCAGCAAGTGGATGTACTGATCATCGATGACATCCAATGGTTGATCGGCAAGAAGAAAACGCAATTAGCTTTCTTCCAAGTGTTCAATCACCTCTATATGCTTGGCAAACAGATAGTCTTGACGTCGGACAAACCTCCTGTAGACCTTAACGGGATGGAGGAGCGGTTGGTCACTCGTATGGCCGGTGCTACCTGTGTCAAGATAGAACGTCCGGATTTGAAGTTGCGTCGTGAGATACTCCAGCAGCGTACGCTTCAAAGCGGTGTCCGGCTGGACGAATCGGTGCTGAACTTTATCGCCGAAAATGTCTGCGACAATGTTCGTGAACTGGAAGGCACCCTCGTATCCTTGATCACAAATTCGGTGGTTGTAGGTAAGGAAATCGACCTGACCTTTGCCAAACGGATTGTCCGCCAAGCTGTCAGACTGGAGAAAAAGGAAGTCACCATCGAGTGCATCCAGCAGGCAGTCAGCAGAGTATTTCAGGTGCAGATAGAGCAGATGAAAAGCAAGAGTCGGAAGCAGGATATCGTACAGGCTCGTCAGGTGGTCATGTTCCTCTCCAAAAAACACACGGCTCAGTCCTTGTCGGCTATCGGCGAACTGATGGGAGGACGTAACCATGCCACCGTACTCCACGGCTGTCGCTGTGTGACGAACGAGATGGAGATGAATGCCTCATTCCGTTCATCGGTAGAACGTGCCGAACAGTTGATCGCCAATTGATAGCAGGTCTTTATGATCCATCCCACAGCGATAGTAGAAGACGGTTGTGTGCTTGGTCAGGGTACACGCGTATGGCACTTCTCTCACTTGATGTGCGGAGCCGAGGTCGGAGAGAATTGCAACATCGGGCAGAATGTCGTTATAATGCCGGAGGTACGACTGGGGCGAGGCTGTAAGGTGCAGAACAACGTTTCTCTGTATAGTGGTGTCATATGCGAAGATTACGTATTCCTCGGACCGAGTTGTGTATTTACCAACGTGATCAATCCTCGCGCCTTTATTGAAAGAAAATCCGAATACCGCCCCACTCATTTGCACGAAGGCGTCTCCATCGGAGCCAATGCCACTATTCTTTGTGGTATTACGATAGGGGCTTATGCCATGGTAGGTGCAGGAACCGTGGTGATTAGGGATGTACCGCCCTATGCCTTGGTAGTGGGCAATCCTGCTCGCCGGATCGGTTGGGTAAGCCGCGCCGGTCACCGCTTGTCGTTCGATGACAAGGGGATGGCCGTCTGTCCTGAAACGGGCGAACGATATAGAGAGGTCGAAGAAACGGGTACAATAGAACCGGTATCGGACTGATCTAGACCAAATAGCGGCATATCGGCAACCGCTTCATCAGCCGCACAACTCCCCAAGAAACGAAGAAAACCAATCCTACACGGATCGGTATGTTGAGCCATGCGCATTGCATCAGGCTGGGGGTGGTCAGTACAAGTATTTTTGTCACCACGTTCAGCACAGCGATGTGTACTAAGTAGATTCCTAAAATATCCCCCTGCATTTTCCCGATCCGCGCCAATTTTCCTCCACATCCTCCCCAAGAAACGAAGAACGCGAAGAGACTGATAGCAGAAAGAACAATCAAAGGAGAGAGATTACGGTAGAAGTATAGCCCTTCGCCGTGCTCGAAAGCGTACCGACTTGCGAAGAAAAGAGAAATCGTAGAGAGTCCGTACAAGGAAAGAGCCGGTAAAGAACGCTGCGGAGCATGGCTCTTCAGGGTATAACCCACAAGGAAATATCCCAAATAATCCGGCCAAAGAAAAGGGAAAAAGCGGTTGTAACCGAGTATGTAATCGTAGGTGTTGGACAATATCCCCAGCAGTAGCAATATGGTAGAGAGAGTCCAAAGTCGTTTACGAGCAGCCTTCTCTCCATCGGCTTCGCACCTGCGAATTATTTCGTTGAGCAGAGGAACGACTGCATAAAGTCCCAGCAGCATCACCACATACCACAGATGAACGAATGAGCGTCCCTGCCAAAAGCCGGCAAGATAGGAACCTATATCATCGCCCTTGAGCCACAGCCACAGCCAATAGAACGGAAGCCAAAAAGCGAGTAGTACCAGCAGTCGCGGTATTCGTTTCCGATAGAAATCTCCCCACGTCTCATTGCGTCCCAAGACAAAAGCCCCGCTGATAATGACGAATATAGGAACGGCCGGCTGCACGACCGCCTCCCAGCATAGACCGGCTATAAAGTTTGCACCCTCAGCCACTCCTTCGAGAACGTATTCTCCCGAAGTATGGATGCCGATTACCATCAATCCTGCCAGAACTCGCAGGACATCGACGGTGGTATTCCTCCCCTTGGTAGTCATAACTATCTGATAATTGCAGACAAATATACGGGGACTTCTCTTTATCTTTGTCAATAAACCCCTAAACGAAGGATACGACATGAATAAGAAAAGACTCGTCGTCTTGAGTGGCGCAGGCATGAGTGCCGAAAGCGGCATATCGACTTTTCGTGATGCCAACGGATTGTGGGAGAATTATCCCGTCGAGGATGTGGCCTCTATCGATGGGTTTAGGCGCAATCCTGCCCTCGTTCTCAAGTTCTACAATGCACGCCGACGCGACTATGCCGGTTGCAAACCGAATGCAGGCCATATTGGTTTGGCGGAAATGGAGAAGGAGTATGATGTAAGAATCATCACGCAGAATGTGGATGATCTGCACGAGAGAGCAGGCAGCACACACGTCATTCATCTGCACGGAGAGTTGATGAAGAACAGATCTGTGGCCACAGACAGTGTGCTCTATCCCGTAGACCCGACCAATCCCGATCTGCATGTAGGAGATCTGGCACCCGACGGCTGTCAGCTACGGCCGTTTATTGTGTGGTTTGGAGAAGCTGTTCCGATGATAGAGCCGGCCATCGAAGAGGTAACACAGGCAGACATTCTCGTTGTCATCGGCACCTCTCTCAACGTTTATCCGGCTGCCGGACTGTTGAATTATGCTCCTCGCAACTGCCCCATCTATCTGATCGATCCAAAGCCTGTGCGCAGCACCTCCCGGCAAGACATTCGGTATATCCATGCTCCTGCCACGGAAGGCGTAAGGATGTTGCGGCAAGAACTCCGTGATATAGATCGCTAAAAAAACACTAACCCCAAGAACCTGCCATCGTGGTGGTTCTTGGGGTTAATTGTATTTGTTCGTTTTTCGGAAGGCTAATGAA'..b'GCTTGACACCTCCGAAGTAGCGCACTACTGCGACGAATACCTGCGTAAGCCCCAATGAGGTGATCTGCCCGAGGATGGGTTTGCCGGCAGTCCCCGATGGCTCTCCGTCGTCATTGGATCGTGTGCGTTCGCCTTTGGCTCCCAGCTTGTATGCCCAGCATACATGGCGTGCATCGAAGTAGCGGCGACGCAGATCGGCCACAAGCGACAGGGCCTCCTCTTCCGACTTTACAGGATAGGCGAAAGCCAGGAAGCGGCTGCGTTTCTCCGTGTACTGTGCTTCCGAGGGAGCACTGATCGTGAGGTAGGAATCTTCGGCCATGGTTCAAAGGAGAGCCTCATCTGTACCTTCCTCCCGGGCGGCAAACTTTTCGGACAGGACGGAGAGGAGCGTACTCATTTGTTTGATACTGGCGAGCGTCTCTTCGCTCACTTCCTTTTTCTGCAAGCGCAGGGTCAGCAGACCGTATATGGCAGTCAGGCAAGTCTCTATCTCTCCCGTATTGCTCCCTGCACTCTTGGCTCTAAGCTGTACGATGGCAGGGAGCACCTGATAGTAGAGTCCTTGATAAATCATCTCTTTGGGGTCCGCCATCAGTCGTGAGTGTATCTCTTCCATTTGCATGATGGCTATGCGGACGATATTGATATGCCCCTGCTCGCGAACGCCCTCGGTCAGCATCATCTCCACCAGCTCGGCATACCAGCGGTCTATCTCGGCGGTCGTCTCCGTATCTTGCCGGTATTGGGCAATTACAGTGGCGCGAAGCCGCTGCATATCCAGTTCGTTGGCACGTATAAGATCCTCTATCTGCCACATGTAGAGGACGTACTCGGCGATATTGTTGCGCCGTTTTTCCCTTGCTATGATCATGGTCGTTTGTCTCGGATCAGGCCGTTCAGCAACGTTTCGTCCGCATCGTTGGGTGCAGGCTCTATACCCAACAGCCTGCATATGAGCGGATAGATGGTGATATTCGGCAGGTTTTCCACCCTACTGCCCGGACGGAAATCGGGTCCGACAGCCCGGAGTAAAGCCCGCATTTCCGGTGCTTGGTTGTCATAGCCATGTGCCGCTCCCGGACGAACGTCTTCATTTATTGCGAAAAAGACGGTGGAGCCTATGTCCGGAATCACGACCAGTTCGCCCAAACGAGGATTGGTGCCACAGCGCAAACGCTTGGGCACCTCCCCCTTGCGGTAAACCGATATATGTGGAATGGCCCGCAGGATCTCATAGGCTCGCTCGGTATAGGAGGGCTTCGGGTACAAGTGGGTGAAGGCCCCGGTGGCCATGTAGAGGAAACTGTCCGCAGGCAGATAATGCGACAGATTGACACATTTCTCATTTTCGTACGTGGCCATACCGTGATCGGATACTATGATGAAGTCGGTCTGTGCGGCTATGGGCAGAGAGTCCAACCGCTTGCGGAAATAGCCGACCACACTGTCCAACCGCTCTACCATTGCCAGTGTCAGCGGGCTTTCGGGCGTTTGGCTGTGTCCGATCATATCCGGCTCCTCGATGTACCACATGAGCAAGCGCGGTCGCTCCTTTTCGGGCAGTCCGAGCCACGCGATGACGGAGTCGGCACGGTCACGAAACGGAACGGTGGAGGAGAATTTTTTCCACCGCCACGGCCGATTTCCGTTCACAGCCGTTTCGGATCCTACCCAAAAGTAGACACCGGTACGGATGCCTTGGCGTGCGGCCGTATTCCAAACCGGCTCGCCGCCCCAAAATCCGGGGGTCTCCACGGCTTTTCGGTCGGATATACGAAAGATGCCCAGTAGCGAATCCACAAACTCATTGGCTACGATACCGTGATGATCGGGGTAAAGCCCCGTAGCCATGCTGTAATGATTGGGAAATGTAAGCGAGGGGAAGCATGGTTGGAGCGACCCGCTCAATCCCTCCTGTGCCATCCGATCCAACGCCGGTGTACGTGCCCGATCGGTATAGTCCGGTCGGAAGCCGTCCAAAGACAGGACTACGACGTACCGTTCCGACTGCTTAGGTGTTTGTCGGACTGTTCTGCAACCGACATAAGAGAAGGCAAGAAGCAGAAACAAGATAAAAGGAAATAGAGATAAATGCTGTCTCATTTTTATAAAAATCTTTCGATTTGATGCCGTCAAAGGTAAGGGATTCCTCTTTCATTACTGTAAGCAGATCGGTTTTTGAGCCGATGATTTTCAGCGTGTCGTCGGGAGTGAAACCATACCATCGGGAGTAAAAAATCACAGGAATACCCACAGCCGACCCTTCCAACCTCTCCAAAATCCGGGGGTCTCCACGGCTTTTCGGTCGGGAAAATGTCATTGTTCGGCGTGCAAACCTGCAAATCGGACACGAAATTCACTGCTCCAACTTGGAGGACGACAAATCCGCGCGGAAAATGCTTCCTCCGGCTTGGAGCGACTTTTTTCGGCCCGCAATGCAGATTTCCTGTCGGACATTCCCTCTTTTGCCGAAAGTACCCGTATATCCCTTGCAGAGAGTGAAACTGTCGCACGGCCTTTTCGTCGAATCCTTTTGCCGCAGAGTCGATCCCTTTATTCGTTGCACATCCGGGCTTCGGCAAATACGGCTTCCTTACTCCGTTAATGCTCTCATTCATTTAGAGAATGGGATCGGGAAAAATAAGAGACACGAACGGAATCTTACCTATCTTCGTCCTGAAATTATGGCAGATCGTAGAAGAACCGATGACAATAAGGGTGCGAGAGAGGTGGTATTGCTGCTGAATATCGGCTCGCCGGACAGCCCTGAGGAGAAGGACGTGGCGCGCTACCTCAATTCTTTTCTGACCGACAGGAGGATCATCACCTTGCCTTTTCTCCTGAGACAGTTACTCGTGAGAGGTATCATCACTCCTTTCAGAAAGAAAAGTTCGGCACAAAAATATCGGACCGTTTGGGACGAAAGCACCCGGTCTTTCCCCCTCATATCGCATACGAAAGCCATAGCCCGGGCACTGGCACATACGGGCAGAGAAGTCCATGTAGCCATGCGCTACGGCAAGCCGGCTGTGGCCGATGTGCTGAAGGAGCTGCCACACGGCCGAAGCCTCGTCGTCCTCCCGCTCTTCCCACACTACGCCATGAGCAGCTACGAGACGGCCGTGGAGCATTGCAAGGCCGAAATCCGCCGCCTTTGTCCGAATCTTTCCTTCCGCGTCGTGCAGCCTTTCTACGCACACGAAGCCTATATTCGTGTCCTTGCCGATAACATCAGACCCTATCTGACGAAGCCTTTCGACAAGCTCATTCTTTCCTATCACGGCATTCCCCGCGATCATTTGGACAAGACCACCCGACAGGCTTTGAATCTCCGGCATCCCGAAGGATGCTGCACGGAGGAGGATCCTACGGCAAACGTCTGCTACCGCTATCAGACTTACAGGACGACGGCTCTCATCCGCGAGGCACTTGGCTTGGCCGAGGAGCAGGTGGAGCAGGTGTTCCAGTCACGTGTAGGCCATACCGAATGGCTGCGCCCCTATTTGATCGAACGACTGTCCGCTTGGCCGCAAGAGGAAACAAAACGTATCCTCATAGCCTGCCCCTCCTTCGTGTGCGACTGTCTGGAGAGCCTCGAAGAAGTAGCCGATCACGGACAAAGCATTTTCAAAAAAGCAGGAGGTGCGGATTTCACTTACATCCCCTGTCTCAATAGCGGGGCGAATTGGATCGATGCTCTCCGAAACATTTTAGAGGAATAATACAGCATGCTCAGTTATCATACCGATATACCGACAGACCTGCCCCTCCTGAGGCAAGCCGTCGAAGCCATCCGCCGGGAAGAATCCGGCGGTGCCGTACCCGACTCCGATCGGCCGAGGGTGATATACGAGGCGCGCAACCGGCTTTACGCCATCCGTACCGCACAGGGAGAGCAGGTGGTGAAGAGCTTCCGGATCCCTATTGCCATTCAGCGCGTGGTCTACTCATTCTTCCGCCCCTCGAAGGCTGCTCGCTCTTATCGCAACGCCATA\n'
b
diff -r 3f33a8ac8891 -r 66058890173e test-data/bacteria_fr.fasta
--- a/test-data/bacteria_fr.fasta Thu May 30 11:10:39 2024 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,2511 +0,0 @@\n->bacteria_AE015924.1_0_15000 AE015924.1 Porphyromonas gingivalis W83, complete genome\n-ATGAACTACCACTCGACCAATGTAAATGAAATATGGGACGCGTGTCTTCGCATCCTTCAG\n-GATATTGTGGATGAGCGAGCATACCGTACATGGTTCTTGCCTATCATACCGGTATCTATC\n-GAGGGCGATACGCTTACCTTACAAGTGCCGAGTCAGTTCTTCTGTGAGTTTTTGGAGGGC\n-AATTTCGTAGAGCAGCTGCGTACGGTGTTGGGGCGTGTTATAGGTCCCAACGCATCATTA\n-CAGTATAATGCCCTTGTAGACAACAGTTCGCCCAAATATCCCGGCACGGTGACATTGGCC\n-GGTTGTGCCGACGGTGGACAGGCAGCCGAACAGTTCGATGTCAATTTGCTACACAGGCAC\n-ATGCCCAATGCAGCCACCCATAGCGAAGCACAGGATTTCGACACGCAGCTCAATAGCAGG\n-CTCAATTTCCGCAACTTCTACCAGAGCGAATGCAACTATGTAGCTCGCTCAGTGGCTGAA\n-GCCATCGCCGCCAGCCCGGGCAATACGCCGATGAATCCATTCTTTATATATGGAGCTTCC\n-GGTGTGGGCAAGACGCACTTGTGCCATGCCTTGGGCCTTCGTGTCAGAGAGATGCACCCC\n-CGGTTGAAAGTACTATACGTATCGAGTCATTTGTTCGAGATGCAGTTCACTACGGCAGCC\n-CGTATGGGGACGATCAATGACTTCATCGCATTCTACCAGCAAGTGGATGTACTGATCATC\n-GATGACATCCAATGGTTGATCGGCAAGAAGAAAACGCAATTAGCTTTCTTCCAAGTGTTC\n-AATCACCTCTATATGCTTGGCAAACAGATAGTCTTGACGTCGGACAAACCTCCTGTAGAC\n-CTTAACGGGATGGAGGAGCGGTTGGTCACTCGTATGGCCGGTGCTACCTGTGTCAAGATA\n-GAACGTCCGGATTTGAAGTTGCGTCGTGAGATACTCCAGCAGCGTACGCTTCAAAGCGGT\n-GTCCGGCTGGACGAATCGGTGCTGAACTTTATCGCCGAAAATGTCTGCGACAATGTTCGT\n-GAACTGGAAGGCACCCTCGTATCCTTGATCACAAATTCGGTGGTTGTAGGTAAGGAAATC\n-GACCTGACCTTTGCCAAACGGATTGTCCGCCAAGCTGTCAGACTGGAGAAAAAGGAAGTC\n-ACCATCGAGTGCATCCAGCAGGCAGTCAGCAGAGTATTTCAGGTGCAGATAGAGCAGATG\n-AAAAGCAAGAGTCGGAAGCAGGATATCGTACAGGCTCGTCAGGTGGTCATGTTCCTCTCC\n-AAAAAACACACGGCTCAGTCCTTGTCGGCTATCGGCGAACTGATGGGAGGACGTAACCAT\n-GCCACCGTACTCCACGGCTGTCGCTGTGTGACGAACGAGATGGAGATGAATGCCTCATTC\n-CGTTCATCGGTAGAACGTGCCGAACAGTTGATCGCCAATTGATAGCAGGTCTTTATGATC\n-CATCCCACAGCGATAGTAGAAGACGGTTGTGTGCTTGGTCAGGGTACACGCGTATGGCAC\n-TTCTCTCACTTGATGTGCGGAGCCGAGGTCGGAGAGAATTGCAACATCGGGCAGAATGTC\n-GTTATAATGCCGGAGGTACGACTGGGGCGAGGCTGTAAGGTGCAGAACAACGTTTCTCTG\n-TATAGTGGTGTCATATGCGAAGATTACGTATTCCTCGGACCGAGTTGTGTATTTACCAAC\n-GTGATCAATCCTCGCGCCTTTATTGAAAGAAAATCCGAATACCGCCCCACTCATTTGCAC\n-GAAGGCGTCTCCATCGGAGCCAATGCCACTATTCTTTGTGGTATTACGATAGGGGCTTAT\n-GCCATGGTAGGTGCAGGAACCGTGGTGATTAGGGATGTACCGCCCTATGCCTTGGTAGTG\n-GGCAATCCTGCTCGCCGGATCGGTTGGGTAAGCCGCGCCGGTCACCGCTTGTCGTTCGAT\n-GACAAGGGGATGGCCGTCTGTCCTGAAACGGGCGAACGATATAGAGAGGTCGAAGAAACG\n-GGTACAATAGAACCGGTATCGGACTGATCTAGACCAAATAGCGGCATATCGGCAACCGCT\n-TCATCAGCCGCACAACTCCCCAAGAAACGAAGAAAACCAATCCTACACGGATCGGTATGT\n-TGAGCCATGCGCATTGCATCAGGCTGGGGGTGGTCAGTACAAGTATTTTTGTCACCACGT\n-TCAGCACAGCGATGTGTACTAAGTAGATTCCTAAAATATCCCCCTGCATTTTCCCGATCC\n-GCGCCAATTTTCCTCCACATCCTCCCCAAGAAACGAAGAACGCGAAGAGACTGATAGCAG\n-AAAGAACAATCAAAGGAGAGAGATTACGGTAGAAGTATAGCCCTTCGCCGTGCTCGAAAG\n-CGTACCGACTTGCGAAGAAAAGAGAAATCGTAGAGAGTCCGTACAAGGAAAGAGCCGGTA\n-AAGAACGCTGCGGAGCATGGCTCTTCAGGGTATAACCCACAAGGAAATATCCCAAATAAT\n-CCGGCCAAAGAAAAGGGAAAAAGCGGTTGTAACCGAGTATGTAATCGTAGGTGTTGGACA\n-ATATCCCCAGCAGTAGCAATATGGTAGAGAGAGTCCAAAGTCGTTTACGAGCAGCCTTCT\n-CTCCATCGGCTTCGCACCTGCGAATTATTTCGTTGAGCAGAGGAACGACTGCATAAAGTC\n-CCAGCAGCATCACCACATACCACAGATGAACGAATGAGCGTCCCTGCCAAAAGCCGGCAA\n-GATAGGAACCTATATCATCGCCCTTGAGCCACAGCCACAGCCAATAGAACGGAAGCCAAA\n-AAGCGAGTAGTACCAGCAGTCGCGGTATTCGTTTCCGATAGAAATCTCCCCACGTCTCAT\n-TGCGTCCCAAGACAAAAGCCCCGCTGATAATGACGAATATAGGAACGGCCGGCTGCACGA\n-CCGCCTCCCAGCATAGACCGGCTATAAAGTTTGCACCCTCAGCCACTCCTTCGAGAACGT\n-ATTCTCCCGAAGTATGGATGCCGATTACCATCAATCCTGCCAGAACTCGCAGGACATCGA\n-CGGTGGTATTCCTCCCCTTGGTAGTCATAACTATCTGATAATTGCAGACAAATATACGGG\n-GACTTCTCTTTATCTTTGTCAATAAACCCCTAAACGAAGGATACGACATGAATAAGAAAA\n-GACTCGTCGTCTTGAGTGGCGCAGGCATGAGTGCCGAAAGCGGCATATCGACTTTTCGTG\n-ATGCCAACGGATTGTGGGAGAATTATCCCGTCGAGGATGTGGCCTCTATCGATGGGTTTA\n-GGCGCAATCCTGCCCTCGTTCTCAAGTTCTACAATGCACGCCGACGCGACTATGCCGGTT\n-GCAAACCGAATGCAGGCCATATTGGTTTGGCGGAAATGGAGAAGGAGTATGATGTAAGAA\n-TCATCACGCAGAATGTGGATGATCTGCACGAGAGAGCAGGCAGCACACACGTCATTCATC\n-TGCACGGAGAGTTGATGAAGAACAGATCTGTGGCCACAGACAGTGTGCTCTATCCCGTAG\n-ACCCGACCAATCCCGATCTGCATGTAGGAGATCTGGCACCCGACGGCTGTCAGCTACGGC\n-CGTTTATTGTGTGGTTTGGAGAAGCTGTTCCGATGATAGAGCCGGCCATCGAAGAGGTAA\n-CACAGGCAGACATTCTCGTTGTCATCGGCACCTCTCTCAACGTTTATCCGGCTGCCGGAC\n-TGTTGAATTATGCTCCTCGCAACTGCCCCATCTATCTGATCGATCCAAAGCCTGTGCGCA\n-GCACCTCCCGGCAAGACATTCGGTATATCCATGCTCCTGCCACGGAAG'..b'GCCTTTGGCTCCCAGCTTGTATGCCCAG\n-CATACATGGCGTGCATCGAAGTAGCGGCGACGCAGATCGGCCACAAGCGACAGGGCCTCC\n-TCTTCCGACTTTACAGGATAGGCGAAAGCCAGGAAGCGGCTGCGTTTCTCCGTGTACTGT\n-GCTTCCGAGGGAGCACTGATCGTGAGGTAGGAATCTTCGGCCATGGTTCAAAGGAGAGCC\n-TCATCTGTACCTTCCTCCCGGGCGGCAAACTTTTCGGACAGGACGGAGAGGAGCGTACTC\n-ATTTGTTTGATACTGGCGAGCGTCTCTTCGCTCACTTCCTTTTTCTGCAAGCGCAGGGTC\n-AGCAGACCGTATATGGCAGTCAGGCAAGTCTCTATCTCTCCCGTATTGCTCCCTGCACTC\n-TTGGCTCTAAGCTGTACGATGGCAGGGAGCACCTGATAGTAGAGTCCTTGATAAATCATC\n-TCTTTGGGGTCCGCCATCAGTCGTGAGTGTATCTCTTCCATTTGCATGATGGCTATGCGG\n-ACGATATTGATATGCCCCTGCTCGCGAACGCCCTCGGTCAGCATCATCTCCACCAGCTCG\n-GCATACCAGCGGTCTATCTCGGCGGTCGTCTCCGTATCTTGCCGGTATTGGGCAATTACA\n-GTGGCGCGAAGCCGCTGCATATCCAGTTCGTTGGCACGTATAAGATCCTCTATCTGCCAC\n-ATGTAGAGGACGTACTCGGCGATATTGTTGCGCCGTTTTTCCCTTGCTATGATCATGGTC\n-GTTTGTCTCGGATCAGGCCGTTCAGCAACGTTTCGTCCGCATCGTTGGGTGCAGGCTCTA\n-TACCCAACAGCCTGCATATGAGCGGATAGATGGTGATATTCGGCAGGTTTTCCACCCTAC\n-TGCCCGGACGGAAATCGGGTCCGACAGCCCGGAGTAAAGCCCGCATTTCCGGTGCTTGGT\n-TGTCATAGCCATGTGCCGCTCCCGGACGAACGTCTTCATTTATTGCGAAAAAGACGGTGG\n-AGCCTATGTCCGGAATCACGACCAGTTCGCCCAAACGAGGATTGGTGCCACAGCGCAAAC\n-GCTTGGGCACCTCCCCCTTGCGGTAAACCGATATATGTGGAATGGCCCGCAGGATCTCAT\n-AGGCTCGCTCGGTATAGGAGGGCTTCGGGTACAAGTGGGTGAAGGCCCCGGTGGCCATGT\n-AGAGGAAACTGTCCGCAGGCAGATAATGCGACAGATTGACACATTTCTCATTTTCGTACG\n-TGGCCATACCGTGATCGGATACTATGATGAAGTCGGTCTGTGCGGCTATGGGCAGAGAGT\n-CCAACCGCTTGCGGAAATAGCCGACCACACTGTCCAACCGCTCTACCATTGCCAGTGTCA\n-GCGGGCTTTCGGGCGTTTGGCTGTGTCCGATCATATCCGGCTCCTCGATGTACCACATGA\n-GCAAGCGCGGTCGCTCCTTTTCGGGCAGTCCGAGCCACGCGATGACGGAGTCGGCACGGT\n-CACGAAACGGAACGGTGGAGGAGAATTTTTTCCACCGCCACGGCCGATTTCCGTTCACAG\n-CCGTTTCGGATCCTACCCAAAAGTAGACACCGGTACGGATGCCTTGGCGTGCGGCCGTAT\n-TCCAAACCGGCTCGCCGCCCCAAAATCCGGGGGTCTCCACGGCTTTTCGGTCGGATATAC\n-GAAAGATGCCCAGTAGCGAATCCACAAACTCATTGGCTACGATACCGTGATGATCGGGGT\n-AAAGCCCCGTAGCCATGCTGTAATGATTGGGAAATGTAAGCGAGGGGAAGCATGGTTGGA\n-GCGACCCGCTCAATCCCTCCTGTGCCATCCGATCCAACGCCGGTGTACGTGCCCGATCGG\n-TATAGTCCGGTCGGAAGCCGTCCAAAGACAGGACTACGACGTACCGTTCCGACTGCTTAG\n-GTGTTTGTCGGACTGTTCTGCAACCGACATAAGAGAAGGCAAGAAGCAGAAACAAGATAA\n-AAGGAAATAGAGATAAATGCTGTCTCATTTTTATAAAAATCTTTCGATTTGATGCCGTCA\n-AAGGTAAGGGATTCCTCTTTCATTACTGTAAGCAGATCGGTTTTTGAGCCGATGATTTTC\n-AGCGTGTCGTCGGGAGTGAAACCATACCATCGGGAGTAAAAAATCACAGGAATACCCACA\n-GCCGACCCTTCCAACCTCTCCAAAATCCGGGGGTCTCCACGGCTTTTCGGTCGGGAAAAT\n-GTCATTGTTCGGCGTGCAAACCTGCAAATCGGACACGAAATTCACTGCTCCAACTTGGAG\n-GACGACAAATCCGCGCGGAAAATGCTTCCTCCGGCTTGGAGCGACTTTTTTCGGCCCGCA\n-ATGCAGATTTCCTGTCGGACATTCCCTCTTTTGCCGAAAGTACCCGTATATCCCTTGCAG\n-AGAGTGAAACTGTCGCACGGCCTTTTCGTCGAATCCTTTTGCCGCAGAGTCGATCCCTTT\n-ATTCGTTGCACATCCGGGCTTCGGCAAATACGGCTTCCTTACTCCGTTAATGCTCTCATT\n-CATTTAGAGAATGGGATCGGGAAAAATAAGAGACACGAACGGAATCTTACCTATCTTCGT\n-CCTGAAATTATGGCAGATCGTAGAAGAACCGATGACAATAAGGGTGCGAGAGAGGTGGTA\n-TTGCTGCTGAATATCGGCTCGCCGGACAGCCCTGAGGAGAAGGACGTGGCGCGCTACCTC\n-AATTCTTTTCTGACCGACAGGAGGATCATCACCTTGCCTTTTCTCCTGAGACAGTTACTC\n-GTGAGAGGTATCATCACTCCTTTCAGAAAGAAAAGTTCGGCACAAAAATATCGGACCGTT\n-TGGGACGAAAGCACCCGGTCTTTCCCCCTCATATCGCATACGAAAGCCATAGCCCGGGCA\n-CTGGCACATACGGGCAGAGAAGTCCATGTAGCCATGCGCTACGGCAAGCCGGCTGTGGCC\n-GATGTGCTGAAGGAGCTGCCACACGGCCGAAGCCTCGTCGTCCTCCCGCTCTTCCCACAC\n-TACGCCATGAGCAGCTACGAGACGGCCGTGGAGCATTGCAAGGCCGAAATCCGCCGCCTT\n-TGTCCGAATCTTTCCTTCCGCGTCGTGCAGCCTTTCTACGCACACGAAGCCTATATTCGT\n-GTCCTTGCCGATAACATCAGACCCTATCTGACGAAGCCTTTCGACAAGCTCATTCTTTCC\n-TATCACGGCATTCCCCGCGATCATTTGGACAAGACCACCCGACAGGCTTTGAATCTCCGG\n-CATCCCGAAGGATGCTGCACGGAGGAGGATCCTACGGCAAACGTCTGCTACCGCTATCAG\n-ACTTACAGGACGACGGCTCTCATCCGCGAGGCACTTGGCTTGGCCGAGGAGCAGGTGGAG\n-CAGGTGTTCCAGTCACGTGTAGGCCATACCGAATGGCTGCGCCCCTATTTGATCGAACGA\n-CTGTCCGCTTGGCCGCAAGAGGAAACAAAACGTATCCTCATAGCCTGCCCCTCCTTCGTG\n-TGCGACTGTCTGGAGAGCCTCGAAGAAGTAGCCGATCACGGACAAAGCATTTTCAAAAAA\n-GCAGGAGGTGCGGATTTCACTTACATCCCCTGTCTCAATAGCGGGGCGAATTGGATCGAT\n-GCTCTCCGAAACATTTTAGAGGAATAATACAGCATGCTCAGTTATCATACCGATATACCG\n-ACAGACCTGCCCCTCCTGAGGCAAGCCGTCGAAGCCATCCGCCGGGAAGAATCCGGCGGT\n-GCCGTACCCGACTCCGATCGGCCGAGGGTGATATACGAGGCGCGCAACCGGCTTTACGCC\n-ATCCGTACCGCACAGGGAGAGCAGGTGGTGAAGAGCTTCCGGATCCCTATTGCCATTCAG\n-CGCGTGGTCTACTCATTCTTCCGCCCCTCGAAGGCTGCTCGCTCTTATCGCAACGCCATA\n-\n'
b
diff -r 3f33a8ac8891 -r 66058890173e test-data/euk
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/euk Fri Oct 18 11:50:31 2024 +0000
b
b'@@ -0,0 +1,20 @@\n+>eukarya_NW_012132931.1_0_15000 NW_012132931.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold8033, whole genome shotgun sequence\n+gatcagtagtatagtacagggtcaacaacgaatagttaggaaagaaaagagaacccccctccaagctgtaacatctaatctatatctaattgttatctgataagataagataggcatccgcttattctggaatatttATTcagaaaactgtgacaacacgctaggtattcttagatagccaatagcgtattgtgagcatcagtcatcctaagtgttaggtgtactaccagtagtatttggggtctggtcccacatgtataaataccagataatacagcatagtacagcagtctgatcttatTAGATCATACTTTGTCTACTTCACTCAACTCTTCCTCTAAGCTAACCGCTCTCAAGACAAGTCAAGCCTcttacctcttgcaactaccagaaccacacaagtgagtgctggggttagagttagggttagggtcaagggtgatatCTTGACAGTATTCTCCTGAGATTCATAGATATCAGACCCAAAGATGTGATGTGCTGGATAGCTAGGGTGATTTGGTGCCTGTCAAAGTATTGTCCTGATACTTGACACTCtctctaaccctaacccctagatactcacttgtagtggtagGTAGTTGATATAGCTGGGTTGCTGGTTGGCTATAGGAGCTGGTGGGCTCAGAGTTGAGAGTGTGTAAGTTGATGAGGTTAGACAAGTAGTATAACTAGTCTACCCTCTCaatgctgtattgctctggtatttatacaagagggaccagacccctaatactactggtagtacacctaacaccttaggatgactgatgctcataatacactattggctatctaagaatacctagcacgTGAACCATCACCATGTattcggtcagcagtctactatgtgatgatcacctgaatgactgtgtgtgtctctagtacaaatggggaaaatcttgtgtgaacatatgatagcccatttgccctgcttctgataagctagacacctgactagtaacagTGATgccatgcattatgctatccttatctctgtagatatctaattggataagatatagatcatctagatgctaaagataagatagatgccatgaaattctgtgacagtgCCAGAGATAATGTGAAACTATATCTGGACAGGCTTCAATCTTCAATCCAGCACAAATCAACCAGTAGACCCACACACTCAAGACATTCTTTAGCACCAGCAGACTCTAGCTCACCTCTATATATCATGAGATGACAATCTTGAGATGAGATTTGACTAATGATATAGAAGAAAAGAGGCACTTTGTCTACCTCAATTCTCGATACAGGCACCATTCAGGGAGTGTCAAGGGGAATTGCACAGACCTGGCAACACAGTGCATCAGCACCTCTGGCAGTAATAGTGAAGGTCTAATTCAGGACATCTAAGTGATAGATGACCTCAAGTGGAAGTAAGCTATGGAGGTACATTGCATGCAATTCCCATCAGGAGACAGGCATGGTGACAGAGCAAATGAGAGCCTTAAAATAGGAGGTGAACAAAGCAATACCCTAACTTCAACCACTATAGCTAGGTGTCTTTGACGTGTGGCTGGGTGCTCGAATTCATCAGTAGCAACATGTAATATACATAAAATAGAAAGAGACAGACTGTCAAAACAGGTGCGCCATGCTCTGCACCGTACCTTTGAAATGGAGGGAGTCCGCCCGCTAAGTTCGCGGTCGTATGGCGGGGCGTGCGGAGGAATGTCCTGGGTCGCGAATTCAGGCCATCATGAGACTCTCCTGGGCCACTTCCGGCCCGCCTGCGGCGAGCAACCTCCTTGGAATGACCAATTTGCCCGCTGGGTGACATGTGCCACGCGATAGAACCCATCATATATTCTTATCATTTATCTTGATGCCAGACTCTAGTTTCTTTTTCCCCCAGGCTGCTCCTCGACAAATATTGTCGAACTTGAAAGCTGCCATTTCATATTTGACTAGCGGAGATGGATAAGATCCGCAGAGGCAACAACGATCATGCATTAGCCACAGTTTGAAATGATCGAACAGGGTCGTTCACAGGTTGTACCTATGTTGCACTTGGGTAATCAGTACTCAACGttcgctcgtcctcctgttcctacATTCGACCTCTGACAAACACTGTCTTCTGGACCTCTAATAGTACCACGCCCACGGTTGGTTATATTGTCTCACACGTCTCACCACAACATGTACATACAAGTGTCACTTCGAAACTCAATCATGCCCCTGGCATGCGCCTCGCTATTTAATCCAGTGTGTTTTCGACATCAATATGTCACGCCATGAAGGTTTCTTCTCTactctctcttctcgccattTCTGCACTTCAGCTGCTGTCAGCTGTAGCACAGTCCAATGTCACAGTTCTCGCAAAGGATCCGCAAATTGTGTATGCGGGCGGTTGGACAAACCAAGAGAATGGTCAATACTTCTACGCTAACGGACCTGGGTCGTCATTTTCTTTCTCGTTTACAGGTAAGTATAGATTTACATCACGTATATACCATTTTAACTAGGATCGAGTACAGGGACAGCAGTCTATTATCATTCTGTGATAAATCCGAACGGAGGAGTAGCAAGCATTGTCCTGAATAATGGCTCTCCGACCCTTGTAGATGAATCAGAAAATGCTTACGAAGGCGAAGCTCCTATACCGGCTGTACTTTGGTCGAAGACCGATCTGGATGGTGAAAAAAACCATGTACTGAATGTAAGCTATGTAGGCAGTGGAGTATTAGGTGGTGCCTATGTTGAGTTCTATTATCTTCAGTATGTATGTGCTCGGAATAGTGTCTATTGTATCAACATTTACGATACCCATCCAGATATACAAGCTCGGGTAGCCAGACAAATGAAACCGGAAGTGCAGGTCCGATCTCAGGTATTGTTTTTTTGCGGTCCGCATCAGATATTCCTGTTAACACCGCAAGAGGTCAGTAAGTCCTAGCGGAGCTCAAGACTCGCCTTCGATGAGCGGAACATCCAACGGTGGTGCACCTACCGCCTCACTTAAATCTTCAGCGAGCgctgcctcatcctctcACTTTTCAAATACAAGGGCTATTATCATTGGTACTGTGGCTGGAGTGGGAGGCACCCTGATCGTTGCAAGTGCGATCATGTTATTCTTGTGTCGTAAAGGCTGTAGATGGACTGCAAAGATCAATCATACGCGTAAGTTTTAAGCCTACTCCATGCACCTCCATTAGATCCATCTCAACCTGCTTTTACAGCATCACCTTACAATATGAGCACTGTCGAGACTCTGCGACCCCTACGCAGGAAGACACCCGCAATGTCTTCCCTTCCGCCGAATGTCGATCAGCCATCCGCTCCCAACTCATCTCGTCCTGACACACCTAGCGAGCTCCTCACCCCGGCTAATGAAGACGGGCTGACGCCAGAAACACTCCCGTATTCTTCTTATAACGCGAGAGTGATTAAGATGATGCATATTTTGGGATCGTCTCGTTCCACTAGTCCACCAAATGAGCACCACATTACTCCTGGGCCTAGTGCTCTTCCGAGTCATAGTCAGCCTCGTCAGGTGTCCTTGGTTGGTTCTGATAGTTTAACTTACTTATCTGATCCACCGCCTGTGTATGATGGACGTAGGACAGCGTAGCGGTAGTCGGTCTCGTCACGGTATGAGCAATATACTAGAACAATATACTAGTAGCTCTCCCAAATTCCATTTAGTATACATCCACTCACAATCGACTTCAATTGGATTCTAACCATCGCCACGAGCTAATTCTTGTATTACATGACTTGACACCGAGGAAAAGGTATGCTATAATCGTTCTCTAGTGTTCGAACCCACTTATTAGAGC'..b'ATAGGAAGGTTGTACTTTGGGGCCTCAAAGGCACTGACGGCGAAGGAAAGACCCTGCGGGTATTTTAGTCTGTGAATGACGCAGACGTGGCAAAAGACGAACGGtcccgacgaggacgagcttcgAGGTGTCCAGACGTTGCAAAAAGTCGGCCATGATAGAGGCTGGTAAGCTGCAGGAGGGAAGAAGGGAAATGCTGCGGTGTGTGGGGAAGGAAGCGCGGACTGGTTTGGGTTGCGCGTCTGCGCACTCCGCCACCGACGAAACTGATCGCAGCTATGTCCGAGTCCAAAACTGTTTTGGATCTCCTCTCCTATGTTCGCACCAGAGTcaccgtcgatgtcgacTCGATGGATCCTGCCGTCGCTGCTCGGCATACCTCAGGTAGCAAATTCTGCGACATGACCTCCAATCAGGCCATCGTCTACTCTGAGGCCGCCAAGCCTGAGCGCGCACAGCTCTTCAAGACTGCTTGTCAACTGGCACGGGTCAGCGGATCAGACACGGAGAGTCAGATAACAGAGGCTTTGGACATTTTGGTCGGAATCATCTCTCAGATCATGGTGGTCCGATCAGAGCTTAACCACACGCACAGACTGTCCTCCTCGCAAAGGAGGTGTATCCCTACCTTACTGGTCGTGTTCATGCACAGACCTCTCCTCCCACTGCCTATGACACTGAGAAAACCATCGCACACGCGAGGAAGCTCGTCGAACTTTTTGAGGCAAACGGCATACCACGGTGTGCATCATGCTAATATTACCGCTGCGTCACTGAATCATCAGCGCGTACAATGCAGCGACCGGGTGTGTATTAAGATTCCTGCGACACCAGAGTCAATAATAGCCTGCCAAAGGCTCGAGAGTACCGGCATCAGGACTCTTGCGACTTGTCTTTTCTCCCTTCCACAGGCCGTGGCTGCTTCCCAAGCAGGCTGTCTCTACGTCGCGCCGTACTTCAACGGTGACTGATTGGCTTATCGTGAATCAGATTTGACCCAATGACTAATAGTTCTTTTCAACAGAGCTCCGAGTGCACTTTGAACCGAAAATATGGAAGGAATACAACGACACAGCGAGAGAACATCCGATGGCGCCTGTCATCGCCTCTATAGTCCAAGAGTTTAGAGCAATTGATTCGAAGACGCTAGTCATGCCTGCTAGGTAAGGGGCCATGCACCTTCGTGGAAAAATATCTCAACATTACTGTAAAGCATCGTAACCTCGACAGAGGTATGTATATTCAATATGATTTCCATCGAGTATAATTAAGCCGCTCCCATTCGTGAGGTCATTGCATTGGCGTCGTTGCAACCTGATCATCTCACGCTAGCGGGGGCAGTCTTGGACCAGctagcagcagcatcgaatGTCAAACTTCTTGATGAACCGAATACACATGCCTCTCTTAGCATAAACACTACGAGTAATGGCGCTTCATATGGAAAAGGTTGCTTTATAGTGATGTGCTCTGCGGAGGCTATTACTTATGACAACACTGAATATAGATTTTCTTGCTGATGGCGCGAGCGCACTCAGACAGGCTCTAGCTGCTGATGCAGAGGCTACACGCAAACTCGCTGACGCGCTGAAGATATTCGGCGAGATGGAGCAGAAAACCAGGGAACTCGTAAGGAAAGAGCTGGGTGAGATGTAAGGGCTACAAATACGGGATATACCGACATCCATTCTGTCTGTGCCATTTCAATGTTTGATACAGGAGATAATCGTAGTGTACAGTAGTGATGAACAGGGGTATGAGGTCAAATCAAATGTCGTCTGAATTAGAAACACAAGAGTTGTCCTTGTCTGTGTTGGTACCAGTGTCTTCCAATTCTTCTACTAGGTCGCCAATGATTGTAAGGCGTTCCGCTTTGCCCTCTACCTTTTTGCGCTCGAACAGCCAAGGGCAATCTAGTGATTCGCATCTGACAGGCTCCCCGGGGGCAGTTCCGCAACAAGAGCTACAAATTAATTGTACATCTCTCAGTCGGTCTTCTGCCACTCGAAGTCGGGATAGAAGTCCGGAAATGGTCGTTATAGGATCAGCGCGACAATCATCGCACAAGCCTGAAGTATCACTCAGCAAGGCGCACTTGATGAACACGCGATGGTTACCTTCCAACGTCAGTGCTCTACAGTTGATACAATGCGAACTCAGAAAATGTTCTTCAATCTTGAACGCGTTAGTTGCGGCGGTGTATTTCTTGACTCTCCTCGGTGACAGGGAGATTGGGTCTAGTGGCTGGTCTGCACGCAGCGCTTTCGGCATGTCATCGTACCAGCTCCTGACGTCAGCACCAACTAGATTGAATATTCGCTCGAGAGGAGGAATCAGTACTCGAGAAATATAGTACACCGCGTCCAGCTGTTTTTGACTAATCCAGATAAGCCAAACTGTCATCGCGAGATAGAACGATGTACCTGTTGTCAATAAGCTCGCCAGGAGAGACAGCCCTGTCTACCAGCCTGGTATCTGGGTCACCGCGCATGATAACATATGGTACACGTTCCCCATATTGCGGCTCGTCCATGGGGTCATTGGTCGTGCGTCGTGCGGCGACAGTGACTCCTGGGGGTGGTGGAACTTTATCACTGATGACCGAATCAATGTGTGGGCAGCAATCAGCCAATGGGACACACACCTATACGTCCCCATCTTCACCTCTTTAGCGAATATAAAGTCGTGAGGTGAAACTCTATTCTCCAAGATTCGGGTCCAAGATTCATAACAGTATTTTTTGACTTTACTGAGATCCTGCGTGCGAAATAAAATTCTAGCATCTATCAGCAAAGTATTACGGGATTTTTTAAAGCATAATACTTGAGGCAAGTCTctgtcatcttctgctgaGCGGGAATTCCATCTCGACGGACAGTTTCAATGCCCTTGGCATCGAATGTCGGCTCACTGTCATCTGGACTTTCGAACTTGAATCCAACATATCGTTTCTTCGCCATCAGCACACACGGAAGGTATACCTAATTACAACTATAAGGTCTGCGCCACATAGATAAATGTCGACATTATTCACCTTCTCAAACTTAAGCTTTACTGGTGCAGGATTCATGGATGTGACCGTCTCAGCCATATCTTGACCAATGCGGAAGGCTTGCTCCTTGGTCTTCCCACGAAGGTAAATAAAAAGTGAATCTGTATCACCGTACACAACCTTCGCCCCCCATTTCTTCGTTGAATTGATGACGCGAATGGCCTTGATTTAGAATGTGTGTCTCAGATTCCAAACATCAGTGGCACACAGATTTGCGTTACCTTTTCCAACGTCTCGCGACCACTCTGAACAATACTGTCAGCAATTTCAACCGCCGGCATCCGCCCAGAGAATGTAGCACTGGTATATCCGTATGTGACATTGGCAATGAACTTCAGGCCGAGCTGACGAGCATCCAGAATTCGTCTGAGTGCCTATGAGACATTATTATACTCATGACCAGATGCATGCGATTTGGAGCACACCTTATCGTCTTTGGCCCCCTTCATTGCTTGTTTGACCATCACCCGCGTATCCAATAACTCAGTCAACATCCTTCCTAATAGTCCTTTGCGTACGTCTTGATTAACATACACCATCCCGTTAGGTGCGACTGCAACCATGAGGCTTTGGTTTTTTGTATTTGTGCAGCATCTCGATGAGACTCACCGTGCATGTGCTCTTGTAGTGTTTCCAATAGCCCTGCAGGCTGATGTAAATCCGTTACGCCGAATTTGTTTTGTCCTTTGAAATCAGTGACACGTCCAAGACACGTAGAATAACAATAATTATATGCGATCATAACGGAGGGATACAATGATTGAAAGTCGAGTACGACAAGAGGACTGTTATAAAAGGCGGATAGAGGTTCCATGATAAGTGGCATACATTCTGCTGCGTTCTGTTTTCCGACCTTCAACGGTCATTAGCTTTCTGCAGGAGAAAACAGCGGAATTACTCACATCTTGCTTACTGGGGGATAGTAGCACAAAACTCTCTGGTTTAG\n'
b
diff -r 3f33a8ac8891 -r 66058890173e test-data/main_result01.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/main_result01.txt Fri Oct 18 11:50:31 2024 +0000
b
@@ -0,0 +1,11 @@
+sequence_id class_fst_stage class_snd_stage
+plastid_NC_026299.1_0_15000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_15000_30000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_30000_45000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_45000_60000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_60000_75000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_75000_90000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_90000_105000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_105000_120000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_120000_135000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_135000_150000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
b
diff -r 3f33a8ac8891 -r 66058890173e test-data/main_result02.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/main_result02.txt Fri Oct 18 11:50:31 2024 +0000
b
@@ -0,0 +1,51 @@
+sequence_id class_fst_stage class_snd_stage
+archea_HG425166.1_0_15000 HG425166.1 Methanobacterium sp. MB1 complete sequence archaea n/a
+archea_HG425166.1_15000_30000 HG425166.1 Methanobacterium sp. MB1 complete sequence archaea n/a
+archea_HG425166.1_30000_45000 HG425166.1 Methanobacterium sp. MB1 complete sequence archaea n/a
+archea_HG425166.1_45000_60000 HG425166.1 Methanobacterium sp. MB1 complete sequence archaea n/a
+archea_HG425166.1_60000_75000 HG425166.1 Methanobacterium sp. MB1 complete sequence archaea n/a
+archea_HG425166.1_75000_90000 HG425166.1 Methanobacterium sp. MB1 complete sequence archaea n/a
+archea_HG425166.1_90000_105000 HG425166.1 Methanobacterium sp. MB1 complete sequence archaea n/a
+archea_HG425166.1_105000_120000 HG425166.1 Methanobacterium sp. MB1 complete sequence archaea n/a
+archea_HG425166.1_120000_135000 HG425166.1 Methanobacterium sp. MB1 complete sequence archaea n/a
+archea_HG425166.1_135000_150000 HG425166.1 Methanobacterium sp. MB1 complete sequence archaea n/a
+bacteria_AE015924.1_0_15000 AE015924.1 Porphyromonas gingivalis W83, complete genome bacteria n/a
+bacteria_AE015924.1_15000_30000 AE015924.1 Porphyromonas gingivalis W83, complete genome bacteria n/a
+bacteria_AE015924.1_30000_45000 AE015924.1 Porphyromonas gingivalis W83, complete genome bacteria n/a
+bacteria_AE015924.1_45000_60000 AE015924.1 Porphyromonas gingivalis W83, complete genome bacteria n/a
+bacteria_AE015924.1_60000_75000 AE015924.1 Porphyromonas gingivalis W83, complete genome bacteria n/a
+bacteria_AE015924.1_75000_90000 AE015924.1 Porphyromonas gingivalis W83, complete genome bacteria n/a
+bacteria_AE015924.1_90000_105000 AE015924.1 Porphyromonas gingivalis W83, complete genome bacteria n/a
+bacteria_AE015924.1_105000_120000 AE015924.1 Porphyromonas gingivalis W83, complete genome bacteria n/a
+bacteria_AE015924.1_120000_135000 AE015924.1 Porphyromonas gingivalis W83, complete genome bacteria n/a
+bacteria_AE015924.1_135000_150000 AE015924.1 Porphyromonas gingivalis W83, complete genome bacteria n/a
+eukarya_NW_012132931.1_0_15000 NW_012132931.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold8033, whole genome shotgun sequence eukarya n/a
+eukarya_NW_012132937.1_0_15000 NW_012132937.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold8623, whole genome shotgun sequence eukarya n/a
+eukarya_NW_012132972.1_0_15000 NW_012132972.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold11742, whole genome shotgun sequence eukarya n/a
+eukarya_NW_012132977.1_0_15000 NW_012132977.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold12580, whole genome shotgun sequence eukarya n/a
+eukarya_NW_012133002.1_0_15000 NW_012133002.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold15615, whole genome shotgun sequence eukarya n/a
+eukarya_NW_012133036.1_0_15000 NW_012133036.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold26232, whole genome shotgun sequence eukarya n/a
+eukarya_NW_012133063.1_0_15000 NW_012133063.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold33822, whole genome shotgun sequence eukarya n/a
+eukarya_NW_012133067.1_0_15000 NW_012133067.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold36096, whole genome shotgun sequence eukarya n/a
+eukarya_NW_012133074.1_0_15000 NW_012133074.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold38051, whole genome shotgun sequence eukarya n/a
+eukarya_NW_012133082.1_0_15000 NW_012133082.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold39632, whole genome shotgun sequence eukarya n/a
+mitochondria_NC_013604.1_0_15000 NC_013604.1 Acraea issoria mitochondrion, complete genome organelle mitochondrion
+mitochondria_NC_014887.1_0_15000 NC_014887.1 Acrida cinerea mitochondrion, complete genome organelle mitochondrion
+mitochondria_NC_015799.1_0_15000 NC_015799.1 Abidama producta mitochondrion, complete genome organelle mitochondrion
+mitochondria_NC_015842.1_0_15000 NC_015842.1 Agriosphodrus dohrni mitochondrion, complete genome organelle mitochondrion
+mitochondria_NC_016432.1_0_15000 NC_016432.1 Alloeorhynchus bakeri mitochondrion, complete genome organelle mitochondrion
+mitochondria_NC_018095.1_0_15000 NC_018095.1 Ahamus yunnanensis mitochondrion, complete genome organelle mitochondrion
+mitochondria_NC_018133.1_0_15000 NC_018133.1 Actias selene mitochondrion, complete genome organelle mitochondrion
+mitochondria_NC_018542.1_0_15000 NC_018542.1 Alulatettix yunnanensis mitochondrion, complete genome organelle mitochondrion
+mitochondria_NC_018754.1_0_15000 NC_018754.1 Acleris fimbriana mitochondrion, complete genome organelle mitochondrion
+mitochondria_NC_021396.1_0_15000 NC_021396.1 Adoxophyes orana mitochondrion, complete genome organelle mitochondrion
+plastid_NC_026299.1_0_15000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_15000_30000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_30000_45000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_45000_60000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_60000_75000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_75000_90000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_90000_105000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_105000_120000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_120000_135000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
+plastid_NC_026299.1_135000_150000 NC_026299.1 Acorus gramineus plastid, complete genome organelle plastid
b
diff -r 3f33a8ac8891 -r 66058890173e test-data/main_result03.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/main_result03.txt Fri Oct 18 11:50:31 2024 +0000
b
@@ -0,0 +1,11 @@
+sequence_id class_fst_stage class_snd_stage org bac arc euk unk1 pla unk2 mit
+eukarya_NW_012132931.1_0_15000 NW_012132931.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold8033, whole genome shotgun sequence eukarya n/a 0.000000 0.000000 0.000000 1.000000 0.000000 n/a n/a n/a
+eukarya_NW_012132937.1_0_15000 NW_012132937.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold8623, whole genome shotgun sequence eukarya n/a 0.000000 0.000000 0.000000 1.000000 0.000000 n/a n/a n/a
+eukarya_NW_012132972.1_0_15000 NW_012132972.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold11742, whole genome shotgun sequence eukarya n/a 0.000000 0.000000 0.000000 1.000000 0.000000 n/a n/a n/a
+eukarya_NW_012132977.1_0_15000 NW_012132977.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold12580, whole genome shotgun sequence eukarya n/a 0.000000 0.000000 0.000000 1.000000 0.000000 n/a n/a n/a
+eukarya_NW_012133002.1_0_15000 NW_012133002.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold15615, whole genome shotgun sequence eukarya n/a 0.000000 0.000000 0.000000 1.000000 0.000000 n/a n/a n/a
+eukarya_NW_012133036.1_0_15000 NW_012133036.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold26232, whole genome shotgun sequence eukarya n/a 0.000000 0.000000 0.000000 1.000000 0.000000 n/a n/a n/a
+eukarya_NW_012133063.1_0_15000 NW_012133063.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold33822, whole genome shotgun sequence eukarya n/a 0.000000 0.000000 0.000000 1.000000 0.000000 n/a n/a n/a
+eukarya_NW_012133067.1_0_15000 NW_012133067.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold36096, whole genome shotgun sequence eukarya n/a 0.000000 0.000000 0.000000 1.000000 0.000000 n/a n/a n/a
+eukarya_NW_012133074.1_0_15000 NW_012133074.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold38051, whole genome shotgun sequence eukarya n/a 0.000000 0.000000 0.000000 1.000000 0.000000 n/a n/a n/a
+eukarya_NW_012133082.1_0_15000 NW_012133082.1 Fibroporia radiculosa TFFH 294 genomic supercontigs, scaffold39632, whole genome shotgun sequence eukarya n/a 0.000000 0.000000 0.000000 1.000000 0.000000 n/a n/a n/a
b
diff -r 3f33a8ac8891 -r 66058890173e test-data/mitplas1.fasta
--- a/test-data/mitplas1.fasta Thu May 30 11:10:39 2024 +0000
+++ /dev/null Thu Jan 01 00:00:00 1970 +0000
b
b'@@ -1,7279 +0,0 @@\n->mitochondria_NC_013604.1_0_15000 NC_013604.1 Acraea issoria mitochondrion, complete genome\n-TTAAAAATAAGCTAAATTAAGCTTTTGGGTTCATACCCCAAATATAAAGGAAACCCCTTT\n-TTTTTAAAAATAAAGTGCCTGATTAAAAGGATTATTCTGATAGAATAAATTATGTAATTT\n-TCTTACCTTTATTATATTTTATAGAATTAAACTATATCTAATAACTTCAAAAATTATTGT\n-GCATCTTACACTAAAATATAATTACCAAAATATGAATAAATTTCATTTTAGAATTATAAT\n-TCTTATTTTTAATTTTATACACAAATAATTCAAATAAAATATTTTTTTTATTTATTTTAT\n-TTTTTAGAACAATAATTTCTATTTCAGCTAATTCATGATTAGGATGTTGAATTGGACTAG\n-AAATTAATTTATTAAGATTTATCCCTCTAATATCTTCCCCCCTAAATTTACTTAATTCTG\n-AAGCATCATTAAAATACTTTTTAACCCAATCAATTGCTTCAATTAATTTCCTATTTTCTA\n-TTTTATTAAATTTATTATTATTTAAATTTTTTTTTTATGATAATTTTTTATCAATTTTAA\n-TTAATTCAACTTTATTTATAAAAATAGGGTCAGTACCTTTTCATTTTTGATTCCCTAATA\n-TTATAGAAGGATTATCATGATTTAATAATTTTATTTTAATAACCTGACAAAAAATTTCCC\n-CTATAATTTTACTTTCTTACTACATAAATTTTAATTATTCAATTTTTATTATAATCTTAA\n-ATGTACTCATTGGGACTATTGGAAGATTTAATCAATCTTCTTTACGTAAACTTATAGCCT\n-TTTCTTCAATTAATAATTTAGGATGAATAATTTCAGCTTTATTAATTAGAGAAAATTTAT\n-GATTAACTTATTTCTTATTTTACTCCATATTCCTATTTATTTCTTGTTTTATTTTTTATA\n-TTACTAATATATTTTATATTAATCAATTATTTAATTTTAATTTTAATTATTTTATTAAAT\n-TTACAATTATATTAAATTTTCTTTCTTTAGGGGGATTACCTCCATTCTTAGGATTTTTCC\n-CTAAATGATTAATTATTAATTATTTAATTTTAAATAAATTTTATATTGTTACATTTATTT\n-TTATTATATGTAGTCTAATTATATTATTTGTATATATCCGAATTATCTATTCTTCATTCA\n-TATTTTATTTTATTAAATTGAAATGGTTTAACCTATTTATAAAAAATAATCTAATTATTT\n-TTATTTATTTTTTTAATAGAATTTCATTATTAGGTATAATTTTAAGAACTTTATTTTTTT\n-TTTAATATTAAGGTTTTAAGTTAATTTAAACTAATAATCTTCAAAATTATATATAAAGAA\n-ATTCTTTAAGCCTTAATAATATTTATTATACCTTAAAATTTGCAATTTTAAATCATATTT\n-GAATATAAGACTTTAATAAAAGAGATATTTCTCGTTAATAAATTTACAATTTATCGCTTA\n-TTAACTCAGCCATTTTATTGCGAAAATGACTTTTTTCTACTAATCATAAAGATATTGGAA\n-CTTTATATTTTATTTTTGGAATTTGATCAGGAATAGTAGGAACATCTTTAAGATTATTAA\n-TTCGTACAGAATTAGGAACCCCAGGATCTTTAATTGGAGATGACCAAATTTATAATACTA\n-TTGTAACTGCTCATGCTTTCATTATAATTTTTTTTATAGTTATACCAATTATAATTGGAG\n-GATTTGGAAACTGATTAGTCCCATTAATATTAGGAGCCCCAGATATAGCTTTCCCTCGTA\n-TAAATAATATAAGTTTTTGACTTCTTCCCCCCTCATTAATTTTATTAATTTCTAGAAGAA\n-TTGTTGAAAATGGAGTAGGAACAGGATGAACAGTTTACCCCCCCCTTTCCTCTAATATTG\n-CCCATAGAGGTTCTTCAGTAGATTTAGCTATTTTTTCTTTACATTTAGCTGGTATTTCTT\n-CTATTTTAGGAGCAATTAACTTTATTACAACAATTATTAATATACGAATTAATAATTTAT\n-CTTTTGATCAAATACCTTTATTTGTTTGAGCAGTAGGTATTACAGCCCTTTTACTTCTTT\n-TATCCCTACCTGTATTAGCAGGGGCTATTACTATATTATTAACAGATCGAAATTTAAATA\n-CTTCCTTTTTTGATCCTGCTGGTGGAGGAGACCCAATTTTATACCAACATTTATTTTGAT\n-TTTTTGGACATCCTGAAGTTTATATTTTAATCCTACCTGGATTTGGAATAATTTCACATA\n-TTATTTCCCAAGAAAGAGGAAAAAAAGAAACTTTTGGAGCTTTAGGAATAATTTATGCTA\n-TAATAGCAATTGGATTACTTGGATTTATTGTTTGAGCTCATCATATATTTACAGTAGGAA\n-TAGATATTGATACTCGAGCTTATTTTACATCAGCAACAATAATTATTGCAGTCCCTACAG\n-GAATTAAAATTTTTAGTTGATTAGCAACTTTACATGGGACTCAAATTAACTATAGCCCCT\n-CAATATTATGAAGATTAGGATTTATTTTCCTATTCACAATTGGGGGATTAACCGGAGTAA\n-TTTTAGCTAACTCTTCAATTGACATTACCCTACATGATACATATTATGTTGTTGCCCATT\n-TTCATTATGTTTTATCTATAGGAGCTGTATTTGCTATTTTTGGAGGATTCATTCATTGAT\n-ACCCATTATTTACAGGATTAATACTTAACCCTTATTTATTAAAAATTCAATTTATTTCCA\n-TATTCATTGGAGTAAATTTAACATTTTTCCCTCAACATTTTTTAGGACTCGCAGGAATAC\n-CTCGACGATACTCCGACTATCCTGATAGATTTATATCATGAAATATTATTTCTTCTTTTG\n-GGTCTTATATTTCATTATTATCAATAATTTTAATTATTATCATTATTTGAGAATCAATAA\n-TTAATCAACGAATTATTTTATTTTCCTTAAATATACCATCTTCTATTGAATGATATCAAA\n-ATTTACCCCCAGCTGAACATTCTTACAATGAATTACCTATTTTAAGTAACTTCTAATATG\n-ACAGATTATATGTAATGGATTTAAACCCCATTTATAAAGGTAAATCCTTTTTTTAGAAAT\n-GGCTACTTGATCTAATTTTAATTATCAAAATAGAACTTCCCCTTTAATAGAACAAATTAT\n-TTTTTTTCACGATCATACTTTAATTATTTTAATTATAATTACAATTTTAGTTTCTTATTT\n-AATAATTAATTTATTTTTTAATAAATATATTAATCGATTTCTTTTAGAAGAACAAATAAT\n-TGAATTAATTTGAACTATTTTACCAGCTATTACTTTAATTTTTATTGCTCTTCCTTCTTT\n-ACGATTACTTTATCTCTTAGATGAACTTAATAACCCATTAATTACTTTAAAGTCAATTGG\n-GCATCAATGATATTGAAGTTATGAATACTCTGATTTTAATAATATTGAATTTGACTCTTA\n-CATAATTCAATCTAATGAAAATTTAAATAATTTTCGTCTTCTTGATGTTGATAATCGAAT\n-TATTTTACCTATAAAAAATCAAATTCGAATTTTAGTAACAGCTACTGATGTAATTCATTC\n-ATGAACAATCCCCTCATTAGGAGTAAAAATTGATGCAAACCCAGGACGTCTTAATCAAAC\n-TAGATTTTTTATAAATCAACCAGGAATTTTTTATGGTCAATGTTCTGAAATTTGTGGAGC\n-TAATCATAGATTTATACCTATTGTTGTAGAAAGTATCCCTATTAAGAATTTTATTAATTG\n-AATTAATAATTACTCATTAGATGACTGAAAGCAAGTAATGGT'..b'ATAATCGAGATCATTCTTTGATACAGGATG\n-ACTATGAGTCAGACTCCATAGAATTTGATCAATCCTTTTTTCGGTCGTTAAGGTGGAGAA\n-CTGAACTGCCAAGTCTCTTTCGTCCTCATCAATCAAATCATTGATCGTAACCCAGGATTC\n-TACTCTGTCTTCAATCCAATCACTGTTCACGTTTTTTCTTTCTCTTATCAATGAATAGAT\n-CTCTTTACTTGTACGACTTAGATGTCTCGTATTTCTCGAAAAAGTGATGGTATTTGATAT\n-GATACTTATGAGATCGATATTCCAATCTAATTGTTCCAGAGCAAAGAGATTATTTAACAA\n-GAAAGAATTCAGTTCATATTCATATTCAGATTCAGATTTAGATGTAGATGTAGGATACCT\n-ATACAGAAGTTTTTGCAACTCAATCATGTATGATGGAATCATCAAAGATTTGATCTTTTC\n-TAACTCTGTCTGTAACTCATTAGAGACTCGGGAAACAAAGAGAAGATGCGTACGAACGAG\n-ATATCCAGCAACAAGAAGAAGGAAAAGGATTGAATAGAGGAACTCCCGAGCATTTGTTGA\n-TCTCAGATGTGTCAATATCATTGAAACGGGTGACTCATTATTTCGATGAATCATTTCTTC\n-GGACAGAAGAAGATTCTGTAAACACTTACTCGAAATCTCACTTATCAGATTCCATTGTGG\n-AAGAATCGTCCACCATTTTTTAATTAGCCGTGATATATCTGATCTATGCATAATAGAATT\n-CAAAATGGATACCGATTTTGGACTACTACTTAGTATCGACAATCGGTCTGAAAAAATATC\n-TAAAAGGACGGAAGTTAGATATTTGCACCCTGTCGAAGTAAGGAACCATGGCATATATGT\n-TTGGAACAGATTCCATTTTGAAAAAGCACTATCCCGTTGTTGAGAGGTTCTATACATCTG\n-CCCTTTCTCAACGCATTTCTTTAGATAAAGACTCCGTTTTTTCCTCAGATAAAGACTCCG\n-TTTTTTCCTCAGATAAAGACTCTGTTTTTTCCTCTTTACGTATGGTAAATTTTTCTCAGA\n-ACATGGAGTGTGAATCAAACCAATGTTTGAATTGAAACTGAGATACTGATGCAAGTTCTT\n-CCCTTCTGAATCGGATAGATTCATATCTGAAAGAGGCTGACAATAAGTTCTTTCAAAATT\n-GACTATTTGTTCCTCTGTTAGAGGTGTTCCAGAAATGTCTGCGATCGAGTAAAGAGCTCT\n-ACGAACGAATGGATCGGGTCGAATTGGAAAACGGAAAGATTTGTACAAGTTATACGTTTC\n-GTCACCACTTTGTGGAAAATCGTTAGGTATGAATATGTCAGATACCTGTGAATAAATCGG\n-TAAAAGATGTTTTTTTTTACCGACGCATAAAGAAAATATTTTGTTGCGAATGAACAAGAT\n-ATTGAGGAATTGTCCATATGTACGATCATAATTATTGATACGGGTCTTTTCCACATAAAA\n-GGGGAATCTTTTGTTACAATAGAACCAGAAGTGATGTGGATTATTCAAGAATCGAAGTTG\n-ATTTGCTTTATAAAAAGACGATATCAATGAACTTCTATGAAATGGTTTCACGGGATTCAG\n-CCAATTGTCTCGATCGTGGGATATCATTGAGAAATAGGAATCCGTGTTAGCAAAGGATTT\n-GCTGCGATTCTTTCTAGTATGGAATGAGTCAATCATCCACTTTGGTATCTTATTGAACAA\n-AAATGGTGATATTGTTCCTCCATTGATCAAGAATTTCGATCTTTGGGAAGTATCATGATC\n-AGGTTTCAATTTATGCAAATGAATGATTTGAACACCTATTGATTTTAACAACTGATTGCA\n-GAGCGGCTCATTCGGACCTTTCAATTCATAGATGTGGATCTCGGACCTATGAATGGGGCT\n-ATTCCCGATACTCACAAAGAACAAAGGAAGTGACTTGGACAAAAAGAAACGAAGTGGCTT\n-GGACAAAAAGAGAAGTGACTTGGACAAAAAGAAACGAAGTGACTTAGACAAATCTTGTTT\n-GTCGATAGCCTCGGACCAATTAATCGAATATTGATTAATACGTAATTGATCAAACACTAC\n-TTGAAAACGGTTCTTCTGTTCAGAAACGAAATGTTCCAAATGTTCCTGGAAATTCTTACT\n-CCCGTTGGACCATTTGTATCTATATGCATTAGGATCCCGATTCATGGATCTCTCGGTTCG\n-AGAAATAAGAGGATCAAACCATTTCTTCTGACTCTTTTTCAAATTCGATAAATGTTGGTT\n-GATCGTATATTTCATTATAGTTATATGATTCAGAGTATCATTTCCTATTTGATCCCTTTG\n-AATTCCATATTCGAAGTTGCGATCGGATCTATTCATTAAAAAGAATCGATTCAATACATT\n-TCTTATGTACCCATAGGCGCTATATTGGATTTGAATCAGATTTCGGATCAATCTATATTG\n-ATTGACTGCCTCCATTATGTTGTTGCTAGCAAATACCACTCTTTTGAGTTTTGAATCTTC\n-CAAATCATTCCCGCAGTGGATCCAGACCGGTTTTTTTCTGATGCTTCGATAAAAAAAGGC\n-ATTCTCTTCATAAAAAAGAGGAGGTAGAACCAATAAAGATTTCTTTTTCGATTCATCCTT\n-TGTTTTTTCCTTTCCATTCACTAATTTTTTTTGATCTAATCCGCAGGAATCAATCGAAAA\n-GGCAAATCCCCTATGATACACCAGATCCGGCTCGGTTATTGATAGAGTGAATAGATCTGC\n-CATTTCTTGAAATCTCTCTTCTGATTCAAAATCGTGGTGTAATGTGTACCCCCCCTTGTT\n-CCGATCGTGGAATAGATGAAATAAATCAAAAAATGGATTTTTGTTCAAGAATGAAATCTT\n-ATTGGAACTGTCCATATCTGGTTCATCCTTCGGAACCATATCACATCCCGGATCTGATGA\n-AATAGGATGAATTGAGACGGTATTTTGTAAATAAGTAATTATCTTGAATATATCAACCAT\n-TTCTTTATTTTCTGATCGCCGGGAAGAGACAAAAGAAACATCTTGTTGTTTCTTCAACCA\n-TTTCTGATCTCTAGTGGACCTGTCAGTAGGATTCGAACCCATATGAAGTTCTGACCATCT\n-GTCAGAGAAAAAAGAACGAATTGATCTTGTAGGATTCCCAAGAAATTCGTCGATTTCTTC\n-CGGAAGCCGATGAATAATCATCTGCTTCTCATGTTCGGGGAATAGCGGGGACATTGGGGA\n-AGATCCAGAAAGGCATTTCGGGAATCGATCTGATTCTATCTCTGTTCGTTCCGTTTGAAG\n-AAAGGAAGGATCCCCAGGAATCGATCTTCCTTTTAGTTGCGGAATCTCTGTTTGATCGAT\n-CAATGTGTGATATTCTGAATCCTCCTTACTAATGGAATCGAAGTGATCTCTGGATTGATC\n-AGAAGATCCTTTCGATTGGCTAAAATCCGTTACTTGAACGAAAATAGATCTTGTGGAATC\n-ATATTGAATATTTGACGATACATTCTGTACCTTGCTAAAAAACCGATCCTTGCGGATCGG\n-ATCATCCGTATAGGATAAAAAAAGAAACTCCAGATATTTTAGATCTTTCTCTTTGGATGA\n-GATCTCAATTCCAGCTACGGTTTTATTAGATATCTTACAACTAGAATCCCTCTTTTTTCC\n-GATCCGGTTCCTCCACCACCGCGAACCCCGGTTAGATTCGGGCATGATACGCTTTTGATT\n-TATTTTATTTATTGGGAAAAGCCAAAGACTCTCTTTCGGATCCATGAAACAACTCTCAGA\n-GGTCTTTTTCCCTTTTGGAAGATACAGGAGCAAAACAATCAACCTATTGATATCGGAAGA\n-CCAAAAGGATTCTTCCAATGTCTCATTTCCGGGTCCAATGGAATTCATAGGTATAGGAAG\n'
b
diff -r 3f33a8ac8891 -r 66058890173e test-data/pla
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/pla Fri Oct 18 11:50:31 2024 +0000
b
b'@@ -0,0 +1,20 @@\n+>plastid_NC_026299.1_0_15000 NC_026299.1 Acorus gramineus plastid, complete genome\n+GAGCTTATATGAGTGAAACACTAAAAAAAGAGCTTATATGAGTGAAACACTAATCAAATGAACCGAATGGAGCAATACCAAATCTCTTGATAGAACAAGATATTGCGTATTGCTCCTTCAACGACTCATATACACTACACTTACACTACACTAAGACCGAAGTCTTATCCATTTGTAGAAGGTGCTTCAACAGAAGCTAGGTCTAGAGGGAAGTTGTGAGCATTACGTTCATGCATTACTTCCATACCAAGGTTAGCACGGTTGATGATATCAGCCCAAGTGTTAATAACACGACCTTGACTGTCAACTACGGATTGGTTGAAATTGAAACCGTTTAGGTTGAAAGCCATAGTACTAATACCTAAAGCAGTGAACCAGATACCTACTACAGGCCAAGCAGCCAAGAAGAAATGTAGGGAACGGGAATTGTTGAAACTAGCATATTGGAAGATTAATCGGCCAAAATAACCGTGAGCAGCGACGATATTATAAGTTTCTTCCTCTTGACCGAATCTGTAACCTTCATTAGCAGATTCGTTTTCAGTAGTTTCCCTGATTAAACTGGAGGTTACCAAGGAACCATGCATAGCACTAAATAGGGAGCCGCCGAATACACCAGCTACGCCTAACATGTGGAATGGATGCATAAGGATGTTGTGTTCGGCCTGGAATACAATCATAAAGTTGAAAGTACCAGATATTCCTAGAGGCATACCATCAGAGAAGCTTCCTTGACCAATAGGGTAGATCAAGAAAACAGCAGTAGCAGCTGCAACAGGAGCTGAATATGCGACAGCAATCCAAGGACGCATACCCAGACGGAAACTAAGTTCCCACTCACGACCCATATAACAAGCTACACCAAGTAAGAAGTGTAGAACAATTAGTTCATAAGGACCACCATTGTATAACCACTCATCAACGGATGCTGCTTCCCAAATTGGGTAAAAGTGCAAACCTATAGCTGCAGATGTAGGAATAATGGCACCAGAAATAATGTTGTTTCCATAAAGTAAAGACCCGGAAACAGGTTCACGAATACCATCAATATCTACTGGAGGAGCAGCGATGAAGGCGATAATAAATACAGAAGTTGCGGTCAATAAGGTAGGGATCATTAAAACACCGAACCATCCAATGTAAAGGCGGTTTTCGGTGCTGGTTATCCAGTTACAGAAGCGACCCCATAGGCTTGTACTTTCGCGTCTCTCTAAAATTGCAGTCATGGTAAGATCTTGGTTTATTTAATTATCAAGGACTCCCAAGCGCATGAACTATCTATAAATAGATATAGATAATGGAAGGCTTGTTATTTAACAGTATAACACGACTCATATGTCCATGTCAACCAACATCGACAGGTAGATTTATCTAGCGATCTATATAAATAATAGATCTTTCTTTTTCGATTTTACGTATGGGTTGCCCGGGACTCGAACCCGGAACTAGTCGGATGGAGTAGATAATTTCCTTTTGCAATAGGCTAAAAGGATCCCTCCCCAAATCGTGCTTGCATTTTTCATTGCACACGACTTTCCCTATGTATACATCTAAAACTTAGTTTCCTGGAAGGAAGAAACTTGAATACTCAGTTGATTCAACCACTACTCTATAAGCATTTCAGAATGCAAATACATGAGAATTTTTGTCTCTTCATCATTTATTTATAGATCGTTTCTATTCCATTTATTAGAAAAGTCCCATGACAAATCATGAATTATTCACCAGGTCATTGATACGTATAATATCCAAATACCAAATACGTTCTCCTTTATGGACCCTGGGTGAAGGTGAACGAAGGGAAGGGAAGATCAAAGAAAGAACTTGTTCTTTATCCGTAAAGAATTCTTCTAAGAATTCTGAACCTAATCGTTTGAAAAAAGCGCGCACTGTACTTTTATGTTTACGGGCCAAAGTTCTCGCACACGAAAGGCGAAGTATATACTTTACTCGATACAAACTCTGTTTTTTTGAGGATCCACTGTGATAATGAGAAAGATTTCTACATATTCGTCCAAATCGATCAATAATATCAGCATCTGACAAATCAGCCCAGACCGGCTTACTAACAGGATGCCCTGATACGTTACAAAACTTAGCTTTAACCAATGATCCGATTAGAGGAATAATTGGGACTATAGTATCGAATTTTTTAGTAGGAGTATCCATCAGAAATGAACTCTCTAGCATTTGACTCCTTACCGTCGAAAAATTGATTCGTACACTTGAAAGATAGCCCATAAAATAGAAAGAACGATTTGATAATTGGTTTATATGAATCCTATGCGGTTGAGACCAAAAGTAAAAACGACATTGCCAGAAATTTAGAAGGTGATATTTCCATTTCTTCATCAGAAAATGAGTCCCCTTTGAAGCCAGAATTGATTTTCCTTTATATCGGATATAATGGATGAAAGGATCTTTGAACAAAGATAAGGCCTTTTGAAAATTCTTCCTACGCACTACTACAATATGCTCTATTTTTCCATAGAAATGTGTTCGCTCAACAAAGGTTCCAAAAGATGTTGATCGTAAATAAAAGGATTGTTTACGGAGAAAGACTAATGCGGATTCACACTCAAATACATAAGAATTATATAAGAACAAGAAGAGTCTTTGATTCCCCTTTGAAAAAAGAAAAGAAATGGATTTCTTTGGAGTAATGAGACTATTCCAATTATGAAACTCATGGAGAAAGAACCGCAATAAATGTAAAGACGGAACATCTTGTATCCAGCCTTGAAGAACTTGAACCAGGATTTCGAGATGGATGGGATAGGGTATTAATATATCTGATACATGATTTAAATGTGATAATTTGTCTTCTAAAAAGGGAAATGTTGCATGAATAGATCGTAAATTCTGAATTTTTGGTATTTTTGCTTTTTTTTCTTCAACGGAAGATAAAAATATTATCGAGAATGGAATTTCCATAATGACTGAAAAACCCTCTAATATCGTTTGATAATAAAAATTCTTGTTTTGCCGAACTAATCGATTTCGGTTAGAATCATTAACCAAATTACTCAAAGAATTCTGTTGATACATTTGAGTAATTAAACGTTTTACAATTATTAAACTAAATTTATTATCATAAACGAAATTTTCCGAGGATTCGTAAAAAATCAATCCATTTAAAACATGATTATGAGCAAGTGCGTAGATGTACTCCTGAAAGAGAAGTGGATATAGGAAGTATTGTTGACGAGACCCATCTTTTTCGAAATAGACTTTGAATTCTTCCATTTGAAATTTTATTTGATTGAACTAAATGCAGGAAGAATTTCTTGGATTATCAAATGATACATAGTGCGATATGGTCAGAACGCGGTATAGAAAAAAACGAATACCACGGAGACAGGGAGTCCAATCAACAGACCTTCTTCCTCTCTTTTTGCATTCAACCAGTTTGTGTTCGTTATAGTTACACGAGATGGTCAGAAATCTTTTATTTTTGCAACCCAATCGCTCTTTTGACTTTGGAAAAATTTATCTCTATCAGTATACCGGTTCTCTTACACATTCGTCTCCACTCTATAATATGGAATAGTTAGGATTCAAAAAGGAATCGATGATCCACTCACAAGAGAACCCTTTCCCGCATCAGGCACTAATTTATTTTTAACGTCTAATTAGATTGGGTAATCATTCGAATTAAGAACATAAGCTCGTTTCTTTTTCTTTCCTTAGAATTGGAGCCACAAGGCTCTATCCATTTATTCACTCGACCCAACTCCAACCGCGAATTGATTTTGTCATGTTCCAAAAATCAAACAAAACGATTTTTATATCGATCCGGTAAGGATGGAGTATTCTCAGAGTTCTTCATTAATACGACATGCTATTTTTTCCCTTCATTCCCTTTAAGGATCAGTCGTGGTCTTATTAAACTCTACC'..b'CGATAATTAGCAAGGAATATCCGTTTTTCTGCTAAACAGGATCCATTGAACTCATAATTCATTAGATCCTTTTTATGAATGTCAACTAAGTATCGTAAGGAAATTAATCCCGGTTGTTCAATCATTTGATAATCGAGATCATTCTTTGATACAGGATGACTATGAGTCAGACTCCATAGAATTTGATCAATCCTTTTTTCGGTCGTTAAGGTGGAGAACTGAACTGCCAAGTCTCTTTCGTCCTCATCAATCAAATCATTGATCGTAACCCAGGATTCTACTCTGTCTTCAATCCAATCACTGTTCACGTTTTTTCTTTCTCTTATCAATGAATAGATCTCTTTACTTGTACGACTTAGATGTCTCGTATTTCTCGAAAAAGTGATGGTATTTGATATGATACTTATGAGATCGATATTCCAATCTAATTGTTCCAGAGCAAAGAGATTATTTAACAAGAAAGAATTCAGTTCATATTCATATTCAGATTCAGATTTAGATGTAGATGTAGGATACCTATACAGAAGTTTTTGCAACTCAATCATGTATGATGGAATCATCAAAGATTTGATCTTTTCTAACTCTGTCTGTAACTCATTAGAGACTCGGGAAACAAAGAGAAGATGCGTACGAACGAGATATCCAGCAACAAGAAGAAGGAAAAGGATTGAATAGAGGAACTCCCGAGCATTTGTTGATCTCAGATGTGTCAATATCATTGAAACGGGTGACTCATTATTTCGATGAATCATTTCTTCGGACAGAAGAAGATTCTGTAAACACTTACTCGAAATCTCACTTATCAGATTCCATTGTGGAAGAATCGTCCACCATTTTTTAATTAGCCGTGATATATCTGATCTATGCATAATAGAATTCAAAATGGATACCGATTTTGGACTACTACTTAGTATCGACAATCGGTCTGAAAAAATATCTAAAAGGACGGAAGTTAGATATTTGCACCCTGTCGAAGTAAGGAACCATGGCATATATGTTTGGAACAGATTCCATTTTGAAAAAGCACTATCCCGTTGTTGAGAGGTTCTATACATCTGCCCTTTCTCAACGCATTTCTTTAGATAAAGACTCCGTTTTTTCCTCAGATAAAGACTCCGTTTTTTCCTCAGATAAAGACTCTGTTTTTTCCTCTTTACGTATGGTAAATTTTTCTCAGAACATGGAGTGTGAATCAAACCAATGTTTGAATTGAAACTGAGATACTGATGCAAGTTCTTCCCTTCTGAATCGGATAGATTCATATCTGAAAGAGGCTGACAATAAGTTCTTTCAAAATTGACTATTTGTTCCTCTGTTAGAGGTGTTCCAGAAATGTCTGCGATCGAGTAAAGAGCTCTACGAACGAATGGATCGGGTCGAATTGGAAAACGGAAAGATTTGTACAAGTTATACGTTTCGTCACCACTTTGTGGAAAATCGTTAGGTATGAATATGTCAGATACCTGTGAATAAATCGGTAAAAGATGTTTTTTTTTACCGACGCATAAAGAAAATATTTTGTTGCGAATGAACAAGATATTGAGGAATTGTCCATATGTACGATCATAATTATTGATACGGGTCTTTTCCACATAAAAGGGGAATCTTTTGTTACAATAGAACCAGAAGTGATGTGGATTATTCAAGAATCGAAGTTGATTTGCTTTATAAAAAGACGATATCAATGAACTTCTATGAAATGGTTTCACGGGATTCAGCCAATTGTCTCGATCGTGGGATATCATTGAGAAATAGGAATCCGTGTTAGCAAAGGATTTGCTGCGATTCTTTCTAGTATGGAATGAGTCAATCATCCACTTTGGTATCTTATTGAACAAAAATGGTGATATTGTTCCTCCATTGATCAAGAATTTCGATCTTTGGGAAGTATCATGATCAGGTTTCAATTTATGCAAATGAATGATTTGAACACCTATTGATTTTAACAACTGATTGCAGAGCGGCTCATTCGGACCTTTCAATTCATAGATGTGGATCTCGGACCTATGAATGGGGCTATTCCCGATACTCACAAAGAACAAAGGAAGTGACTTGGACAAAAAGAAACGAAGTGGCTTGGACAAAAAGAGAAGTGACTTGGACAAAAAGAAACGAAGTGACTTAGACAAATCTTGTTTGTCGATAGCCTCGGACCAATTAATCGAATATTGATTAATACGTAATTGATCAAACACTACTTGAAAACGGTTCTTCTGTTCAGAAACGAAATGTTCCAAATGTTCCTGGAAATTCTTACTCCCGTTGGACCATTTGTATCTATATGCATTAGGATCCCGATTCATGGATCTCTCGGTTCGAGAAATAAGAGGATCAAACCATTTCTTCTGACTCTTTTTCAAATTCGATAAATGTTGGTTGATCGTATATTTCATTATAGTTATATGATTCAGAGTATCATTTCCTATTTGATCCCTTTGAATTCCATATTCGAAGTTGCGATCGGATCTATTCATTAAAAAGAATCGATTCAATACATTTCTTATGTACCCATAGGCGCTATATTGGATTTGAATCAGATTTCGGATCAATCTATATTGATTGACTGCCTCCATTATGTTGTTGCTAGCAAATACCACTCTTTTGAGTTTTGAATCTTCCAAATCATTCCCGCAGTGGATCCAGACCGGTTTTTTTCTGATGCTTCGATAAAAAAAGGCATTCTCTTCATAAAAAAGAGGAGGTAGAACCAATAAAGATTTCTTTTTCGATTCATCCTTTGTTTTTTCCTTTCCATTCACTAATTTTTTTTGATCTAATCCGCAGGAATCAATCGAAAAGGCAAATCCCCTATGATACACCAGATCCGGCTCGGTTATTGATAGAGTGAATAGATCTGCCATTTCTTGAAATCTCTCTTCTGATTCAAAATCGTGGTGTAATGTGTACCCCCCCTTGTTCCGATCGTGGAATAGATGAAATAAATCAAAAAATGGATTTTTGTTCAAGAATGAAATCTTATTGGAACTGTCCATATCTGGTTCATCCTTCGGAACCATATCACATCCCGGATCTGATGAAATAGGATGAATTGAGACGGTATTTTGTAAATAAGTAATTATCTTGAATATATCAACCATTTCTTTATTTTCTGATCGCCGGGAAGAGACAAAAGAAACATCTTGTTGTTTCTTCAACCATTTCTGATCTCTAGTGGACCTGTCAGTAGGATTCGAACCCATATGAAGTTCTGACCATCTGTCAGAGAAAAAAGAACGAATTGATCTTGTAGGATTCCCAAGAAATTCGTCGATTTCTTCCGGAAGCCGATGAATAATCATCTGCTTCTCATGTTCGGGGAATAGCGGGGACATTGGGGAAGATCCAGAAAGGCATTTCGGGAATCGATCTGATTCTATCTCTGTTCGTTCCGTTTGAAGAAAGGAAGGATCCCCAGGAATCGATCTTCCTTTTAGTTGCGGAATCTCTGTTTGATCGATCAATGTGTGATATTCTGAATCCTCCTTACTAATGGAATCGAAGTGATCTCTGGATTGATCAGAAGATCCTTTCGATTGGCTAAAATCCGTTACTTGAACGAAAATAGATCTTGTGGAATCATATTGAATATTTGACGATACATTCTGTACCTTGCTAAAAAACCGATCCTTGCGGATCGGATCATCCGTATAGGATAAAAAAAGAAACTCCAGATATTTTAGATCTTTCTCTTTGGATGAGATCTCAATTCCAGCTACGGTTTTATTAGATATCTTACAACTAGAATCCCTCTTTTTTCCGATCCGGTTCCTCCACCACCGCGAACCCCGGTTAGATTCGGGCATGATACGCTTTTGATTTATTTTATTTATTGGGAAAAGCCAAAGACTCTCTTTCGGATCCATGAAACAACTCTCAGAGGTCTTTTTCCCTTTTGGAAGATACAGGAGCAAAACAATCAACCTATTGATATCGGAAGACCAAAAGGATTCTTCCAATGTCTCATTTCCGGGTCCAATGGAATTCATAGGTATAGGAAG\n'
b
diff -r 3f33a8ac8891 -r 66058890173e tiara.xml
--- a/tiara.xml Thu May 30 11:10:39 2024 +0000
+++ b/tiara.xml Fri Oct 18 11:50:31 2024 +0000
[
@@ -1,4 +1,4 @@
-<tool id="tiara" name="tiara" version="@TOOL_VERSION@+galaxy0" profile="21.05">
+<tool id="tiara" name="tiara" version="@TOOL_VERSION@+galaxy1" profile="21.05">
     <description>Deep-learning-based approach for identification of eukaryotic sequences in the metagenomic data </description>
     <macros>
         <import>macros.xml</import>
@@ -6,17 +6,12 @@
     <expand macro="biotools"/>
     <expand macro="requirements"/>
     <command detect_errors="exit_code"><![CDATA[ 
-        
+        mkdir ./results/ &&
         tiara 
         -t \${GALAXY_SLOTS:-4} 
         -i '$input' 
-        -o '$output'
+        -o ./results/main_result.txt
 
-        #if $taxonomy_filter
-            --tf #for $tf in $taxonomy_filter
-                $tf
-            #end for
-        #end if   
         #if $probabilities
             --pr '$probabilities'
         #end if
@@ -33,6 +28,15 @@
             --k1 $advanced_options.advance.first_stage_kmer
             --k2 $advanced_options.advance.second_stage_kmer
         #end if
+        #if $taxonomy_filter
+            --tf #for $tf in $taxonomy_filter
+                $tf
+            #end for
+            #for $tf in $taxonomy_filter
+              && ls -l ./results/
+              &&  mv ./results/${tf}*.dat ./results/${tf}.fasta
+            #end for
+        #end if
 
     ]]></command>
     <inputs>
@@ -43,9 +47,6 @@
             <option value="bac">bacteria</option>
             <option value="arc">archea</option>
             <option value="euk">eukarya</option>
-            <option value="unk">unknown</option>
-            <option value="pro">prokarya</option>
-            <option value="all">all</option>
         </param>
         <param argument="probabilities" type="boolean" truevalue="--pr" falsevalue="" checked="false" label="Add probabilities of individual classes for each sequence."/>
         <param argument="min_len" type="integer" value="3000" min="1000" optional="true" label="Minimum length of a sequence. Default: 3000 bp." help="Specify the desired minimum length in base pairs.Default value is 3000 bp and we do not recommend classifying sequences shorter than 1000 bp. "/>
@@ -77,48 +78,28 @@
         </section>
     </inputs>
     <outputs>
-        <data name="output" format="txt" label="${tool.name} on ${on_string}: sequence ID, classification results"/>
+        <collection name="output" type="list" label="${tool.name} on ${on_string}: classified sequences in txt and Fasta Output">
+            <discover_datasets pattern="__name_and_ext__"  ext="fasta,txt" directory="results" />
+        </collection>
     </outputs>
     <tests>
         <test expect_num_outputs="1">
             <param name="input" value="plast_fr.fasta.gz"/>
             <param name="taxonomy_filter" value="pla"/>
-            <output name="output" ftype="txt">
-                <assert_contents>
-                    <has_text_matching expression=".*sequence_id*"/>
-                    <has_n_lines n="11" delta="5"/>
-                </assert_contents>
-            </output>
-        </test>
-        <test expect_num_outputs="1">
-            <param name="input" value="mitplas1.fasta"/>
-            <param name="taxonomy_filter" value="pla,mit"/>
-            <output name="output" ftype="txt">
-                <assert_contents>
-                    <has_text_matching expression=".*sequence_id*"/>
-                    <has_n_lines n="30" delta="5"/>
-                </assert_contents>
-            </output>
+            <output_collection name="output" type="list">
+                <element name="main_result" file="main_result01.txt" ftype="txt"/>
+                <element name="pla" file="pla" ftype="fasta" />
+            </output_collection>
         </test>
         <test expect_num_outputs="1">
             <param name="input" value="sample_all.fasta"/>
-            <param name="taxonomy_filter" value="all"/>
-            <output name="output" ftype="txt">
-                <assert_contents>
-                    <has_text_matching expression=".*sequence_id*"/>
-                    <has_n_lines n="51" delta="5"/>
-                </assert_contents>
-            </output>
-        </test>
-        <test expect_num_outputs="1">
-            <param name="input" value="sample_all.fasta"/>
-            <param name="taxonomy_filter" value="euk,bac,arc,unk"/>
-            <output name="output" ftype="txt">
-                <assert_contents>
-                    <has_text_matching expression=".*sequence_id*"/>
-                    <has_n_lines n="51" delta="5"/>
-                </assert_contents>
-            </output>
+            <param name="taxonomy_filter" value="euk,bac,arc"/>
+            <output_collection name="output" type="list">
+                <element name="arc" file="arc" ftype="fasta" />
+                <element name="bac" file="bac" ftype="fasta" />
+                <element name="euk" file="euk" ftype="fasta" />
+                <element name="main_result" file="main_result02.txt" ftype="txt" />
+            </output_collection>
         </test>
         <test expect_num_outputs="1">
             <param name="input" value="eukarya_fr.fasta"/>
@@ -126,26 +107,11 @@
             <param name="min_len" value="5000"/>
             <param name="cutoff_stage1" value="0.65"/>
             <param name="cutoff_stage2" value="0.60"/>
-            <output name="output" ftype="txt">
-                <assert_contents>
-                    <has_text_matching expression=".*sequence_id*"/>
-                    <has_n_lines n="11" delta="5"/>
-                </assert_contents>
-            </output>
-        </test>
-        <test expect_num_outputs="1">
-            <param name="input" value="bacteria_fr.fasta"/>
-            <param name="taxonomy_filter" value="bac"/>
-            <param name="min_len" value="5000"/>
-            <param name="cutoff_stage1" value="0.65"/>
-            <param name="cutoff_stage2" value="0.60"/>
             <param name="probabilities" value="true"/>
-            <output name="output" ftype="txt">
-                <assert_contents>
-                    <has_text_matching expression=".*bac*"/>
-                    <has_n_lines n="11" delta="5"/>
-                </assert_contents>
-            </output>
+            <output_collection name="output" type="list">
+                <element name="euk" file="euk" ftype="fasta" />
+                <element name="main_result" file="main_result03.txt" ftype="txt" />
+            </output_collection>
         </test>
     </tests>
     <help><![CDATA[