Repository 'semibin'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/semibin

Changeset 0:7b382efabb98 (2022-10-14)
Next changeset 1:6b517dc161e4 (2023-03-27)
Commit message:
"planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/semibin commit aa9bfb2fb62547ee8bac34f0de5b3beaa0bfd1a4"
added:
macros.xml
semibin.xml
test-data/S1.fasta
test-data/S10.fasta
test-data/S2.fasta
test-data/S3.fasta
test-data/S4.fasta
test-data/S5.fasta
test-data/S6.fasta
test-data/S7.fasta
test-data/S8.fasta
test-data/S9.fasta
test-data/cannot.txt
test-data/data.csv
test-data/data_split.csv
test-data/input_coassembly_sorted1.bam
test-data/input_coassembly_sorted2.bam
test-data/input_coassembly_sorted3.bam
test-data/input_coassembly_sorted4.bam
test-data/input_coassembly_sorted5.bam
test-data/input_multi.fasta.gz
test-data/input_multi_sorted1.bam
test-data/input_multi_sorted10.bam
test-data/input_multi_sorted2.bam
test-data/input_multi_sorted3.bam
test-data/input_multi_sorted4.bam
test-data/input_multi_sorted5.bam
test-data/input_multi_sorted6.bam
test-data/input_multi_sorted7.bam
test-data/input_multi_sorted8.bam
test-data/input_multi_sorted9.bam
test-data/input_single.bam
test-data/input_single.fasta
test-data/input_single_2.fasta
test-data/input_single_3.fasta
test-data/model.h5
test-data/taxonomy.tsv
test-data/taxonomy_10.tsv
test-data/taxonomy_2.tsv
test-data/taxonomy_3.tsv
test-data/taxonomy_4.tsv
test-data/taxonomy_5.tsv
test-data/taxonomy_6.tsv
test-data/taxonomy_7.tsv
test-data/taxonomy_8.tsv
test-data/taxonomy_9.tsv
test-data/test-db/GTDB
test-data/test-db/GTDB.dbtype
test-data/test-db/GTDB.index
test-data/test-db/GTDB_mapping
test-data/test-db/GTDB_merged.dmp
test-data/test-db/GTDB_names.dmp
test-data/test-db/GTDB_nodes.dmp
test-data/test_database.loc
tool-data/gtdb.loc.sample
tool_data_table_conf.xml.sample
tool_data_table_conf.xml.test
b
diff -r 000000000000 -r 7b382efabb98 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Fri Oct 14 21:38:26 2022 +0000
[
b'@@ -0,0 +1,351 @@\n+<?xml version="1.0"?>\n+<macros>\n+    <token name="@TOOL_VERSION@">1.1.1</token>\n+    <token name="@VERSION_SUFFIX@">0</token>\n+    <token name="@PROFILE@">21.01</token>\n+    <xml name="biotools">\n+        <xrefs>\n+            <xref type="bio.tools">semibin</xref>\n+        </xrefs>\n+    </xml>\n+    <xml name="requirements">\n+        <requirements>\n+            <requirement type="package" version="@TOOL_VERSION@">semibin</requirement>\n+            <yield/>\n+        </requirements>\n+    </xml>\n+    <xml name="version">\n+        <version_command>SemiBin -v</version_command>\n+    </xml>\n+    <xml name="mode_fasta_bam">\n+        <conditional name="mode">\n+            <expand macro="mode_select"/>\n+            <when value="single">\n+                <expand macro="input-fasta-single"/>\n+                <expand macro="input-bam-single"/>\n+            </when>\n+            <when value="co">\n+                <expand macro="input-fasta-single"/>\n+                <expand macro="input-bam-multi"/>\n+            </when>\n+            <when value="multi">\n+                <expand macro="input-fasta-multi"/>\n+                <expand macro="input-bam-multi"/>\n+            </when>\n+        </conditional>\n+    </xml>\n+    <xml name="mode_fasta">\n+        <conditional name="mode">\n+            <expand macro="mode_select"/>\n+            <when value="single">\n+                <expand macro="input-fasta-single"/>\n+            </when>\n+            <when value="co">\n+                <expand macro="input-fasta-single"/>\n+            </when>\n+            <when value="multi">\n+                <expand macro="input-fasta-multi"/>\n+            </when>\n+        </conditional>\n+    </xml>\n+    <xml name="mode_select">\n+        <param name="select" type="select" label="Binning mode">\n+            <option value="single" selected="true">Single sample binning (each sample is assembled and binned independently)</option>\n+            
<option value="co">Co-assembly binning (samples are co-assembled together and binned together)</option>\n+            <option value="multi">Multi-sample binning (multiple samples are assembled and binned individually, but information from multiple samples is used together)</option>\n+        </param>\n+    </xml>\n+    <xml name="input-fasta-single">\n+        <param argument="--input-fasta" type="data" format="fasta,fasta.gz" label="Contig sequences"/>\n+    </xml>\n+    <xml name="input-fasta-multi">\n+        <conditional name="multi_fasta">\n+            <param name="select" type="select" label="Contig files of the samples">\n+                <option value="concatenated" selected="true">1 concatenated file (created using the dedicated tool) with all sample contigs </option>\n+                <option value="multi">1 contig file per sample</option>\n+            </param>\n+            <when value="concatenated">\n+                <param argument="--input-fasta" type="data" format="fasta,fasta.gz" label="Combined contig sequences"/>\n+                <expand macro="separator"/>\n+            </when>\n+            <when value="multi">\n+                <param argument="--input-fasta" type="data" multiple="true" format="fasta,fasta.gz" label="Contig sequences"/>\n+                <expand macro="concat_min_len"/>\n+            </when>\n+        </conditional>\n+    </xml>\n+    <xml name="concat_min_len">\n+        <param name="min_len" type="integer" min="0" value="0" label="Minimal length for contigs to be kept"/>\n+    </xml>\n+    <token name="@SINGLE_FASTA_FILES@"><![CDATA[\n+#if $input_fasta.ext.endswith(".gz")\n+gunzip -c \'$input_fasta\' > \'contigs.fasta\' &&\n+#else\n+ln -s \'$input_fasta\' \'contigs.fasta\' &&\n+#end if\n+    ]]></token>\n+    <token name="@FASTA_FILES@"><![CDATA[\n+#if $mode.select == \'single\' or $mode.select == \'co\'\n+    #if $mode.input_fasta.ext.endswith(".gz")\n+gunzip -c \'$mode.input_fasta\' > \'contigs.fasta\' &&\n+    
#else\n+ln -s \'$mode.input_fasta\' \'contigs.fasta\' &&\n+    #end if\n+#else\n+    #if $mode.multi_fasta.select == \'concate'..b'${on_string}: Coverage">\n+            <filter>mode["select"]=="co" and extra_output and "coverage" in extra_output</filter>\n+            <discover_datasets pattern=".*\\.bam_(?P&lt;designation&gt;.*)_data_cov\\.csv" format="csv" directory="output/" />\n+        </collection>\n+        <collection name="co_split_cov" type="list" label="${tool.name} on ${on_string}: Coverage (split data) per sample">\n+            <filter>mode["select"]=="co" and extra_output and "coverage" in extra_output</filter>\n+            <discover_datasets pattern=".*\\.bam_(?P&lt;designation&gt;.*)_data_split_cov\\.csv" format="csv" directory="output/" />\n+        </collection>\n+        <collection name="multi_cov" type="list" label="${tool.name} on ${on_string}: Coverage">\n+            <filter>mode["select"]=="multi" and extra_output and "coverage" in extra_output</filter>\n+            <discover_datasets pattern=".*\\.bam_(?P&lt;designation&gt;.*)_data_cov.csv" format="csv" directory="output/samples/" />\n+        </collection>\n+        <collection name="multi_cov_sample" type="list" label="${tool.name} on ${on_string}: Coverage per sample">\n+            <filter>mode["select"]=="multi" and extra_output and "coverage" in extra_output</filter>\n+            <discover_datasets pattern="(?P&lt;designation&gt;.*)\\/data_cov.csv" format="csv" directory="output/samples/" recurse="true" match_relative_path="true"/>\n+        </collection>\n+        <collection name="multi_split_cov" type="list" label="${tool.name} on ${on_string}: Coverage (split data) per sample">\n+            <filter>mode["select"]=="multi" and extra_output and "coverage" in extra_output</filter>\n+            <discover_datasets pattern=".*\\.bam_(?P&lt;designation&gt;.*)_data_split_cov.csv" format="csv" directory="output/samples/" />\n+        </collection>\n+        <collection 
name="multi_split_cov_sample" type="list" label="${tool.name} on ${on_string}: Coverage (split data) per sample">\n+            <filter>mode["select"]=="multi" and extra_output and "coverage" in extra_output</filter>\n+            <discover_datasets pattern="(?P&lt;designation&gt;.*)\\/data_split_cov.csv" format="csv" directory="output/samples/" recurse="true" match_relative_path="true"/>\n+        </collection>\n+        <collection name="multi_contigs" type="list" label="${tool.name} on ${on_string}: Contigs">\n+            <filter>mode["select"]=="multi" and extra_output and "contigs" in extra_output</filter>\n+            <discover_datasets pattern="(?P&lt;designation&gt;.*).fa" format="fasta" directory="output/samples/" />\n+        </collection>\n+    </xml>\n+    <xml name="train_output">\n+        <data name="model" format="h5" from_work_dir="output/model.h5" label="${tool.name} on ${on_string}: Semi-supervised deep learning model" />\n+    </xml>\n+    <xml name="cannot_link_output">\n+        <data name="cannot" format="txt" from_work_dir="output/cannot/cannot.txt" label="${tool.name} on ${on_string}: Cannot-link constraints" />\n+    </xml>\n+    <token name="@HELP_HEADER@"><![CDATA[\n+What it does\n+============\n+\n+SemiBin is a Semi-supervised siamese neural network for metagenomic binning\n+\n+]]></token>\n+    <token name="@HELP_INPUT_FASTA@"><![CDATA[\n+- Contigs in fasta for 1 or several samples from single or co-assembly\n+]]></token>\n+    <token name="@HELP_INPUT_BAM@"><![CDATA[\n+- BAM with reads mapping to the contigs\n+]]></token>\n+    <token name="@HELP_CANNOT@"><![CDATA[\n+- Cannot-link constraints\n+]]></token>\n+    <token name="@HELP_DATA@"><![CDATA[\n+- Training data and split training data for the model\n+]]></token>\n+    <token name="@HELP_MODEL@"><![CDATA[\n+- Semi-supervised deep learning model\n+]]></token>\n+    <token name="@HELP_BINS@"><![CDATA[\n+- Reconstructed bins after reclustering\n+- Reconstructed bins before 
reclustering\n+]]></token>\n+    <xml name="citations">\n+        <citations>\n+            <citation type="doi">10.1038/s41467-022-29843-y</citation>\n+        </citations>\n+    </xml>\n+</macros>\n\\ No newline at end of file\n'
b
diff -r 000000000000 -r 7b382efabb98 semibin.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/semibin.xml Fri Oct 14 21:38:26 2022 +0000
[
b'@@ -0,0 +1,435 @@\n+<tool id="semibin" name="SemiBin" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">\n+    <description>\n+        for Semi-supervised Metagenomic Binning\n+    </description>\n+    <macros>\n+        <import>macros.xml</import>\n+    </macros>\n+    <expand macro="biotools"/>\n+    <expand macro="requirements"/>\n+    <expand macro="version"/>\n+    <command detect_errors="exit_code"><![CDATA[\n+#import re\n+@BAM_FILES@\n+@FASTA_FILES@\n+\n+SemiBin\n+#if $mode.select == \'single\' or $mode.select == \'co\'\n+    single_easy_bin\n+    #if $mode.select == \'single\' and str($mode.environment) != \'\'\n+    --environment \'$mode.environment\'\n+    #end if\n+    #if $mode.ref.select == "cached"\n+    --reference-db-data-dir \'$mode.ref.cached_db.fields.path\'\n+    #else\n+    --taxonomy-annotation-table \'$mode.ref.taxonomy_annotation_table\'\n+    #end if\n+#else\n+    multi_easy_bin\n+    --separator \'$separator\'\n+    #if $mode.ref.select == "cached"\n+    --reference-db-data-dir \'$mode.ref.cached_db.fields.path\'\n+    #else\n+    --taxonomy-annotation-table \n+        #for $e in $mode.ref.taxonomy_annotation_table\n+            \'$e\' \n+        #end for\n+    #end if\n+#end if\n+    --input-fasta \'contigs.fasta\'\n+    --input-bam *.bam\n+    --output \'output\'\n+    --cannot-name \'cannot\'\n+    @MIN_LEN@\n+    --orf-finder \'$orf_finder\'\n+    --random-seed $random_seed\n+\n+#if str($annot.ml_threshold) != \'\'\n+    --ml-threshold $annot.ml_threshold\n+#end if\n+    --epoches $training.epoches\n+    --batch-size $training.batch_size\n+    --max-node $bin.max_node\n+    --max-edges $bin.max_edges\n+    --minfasta-kbs $bin.minfasta_kbs\n+    $bin.no_recluster\n+    --threads \\${GALAXY_SLOTS:-1}\n+    --processes \\${GALAXY_SLOTS:-1}\n+&& \n+echo "output" &&\n+ls output\n+    ]]></command>\n+    <inputs>\n+        <conditional name="mode">\n+            <expand macro="mode_select"/>\n+            <when 
value="single">\n+                <expand macro="input-fasta-single"/>\n+                <expand macro="input-bam-single"/>\n+                <expand macro="ref-single"/>\n+                <expand macro="environment"/>\n+            </when>\n+            <when value="co">\n+                <expand macro="input-fasta-single"/>\n+                <expand macro="input-bam-multi"/>\n+                <expand macro="ref-single"/>\n+            </when>\n+            <when value="multi">\n+                <expand macro="input-fasta-multi"/>\n+                <expand macro="input-bam-multi"/>\n+                <expand macro="ref-multi"/>\n+            </when>\n+        </conditional>\n+        <expand macro="min_len"/>\n+        <expand macro="orf-finder"/>\n+        <expand macro="random-seed"/>\n+        <section name="annot" title="Contig annotations" expanded="true">\n+            <expand macro="ml-threshold"/>\n+        </section>\n+        <section name="training" title="Training">\n+            <expand macro="epoches"/>\n+            <expand macro="batch-size"/>\n+        </section>\n+        <section name="bin" title="Binning">\n+            <expand macro="max-node"/>\n+            <expand macro="max-edges"/>\n+            <expand macro="minfasta-kbs"/>\n+            <expand macro="no-recluster"/>\n+        </section>\n+        <param name="extra_output" type="select" multiple="true" optional="true" label="Extra outputs" help="In addition to the training data">\n+            <option value="data">Training data</option>\n+            <option value="coverage">Coverage files</option>\n+            <option value="contigs">Contigs (if multiple sample)</option>\n+        </param>\n+    </inputs>\n+    <outputs>\n+        <collection name="output_recluster_bins" type="list" label="${tool.name} on ${on_string}: Reconstructed bins after reclustering">\n+            <filter>not bin["no_recluster"]</filter>\n+            <discover_datasets 
pattern=".*?\\.(?P&lt;designation&gt;.*).fa" format="fasta" directory="output/output_recluster_bins" />\n+        </collection>\n+        <collection name="output_bins" type="list" label="${tool'..b'rted9.bam,input_multi_sorted10.bam"/>\n+                <conditional name="ref">\n+                    <param name="select" value="taxonomy"/>\n+                    <param name="taxonomy_annotation_table" value="taxonomy.tsv,taxonomy_2.tsv,taxonomy_3.tsv,taxonomy_4.tsv,taxonomy_5.tsv,taxonomy_6.tsv,taxonomy_7.tsv,taxonomy_8.tsv,taxonomy_9.tsv,taxonomy_10.tsv"/>\n+                </conditional>\n+            </conditional>\n+            <conditional name="min_len">\n+                <param name="method" value="ratio"/>\n+                <param name="ratio" value="0.05"/>\n+            </conditional>\n+            <param name="orf_finder" value="fraggenescan"/>\n+            <param name="random_seed" value="0"/>\n+            <section name="annot">\n+                <param name="ml_threshold" value=""/>\n+            </section>\n+            <section name="training">\n+                <param name="epoches" value="20"/>\n+                <param name="batch_size" value="2048"/>\n+            </section>\n+            <section name="bin">\n+                <param name="max_node" value="1"/>\n+                <param name="max_edges" value="200"/>\n+                <param name="minfasta_kbs" value="200"/>\n+                <param name="no_recluster" value="true"/>\n+            </section>\n+            <param name="extra_output" value="data,coverage,contigs"/>\n+            <output_collection name="multi_bins" count="2">\n+                <element name="0" ftype="fasta">\n+                    <assert_contents>\n+                        <has_text text=">g1k_0"/>\n+                    </assert_contents>\n+                </element>\n+            </output_collection>\n+            <output_collection name="multi_contigs" count="10">\n+                <element name="S8" 
ftype="fasta">\n+                    <assert_contents>\n+                        <has_text text=">g1k_0"/>\n+                    </assert_contents>\n+                </element>\n+            </output_collection>\n+            <output_collection name="multi_data" count="10">\n+                <element name="S8" ftype="csv">\n+                    <assert_contents>\n+                        <has_text text="g1k_0,"/>\n+                    </assert_contents>\n+                </element>\n+            </output_collection>\n+            <output_collection name="multi_cov" count="10">\n+                <element name="8" ftype="csv">\n+                    <assert_contents>\n+                        <has_text text="S1:g1k_5,"/>\n+                    </assert_contents>\n+                </element>\n+            </output_collection>\n+            <output_collection name="multi_cov_sample" count="10">\n+                <element name="S8" ftype="csv">\n+                    <assert_contents>\n+                        <has_text text="g1k_3"/>\n+                    </assert_contents>\n+                </element>\n+            </output_collection>\n+            <output_collection name="multi_split_cov" count="10">\n+                <element name="8" ftype="csv">\n+                    <assert_contents>\n+                        <has_text text="S1:g1k_5_1,0."/>\n+                    </assert_contents>\n+                </element>\n+            </output_collection>\n+            <output_collection name="multi_split_cov_sample" count="10">\n+                <element name="S8" ftype="csv">\n+                    <assert_contents>\n+                        <has_text text="g1k_3_1"/>\n+                    </assert_contents>\n+                </element>\n+            </output_collection>\n+            <output_collection name="multi_contigs" count="10">\n+                <element name="S8" ftype="fasta">\n+                    <assert_contents>\n+                        <has_text 
text=">g1k_0"/>\n+                    </assert_contents>\n+                </element>\n+            </output_collection>\n+        </test>\n+    </tests>\n+    <help><![CDATA[\n+@HELP_HEADER@\n+\n+Inputs\n+======\n+\n+@HELP_INPUT_FASTA@\n+@HELP_INPUT_BAM@\n+\n+    ]]></help>\n+    <expand macro="citations"/>\n+</tool>\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/S1.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/S1.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/S10.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/S10.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/S2.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/S2.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/S3.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/S3.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/S4.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/S4.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/S5.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/S5.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/S6.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/S6.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/S7.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/S7.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/S8.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/S8.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/S9.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/S9.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/cannot.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/cannot.txt Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,15 @@
+g1k_0,g2k_0
+g1k_1,g2k_2
+g1k_1,g2k_3
+g1k_2,g3k_4
+g3k_5,g2k_6
+g4k_5,g2k_9
+g4k_3,g2k_1
+g4k_2,g2k_6
+g3k_1,g2k_1
+g3k_2,g2k_9
+g3k_4,g1k_2
+g3k_9,g1k_9
+g4k_1,g2k_7
+g4k_2,g3k_7
+g2k_7,g3k_1
b
diff -r 000000000000 -r 7b382efabb98 test-data/data.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/data.csv Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,41 @@\n+,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103,104,105,106,107,108,109,110,111,112,113,114,115,116,117,118,119,120,121,122,123,124,125,126,127,128,129,130,131,132,133,134,135,mean,var\n+g1k_0,0.055358300480707674,0.040706103647532084,0.014652197333250568,0.016102414767250883,0.030454566614081583,0.025203779353045963,0.016552482246768224,0.013902084867388337,0.012501874931112173,0.010001500044904734,0.003750562829386136,0.006851027688283361,0.01955293211021715,0.011201679990284305,0.004200630308903475,0.00605090772469698,0.030804619098150625,0.010401560026697924,0.006250937715593575,0.006801020190559211,0.04055608115435964,0.018152722173940983,0.011901784958422387,0.014452167342353973,0.010351552528973774,0.005200780263386451,0.006300945213317724,0.017352602210354603,0.010301545031249627,0.003750562829386136,0.005200780263386451,0.012251837442491429,0.0020003004090409287,0.0016002404272477384,0.0072510876700765505,0.004250637806627624,0.0018502779158684824,0.004250637806627624,0.004200630308903475,0.0013001954409028456,0.0014002104363511432,0.01180176996297409,0.0030504578612480533,0.0024503678885582675,0.0016002404272477384,0.01590238477635429,0.004500675295248367,0.004750712783869112,0.008451267615456122,0.0036005403362136894,0.0025003753862824166,0.003950592820282731,0.0016002404272477384,0.001450217934075292,0.0017002554226960359,0.008751312601801014,0.0012501879431786966,0.001200180445454548,0.04045606615891134,0.006300945213317724,0.010001500044904734,0.007551132656421444,0.008701305104076865,0.010401560026697924,0.007451117660973146,0.0034505178430412433,0.0066009901996626165,0.008901335094973461,0.0024503678885582675,0.0039005853225585825,0.02070310455787257,0.015252287305940354,0.00
9851477551732287,0.017252587214906304,0.013752062374215892,0.016552482246768224,0.007751162647318038,0.011201679990284305,0.01710256472173386,0.0028004203726273093,0.004550682792972516,0.0028004203726273093,0.0033004953498687968,0.004500675295248367,0.0025503828840065653,0.0061009152224211285,0.0015502329295235895,0.0022503378976616727,0.004600690290696666,0.0017502629204201848,0.0024503678885582675,0.004700705286144963,0.004850727779317409,0.004200630308903475,0.0020503079067650774,0.001000150454557953,0.000500075477316465,0.0020003004090409287,0.001000150454557953,0.0016502479249718871,0.005850877733800385,0.005200780263386451,0.00770115514959389,0.0023003453953858214,0.0014002104363511432,0.0020003004090409287,0.0011001654500062503,0.0014002104363511432,0.003250487852144648,0.0013001954409028456,0.00970145505855984,0.0026503978794548627,0.003100465358972202,0.0009001354591096553,0.0011001654500062503,0.002150322902213375,0.004050607815731029,0.0006500979704889113,0.000500075477316465,0.000750112965937209,0.00010001549552327481,0.004600690290696666,0.006500975204214319,0.0012501879431786966,0.0004000604818681675,0.0008501279613855065,0.006300945213317724,0.0016502479249718871,0.0025503828840065653,0.0025503828840065653,0.0006000904727647626,0.0030504578612480533,0.001000150454557953,0.000500075477316465,0.0004000604818681675,0.00020003049097157234,0.030236700251889168,0.04897040200749957\n+g1k_1,0.055358300480707674,0.040706103647532084,0.014652197333250568,0.016102414767250883,0.030454566614081583,0.025203779353045963,0.016552482246768224,0.013902084867388337,0.012501874931112173,0.010001500044904734,0.003750562829386136,0.006851027688283361,0.01955293211021715,0.011201679990284305,0.004200630308903475,0.00605090772469698,0.030804619098150625,0.010401560026697924,0.006250937715593575,0.006801020190559211,0.04055608115435964,0.018152722173940983,0.011901784958422387,0.014452167342353973,0.010351552528973774,0.005150772765662301,0.006300945213317724,0.0173526022103
5460'..b',0.0017002554226960359,0.0024503678885582675,0.004700705286144963,0.004850727779317409,0.004200630308903475,0.0020003004090409287,0.001000150454557953,0.000500075477316465,0.0019502929113167798,0.001000150454557953,0.0016502479249718871,0.005850877733800385,0.005200780263386451,0.00770115514959389,0.0023003453953858214,0.001450217934075292,0.0020003004090409287,0.0011001654500062503,0.0014002104363511432,0.003250487852144648,0.0013001954409028456,0.00970145505855984,0.002600390381730714,0.003100465358972202,0.0008501279613855065,0.0011001654500062503,0.002150322902213375,0.004050607815731029,0.0006500979704889113,0.000500075477316465,0.000750112965937209,0.00010001549552327481,0.004600690290696666,0.006500975204214319,0.0012501879431786966,0.0004000604818681675,0.0008501279613855065,0.006300945213317724,0.0016502479249718871,0.0025503828840065653,0.0025003753862824166,0.0006000904727647626,0.0030504578612480533,0.0009501429568338041,0.000500075477316465,0.0004000604818681675,0.00020003049097157234,0.015123350125944584,0.02466823652202602\n+g4k_9,0.05545831547615598,0.040756111145256235,0.014652197333250568,0.016102414767250883,0.03050457411180573,0.025203779353045963,0.016552482246768224,0.013902084867388337,0.012501874931112173,0.009951492547180585,0.003750562829386136,0.006851027688283361,0.01955293211021715,0.011201679990284305,0.004200630308903475,0.0061009152224211285,0.030804619098150625,0.010401560026697924,0.006300945213317724,0.006801020190559211,0.04060608865208379,0.018152722173940983,0.011851777460698239,0.014452167342353973,0.010351552528973774,0.005200780263386451,0.006250937715593575,0.017352602210354603,0.010301545031249627,0.003750562829386136,0.005200780263386451,0.012251837442491429,0.0020503079067650774,0.0016002404272477384,0.007301095167800699,0.004250637806627624,0.0018002704181443335,0.004250637806627624,0.004250637806627624,0.0013001954409028456,0.0014002104363511432,0.01180176996297409,0.0030504578612480533,0.0024503678885582675,0.
0016002404272477384,0.01590238477635429,0.004500675295248367,0.004750712783869112,0.00850127511318027,0.0036005403362136894,0.0025003753862824166,0.0039005853225585825,0.0016002404272477384,0.001450217934075292,0.0017002554226960359,0.008751312601801014,0.0012501879431786966,0.001200180445454548,0.04045606615891134,0.006250937715593575,0.010051507542628882,0.007551132656421444,0.008701305104076865,0.010401560026697924,0.007501125158697295,0.0034505178430412433,0.0066009901996626165,0.008901335094973461,0.0024503678885582675,0.0039005853225585825,0.020653097060148423,0.015302294803664502,0.009901485049456435,0.017252587214906304,0.013752062374215892,0.016552482246768224,0.007751162647318038,0.011201679990284305,0.01710256472173386,0.0028004203726273093,0.004500675295248367,0.0028004203726273093,0.0033004953498687968,0.004500675295248367,0.0025503828840065653,0.00605090772469698,0.0015502329295235895,0.0022503378976616727,0.004600690290696666,0.0017002554226960359,0.0024503678885582675,0.004700705286144963,0.004850727779317409,0.004200630308903475,0.0020003004090409287,0.001000150454557953,0.000500075477316465,0.0019502929113167798,0.001000150454557953,0.0016502479249718871,0.005850877733800385,0.005200780263386451,0.00770115514959389,0.0023003453953858214,0.001450217934075292,0.0020003004090409287,0.0011001654500062503,0.0014002104363511432,0.003250487852144648,0.0013001954409028456,0.00970145505855984,0.002600390381730714,0.003100465358972202,0.0008501279613855065,0.0011001654500062503,0.002150322902213375,0.004050607815731029,0.0006500979704889113,0.000500075477316465,0.000750112965937209,0.00010001549552327481,0.004600690290696666,0.006500975204214319,0.0012501879431786966,0.0004000604818681675,0.0008501279613855065,0.006300945213317724,0.0016502479249718871,0.0025503828840065653,0.0025003753862824166,0.0006000904727647626,0.0030504578612480533,0.0009501429568338041,0.000500075477316465,0.0004000604818681675,0.00020003049097157234,0.027012518891687657,0.0459307380
28919685\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/data_split.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/data_split.csv Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,81 @@\n+,0,1,2,3,4,5,6,7,8,9,10,11,12,13,14,15,16,17,18,19,20,21,22,23,24,25,26,27,28,29,30,31,32,33,34,35,36,37,38,39,40,41,42,43,44,45,46,47,48,49,50,51,52,53,54,55,56,57,58,59,60,61,62,63,64,65,66,67,68,69,70,71,72,73,74,75,76,77,78,79,80,81,82,83,84,85,86,87,88,89,90,91,92,93,94,95,96,97,98,99,100,101,102,103,104,105,106,107,108,109,110,111,112,113,114,115,116,117,118,119,120,121,122,123,124,125,126,127,128,129,130,131,132,133,134,135\n+g1k_0_1,0.05391616851795648,0.03921175919495924,0.015104530304875343,0.015704710277242576,0.030509149595634347,0.025907769807485555,0.014004200355535415,0.01350405037856272,0.012303690433828252,0.010303090525937472,0.002900870866741585,0.007402220659495841,0.018405520152895132,0.011303390479882863,0.004801440779237827,0.005701710737788678,0.030409119600239808,0.011003300493699245,0.007402220659495841,0.007202160668706763,0.04151244908903364,0.01650495024039889,0.01260378042001187,0.012703810415406408,0.009702910553570237,0.005001500770026904,0.0055016507469996,0.01640492024500435,0.009802940548964776,0.004001200816081515,0.00440132079765967,0.01350405037856272,0.002200660898979812,0.001500450931218039,0.009002700585808465,0.004701410783843288,0.002000600908190734,0.004001200816081515,0.0035010508391088192,0.001700510922007117,0.000900270958850805,0.012803840410800947,0.0035010508391088192,0.002600780880557968,0.001800540917401656,0.014104230350929954,0.005901770728577755,0.005201560760815982,0.009702910553570237,0.0046013807884487485,0.00240072088976889,0.00440132079765967,0.001700510922007117,0.001900570912796195,0.001500450931218039,0.008902670590413926,0.001700510922007117,0.001300390940428961,0.03851154922719747,0.006001800723972294,0.01050315051672655,0.00850255060883577,0.009202760576597543,0.010303090525937472,0.0078023406410739965,0.003000900862136124,0.006902070682523145,0.009402820567386621,0.002500750885163429,0.00440132079765967,0.02040612006078591,0.015004500309480804,0.010303090525937472,0.0174052201989
4974,0.014104230350929954,0.015704710277242576,0.007302190664101302,0.0114034204752774,0.016905070221977046,0.0032009608529252023,0.004301290802265131,0.002800840871347046,0.0034010208437142806,0.005001500770026904,0.002100630903585273,0.0054016207516050605,0.001000300954245344,0.002500750885163429,0.004301290802265131,0.001500450931218039,0.002200660898979812,0.006101830719366833,0.005001500770026904,0.004701410783843288,0.002200660898979812,0.001200360945034422,0.000600180972667188,0.001500450931218039,0.001200360945034422,0.001500450931218039,0.006301890710155912,0.004901470774632366,0.006802040687128606,0.002000600908190734,0.001300390940428961,0.002200660898979812,0.0014004209358235,0.0014004209358235,0.004201260806870592,0.001800540917401656,0.009102730581203004,0.002600780880557968,0.0033009908483197415,0.000800240963456266,0.001200360945034422,0.002200660898979812,0.0039011708206869752,0.000700210968061727,0.0004001209818781099,0.000500150977272649,0.00020006099108903195,0.004901470774632366,0.007702310645679457,0.001600480926612578,0.0004001209818781099,0.0011003309496398828,0.0055016507469996,0.0014004209358235,0.002900870866741585,0.002500750885163429,0.0004001209818781099,0.002900870866741585,0.000900270958850805,0.000500150977272649,0.0004001209818781099,0.00020006099108903195\n+g1k_0_2,0.056817038384398104,0.04221265905679541,0.014204260346324493,0.01650495024039889,0.030409119600239808,0.02450734987196201,0.019105730120656902,0.014304290341719032,0.012703810415406408,0.009702910553570237,0.0046013807884487485,0.006301890710155912,0.020706210046969528,0.011103330489093784,0.0036010808345033583,0.006401920705550451,0.03120935956339612,0.009802940548964776,0.005101530765421443,0.006401920705550451,0.0396118791765374,0.019805940088418676,0.011203360484488323,0.016204860254215272,0.011003300493699245,0.0054016207516050605,0.007102130673312224,0.018305490157500593,0.010803240502910167,0.0035010508391088192,0.006001800723972294,0.011003300493699245,0.0018005
4091'..b'0034010208437142806,0.005001500770026904,0.002100630903585273,0.005301590756210521,0.001000300954245344,0.002500750885163429,0.004301290802265131,0.001500450931218039,0.002200660898979812,0.006101830719366833,0.005001500770026904,0.0046013807884487485,0.002200660898979812,0.001200360945034422,0.000600180972667188,0.001500450931218039,0.001200360945034422,0.001500450931218039,0.006301890710155912,0.004901470774632366,0.006802040687128606,0.002000600908190734,0.001300390940428961,0.002200660898979812,0.0014004209358235,0.0014004209358235,0.004101230811476054,0.001800540917401656,0.009102730581203004,0.002600780880557968,0.0032009608529252023,0.000800240963456266,0.001200360945034422,0.002100630903585273,0.0039011708206869752,0.000700210968061727,0.0004001209818781099,0.000500150977272649,0.00020006099108903195,0.004901470774632366,0.007602280650284918,0.001600480926612578,0.0004001209818781099,0.0011003309496398828,0.0055016507469996,0.0014004209358235,0.002900870866741585,0.002500750885163429,0.0004001209818781099,0.002800840871347046,0.000900270958850805,0.000500150977272649,0.0004001209818781099,0.00020006099108903195\n+g4k_9_2,0.056817038384398104,0.04221265905679541,0.014304290341719032,0.01650495024039889,0.030409119600239808,0.02450734987196201,0.019005700125262363,0.014304290341719032,0.012703810415406408,0.009702910553570237,0.0046013807884487485,0.006301890710155912,0.020706210046969528,0.011103330489093784,0.0036010808345033583,0.006401920705550451,0.03120935956339612,0.009802940548964776,0.005101530765421443,0.006401920705550451,0.0396118791765374,0.019805940088418676,0.011103330489093784,0.016204860254215272,0.011003300493699245,0.0054016207516050605,0.0070021006779176845,0.018305490157500593,0.010803240502910167,0.0035010508391088192,0.006001800723972294,0.011103330489093784,0.001800540917401656,0.001700510922007117,0.005601680742394139,0.0039011708206869752,0.001600480926612578,0.004501350793054209,0.004901470774632366,0.000900270958850805,0.00
1900570912796195,0.010903270498304706,0.002600780880557968,0.002300690894374351,0.0014004209358235,0.01770531018513336,0.0031009308575306632,0.004301290802265131,0.007302190664101302,0.002600780880557968,0.002600780880557968,0.0034010208437142806,0.001500450931218039,0.001000300954245344,0.001900570912796195,0.008602580604230308,0.000800240963456266,0.0011003309496398828,0.042412719047584486,0.00650195070094499,0.00950285056278116,0.006601980696339529,0.008202460622652152,0.01050315051672655,0.007102130673312224,0.0039011708206869752,0.006301890710155912,0.00840252061344123,0.00240072088976889,0.0034010208437142806,0.020906270037758606,0.0155046502864535,0.009402820567386621,0.017105130212766124,0.01350405037856272,0.01740522019894974,0.008202460622652152,0.011003300493699245,0.017305190203555202,0.00240072088976889,0.004701410783843288,0.002800840871347046,0.0032009608529252023,0.004001200816081515,0.003000900862136124,0.006802040687128606,0.002100630903585273,0.002000600908190734,0.004901470774632366,0.001900570912796195,0.002700810875952507,0.0033009908483197415,0.004701410783843288,0.0038011408252924365,0.001800540917401656,0.000800240963456266,0.0004001209818781099,0.00240072088976889,0.000800240963456266,0.001800540917401656,0.0054016207516050605,0.0055016507469996,0.008602580604230308,0.002600780880557968,0.001500450931218039,0.001800540917401656,0.000800240963456266,0.0014004209358235,0.00240072088976889,0.000800240963456266,0.010303090525937472,0.002600780880557968,0.003000900862136124,0.000900270958850805,0.001000300954245344,0.002100630903585273,0.004201260806870592,0.000600180972667188,0.000600180972667188,0.001000300954245344,1.00029995394539e-09,0.004301290802265131,0.0054016207516050605,0.000900270958850805,0.0004001209818781099,0.000600180972667188,0.007102130673312224,0.001900570912796195,0.002200660898979812,0.002500750885163429,0.000800240963456266,0.0033009908483197415,0.001000300954245344,0.000500150977272649,0.0004001209818781099,0.000200060991
08903195\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_coassembly_sorted1.bam
b
Binary file test-data/input_coassembly_sorted1.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_coassembly_sorted2.bam
b
Binary file test-data/input_coassembly_sorted2.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_coassembly_sorted3.bam
b
Binary file test-data/input_coassembly_sorted3.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_coassembly_sorted4.bam
b
Binary file test-data/input_coassembly_sorted4.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_coassembly_sorted5.bam
b
Binary file test-data/input_coassembly_sorted5.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi.fasta.gz
b
Binary file test-data/input_multi.fasta.gz has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi_sorted1.bam
b
Binary file test-data/input_multi_sorted1.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi_sorted10.bam
b
Binary file test-data/input_multi_sorted10.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi_sorted2.bam
b
Binary file test-data/input_multi_sorted2.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi_sorted3.bam
b
Binary file test-data/input_multi_sorted3.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi_sorted4.bam
b
Binary file test-data/input_multi_sorted4.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi_sorted5.bam
b
Binary file test-data/input_multi_sorted5.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi_sorted6.bam
b
Binary file test-data/input_multi_sorted6.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi_sorted7.bam
b
Binary file test-data/input_multi_sorted7.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi_sorted8.bam
b
Binary file test-data/input_multi_sorted8.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_multi_sorted9.bam
b
Binary file test-data/input_multi_sorted9.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_single.bam
b
Binary file test-data/input_single.bam has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_single.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/input_single.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_single_2.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/input_single_2.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/input_single_3.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/input_single_3.fasta Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,13400 @@\n+>g1k_0\n+ATGGCTAATAATTATCAAACTTTATATGATTCAGCAATAAAAAGGATTCCATACGATCTT\n+ATTTCTGATCAAGCTTATGCAATTCTACAAAATGCTAAAACTCATAAAGTTTGCGATGGT\n+GTTTTATATATAATTGTAGCCAATGCCTTTGAAAAAAGTATTATTAACGGTAATTTTATT\n+AACATTATTTCTAAATATCTAAGCGAAGAATTCAAAAAGGAAAATATTGTTAATTTTGAA\n+TTTATTATAGACAATGAAAAATTATTAATTAATAGCAATTTTTTAATTAAAGAAACTAAT\n+ATTAAAAATCGTTTTAATTTTAGTGATGAACTTTTACGTTACAATTTTAACAATTTAGTA\n+ATTAGTAATTTTAATCAAAAAGCGATTAAGGCGATTGAAAATTTATTTTCAAATAACTAT\n+GATAATAGTTCAATGTGTAACCCTTTATTTTTATTTGGTAAAGTTGGTGTTGGTAAAACG\n+CATATCGTGGCTGCTGCTGGTAATCGTTTTGCTAATAGTAATCCTAATTTAAAAATTTAT\n+TATTATGAAGGGCAAGATTTTTTTCGAAAGTTTTGTTCTGCTTCGTTAAAAGGGACTAGT\n+TATGTTGAAGAGTTTAAAAAAGAAATTGCTTCAGCAGATTTATTAATTTTTGAAGATATT\n+CAAAATATCCAATCACGTGATTCAACGGCTGAATTGTTTTTTAATATCTTTAATGATATA\n+AAATTAAATGGTGGAAAAATTATCTTAACATCTGACCGTACACCAAACGAACTTAATGGT\n+TTTCATAATCGAATTATTTCGAGATTAGCGTCAGGTTTGCAGTGTAAAATTTCTCAACCC\n+GACAAAAATGAAGCTATTAAAATTATTAATAATTGGTTTGAATTCAAAAAAAAATATCAA\n+ATTACTGACGAAGCTAAAGAATATATTGCTGAAGGTTTTCACACTGATATTAGACAGATG\n+ATTGGTAATCTAAAACAAATTTGTTTTTGAGCGGACAATGATACTAATAAAGATTTAATA\n+ATCACAAAAGATTATGTAATTGAGTGTTCAGTTGAAAACGAAATTCCACTAAATATTGTT\n+GTTAAAAAACAATTTAAACCTGAACAAATAATTGAAATTGTTGCAAAAGAATTAAATATA\n+AAAACAGATTTAATTAAATCTTCTATTAGAAAAAATAATATAGTTTGAGCGCGTGATATT\n+GTTTGTTATATTCTAAAAAATAAACTAAATTTAACTTTAACAGATATTGGTAAATTACTA\n+AACGGACGAGAACACACTACAATTAGTCATAGTATTAGTAAAGTTCAAAAAATTCTTGAT\n+GATGAAAATAGTCAAGAAGCACTACAAATTAATCTAATTATCAATAAATTTTAATTTTAT\n+TAAAGAAAAGTAATCAAAACTTATTAAAATATTATATATTTATATATAGTGTATTTTCGT\n+GTTTTTGAACTCAAAACATAAAATTACTAATTTTTTATTATTTAACTTATATATTGTAAT\n+AAAGGAAGAGAATTATGAGAGATATTCATCCAGTAAGCAAACCATGCGTTTATAATTGTG\n+TAACATGTAAAAAAGAATTTATAATTGATTCTGCAGCAAAAAATACAGAAGTTGCAATTG\n+AAGTTTGTTCAAATTGCCATACATTTTTTATTGGTAAACAAAACGCAACTACAACATTAC\n+GTGGTCGTGCTGAAAAACTAAATAATCGTTTTGAAGCTGGTTTAAATAACATTAATAAAA\n+AACCAGAAAAGAAAAAAATACAAGGTAAATCTGAACCAAGAAAAAGTTTAAACGAATTAT\n+AATTAATCATCTTGTCATTAATTGCCAAGATTGTTTAATTCTTTTTGTATAATTAAAAAT\n+TAGTAGATTAAATA
ACAGGCAATTAGATTACCTGTTATTTTATTTTTACTAAAATATTTA\n+AAACTGAGGGACTTATGGAATACAACAAAAAACTTTATGAAGCAATTGAACGAGTCGCTA\n+TTAAAAATGACGCTTTAAAAAAAGAATTAGAAACGGTTGTAACAGACTTTAAAAAAATTA\n+AAGAGATTAATATACAGTTAAAAAAAACTACTAAAATTGCTGAAGCCTTTGCAAAATATA\n+AACAAAAATTGGATACTGGTATAGCTGCTGAAAAAATATTAAATACAGAAAAAGATTTAG\n+AATTAATCGAATTAGCACAGATGGATTTAGATGAAGCTAAAATTAATATTCCAATAATTG\n+AAAATGATTTAAAAATTATGCTGTTGCCAACTGATCCTAATGATGATAAAAATGTTATTG\n+TTGAAATGCGCCCTGCTGCTGGAGGGGATGAATCATCAATTTTTGTCGGCAATTTGTTTG\n+ATACATATCGTGCTTATGCTGAAAATAATAATTGAAAAATGAAAATTATAGAAATGACTC\n+CGAATGCTGTTGGTTTTAGTTTTATTTCTTTTATGATTTCTGGAGAAGAAGTTTATTCAC\n+GAATGAAATTTGAGTCAGGAGTTCATCGAGTACAACGTGTACCTGCTACTGAATCTAAAG\n+GAAGAGTACATACGTCAACAATTACAGTTGCTGTTCTTCCAGAACAAGATGAAGTTGATG\n+TTGTAATTAATCCAACAGAATTAAGAATTGATACTTACCGTGCAAGTGGGGCTGGAGGAC\n+AGCATGTTAATAGAACAGAATCAGCTGTAAGAATTACGCATATTCCAACAGGGGTTGTTG\n+CTGCATGTCAAGAGGGAAAATCACAAATTGAAAACCGAGAAACAGCTATGAAAATGTTAA\n+GAGCTAAATTATGAGAAGCAGCTCAAGAACAGCAAAATGCAGAATTTGCTAATTTAAGAA\n+AAAATCAAGTTGGTACAGGGGATCGTTCTGAAAAAATCCGTACTTACAATTATCCACAGA\n+ACCGCGTTACTGACCATCGTATTAACCTAACATTAAATAAATTAGACCAAATCATGATGG\n+GTGAGTTAGATGAGATTATTGATGCATTAATTGCTGACGAACAAACTGGTTTAATGGCTA\n+ATTTAGATATTTAATGACCTACCATCAATTAATTTTTCAAGCATACTCACTACTTGAAAA\n+AAAATTACGTAATCCACAAGTAGCATTTCAGTTGCTGTACGGATTAGATAATAAAATTAA\n+CGATTCTTATAGTTTTTCAAATAACCGCTTAACAATTGTAAATTCTAATTTAGAATATAC\n+ATATTTTAAACTATTAGATGAATTTATTAATGGAAAACCATTAGTGAGAATTTTAGGATA\n+TGGCTATTTTTGTGCAAAGCGCTTTTATGTTGATAAAAATGTTTTTGCTTTTCGTGTTGA\n+AACTGAATTATTAATAGATGTTGTTAATAAAGTAATTCAACAATCCACTTATAAAATTAA\n+AAATGTTATTGATGTTTGTTGTGGTAGTGGTGTTTTAGGGTTAAGTACAAAAATGAATTT\n+TAATCAATTGAATGTTTCATTATTAGATATTTCTATTGATGCAATTAATAATTGCAAAAA\n+AAATGCTAAATATCATAACTTAACAGATGTAAATTTTATTCATAAAAGTATGCAAGAATA\n+CTTTTTAAACACAAAAAAACGGTTTGATTTAATTATCTGTAATCCCCCATATATCAAAAG\n+TAATTATGAATTAAATCGTGAAGTCTTAGATTATGACCCCATTAATGCACTTATTGATTT\n+CGATCACAAAGATGGAATTAGTTTTTATTTATTTATAATAAATAACATTAAATCAATTGC\n+TAATGAGAAATTCACTATTATTTTTGAAATTGGTTTTGATCAAAAAGAAATTTTAGAAAA\
n+AGTTATTAAAAAAAATGAATTTCCTCTTTTTTACTACTTTATAAATGATTATAATAATCT\n+AT'..b'TTTATTTT\n+TTTCACTATCTTTTAAAACTCATCCATCGCTTGTTTTTGTAGCAAGATCTTCTAATTTTG\n+TAGTTCCTTTTGTTGAAAGAAGTTTAAATAATTCTTCATTTTGAATAACATTAACAATTT\n+GAGCATATGTAATTGCTTTTAAACCAGCTAGTTTAGCCGCTTGTTCTAAATAAACACGAC\n+CTGCATTTGATAATTCAACAAGCGGAGTATCATCTACATATGTGCTCTTATCTAAACTTG\n+CTTCAGTATGTGTTCCTAATTTATAAGCATCTTTATTAATATCATTAGTTAGTTGTGCAC\n+CTTTTGAAGCATTTTCAATTGCTCCCTTCATTGCTAAATCAACACGTTTAACAATTGAGA\n+ATAAAATTGTTTTTCCATCATTAACAGTTTTGTTTGTAATTCTTTTACGGTTTGTTACAT\n+CATCTAATTCTTGTGCAGTATCAACACCAATAATTACACTTGGATCTGTTGCATTTGAAA\n+CAATTGAAGTTGCAAGGTTTGTTTGTGGACCAGCTACAGGTAAAATAACATCAGCTTTTT\n+TTGTAATTAAATCATTGATAATGTTTGTTGCACCTTCTTCATCTGGTTTAAATGAACCAG\n+CAACGTATTTGCTAGCAAATACTTGTTCAACATTCATTCATTTTTTCTTGCTTCCATTAG\n+CATCTTCTTGATTAATTTCTTTATCTTTTAACTTTTCATTTGCTCATTGAACACCTAATT\n+TAAAACCTTGGATAAAAGTTGAAGTTGATGTAAAATGTAATCCAACATATCCACCTCAAG\n+TTAGTTTTCCATCTGCTGCAAAAGTTTTTTGGTTAGCATTTAAATAGTACGCCGCAGCAA\n+TACCTGTTAAAAATGCTGCTTGATCTACACGATATGAGACAGACGCAATACGGTCTTTAC\n+CCACTGTTCCACTAAATTTATCATCAATTAAAACTGCACTTAAATCTTTTTTATCGCTGC\n+TTGAACCAAAATATTCTTTAATTGGAATTGAGTGACTAAATGAAATCAAGCCTAACATAC\n+GAGCACCATCATCGTATAATGAATTATATGTTCTGTGATATCCTAAACTATCATCTCCAG\n+CTGGTTTTGCATAAAAATCTTCTAAAGACAATTTAGAAATATAATTTCCATCTTTATTTG\n+TTTTCCCATCATCTTTATTACTATCATTACATGATGCAGCAATAGCTGCAACTGAAGTTA\n+ATGTAACCACTCCAGCAAGTGATGCAAACAAGATTTTTTTATTGATTTTGCTTTTTTTCA\n+TAAAATTTATTTTTTATCCTTTTTGACATGAAAAATCTAAAATAACTAAACAACACAATT\n+TTTAAGATTGTGTAGTATCATTATACAAAAAATAAACTTGTATATATAAGTTAAACACTT\n+AATTTTTGTTTTTTGTATAAAAAAAAGCGTTTTTTTAATTAAAACACTTTTTTATTTTTT\n+AAAATTTAGAATTCTTAATGAATTTTCTAATAAGATTTTTTGCATTTTTTCATGTGTAAT\n+GCCTAATAAGTTGGCAATAAATGCTGATGTATATAATACATAATAAGGATAGTTAGTTTG\n+CCCTCGTTTAGGAACTGGTGTTAAATATGGGGCGTCTGTTTCTACTAGAATCTTATCAAG\n+TGGGGTTATTTTAATCGCCTCATACAGTTCATGTAATTGATTATTTTTTGTTGGTTTAAA\n+AGTAATTACACCAGGATATGAAATATAATAACCCATTTCAATATATTGTTGTGCATACTC\n+TTTTTTATCTGTAAAACAATGGATTATTACATCTTGAACAGCTAATTCTTTTAAGATGGC\n+AATTGCGTCATCGTGTGCATTACGGAT
GTGTAACATTAATGGTTTATGATACTTTTTAGC\n+CAATTCAATATGTTTTTTAAACCAATGTTTTTGAAAATCATGATCATAATTTTGTTCATG\n+ATAATAGTCTAAACCACACTCACCAATACAACTTATGTAATCAATATTTTCTGCTATCAA\n+TTTTTCTAATGCAACAAAATCATTTTCTATATTATGTAAATCATTAGGATGGATTGCAAC\n+ACTACAAGTCAAAAATTTAAATTTTTTAGCTTGTTGAATGGCTGTCTGTGAAGTTTTTAA\n+ATCTACTCCAACAATATTTAATCCAATACCTTGTTCATAACATTTAAAGATAATGTCATC\n+AAATTCTTCAATTAATGGTTCAATATTAGGATGAGTATGAGTATCAATAATTTTTATTTT\n+TTCTAACATATTATTTACCTATACAAAAATTTTTAAATAAATCATCTAAAAAATCATATT\n+CGCTACTTATGCCTAAGAGTTCATTTAAACGTAAATTGCAAAATTCTAAATCAGCGACAA\n+TTAAATCAAGTGTATCCCCTTTTTCTAAATTAAGAATTGCGTTATTAATTAAATAATGAA\n+CATTTTCTAAAATACCAATTTGACGTTGGGATTGTAAAACATCAATGTTAGCATTGTCAA\n+ACTCTTGAACATAAAAAAGTTTTTTAATTTCATCAATCAATGACTGAATATCATTATTTT\n+TTGCATTAATATATATTTGTTTATCATCGTATTGATCAACTAAATCTTTTTTTGTATAAA\n+CTAATAAATGTTTTTGTTTTTTAATTAAATCATATAACTCCAAATCTTGTTGTTCGTTTG\n+CAGGTATTAAATATAAAATTAAATCAACTTTATCAATTAATGCTTTGGCTTTATTAATTC\n+CTAAATTTTCAACAAAATCATTTGTTAAATGAATTCCTGCAGTATCTAAGATATTTAAAG\n+TAATATTATCAATATTAATTGAGGATTCAATAACATCACGTGTTGTCCCAGGAATATCTG\n+TAACAATCGCTTTTTGTTCATTGCATAAAGCGTTTAATAGAGTTGATTTACCTACATTTG\n+GTTTTCCAATTATTAACACCCTAATGCCTTTATTGATTGGTAAAAATTTTTTTGATTGAT\n+CAATAATTTTTGTAATTTTTTTATCTAAAGATAATAAACGTTGTTTTAAAATAATAGCAT\n+CAACTTGTTCAACATCATCGTATTCAGGATAATCAATATTAACTTCAATTTGCCCAATTA\n+TCATAAATAACTCATGCCTAAATTCAGCAATTGATTGCGAAACACGTCCTAATAGAGCGC\n+CAATTACACCTTTAACGCTTAATTCATTTTTAGCATTAACCAAATTGTTAATTGCTTCAA\n+TTTTTGATAAATCCATTTTTTTATTTAATAAAGCACGGCGAGAAAATTCTCCACGTTGTG\n+CTGGTTGACAACCATATTTAATTAATGTTTTAATAATTAAATTAGCAACCACTATTCCTC\n+CGTGGCAATTAATTTCTACTAAATCTTCTCCAGTAAATGTTTTTGGAGCTACAAATGTAT\n+TTATTAAAACTTCATCTAAAATTTGATTATCATCTTTTAGAATTGTATACCAAATTTTAA\n+AAGTTTCTTTTTTTATTTTTATTGTTGAAATTTTATTAATTATTTCAAAAGCTTTTGGAC\n+CACTAACCCGAATAATGTGAATGGCACAATTCATAGGCGCGGTTGCTAAAGCAACAATTG\n+TTGACATTGTTAATCACCTTTATTTTTATTAATAATTGTATAAATAATAGTAAACAAATT\n+ATTTTTATTAATATTAATTTTTAAATTCGCACGCATTAAATCCAAAATAATTTCTTTGCT\n+ATTTACATTATTAATTCTAATGAAGATTAATTTTAATAGATAATGAATTTGTAAGGTAGA\n+TAAATTTTTAA
ATATTTCTTTTAAATCATTTAATATTTCAAAACTTCTTAAATCACTTAA\n+TTTTCCATAATAAGTTAAAACATCATTGATTTCCTTGTTTTCTAATAAAATTTTTAGCTC\n+ATCCAAATCATCAAACATTA\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/model.h5
b
Binary file test-data/model.h5 has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/taxonomy.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/taxonomy.tsv Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,40 @@
+g1k_0 13548 genus Treponema A 4 4 4 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g1k_1 566 species Prevotella intermedia 11 9 6 0.520 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_2 566 species Prevotella intermedia 15 15 10 0.980 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_3 206 order Bacteroidales 5 5 5 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_4 566 species Prevotella intermedia 21 19 11 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_5 206 order Bacteroidales 18 16 12 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_6 206 order Bacteroidales 22 22 14 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_7 566 species Prevotella intermedia 8 8 5 0.540 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_8 209 species Bacteroides fragilis 6 5 2 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g1k_9 565 genus Prevotella 27 25 21 0.870 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_0 13548 genus Treponema A 3 3 3 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g2k_1 209 species Bacteroides fragilis 9 9 4 0.930 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_2 565 genus Prevotella 9 9 9 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_3 565 genus Prevotella 8 8 7 0.840 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_4 209 species Bacteroides fragilis 10 8 4 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_5 8420 species Treponema D porcinum 2 1 1 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema D;s_Treponema D porcinum
+g2k_6 209 species Bacteroides fragilis 58 52 32 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_7 1193 species Bacteroides eggerthii 14 14 10 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g2k_8 566 species Prevotella intermedia 33 32 19 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g2k_9 566 species Prevotella intermedia 15 15 7 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_0 22555 species UBA1066 sp002316215 3 2 1 0.940 d_Bacteria;p_Firmicutes A;c_Clostridia;o_Lachnospirales;f_Lachnospiraceae;g_UBA1066;s_UBA1066 sp002316215
+g3k_1 11375 species Treponema B denticola A 7 7 5 0.610 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema B;s_Treponema B denticola A
+g3k_2 208 genus Bacteroides 22 19 13 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_3 288 family Treponemataceae 5 5 5 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g3k_4 208 genus Bacteroides 11 11 7 0.740 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_5 208 genus Bacteroides 46 40 24 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_6 2 superkingdom Bacteria 7 7 6 1.000 d_Bacteria
+g3k_7 209 species Bacteroides fragilis 2 2 1 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g3k_8 566 species Prevotella intermedia 14 14 10 0.750 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_9 565 genus Prevotella 52 51 45 0.860 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_0 565 genus Prevotella 10 9 5 0.820 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_1 565 genus Prevotella 36 35 32 0.890 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_2 565 genus Prevotella 34 33 31 0.920 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_3 209 species Bacteroides fragilis 13 12 4 0.560 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_4 209 species Bacteroides fragilis 4 4 3 0.990 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_5 208 genus Bacteroides 24 20 18 0.940 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g4k_6 1193 species Bacteroides eggerthii 3 3 3 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g4k_7 288 family Treponemataceae 4 4 3 0.670 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g4k_8 565 genus Prevotella 9 9 7 0.530 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_9 566 species Prevotella intermedia 11 10 6 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
b
diff -r 000000000000 -r 7b382efabb98 test-data/taxonomy_10.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/taxonomy_10.tsv Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,40 @@
+g1k_0 13548 genus Treponema A 4 4 4 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g1k_1 566 species Prevotella intermedia 11 9 6 0.520 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_2 566 species Prevotella intermedia 15 15 10 0.980 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_3 206 order Bacteroidales 5 5 5 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_4 566 species Prevotella intermedia 21 19 11 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_5 206 order Bacteroidales 18 16 12 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_6 206 order Bacteroidales 22 22 14 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_7 566 species Prevotella intermedia 8 8 5 0.540 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_8 209 species Bacteroides fragilis 6 5 2 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g1k_9 565 genus Prevotella 27 25 21 0.870 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_0 13548 genus Treponema A 3 3 3 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g2k_1 209 species Bacteroides fragilis 9 9 4 0.930 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_2 565 genus Prevotella 9 9 9 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_3 565 genus Prevotella 8 8 7 0.840 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_4 209 species Bacteroides fragilis 10 8 4 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_5 8420 species Treponema D porcinum 2 1 1 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema D;s_Treponema D porcinum
+g2k_6 209 species Bacteroides fragilis 58 52 32 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_7 1193 species Bacteroides eggerthii 14 14 10 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g2k_8 566 species Prevotella intermedia 33 32 19 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g2k_9 566 species Prevotella intermedia 15 15 7 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_0 22555 species UBA1066 sp002316215 3 2 1 0.940 d_Bacteria;p_Firmicutes A;c_Clostridia;o_Lachnospirales;f_Lachnospiraceae;g_UBA1066;s_UBA1066 sp002316215
+g3k_1 11375 species Treponema B denticola A 7 7 5 0.610 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema B;s_Treponema B denticola A
+g3k_2 208 genus Bacteroides 22 19 13 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_3 288 family Treponemataceae 5 5 5 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g3k_4 208 genus Bacteroides 11 11 7 0.740 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_5 208 genus Bacteroides 46 40 24 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_6 2 superkingdom Bacteria 7 7 6 1.000 d_Bacteria
+g3k_7 209 species Bacteroides fragilis 2 2 1 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g3k_8 566 species Prevotella intermedia 14 14 10 0.750 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_9 565 genus Prevotella 52 51 45 0.860 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_0 565 genus Prevotella 10 9 5 0.820 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_1 565 genus Prevotella 36 35 32 0.890 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_2 565 genus Prevotella 34 33 31 0.920 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_3 209 species Bacteroides fragilis 13 12 4 0.560 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_4 209 species Bacteroides fragilis 4 4 3 0.990 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_5 208 genus Bacteroides 24 20 18 0.940 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g4k_6 1193 species Bacteroides eggerthii 3 3 3 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g4k_7 288 family Treponemataceae 4 4 3 0.670 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g4k_8 565 genus Prevotella 9 9 7 0.530 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_9 566 species Prevotella intermedia 11 10 6 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
b
diff -r 000000000000 -r 7b382efabb98 test-data/taxonomy_2.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/taxonomy_2.tsv Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,40 @@
+g1k_0 13548 genus Treponema A 4 4 4 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g1k_1 566 species Prevotella intermedia 11 9 6 0.520 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_2 566 species Prevotella intermedia 15 15 10 0.980 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_3 206 order Bacteroidales 5 5 5 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_4 566 species Prevotella intermedia 21 19 11 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_5 206 order Bacteroidales 18 16 12 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_6 206 order Bacteroidales 22 22 14 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_7 566 species Prevotella intermedia 8 8 5 0.540 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_8 209 species Bacteroides fragilis 6 5 2 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g1k_9 565 genus Prevotella 27 25 21 0.870 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_0 13548 genus Treponema A 3 3 3 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g2k_1 209 species Bacteroides fragilis 9 9 4 0.930 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_2 565 genus Prevotella 9 9 9 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_3 565 genus Prevotella 8 8 7 0.840 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_4 209 species Bacteroides fragilis 10 8 4 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_5 8420 species Treponema D porcinum 2 1 1 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema D;s_Treponema D porcinum
+g2k_6 209 species Bacteroides fragilis 58 52 32 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_7 1193 species Bacteroides eggerthii 14 14 10 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g2k_8 566 species Prevotella intermedia 33 32 19 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g2k_9 566 species Prevotella intermedia 15 15 7 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_0 22555 species UBA1066 sp002316215 3 2 1 0.940 d_Bacteria;p_Firmicutes A;c_Clostridia;o_Lachnospirales;f_Lachnospiraceae;g_UBA1066;s_UBA1066 sp002316215
+g3k_1 11375 species Treponema B denticola A 7 7 5 0.610 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema B;s_Treponema B denticola A
+g3k_2 208 genus Bacteroides 22 19 13 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_3 288 family Treponemataceae 5 5 5 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g3k_4 208 genus Bacteroides 11 11 7 0.740 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_5 208 genus Bacteroides 46 40 24 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_6 2 superkingdom Bacteria 7 7 6 1.000 d_Bacteria
+g3k_7 209 species Bacteroides fragilis 2 2 1 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g3k_8 566 species Prevotella intermedia 14 14 10 0.750 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_9 565 genus Prevotella 52 51 45 0.860 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_0 565 genus Prevotella 10 9 5 0.820 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_1 565 genus Prevotella 36 35 32 0.890 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_2 565 genus Prevotella 34 33 31 0.920 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_3 209 species Bacteroides fragilis 13 12 4 0.560 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_4 209 species Bacteroides fragilis 4 4 3 0.990 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_5 208 genus Bacteroides 24 20 18 0.940 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g4k_6 1193 species Bacteroides eggerthii 3 3 3 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g4k_7 288 family Treponemataceae 4 4 3 0.670 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g4k_8 565 genus Prevotella 9 9 7 0.530 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_9 566 species Prevotella intermedia 11 10 6 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
b
diff -r 000000000000 -r 7b382efabb98 test-data/taxonomy_3.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/taxonomy_3.tsv Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,40 @@
+g1k_0 13548 genus Treponema A 4 4 4 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g1k_1 566 species Prevotella intermedia 11 9 6 0.520 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_2 566 species Prevotella intermedia 15 15 10 0.980 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_3 206 order Bacteroidales 5 5 5 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_4 566 species Prevotella intermedia 21 19 11 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_5 206 order Bacteroidales 18 16 12 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_6 206 order Bacteroidales 22 22 14 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_7 566 species Prevotella intermedia 8 8 5 0.540 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_8 209 species Bacteroides fragilis 6 5 2 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g1k_9 565 genus Prevotella 27 25 21 0.870 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_0 13548 genus Treponema A 3 3 3 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g2k_1 209 species Bacteroides fragilis 9 9 4 0.930 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_2 565 genus Prevotella 9 9 9 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_3 565 genus Prevotella 8 8 7 0.840 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_4 209 species Bacteroides fragilis 10 8 4 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_5 8420 species Treponema D porcinum 2 1 1 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema D;s_Treponema D porcinum
+g2k_6 209 species Bacteroides fragilis 58 52 32 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_7 1193 species Bacteroides eggerthii 14 14 10 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g2k_8 566 species Prevotella intermedia 33 32 19 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g2k_9 566 species Prevotella intermedia 15 15 7 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_0 22555 species UBA1066 sp002316215 3 2 1 0.940 d_Bacteria;p_Firmicutes A;c_Clostridia;o_Lachnospirales;f_Lachnospiraceae;g_UBA1066;s_UBA1066 sp002316215
+g3k_1 11375 species Treponema B denticola A 7 7 5 0.610 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema B;s_Treponema B denticola A
+g3k_2 208 genus Bacteroides 22 19 13 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_3 288 family Treponemataceae 5 5 5 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g3k_4 208 genus Bacteroides 11 11 7 0.740 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_5 208 genus Bacteroides 46 40 24 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_6 2 superkingdom Bacteria 7 7 6 1.000 d_Bacteria
+g3k_7 209 species Bacteroides fragilis 2 2 1 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g3k_8 566 species Prevotella intermedia 14 14 10 0.750 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_9 565 genus Prevotella 52 51 45 0.860 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_0 565 genus Prevotella 10 9 5 0.820 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_1 565 genus Prevotella 36 35 32 0.890 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_2 565 genus Prevotella 34 33 31 0.920 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_3 209 species Bacteroides fragilis 13 12 4 0.560 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_4 209 species Bacteroides fragilis 4 4 3 0.990 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_5 208 genus Bacteroides 24 20 18 0.940 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g4k_6 1193 species Bacteroides eggerthii 3 3 3 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g4k_7 288 family Treponemataceae 4 4 3 0.670 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g4k_8 565 genus Prevotella 9 9 7 0.530 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_9 566 species Prevotella intermedia 11 10 6 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
b
diff -r 000000000000 -r 7b382efabb98 test-data/taxonomy_4.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/taxonomy_4.tsv Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,40 @@
+g1k_0 13548 genus Treponema A 4 4 4 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g1k_1 566 species Prevotella intermedia 11 9 6 0.520 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_2 566 species Prevotella intermedia 15 15 10 0.980 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_3 206 order Bacteroidales 5 5 5 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_4 566 species Prevotella intermedia 21 19 11 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_5 206 order Bacteroidales 18 16 12 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_6 206 order Bacteroidales 22 22 14 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_7 566 species Prevotella intermedia 8 8 5 0.540 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_8 209 species Bacteroides fragilis 6 5 2 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g1k_9 565 genus Prevotella 27 25 21 0.870 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_0 13548 genus Treponema A 3 3 3 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g2k_1 209 species Bacteroides fragilis 9 9 4 0.930 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_2 565 genus Prevotella 9 9 9 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_3 565 genus Prevotella 8 8 7 0.840 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_4 209 species Bacteroides fragilis 10 8 4 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_5 8420 species Treponema D porcinum 2 1 1 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema D;s_Treponema D porcinum
+g2k_6 209 species Bacteroides fragilis 58 52 32 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_7 1193 species Bacteroides eggerthii 14 14 10 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g2k_8 566 species Prevotella intermedia 33 32 19 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g2k_9 566 species Prevotella intermedia 15 15 7 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_0 22555 species UBA1066 sp002316215 3 2 1 0.940 d_Bacteria;p_Firmicutes A;c_Clostridia;o_Lachnospirales;f_Lachnospiraceae;g_UBA1066;s_UBA1066 sp002316215
+g3k_1 11375 species Treponema B denticola A 7 7 5 0.610 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema B;s_Treponema B denticola A
+g3k_2 208 genus Bacteroides 22 19 13 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_3 288 family Treponemataceae 5 5 5 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g3k_4 208 genus Bacteroides 11 11 7 0.740 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_5 208 genus Bacteroides 46 40 24 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_6 2 superkingdom Bacteria 7 7 6 1.000 d_Bacteria
+g3k_7 209 species Bacteroides fragilis 2 2 1 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g3k_8 566 species Prevotella intermedia 14 14 10 0.750 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_9 565 genus Prevotella 52 51 45 0.860 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_0 565 genus Prevotella 10 9 5 0.820 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_1 565 genus Prevotella 36 35 32 0.890 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_2 565 genus Prevotella 34 33 31 0.920 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_3 209 species Bacteroides fragilis 13 12 4 0.560 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_4 209 species Bacteroides fragilis 4 4 3 0.990 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_5 208 genus Bacteroides 24 20 18 0.940 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g4k_6 1193 species Bacteroides eggerthii 3 3 3 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g4k_7 288 family Treponemataceae 4 4 3 0.670 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g4k_8 565 genus Prevotella 9 9 7 0.530 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_9 566 species Prevotella intermedia 11 10 6 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
b
diff -r 000000000000 -r 7b382efabb98 test-data/taxonomy_5.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/taxonomy_5.tsv Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,40 @@
+g1k_0 13548 genus Treponema A 4 4 4 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g1k_1 566 species Prevotella intermedia 11 9 6 0.520 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_2 566 species Prevotella intermedia 15 15 10 0.980 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_3 206 order Bacteroidales 5 5 5 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_4 566 species Prevotella intermedia 21 19 11 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_5 206 order Bacteroidales 18 16 12 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_6 206 order Bacteroidales 22 22 14 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_7 566 species Prevotella intermedia 8 8 5 0.540 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_8 209 species Bacteroides fragilis 6 5 2 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g1k_9 565 genus Prevotella 27 25 21 0.870 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_0 13548 genus Treponema A 3 3 3 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g2k_1 209 species Bacteroides fragilis 9 9 4 0.930 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_2 565 genus Prevotella 9 9 9 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_3 565 genus Prevotella 8 8 7 0.840 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_4 209 species Bacteroides fragilis 10 8 4 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_5 8420 species Treponema D porcinum 2 1 1 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema D;s_Treponema D porcinum
+g2k_6 209 species Bacteroides fragilis 58 52 32 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_7 1193 species Bacteroides eggerthii 14 14 10 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g2k_8 566 species Prevotella intermedia 33 32 19 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g2k_9 566 species Prevotella intermedia 15 15 7 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_0 22555 species UBA1066 sp002316215 3 2 1 0.940 d_Bacteria;p_Firmicutes A;c_Clostridia;o_Lachnospirales;f_Lachnospiraceae;g_UBA1066;s_UBA1066 sp002316215
+g3k_1 11375 species Treponema B denticola A 7 7 5 0.610 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema B;s_Treponema B denticola A
+g3k_2 208 genus Bacteroides 22 19 13 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_3 288 family Treponemataceae 5 5 5 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g3k_4 208 genus Bacteroides 11 11 7 0.740 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_5 208 genus Bacteroides 46 40 24 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_6 2 superkingdom Bacteria 7 7 6 1.000 d_Bacteria
+g3k_7 209 species Bacteroides fragilis 2 2 1 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g3k_8 566 species Prevotella intermedia 14 14 10 0.750 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_9 565 genus Prevotella 52 51 45 0.860 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_0 565 genus Prevotella 10 9 5 0.820 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_1 565 genus Prevotella 36 35 32 0.890 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_2 565 genus Prevotella 34 33 31 0.920 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_3 209 species Bacteroides fragilis 13 12 4 0.560 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_4 209 species Bacteroides fragilis 4 4 3 0.990 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_5 208 genus Bacteroides 24 20 18 0.940 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g4k_6 1193 species Bacteroides eggerthii 3 3 3 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g4k_7 288 family Treponemataceae 4 4 3 0.670 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g4k_8 565 genus Prevotella 9 9 7 0.530 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_9 566 species Prevotella intermedia 11 10 6 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
b
diff -r 000000000000 -r 7b382efabb98 test-data/taxonomy_6.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/taxonomy_6.tsv Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,40 @@
+g1k_0 13548 genus Treponema A 4 4 4 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g1k_1 566 species Prevotella intermedia 11 9 6 0.520 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_2 566 species Prevotella intermedia 15 15 10 0.980 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_3 206 order Bacteroidales 5 5 5 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_4 566 species Prevotella intermedia 21 19 11 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_5 206 order Bacteroidales 18 16 12 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_6 206 order Bacteroidales 22 22 14 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_7 566 species Prevotella intermedia 8 8 5 0.540 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_8 209 species Bacteroides fragilis 6 5 2 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g1k_9 565 genus Prevotella 27 25 21 0.870 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_0 13548 genus Treponema A 3 3 3 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g2k_1 209 species Bacteroides fragilis 9 9 4 0.930 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_2 565 genus Prevotella 9 9 9 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_3 565 genus Prevotella 8 8 7 0.840 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_4 209 species Bacteroides fragilis 10 8 4 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_5 8420 species Treponema D porcinum 2 1 1 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema D;s_Treponema D porcinum
+g2k_6 209 species Bacteroides fragilis 58 52 32 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_7 1193 species Bacteroides eggerthii 14 14 10 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g2k_8 566 species Prevotella intermedia 33 32 19 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g2k_9 566 species Prevotella intermedia 15 15 7 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_0 22555 species UBA1066 sp002316215 3 2 1 0.940 d_Bacteria;p_Firmicutes A;c_Clostridia;o_Lachnospirales;f_Lachnospiraceae;g_UBA1066;s_UBA1066 sp002316215
+g3k_1 11375 species Treponema B denticola A 7 7 5 0.610 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema B;s_Treponema B denticola A
+g3k_2 208 genus Bacteroides 22 19 13 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_3 288 family Treponemataceae 5 5 5 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g3k_4 208 genus Bacteroides 11 11 7 0.740 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_5 208 genus Bacteroides 46 40 24 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_6 2 superkingdom Bacteria 7 7 6 1.000 d_Bacteria
+g3k_7 209 species Bacteroides fragilis 2 2 1 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g3k_8 566 species Prevotella intermedia 14 14 10 0.750 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_9 565 genus Prevotella 52 51 45 0.860 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_0 565 genus Prevotella 10 9 5 0.820 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_1 565 genus Prevotella 36 35 32 0.890 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_2 565 genus Prevotella 34 33 31 0.920 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_3 209 species Bacteroides fragilis 13 12 4 0.560 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_4 209 species Bacteroides fragilis 4 4 3 0.990 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_5 208 genus Bacteroides 24 20 18 0.940 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g4k_6 1193 species Bacteroides eggerthii 3 3 3 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g4k_7 288 family Treponemataceae 4 4 3 0.670 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g4k_8 565 genus Prevotella 9 9 7 0.530 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_9 566 species Prevotella intermedia 11 10 6 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
b
diff -r 000000000000 -r 7b382efabb98 test-data/taxonomy_7.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/taxonomy_7.tsv Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,40 @@
+g1k_0 13548 genus Treponema A 4 4 4 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g1k_1 566 species Prevotella intermedia 11 9 6 0.520 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_2 566 species Prevotella intermedia 15 15 10 0.980 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_3 206 order Bacteroidales 5 5 5 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_4 566 species Prevotella intermedia 21 19 11 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_5 206 order Bacteroidales 18 16 12 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_6 206 order Bacteroidales 22 22 14 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_7 566 species Prevotella intermedia 8 8 5 0.540 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_8 209 species Bacteroides fragilis 6 5 2 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g1k_9 565 genus Prevotella 27 25 21 0.870 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_0 13548 genus Treponema A 3 3 3 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g2k_1 209 species Bacteroides fragilis 9 9 4 0.930 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_2 565 genus Prevotella 9 9 9 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_3 565 genus Prevotella 8 8 7 0.840 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_4 209 species Bacteroides fragilis 10 8 4 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_5 8420 species Treponema D porcinum 2 1 1 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema D;s_Treponema D porcinum
+g2k_6 209 species Bacteroides fragilis 58 52 32 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_7 1193 species Bacteroides eggerthii 14 14 10 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g2k_8 566 species Prevotella intermedia 33 32 19 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g2k_9 566 species Prevotella intermedia 15 15 7 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_0 22555 species UBA1066 sp002316215 3 2 1 0.940 d_Bacteria;p_Firmicutes A;c_Clostridia;o_Lachnospirales;f_Lachnospiraceae;g_UBA1066;s_UBA1066 sp002316215
+g3k_1 11375 species Treponema B denticola A 7 7 5 0.610 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema B;s_Treponema B denticola A
+g3k_2 208 genus Bacteroides 22 19 13 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_3 288 family Treponemataceae 5 5 5 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g3k_4 208 genus Bacteroides 11 11 7 0.740 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_5 208 genus Bacteroides 46 40 24 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_6 2 superkingdom Bacteria 7 7 6 1.000 d_Bacteria
+g3k_7 209 species Bacteroides fragilis 2 2 1 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g3k_8 566 species Prevotella intermedia 14 14 10 0.750 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_9 565 genus Prevotella 52 51 45 0.860 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_0 565 genus Prevotella 10 9 5 0.820 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_1 565 genus Prevotella 36 35 32 0.890 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_2 565 genus Prevotella 34 33 31 0.920 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_3 209 species Bacteroides fragilis 13 12 4 0.560 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_4 209 species Bacteroides fragilis 4 4 3 0.990 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_5 208 genus Bacteroides 24 20 18 0.940 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g4k_6 1193 species Bacteroides eggerthii 3 3 3 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g4k_7 288 family Treponemataceae 4 4 3 0.670 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g4k_8 565 genus Prevotella 9 9 7 0.530 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_9 566 species Prevotella intermedia 11 10 6 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
b
diff -r 000000000000 -r 7b382efabb98 test-data/taxonomy_8.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/taxonomy_8.tsv Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,40 @@
+g1k_0 13548 genus Treponema A 4 4 4 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g1k_1 566 species Prevotella intermedia 11 9 6 0.520 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_2 566 species Prevotella intermedia 15 15 10 0.980 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_3 206 order Bacteroidales 5 5 5 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_4 566 species Prevotella intermedia 21 19 11 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_5 206 order Bacteroidales 18 16 12 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_6 206 order Bacteroidales 22 22 14 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_7 566 species Prevotella intermedia 8 8 5 0.540 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_8 209 species Bacteroides fragilis 6 5 2 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g1k_9 565 genus Prevotella 27 25 21 0.870 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_0 13548 genus Treponema A 3 3 3 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g2k_1 209 species Bacteroides fragilis 9 9 4 0.930 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_2 565 genus Prevotella 9 9 9 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_3 565 genus Prevotella 8 8 7 0.840 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_4 209 species Bacteroides fragilis 10 8 4 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_5 8420 species Treponema D porcinum 2 1 1 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema D;s_Treponema D porcinum
+g2k_6 209 species Bacteroides fragilis 58 52 32 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_7 1193 species Bacteroides eggerthii 14 14 10 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g2k_8 566 species Prevotella intermedia 33 32 19 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g2k_9 566 species Prevotella intermedia 15 15 7 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_0 22555 species UBA1066 sp002316215 3 2 1 0.940 d_Bacteria;p_Firmicutes A;c_Clostridia;o_Lachnospirales;f_Lachnospiraceae;g_UBA1066;s_UBA1066 sp002316215
+g3k_1 11375 species Treponema B denticola A 7 7 5 0.610 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema B;s_Treponema B denticola A
+g3k_2 208 genus Bacteroides 22 19 13 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_3 288 family Treponemataceae 5 5 5 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g3k_4 208 genus Bacteroides 11 11 7 0.740 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_5 208 genus Bacteroides 46 40 24 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_6 2 superkingdom Bacteria 7 7 6 1.000 d_Bacteria
+g3k_7 209 species Bacteroides fragilis 2 2 1 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g3k_8 566 species Prevotella intermedia 14 14 10 0.750 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_9 565 genus Prevotella 52 51 45 0.860 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_0 565 genus Prevotella 10 9 5 0.820 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_1 565 genus Prevotella 36 35 32 0.890 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_2 565 genus Prevotella 34 33 31 0.920 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_3 209 species Bacteroides fragilis 13 12 4 0.560 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_4 209 species Bacteroides fragilis 4 4 3 0.990 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_5 208 genus Bacteroides 24 20 18 0.940 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g4k_6 1193 species Bacteroides eggerthii 3 3 3 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g4k_7 288 family Treponemataceae 4 4 3 0.670 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g4k_8 565 genus Prevotella 9 9 7 0.530 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_9 566 species Prevotella intermedia 11 10 6 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
b
diff -r 000000000000 -r 7b382efabb98 test-data/taxonomy_9.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/taxonomy_9.tsv Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,40 @@
+g1k_0 13548 genus Treponema A 4 4 4 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g1k_1 566 species Prevotella intermedia 11 9 6 0.520 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_2 566 species Prevotella intermedia 15 15 10 0.980 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_3 206 order Bacteroidales 5 5 5 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_4 566 species Prevotella intermedia 21 19 11 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_5 206 order Bacteroidales 18 16 12 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_6 206 order Bacteroidales 22 22 14 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales
+g1k_7 566 species Prevotella intermedia 8 8 5 0.540 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g1k_8 209 species Bacteroides fragilis 6 5 2 0.640 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g1k_9 565 genus Prevotella 27 25 21 0.870 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_0 13548 genus Treponema A 3 3 3 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema A
+g2k_1 209 species Bacteroides fragilis 9 9 4 0.930 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_2 565 genus Prevotella 9 9 9 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_3 565 genus Prevotella 8 8 7 0.840 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g2k_4 209 species Bacteroides fragilis 10 8 4 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_5 8420 species Treponema D porcinum 2 1 1 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema D;s_Treponema D porcinum
+g2k_6 209 species Bacteroides fragilis 58 52 32 0.730 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g2k_7 1193 species Bacteroides eggerthii 14 14 10 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g2k_8 566 species Prevotella intermedia 33 32 19 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g2k_9 566 species Prevotella intermedia 15 15 7 0.600 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_0 22555 species UBA1066 sp002316215 3 2 1 0.940 d_Bacteria;p_Firmicutes A;c_Clostridia;o_Lachnospirales;f_Lachnospiraceae;g_UBA1066;s_UBA1066 sp002316215
+g3k_1 11375 species Treponema B denticola A 7 7 5 0.610 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae;g_Treponema B;s_Treponema B denticola A
+g3k_2 208 genus Bacteroides 22 19 13 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_3 288 family Treponemataceae 5 5 5 1.000 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g3k_4 208 genus Bacteroides 11 11 7 0.740 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_5 208 genus Bacteroides 46 40 24 0.670 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g3k_6 2 superkingdom Bacteria 7 7 6 1.000 d_Bacteria
+g3k_7 209 species Bacteroides fragilis 2 2 1 0.500 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g3k_8 566 species Prevotella intermedia 14 14 10 0.750 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
+g3k_9 565 genus Prevotella 52 51 45 0.860 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_0 565 genus Prevotella 10 9 5 0.820 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_1 565 genus Prevotella 36 35 32 0.890 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_2 565 genus Prevotella 34 33 31 0.920 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_3 209 species Bacteroides fragilis 13 12 4 0.560 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_4 209 species Bacteroides fragilis 4 4 3 0.990 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides fragilis
+g4k_5 208 genus Bacteroides 24 20 18 0.940 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides
+g4k_6 1193 species Bacteroides eggerthii 3 3 3 1.000 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Bacteroides;s_Bacteroides eggerthii
+g4k_7 288 family Treponemataceae 4 4 3 0.670 d_Bacteria;p_Spirochaetota;c_Spirochaetia;o_Treponematales;f_Treponemataceae
+g4k_8 565 genus Prevotella 9 9 7 0.530 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella
+g4k_9 566 species Prevotella intermedia 11 10 6 0.790 d_Bacteria;p_Bacteroidota;c_Bacteroidia;o_Bacteroidales;f_Bacteroidaceae;g_Prevotella;s_Prevotella intermedia
b
diff -r 000000000000 -r 7b382efabb98 test-data/test-db/GTDB
b
Binary file test-data/test-db/GTDB has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/test-db/GTDB.dbtype
b
Binary file test-data/test-db/GTDB.dbtype has changed
b
diff -r 000000000000 -r 7b382efabb98 test-data/test-db/GTDB.index
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test-db/GTDB.index Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,1205 @@\n+1826398\t360017\t709\n+1826399\t360726\t267\n+1826400\t34819\t451\n+1826401\t35270\t676\n+1826402\t35946\t114\n+1826403\t36060\t477\n+1826404\t36537\t510\n+1826405\t37047\t151\n+1826406\t37198\t366\n+1826407\t37564\t266\n+1826408\t37830\t367\n+1826409\t38197\t549\n+1826410\t288324\t309\n+1826411\t288633\t453\n+1826412\t289086\t1309\n+1826413\t290395\t80\n+1826414\t290475\t441\n+1826415\t290916\t280\n+1826416\t291196\t280\n+3083454\t81815\t294\n+3083455\t82109\t223\n+3083456\t82332\t301\n+3083457\t82633\t92\n+3083458\t82725\t465\n+3083459\t83190\t299\n+3083460\t291476\t197\n+3083461\t291673\t297\n+3083462\t291970\t272\n+3083463\t292242\t555\n+3083464\t292797\t393\n+3083465\t293190\t147\n+3083466\t293337\t275\n+3083467\t293612\t277\n+3083468\t293889\t379\n+3083469\t294268\t358\n+3083470\t360993\t336\n+3083471\t361329\t271\n+3083472\t361600\t147\n+5140526\t129047\t750\n+5140527\t129797\t496\n+5140528\t130293\t598\n+5140529\t130891\t234\n+5140530\t381110\t221\n+5140531\t381331\t1437\n+5140532\t382768\t521\n+5140533\t383289\t474\n+5140534\t383763\t242\n+5140535\t384005\t184\n+5140536\t384189\t452\n+5140537\t384641\t270\n+5140538\t384911\t903\n+5140539\t385814\t419\n+5140540\t335606\t619\n+5140541\t336225\t458\n+5140542\t336683\t436\n+5140543\t337119\t599\n+5140544\t337718\t386\n+6397582\t172815\t470\n+6397583\t173285\t292\n+6397584\t173577\t185\n+6397585\t173762\t700\n+6397586\t174462\t371\n+6397587\t174833\t887\n+6397588\t175720\t122\n+6397589\t175842\t103\n+6397590\t83489\t237\n+6397591\t83726\t138\n+6397592\t83864\t463\n+6397593\t84327\t219\n+6397594\t84546\t84\n+6397595\t84630\t91\n+6397596\t84721\t881\n+6397597\t85602\t277\n+6397598\t85879\t599\n+6397599\t86478\t323\n+6397600\t294626\t225\n+8454654\t361747\t257\n+8454655\t362004\t161\n+8454656\t362165\t239\n+8454657\t362404\t439\n+8454658\t362843\t232\n+8454659\t363075\t1308\n+8454660\t86801\t431\n+8454661\t87232\t216\n+8454662\t87448\t133\n+8454663\t87581\t129\n+8454664\t87710\t794\n+8454665\
t88504\t171\n+8454666\t88675\t323\n+8454667\t88998\t631\n+8454668\t89629\t828\n+8454669\t90457\t770\n+8454670\t294851\t297\n+8454671\t295148\t1370\n+8454672\t296518\t116\n+9711710\t402852\t142\n+9711711\t402994\t244\n+9711712\t403238\t168\n+9711713\t403406\t620\n+9711714\t404026\t449\n+9711715\t404475\t59\n+9711716\t404534\t182\n+9711717\t404716\t201\n+9711718\t404917\t273\n+9711719\t405190\t225\n+9711720\t38746\t178\n+9711721\t38924\t435\n+9711722\t39359\t247\n+9711723\t39606\t226\n+9711724\t39832\t245\n+9711725\t40077\t279\n+9711726\t40356\t225\n+9711727\t40581\t241\n+9711728\t40822\t61\n+11768782\t386233\t178\n+11768783\t386411\t91\n+11768784\t386502\t1057\n+11768785\t387559\t242\n+11768786\t387801\t156\n+11768787\t387957\t176\n+11768788\t388133\t524\n+11768789\t388657\t252\n+11768790\t232386\t721\n+11768791\t233107\t1584\n+11768792\t234691\t451\n+11768793\t235142\t587\n+11768794\t235729\t387\n+11768795\t236116\t61\n+11768796\t236177\t363\n+11768797\t236540\t559\n+11768798\t237099\t232\n+11768799\t237331\t581\n+11768800\t187479\t51\n+13025838\t40883\t468\n+13025839\t41351\t174\n+13025840\t316254\t457\n+13025841\t316711\t144\n+13025842\t316855\t376\n+13025843\t317231\t87\n+13025844\t317318\t60\n+13025845\t317378\t664\n+13025846\t318042\t245\n+13025847\t318287\t252\n+13025848\t318539\t247\n+13025849\t318786\t219\n+13025850\t364383\t323\n+13025851\t364706\t463\n+13025852\t365169\t766\n+13025853\t365935\t346\n+13025854\t366281\t199\n+13025855\t366480\t280\n+13025856\t366760\t953\n+15082909\t338104\t460\n+15082910\t0\t160\n+15082911\t160\t611\n+15082912\t771\t45\n+15082913\t816\t397\n+15082914\t1213\t228\n+15082915\t1441\t287\n+15082916\t1728\t253\n+15082917\t1981\t77\n+15082918\t2058\t540\n+15082919\t2598\t461\n+15082920\t260838\t224\n+15082921\t261062\t327\n+15082922\t261389\t278\n+15082923\t261667\t144\n+15082924\t261811\t119\n+15082925\t261930\t661\n+15082926\t262591\t153\n+15082927\t262744\t431\n+16339966\t131125\t477\n+16339967\t131602\t203\n+16339968\t131805\t3
34\n+16339969\t132139\t819\n+16339970\t237912\t368\n+16339971\t238280\t192\n+16339972\t238472\t160\n+16339973\t238632\t293\n+16339974\t238925\t191\n+16339975\t239116\t471\n+16339976\t239587\t346\n+16339977\t239933\t470\n+16339978\t240403\t321\n+16339979\t240724\t528\n+16339980\t187530\t378\n+16339981\t187908\t283\n+16339982\t188191\t294\n+16339983\t188485\t313\n+16339984\t188798\t222\n+18397037\t189020\t98\n+18397038\t189118\t358\n+18397039\t189476\t296\n+18397040\t367713\t1048\n+18397041\t368761\t1087\n+18397042\t369848\t150\n+18397043\t369998\t200\n+18397044\t370198\t816\n+18397045\t37101'..b'469\n+91307842\t331395\t77\n+91307843\t331472\t600\n+91307844\t332072\t210\n+91307845\t332282\t116\n+91307846\t332398\t241\n+91307847\t332639\t194\n+91307848\t332833\t64\n+91307849\t332897\t184\n+91307850\t185153\t189\n+91307851\t185342\t194\n+91307852\t185536\t78\n+91307853\t185614\t260\n+91307854\t185874\t250\n+91307855\t186124\t364\n+91307856\t186488\t276\n+91307857\t186764\t360\n+91307858\t187124\t62\n+91307859\t187186\t293\n+92564897\t355745\t277\n+92564898\t356022\t512\n+92564899\t356534\t106\n+92564900\t272169\t101\n+92564901\t272270\t516\n+92564902\t272786\t208\n+92564903\t272994\t126\n+92564904\t273120\t157\n+92564905\t273277\t298\n+92564906\t273575\t164\n+92564907\t273739\t442\n+92564908\t274181\t161\n+92564909\t274342\t194\n+92564910\t285463\t277\n+92564911\t285740\t478\n+92564912\t286218\t483\n+92564913\t286701\t422\n+92564914\t287123\t369\n+92564915\t287492\t425\n+94621968\t310297\t370\n+94621969\t310667\t724\n+94621970\t168818\t102\n+94621971\t168920\t418\n+94621972\t169338\t101\n+94621973\t169439\t505\n+94621974\t169944\t339\n+94621975\t170283\t135\n+94621976\t170418\t366\n+94621977\t170784\t87\n+94621978\t170871\t227\n+94621979\t171098\t400\n+94621980\t258659\t401\n+94621981\t259060\t363\n+94621982\t259423\t384\n+94621983\t259807\t315\n+94621984\t260122\t56\n+94621985\t260178\t497\n+94621986\t260675\t163\n+95879024\t210731\t82\n+95879025\t210813\t374\n+9587902
6\t211187\t100\n+95879027\t211287\t510\n+95879028\t211797\t362\n+95879029\t212159\t96\n+95879030\t124514\t109\n+95879031\t124623\t397\n+95879032\t125020\t1157\n+95879033\t126177\t495\n+95879034\t126672\t398\n+95879035\t127070\t81\n+95879036\t127151\t121\n+95879037\t127272\t622\n+95879038\t127894\t552\n+95879039\t128446\t601\n+95879040\t287917\t158\n+95879041\t288075\t189\n+95879042\t288264\t60\n+97936095\t311391\t352\n+97936096\t311743\t144\n+97936097\t311887\t204\n+97936098\t312091\t303\n+97936099\t312394\t81\n+97936100\t356640\t294\n+97936101\t356934\t250\n+97936102\t357184\t185\n+97936103\t357369\t58\n+97936104\t357427\t149\n+97936105\t357576\t98\n+97936106\t357674\t252\n+97936107\t357926\t221\n+97936108\t358147\t112\n+97936109\t358259\t233\n+97936110\t401665\t70\n+97936111\t401735\t583\n+97936112\t402318\t126\n+97936113\t402444\t408\n+99193151\t22634\t164\n+99193152\t22798\t369\n+99193153\t23167\t549\n+99193154\t23716\t917\n+99193155\t24633\t108\n+99193156\t24741\t245\n+99193157\t24986\t183\n+99193158\t25169\t211\n+99193159\t25380\t648\n+99193160\t333081\t449\n+99193161\t333530\t300\n+99193162\t333830\t213\n+99193163\t334043\t265\n+99193164\t334308\t339\n+99193165\t334647\t224\n+99193166\t334871\t317\n+99193167\t335188\t128\n+99193168\t335316\t205\n+99193169\t335521\t85\n+101250222\t74704\t326\n+101250223\t75030\t582\n+101250224\t75612\t83\n+101250225\t75695\t840\n+101250226\t76535\t63\n+101250227\t76598\t443\n+101250228\t77041\t389\n+101250229\t77430\t124\n+101250230\t424608\t553\n+101250231\t425161\t194\n+101250232\t425355\t267\n+101250233\t425622\t73\n+101250234\t425695\t378\n+101250235\t426073\t86\n+101250236\t426159\t86\n+101250237\t426245\t383\n+101250238\t426628\t301\n+101250239\t426929\t231\n+101250240\t305792\t485\n+102507278\t77554\t182\n+102507279\t77736\t308\n+102507280\t228375\t194\n+102507281\t228569\t125\n+102507282\t228694\t569\n+102507283\t229263\t160\n+102507284\t229423\t104\n+102507285\t229527\t502\n+102507286\t230029\t1207\n+102507287\t231236
\t778\n+102507288\t232014\t259\n+102507289\t232273\t113\n+102507290\t358492\t357\n+102507291\t358849\t180\n+102507292\t359029\t104\n+102507293\t359133\t88\n+102507294\t359221\t265\n+102507295\t359486\t374\n+102507296\t359860\t157\n+104564349\t26028\t242\n+104564350\t78044\t601\n+104564351\t78645\t570\n+104564352\t79215\t669\n+104564353\t79884\t81\n+104564354\t79965\t324\n+104564355\t80289\t306\n+104564356\t80595\t206\n+104564357\t80801\t425\n+104564358\t81226\t295\n+104564359\t81521\t294\n+104564360\t312475\t1445\n+104564361\t313920\t152\n+104564362\t314072\t502\n+104564363\t314574\t778\n+104564364\t315352\t289\n+104564365\t315641\t244\n+104564366\t315885\t101\n+104564367\t315986\t268\n+105821405\t274536\t516\n+105821406\t275052\t64\n+105821407\t275116\t1133\n+105821408\t276249\t255\n+105821409\t276504\t518\n+105821410\t427160\t55\n+105821411\t427215\t134\n+105821412\t427349\t396\n+105821413\t427745\t281\n+105821414\t428026\t197\n+105821415\t428223\t149\n+105821416\t428372\t224\n+105821417\t428596\t214\n+105821418\t428810\t239\n+105821419\t429049\t379\n+105821420\t171498\t590\n+105821421\t172088\t234\n+105821422\t172322\t200\n+105821423\t172522\t293\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/test-db/GTDB_mapping
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test-db/GTDB_mapping Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,265 @@
+5140526 1490
+5140527 1490
+5140528 1490
+5140529 1490
+5140530 1490
+5140531 1490
+5140532 1490
+5140533 1490
+5140534 1490
+5140535 1490
+5140536 1490
+5140537 1490
+5140538 1490
+5140539 1490
+5140540 1490
+5140541 1490
+5140542 1490
+5140543 1490
+5140544 1490
+8454654 1490
+8454655 1490
+8454656 1490
+8454657 1490
+8454658 1490
+8454659 1490
+8454660 1490
+8454661 1490
+8454662 1490
+8454663 1490
+8454664 1490
+8454665 1490
+8454666 1490
+8454667 1490
+8454668 1490
+8454669 1490
+8454670 1490
+8454671 1490
+8454672 1490
+11768782 1490
+11768783 1490
+11768784 1490
+11768785 1490
+11768786 1490
+11768787 1490
+11768788 1490
+11768789 1490
+11768790 1490
+11768791 1490
+11768792 1490
+11768793 1490
+11768794 1490
+11768795 1490
+11768796 1490
+11768797 1490
+11768798 1490
+11768799 1490
+11768800 1490
+15082909 1490
+15082910 1490
+15082911 1490
+15082912 1490
+15082913 1490
+15082914 1490
+15082915 1490
+15082916 1490
+15082917 1490
+15082918 1490
+15082919 1490
+15082920 1490
+15082921 1490
+15082922 1490
+15082923 1490
+15082924 1490
+15082925 1490
+15082926 1490
+15082927 1490
+1826398 1490
+1826399 1490
+1826400 1490
+1826401 1490
+1826402 1490
+1826403 1490
+1826404 1490
+1826405 1490
+1826406 1490
+1826407 1490
+1826408 1490
+1826409 1490
+1826410 1490
+1826411 1490
+1826412 1490
+1826413 1490
+1826414 1490
+1826415 1490
+1826416 1490
+3083454 29907
+3083455 29907
+3083456 29907
+3083457 29907
+3083458 29907
+3083459 29907
+3083460 29907
+3083461 29907
+3083462 29907
+3083463 29907
+3083464 29907
+3083465 29907
+3083466 29907
+3083467 29907
+3083468 29907
+3083469 29907
+3083470 29907
+3083471 29907
+3083472 29907
+6397582 29907
+6397583 29907
+6397584 29907
+6397585 29907
+6397586 29907
+6397587 29907
+6397588 29907
+6397589 29907
+6397590 29907
+6397591 29907
+6397592 29907
+6397593 29907
+6397594 29907
+6397595 29907
+6397596 29907
+6397597 29907
+6397598 29907
+6397599 29907
+6397600 29907
+9711710 29907
+9711711 29907
+9711712 29907
+9711713 29907
+9711714 29907
+9711715 29907
+9711716 29907
+9711717 29907
+9711718 29907
+9711719 29907
+9711720 29907
+9711721 29907
+9711722 29907
+9711723 29907
+9711724 29907
+9711725 29907
+9711726 29907
+9711727 29907
+9711728 29907
+13025838 29907
+13025839 29907
+13025840 29907
+13025841 29907
+13025842 29907
+13025843 29907
+13025844 29907
+13025845 29907
+13025846 29907
+13025847 29907
+13025848 29907
+13025849 29907
+13025850 29907
+13025851 29907
+13025852 29907
+13025853 29907
+13025854 29907
+13025855 29907
+13025856 29907
+16339966 29907
+16339967 29907
+16339968 29907
+16339969 29907
+16339970 29907
+16339971 29907
+16339972 29907
+16339973 29907
+16339974 29907
+16339975 29907
+16339976 29907
+16339977 29907
+16339978 29907
+16339979 29907
+16339980 29907
+16339981 29907
+16339982 29907
+16339983 29907
+16339984 29907
+19654094 29907
+19654095 29907
+19654096 29907
+19654097 29907
+19654098 29907
+19654099 29907
+19654100 29907
+19654101 29907
+19654102 29907
+19654103 29907
+19654104 29907
+19654105 29907
+19654106 29907
+19654107 29907
+19654108 29907
+19654109 29907
+19654110 29907
+19654111 29907
+19654112 29907
+22968222 29907
+22968223 29907
+22968224 29907
+22968225 29907
+22968226 29907
+22968227 29907
+22968228 29907
+22968229 29907
+22968230 29907
+22968231 29907
+22968232 29907
+22968233 29907
+22968234 29907
+22968235 29907
+22968236 29907
+22968237 29907
+22968238 29907
+22968239 29907
+22968240 29907
+26282350 29907
+26282351 29907
+26282352 29907
+26282353 29907
+26282354 29907
+26282355 29907
+26282356 29907
+26282357 29907
+26282358 29907
+26282359 29907
+26282360 29907
+26282361 29907
+26282362 29907
+26282363 29907
+26282364 29907
+26282365 29907
+26282366 29907
+26282367 29907
+26282368 299073083454 29907
+3083455 29907
+3083456 29907
+3083457 29907
+3083458 29907
+3083459 29907
+3083460 29907
+3083461 29907
+3083462 29907
+3083463 29907
+3083464 29907
+3083465 29907
+3083466 29907
+3083467 29907
+3083468 29907
+3083469 29907
+3083470 29907
+3083471 29907
+3083472 29907
b
diff -r 000000000000 -r 7b382efabb98 test-data/test-db/GTDB_names.dmp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test-db/GTDB_names.dmp Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,45503 @@\n+1\t|\troot\t|\t-\t|\tscientific name\t|\n+2\t|\tBacteria\t|\t-\t|\tscientific name\t|\n+3\t|\tProteobacteria\t|\t-\t|\tscientific name\t|\n+4\t|\tGammaproteobacteria\t|\t-\t|\tscientific name\t|\n+5\t|\tEnterobacterales\t|\t-\t|\tscientific name\t|\n+6\t|\tEnterobacteriaceae\t|\t-\t|\tscientific name\t|\n+7\t|\tEscherichia\t|\t-\t|\tscientific name\t|\n+8\t|\tEscherichia flexneri\t|\t-\t|\tscientific name\t|\n+9\t|\tSalmonella\t|\t-\t|\tscientific name\t|\n+10\t|\tSalmonella enterica\t|\t-\t|\tscientific name\t|\n+11\t|\tFirmicutes\t|\t-\t|\tscientific name\t|\n+12\t|\tBacilli\t|\t-\t|\tscientific name\t|\n+13\t|\tStaphylococcales\t|\t-\t|\tscientific name\t|\n+14\t|\tStaphylococcaceae\t|\t-\t|\tscientific name\t|\n+15\t|\tStaphylococcus\t|\t-\t|\tscientific name\t|\n+16\t|\tStaphylococcus aureus\t|\t-\t|\tscientific name\t|\n+17\t|\tLactobacillales\t|\t-\t|\tscientific name\t|\n+18\t|\tStreptococcaceae\t|\t-\t|\tscientific name\t|\n+19\t|\tStreptococcus\t|\t-\t|\tscientific name\t|\n+20\t|\tStreptococcus pneumoniae\t|\t-\t|\tscientific name\t|\n+21\t|\tKlebsiella\t|\t-\t|\tscientific name\t|\n+22\t|\tKlebsiella pneumoniae\t|\t-\t|\tscientific name\t|\n+23\t|\tActinobacteriota\t|\t-\t|\tscientific name\t|\n+24\t|\tActinomycetia\t|\t-\t|\tscientific name\t|\n+25\t|\tMycobacteriales\t|\t-\t|\tscientific name\t|\n+26\t|\tMycobacteriaceae\t|\t-\t|\tscientific name\t|\n+27\t|\tMycobacterium\t|\t-\t|\tscientific name\t|\n+28\t|\tMycobacterium tuberculosis\t|\t-\t|\tscientific name\t|\n+29\t|\tPseudomonadales\t|\t-\t|\tscientific name\t|\n+30\t|\tPseudomonadaceae\t|\t-\t|\tscientific name\t|\n+31\t|\tPseudomonas\t|\t-\t|\tscientific name\t|\n+32\t|\tPseudomonas aeruginosa\t|\t-\t|\tscientific name\t|\n+33\t|\tMoraxellaceae\t|\t-\t|\tscientific name\t|\n+34\t|\tAcinetobacter\t|\t-\t|\tscientific name\t|\n+35\t|\tAcinetobacter baumannii\t|\t-\t|\tscientific name\t|\n+36\t|\tEscherichia coli\t|\t-\t|\tscientific name\t|\n+37\t|\tFirmicutes 
A\t|\t-\t|\tscientific name\t|\n+38\t|\tClostridia\t|\t-\t|\tscientific name\t|\n+39\t|\tPeptostreptococcales\t|\t-\t|\tscientific name\t|\n+40\t|\tPeptostreptococcaceae\t|\t-\t|\tscientific name\t|\n+41\t|\tClostridioides\t|\t-\t|\tscientific name\t|\n+42\t|\tClostridioides difficile\t|\t-\t|\tscientific name\t|\n+43\t|\tBurkholderiales\t|\t-\t|\tscientific name\t|\n+44\t|\tNeisseriaceae\t|\t-\t|\tscientific name\t|\n+45\t|\tNeisseria\t|\t-\t|\tscientific name\t|\n+46\t|\tNeisseria meningitidis\t|\t-\t|\tscientific name\t|\n+47\t|\tStreptococcus pyogenes\t|\t-\t|\tscientific name\t|\n+48\t|\tEscherichia dysenteriae\t|\t-\t|\tscientific name\t|\n+49\t|\tEscherichia coli D\t|\t-\t|\tscientific name\t|\n+50\t|\tMycobacterium abscessus\t|\t-\t|\tscientific name\t|\n+51\t|\tBurkholderiaceae\t|\t-\t|\tscientific name\t|\n+52\t|\tBurkholderia\t|\t-\t|\tscientific name\t|\n+53\t|\tBurkholderia mallei\t|\t-\t|\tscientific name\t|\n+54\t|\tListeriaceae\t|\t-\t|\tscientific name\t|\n+55\t|\tListeria\t|\t-\t|\tscientific name\t|\n+56\t|\tListeria monocytogenes\t|\t-\t|\tscientific name\t|\n+57\t|\tCampylobacterota\t|\t-\t|\tscientific name\t|\n+58\t|\tCampylobacteria\t|\t-\t|\tscientific name\t|\n+59\t|\tCampylobacterales\t|\t-\t|\tscientific name\t|\n+60\t|\tCampylobacteraceae\t|\t-\t|\tscientific name\t|\n+61\t|\tCampylobacter D\t|\t-\t|\tscientific name\t|\n+62\t|\tCampylobacter D jejuni\t|\t-\t|\tscientific name\t|\n+63\t|\tEnterococcaceae\t|\t-\t|\tscientific name\t|\n+64\t|\tEnterococcus B\t|\t-\t|\tscientific name\t|\n+65\t|\tEnterococcus B faecium\t|\t-\t|\tscientific name\t|\n+66\t|\tEnterococcus\t|\t-\t|\tscientific name\t|\n+67\t|\tEnterococcus faecalis\t|\t-\t|\tscientific name\t|\n+68\t|\tPseudomonas E\t|\t-\t|\tscientific name\t|\n+69\t|\tPseudomonas E viridiflava\t|\t-\t|\tscientific name\t|\n+70\t|\tVibrionaceae\t|\t-\t|\tscientific name\t|\n+71\t|\tVibrio\t|\t-\t|\tscientific name\t|\n+72\t|\tVibrio parahaemolyticus\t|\t-\t|\tscientific 
name\t|\n+73\t|\tListeria monocytogenes B\t|\t-\t|\tscientific name\t|\n+74\t|\tStreptococcus agalactiae\t|\t-\t|\tscientific name\t|\n+75\t|\tEnterobacter\t|\t-\t|\tscientific name\t|\n+76\t|\tEnterobacter himalayensis\t|\t-\t|\tscientific name\t|\n+77\t|\tStreptococcus suis\t|\t-\t|\tscientific name\t|\n+78\t|\tVibrio cholerae\t|\t-\t|\tscientific name\t|\n+79\t|\tBordetella\t|\t-\t|\tscientific name\t|\n+80\t|\tBordetella pertussis\t|\t-\t|\tscientific name\t|\n+81\t|\tHelicobacteraceae\t|\t-\t|\tscientific name\t|\n+82\t|\tHelicobacter\t|\t-\t|\tscientific name\t|\n+83\t|\tHelicobacter pylori\t|\t-\t|\tscientific name\t|\n+84\t|\tCampylobacter D coli\t|\t-\t|\tscientific name\t|\n+85\t|\tLegionella'..b'fic name\t|\n+45429\t|\tMethanoregula sp002497485\t|\t-\t|\tscientific name\t|\n+45430\t|\tHaloterrigena salina\t|\t-\t|\tscientific name\t|\n+45431\t|\tFerroglobus\t|\t-\t|\tscientific name\t|\n+45432\t|\tFerroglobus placidus\t|\t-\t|\tscientific name\t|\n+45433\t|\tThermococcus A sp001484685\t|\t-\t|\tscientific name\t|\n+45434\t|\tNatronococcus occultus\t|\t-\t|\tscientific name\t|\n+45435\t|\tCBA1134 sp003021175\t|\t-\t|\tscientific name\t|\n+45436\t|\tHalorientalis persicus\t|\t-\t|\tscientific name\t|\n+45437\t|\tNanoarchaeaceae\t|\t-\t|\tscientific name\t|\n+45438\t|\tNanoarchaeum\t|\t-\t|\tscientific name\t|\n+45439\t|\tNanoarchaeum equitans\t|\t-\t|\tscientific name\t|\n+45440\t|\tB23\t|\t-\t|\tscientific name\t|\n+45441\t|\tB23 sp001593875\t|\t-\t|\tscientific name\t|\n+45442\t|\tB63 sp003601695\t|\t-\t|\tscientific name\t|\n+45443\t|\tPyrobaculum arsenaticum\t|\t-\t|\tscientific name\t|\n+45444\t|\tARS1285 sp002688335\t|\t-\t|\tscientific name\t|\n+45445\t|\tBMS3B sp002897955\t|\t-\t|\tscientific name\t|\n+45446\t|\tMethanomassiliicoccus sp002067635\t|\t-\t|\tscientific name\t|\n+45447\t|\tMethanofastidiosum sp9950u\t|\t-\t|\tscientific name\t|\n+45448\t|\tHalorubrum sp000296615\t|\t-\t|\tscientific name\t|\n+45449\t|\tRBG-16-57-9 
sp001775965\t|\t-\t|\tscientific name\t|\n+45450\t|\tHalolamina rubra\t|\t-\t|\tscientific name\t|\n+45451\t|\tHalolamina pelagica B\t|\t-\t|\tscientific name\t|\n+45452\t|\tUBA153 sp003694385\t|\t-\t|\tscientific name\t|\n+45453\t|\t40CM-2-53-6 sp005888635\t|\t-\t|\tscientific name\t|\n+45454\t|\tMP8T-1 sp004524595\t|\t-\t|\tscientific name\t|\n+45455\t|\tSKXI01 sp007128515\t|\t-\t|\tscientific name\t|\n+45456\t|\tMGIIb-O5 sp002726275\t|\t-\t|\tscientific name\t|\n+45457\t|\tNitrosopumilus salaria\t|\t-\t|\tscientific name\t|\n+45458\t|\tMGIIa-K1 sp002701145\t|\t-\t|\tscientific name\t|\n+45459\t|\tMethanofastidiosum sp001587675\t|\t-\t|\tscientific name\t|\n+45460\t|\t40CM-2-53-6 sp005881695\t|\t-\t|\tscientific name\t|\n+45461\t|\tNitrosarchaeum sp003569705\t|\t-\t|\tscientific name\t|\n+45462\t|\tThermococcus gorgonarius\t|\t-\t|\tscientific name\t|\n+45463\t|\tMethanoculleus sp000691865\t|\t-\t|\tscientific name\t|\n+45464\t|\tHalobellus sp003665925\t|\t-\t|\tscientific name\t|\n+45465\t|\tSMTZ1-45 sp004376265\t|\t-\t|\tscientific name\t|\n+45466\t|\tNitrosopumilus sediminis\t|\t-\t|\tscientific name\t|\n+45467\t|\tStaphylothermus hellenicus\t|\t-\t|\tscientific name\t|\n+45468\t|\tMethanomethylovorans sp001896725\t|\t-\t|\tscientific name\t|\n+45469\t|\tMGIIb-O3 sp002731195\t|\t-\t|\tscientific name\t|\n+45470\t|\tMethanocaldococcus A infernus\t|\t-\t|\tscientific name\t|\n+45471\t|\tMethanobrevibacter A sp900320955\t|\t-\t|\tscientific name\t|\n+45472\t|\tXQ-INN-246\t|\t-\t|\tscientific name\t|\n+45473\t|\tXQ-INN-246 sp006543045\t|\t-\t|\tscientific name\t|\n+45474\t|\tMGIIa-L3 sp002694585\t|\t-\t|\tscientific name\t|\n+45475\t|\tNitrosopumilus sp006740685\t|\t-\t|\tscientific name\t|\n+45476\t|\tHalorussus rarus\t|\t-\t|\tscientific name\t|\n+45477\t|\tB75-G9\t|\t-\t|\tscientific name\t|\n+45478\t|\tB75-G9 sp003661465\t|\t-\t|\tscientific name\t|\n+45479\t|\tJdFR-22\t|\t-\t|\tscientific name\t|\n+45480\t|\tJdFR-22 sp002010045\t|\t-\t|\tscientific 
name\t|\n+45481\t|\tHalogranum sp004116405\t|\t-\t|\tscientific name\t|\n+45482\t|\tHalorussus amylolyticus\t|\t-\t|\tscientific name\t|\n+45483\t|\tNitrosopumilus sp002788515\t|\t-\t|\tscientific name\t|\n+45484\t|\tEX4572-165\t|\t-\t|\tscientific name\t|\n+45485\t|\tEX4572-165 sp002254885\t|\t-\t|\tscientific name\t|\n+45486\t|\tB47-G15\t|\t-\t|\tscientific name\t|\n+45487\t|\tB47-G15\t|\t-\t|\tscientific name\t|\n+45488\t|\tB47-G15 sp003660975\t|\t-\t|\tscientific name\t|\n+45489\t|\tThalassarchaeum sp002727275\t|\t-\t|\tscientific name\t|\n+45490\t|\tQENH01\t|\t-\t|\tscientific name\t|\n+45491\t|\tQENH01 sp003336485\t|\t-\t|\tscientific name\t|\n+45492\t|\tHEL-GB-A\t|\t-\t|\tscientific name\t|\n+45493\t|\tHEL-GB-A\t|\t-\t|\tscientific name\t|\n+45494\t|\tHEL-GB-A sp005191415\t|\t-\t|\tscientific name\t|\n+45495\t|\tHalonotius sp006861665\t|\t-\t|\tscientific name\t|\n+45496\t|\tNatrinema salaciae\t|\t-\t|\tscientific name\t|\n+45497\t|\tSBBD01\t|\t-\t|\tscientific name\t|\n+45498\t|\tSBBD01\t|\t-\t|\tscientific name\t|\n+45499\t|\tSBBD01 sp005239845\t|\t-\t|\tscientific name\t|\n+45500\t|\tGW2011-AR5 sp10154u\t|\t-\t|\tscientific name\t|\n+45501\t|\tMethanotorris formicicus\t|\t-\t|\tscientific name\t|\n+45502\t|\tHaladaptatus cibarius\t|\t-\t|\tscientific name\t|\n+45503\t|\tDTU008 sp002498285\t|\t-\t|\tscientific name\t|\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/test-db/GTDB_nodes.dmp
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test-db/GTDB_nodes.dmp Fri Oct 14 21:38:26 2022 +0000
b
b'@@ -0,0 +1,45503 @@\n+1\t|\t1\t|\tno rank\t|\t-\t|\n+2\t|\t1\t|\tsuperkingdom\t|\t-\t|\n+3\t|\t2\t|\tphylum\t|\t-\t|\n+4\t|\t3\t|\tclass\t|\t-\t|\n+5\t|\t4\t|\torder\t|\t-\t|\n+6\t|\t5\t|\tfamily\t|\t-\t|\n+7\t|\t6\t|\tgenus\t|\t-\t|\n+8\t|\t7\t|\tspecies\t|\t-\t|\n+9\t|\t6\t|\tgenus\t|\t-\t|\n+10\t|\t9\t|\tspecies\t|\t-\t|\n+11\t|\t2\t|\tphylum\t|\t-\t|\n+12\t|\t11\t|\tclass\t|\t-\t|\n+13\t|\t12\t|\torder\t|\t-\t|\n+14\t|\t13\t|\tfamily\t|\t-\t|\n+15\t|\t14\t|\tgenus\t|\t-\t|\n+16\t|\t15\t|\tspecies\t|\t-\t|\n+17\t|\t12\t|\torder\t|\t-\t|\n+18\t|\t17\t|\tfamily\t|\t-\t|\n+19\t|\t18\t|\tgenus\t|\t-\t|\n+20\t|\t19\t|\tspecies\t|\t-\t|\n+21\t|\t6\t|\tgenus\t|\t-\t|\n+22\t|\t21\t|\tspecies\t|\t-\t|\n+23\t|\t2\t|\tphylum\t|\t-\t|\n+24\t|\t23\t|\tclass\t|\t-\t|\n+25\t|\t24\t|\torder\t|\t-\t|\n+26\t|\t25\t|\tfamily\t|\t-\t|\n+27\t|\t26\t|\tgenus\t|\t-\t|\n+28\t|\t27\t|\tspecies\t|\t-\t|\n+29\t|\t4\t|\torder\t|\t-\t|\n+30\t|\t29\t|\tfamily\t|\t-\t|\n+31\t|\t30\t|\tgenus\t|\t-\t|\n+32\t|\t31\t|\tspecies\t|\t-\t|\n+33\t|\t29\t|\tfamily\t|\t-\t|\n+34\t|\t33\t|\tgenus\t|\t-\t|\n+35\t|\t34\t|\tspecies\t|\t-\t|\n+36\t|\t7\t|\tspecies\t|\t-\t|\n+37\t|\t2\t|\tphylum\t|\t-\t|\n+38\t|\t37\t|\tclass\t|\t-\t|\n+39\t|\t38\t|\torder\t|\t-\t|\n+40\t|\t39\t|\tfamily\t|\t-\t|\n+41\t|\t40\t|\tgenus\t|\t-\t|\n+42\t|\t41\t|\tspecies\t|\t-\t|\n+43\t|\t4\t|\torder\t|\t-\t|\n+44\t|\t43\t|\tfamily\t|\t-\t|\n+45\t|\t44\t|\tgenus\t|\t-\t|\n+46\t|\t45\t|\tspecies\t|\t-\t|\n+47\t|\t19\t|\tspecies\t|\t-\t|\n+48\t|\t7\t|\tspecies\t|\t-\t|\n+49\t|\t7\t|\tspecies\t|\t-\t|\n+50\t|\t27\t|\tspecies\t|\t-\t|\n+51\t|\t43\t|\tfamily\t|\t-\t|\n+52\t|\t51\t|\tgenus\t|\t-\t|\n+53\t|\t52\t|\tspecies\t|\t-\t|\n+54\t|\t17\t|\tfamily\t|\t-\t|\n+55\t|\t54\t|\tgenus\t|\t-\t|\n+56\t|\t55\t|\tspecies\t|\t-\t|\n+57\t|\t2\t|\tphylum\t|\t-\t|\n+58\t|\t57\t|\tclass\t|\t-\t|\n+59\t|\t58\t|\torder\t|\t-\t|\n+60\t|\t59\t|\tfamily\t|\t-\t|\n+61\t|\t60\t|\tgenus\t|\t-\t|\n+62\t|\t61\t|\tspecies\t|\t-\t|\n+63\t|\t17\t|\tfamily\t
|\t-\t|\n+64\t|\t63\t|\tgenus\t|\t-\t|\n+65\t|\t64\t|\tspecies\t|\t-\t|\n+66\t|\t63\t|\tgenus\t|\t-\t|\n+67\t|\t66\t|\tspecies\t|\t-\t|\n+68\t|\t30\t|\tgenus\t|\t-\t|\n+69\t|\t68\t|\tspecies\t|\t-\t|\n+70\t|\t5\t|\tfamily\t|\t-\t|\n+71\t|\t70\t|\tgenus\t|\t-\t|\n+72\t|\t71\t|\tspecies\t|\t-\t|\n+73\t|\t55\t|\tspecies\t|\t-\t|\n+74\t|\t19\t|\tspecies\t|\t-\t|\n+75\t|\t6\t|\tgenus\t|\t-\t|\n+76\t|\t75\t|\tspecies\t|\t-\t|\n+77\t|\t19\t|\tspecies\t|\t-\t|\n+78\t|\t71\t|\tspecies\t|\t-\t|\n+79\t|\t51\t|\tgenus\t|\t-\t|\n+80\t|\t79\t|\tspecies\t|\t-\t|\n+81\t|\t59\t|\tfamily\t|\t-\t|\n+82\t|\t81\t|\tgenus\t|\t-\t|\n+83\t|\t82\t|\tspecies\t|\t-\t|\n+84\t|\t61\t|\tspecies\t|\t-\t|\n+85\t|\t4\t|\torder\t|\t-\t|\n+86\t|\t85\t|\tfamily\t|\t-\t|\n+87\t|\t86\t|\tgenus\t|\t-\t|\n+88\t|\t87\t|\tspecies\t|\t-\t|\n+89\t|\t3\t|\tclass\t|\t-\t|\n+90\t|\t89\t|\torder\t|\t-\t|\n+91\t|\t90\t|\tfamily\t|\t-\t|\n+92\t|\t91\t|\tgenus\t|\t-\t|\n+93\t|\t92\t|\tspecies\t|\t-\t|\n+94\t|\t45\t|\tspecies\t|\t-\t|\n+95\t|\t5\t|\tfamily\t|\t-\t|\n+96\t|\t95\t|\tgenus\t|\t-\t|\n+97\t|\t96\t|\tspecies\t|\t-\t|\n+98\t|\t15\t|\tspecies\t|\t-\t|\n+99\t|\t12\t|\torder\t|\t-\t|\n+100\t|\t99\t|\tfamily\t|\t-\t|\n+101\t|\t100\t|\tgenus\t|\t-\t|\n+102\t|\t101\t|\tspecies\t|\t-\t|\n+103\t|\t17\t|\tfamily\t|\t-\t|\n+104\t|\t103\t|\tgenus\t|\t-\t|\n+105\t|\t104\t|\tspecies\t|\t-\t|\n+106\t|\t21\t|\tspecies\t|\t-\t|\n+107\t|\t6\t|\tgenus\t|\t-\t|\n+108\t|\t107\t|\tspecies\t|\t-\t|\n+109\t|\t6\t|\tgenus\t|\t-\t|\n+110\t|\t109\t|\tspecies\t|\t-\t|\n+111\t|\t6\t|\tgenus\t|\t-\t|\n+112\t|\t111\t|\tspecies\t|\t-\t|\n+113\t|\t21\t|\tspecies\t|\t-\t|\n+114\t|\t4\t|\torder\t|\t-\t|\n+115\t|\t114\t|\tfamily\t|\t-\t|\n+116\t|\t115\t|\tgenus\t|\t-\t|\n+117\t|\t116\t|\tspecies\t|\t-\t|\n+118\t|\t82\t|\tspecies\t|\t-\t|\n+119\t|\t52\t|\tspecies\t|\t-\t|\n+120\t|\t2\t|\tphylum\t|\t-\t|\n+121\t|\t120\t|\tclass\t|\t-\t|\n+122\t|\t121\t|\torder\t|\t-\t|\n+123\t|\t122\t|\tfamily\t|\t-\t|\n+124\t|\t123\t|\tgenus\t|\t-\t|\n+125\t|
\t124\t|\tspecies\t|\t-\t|\n+126\t|\t24\t|\torder\t|\t-\t|\n+127\t|\t126\t|\tfamily\t|\t-\t|\n+128\t|\t127\t|\tgenus\t|\t-\t|\n+129\t|\t128\t|\tspecies\t|\t-\t|\n+130\t|\t24\t|\torder\t|\t-\t|\n+131\t|\t130\t|\tfamily\t|\t-\t|\n+132\t|\t131\t|\tgenus\t|\t-\t|\n+133\t|\t132\t|\tspecies\t|\t-\t|\n+134\t|\t101\t|\tspecies\t|\t-\t|\n+135\t|\t19\t|\tspecies\t|\t-\t|\n+136\t|\t15\t|\tspecies\t|\t-\t|\n+137\t|\t99\t|\tfamily\t|\t-\t|\n+138\t|\t137\t|\tgenus\t|\t-\t|\n+139\t|\t138\t|\tspecies\t|\t-\t|\n+140\t|\t138\t|\tspecies\t|\t-\t|\n+141\t|\t34\t|\tspecies\t|\t-\t|\n+142\t|\t68\t|\tspecies\t|\t-\t|\n+143\t|\t82\t|\tspecies\t|\t-\t|\n+144\t|\t4\t|\torder\t|\t-\t|\n+145\t|\t144\t|\tfamily\t|\t-\t|\n+146\t|\t145\t|\tgenus\t|\t-\t|\n+147\t|\t146\t|\tspecies\t|\t-\t|\n+148\t|\t52\t|\tspecies\t|\t-\t|\n+149\t|\t101\t|\tspecies\t|\t-\t|\n+150\t|\t26\t|\tgenus\t|\t-\t|\n+151\t|\t150\t|\tspecies\t|\t-\t|\n+152\t|\t103\t|\tgenus\t|\t-\t|\n+153\t|\t152\t|\tspecies\t|\t-\t|\n+154\t|\t15\t|\tspecies\t|\t-\t|\n+155\t|\t101\t|\tspecies\t|\t-\t|\n+156\t|\t68\t|\tspecies\t|\t-\t|\n+157\t|\t91\t|\tgenus\t|\t-\t|\n+158\t|\t157\t|\tspecies\t|\t-\t|\n+159\t|\t6\t|\tgenus\t|\t-\t|\n+160\t|\t159\t|\tspecies\t|\t-\t|\n+161\t|\t101\t|\tspecies\t|\t-\t|\n+162\t|\t116\t|\tspecies\t|\t-\t|\n+163\t|\t91\t|\tgenus\t'..b'73\t|\t45372\t|\tspecies\t|\t-\t|\n+45374\t|\t43770\t|\tgenus\t|\t-\t|\n+45375\t|\t45374\t|\tspecies\t|\t-\t|\n+45376\t|\t44150\t|\tspecies\t|\t-\t|\n+45377\t|\t43948\t|\tspecies\t|\t-\t|\n+45378\t|\t44076\t|\tspecies\t|\t-\t|\n+45379\t|\t42838\t|\tspecies\t|\t-\t|\n+45380\t|\t42969\t|\tspecies\t|\t-\t|\n+45381\t|\t42895\t|\tgenus\t|\t-\t|\n+45382\t|\t45381\t|\tspecies\t|\t-\t|\n+45383\t|\t43564\t|\tspecies\t|\t-\t|\n+45384\t|\t43249\t|\tfamily\t|\t-\t|\n+45385\t|\t45384\t|\tgenus\t|\t-\t|\n+45386\t|\t45385\t|\tspecies\t|\t-\t|\n+45387\t|\t44252\t|\tgenus\t|\t-\t|\n+45388\t|\t45387\t|\tspecies\t|\t-\t|\n+45389\t|\t43676\t|\tspecies\t|\t-\t|\n+45390\t|\t43296\t|\tspecies\t|\t-\t|\n+45
391\t|\t43060\t|\tspecies\t|\t-\t|\n+45392\t|\t43092\t|\tspecies\t|\t-\t|\n+45393\t|\t43315\t|\tspecies\t|\t-\t|\n+45394\t|\t42894\t|\tfamily\t|\t-\t|\n+45395\t|\t45394\t|\tgenus\t|\t-\t|\n+45396\t|\t45395\t|\tspecies\t|\t-\t|\n+45397\t|\t43237\t|\tspecies\t|\t-\t|\n+45398\t|\t43347\t|\tspecies\t|\t-\t|\n+45399\t|\t43078\t|\tspecies\t|\t-\t|\n+45400\t|\t43041\t|\tspecies\t|\t-\t|\n+45401\t|\t43450\t|\torder\t|\t-\t|\n+45402\t|\t45401\t|\tfamily\t|\t-\t|\n+45403\t|\t45402\t|\tgenus\t|\t-\t|\n+45404\t|\t45403\t|\tspecies\t|\t-\t|\n+45405\t|\t42763\t|\tgenus\t|\t-\t|\n+45406\t|\t45405\t|\tspecies\t|\t-\t|\n+45407\t|\t42922\t|\tfamily\t|\t-\t|\n+45408\t|\t45407\t|\tgenus\t|\t-\t|\n+45409\t|\t45408\t|\tspecies\t|\t-\t|\n+45410\t|\t43365\t|\tspecies\t|\t-\t|\n+45411\t|\t44666\t|\tspecies\t|\t-\t|\n+45412\t|\t43085\t|\tgenus\t|\t-\t|\n+45413\t|\t45412\t|\tspecies\t|\t-\t|\n+45414\t|\t43645\t|\tspecies\t|\t-\t|\n+45415\t|\t42902\t|\tfamily\t|\t-\t|\n+45416\t|\t45415\t|\tgenus\t|\t-\t|\n+45417\t|\t45416\t|\tspecies\t|\t-\t|\n+45418\t|\t43446\t|\tspecies\t|\t-\t|\n+45419\t|\t44906\t|\tspecies\t|\t-\t|\n+45420\t|\t42859\t|\torder\t|\t-\t|\n+45421\t|\t45420\t|\tfamily\t|\t-\t|\n+45422\t|\t45421\t|\tgenus\t|\t-\t|\n+45423\t|\t45422\t|\tspecies\t|\t-\t|\n+45424\t|\t43358\t|\tspecies\t|\t-\t|\n+45425\t|\t43038\t|\tspecies\t|\t-\t|\n+45426\t|\t42948\t|\tspecies\t|\t-\t|\n+45427\t|\t43135\t|\tspecies\t|\t-\t|\n+45428\t|\t44666\t|\tspecies\t|\t-\t|\n+45429\t|\t42936\t|\tspecies\t|\t-\t|\n+45430\t|\t44076\t|\tspecies\t|\t-\t|\n+45431\t|\t42957\t|\tgenus\t|\t-\t|\n+45432\t|\t45431\t|\tspecies\t|\t-\t|\n+45433\t|\t43058\t|\tspecies\t|\t-\t|\n+45434\t|\t43019\t|\tspecies\t|\t-\t|\n+45435\t|\t43253\t|\tspecies\t|\t-\t|\n+45436\t|\t44515\t|\tspecies\t|\t-\t|\n+45437\t|\t43262\t|\tfamily\t|\t-\t|\n+45438\t|\t45437\t|\tgenus\t|\t-\t|\n+45439\t|\t45438\t|\tspecies\t|\t-\t|\n+45440\t|\t43960\t|\tgenus\t|\t-\t|\n+45441\t|\t45440\t|\tspecies\t|\t-\t|\n+45442\t|\t43782\t|\tspecies\t|\t-\t|\n+4544
3\t|\t43003\t|\tspecies\t|\t-\t|\n+45444\t|\t44799\t|\tspecies\t|\t-\t|\n+45445\t|\t43637\t|\tspecies\t|\t-\t|\n+45446\t|\t43098\t|\tspecies\t|\t-\t|\n+45447\t|\t43155\t|\tspecies\t|\t-\t|\n+45448\t|\t42775\t|\tspecies\t|\t-\t|\n+45449\t|\t44926\t|\tspecies\t|\t-\t|\n+45450\t|\t44666\t|\tspecies\t|\t-\t|\n+45451\t|\t44666\t|\tspecies\t|\t-\t|\n+45452\t|\t44028\t|\tspecies\t|\t-\t|\n+45453\t|\t43078\t|\tspecies\t|\t-\t|\n+45454\t|\t44207\t|\tspecies\t|\t-\t|\n+45455\t|\t43588\t|\tspecies\t|\t-\t|\n+45456\t|\t42826\t|\tspecies\t|\t-\t|\n+45457\t|\t42854\t|\tspecies\t|\t-\t|\n+45458\t|\t43135\t|\tspecies\t|\t-\t|\n+45459\t|\t43155\t|\tspecies\t|\t-\t|\n+45460\t|\t43078\t|\tspecies\t|\t-\t|\n+45461\t|\t43036\t|\tspecies\t|\t-\t|\n+45462\t|\t43237\t|\tspecies\t|\t-\t|\n+45463\t|\t42794\t|\tspecies\t|\t-\t|\n+45464\t|\t43317\t|\tspecies\t|\t-\t|\n+45465\t|\t43976\t|\tspecies\t|\t-\t|\n+45466\t|\t42854\t|\tspecies\t|\t-\t|\n+45467\t|\t44494\t|\tspecies\t|\t-\t|\n+45468\t|\t43138\t|\tspecies\t|\t-\t|\n+45469\t|\t42920\t|\tspecies\t|\t-\t|\n+45470\t|\t43354\t|\tspecies\t|\t-\t|\n+45471\t|\t42783\t|\tspecies\t|\t-\t|\n+45472\t|\t43018\t|\tgenus\t|\t-\t|\n+45473\t|\t45472\t|\tspecies\t|\t-\t|\n+45474\t|\t42978\t|\tspecies\t|\t-\t|\n+45475\t|\t42854\t|\tspecies\t|\t-\t|\n+45476\t|\t43658\t|\tspecies\t|\t-\t|\n+45477\t|\t44085\t|\tgenus\t|\t-\t|\n+45478\t|\t45477\t|\tspecies\t|\t-\t|\n+45479\t|\t42957\t|\tgenus\t|\t-\t|\n+45480\t|\t45479\t|\tspecies\t|\t-\t|\n+45481\t|\t43468\t|\tspecies\t|\t-\t|\n+45482\t|\t43658\t|\tspecies\t|\t-\t|\n+45483\t|\t42854\t|\tspecies\t|\t-\t|\n+45484\t|\t42903\t|\tgenus\t|\t-\t|\n+45485\t|\t45484\t|\tspecies\t|\t-\t|\n+45486\t|\t44078\t|\tfamily\t|\t-\t|\n+45487\t|\t45486\t|\tgenus\t|\t-\t|\n+45488\t|\t45487\t|\tspecies\t|\t-\t|\n+45489\t|\t42828\t|\tspecies\t|\t-\t|\n+45490\t|\t43731\t|\tgenus\t|\t-\t|\n+45491\t|\t45490\t|\tspecies\t|\t-\t|\n+45492\t|\t45401\t|\tfamily\t|\t-\t|\n+45493\t|\t45492\t|\tgenus\t|\t-\t|\n+45494\t|\t45493\t|\tspecies\t|\
t-\t|\n+45495\t|\t43425\t|\tspecies\t|\t-\t|\n+45496\t|\t43092\t|\tspecies\t|\t-\t|\n+45497\t|\t42886\t|\tfamily\t|\t-\t|\n+45498\t|\t45497\t|\tgenus\t|\t-\t|\n+45499\t|\t45498\t|\tspecies\t|\t-\t|\n+45500\t|\t44552\t|\tspecies\t|\t-\t|\n+45501\t|\t44073\t|\tspecies\t|\t-\t|\n+45502\t|\t43006\t|\tspecies\t|\t-\t|\n+45503\t|\t42810\t|\tspecies\t|\t-\t|\n'
b
diff -r 000000000000 -r 7b382efabb98 test-data/test_database.loc
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/test_database.loc Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,6 @@
+# Tab separated with 4 columns:
+# - value (Galaxy records this in the Galaxy DB)
+# - name (Galaxy shows this in the UI)
+# - dbkey (build identifier of the database)
+# - path (folder name containing the GTDB database)
+test-db "Test Database" test-db ${__HERE__}/test-db
\ No newline at end of file
b
diff -r 000000000000 -r 7b382efabb98 tool-data/gtdb.loc.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool-data/gtdb.loc.sample Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,7 @@
+#This is a sample file distributed with Galaxy that enables tools
+#to use a directory of metagenomics files.
+#The file has this format (whitespace characters are TAB characters):
+# - db-build-version-date (column "value")
+# - db-name (column "name")
+# - build (column "dbkey")
+# - /path/to/data (column "path")
\ No newline at end of file
b
diff -r 000000000000 -r 7b382efabb98 tool_data_table_conf.xml.sample
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.sample Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,6 @@
+<tables>
+    <table name="gtdb" comment_char="#">
+        <columns>value, name, dbkey, path</columns>
+        <file path="tool-data/gtdb.loc" />
+    </table>
+</tables>
b
diff -r 000000000000 -r 7b382efabb98 tool_data_table_conf.xml.test
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/tool_data_table_conf.xml.test Fri Oct 14 21:38:26 2022 +0000
b
@@ -0,0 +1,6 @@
+<tables>
+    <table name="gtdb" comment_char="#">
+        <columns>value, name, dbkey, path</columns>
+        <file path="${__HERE__}/test-data/test_database.loc" />
+    </table>
+</tables>
\ No newline at end of file