Repository 'das_tool'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/das_tool

Changeset 0:a8e434ebe961 (2022-06-27)
Next changeset 1:edd3771cdb79 (2022-10-24)
Commit message:
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/das_tool commit 151c0e625ce20fb3ea75aa5043486e41b1da48de
added:
das_tool.xml
macros.xml
test-data/contigs.fasta
test-data/maxbin2.001.fasta
test-data/maxbin2.002.fasta
test-data/metabat.tabular
test-data/proteins.fasta
b
diff -r 000000000000 -r a8e434ebe961 das_tool.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/das_tool.xml Mon Jun 27 12:41:23 2022 +0000
[
b'@@ -0,0 +1,237 @@\n+<tool id="das_tool" name="DAS Tool" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@">\n+    <description>\n+        for genome resolved metagenomics\n+    </description>\n+    <macros>\n+        <import>macros.xml</import>\n+    </macros>\n+    <expand macro="biotools"/>\n+    <expand macro="requirements"/>\n+    <expand macro="version"/>\n+    <command detect_errors="exit_code"><![CDATA[\n+#set $bins = ""\n+#set $labels = ""\n+#set $sep = ""\n+#for $i, $s in enumerate($binning)\n+    #set $bins += "%s%s" %($sep, $s.bins)\n+    #set $labels += "%s%s" %($sep, $s.labels)\n+    #set $sep = ","\n+#end for\n+\n+#if $adv.proteins\n+ln -s $adv.proteins \'proteins\' &&\n+#end if\n+\n+DAS_Tool\n+    --contigs \'$contigs\'\n+    --outputbasename \'outputs\'\n+    --bins \'$bins\'\n+    --labels \'$labels\'\n+    --search_engine \'$adv.search_engine\'\n+#if $adv.proteins\n+    --proteins \'proteins\'\n+#end if\n+    --score_threshold $adv.score_threshold\n+    --duplicate_penalty $adv.duplicate_penalty\n+    --megabin_penalty $adv.megabin_penalty\n+    $output.write_bin_evals\n+    $output.write_bins.write_bins\n+#if str($output.write_bins.write_bins) != \'\'\n+    $output.write_bins.write_unbinned\n+#end if\n+    $output.debug\n+    --threads \\${GALAXY_SLOTS:-1}\n+    ]]></command>\n+    <inputs>\n+        <param argument="--contigs" type="data" format="fasta" label="Contig sequences"/>\n+        <repeat name="binning" title="Bins" min="1">\n+            <param argument="--bins" type="data" format="tabular" label="Contigs-to-bin table" help="Tabular with two columns: contig-IDs and bin-IDs. Fasta_to_Contigs2Bin can be used to  Converts genome bins in fasta format to Contigs-to-bin table"/>\n+            <param argument="--labels" type="text" value="" label="Name of binning prediction tool used to generate the table"/>\n+        </repeat>\n+        <section name="adv" title="Advanced options">\n+            <param argument="--search_engine" type="select" label="Engine used for single copy gene identification">\n+                <option value="diamond" selected="true">diamond</option>\n+                <option value="blastp">blastp</option>\n+            </param>\n+            <param argument="--proteins" type="data" format="fasta" optional="true" label="Predicted proteins" help="The file should be prodigal fasta format: >contigID_geneNo"/>\n+            <param argument="--score_threshold" type="float" min="0" max="1" value="0.5" label="Score threshold until selection algorithm will keep selecting bins"/>\n+            <param argument="--duplicate_penalty" type="float" min="0" max="3" value="0.6" label="Penalty for duplicate single copy genes per bin (weight b)" help="Only change if you know what you are doing"/>\n+            <param argument="--megabin_penalty" type="float" min="0" max="3" value="0.5" label="Penalty for megabins (weight c)" help="Only change if you know what you are doing"/>\n+        </section>\n+        <section name="output" title="Outputs">\n+            <param name="proteins" type="boolean" checked="false" label="Output predicted proteins?"/>\n+            <param argument="--write_bin_evals" type="boolean" truevalue="--write_bin_evals" falsevalue="" checked="false" label="Write evaluation of input bin sets?"/>\n+            <conditional name="write_bins">\n+                <param argument="--write_bins" type="select" label="Export bins as fasta files?">\n+                    <option value="--write_bins" selected="true">Yes</option>\n+                    <option value="">No</option>\n+                </param>\n+                <when value="--write_bins">\n+                    <param argument="--write_unbinned" type="boolean" truevalue="--write_unbinned" falsevalue="" checked="false" label="Export unbinned contigs as fasta file?"/>\n+                </when>\n+                <when value=""/>\n+            </conditional>\n+            <param argument="--debug" type="boolean" truevalue="--debug" falsevalue="" checked="false" label="Write debug information to log file?"'..b'Target sequences to report alignments for: 1"/>\n+                </assert_contents>\n+            </output>\n+            <output name="eval" ftype="tabular">\n+                <assert_contents>\n+                    <has_text text="unique_SCGs"/>\n+                    <has_text text="metabat.8"/>\n+                </assert_contents>\n+            </output>\n+        </test>\n+        <test expect_num_outputs="6">\n+            <param name="contigs" value="contigs.fasta"/>\n+            <repeat name="binning">\n+                <param name="bins" value="metabat.tabular"/>\n+                <param name="labels" value="metabat"/>\n+            </repeat>\n+            <section name="adv">\n+                <param name="search_engine" value="diamond"/>\n+                <param name="score_threshold" value="0.5"/>\n+                <param name="duplicate_penalty" value="0.6"/>\n+                <param name="megabin_penalty" value="0.5" />\n+            </section>\n+            <section name="output">\n+                <param name="proteins" value="true"/>\n+                <param name="write_bin_evals" value="false"/>\n+                <conditional name="write_bins">\n+                    <param name="write_bins" value="--write_bins"/>\n+                    <param name="write_unbinned" value="true"/>\n+                </conditional>\n+                <param name="debug" value="true"/>\n+            </section>\n+            <output name="summary" ftype="tabular">\n+                <assert_contents>\n+                    <has_text text="unique_SCGs"/>\n+                    <has_text text="metabat.8"/>\n+                    <has_text text="bacteria"/>\n+                </assert_contents>\n+            </output>\n+            <output name="contigs2bin" ftype="tabular">\n+                <assert_contents>\n+                    <has_text text="Ley3_66761_scaffold_6"/>\n+                </assert_contents>\n+            </output>\n+            <output name="log" ftype="txt">\n+                <assert_contents>\n+                    <has_text text="Parameters"/>\n+                    <has_text text="Predicting genes"/>\n+                </assert_contents>\n+            </output>\n+            <output_collection name="bins" count="1">\n+                <element name="8" ftype="fasta">\n+                    <assert_contents>\n+                        <has_text text=">Ley3_66761_scaffold_6"/>\n+                    </assert_contents>\n+                </element>\n+            </output_collection>\n+            <output name="unbinned_contigs" ftype="fasta">\n+                <assert_contents>\n+                    <has_text text=">Ley3_66761_scaffold_505"/>\n+                </assert_contents>\n+            </output>\n+            <output name="proteins" ftype="fasta">\n+                <assert_contents>\n+                    <has_text text="Ley3_66761_scaffold_6_1 # 1 # 786 # 1 #"/>\n+                </assert_contents>\n+            </output>\n+        </test>\n+    </tests>\n+    <help><![CDATA[\n+@HELP_HEADER@\n+\n+Inputs\n+======\n+\n+- Bins: Tab separated files of contig-IDs and bin-IDs. Contigs to bin file example: ::\n+\n+    Contig_1\tbin.01\n+    Contig_8\tbin.01\n+    Contig_42\tbin.02\n+    Contig_49\tbin.03\n+\n+- Contigs: Assembled contigs in fasta format: ::\n+\n+    >Contig_1\n+    ATCATCGTCCGCATCGACGAATTCGGCGAACGAGTACCCCTGACCATCTCCGATTA...\n+    >Contig_2\n+    GATCGTCACGCAGGCTATCGGAGCCTCGACCCGCAAGCTCTGCGCCTTGGAGCAGG...\n+\n+- [Optional] Proteins: Predicted proteins in prodigal fasta format. Header contains contig-ID and gene number: ::\n+\n+    >Contig_1_1\n+    MPRKNKKLPRHLLVIRTSAMGDVAMLPHALRALKEAYPEVKVTVATKSLFHPFFEG...\n+    >Contig_1_2\n+    MANKIPRVPVREQDPKVRATNFEEVCYGYNVEEATLEASRCLNCKNPRCVAACPVN...\n+\n+Outputs\n+=======\n+\n+- Summary of output bins including quality and completeness estimates\n+- Contigs to bin file of output bins\n+- [Optional] Quality and completeness estimates of input bin sets\n+- [Optional] Bins in fasta format\n+- [Optional] Unbinned contigs\n+\n+    ]]></help>\n+    <expand macro="citations"/>\n+</tool>\n'
b
diff -r 000000000000 -r a8e434ebe961 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Mon Jun 27 12:41:23 2022 +0000
[
@@ -0,0 +1,31 @@
+<?xml version="1.0"?>
+<macros>
+    <token name="@TOOL_VERSION@">1.1.4</token>
+    <token name="@VERSION_SUFFIX@">0</token>
+    <token name="@PROFILE@">21.01</token>
+    <xml name="biotools">
+        <xrefs>
+            <xref type="bio.tools">dastool</xref>
+        </xrefs>
+    </xml>
+    <xml name="requirements">
+        <requirements>
+            <requirement type="package" version="@TOOL_VERSION@">das_tool</requirement>
+            <yield/>
+        </requirements>
+    </xml>
+    <xml name="version">
+        <version_command>DAS_Tool -v</version_command>
+    </xml>
+    <token name="@HELP_HEADER@"><![CDATA[
+What it does
+============
+
+DAS Tool is an automated method that integrates the results of a flexible number of binning algorithms to calculate an optimized, non-redundant set of bins from a single assembly.
+]]></token>
+    <xml name="citations">
+        <citations>
+            <citation type="doi">10.1038/s41564-018-0171-1</citation>
+        </citations>
+    </xml>
+</macros>
\ No newline at end of file
b
diff -r 000000000000 -r a8e434ebe961 test-data/contigs.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/contigs.fasta Mon Jun 27 12:41:23 2022 +0000
b
b'@@ -0,0 +1,10 @@\n+>Ley3_66761_scaffold_6\n+ATCATCGTCCGCATCGACGAATTCGGCGAACGAGTACCCCTGACCATCTCCGATTACGACGCCGAGCAAGGCTCGGTAACGATCGTCACGCAGGCTATCGGAGCCTCGACCCGCAAGCTCTGCGCCTTGGAGCAGGGCGATGCGCTGGCCGATTTCGTCGGTCCGCTGGGGCACCCCTCGGAGTTCATTCACGAAGATCTCGACACCCTGCGCAAGAAACGCTTCCTGTTCGTAGCGGGCGGCGTGGGTACGGCTCCGGTCTATCCGCAGGTAAAATGGCTGCACGAACACGGGGTGAAAGCCGATGTCATCATCGGTGCCAAGACCAAGTCGATGCTGATCTATACCGAGGAGATGGCCCGCGTAGCGGACAATCTCTACATCGCTACTGACGACGGCAGCGAAGGCTTCAAAGGTATGGTAACGGCCCTGATCAAAGACCTGATCGACAACCGGGGCAAGCAGTACGACGTCTGCGTGGCCATCGGTCCGATGATTATGATGAAGTTCGTGACGCTCACGACCAAGGAGTACTCCCTGCCGACGGTCGTATCGCTCAATACGCTGATGGTCGATGGTACGGGCATGTGCGGCGCCTGCCGCGTCACGGTGGGCGGCAAGACCGTCTTCACCTGTGTCGATGGCCCCGAATTCGACGGGTTCCAGGTCGATTTCGACGAAGCGATGCGCCGTCAGGGTATGTACCGCACGCAGGAAGAGCGTGCCCGCGCCATCGAGCAGGAGCGCGAGAACGGTCACAAATGCCGTGTCGGGCTCGACAAATAACTACCGATCCACACACAACCGGACGTTTCCGGCAGACGAGTATGGAGCGATGCTCTGCGTCCGAATGCCGAAGGCGTCCACAGAACAATGAAAGCAAACAACTATGGCAAATAAAATTCCGCGCGTTCCCGTGCGCGAACAAGATCCGAAAGTCCGGGCCACCAACTTCGAGGAGGTGTGCTACGGTTATAATGTCGAGGAAGCCACGCTCGAAGCGTCCCGCTGCCTGAATTGCAAGAATCCCCGCTGCGTGGCGGCGTGTCCGGTGAATATCCGTATTCCGGATTTCATCCATCAGGTCGTGGAGGGTAATTTCGCTGCGGCTGCCGCCGTTATCTCCGAGGACAGCTCGCTGCCGAGCGTTTGCGGCCGCGTCTGCCCGCAGGAGAGCCAGTGCGAAGGCTCCTGCGTTTTGGGAGTCAAGGGCGAGCCGGTGGCTATCGGCAAGCTGGAGCGCTTCGTCGGCGACTGGAAAATCGAGAATGCCGACAAGATGCCCGCTCCCGACATCAAGCGCAACGGACACAAGGTAGCGGTCATCGGCAGCGGTCCTTCGGGACTGGCCTGCGCGAGCGACCTGGCCCGCATGGGGTATGAAGTGAAGATTTTCGAAGCGCTGCACAAGGTCGGCGGCGTATTGGTGTACGGTATTCCCGAATTCCGTCTTCCCAAGGAGAAGATCGTAGCCAGGGAGGTCGAGGCCGTGAAGAAGCTGGGTGTAGAGATCGAAACCGACGTGATCGTCGGCCGCACCGTGACCATCGACGAACTGATGAACGAAGAGGGTTACGAGGCCGTCTTCATCGGTTCGGGTGCCGGCCTGCCCCGTTTCATGGGCATCCCGGGCGAAAACCTGAACGGCGTGGTTTCGGCCAACGAGTTCCTCACGCGTACCAACCTGATGAAGGCTTACGATACGCATTACGATACACCGATCTATGTCGGTCAGCGCGTAGTGGTGGTCGGCGGCGGTAACGTGGCGATGGATGCCGTACGTACGGCTAAGCGCCTGGGGGCCGAAGCGACCATCGTATATCGCCGCAGCGAGAAGGAGCTGCCCGCCCGCGTGGAGGAGGTCCACCACGCCAAGGAGGAGGGGATCGAATTCCGCATGCTGACCAATCCGACTTCGATCATCGGCGACGAGAAGGGCTGGGTCGTAGGTATCAGTTGCGTCGAGATGGAGTTGGGCGAGCCCGACGAAAGCGGACGCCGCTCTCCGATCGAAAAGGCCGGTTCGGATTTCGAAATTCCGTGCGACGTGGTGATTATGGCGCTCGGCACTTCGCCGAACCCGCTGCTCAAGATGACCACCGAAGGGTTGGAAACCAACCGCAAGGGGTGTCTGGTGGCCGATGAAAAGGGTGCGACTACCCGTGAAGGGATCTTCGCCGGCGGCGATGCCGTAACCGGAGCCGCGACGGTCATCCTGGCCATGGGCGCCGGCCGTAAAGCCGCCAAGTCCATCGACGAATACATCCGTCAAAAAAAGCATTAAACGCTTGCAAGATATGAGGAAATTTTGTTTCGCCGCATTCGCTGCTGTGCTCATCGGGACGACGGCTTGTACACCCAAAGCTCCGGAGCAATTCACGGGTAAGATCGTCGATGGAACGATGAATACCGTCACGGTAGAGTCCCCGGCCGACGGAAGAAGGGTGACTTTCACCACGGAGGATGCCGATATGCAGGAGGCTTACGGCCTGCTGCTGGGCAATACGGCGACCGTTACCTACCGGGGGAAGCTCGGCGAGACGACTCCGGCTTTGAAGGTGGTGACCGATCCCGCCTATGTTACGGCCATCGGCCGCTGGGTGGAGCCCAATCCGATCGACCCCGAGCAGGAACAAGGCATTGAAATTCGAGTAAACGGCGTCGCCGCTTCGATCAATATGCTGACTCTGCGCTACGAAGCTTGGGAATTGGCGCCCGAAGGAGATCGAATTATCTTGAGCGGCGTATCGGAAGGAAGCGGCGGGCCGTATCCTTTCGAGCAAACGGCTGAAATTATCGAGATGGACGGCAAGCCGGCCCTCAAGATCGATGCGGTCGTTCTGACCAAAAAAGATCTGATCTAAATTGGATGCCGTTTCATATACGGCTTGGTTCGATAAAAAAACTCACGCTTTTCAAGCGTGAGTTTTTTTATCGGGTGCCGGAAATCGGGATTCGGAACCAAACAACGGAACTTCGTCGGGAAGGAGTGCGGAAACAGGTAAAAAATGGGAGCAAAGGGAATCGACGAAACGATAAGCCGAAATTACTCCGTTTTACCGACCAACCGCTCGACCCGGTCGAGGATCATCTGCGGTTCTATGCTCCAGATACAGCGGTAATCGCCATATTTACAGGGTTTCTTTCCATATACGGAGCAAGGTCGGCAAGCGAAATCGGTCTGCAAGACACCTTCCTGTCCGAACCCGTAACCCAGAAAGCCGAGCCCGGGATGGGTCGCTCCCCACACCGACACGGTGGGCGTAGCCATGAGCGAAGCCAGATGCATCACCAGCGAATCCATCGACACCACGCAATCCAGGTTGGAAATGAGGTTCATCTCATCCCCCAGCTTTATCTTGCCATACAATGCCGTGACGTTCGGATAGAGCGCCTCCATGCGGCGGGCGAATTCGGCTTCCTCTCCGCCGCCGCTGTGGACGAAAACCCGGTCGAAACGCCCGCTCAACAGACGGACGGCTTCGGCGCTCAACTTTTCGGGATAAGTCTTGCCCGGCTGGGCGGAGAACGGCGCGAAACCGATCCATATACCCTGTTTTTCTCCCATGGGATTGGGTCGGGGGCGTTTCTCGGCCGGCCGGGGATCGGGAAAGTCGAATCCCAAGCGACGGAAGACGTCGCAATAACGGATGACGGTGTGTTTCAAAGGTTTCACACCTTCCGAACCGCGTCCCAGCCGCATGTATTTTTCGATCCGCCCCTTGTGAATTACCGAAACGGGAATCCCCCGCAGGTGGAGTGCCGCACGCACCATCTTCGAACGCAGTACATTGTGCATGTCGGCCACCGCGTCGATCTTCAACTCGGCCGCTTCGCGGGCGAACCGAATGGCGCCCCGGATACCCCGGTGCGTGCGGCGGGTTTCGATATCCAAAAAATCGACATCCACCCCTTCGAAAAAGGGATGGAACAGCGATTTGGTCGCAACGGTCACCT'..b'TCGTGTCAAAAATGTCGCACTGCATCTATGACCTGCTTGCCCGCTACAGAGCCGGTGAATGGAAAGAGTGGAATGTGGAGATACCGGTGATAGTCAGCAACCATCCCGACCTGAAATATGTGGCCGACCAGTTCGGCATACCGTTTGAGGTAATATCCGTTACCCGCGAGAACAAGCCGCAGGCCGAAGCGCAGCAGTTCGCGCTGCTTGAGCACTACAATATCGATTTTGTAGTTCTTGCCCGCTACATGCAGGTGCTGTCAGACGATTTCACACGCCGTTATCCCAACCGGGTAATCAACATACACCACTCGTTCCTGCCCGCATTCATCGGGTCGAAGCCATATCATGCAGCCCACCAGCGCGGAGTAAAACTCATAGGAGCGACAAGCCACTACGTGACAGCCGACCTTGACGCAGGTCCCATCATAGAACAGGACATCGTGCGCATCACTCACAAAGACACAGTAGACGATCTGGTGAAGAAGGGTCGCGACCTCGAAAAGATTGTGCTGGCGCGCGCAGTCGAGAAGCATCTCCAACACAAGATATTGCCGTACGGAAACAAAACGGTGGTATTCAACTGAAAAAACCGATATGAAATTAACAAAATACCTTCTTCTGTTGCCCGCGGCCTTACTATGCCTTGTAGACGCCGCGGCCAAAAACGAGCCTCTCAAGGGCTTTGACAAAATAGGCTACACAAGCCGTATTATCGAATCGTTCTATTTGGACAGCATCGACAATGACAAACTTGCCGAAGAAGCCATCGTAGCGATGCTCAAGACGCTCGACCCGCATTCGCTATATTCCAATCCGGAAGAGACCAAGGAACTGGTAACGCCGCTCGAGGGGAATTTTTCGGGGATAGGCATCCAGTTCAATATGCTCAACGATACACTTATAGTGATACAGACCACCTCGGGAGGTCCGTCGGAGAAAGTAGGAATACTCCCCGGCGACAAGATACTGAGCGCCGACACGACTATGATATCGGGAGTAAAACGCCCGCGCAACGAGATAATGAAAGCTCTCCGTGGGCCGAAAGGCACGCGTGTAGACGTGAAAGTGGCGCGCCGCAATGTGGAGGAGCCGATAGAGTTCCGCATCACCCGCGACGATATACCGGTCAACTCGGTCGACGCCGCCTACATGGCGTCGCCCGGCACAGGCTACATACGTCTGTCACGTTTCGCCGAGACATCATACGACGAGGTCCTCGAGGCTCTCAAAGGACTGGAAAAGCAGGGTATGAAACGCCTTATCTTCGACTTGGAGGATAATGGAGGCGGCATACTTGGAGCAGCAGCCGAGATAGCAGAACTCTTTCTCGACAAGGACGACCTCATCACCTATACGGAGTCGCCAAAATTAGGCACAACGCCTTACGTATCGCGCCAAAAAGGGCGCTACGCCGACCTGCCCGTGGCCGTGACCGTCAACCAATACAGCGCATCGGCATCCGAGATACTCTCGGGTGCGCTTCAGGACCACGACCGCGCCGTAGTAGTGGGGCGCCGCACGTTCGGCAAAGGCCTTGTGCAAAGGCCGTTTCCGTTTCCCGACGGATCGATGATACGTCTGACTGTCGCACGCTACCACACTCCCTCCGGTCGCGTCATACAGAAACCTTACGAACGTGGTAAAGCCGAGGACTATGCGGCCGACATCAAGGCCCGTTATGACAACGGCGAATTCTACAGTGCCGACAGCATATCGTTTCCCGACTCGCTGAAATACACGACACTGCACCGGCACCGCACGGTATACGGTGGGGGCGGCATAATGCCCGACAAGTTCGTGCCCCTCGATACCGCGCTTTATACGCCCTACTACCGTGACCTGATGGCGAAAGGAGTATTCAATACCTTCTGCCTCGGATACACCAACGACCATCGGAAAGAACTGCAAAAAAAATATGATACGCAGGATAAATTCATCAAGAATTTCGATGTCGATGACAAGATGATGGGAGAATTTGTGGCGCAGGGGGAAAAAGACGGTGTGCCTGTCAATGACAACGAGCTTGCCCGCAGCCGTACTCTTATCGCCGCCATTATAAAGGGAATAATAGGGCGCGACCTGTTTGACACATCGACCTATTTCAGAATAGTTAATCCGCTGCTCAACCCCATCTACCGCGAAGCATTGGAGATAATAAATTCACCGGAAGAATACGAAAAATATCTGAATTGAAATCAATAGAGCAGGGGTGTAGCAAAAGTGCTACACCCCTGCTCTATTGATTTCAATATCTTATAATATCGCAGCGATATTACGTATTGATGAAAGGCGTGTCATAAATGAAGCGTCAGACTTAGCTACCTGCATATTATAATCGCGCTGAAGATTGAGGAGCAAATCAGCCGGGATACCCAATGCCGCTTCAATAAGAAGTGCCATTTCCGTATTAACGCCTCTCTTCCCTTTAATAATTTCATTAATGAGGGAGGGACTTACTCCAATACTTTCAGCGAGCTTTGCCTGAGTAATGTTACTTGCTTCAAGCTCATCGTGAATAAGCTCCCCCGGATGGGTAGGCTCAAACGGAGTCAAATTATTTGCTATCATGTCGGTGGCAATGCCCGAAAGTGTAATCATATCAATCGTAGTGGTTTGAAAGTTCAACAATATTGCAAATGGTCAAAATCGGTTCTTCAATAGTTTCGCGCATGGTAAACTCTATCCGATACTGATTGTTAACTCTAATAGAAAATCGGTCGGATTTATTTCCTTTCAAGGCCTCGAAATTTAAAGAATTAATCCGATACAAGTCTTCTTTGCAAGAAGCCCATTTAAGATAATCAACGCTACGCTTATAGCGCTTGATTATATCAATCCTGTAGCGATGTTTCTTATCGCTACATTCTCCTTTATCATAGAGGTCTCTCAGATATTTTTCCCCGAATTCTACTATCATATATTTATATTACAGGACAAAGGTATGAAAAGTATTTAATTCTTCACAAAACTGTGAAGAATATTTTCAGAATGCACCCCATGAAAGATTCTTCCGCCACAATCCGAAATTACAGTGCATATTCCACTTCCCATTTAATATCGCTTTCCGCGGTTAAAAACCGCGGCTATTATAACATCCTATTAATCAATTACGTAGTAGCCGCGGTTTCTTTGCATAGCAAAGCGCCAAAGGCGATGATTAACCGCGGACAATAAAGCCTGCAATTGTCATATTGTCATGCACTGCGATTTCGGATTGAGGCATTCTTCCGATTCTCATAAAACGAAGGCGAAGGCAATCGCAGTATGCGGTTGCCTTCGCACGATTGACACGGTGGGTACTGTCAGCAGCGGCCACCGTGCCGCCTATCACACTTTATTACCCTATCTAATGGTCGATTAAACCGCCTGTCAATCAATCCGCCTTATCGTTAACTTACCGCACCGACAAGGCCGATCAGTACACGATTATAGTCGACAGGCTGAAAAACCAACCGCTTTTTCCTTCTAAAAAACATGAGACAACCCATTTATTATCCCATAGCCATTACCCTGAGAAACCATCAGTACCGGTCCCGAATACGCTTTTATATCTGCACTACCCCAATCAGCTCCATGATAATGAAACCAACACGTTAATTCCAGACATTGCATCAAATAGTTGAAAATAAAATAAGAATAACTGAAATGTCAAGGACGAGTATTAGCTATCATGAGAGATAAAAGTATTATATGCACTAAATTGCTTTCAACATGCGTAATGCTCAGTAGCAACGGCTCGCAAATGTAAAAATTTATTTTTAAACAACAGACAAATTATTTACTAAAAAACTGATAAAATCGCCCGAATTAATGTTAAACTTTGTAAAATCACCTTTCAACATTTGATTTATGGATAAAATTTAACTAAATCGAGGGTTAAATGACACCTACCAACGCCCACATCGACAGATGAGTAAGCAACATAAGGGCGATAATAATCCACGTCATGACTGTCCGCCGGCCATAA\n\\ No newline at end of file\n'
b
diff -r 000000000000 -r a8e434ebe961 test-data/maxbin2.001.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/maxbin2.001.fasta Mon Jun 27 12:41:23 2022 +0000
b
b'@@ -0,0 +1,8225 @@\n+>contig-201_2\n+TAACCAGACGGAACGGTATCTGATGGCCACGGGATTGGTGCACCGACTGGATAAAACTCTGCAGGAGGAT\n+GAGCCGAGGTGTAAAGCTGCGCCCACGGCGACCAGTTTGCGTCGGTCGTATCCCGTCGTGAACGAATAAA\n+TGCCGGAGCATGAGCACCGCTTGTACCACTCCAGCCGATGAGTAACTCACCTTCGCCAACGGCTGTCATC\n+CCTTTCAGGTGAATGATATTTCCATACGCTGTTGGATATCCGTTGTTATACACCTCGTATAACTCAAGAC\n+CTGCTGCCCCCTGCGTATTGTCTGTCAGCGCGGTTATATTCACTCAGCAACCCCGGTATCAGTTCATCCA\n+GCGCGGCTGCTTTGTTCATGGCTTTGATGATATCCCGTTTCAGGAAATCAACATGTCGGTTTTCCAGTTC\n+CGGAAAACGCCGCTGCACCGACAGGGGGATCCCGTCGAGAATACTGGCAATTTCACCTGCGATCCGCGAC\n+AGCACGAAAGTACAGAATGCGGTTTCCACCACTTCAGCGGAGTCTCTGGCATTTTTCAGCTCCTGTGCGT\n+CGGCCTGCGCACGCGTAAGTCGATGGCGTTCGTACTCAATAGTCCCTGGCTGGAGATCTGTCTCGCTGGC\n+CTGCCGCAGTTCTTCAACTTCCCGGCGCAGCTTTTCGTTCTCAATTTCAGCATCCCTTTCGGCATACCAT\n+CTTATAACGGCGGCAGAGTCATAAAGCACCTCATTACCCTTGCCACCGCCTCGCAGAACGGGCATTCCCT\n+GTTCCTGCCAGTTCTGAATGGTACGGATACTCGCACCGAAAATGTCAGCCAGCTGCTTTTTGTTGACTTC\n+CATTGCACATTCCACGGACAAAAACAGAGAAAGGAAACGACAGAGGCCAAAAAGCTCGCTTTCAGCACCT\n+GTCGTTTCCTTTCTTTTCAGGGGGTATTTTAAATAAATACATTAAGTTACGACGAAGAAGAACGGAAACA\n+CCTTAAACCGGAAAATTTTCATAAATAGCGAAAACCCGCGAGGTCGCCGCCCCGTAACCTGTCGGATCGC\n+CGGAAAGGACCCACAAAATGATAATAATTATCATCTACATGTCACAACGTGCATCTACGCCATCAAACCA\n+CGTCAAATAATCAATTATGACGCAGGTATCGTATTAATTGATCTGCATCAACTTAACGTAAAAACAACTT\n+CAGACAATACAAATCAGCGACACTGAATACGGGGCAACCTCATGTCAACGAAGAACAGAACCCGCAGAAC\n+AACAACCCGCAACATCCGCTTTCCTAACCAAATGATTGAACAAATTAACATCGCTCTTGAGCAAAAAGGG\n+TCCGGGAATTTCTCAGCCTGGGTCATTGAAGCCTGCCGCCGGAGACTGTGCTCAGAAAAAAGAGTTTCTT\n+CTGAAGCAAACAAAGAAAAGAGTGACATTACTGAATTGCTCAGAAAACAGGTCAGACCAGATTGAAGCAA\n+TTTAGATAATCGTGCAGACTACGCCCCCTCATATCACATGGAAGGTTTATCTATGGATCAGGTAGTCATT\n+TTTAAACAAATATTTGATAAAGTTCGAAACGATTTAAACTATCAATGGTTTTATTCTGAGCTAAAACGTC\n+ACAATGTCTCACATTACATTTACTATTTAGCCACAGAGAATGTTCATATTGTATTAAAAAATGATAATAC\n+AGTGTTATTAAAGGGCCTAAAAAACATTGTGTCTGTCAAATTTTCAAAGGATAGGCATCTTATAGAAACG\n+ACCTCTAATAAGCTGAAATCCAGAGAGATCACATTTCAGGAATACAGAAGAAACCTTGCTAAAGCAGGAG\n+TTTTTCGGTGGGTTACAAATATCCACGAACAAAAAAGATATTACTATACCTTTGATAATTCATTACTATT\n+TACTGAAAGCATCCAGAAAACTACACAGATCTTACCACGCTAAACCATAACGTCCGGCTTCTCTCACTCC\n+TGAGCCGGACTGCATTGGTTTAATAAAAACCATCAACAATTGTGATTTAGATATTCGGAACCATTCAAAT\n+ATAACAAAACCCCGTAAAAACGAGGTTTATGGATAAATTTTATTATTGAATACATCAGATTAAATTAATC\n+TTGACATCATAGCTTTCAAGACCCGTCATTTTTTCCCGTGCGGTAAACTGAATACTGGTAACTTCTTTCC\n+CGGTCTTTTTCTTAAGTTCAATAATTTTTTTTGTTATATATTCAGAAATATCTGCTTCTGCTTTTGTTTT\n+TAAGTTTTCAATATTCATCATTTCCTCTTTTAGTCTGTTATGACTTTCCAGTTACACAGTAAGTCGATTA\n+TATGGTGCAAACGTGTAAAAGATAAGATGAAACATCGCAATAATCAACATACGATAGTCTAAATTTTACA\n+CAAACAGACAAAGAGAATTTTCCTGAATTATCAATGCAATAGCATCAAATCAACTCAAGAGCCTTATTGC\n+TGCTTCCAGAATTTCTTCTGAAGTAACATGTCGATCCGCGGCTACATAAATGACTTTATGATCTCCGGTC\n+AGAGATGGAAACCCTGCGGCCATTACAGTAAGGTGTGTTTTTTCGCCATTTGGATATTCACGCATGATGG\n+TGTTAACTCCAGTCATCGCTGGCACTACCACTGCTGGTTCAGAGTTAAAAAAACTATGATTTTTTTCATG\n+ATGTTACCGTAGTATGTGAGTATCCATCGAATAGACACCAAGCAAAAAAGCTCCCGAAGGAGCCTTCATT\n+TTCACTTTTTTAAATCCAACGACAGACGGCTGGCATTTAAGTATTGTGAAATATTATCAAATGTAATCAT\n+CATTGATTTACAAAAGATACATTTTGCCCCGAAAGGATTCATGTCAGAAACATCAAAAGATGATGTTCTA\n+TACTGGGAACCATGACAACACGGGCATCTAAAGTGAATATGGTTTGTAATATTGTCTACCTCAAAGCGCC\n+ACTACATGAACAGCGGCAGGACCTTTAGGTCCGTTCTCAATACCAAATTCAACTTCCTGATTCTCAGTTA\n+ATGTTTTGAAATCGTTGCTCTGAATTGCTGAGAAATGGACAAACACATCTTTGCTGCCATCTTTCGGCGT\n+GATGAAACCAAAACCTTTTTCAGGGTTAAACCATTTCACTAAACCAGTCATTTTGTTAGACATAATTATT\n+ACCTTTTGAAGAAATTAGCCCTTGGGCAGAATGGTCCGAAAAAAAATATCAGAGAGAAAAACCAACAAGG\n+AAATCTCAAGAGGTACAAATAATAAAATTATAACAATGACTGCTTCAGATAAATTTGTAACAAACCAGAA\n+CACCATTAACGCATGATTAACCACCCATAGCAAGGATTACTTTTGTAAAGAAAAACACAGCAATGAAAGA\n+ATAGCTTTATTTATTAATAAAACGTGTCATTCTGATTAAGACCTTTTATCTTACCCTTAAGATTTCAGGA\n+ATTTTGGCTCATGGAAGAGTCCTTTTTATTTAAATTTTACATTCCGCGATGTAAATGTTCCGATTTAATA\n+TTACCCTACATTTGATGCTTTTTATCTCTTAAAGATTCATAGATCTGTTGACAAGTCACTCCTGCGATGT\n+AGCGTTCGTCAGCAATTTCAGCATAAAGCTGAGCTTCTGCTGCAATATCTCCGAGCATGTTGGTGAGCAT\n+TCCTTCGGCGGTTTTGGTTGTTTTGCCTCTGACGGCAGCGGCAAGATCTGCGGTATGCTTCGCTGCGTCA\n+AGGCGTATGGCATATTTTTTTGCTTCGGCACGCAACTGGTTAACACTATCAGACAGATAAGCAGCCCTGG\n+CAGAAATTTCAGCAGATTTCTGTTGCGCATCTTTAACAGCCTCATCACGGGCTATAGTTCGCCCCTGTTC\n+AATT'..b'GATGTATAACACCAAAACTTGCTATGCAGAAATTTGCACAGTGCGCAATTTTC\n+TGCATAGCCGCTCATTCTCCTTATAAATCCCCATCCAATTTATCCCTTCATATTCAATTAGTTAAATAAC\n+TAAATCCAAT\n+>contig-201_954\n+AATATTGCCAGTAGATTATTATCTAATCAAACATACTTTCCTATAATTCACAATTATAATTCAGGTGAAT\n+AAAAAAAGACCATGAAATATATAAATTGTGTATATAATATAAATTACAAATTAAAACCACATTCTCATTA\n+TAAATAATTATATGATGAAAAAACGGTATGAATTAATACTCAAATAAATAAAGCAGAGCTTAAACATAAC\n+TCTGCTTTATAATTAAAGGGACAAAATAATTTTACATCTGTTACTGTTTCGGTCGCAGATTCTCATCAAA\n+TACCAGGCGTTTCCTGCCAGGTTCAATTTCCCGCAATGGCTCGACTTGATGTAACGTCTGCTTACAGCGT\n+GTCACCAGCACCTGGTACTCATGCGTACCCTGCTTTTTCCATGCCAACTCCTGCTCACTGAGTTCACGAA\n+TCGCTTTCGCCGGGCTGCCGACAATCAGGTAATTAGCTGGCATTTCTGCTTTGGCTTTCACAAATGCGGA\n+TGCACCAACAATGCTGTTCTCGCCAATCACCGCACCGTCCATCACTACCGCGTTCATTCCCACTAATGCA\n+TTGCGGCGGATAATGCAGCCGTGAAGGATAGCGCTATGACCAATATGTCCATCTTCTCCTACAACAGTAT\n+CCTGCTCGGGAAAACCGTGCATAACGCAATTATCCTGAATGTTCGCGCCATCTTTCACCACGATACGACC\n+AAAATCGCCACGCAGGCTGGCATTTGGCCCAACGTAAACGCCCTTGCCGAGAATAACATCGCCGATCAAT\n+ACCGCTGTCGGATGGACAAAACTCTCTTCTGGCACAACCGGAGTCAGACCGTCTATCTGATAAATTGGCA\n+TAACGCCTCCTGTTCAATATTCAAGCCGCCAAAACGTTGAAAATACAGGCTTCCCGGCGCAGGCAGTTCA\n+CCGACCGAGGTTTCACCTTTTTCACTAACGAACGCTAAAGCAGCAGGCGCTACGCGCTGATAAATGTTGA\n+TACACAGCTGACGCGCCGTATGCCCTGCCCAGTGTGCCGGAAGCAACTCCTCCGGCAACAATGGGTCTTT\n+AAGGACGACACGGCGATAAAAATGGATCAGTAAAAGCTGAATATGAAATGCCCGCTCCGGGGTTAACTCG\n+TCTGCCGCCTCTTTTAAAAGCGGCACCAGCGGGCGGAATGACTGAATAAAGGTTTCGTACATGGCATTTT\n+GTTCAGTTAAATGCCAGCACTCTTCTACTCTGGCACGCAGTGCTGCGCGAGAAAG\n+>contig-201_956\n+GTTCGGGATGTTTCACTTCATCAATTAGAGTTAGTGCATCATTAAGACCAAGGTAATTCTGTGTCGAATA\n+GCGATAGGCCGCGATATTCAGTGAAGTACTTGTTTCTTCGAATAACTTGTTCCAGGAAACACGATAACTT\n+TGCCCCTGGTATGTTTTATCATCCGGGATACGAACATTGGAATGAGTCACATCGAAAGAAAATGCACCAA\n+CTGAAGTATTCAGACCAAGACCTAACAAACCAGCGGTATAGTTATTATCGGTTATCTGAATACCGGTATA\n+ACCCGTCAGATAGTTATTCAGGCCGTAGTAGTAGCTTGCTTGAAATAAATTAGGCTCATCCTGAATATCA\n+TCTTTTAAGACCTGACCGCCGCTAATATCCCAACGTCCAACGCCAGGGCGTAACATTTGAACAACGGATG\n+AGAAAGGTTGCGAGAATGTCCGCTTTGAGCCATCGGATTCTTCGATGGTAACAATAAGATCGCTGCCGTA\n+CCCTGACGGACTCAGATCATCAATGACGAAAGCGCCTGGCGGCACCGTCGTTTCATAAATCTTATAGCCA\n+CCTTGCGTAATAGTGACTTTGGCGTTGGTATTGGCAACGCCATGAATGATAGGCGCAAAGCTGGCTAAAG\n+TCGGAGGCAACATGCGGCTGTCACTGTATAAACGAATGCCTCGGATACTGACGGAATCAAAGGTTTCGCC\n+CGTCGTATAAGACTCACCAAGAATGAGTTGAGAACGCAGCGAGGCGATATCACGCTGAACATACCGATTC\n+TTAAAATCATAATTACTGCCAGAATCGGTCATCCAGTTGTAGTTGCCCGAGGCACGCAGTCGCCATGCAC\n+CTAAATTCATCCCACCGTTAAATGCAGCATAAATGCTTTCATTTTTTCGACCAGGGGTTTCACTATGATA\n+TCCGTTGAGGTTGTATGACAACATGGCCGCATTAATGCCGTTTTCCCATAACGATGGATCAACATAGTTT\n+TGGTAATTTTTCATTACCCAGGCTTGAGGAACGTCTATATCCAGACGTTGATCGTTAACGTCATAACGAA\n+CAGAAGCCTGAGGGATAATTTCCGTCAAATTGAGGCAATTGCCGAGCGTTTCATCCCTGGCAAGCAGAAC\n+GGCTTTTTCGTTATTTATATCGGGAGAATTAATATGAAACTGCAATAAATTCTTTAATGTGATACAAGCC\n+TGGGCGTTCTTTTTTCCTTCAATTGCGACAAATGTAATACTTTGGTTAAT\n+>contig-201_962\n+CCGGCTCGCGTTTGCCAAGATCCAACTCATTGAAGGCATAACCATGACGCTCAAGCAGTTGTGCCTCTTT\n+GATGGTGAAATCACCATGACGAGAGAATCCACGTGGATAATGTTTATTGTCGAAATATCGATTAGTCGTC\n+GTAAAGCTTTCCGCCATCCTGCACGCTCCTAATTCTTTGACCGAGCTAGTTATGGCGCGGAGTATTAGTT\n+ACGCTTGACAGAGTGTAAAACAAAACATTTAAATCATAACGACAAATAATTTTGCGGAGAGCACTGTGGA\n+TACGGAATTGTTAAAAACTTTCCTGGAAGTTAGCCGAACGCGTCACTTTGGTCGAGCGGCTGAATCGCTC\n+TATCTGACCCAGTCAGCAGTGAGCTTTCGAATCAGACAACTGGAAAATCAACTGGGTGTGAACCTTTTCA\n+CCCGCCACAGAAACAATATCCGTTTAACCGCTGCCGGTGAAAAACTACTGCCTTATGCAGAAACGCTCAT\n+GAGCACCTGGCAGGCCGCCCGTAAGGAGGTGGCGCATACCTCACGACATAACGAGTTTTCTATCGGTGCC\n+AGCGCCTCGTTGTGGGAATGTATGCTTAATCAGTGGCTGGGACGCTTGTATCAAAATCAGGATGCCCATA\n+CAGGCTTACAGTTCGAAGCGCGAATTGCCCAACGGCAGTCTCTGGTAAAACAGCTGCATGAACGCCAGCT\n+TGATCTTCTTATTACCACTGAAGCGCCCAAAATGGACGAATTTAGTAGTCAGTTGCTGGGATATTTCACT\n+TTAGCGCTTTATACCAGTGCCCCTTCAAAACTAAAGGGAGATCTTAATTATCTGCGACTTGAGTGGGGGC\n+CAGATTTTCAACAGCATGAGGCAGGTTTGATCGGTGCTGACGAAGTGCCCATTCTGACAACCAGTTCTGC\n+TGAACTGGCACAGCAACAGATTGCGATGCTTAATGGTTGCACCTGGCTACCCGTCAGCTGGGCGCGTAAA\n+AAAGGCGGCCTGCATACCGTTGTCGATAGCACAACACTTTCACGGCCGCTTTATGCCATATGGCTGCAAA\n+ATAGCGATAAAAATGCGTTGATTCGCGATCTTTTGAAAATTAACGTGCTGGATGAAGTGTATTAATATGA\n+ATGGCTGGCAAGGATGCCGGTAGAAGGATTTACTTCGGAGAGGGTTATTTCAGATAAAAAAAATCCTTAG\n+CTTTCGCTAAGGATGATTTCTGGCAGG\n'
b
diff -r 000000000000 -r a8e434ebe961 test-data/maxbin2.002.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/maxbin2.002.fasta Mon Jun 27 12:41:23 2022 +0000
b
b'@@ -0,0 +1,2186 @@\n+>contig-201_29\n+GAATTAGTTAAAGTTTCAGTATCGATATCTTTTACCGTATATGTTGGGGATACTATTTGTATAGATTTAT\n+GATGATTCGGGGACCAAATTAAATGCGAGGGATATTCCGGAGTACGTGAATTAGGGTAAAATGCAAGCGT\n+TGGTTTATGATAAGCCGCAGCGATATGAACAAGAGCTGTATCAACAGAAATGACAAAATCACTATACTTG\n+GTCAACGCAACGGTATAAATAAACTCATCAAATGGTAGTGTTTCGATTTCAAGTATTGGTATTGTCAATA\n+AATCTTGCGGTAACCCGGTAAATATAATCCGATAATTTTCAAAGTGTGTTTTCACTTCTTGATATATAAC\n+TTTTATTTGCTCAAACGTAAGACGGCATATTTTTTTTGCACCTAATGGATTAATAATGACTATTCTTGTA\n+TCTCCAATAAATTCTTTTATTTTATCTTCAACATCTACTGGTAAATGCAAGTCGTAGTTGGTGGAAAATT\n+TACCCTCACCATAAATATGCTTCAGTATTTCTATTGCTCGTGTACTCATATGTTCTTTTAAACATTCATC\n+GTGGGGATGGTAAAATGAATAGTAACGCTTATACCAATGATCAAAACCCAGAATGTAAGAATCTTTTAAA\n+CTTGATAATATTAAGCTATGCTTAAATGAGGGCATAGTTTCAAAGGGGTCTAATACAATATCGAACTGTA\n+AATCCCGCAGATGCTTACATAGAGTAAGCATTTCAAGAAAACCGGTTGATTCTTTAATACAGAACTCAAA\n+TATATTTTTATTATTAGAGAGAAATTCCCCACCCTTTCTATTTGTGAGAAGAGTTATTTTAACCCCTTTA\n+CTATAAAGTTCACGATAAATCGAACTTAATACAATTAGATCACCAAGTTTATTATTATCATGAATAATAA\n+GGCATGATTTAACTTGTGCTGGATCTGTAATTTGATTATTTATTTTATTACGAAATAAAAAAGAAAGGAA\n+ATTAATCTTGATTTTGTTTATATAAAATCTTTTCTTTTTGTGAAAAGTTCCTAAGCGCATTTTTATACCA\n+TATTATTTTAGTTTCAGGATGATTAATTAGCATAAGAATCGGTTGAAGTTCTATATTGCATTTTTTTTCT\n+TGTCATATCTTTTGATTCTTCTGCACTGATGTCTTGAAGTTTAATAAATGGAATTACATCGTAAGAAATA\n+GCTGTATCATCTGATAAATTATAAATATTAATATCTTTTACATTATCATGCATAAAACGAAAAAATGGCA\n+ATATTTTGAATAAATCCCTACTTAATTCCGAGGGCATGGGATTTTTATTCTCATCATAGAAACGAGAACA\n+GCTACCCGTTAAATCAAGACCAGAACAAATAATCCGCGCATACTTAAGTGAATATGCGATTTGAATTGCA\n+GCAAAGGCAATAGTATGGCATGAGCAATAACCAAGACTAATGTCCTTGCAAAATCCAACCAGACGACCTT\n+TTTTAGACAACGGTACAGAGATCAGCAGTTCTTTGTGAATCTGTCTCAAAATATTAAATTTAATCTTCTT\n+TATAAAACCACCTTTTTCCCGACGGTAAAAGGACCGTAATACGAGGCAGTTCTGGAGGATATAAAGTTTA\n+TCTTCTTTGGAAGCGTGTTCATAAACGTCAACGTTTACTATGGTATAACGACTTCTCTGGCTAAATTTAT\n+AAAAATCATCACGACGCTGATGTAAAAATCGGACATCTGTAAGTACATATATAAAAGGAACGATATTATT\n+ACTTAACAGATATTGCGCAGAACCATTGACAGCAATAATATCCTTTGTTCGTAATACTGACAAAGGTGTT\n+TTTTGCGATGTAGGGCCCGAAAGAAAAATAATAACATCATCAGATATTTTATTTTCAATCAGGTTTTCAA\n+CATCTTTTTTGTCAATGTATCTAATATTCTTCATGATAAACCTGTGAAATAAATAACTCCGCTTAAAACT\n+GTCCTGGTGAAGACATGTAATTGTGGGATTTTTTTTAGCGCGCTGGTTTCCCTTTCAAACGCCGCATAAA\n+ATTGCGCATTTTTTTACGATATACTAAAAGATAATAGCCTAGATCTCTAATCTCATTTTTAATACCGTAA\n+TGACGCTCTAAGTCAATACGATCTTTCGCTTTACGCTGCGCTGAAGCACGCTTTCCGGAGAGATCGATAA\n+TTCGAACCTCACCATTTTTTATAATGAAGTTACCACGATGGGGGTCGCCAGAAACCATGCCATGTTGATG\n+TAAGGCATTAATTGATTGCTGAATTTTATTTTTTAGCGCATCATCAATATCGGGCATATCACACAACTCT\n+ATGCCATCAATATACTCGATGATCATGATATAAGTATGGACAAAACGTAAGGTTTTCCGTTCAGCCAATA\n+AATAAAAGTCATTGAGTGTATTTAACCCTTCATTTCGTACTTTTTGGGTTTGCTCAAAAAGGCGTTCGTA\n+ATAATCACCTTTTAACAGAGACTTAAAGAAACGTTCGTTACGCTTAACTTTCGGAGAAAAAACCTTAAGA\n+ATCAATTTACCGTAATCGGTATCAATAAGCATAACTTTTGTATCATCAATAGAACGAAAAACCTTGATGA\n+TATTTATATTATAAGACAAGAAGTCATTTAATACATTGAGGTACTTTGAATTGTTTTCATCGGTAAAAAC\n+AACCAAGTCTTTGATCTTGCTCTTCTGAATCATAATAAACCAGTTAAATGTTATTTACGGTAATATTTTC\n+GGCAAAGATAACAGACTCCTGCTATAATTCCTGAGATATAATGATGTTGCACTAAAAGATGTTTATATCT\n+TTTTTTAAATTCAATAATTGATTTCGCATCTCGTGGAGAGTCATCTTTCCAGGGGGAATTTTCTAAAGCT\n+ATTTTATAGTATTTTACCGATGGATAAATTGCCCATTTGTGCCACGGTTTAGTTGCACCTGTATAATGAA\n+TAAGAAGAGTACTTTCTGTAATCAGCTTTTTATAGTTTTGATGTGTTTTGTCTTTTAATTCACTTTTAAT\n+TGTATAAATTGTATTGTACTCACGAGGCAAAAATAATGTCATCCCTTTCAGTAAGACATTCATAACATCC\n+TGATCAGGGTATTTATAAACATTATCTTTACTCATAAGAATAGACAACGCTTTTTCTGTTAGTTTTGCGT\n+CAGCCCATTTTTTTAAGTCTAAATAAACGACACCGGAATTAAAGTACTGCCCAAGTAATTCAGGATCAGA\n+CAACCTGGATACCGCCTTTTCTTGCATTGGCTCAACATCTTTAACAACAGCAGCAACCGCTCCATTTAAA\n+CCCAGATGTAATAGTTGGCTAATATCGCCTTTACAAACAACATCTGCATCAAGATAAAGCAAACGATCAA\n+GCGTTAAACCCAATAATTGAAATGCAAATAAACGGAAGTACATTGCTCTTGACCAGACCTGTGTACAAGG\n+CAAGCACTGGAGCTTATCAGTGTTAATTCTATATAACGTGATTCTTAATTGGTTTTGCTCTGCAAGCTTT\n+GCAATTTTTTGAAAAAAACCATCATTATAAACATCAGCAATAATATAAAAATCAAGATTAATATGTCGAT\n+TATTTAGGACAATTGATGTGATGGAAACACCTACACCATCAAGATAATTAGCATCGACACCATAGGCAAC\n+ATTTAAACATTCAGAAGTATTTATATTAGCTAGCCGAAAATCCCAGGCTTTAACTTTATCTATCTCTATG\n+GCAGGAAATGAGTCCACAATGCTACCCTTATATCATTACTTTATAGTTTCCCAGTTTTAATGCTTTATCT\n+TTTCAATAAAATAAAAAAGATAGTTGCTAAATCCTTTTAGATATCTATGCTTTTTAAGCATATGTTTTGC\n+GCT'..b'TGCATGATTATTTATGATCTCAATTCTGCATTTTGTCAGTAAAATGC\n+>contig-201_940\n+AGCGTTACGTGATCTTTCCCTGCAAATGGAACGCAAAATAAACACCTATTCCATGAGTTATATAATTTTT\n+CACAATGATTAATTTGTTTTCTCAGGAAGAGATTTTATTTCTCTTCACTACGAATTAGTTCATGCTGTAT\n+CTTTATTAAACATTCGTAAGACTCATTTTTGTTCGGGAGATGTGCTGTCATTCGAGCATAAGTTGGTTTC\n+TCATCTTTAAAATATTTTACCATGATTGAATTATCAAGGACTGCCAACAACTGAACTGGATCACTGCTCT\n+TTTTTTGATAGATACCCGCTCTTATATAACTTCTAAACCGATCGCCGAGAAACGCCGTTTTTTCTGCTGT\n+ATTTATCAACTCCTGCAACGTTCCTTTGATGGCATGATTTTCATTAAGGCGTAGTGACCCGACGCGAATT\n+AAGAGTCTCGCCCCGCTTGGTGTGAATTTATTATTTTTACATGTACCCAGTTCTGTTTGCCAATAATACT\n+CACCGATGTCCTCATTCTGATACCATCTCCACATGGCTTTATTATTTAAGACAGGAAACGCGGAAAAAAT\n+AGTACCCTTAGCGAAAATAGTAAAACAATCATGATCTTTAGCTTGTATTTCGCAATCAGCTATAACACCA\n+AAACTAACAAATATCATCAGCAAAAAGAACAAAACTCTTTTCATTTTCTTATTCCTCTCGATGTTCTCTG\n+TTTCATCTTAGCTAAAATTTCACCCAAATCATCTATCCCTGCTGTTGCTGGCCCATCGGGTTTATTAATG\n+TCTGGGAATAAATAGGGTTCTGCACAAGTATATCCTGGTGGTAATTGAGTTGTTGGCCAATTTGTCTGTG\n+GCAGGTAATCACTTGCTGTCTTTGTATCCATCCCTGGATACTGGGAATCATCCTGTGGCGTACAAGTCAG\n+ATTTGGTTTTACCCACTTCCTGCAATACAGTGTGTAGTCGTAAGGGCTTAATGCTCTGAAGAATGTTTTG\n+AAAACATTAGGCGCACTACTGGCCTGGTCAATAGGATATGGCAGTCTTAATTGTTTCGCTATGTCCGGCA\n+ATTTACTTGGATCGGGCGTAGGCGGTTTGTTGGGTCTCGCTCCATATCCGCCATTATTTAAGTGTCCATA\n+TTTTGATGCCAGTCCCATTGAATCTATATACTGAACCGGATTCAGCGGATACTGATAAAAATTCCATCCC\n+CCCTTCAGCCCAATCGGATCCTGAGTGATATACCTCCCCTGCAGCGGGTCATAATAGCGGTGGCGGTTGT\n+AATACAGGCCGGACTCCTCATCATACTGCTG\n+>contig-201_950\n+GGATCTTAGATTCTGTGCTTTTAAGCAGAGATTACAGGCTGGTTACGTTACCAGCTGCCGGGCCTTTAGC\n+GCCGCTTTCGATGGTGAAGGACACTTTCTGACCTTCGTCCAGAGATTTGTAACCATCGTTCTGGATAGCA\n+GAGAAGTGTACGAACACATCTTTAGAGCCATCGTCAGGAGTGATGAAGCCGAAGCCTTTGTCAGCGTTGA\n+ACCATTTTACGATACCAGTCATTTTACCGGACATAGTGTATTACCTTTAATAATTAAGTGTGCCTTTCGG\n+CGATATGGCGTGCTTTACAGATTTTGAAGCGTTAAAGGAATGTGCACTACGAGGGGTATCAACGATAACT\n+CTTGAAGGGACTTGCCTTACTACACTGCTTTAATGGTCTGTACGTCAAACCGTTGATGTGCATTAAGCCA\n+CGCATTGGCGGGTGATGCAACAATTATTTTTCATATTTATGATTAATCGGTTGGAAAACGGTCCTGTCAT\n+CAGGACCGTAAACAGCAATAAAGTGGATAAAAGTCTATTCCATCAACTGCTTACTTAATGCCGGGTTGGC\n+TTGAATCAAACGCATCAATTTTAGTTCGGCACTTGAAGGCTTCACGCGTCTGGATTCCCATTCCTTTACC\n+ATGGCGACTGATACGCCCAAAACCCGGGCGAAATCATCGATTTTTAATCCTGTCCCTTTTCGTAACTGCT\n+CAATTTCGGTACAGGACGTTGTTCTGTGCGTCAGGGTAATTTTCTGCGTTTCATCTTTAAAAACAATCTG\n+TTCCAGGCTGCTCAACAGCTCATGCATTGGATCTTTATATTCCATTGAAAACTCCTCAAATCACACTGCG\n+GGATCGTGAATTGCATCGAAGCTCATTAAGAATAGTCGGGAAAAGCAGACACAGCGGGGTGAAGTCAGGG\n+CATGCTCTGGCTATGATTCGATTCAGCCTGTCATTTAGCGTGACTTATAGCCACCTAACGATCTGATAAA\n+TGCCGATATATCTCTTACCACTCCTGTTTTGTAAAGATTTCGAAAATCTAACCTTCTGCGAAGGCGTAAA\n+TCTCTGGCTACAAAAAAGGCAACGGCACTATCATTTTTTAACAATGAAACAACAAATTAACCTTGTTTCA\n+TTTTCTCCATGATTTTACCAGGAAGATTACGTAGAAAGGGTATCCTGCAAGCCTGTCCTGGACTATCCTT\n+GTCACGTCAGACACGCGTGTGTCGTTGTGCGCTTTTTTTGGGTGAAAGGAGTAAGAAAATGGCGACAGG\n+>contig-201_955\n+TGGCCCCCTTTCCAGGTGACCGTGTAATCTGAACTACCCTTTGGTATCTTCAGTGCCTGCCTGCAGGCTG\n+AGGTGTTGCCCTTACAAATGCAACAACGACATGGATTACAACACCCTCATAAACAAAGGGCAATCACCTG\n+ATCTAAGCTCTTACCTATGACAGTGATAGGTTATGCCTTTTACTCGACTTTTGCACTGACTGAAAAGGAC\n+AAATTAATGTTAAAAAAGATACTTTTACTGGCTCTGCTTCCTGCAATCGCCTTCGCAGAGGAACTTCCTG\n+CTCCAGTAAAAGCGATTGAAAAACAGGGCATTACAATCATCAAAACATTCGATGCCCCCGGAGGAATGAA\n+AGGTTATCTCGGAAAGTATCAGGATATGGGCGTCACCATCTACCTGACTCCAGATGGTAAGCACGCTATC\n+TCTGGTTACATGTACAACGAGAAAGGTGAAAACCTGAGTAACACACTTATCGAAAAAGAAATTTACGCAC\n+CAGCCGGACGCGAAATGTGGCAACGGATGGAACAATCCCACTGGCTCCTCGACGGTAAAAAAGATGCGCC\n+GGTCATTGTCTACGTCTTCGCCGATCCGTTCTGCCCATATTGTAAACAGTTCTGGCAGCAGGCGCGCCCG\n+TGGGTAGATTCTGGCAAAGTGCAATTAAGAACATTGTTGGTTGGGGTTATCAAGCCAGAAAGCCCGGCGA\n+CAGCAGCGGCAATTCTTGCCTCCAAAGATCCCGCAAAAACCTGGCAACAATATGAAGCCTCTGGTGGCAA\n+GCTTAAGCTAAACGTGCCTGCAAACGTAAGTACAGAGCAAATGAAAGTGTTAAGTGACAATGAGAAACTG\n+ATGGACGATCTGGGGGCAAATGTCACGCCGGCTATCTATTACATGAGTAAGGAAAATACGCTACAACAGG\n+CCGTGGGGTTGCCCGATCAGAAAACGCTTAATATCATTATGGGGAATAAATAAAAGGTAATTCATGGATG\n+GTTGAACTATATCCCTGCTTTTCAACCATCCTAAAAAAGCATGAATTGCTCGCTCTGCCCTAAGTGGCTG\n+TGCTATTTTAGAAAAACTTAATCCTGAGTTAAGCAAAAAAACATAATCAATAAAAATATATACGCAAAAA\n+ACATTGATTAAGTGAATATATCATGGAAGAAAAATATAACCGGAGTAGTGTATGGCCAATCTCTACGACT\n+TGAAAAAGTTCGACTTAAATCTTCTTGTCATATTTGAGTGTATTTACCAG\n'
b
diff -r 000000000000 -r a8e434ebe961 test-data/metabat.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/metabat.tabular Mon Jun 27 12:41:23 2022 +0000
b
@@ -0,0 +1,3 @@
+Ley3_66761_scaffold_6 metabat.8
+Ley3_66761_scaffold_191 metabat.8
+Ley3_66761_scaffold_505 metabat.25
b
diff -r 000000000000 -r a8e434ebe961 test-data/proteins.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/proteins.fasta Mon Jun 27 12:41:23 2022 +0000
b
b'@@ -0,0 +1,6277 @@\n+>Ley3_66761_scaffold_6_1 # 1 # 786 # 1 # ID=1_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.599\n+IIVRIDEFGERVPLTISDYDAEQGSVTIVTQAIGASTRKLCALEQGDALADFVGPLGHPS\n+EFIHEDLDTLRKKRFLFVAGGVGTAPVYPQVKWLHEHGVKADVIIGAKTKSMLIYTEEMA\n+RVADNLYIATDDGSEGFKGMVTALIKDLIDNRGKQYDVCVAIGPMIMMKFVTLTTKEYSL\n+PTVVSLNTLMVDGTGMCGACRVTVGGKTVFTCVDGPEFDGFQVDFDEAMRRQGMYRTQEE\n+RARAIEQERENGHKCRVGLDK*\n+>Ley3_66761_scaffold_6_2 # 890 # 2284 # 1 # ID=1_2;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.604\n+MANKIPRVPVREQDPKVRATNFEEVCYGYNVEEATLEASRCLNCKNPRCVAACPVNIRIP\n+DFIHQVVEGNFAAAAAVISEDSSLPSVCGRVCPQESQCEGSCVLGVKGEPVAIGKLERFV\n+GDWKIENADKMPAPDIKRNGHKVAVIGSGPSGLACASDLARMGYEVKIFEALHKVGGVLV\n+YGIPEFRLPKEKIVAREVEAVKKLGVEIETDVIVGRTVTIDELMNEEGYEAVFIGSGAGL\n+PRFMGIPGENLNGVVSANEFLTRTNLMKAYDTHYDTPIYVGQRVVVVGGGNVAMDAVRTA\n+KRLGAEATIVYRRSEKELPARVEEVHHAKEEGIEFRMLTNPTSIIGDEKGWVVGISCVEM\n+ELGEPDESGRRSPIEKAGSDFEIPCDVVIMALGTSPNPLLKMTTEGLETNRKGCLVADEK\n+GATTREGIFAGGDAVTGAATVILAMGAGRKAAKSIDEYIRQKKH*\n+>Ley3_66761_scaffold_6_3 # 2298 # 2864 # 1 # ID=1_3;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.566\n+MRKFCFAAFAAVLIGTTACTPKAPEQFTGKIVDGTMNTVTVESPADGRRVTFTTEDADMQ\n+EAYGLLLGNTATVTYRGKLGETTPALKVVTDPAYVTAIGRWVEPNPIDPEQEQGIEIRVN\n+GVAASINMLTLRYEAWELAPEGDRIILSGVSEGSGGPYPFEQTAEIIEMDGKPALKIDAV\n+VLTKKDLI*\n+>Ley3_66761_scaffold_6_4 # 3047 # 4078 # -1 # ID=1_4;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.583\n+MPRKNKKLPRHLLVIRTSAMGDVAMLPHALRALKEAYPEVKVTVATKSLFHPFFEGVDVD\n+FLDIETRRTHRGIRGAIRFAREAAELKIDAVADMHNVLRSKMVRAALHLRGIPVSVIHKG\n+RIEKYMRLGRGSEGVKPLKHTVIRYCDVFRRLGFDFPDPRPAEKRPRPNPMGEKQGIWIG\n+FAPFSAQPGKTYPEKLSAEAVRLLSGRFDRVFVHSGGGEEAEFARRMEALYPNVTALYGK\n+IKLGDEMNLISNLDCVVSMDSLVMHLASLMATPTVSVWGATHPGLGFLGYGFGQEGVLQT\n+DFACRPCSVYGKKPCKYGDYRCIWSIEPQMILDRVERLVGKTE*\n+>Ley3_66761_scaffold_6_5 # 4062 # 4667 # -1 # ID=1_5;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.528\n+MFTQNANKIFAQAIDDYHRYDDVDHQLSNPYAEGTIDHLLYMKNWVDTVQWHLEDIIRDP\n+RIDPVEALKIKRRIDKSNQVRTDMVEYIDSYLLDKYKNIDVQPGARINTETPAWAIDRLS\n+ILALKIYHMRQEVLRKDVDEAHRAACQQKLDVLLSQQVDLSTAIEELIEDIEAGRKYMKT\n+YKQMKMYNDPALNPVLYAAKK*\n+>Ley3_66761_scaffold_6_6 # 4808 # 5806 # 1 # ID=1_6;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.554\n+MNFYHKAISLAGFVLLTVLPAQAQVRQTREEYINKYKKIAVAHMERYGIPASITMAQGIL\n+ESDCGNSWLSQASNNHFGIKCKRNWTGDVVYYDDDEKGECFRSYPSVEASYQDHAEFLDS\n+QPRYDSLFSYAPNDYKSWARGLKAAGYATAPDYAQRLIRIIEESKLYLLDREDGLTIYGA\n+QTGHLTDDWFSGQSNVDQAAAIASGAVDPDDYRVTVNAHKGYNVYRTNGVNYILAHDGDT\n+FEKISRDFRISARNLRKFNDVSKNAQPVANEVIYIGRKKKRWDGNVLLHTVREGETLWSL\n+GQSYGIRTKSLARLNKLKEGDALTPGTTIKIR*\n+>Ley3_66761_scaffold_6_7 # 5825 # 6511 # 1 # ID=1_7;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.534\n+MESIPLRKKILETIVSKSTLKQKVFDNTFATFNDLKETLLEMASEMDDQLDGLLDRRVRL\n+EYRDRGKFEAQIQVANDLLIFQMHTDVFEFEPNHVIWQNPYVQTDRDNSYCGVINIYNFL\n+SDSFKFNRNADEGYLIGRIFINREKCYFVEGKQQTSMRPMQFGKAEIDSEALVRILESAI\n+YYALNFDLLLPSYDDNKRVTVDQFNTKLDNSKFVTGKRLGYDFDVDDI*\n+>Ley3_66761_scaffold_6_8 # 6536 # 8683 # 1 # ID=1_8;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.577\n+MLKKLLLLTLLGTAFAAQAEAAAPSTYRDIARLRAMNQRAQGIRPAADGKSYTTLRGNAI\n+ERHSYTKDAPGELLFEWKNDKENRDIADYQFSPDGKLLLLSIGSEPIYRHSYTTDYYLKD\n+ADGLRPILTDLSDTRDASFSPDGRTIAFSSGNNLYLYDIVGDSVRPITTDGAWNRIINGT\n+TDWVYEEECAFTKAYAFSPDGQKIAYLRFDESLVPVFEMMRYDGKLYNEAYSFKYPKAGD\n+ANSVVDLYVYDLKTGETERVDVGPDRGQYILQPEWTPDGRLCFQRMNRRQNHFEAVLCNP\n+DGTQQVIYDERSPKYVDHLNKTFYFLEDGRRFIVREETSTGYMHLYLYGIGQGVLHPITQ\n+GEWEVTDFVGLRGDKVYYISTESSPLKRDLYRVGLDGKHKERLTPGDGYYSIYPSADLSY\n+YICEGGDSSAPGRTDVFNAAGKRVRTLYDNAPLKEALAEAGLPVREFFTFTTERGDELNG\n+YMLKPLDFDPAKRYPVLLTQYSGPGSQQVAEGWGPDWEDALVTHGYIVVCVDPRGTGYRG\n+EEFKKLTYGNLGRLEVEDQISTARYMARQSYVDPARIGIYGWSYGGFMALGCAFRGEGLF\n+KMAIAVAPVTSWRYYDSIYTENFNGLPDDYPKGYDDNSPVNLAHLFRDDSTRLLIVHGTA\n+DDNVHFQNTMEMARALNKLGKQYDMMVYPDQNHSMMPDDMIHVREKMLRYTLENL*\n+>Ley3_66761_scaffold_6_9 # 8697 # 9167 # 1 # ID=1_9;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.577\n+MKNLLLHPTPIGTVGIVENGRAITD'..b'KILLFIVS\n+TAVIVVIVWGLSSTKSSNVIVEPNIASVDSIITEPIDTAKIIADQRKDSIFEGNIFAGLR\n+FGISKGEYQRLINNFKREYDNKIVFPNEKGNVLSYRISGVEPKFYRGKLYAVEVKIDNHH\n+AYYELEPVFERKYGITKNNHWKWQNAEIELSSRAPHSESVHDPTSGTGARYNIKKPGYTT\n+IRYRDLTLYNLERKEQMQNDSIKKAKEQAAREKRRQREREQADRYKENI*\n+>Ley3_66761_scaffold_90_229 # 199454 # 199642 # 1 # ID=4_229;partial=00;start_type=ATG;rbs_motif=TAAA;rbs_spacer=14bp;gc_cont=0.354\n+MSRRNDDGLGCIFGFLAIFYIFKWLTDSAEELTLKELIWIIIVCLGICLVGIVSFAIINA\n+LT*\n+>Ley3_66761_scaffold_90_230 # 199887 # 200270 # 1 # ID=4_230;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.357\n+MEQNEKNESTPETKSDNTVLENGTPKKQKSNTVNINIPLIIEIAFYVVGAILLYFAFKWY\n+NNDLELWNNSDPFMFSEKRYVGGDAYNYIISAARSSAIVTKSLIWTILGCSSIIAGRLTS\n+IQRKKCK*\n+>Ley3_66761_scaffold_90_231 # 200261 # 200668 # 1 # ID=4_231;partial=00;start_type=ATG;rbs_motif=TAA;rbs_spacer=3bp;gc_cont=0.360\n+MQVKKRTLYIICSIALLLVIGGIVYYKYSEKQAKVKALANSIERALDAYNREVEREYDRM\n+KRQYEDYIETIKDSSYSLSFRERYIHKVYDLIGYQYSYGYDAFDVWNFSYEQQKHEKQDL\n+EMLKLKATEKVQKSL*\n+>Ley3_66761_scaffold_90_232 # 200911 # 201432 # 1 # ID=4_232;partial=00;start_type=ATG;rbs_motif=AAAA;rbs_spacer=12bp;gc_cont=0.362\n+MKFKLPMFSKESLKESSGWIAFVLGLICYLFGNIVIYFQSDIALIWTKCVFWADLLISIG\n+DILLIGGVVGFLTSVAQWKGVFTEELTNVVYGKELLSKRIDVKTIWENTTKQMFKYKFHC\n+IHREILDAMSKYLPNKNEISYYDNFTEDIVVKWADRNKGLVSTTETLVFDHST*\n+>Ley3_66761_scaffold_505_1 # 222 # 2180 # 1 # ID=5_1;partial=00;start_type=ATG;rbs_motif=TAAAAA;rbs_spacer=7bp;gc_cont=0.529\n+MEQDDIFSSDFGDDEQQNANAREEVAYTEDNIVTLDWREHIRRRPGMYIGKLGDGSNFDD\n+GIYVLLKEVLDNSIDEYMMGYGKQITVDVTETTVAVRDYGRGIPLGKLIEVASKMNTGGK\n+YDSKAFKKSVGLNGVGIKAVNALSSDFIIKSVRDGQARQAVFCEGKLVSEEEPFATDEPN\n+GTYVNFTPDSTIFRDYAYREEYIVPLFKNYTFLNTGLSIIYNGKRYHSRNGLLDLLRENI\n+TKEPLYPIIHLKGEDIEIALTHANQYGEEYYSFVNGQHTTQGGTHLAAFKESVSRTLKDY\n+FGRNFEYSDIRNGMIAAIAIKVEEPVFESQTKTKLGSRDMGPDGPTVAKFISDFVKKELD\n+NYLHKNLETAEIILKKVQESERERKAMAGVTKLARERAKKVNLHNRKLLDCRVHLNDVKG\n+DEEKKAASSIFITEGDSAAGSITKIRNVETQAVFSLRGKPLNSYGLTQKVVYENEEFNLL\n+QAALNIEEGIDGLRYNNVIIATDADVDGMHIRLLMLTFFLQFFPDLVKKGHVYVLQTPLF\n+RVRNRDTVRRAKGKGKGEKKDETYYCYTDDERIEAINKLGNKAEITRFKGLGEISPEEFR\n+DFIGPDMRLDRVTLRKEDGVAELLEFYMGKNTSERQTFIIDNLVIEDDEAIS*\n+>Ley3_66761_scaffold_505_2 # 2205 # 2711 # 1 # ID=5_2;partial=00;start_type=ATG;rbs_motif=TAAA;rbs_spacer=9bp;gc_cont=0.556\n+MHTDSNDITEREAAAGRRAMFPGSFNPFTIGHQSLVDRGLELFDTVVIAAGISSKKQVSE\n+AEIIARLEPIRALYAGNPRVEVTYYTGLTVDAARRHGCKFLLRGIRNTIDMEYERSLADI\n+NRRISGIETVLLFTLPELSAVSSSTVRELQHYGHDVSEFMPNTGDSEE*\n+>Ley3_66761_scaffold_505_3 # 2784 # 3689 # 1 # ID=5_3;partial=00;start_type=ATG;rbs_motif=TAAA;rbs_spacer=6bp;gc_cont=0.530\n+MEKTDTPEKAAQAGEKTAVLLMHCPDRPGIIAILTEFINANGGNILYLDQYVDRVNSVFY\n+MRVQWDLEGFAIPAEKIRDYFDTLYAQRFEVSYNLYFTGTPQRMAIFVSKMSHCIYDLLA\n+RYRAGEWKEWNVEIPVIVSNHPDLKYVADQFGIPFEVISVTRENKPQAEAQQFALLEHYN\n+IDFVVLARYMQVLSDDFTRRYPNRVINIHHSFLPAFIGSKPYHAAHQRGVKLIGATSHYV\n+TADLDAGPIIEQDIVRITHKDTVDDLVKKGRDLEKIVLARAVEKHLQHKILPYGNKTVVF\n+N*\n+>Ley3_66761_scaffold_505_4 # 3700 # 5298 # 1 # ID=5_4;partial=00;start_type=ATG;rbs_motif=AAAAA;rbs_spacer=6bp;gc_cont=0.528\n+MKLTKYLLLLPAALLCLVDAAAKNEPLKGFDKIGYTSRIIESFYLDSIDNDKLAEEAIVA\n+MLKTLDPHSLYSNPEETKELVTPLEGNFSGIGIQFNMLNDTLIVIQTTSGGPSEKVGILP\n+GDKILSADTTMISGVKRPRNEIMKALRGPKGTRVDVKVARRNVEEPIEFRITRDDIPVNS\n+VDAAYMASPGTGYIRLSRFAETSYDEVLEALKGLEKQGMKRLIFDLEDNGGGILGAAAEI\n+AELFLDKDDLITYTESPKLGTTPYVSRQKGRYADLPVAVTVNQYSASASEILSGALQDHD\n+RAVVVGRRTFGKGLVQRPFPFPDGSMIRLTVARYHTPSGRVIQKPYERGKAEDYAADIKA\n+RYDNGEFYSADSISFPDSLKYTTLHRHRTVYGGGGIMPDKFVPLDTALYTPYYRDLMAKG\n+VFNTFCLGYTNDHRKELQKKYDTQDKFIKNFDVDDKMMGEFVAQGEKDGVPVNDNELARS\n+RTLIAAIIKGIIGRDLFDTSTYFRIVNPLLNPIYREALEIINSPEEYEKYLN*\n+>Ley3_66761_scaffold_505_5 # 5359 # 5703 # -1 # ID=5_5;partial=00;start_type=ATG;rbs_motif=AAA;rbs_spacer=14bp;gc_cont=0.429\n+MITLSGIATDMIANNLTPFEPTHPGELIHDELEASNITQAKLAESIGVSPSLINEIIKGK\n+RGVNTEMALLIEAALGIPADLLLNLQRDYNMQVAKSDASFMTRLSSIRNIAAIL*\n+>Ley3_66761_scaffold_505_6 # 5705 # 6022 # -1 # ID=5_6;partial=00;start_type=ATG;rbs_motif=TATAA;rbs_spacer=4bp;gc_cont=0.358\n+MIVEFGEKYLRDLYDKGECSDKKHRYRIDIIKRYKRSVDYLKWASCKEDLYRINSLNFEA\n+LKGNKSDRFSIRVNNQYRIEFTMRETIEEPILTICNIVELSNHYD*\n'