Repository 'fasta_to_contig2bin'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/fasta_to_contig2bin

Changeset 0:5033d753964b (2022-06-27)
Next changeset 1:67ec0d65f925 (2022-10-24)
Commit message:
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/das_tool commit 151c0e625ce20fb3ea75aa5043486e41b1da48de
added:
Fasta_to_Contig2Bin.xml
macros.xml
test-data/contigs.fasta
test-data/maxbin2.001.fasta
test-data/maxbin2.002.fasta
test-data/metabat.tabular
test-data/proteins.fasta
b
diff -r 000000000000 -r 5033d753964b Fasta_to_Contig2Bin.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/Fasta_to_Contig2Bin.xml Mon Jun 27 12:41:53 2022 +0000
[
@@ -0,0 +1,52 @@
+<tool id="Fasta_to_Contig2Bin" name="Converts genome bins in fasta format" version="@TOOL_VERSION@+galaxy@VERSION_SUFFIX@" profile="@PROFILE@"> <!-- Galaxy tool wrapper around Fasta_to_Contig2Bin.sh; the version and profile values are tokens defined in macros.xml -->
+    <description>
+        to scaffolds-to-bin table
+    </description>
+    <macros>
+        <import>macros.xml</import>
+    </macros> <!-- pulls in the shared tokens and macros from macros.xml -->
+    <expand macro="biotools"/> <!-- expands to the bio.tools cross-reference "dastool" -->
+    <expand macro="requirements"/> <!-- expands to the das_tool package requirement -->
+    <expand macro="version"/> <!-- expands to the version_command "DAS_Tool -v" -->
+    <command detect_errors="exit_code"><![CDATA[
+#import re
+mkdir "inputs" &&
+#for $i in $inputs
+    #set file_name = $i.file_name
+    #set identifier = re.sub('[^\s\w\-\\.]', '_', str($i.element_identifier))
+    ln -s '$file_name' 'inputs/${identifier}.fasta' &&
+#end for
+Fasta_to_Contig2Bin.sh
+    --extension fasta
+    --input_folder 'inputs'
+    > '$contigs2bin'
+    ]]></command> <!-- The command creates the directory "inputs", symlinks every collection element into it as IDENTIFIER.fasta (any character of the element identifier that is not whitespace, a word character, "-" or "." becomes "_"), runs Fasta_to_Contig2Bin.sh on that directory and redirects its stdout to the contigs2bin output. NOTE(review): whitespace is kept in the link name and two identifiers could sanitize to the same name; confirm the script copes with spaces in file names and that a name clash cannot occur. -->
+    <inputs>
+        <param name="inputs" type="data_collection" collection_type="list"  format="fasta" label="Bin sequences"/>
+    </inputs> <!-- single input: a list collection of fasta datasets, labelled "Bin sequences" -->
+    <outputs>
+        <data name="contigs2bin" format="tabular"/>
+    </outputs> <!-- single tabular output; it receives the stdout of the command -->
+    <tests>
+        <test expect_num_outputs="1">
+            <param name="inputs">
+                <collection type="list">
+                    <element name="001" value="maxbin2.001.fasta" ftype="fasta"/>
+                    <element name="002" value="maxbin2.002.fasta" ftype="fasta"/>
+                </collection>
+            </param>
+            <output name="contigs2bin" ftype="tabular">
+                <assert_contents>
+                    <has_text text="contig-201_2"/>
+                    <has_text text="001"/>
+                    <has_text text="contig-201_798"/>
+                    <has_text text="002"/>
+                </assert_contents>
+            </output>
+        </test>
+    </tests> <!-- one test: a two-element list (001, 002) built from the maxbin2 test fasta files; it only checks that the output contains the two listed contig ids and the element names 001 and 002 -->
+    <help><![CDATA[
+@HELP_HEADER@
+    ]]></help> <!-- the help text consists solely of the HELP_HEADER token from macros.xml -->
+    <expand macro="citations"/> <!-- expands to the DOI citation declared in macros.xml -->
+</tool>
\ No newline at end of file
b
diff -r 000000000000 -r 5033d753964b macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Mon Jun 27 12:41:53 2022 +0000
[
@@ -0,0 +1,31 @@
+<?xml version="1.0"?>
+<macros>
+    <token name="@TOOL_VERSION@">1.1.4</token> <!-- version of the das_tool package requirement; also the first part of the tool version string -->
+    <token name="@VERSION_SUFFIX@">0</token> <!-- wrapper revision, appended after "+galaxy" in the tool version string -->
+    <token name="@PROFILE@">21.01</token> <!-- value used for the profile attribute of the tool element -->
+    <xml name="biotools">
+        <xrefs>
+            <xref type="bio.tools">dastool</xref>
+        </xrefs>
+    </xml> <!-- biotools: bio.tools cross-reference "dastool" -->
+    <xml name="requirements">
+        <requirements>
+            <requirement type="package" version="@TOOL_VERSION@">das_tool</requirement>
+            <yield/>
+        </requirements>
+    </xml> <!-- requirements: the das_tool package pinned to the tool version token. NOTE(review): the yield element presumably lets an expanding tool add further requirements; confirm against the Galaxy macro documentation. -->
+    <xml name="version">
+        <version_command>DAS_Tool -v</version_command>
+    </xml> <!-- version: the version command is "DAS_Tool -v" -->
+    <token name="@HELP_HEADER@"><![CDATA[
+What it does
+============
+
+DAS Tool is an automated method that integrates the results of a flexible number of binning algorithms to calculate an optimized, non-redundant set of bins from a single assembly.
+]]></token> <!-- HELP_HEADER: shared help heading and one-paragraph description of DAS Tool -->
+    <xml name="citations">
+        <citations>
+            <citation type="doi">10.1038/s41564-018-0171-1</citation>
+        </citations>
+    </xml> <!-- citations: a single DOI citation -->
+</macros>
\ No newline at end of file
b
diff -r 000000000000 -r 5033d753964b test-data/contigs.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/contigs.fasta Mon Jun 27 12:41:53 2022 +0000
b
b'@@ -0,0 +1,10 @@\n+>Ley3_66761_scaffold_6\n+ATCATCGTCCGCATCGACGAATTCGGCGAACGAGTACCCCTGACCATCTCCGATTACGACGCCGAGCAAGGCTCGGTAACGATCGTCACGCAGGCTATCGGAGCCTCGACCCGCAAGCTCTGCGCCTTGGAGCAGGGCGATGCGCTGGCCGATTTCGTCGGTCCGCTGGGGCACCCCTCGGAGTTCATTCACGAAGATCTCGACACCCTGCGCAAGAAACGCTTCCTGTTCGTAGCGGGCGGCGTGGGTACGGCTCCGGTCTATCCGCAGGTAAAATGGCTGCACGAACACGGGGTGAAAGCCGATGTCATCATCGGTGCCAAGACCAAGTCGATGCTGATCTATACCGAGGAGATGGCCCGCGTAGCGGACAATCTCTACATCGCTACTGACGACGGCAGCGAAGGCTTCAAAGGTATGGTAACGGCCCTGATCAAAGACCTGATCGACAACCGGGGCAAGCAGTACGACGTCTGCGTGGCCATCGGTCCGATGATTATGATGAAGTTCGTGACGCTCACGACCAAGGAGTACTCCCTGCCGACGGTCGTATCGCTCAATACGCTGATGGTCGATGGTACGGGCATGTGCGGCGCCTGCCGCGTCACGGTGGGCGGCAAGACCGTCTTCACCTGTGTCGATGGCCCCGAATTCGACGGGTTCCAGGTCGATTTCGACGAAGCGATGCGCCGTCAGGGTATGTACCGCACGCAGGAAGAGCGTGCCCGCGCCATCGAGCAGGAGCGCGAGAACGGTCACAAATGCCGTGTCGGGCTCGACAAATAACTACCGATCCACACACAACCGGACGTTTCCGGCAGACGAGTATGGAGCGATGCTCTGCGTCCGAATGCCGAAGGCGTCCACAGAACAATGAAAGCAAACAACTATGGCAAATAAAATTCCGCGCGTTCCCGTGCGCGAACAAGATCCGAAAGTCCGGGCCACCAACTTCGAGGAGGTGTGCTACGGTTATAATGTCGAGGAAGCCACGCTCGAAGCGTCCCGCTGCCTGAATTGCAAGAATCCCCGCTGCGTGGCGGCGTGTCCGGTGAATATCCGTATTCCGGATTTCATCCATCAGGTCGTGGAGGGTAATTTCGCTGCGGCTGCCGCCGTTATCTCCGAGGACAGCTCGCTGCCGAGCGTTTGCGGCCGCGTCTGCCCGCAGGAGAGCCAGTGCGAAGGCTCCTGCGTTTTGGGAGTCAAGGGCGAGCCGGTGGCTATCGGCAAGCTGGAGCGCTTCGTCGGCGACTGGAAAATCGAGAATGCCGACAAGATGCCCGCTCCCGACATCAAGCGCAACGGACACAAGGTAGCGGTCATCGGCAGCGGTCCTTCGGGACTGGCCTGCGCGAGCGACCTGGCCCGCATGGGGTATGAAGTGAAGATTTTCGAAGCGCTGCACAAGGTCGGCGGCGTATTGGTGTACGGTATTCCCGAATTCCGTCTTCCCAAGGAGAAGATCGTAGCCAGGGAGGTCGAGGCCGTGAAGAAGCTGGGTGTAGAGATCGAAACCGACGTGATCGTCGGCCGCACCGTGACCATCGACGAACTGATGAACGAAGAGGGTTACGAGGCCGTCTTCATCGGTTCGGGTGCCGGCCTGCCCCGTTTCATGGGCATCCCGGGCGAAAACCTGAACGGCGTGGTTTCGGCCAACGAGTTCCTCACGCGTACCAACCTGATGAAGGCTTACGATACGCATTACGATACACCGATCTATGTCGGTCAGCGCGTAGTGGTGGTCGGCGGCGGTAACGTGGCGATGGATGCCGTACGTACGGCTAAGCGCCTGGGGGCCGAAGCGACCATCGTATATCGCCGCAGCGAGAAGGAGCTGCCCGCCCGCGTGGAGGAGGTCCACCACGCCAAGGAGGAGGGGATCGAATTCCGCATGCTGACCAATCCGACTTCGATCATCGGCGACGAGAAGGGCTGGGTCGTAGGTATC
AGTTGCGTCGAGATGGAGTTGGGCGAGCCCGACGAAAGCGGACGCCGCTCTCCGATCGAAAAGGCCGGTTCGGATTTCGAAATTCCGTGCGACGTGGTGATTATGGCGCTCGGCACTTCGCCGAACCCGCTGCTCAAGATGACCACCGAAGGGTTGGAAACCAACCGCAAGGGGTGTCTGGTGGCCGATGAAAAGGGTGCGACTACCCGTGAAGGGATCTTCGCCGGCGGCGATGCCGTAACCGGAGCCGCGACGGTCATCCTGGCCATGGGCGCCGGCCGTAAAGCCGCCAAGTCCATCGACGAATACATCCGTCAAAAAAAGCATTAAACGCTTGCAAGATATGAGGAAATTTTGTTTCGCCGCATTCGCTGCTGTGCTCATCGGGACGACGGCTTGTACACCCAAAGCTCCGGAGCAATTCACGGGTAAGATCGTCGATGGAACGATGAATACCGTCACGGTAGAGTCCCCGGCCGACGGAAGAAGGGTGACTTTCACCACGGAGGATGCCGATATGCAGGAGGCTTACGGCCTGCTGCTGGGCAATACGGCGACCGTTACCTACCGGGGGAAGCTCGGCGAGACGACTCCGGCTTTGAAGGTGGTGACCGATCCCGCCTATGTTACGGCCATCGGCCGCTGGGTGGAGCCCAATCCGATCGACCCCGAGCAGGAACAAGGCATTGAAATTCGAGTAAACGGCGTCGCCGCTTCGATCAATATGCTGACTCTGCGCTACGAAGCTTGGGAATTGGCGCCCGAAGGAGATCGAATTATCTTGAGCGGCGTATCGGAAGGAAGCGGCGGGCCGTATCCTTTCGAGCAAACGGCTGAAATTATCGAGATGGACGGCAAGCCGGCCCTCAAGATCGATGCGGTCGTTCTGACCAAAAAAGATCTGATCTAAATTGGATGCCGTTTCATATACGGCTTGGTTCGATAAAAAAACTCACGCTTTTCAAGCGTGAGTTTTTTTATCGGGTGCCGGAAATCGGGATTCGGAACCAAACAACGGAACTTCGTCGGGAAGGAGTGCGGAAACAGGTAAAAAATGGGAGCAAAGGGAATCGACGAAACGATAAGCCGAAATTACTCCGTTTTACCGACCAACCGCTCGACCCGGTCGAGGATCATCTGCGGTTCTATGCTCCAGATACAGCGGTAATCGCCATATTTACAGGGTTTCTTTCCATATACGGAGCAAGGTCGGCAAGCGAAATCGGTCTGCAAGACACCTTCCTGTCCGAACCCGTAACCCAGAAAGCCGAGCCCGGGATGGGTCGCTCCCCACACCGACACGGTGGGCGTAGCCATGAGCGAAGCCAGATGCATCACCAGCGAATCCATCGACACCACGCAATCCAGGTTGGAAATGAGGTTCATCTCATCCCCCAGCTTTATCTTGCCATACAATGCCGTGACGTTCGGATAGAGCGCCTCCATGCGGCGGGCGAATTCGGCTTCCTCTCCGCCGCCGCTGTGGACGAAAACCCGGTCGAAACGCCCGCTCAACAGACGGACGGCTTCGGCGCTCAACTTTTCGGGATAAGTCTTGCCCGGCTGGGCGGAGAACGGCGCGAAACCGATCCATATACCCTGTTTTTCTCCCATGGGATTGGGTCGGGGGCGTTTCTCGGCCGGCCGGGGATCGGGAAAGTCGAATCCCAAGCGACGGAAGACGTCGCAATAACGGATGACGGTGTGTTTCAAAGGTTTCACACCTTCCGAACCGCGTCCCAGCCGCATGTATTTTTCGATCCGCCCCTTGTGAATTACCGAAACGGGAATCCCCCGCAGGTGGAGTGCCGCACGCACCATCTTCGAACGCAGTACATTGTGCATGTCGGCCACCGCGTCGATCTTCAACTCGGCCGCTTCGCGGGCGAACCGAATGGCGCCCCGGATACCCCGGTGCGTGCGGCGGGTTTCGATATCCAAAAAATCGACATCCACCCCTTCGAAAAAGGGATGGAACAGCGATTTGGTCGCAACGGTCA
CCT'..b'TCGTGTCAAAAATGTCGCACTGCATCTATGACCTGCTTGCCCGCTACAGAGCCGGTGAATGGAAAGAGTGGAATGTGGAGATACCGGTGATAGTCAGCAACCATCCCGACCTGAAATATGTGGCCGACCAGTTCGGCATACCGTTTGAGGTAATATCCGTTACCCGCGAGAACAAGCCGCAGGCCGAAGCGCAGCAGTTCGCGCTGCTTGAGCACTACAATATCGATTTTGTAGTTCTTGCCCGCTACATGCAGGTGCTGTCAGACGATTTCACACGCCGTTATCCCAACCGGGTAATCAACATACACCACTCGTTCCTGCCCGCATTCATCGGGTCGAAGCCATATCATGCAGCCCACCAGCGCGGAGTAAAACTCATAGGAGCGACAAGCCACTACGTGACAGCCGACCTTGACGCAGGTCCCATCATAGAACAGGACATCGTGCGCATCACTCACAAAGACACAGTAGACGATCTGGTGAAGAAGGGTCGCGACCTCGAAAAGATTGTGCTGGCGCGCGCAGTCGAGAAGCATCTCCAACACAAGATATTGCCGTACGGAAACAAAACGGTGGTATTCAACTGAAAAAACCGATATGAAATTAACAAAATACCTTCTTCTGTTGCCCGCGGCCTTACTATGCCTTGTAGACGCCGCGGCCAAAAACGAGCCTCTCAAGGGCTTTGACAAAATAGGCTACACAAGCCGTATTATCGAATCGTTCTATTTGGACAGCATCGACAATGACAAACTTGCCGAAGAAGCCATCGTAGCGATGCTCAAGACGCTCGACCCGCATTCGCTATATTCCAATCCGGAAGAGACCAAGGAACTGGTAACGCCGCTCGAGGGGAATTTTTCGGGGATAGGCATCCAGTTCAATATGCTCAACGATACACTTATAGTGATACAGACCACCTCGGGAGGTCCGTCGGAGAAAGTAGGAATACTCCCCGGCGACAAGATACTGAGCGCCGACACGACTATGATATCGGGAGTAAAACGCCCGCGCAACGAGATAATGAAAGCTCTCCGTGGGCCGAAAGGCACGCGTGTAGACGTGAAAGTGGCGCGCCGCAATGTGGAGGAGCCGATAGAGTTCCGCATCACCCGCGACGATATACCGGTCAACTCGGTCGACGCCGCCTACATGGCGTCGCCCGGCACAGGCTACATACGTCTGTCACGTTTCGCCGAGACATCATACGACGAGGTCCTCGAGGCTCTCAAAGGACTGGAAAAGCAGGGTATGAAACGCCTTATCTTCGACTTGGAGGATAATGGAGGCGGCATACTTGGAGCAGCAGCCGAGATAGCAGAACTCTTTCTCGACAAGGACGACCTCATCACCTATACGGAGTCGCCAAAATTAGGCACAACGCCTTACGTATCGCGCCAAAAAGGGCGCTACGCCGACCTGCCCGTGGCCGTGACCGTCAACCAATACAGCGCATCGGCATCCGAGATACTCTCGGGTGCGCTTCAGGACCACGACCGCGCCGTAGTAGTGGGGCGCCGCACGTTCGGCAAAGGCCTTGTGCAAAGGCCGTTTCCGTTTCCCGACGGATCGATGATACGTCTGACTGTCGCACGCTACCACACTCCCTCCGGTCGCGTCATACAGAAACCTTACGAACGTGGTAAAGCCGAGGACTATGCGGCCGACATCAAGGCCCGTTATGACAACGGCGAATTCTACAGTGCCGACAGCATATCGTTTCCCGACTCGCTGAAATACACGACACTGCACCGGCACCGCACGGTATACGGTGGGGGCGGCATAATGCCCGACAAGTTCGTGCCCCTCGATACCGCGCTTTATACGCCCTACTACCGTGACCTGATGGCGAAAGGAGTATTCAATACCTTCTGCCTCGGATACACCAACGACCATCGGAAAGAACTGCAAAAAAAATATGATACGCAGGATAAATTCATCAAGAATTTCGATGTCGATGACAAGATGATGGGAGAATTTGTGGCGCAGGGG
GAAAAAGACGGTGTGCCTGTCAATGACAACGAGCTTGCCCGCAGCCGTACTCTTATCGCCGCCATTATAAAGGGAATAATAGGGCGCGACCTGTTTGACACATCGACCTATTTCAGAATAGTTAATCCGCTGCTCAACCCCATCTACCGCGAAGCATTGGAGATAATAAATTCACCGGAAGAATACGAAAAATATCTGAATTGAAATCAATAGAGCAGGGGTGTAGCAAAAGTGCTACACCCCTGCTCTATTGATTTCAATATCTTATAATATCGCAGCGATATTACGTATTGATGAAAGGCGTGTCATAAATGAAGCGTCAGACTTAGCTACCTGCATATTATAATCGCGCTGAAGATTGAGGAGCAAATCAGCCGGGATACCCAATGCCGCTTCAATAAGAAGTGCCATTTCCGTATTAACGCCTCTCTTCCCTTTAATAATTTCATTAATGAGGGAGGGACTTACTCCAATACTTTCAGCGAGCTTTGCCTGAGTAATGTTACTTGCTTCAAGCTCATCGTGAATAAGCTCCCCCGGATGGGTAGGCTCAAACGGAGTCAAATTATTTGCTATCATGTCGGTGGCAATGCCCGAAAGTGTAATCATATCAATCGTAGTGGTTTGAAAGTTCAACAATATTGCAAATGGTCAAAATCGGTTCTTCAATAGTTTCGCGCATGGTAAACTCTATCCGATACTGATTGTTAACTCTAATAGAAAATCGGTCGGATTTATTTCCTTTCAAGGCCTCGAAATTTAAAGAATTAATCCGATACAAGTCTTCTTTGCAAGAAGCCCATTTAAGATAATCAACGCTACGCTTATAGCGCTTGATTATATCAATCCTGTAGCGATGTTTCTTATCGCTACATTCTCCTTTATCATAGAGGTCTCTCAGATATTTTTCCCCGAATTCTACTATCATATATTTATATTACAGGACAAAGGTATGAAAAGTATTTAATTCTTCACAAAACTGTGAAGAATATTTTCAGAATGCACCCCATGAAAGATTCTTCCGCCACAATCCGAAATTACAGTGCATATTCCACTTCCCATTTAATATCGCTTTCCGCGGTTAAAAACCGCGGCTATTATAACATCCTATTAATCAATTACGTAGTAGCCGCGGTTTCTTTGCATAGCAAAGCGCCAAAGGCGATGATTAACCGCGGACAATAAAGCCTGCAATTGTCATATTGTCATGCACTGCGATTTCGGATTGAGGCATTCTTCCGATTCTCATAAAACGAAGGCGAAGGCAATCGCAGTATGCGGTTGCCTTCGCACGATTGACACGGTGGGTACTGTCAGCAGCGGCCACCGTGCCGCCTATCACACTTTATTACCCTATCTAATGGTCGATTAAACCGCCTGTCAATCAATCCGCCTTATCGTTAACTTACCGCACCGACAAGGCCGATCAGTACACGATTATAGTCGACAGGCTGAAAAACCAACCGCTTTTTCCTTCTAAAAAACATGAGACAACCCATTTATTATCCCATAGCCATTACCCTGAGAAACCATCAGTACCGGTCCCGAATACGCTTTTATATCTGCACTACCCCAATCAGCTCCATGATAATGAAACCAACACGTTAATTCCAGACATTGCATCAAATAGTTGAAAATAAAATAAGAATAACTGAAATGTCAAGGACGAGTATTAGCTATCATGAGAGATAAAAGTATTATATGCACTAAATTGCTTTCAACATGCGTAATGCTCAGTAGCAACGGCTCGCAAATGTAAAAATTTATTTTTAAACAACAGACAAATTATTTACTAAAAAACTGATAAAATCGCCCGAATTAATGTTAAACTTTGTAAAATCACCTTTCAACATTTGATTTATGGATAAAATTTAACTAAATCGAGGGTTAAATGACACCTACCAACGCCCACATCGACAGATGAGTAAGCAACATAAGGGCGATAATAATCCACGTCATGACTGTCCGCCGGCCATAA\n\\ No newline at 
end of file\n'
b
diff -r 000000000000 -r 5033d753964b test-data/maxbin2.001.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/maxbin2.001.fasta Mon Jun 27 12:41:53 2022 +0000
b
b'@@ -0,0 +1,8225 @@\n+>contig-201_2\n+TAACCAGACGGAACGGTATCTGATGGCCACGGGATTGGTGCACCGACTGGATAAAACTCTGCAGGAGGAT\n+GAGCCGAGGTGTAAAGCTGCGCCCACGGCGACCAGTTTGCGTCGGTCGTATCCCGTCGTGAACGAATAAA\n+TGCCGGAGCATGAGCACCGCTTGTACCACTCCAGCCGATGAGTAACTCACCTTCGCCAACGGCTGTCATC\n+CCTTTCAGGTGAATGATATTTCCATACGCTGTTGGATATCCGTTGTTATACACCTCGTATAACTCAAGAC\n+CTGCTGCCCCCTGCGTATTGTCTGTCAGCGCGGTTATATTCACTCAGCAACCCCGGTATCAGTTCATCCA\n+GCGCGGCTGCTTTGTTCATGGCTTTGATGATATCCCGTTTCAGGAAATCAACATGTCGGTTTTCCAGTTC\n+CGGAAAACGCCGCTGCACCGACAGGGGGATCCCGTCGAGAATACTGGCAATTTCACCTGCGATCCGCGAC\n+AGCACGAAAGTACAGAATGCGGTTTCCACCACTTCAGCGGAGTCTCTGGCATTTTTCAGCTCCTGTGCGT\n+CGGCCTGCGCACGCGTAAGTCGATGGCGTTCGTACTCAATAGTCCCTGGCTGGAGATCTGTCTCGCTGGC\n+CTGCCGCAGTTCTTCAACTTCCCGGCGCAGCTTTTCGTTCTCAATTTCAGCATCCCTTTCGGCATACCAT\n+CTTATAACGGCGGCAGAGTCATAAAGCACCTCATTACCCTTGCCACCGCCTCGCAGAACGGGCATTCCCT\n+GTTCCTGCCAGTTCTGAATGGTACGGATACTCGCACCGAAAATGTCAGCCAGCTGCTTTTTGTTGACTTC\n+CATTGCACATTCCACGGACAAAAACAGAGAAAGGAAACGACAGAGGCCAAAAAGCTCGCTTTCAGCACCT\n+GTCGTTTCCTTTCTTTTCAGGGGGTATTTTAAATAAATACATTAAGTTACGACGAAGAAGAACGGAAACA\n+CCTTAAACCGGAAAATTTTCATAAATAGCGAAAACCCGCGAGGTCGCCGCCCCGTAACCTGTCGGATCGC\n+CGGAAAGGACCCACAAAATGATAATAATTATCATCTACATGTCACAACGTGCATCTACGCCATCAAACCA\n+CGTCAAATAATCAATTATGACGCAGGTATCGTATTAATTGATCTGCATCAACTTAACGTAAAAACAACTT\n+CAGACAATACAAATCAGCGACACTGAATACGGGGCAACCTCATGTCAACGAAGAACAGAACCCGCAGAAC\n+AACAACCCGCAACATCCGCTTTCCTAACCAAATGATTGAACAAATTAACATCGCTCTTGAGCAAAAAGGG\n+TCCGGGAATTTCTCAGCCTGGGTCATTGAAGCCTGCCGCCGGAGACTGTGCTCAGAAAAAAGAGTTTCTT\n+CTGAAGCAAACAAAGAAAAGAGTGACATTACTGAATTGCTCAGAAAACAGGTCAGACCAGATTGAAGCAA\n+TTTAGATAATCGTGCAGACTACGCCCCCTCATATCACATGGAAGGTTTATCTATGGATCAGGTAGTCATT\n+TTTAAACAAATATTTGATAAAGTTCGAAACGATTTAAACTATCAATGGTTTTATTCTGAGCTAAAACGTC\n+ACAATGTCTCACATTACATTTACTATTTAGCCACAGAGAATGTTCATATTGTATTAAAAAATGATAATAC\n+AGTGTTATTAAAGGGCCTAAAAAACATTGTGTCTGTCAAATTTTCAAAGGATAGGCATCTTATAGAAACG\n+ACCTCTAATAAGCTGAAATCCAGAGAGATCACATTTCAGGAATACAGAAGAAACCTTGCTAAAGCAGGAG\n+TTTTTCGGTGGGTTACAAATATCCACGAACAAAAAAGATATTACTATACCTTTGATAATTCAT
TACTATT\n+TACTGAAAGCATCCAGAAAACTACACAGATCTTACCACGCTAAACCATAACGTCCGGCTTCTCTCACTCC\n+TGAGCCGGACTGCATTGGTTTAATAAAAACCATCAACAATTGTGATTTAGATATTCGGAACCATTCAAAT\n+ATAACAAAACCCCGTAAAAACGAGGTTTATGGATAAATTTTATTATTGAATACATCAGATTAAATTAATC\n+TTGACATCATAGCTTTCAAGACCCGTCATTTTTTCCCGTGCGGTAAACTGAATACTGGTAACTTCTTTCC\n+CGGTCTTTTTCTTAAGTTCAATAATTTTTTTTGTTATATATTCAGAAATATCTGCTTCTGCTTTTGTTTT\n+TAAGTTTTCAATATTCATCATTTCCTCTTTTAGTCTGTTATGACTTTCCAGTTACACAGTAAGTCGATTA\n+TATGGTGCAAACGTGTAAAAGATAAGATGAAACATCGCAATAATCAACATACGATAGTCTAAATTTTACA\n+CAAACAGACAAAGAGAATTTTCCTGAATTATCAATGCAATAGCATCAAATCAACTCAAGAGCCTTATTGC\n+TGCTTCCAGAATTTCTTCTGAAGTAACATGTCGATCCGCGGCTACATAAATGACTTTATGATCTCCGGTC\n+AGAGATGGAAACCCTGCGGCCATTACAGTAAGGTGTGTTTTTTCGCCATTTGGATATTCACGCATGATGG\n+TGTTAACTCCAGTCATCGCTGGCACTACCACTGCTGGTTCAGAGTTAAAAAAACTATGATTTTTTTCATG\n+ATGTTACCGTAGTATGTGAGTATCCATCGAATAGACACCAAGCAAAAAAGCTCCCGAAGGAGCCTTCATT\n+TTCACTTTTTTAAATCCAACGACAGACGGCTGGCATTTAAGTATTGTGAAATATTATCAAATGTAATCAT\n+CATTGATTTACAAAAGATACATTTTGCCCCGAAAGGATTCATGTCAGAAACATCAAAAGATGATGTTCTA\n+TACTGGGAACCATGACAACACGGGCATCTAAAGTGAATATGGTTTGTAATATTGTCTACCTCAAAGCGCC\n+ACTACATGAACAGCGGCAGGACCTTTAGGTCCGTTCTCAATACCAAATTCAACTTCCTGATTCTCAGTTA\n+ATGTTTTGAAATCGTTGCTCTGAATTGCTGAGAAATGGACAAACACATCTTTGCTGCCATCTTTCGGCGT\n+GATGAAACCAAAACCTTTTTCAGGGTTAAACCATTTCACTAAACCAGTCATTTTGTTAGACATAATTATT\n+ACCTTTTGAAGAAATTAGCCCTTGGGCAGAATGGTCCGAAAAAAAATATCAGAGAGAAAAACCAACAAGG\n+AAATCTCAAGAGGTACAAATAATAAAATTATAACAATGACTGCTTCAGATAAATTTGTAACAAACCAGAA\n+CACCATTAACGCATGATTAACCACCCATAGCAAGGATTACTTTTGTAAAGAAAAACACAGCAATGAAAGA\n+ATAGCTTTATTTATTAATAAAACGTGTCATTCTGATTAAGACCTTTTATCTTACCCTTAAGATTTCAGGA\n+ATTTTGGCTCATGGAAGAGTCCTTTTTATTTAAATTTTACATTCCGCGATGTAAATGTTCCGATTTAATA\n+TTACCCTACATTTGATGCTTTTTATCTCTTAAAGATTCATAGATCTGTTGACAAGTCACTCCTGCGATGT\n+AGCGTTCGTCAGCAATTTCAGCATAAAGCTGAGCTTCTGCTGCAATATCTCCGAGCATGTTGGTGAGCAT\n+TCCTTCGGCGGTTTTGGTTGTTTTGCCTCTGACGGCAGCGGCAAGATCTGCGGTATGCTTCGCTGCGTCA\n+AGGCGTATGGCATATTTTTTTGCTTCGGCACGCAACTGGTTAACACTATCAGACAGATAAGCAGCCCTGG\n+CAGAAATTTCAGCAGATTT
CTGTTGCGCATCTTTAACAGCCTCATCACGGGCTATAGTTCGCCCCTGTTC\n+AATT'..b'GATGTATAACACCAAAACTTGCTATGCAGAAATTTGCACAGTGCGCAATTTTC\n+TGCATAGCCGCTCATTCTCCTTATAAATCCCCATCCAATTTATCCCTTCATATTCAATTAGTTAAATAAC\n+TAAATCCAAT\n+>contig-201_954\n+AATATTGCCAGTAGATTATTATCTAATCAAACATACTTTCCTATAATTCACAATTATAATTCAGGTGAAT\n+AAAAAAAGACCATGAAATATATAAATTGTGTATATAATATAAATTACAAATTAAAACCACATTCTCATTA\n+TAAATAATTATATGATGAAAAAACGGTATGAATTAATACTCAAATAAATAAAGCAGAGCTTAAACATAAC\n+TCTGCTTTATAATTAAAGGGACAAAATAATTTTACATCTGTTACTGTTTCGGTCGCAGATTCTCATCAAA\n+TACCAGGCGTTTCCTGCCAGGTTCAATTTCCCGCAATGGCTCGACTTGATGTAACGTCTGCTTACAGCGT\n+GTCACCAGCACCTGGTACTCATGCGTACCCTGCTTTTTCCATGCCAACTCCTGCTCACTGAGTTCACGAA\n+TCGCTTTCGCCGGGCTGCCGACAATCAGGTAATTAGCTGGCATTTCTGCTTTGGCTTTCACAAATGCGGA\n+TGCACCAACAATGCTGTTCTCGCCAATCACCGCACCGTCCATCACTACCGCGTTCATTCCCACTAATGCA\n+TTGCGGCGGATAATGCAGCCGTGAAGGATAGCGCTATGACCAATATGTCCATCTTCTCCTACAACAGTAT\n+CCTGCTCGGGAAAACCGTGCATAACGCAATTATCCTGAATGTTCGCGCCATCTTTCACCACGATACGACC\n+AAAATCGCCACGCAGGCTGGCATTTGGCCCAACGTAAACGCCCTTGCCGAGAATAACATCGCCGATCAAT\n+ACCGCTGTCGGATGGACAAAACTCTCTTCTGGCACAACCGGAGTCAGACCGTCTATCTGATAAATTGGCA\n+TAACGCCTCCTGTTCAATATTCAAGCCGCCAAAACGTTGAAAATACAGGCTTCCCGGCGCAGGCAGTTCA\n+CCGACCGAGGTTTCACCTTTTTCACTAACGAACGCTAAAGCAGCAGGCGCTACGCGCTGATAAATGTTGA\n+TACACAGCTGACGCGCCGTATGCCCTGCCCAGTGTGCCGGAAGCAACTCCTCCGGCAACAATGGGTCTTT\n+AAGGACGACACGGCGATAAAAATGGATCAGTAAAAGCTGAATATGAAATGCCCGCTCCGGGGTTAACTCG\n+TCTGCCGCCTCTTTTAAAAGCGGCACCAGCGGGCGGAATGACTGAATAAAGGTTTCGTACATGGCATTTT\n+GTTCAGTTAAATGCCAGCACTCTTCTACTCTGGCACGCAGTGCTGCGCGAGAAAG\n+>contig-201_956\n+GTTCGGGATGTTTCACTTCATCAATTAGAGTTAGTGCATCATTAAGACCAAGGTAATTCTGTGTCGAATA\n+GCGATAGGCCGCGATATTCAGTGAAGTACTTGTTTCTTCGAATAACTTGTTCCAGGAAACACGATAACTT\n+TGCCCCTGGTATGTTTTATCATCCGGGATACGAACATTGGAATGAGTCACATCGAAAGAAAATGCACCAA\n+CTGAAGTATTCAGACCAAGACCTAACAAACCAGCGGTATAGTTATTATCGGTTATCTGAATACCGGTATA\n+ACCCGTCAGATAGTTATTCAGGCCGTAGTAGTAGCTTGCTTGAAATAAATTAGGCTCATCCTGAATATCA\n+TCTTTTAAGACCTGACCGCCGCTAATATCCCAACGTCCAACGCCAGGGCGTAACATTTGAACAACGGATG\n+AGAAAGGTTGCGAGAATGTCCG
CTTTGAGCCATCGGATTCTTCGATGGTAACAATAAGATCGCTGCCGTA\n+CCCTGACGGACTCAGATCATCAATGACGAAAGCGCCTGGCGGCACCGTCGTTTCATAAATCTTATAGCCA\n+CCTTGCGTAATAGTGACTTTGGCGTTGGTATTGGCAACGCCATGAATGATAGGCGCAAAGCTGGCTAAAG\n+TCGGAGGCAACATGCGGCTGTCACTGTATAAACGAATGCCTCGGATACTGACGGAATCAAAGGTTTCGCC\n+CGTCGTATAAGACTCACCAAGAATGAGTTGAGAACGCAGCGAGGCGATATCACGCTGAACATACCGATTC\n+TTAAAATCATAATTACTGCCAGAATCGGTCATCCAGTTGTAGTTGCCCGAGGCACGCAGTCGCCATGCAC\n+CTAAATTCATCCCACCGTTAAATGCAGCATAAATGCTTTCATTTTTTCGACCAGGGGTTTCACTATGATA\n+TCCGTTGAGGTTGTATGACAACATGGCCGCATTAATGCCGTTTTCCCATAACGATGGATCAACATAGTTT\n+TGGTAATTTTTCATTACCCAGGCTTGAGGAACGTCTATATCCAGACGTTGATCGTTAACGTCATAACGAA\n+CAGAAGCCTGAGGGATAATTTCCGTCAAATTGAGGCAATTGCCGAGCGTTTCATCCCTGGCAAGCAGAAC\n+GGCTTTTTCGTTATTTATATCGGGAGAATTAATATGAAACTGCAATAAATTCTTTAATGTGATACAAGCC\n+TGGGCGTTCTTTTTTCCTTCAATTGCGACAAATGTAATACTTTGGTTAAT\n+>contig-201_962\n+CCGGCTCGCGTTTGCCAAGATCCAACTCATTGAAGGCATAACCATGACGCTCAAGCAGTTGTGCCTCTTT\n+GATGGTGAAATCACCATGACGAGAGAATCCACGTGGATAATGTTTATTGTCGAAATATCGATTAGTCGTC\n+GTAAAGCTTTCCGCCATCCTGCACGCTCCTAATTCTTTGACCGAGCTAGTTATGGCGCGGAGTATTAGTT\n+ACGCTTGACAGAGTGTAAAACAAAACATTTAAATCATAACGACAAATAATTTTGCGGAGAGCACTGTGGA\n+TACGGAATTGTTAAAAACTTTCCTGGAAGTTAGCCGAACGCGTCACTTTGGTCGAGCGGCTGAATCGCTC\n+TATCTGACCCAGTCAGCAGTGAGCTTTCGAATCAGACAACTGGAAAATCAACTGGGTGTGAACCTTTTCA\n+CCCGCCACAGAAACAATATCCGTTTAACCGCTGCCGGTGAAAAACTACTGCCTTATGCAGAAACGCTCAT\n+GAGCACCTGGCAGGCCGCCCGTAAGGAGGTGGCGCATACCTCACGACATAACGAGTTTTCTATCGGTGCC\n+AGCGCCTCGTTGTGGGAATGTATGCTTAATCAGTGGCTGGGACGCTTGTATCAAAATCAGGATGCCCATA\n+CAGGCTTACAGTTCGAAGCGCGAATTGCCCAACGGCAGTCTCTGGTAAAACAGCTGCATGAACGCCAGCT\n+TGATCTTCTTATTACCACTGAAGCGCCCAAAATGGACGAATTTAGTAGTCAGTTGCTGGGATATTTCACT\n+TTAGCGCTTTATACCAGTGCCCCTTCAAAACTAAAGGGAGATCTTAATTATCTGCGACTTGAGTGGGGGC\n+CAGATTTTCAACAGCATGAGGCAGGTTTGATCGGTGCTGACGAAGTGCCCATTCTGACAACCAGTTCTGC\n+TGAACTGGCACAGCAACAGATTGCGATGCTTAATGGTTGCACCTGGCTACCCGTCAGCTGGGCGCGTAAA\n+AAAGGCGGCCTGCATACCGTTGTCGATAGCACAACACTTTCACGGCCGCTTTATGCCATATGGCTGCAAA\n+ATAGCGATAAAAATGCGTTGATTCGCGATCTTTTGAAAATTAACGTGCTGGAT
GAAGTGTATTAATATGA\n+ATGGCTGGCAAGGATGCCGGTAGAAGGATTTACTTCGGAGAGGGTTATTTCAGATAAAAAAAATCCTTAG\n+CTTTCGCTAAGGATGATTTCTGGCAGG\n'
b
diff -r 000000000000 -r 5033d753964b test-data/maxbin2.002.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/maxbin2.002.fasta Mon Jun 27 12:41:53 2022 +0000
b
b'@@ -0,0 +1,2186 @@\n+>contig-201_29\n+GAATTAGTTAAAGTTTCAGTATCGATATCTTTTACCGTATATGTTGGGGATACTATTTGTATAGATTTAT\n+GATGATTCGGGGACCAAATTAAATGCGAGGGATATTCCGGAGTACGTGAATTAGGGTAAAATGCAAGCGT\n+TGGTTTATGATAAGCCGCAGCGATATGAACAAGAGCTGTATCAACAGAAATGACAAAATCACTATACTTG\n+GTCAACGCAACGGTATAAATAAACTCATCAAATGGTAGTGTTTCGATTTCAAGTATTGGTATTGTCAATA\n+AATCTTGCGGTAACCCGGTAAATATAATCCGATAATTTTCAAAGTGTGTTTTCACTTCTTGATATATAAC\n+TTTTATTTGCTCAAACGTAAGACGGCATATTTTTTTTGCACCTAATGGATTAATAATGACTATTCTTGTA\n+TCTCCAATAAATTCTTTTATTTTATCTTCAACATCTACTGGTAAATGCAAGTCGTAGTTGGTGGAAAATT\n+TACCCTCACCATAAATATGCTTCAGTATTTCTATTGCTCGTGTACTCATATGTTCTTTTAAACATTCATC\n+GTGGGGATGGTAAAATGAATAGTAACGCTTATACCAATGATCAAAACCCAGAATGTAAGAATCTTTTAAA\n+CTTGATAATATTAAGCTATGCTTAAATGAGGGCATAGTTTCAAAGGGGTCTAATACAATATCGAACTGTA\n+AATCCCGCAGATGCTTACATAGAGTAAGCATTTCAAGAAAACCGGTTGATTCTTTAATACAGAACTCAAA\n+TATATTTTTATTATTAGAGAGAAATTCCCCACCCTTTCTATTTGTGAGAAGAGTTATTTTAACCCCTTTA\n+CTATAAAGTTCACGATAAATCGAACTTAATACAATTAGATCACCAAGTTTATTATTATCATGAATAATAA\n+GGCATGATTTAACTTGTGCTGGATCTGTAATTTGATTATTTATTTTATTACGAAATAAAAAAGAAAGGAA\n+ATTAATCTTGATTTTGTTTATATAAAATCTTTTCTTTTTGTGAAAAGTTCCTAAGCGCATTTTTATACCA\n+TATTATTTTAGTTTCAGGATGATTAATTAGCATAAGAATCGGTTGAAGTTCTATATTGCATTTTTTTTCT\n+TGTCATATCTTTTGATTCTTCTGCACTGATGTCTTGAAGTTTAATAAATGGAATTACATCGTAAGAAATA\n+GCTGTATCATCTGATAAATTATAAATATTAATATCTTTTACATTATCATGCATAAAACGAAAAAATGGCA\n+ATATTTTGAATAAATCCCTACTTAATTCCGAGGGCATGGGATTTTTATTCTCATCATAGAAACGAGAACA\n+GCTACCCGTTAAATCAAGACCAGAACAAATAATCCGCGCATACTTAAGTGAATATGCGATTTGAATTGCA\n+GCAAAGGCAATAGTATGGCATGAGCAATAACCAAGACTAATGTCCTTGCAAAATCCAACCAGACGACCTT\n+TTTTAGACAACGGTACAGAGATCAGCAGTTCTTTGTGAATCTGTCTCAAAATATTAAATTTAATCTTCTT\n+TATAAAACCACCTTTTTCCCGACGGTAAAAGGACCGTAATACGAGGCAGTTCTGGAGGATATAAAGTTTA\n+TCTTCTTTGGAAGCGTGTTCATAAACGTCAACGTTTACTATGGTATAACGACTTCTCTGGCTAAATTTAT\n+AAAAATCATCACGACGCTGATGTAAAAATCGGACATCTGTAAGTACATATATAAAAGGAACGATATTATT\n+ACTTAACAGATATTGCGCAGAACCATTGACAGCAATAATATCCTTTGTTCGTAATACTGACAAAGGTGTT\n+TTTTGCGATGTAGGGCCCGAAAGAAAAATAATAACATCATCAGATATTTTATTTTCAATCAG
GTTTTCAA\n+CATCTTTTTTGTCAATGTATCTAATATTCTTCATGATAAACCTGTGAAATAAATAACTCCGCTTAAAACT\n+GTCCTGGTGAAGACATGTAATTGTGGGATTTTTTTTAGCGCGCTGGTTTCCCTTTCAAACGCCGCATAAA\n+ATTGCGCATTTTTTTACGATATACTAAAAGATAATAGCCTAGATCTCTAATCTCATTTTTAATACCGTAA\n+TGACGCTCTAAGTCAATACGATCTTTCGCTTTACGCTGCGCTGAAGCACGCTTTCCGGAGAGATCGATAA\n+TTCGAACCTCACCATTTTTTATAATGAAGTTACCACGATGGGGGTCGCCAGAAACCATGCCATGTTGATG\n+TAAGGCATTAATTGATTGCTGAATTTTATTTTTTAGCGCATCATCAATATCGGGCATATCACACAACTCT\n+ATGCCATCAATATACTCGATGATCATGATATAAGTATGGACAAAACGTAAGGTTTTCCGTTCAGCCAATA\n+AATAAAAGTCATTGAGTGTATTTAACCCTTCATTTCGTACTTTTTGGGTTTGCTCAAAAAGGCGTTCGTA\n+ATAATCACCTTTTAACAGAGACTTAAAGAAACGTTCGTTACGCTTAACTTTCGGAGAAAAAACCTTAAGA\n+ATCAATTTACCGTAATCGGTATCAATAAGCATAACTTTTGTATCATCAATAGAACGAAAAACCTTGATGA\n+TATTTATATTATAAGACAAGAAGTCATTTAATACATTGAGGTACTTTGAATTGTTTTCATCGGTAAAAAC\n+AACCAAGTCTTTGATCTTGCTCTTCTGAATCATAATAAACCAGTTAAATGTTATTTACGGTAATATTTTC\n+GGCAAAGATAACAGACTCCTGCTATAATTCCTGAGATATAATGATGTTGCACTAAAAGATGTTTATATCT\n+TTTTTTAAATTCAATAATTGATTTCGCATCTCGTGGAGAGTCATCTTTCCAGGGGGAATTTTCTAAAGCT\n+ATTTTATAGTATTTTACCGATGGATAAATTGCCCATTTGTGCCACGGTTTAGTTGCACCTGTATAATGAA\n+TAAGAAGAGTACTTTCTGTAATCAGCTTTTTATAGTTTTGATGTGTTTTGTCTTTTAATTCACTTTTAAT\n+TGTATAAATTGTATTGTACTCACGAGGCAAAAATAATGTCATCCCTTTCAGTAAGACATTCATAACATCC\n+TGATCAGGGTATTTATAAACATTATCTTTACTCATAAGAATAGACAACGCTTTTTCTGTTAGTTTTGCGT\n+CAGCCCATTTTTTTAAGTCTAAATAAACGACACCGGAATTAAAGTACTGCCCAAGTAATTCAGGATCAGA\n+CAACCTGGATACCGCCTTTTCTTGCATTGGCTCAACATCTTTAACAACAGCAGCAACCGCTCCATTTAAA\n+CCCAGATGTAATAGTTGGCTAATATCGCCTTTACAAACAACATCTGCATCAAGATAAAGCAAACGATCAA\n+GCGTTAAACCCAATAATTGAAATGCAAATAAACGGAAGTACATTGCTCTTGACCAGACCTGTGTACAAGG\n+CAAGCACTGGAGCTTATCAGTGTTAATTCTATATAACGTGATTCTTAATTGGTTTTGCTCTGCAAGCTTT\n+GCAATTTTTTGAAAAAAACCATCATTATAAACATCAGCAATAATATAAAAATCAAGATTAATATGTCGAT\n+TATTTAGGACAATTGATGTGATGGAAACACCTACACCATCAAGATAATTAGCATCGACACCATAGGCAAC\n+ATTTAAACATTCAGAAGTATTTATATTAGCTAGCCGAAAATCCCAGGCTTTAACTTTATCTATCTCTATG\n+GCAGGAAATGAGTCCACAATGCTACCCTTATATCATTACTTTATAGTTTCCCAGTTTTAATGCTTTATCT\n+TTTCAATAAAATAAAAAA
GATAGTTGCTAAATCCTTTTAGATATCTATGCTTTTTAAGCATATGTTTTGC\n+GCT'..b'TGCATGATTATTTATGATCTCAATTCTGCATTTTGTCAGTAAAATGC\n+>contig-201_940\n+AGCGTTACGTGATCTTTCCCTGCAAATGGAACGCAAAATAAACACCTATTCCATGAGTTATATAATTTTT\n+CACAATGATTAATTTGTTTTCTCAGGAAGAGATTTTATTTCTCTTCACTACGAATTAGTTCATGCTGTAT\n+CTTTATTAAACATTCGTAAGACTCATTTTTGTTCGGGAGATGTGCTGTCATTCGAGCATAAGTTGGTTTC\n+TCATCTTTAAAATATTTTACCATGATTGAATTATCAAGGACTGCCAACAACTGAACTGGATCACTGCTCT\n+TTTTTTGATAGATACCCGCTCTTATATAACTTCTAAACCGATCGCCGAGAAACGCCGTTTTTTCTGCTGT\n+ATTTATCAACTCCTGCAACGTTCCTTTGATGGCATGATTTTCATTAAGGCGTAGTGACCCGACGCGAATT\n+AAGAGTCTCGCCCCGCTTGGTGTGAATTTATTATTTTTACATGTACCCAGTTCTGTTTGCCAATAATACT\n+CACCGATGTCCTCATTCTGATACCATCTCCACATGGCTTTATTATTTAAGACAGGAAACGCGGAAAAAAT\n+AGTACCCTTAGCGAAAATAGTAAAACAATCATGATCTTTAGCTTGTATTTCGCAATCAGCTATAACACCA\n+AAACTAACAAATATCATCAGCAAAAAGAACAAAACTCTTTTCATTTTCTTATTCCTCTCGATGTTCTCTG\n+TTTCATCTTAGCTAAAATTTCACCCAAATCATCTATCCCTGCTGTTGCTGGCCCATCGGGTTTATTAATG\n+TCTGGGAATAAATAGGGTTCTGCACAAGTATATCCTGGTGGTAATTGAGTTGTTGGCCAATTTGTCTGTG\n+GCAGGTAATCACTTGCTGTCTTTGTATCCATCCCTGGATACTGGGAATCATCCTGTGGCGTACAAGTCAG\n+ATTTGGTTTTACCCACTTCCTGCAATACAGTGTGTAGTCGTAAGGGCTTAATGCTCTGAAGAATGTTTTG\n+AAAACATTAGGCGCACTACTGGCCTGGTCAATAGGATATGGCAGTCTTAATTGTTTCGCTATGTCCGGCA\n+ATTTACTTGGATCGGGCGTAGGCGGTTTGTTGGGTCTCGCTCCATATCCGCCATTATTTAAGTGTCCATA\n+TTTTGATGCCAGTCCCATTGAATCTATATACTGAACCGGATTCAGCGGATACTGATAAAAATTCCATCCC\n+CCCTTCAGCCCAATCGGATCCTGAGTGATATACCTCCCCTGCAGCGGGTCATAATAGCGGTGGCGGTTGT\n+AATACAGGCCGGACTCCTCATCATACTGCTG\n+>contig-201_950\n+GGATCTTAGATTCTGTGCTTTTAAGCAGAGATTACAGGCTGGTTACGTTACCAGCTGCCGGGCCTTTAGC\n+GCCGCTTTCGATGGTGAAGGACACTTTCTGACCTTCGTCCAGAGATTTGTAACCATCGTTCTGGATAGCA\n+GAGAAGTGTACGAACACATCTTTAGAGCCATCGTCAGGAGTGATGAAGCCGAAGCCTTTGTCAGCGTTGA\n+ACCATTTTACGATACCAGTCATTTTACCGGACATAGTGTATTACCTTTAATAATTAAGTGTGCCTTTCGG\n+CGATATGGCGTGCTTTACAGATTTTGAAGCGTTAAAGGAATGTGCACTACGAGGGGTATCAACGATAACT\n+CTTGAAGGGACTTGCCTTACTACACTGCTTTAATGGTCTGTACGTCAAACCGTTGATGTGCATTAAGCCA\n+CGCATTGGCGGGTGATGCAACAATTATTTTTCATATTTATGATTAATCGGTTGGAAAACGGTCCT
GTCAT\n+CAGGACCGTAAACAGCAATAAAGTGGATAAAAGTCTATTCCATCAACTGCTTACTTAATGCCGGGTTGGC\n+TTGAATCAAACGCATCAATTTTAGTTCGGCACTTGAAGGCTTCACGCGTCTGGATTCCCATTCCTTTACC\n+ATGGCGACTGATACGCCCAAAACCCGGGCGAAATCATCGATTTTTAATCCTGTCCCTTTTCGTAACTGCT\n+CAATTTCGGTACAGGACGTTGTTCTGTGCGTCAGGGTAATTTTCTGCGTTTCATCTTTAAAAACAATCTG\n+TTCCAGGCTGCTCAACAGCTCATGCATTGGATCTTTATATTCCATTGAAAACTCCTCAAATCACACTGCG\n+GGATCGTGAATTGCATCGAAGCTCATTAAGAATAGTCGGGAAAAGCAGACACAGCGGGGTGAAGTCAGGG\n+CATGCTCTGGCTATGATTCGATTCAGCCTGTCATTTAGCGTGACTTATAGCCACCTAACGATCTGATAAA\n+TGCCGATATATCTCTTACCACTCCTGTTTTGTAAAGATTTCGAAAATCTAACCTTCTGCGAAGGCGTAAA\n+TCTCTGGCTACAAAAAAGGCAACGGCACTATCATTTTTTAACAATGAAACAACAAATTAACCTTGTTTCA\n+TTTTCTCCATGATTTTACCAGGAAGATTACGTAGAAAGGGTATCCTGCAAGCCTGTCCTGGACTATCCTT\n+GTCACGTCAGACACGCGTGTGTCGTTGTGCGCTTTTTTTGGGTGAAAGGAGTAAGAAAATGGCGACAGG\n+>contig-201_955\n+TGGCCCCCTTTCCAGGTGACCGTGTAATCTGAACTACCCTTTGGTATCTTCAGTGCCTGCCTGCAGGCTG\n+AGGTGTTGCCCTTACAAATGCAACAACGACATGGATTACAACACCCTCATAAACAAAGGGCAATCACCTG\n+ATCTAAGCTCTTACCTATGACAGTGATAGGTTATGCCTTTTACTCGACTTTTGCACTGACTGAAAAGGAC\n+AAATTAATGTTAAAAAAGATACTTTTACTGGCTCTGCTTCCTGCAATCGCCTTCGCAGAGGAACTTCCTG\n+CTCCAGTAAAAGCGATTGAAAAACAGGGCATTACAATCATCAAAACATTCGATGCCCCCGGAGGAATGAA\n+AGGTTATCTCGGAAAGTATCAGGATATGGGCGTCACCATCTACCTGACTCCAGATGGTAAGCACGCTATC\n+TCTGGTTACATGTACAACGAGAAAGGTGAAAACCTGAGTAACACACTTATCGAAAAAGAAATTTACGCAC\n+CAGCCGGACGCGAAATGTGGCAACGGATGGAACAATCCCACTGGCTCCTCGACGGTAAAAAAGATGCGCC\n+GGTCATTGTCTACGTCTTCGCCGATCCGTTCTGCCCATATTGTAAACAGTTCTGGCAGCAGGCGCGCCCG\n+TGGGTAGATTCTGGCAAAGTGCAATTAAGAACATTGTTGGTTGGGGTTATCAAGCCAGAAAGCCCGGCGA\n+CAGCAGCGGCAATTCTTGCCTCCAAAGATCCCGCAAAAACCTGGCAACAATATGAAGCCTCTGGTGGCAA\n+GCTTAAGCTAAACGTGCCTGCAAACGTAAGTACAGAGCAAATGAAAGTGTTAAGTGACAATGAGAAACTG\n+ATGGACGATCTGGGGGCAAATGTCACGCCGGCTATCTATTACATGAGTAAGGAAAATACGCTACAACAGG\n+CCGTGGGGTTGCCCGATCAGAAAACGCTTAATATCATTATGGGGAATAAATAAAAGGTAATTCATGGATG\n+GTTGAACTATATCCCTGCTTTTCAACCATCCTAAAAAAGCATGAATTGCTCGCTCTGCCCTAAGTGGCTG\n+TGCTATTTTAGAAAAACTTAATCCTGAGTTAAGCAAAAAAACATAATCAATAAAAATATATACGCAAAAA\n+ACAT
TGATTAAGTGAATATATCATGGAAGAAAAATATAACCGGAGTAGTGTATGGCCAATCTCTACGACT\n+TGAAAAAGTTCGACTTAAATCTTCTTGTCATATTTGAGTGTATTTACCAG\n'
b
diff -r 000000000000 -r 5033d753964b test-data/metabat.tabular
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/metabat.tabular Mon Jun 27 12:41:53 2022 +0000
b
@@ -0,0 +1,3 @@
+Ley3_66761_scaffold_6 metabat.8
+Ley3_66761_scaffold_191 metabat.8
+Ley3_66761_scaffold_505 metabat.25
b
diff -r 000000000000 -r 5033d753964b test-data/proteins.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/proteins.fasta Mon Jun 27 12:41:53 2022 +0000
b
b'@@ -0,0 +1,6277 @@\n+>Ley3_66761_scaffold_6_1 # 1 # 786 # 1 # ID=1_1;partial=10;start_type=Edge;rbs_motif=None;rbs_spacer=None;gc_cont=0.599\n+IIVRIDEFGERVPLTISDYDAEQGSVTIVTQAIGASTRKLCALEQGDALADFVGPLGHPS\n+EFIHEDLDTLRKKRFLFVAGGVGTAPVYPQVKWLHEHGVKADVIIGAKTKSMLIYTEEMA\n+RVADNLYIATDDGSEGFKGMVTALIKDLIDNRGKQYDVCVAIGPMIMMKFVTLTTKEYSL\n+PTVVSLNTLMVDGTGMCGACRVTVGGKTVFTCVDGPEFDGFQVDFDEAMRRQGMYRTQEE\n+RARAIEQERENGHKCRVGLDK*\n+>Ley3_66761_scaffold_6_2 # 890 # 2284 # 1 # ID=1_2;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.604\n+MANKIPRVPVREQDPKVRATNFEEVCYGYNVEEATLEASRCLNCKNPRCVAACPVNIRIP\n+DFIHQVVEGNFAAAAAVISEDSSLPSVCGRVCPQESQCEGSCVLGVKGEPVAIGKLERFV\n+GDWKIENADKMPAPDIKRNGHKVAVIGSGPSGLACASDLARMGYEVKIFEALHKVGGVLV\n+YGIPEFRLPKEKIVAREVEAVKKLGVEIETDVIVGRTVTIDELMNEEGYEAVFIGSGAGL\n+PRFMGIPGENLNGVVSANEFLTRTNLMKAYDTHYDTPIYVGQRVVVVGGGNVAMDAVRTA\n+KRLGAEATIVYRRSEKELPARVEEVHHAKEEGIEFRMLTNPTSIIGDEKGWVVGISCVEM\n+ELGEPDESGRRSPIEKAGSDFEIPCDVVIMALGTSPNPLLKMTTEGLETNRKGCLVADEK\n+GATTREGIFAGGDAVTGAATVILAMGAGRKAAKSIDEYIRQKKH*\n+>Ley3_66761_scaffold_6_3 # 2298 # 2864 # 1 # ID=1_3;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.566\n+MRKFCFAAFAAVLIGTTACTPKAPEQFTGKIVDGTMNTVTVESPADGRRVTFTTEDADMQ\n+EAYGLLLGNTATVTYRGKLGETTPALKVVTDPAYVTAIGRWVEPNPIDPEQEQGIEIRVN\n+GVAASINMLTLRYEAWELAPEGDRIILSGVSEGSGGPYPFEQTAEIIEMDGKPALKIDAV\n+VLTKKDLI*\n+>Ley3_66761_scaffold_6_4 # 3047 # 4078 # -1 # ID=1_4;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.583\n+MPRKNKKLPRHLLVIRTSAMGDVAMLPHALRALKEAYPEVKVTVATKSLFHPFFEGVDVD\n+FLDIETRRTHRGIRGAIRFAREAAELKIDAVADMHNVLRSKMVRAALHLRGIPVSVIHKG\n+RIEKYMRLGRGSEGVKPLKHTVIRYCDVFRRLGFDFPDPRPAEKRPRPNPMGEKQGIWIG\n+FAPFSAQPGKTYPEKLSAEAVRLLSGRFDRVFVHSGGGEEAEFARRMEALYPNVTALYGK\n+IKLGDEMNLISNLDCVVSMDSLVMHLASLMATPTVSVWGATHPGLGFLGYGFGQEGVLQT\n+DFACRPCSVYGKKPCKYGDYRCIWSIEPQMILDRVERLVGKTE*\n+>Ley3_66761_scaffold_6_5 # 4062 # 4667 # -1 # 
ID=1_5;partial=00;start_type=ATG;rbs_motif=AGGA;rbs_spacer=5-10bp;gc_cont=0.528\n+MFTQNANKIFAQAIDDYHRYDDVDHQLSNPYAEGTIDHLLYMKNWVDTVQWHLEDIIRDP\n+RIDPVEALKIKRRIDKSNQVRTDMVEYIDSYLLDKYKNIDVQPGARINTETPAWAIDRLS\n+ILALKIYHMRQEVLRKDVDEAHRAACQQKLDVLLSQQVDLSTAIEELIEDIEAGRKYMKT\n+YKQMKMYNDPALNPVLYAAKK*\n+>Ley3_66761_scaffold_6_6 # 4808 # 5806 # 1 # ID=1_6;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.554\n+MNFYHKAISLAGFVLLTVLPAQAQVRQTREEYINKYKKIAVAHMERYGIPASITMAQGIL\n+ESDCGNSWLSQASNNHFGIKCKRNWTGDVVYYDDDEKGECFRSYPSVEASYQDHAEFLDS\n+QPRYDSLFSYAPNDYKSWARGLKAAGYATAPDYAQRLIRIIEESKLYLLDREDGLTIYGA\n+QTGHLTDDWFSGQSNVDQAAAIASGAVDPDDYRVTVNAHKGYNVYRTNGVNYILAHDGDT\n+FEKISRDFRISARNLRKFNDVSKNAQPVANEVIYIGRKKKRWDGNVLLHTVREGETLWSL\n+GQSYGIRTKSLARLNKLKEGDALTPGTTIKIR*\n+>Ley3_66761_scaffold_6_7 # 5825 # 6511 # 1 # ID=1_7;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.534\n+MESIPLRKKILETIVSKSTLKQKVFDNTFATFNDLKETLLEMASEMDDQLDGLLDRRVRL\n+EYRDRGKFEAQIQVANDLLIFQMHTDVFEFEPNHVIWQNPYVQTDRDNSYCGVINIYNFL\n+SDSFKFNRNADEGYLIGRIFINREKCYFVEGKQQTSMRPMQFGKAEIDSEALVRILESAI\n+YYALNFDLLLPSYDDNKRVTVDQFNTKLDNSKFVTGKRLGYDFDVDDI*\n+>Ley3_66761_scaffold_6_8 # 6536 # 8683 # 1 # 
ID=1_8;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.577\n+MLKKLLLLTLLGTAFAAQAEAAAPSTYRDIARLRAMNQRAQGIRPAADGKSYTTLRGNAI\n+ERHSYTKDAPGELLFEWKNDKENRDIADYQFSPDGKLLLLSIGSEPIYRHSYTTDYYLKD\n+ADGLRPILTDLSDTRDASFSPDGRTIAFSSGNNLYLYDIVGDSVRPITTDGAWNRIINGT\n+TDWVYEEECAFTKAYAFSPDGQKIAYLRFDESLVPVFEMMRYDGKLYNEAYSFKYPKAGD\n+ANSVVDLYVYDLKTGETERVDVGPDRGQYILQPEWTPDGRLCFQRMNRRQNHFEAVLCNP\n+DGTQQVIYDERSPKYVDHLNKTFYFLEDGRRFIVREETSTGYMHLYLYGIGQGVLHPITQ\n+GEWEVTDFVGLRGDKVYYISTESSPLKRDLYRVGLDGKHKERLTPGDGYYSIYPSADLSY\n+YICEGGDSSAPGRTDVFNAAGKRVRTLYDNAPLKEALAEAGLPVREFFTFTTERGDELNG\n+YMLKPLDFDPAKRYPVLLTQYSGPGSQQVAEGWGPDWEDALVTHGYIVVCVDPRGTGYRG\n+EEFKKLTYGNLGRLEVEDQISTARYMARQSYVDPARIGIYGWSYGGFMALGCAFRGEGLF\n+KMAIAVAPVTSWRYYDSIYTENFNGLPDDYPKGYDDNSPVNLAHLFRDDSTRLLIVHGTA\n+DDNVHFQNTMEMARALNKLGKQYDMMVYPDQNHSMMPDDMIHVREKMLRYTLENL*\n+>Ley3_66761_scaffold_6_9 # 8697 # 9167 # 1 # ID=1_9;partial=00;start_type=GTG;rbs_motif=None;rbs_spacer=None;gc_cont=0.577\n+MKNLLLHPTPIGTVGIVENGRAITD'..b'KILLFIVS\n+TAVIVVIVWGLSSTKSSNVIVEPNIASVDSIITEPIDTAKIIADQRKDSIFEGNIFAGLR\n+FGISKGEYQRLINNFKREYDNKIVFPNEKGNVLSYRISGVEPKFYRGKLYAVEVKIDNHH\n+AYYELEPVFERKYGITKNNHWKWQNAEIELSSRAPHSESVHDPTSGTGARYNIKKPGYTT\n+IRYRDLTLYNLERKEQMQNDSIKKAKEQAAREKRRQREREQADRYKENI*\n+>Ley3_66761_scaffold_90_229 # 199454 # 199642 # 1 # ID=4_229;partial=00;start_type=ATG;rbs_motif=TAAA;rbs_spacer=14bp;gc_cont=0.354\n+MSRRNDDGLGCIFGFLAIFYIFKWLTDSAEELTLKELIWIIIVCLGICLVGIVSFAIINA\n+LT*\n+>Ley3_66761_scaffold_90_230 # 199887 # 200270 # 1 # ID=4_230;partial=00;start_type=ATG;rbs_motif=None;rbs_spacer=None;gc_cont=0.357\n+MEQNEKNESTPETKSDNTVLENGTPKKQKSNTVNINIPLIIEIAFYVVGAILLYFAFKWY\n+NNDLELWNNSDPFMFSEKRYVGGDAYNYIISAARSSAIVTKSLIWTILGCSSIIAGRLTS\n+IQRKKCK*\n+>Ley3_66761_scaffold_90_231 # 200261 # 200668 # 1 # 
ID=4_231;partial=00;start_type=ATG;rbs_motif=TAA;rbs_spacer=3bp;gc_cont=0.360\n+MQVKKRTLYIICSIALLLVIGGIVYYKYSEKQAKVKALANSIERALDAYNREVEREYDRM\n+KRQYEDYIETIKDSSYSLSFRERYIHKVYDLIGYQYSYGYDAFDVWNFSYEQQKHEKQDL\n+EMLKLKATEKVQKSL*\n+>Ley3_66761_scaffold_90_232 # 200911 # 201432 # 1 # ID=4_232;partial=00;start_type=ATG;rbs_motif=AAAA;rbs_spacer=12bp;gc_cont=0.362\n+MKFKLPMFSKESLKESSGWIAFVLGLICYLFGNIVIYFQSDIALIWTKCVFWADLLISIG\n+DILLIGGVVGFLTSVAQWKGVFTEELTNVVYGKELLSKRIDVKTIWENTTKQMFKYKFHC\n+IHREILDAMSKYLPNKNEISYYDNFTEDIVVKWADRNKGLVSTTETLVFDHST*\n+>Ley3_66761_scaffold_505_1 # 222 # 2180 # 1 # ID=5_1;partial=00;start_type=ATG;rbs_motif=TAAAAA;rbs_spacer=7bp;gc_cont=0.529\n+MEQDDIFSSDFGDDEQQNANAREEVAYTEDNIVTLDWREHIRRRPGMYIGKLGDGSNFDD\n+GIYVLLKEVLDNSIDEYMMGYGKQITVDVTETTVAVRDYGRGIPLGKLIEVASKMNTGGK\n+YDSKAFKKSVGLNGVGIKAVNALSSDFIIKSVRDGQARQAVFCEGKLVSEEEPFATDEPN\n+GTYVNFTPDSTIFRDYAYREEYIVPLFKNYTFLNTGLSIIYNGKRYHSRNGLLDLLRENI\n+TKEPLYPIIHLKGEDIEIALTHANQYGEEYYSFVNGQHTTQGGTHLAAFKESVSRTLKDY\n+FGRNFEYSDIRNGMIAAIAIKVEEPVFESQTKTKLGSRDMGPDGPTVAKFISDFVKKELD\n+NYLHKNLETAEIILKKVQESERERKAMAGVTKLARERAKKVNLHNRKLLDCRVHLNDVKG\n+DEEKKAASSIFITEGDSAAGSITKIRNVETQAVFSLRGKPLNSYGLTQKVVYENEEFNLL\n+QAALNIEEGIDGLRYNNVIIATDADVDGMHIRLLMLTFFLQFFPDLVKKGHVYVLQTPLF\n+RVRNRDTVRRAKGKGKGEKKDETYYCYTDDERIEAINKLGNKAEITRFKGLGEISPEEFR\n+DFIGPDMRLDRVTLRKEDGVAELLEFYMGKNTSERQTFIIDNLVIEDDEAIS*\n+>Ley3_66761_scaffold_505_2 # 2205 # 2711 # 1 # ID=5_2;partial=00;start_type=ATG;rbs_motif=TAAA;rbs_spacer=9bp;gc_cont=0.556\n+MHTDSNDITEREAAAGRRAMFPGSFNPFTIGHQSLVDRGLELFDTVVIAAGISSKKQVSE\n+AEIIARLEPIRALYAGNPRVEVTYYTGLTVDAARRHGCKFLLRGIRNTIDMEYERSLADI\n+NRRISGIETVLLFTLPELSAVSSSTVRELQHYGHDVSEFMPNTGDSEE*\n+>Ley3_66761_scaffold_505_3 # 2784 # 3689 # 1 # 
ID=5_3;partial=00;start_type=ATG;rbs_motif=TAAA;rbs_spacer=6bp;gc_cont=0.530\n+MEKTDTPEKAAQAGEKTAVLLMHCPDRPGIIAILTEFINANGGNILYLDQYVDRVNSVFY\n+MRVQWDLEGFAIPAEKIRDYFDTLYAQRFEVSYNLYFTGTPQRMAIFVSKMSHCIYDLLA\n+RYRAGEWKEWNVEIPVIVSNHPDLKYVADQFGIPFEVISVTRENKPQAEAQQFALLEHYN\n+IDFVVLARYMQVLSDDFTRRYPNRVINIHHSFLPAFIGSKPYHAAHQRGVKLIGATSHYV\n+TADLDAGPIIEQDIVRITHKDTVDDLVKKGRDLEKIVLARAVEKHLQHKILPYGNKTVVF\n+N*\n+>Ley3_66761_scaffold_505_4 # 3700 # 5298 # 1 # ID=5_4;partial=00;start_type=ATG;rbs_motif=AAAAA;rbs_spacer=6bp;gc_cont=0.528\n+MKLTKYLLLLPAALLCLVDAAAKNEPLKGFDKIGYTSRIIESFYLDSIDNDKLAEEAIVA\n+MLKTLDPHSLYSNPEETKELVTPLEGNFSGIGIQFNMLNDTLIVIQTTSGGPSEKVGILP\n+GDKILSADTTMISGVKRPRNEIMKALRGPKGTRVDVKVARRNVEEPIEFRITRDDIPVNS\n+VDAAYMASPGTGYIRLSRFAETSYDEVLEALKGLEKQGMKRLIFDLEDNGGGILGAAAEI\n+AELFLDKDDLITYTESPKLGTTPYVSRQKGRYADLPVAVTVNQYSASASEILSGALQDHD\n+RAVVVGRRTFGKGLVQRPFPFPDGSMIRLTVARYHTPSGRVIQKPYERGKAEDYAADIKA\n+RYDNGEFYSADSISFPDSLKYTTLHRHRTVYGGGGIMPDKFVPLDTALYTPYYRDLMAKG\n+VFNTFCLGYTNDHRKELQKKYDTQDKFIKNFDVDDKMMGEFVAQGEKDGVPVNDNELARS\n+RTLIAAIIKGIIGRDLFDTSTYFRIVNPLLNPIYREALEIINSPEEYEKYLN*\n+>Ley3_66761_scaffold_505_5 # 5359 # 5703 # -1 # ID=5_5;partial=00;start_type=ATG;rbs_motif=AAA;rbs_spacer=14bp;gc_cont=0.429\n+MITLSGIATDMIANNLTPFEPTHPGELIHDELEASNITQAKLAESIGVSPSLINEIIKGK\n+RGVNTEMALLIEAALGIPADLLLNLQRDYNMQVAKSDASFMTRLSSIRNIAAIL*\n+>Ley3_66761_scaffold_505_6 # 5705 # 6022 # -1 # ID=5_6;partial=00;start_type=ATG;rbs_motif=TATAA;rbs_spacer=4bp;gc_cont=0.358\n+MIVEFGEKYLRDLYDKGECSDKKHRYRIDIIKRYKRSVDYLKWASCKEDLYRINSLNFEA\n+LKGNKSDRFSIRVNNQYRIEFTMRETIEEPILTICNIVELSNHYD*\n'