Repository 'proteinortho_summary'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/proteinortho_summary

Changeset 0:2e0e9c418a85 (2020-02-18)
Next changeset 1:c3f58c2eee1e (2021-09-14)
Commit message:
"planemo upload for repository https://gitlab.com/paulklemm_PHD/proteinortho commit 889335c0a31f156c3f90d4c2048cb4df155a53b2"
added:
proteinortho_macros.xml
proteinortho_summary.xml
test-data/C.fasta
test-data/C.gff
test-data/C2.fasta
test-data/C2.gff
test-data/E.fasta
test-data/E.gff
test-data/L.fasta
test-data/L.gff
test-data/M.fasta
test-data/M.gff
test-data/result.blast-graph
test-data/result.proteinortho-graph
test-data/result.proteinortho.tsv
b
diff -r 000000000000 -r 2e0e9c418a85 proteinortho_macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/proteinortho_macros.xml Tue Feb 18 17:56:58 2020 -0500
b
@@ -0,0 +1,23 @@
+<?xml version="1.0"?>
+<macros> <!-- shared macro definitions; proteinortho_summary.xml imports this file -->
+   <token name="@TOOL_VERSION@">6.0.14</token> <!-- proteinortho package version; reused by the requirement below -->
+   <token name="@WRAPPER_VERSION@">2.9.1</token> <!-- appended after "+galaxy" in the tool's version attribute -->
+   <xml name="citations"> <!-- expanded via <expand macro="citations"/> -->
+        <citations>
+            <citation type="doi">10.1186/1471-2105-12-124</citation>
+            <citation type="doi">10.1371/journal.pone.0105015</citation>
+        </citations>
+    </xml>
+    <xml name="requirements"> <!-- expanded via <expand macro="requirements"/> -->
+        <requirements>
+            <requirement type="package" version="@TOOL_VERSION@">proteinortho</requirement>
+            <requirement type="package">diamond</requirement> <!-- NOTE(review): no version pinned for this or the three packages below -->
+            <requirement type="package">blast</requirement>
+            <requirement type="package">blat</requirement>
+            <requirement type="package">last</requirement>
+        </requirements>
+    </xml>
+    <xml name="version_command"> <!-- expanded via <expand macro="version_command"/> -->
+        <version_command>proteinortho -v</version_command>
+    </xml>
+</macros>
b
diff -r 000000000000 -r 2e0e9c418a85 proteinortho_summary.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/proteinortho_summary.xml Tue Feb 18 17:56:58 2020 -0500
[
@@ -0,0 +1,98 @@
+<tool id="proteinortho_summary" name="Proteinortho summary" version="@TOOL_VERSION@+galaxy@WRAPPER_VERSION@">
+    <description>summarizes the orthology-pairs/RBH files</description>
+    <macros>
+        <import>proteinortho_macros.xml</import>
+    </macros>
+    <expand macro="requirements"/>
+    <expand macro="version_command"/>
+    <command detect_errors="exit_code"><![CDATA[
+        proteinortho_summary.pl
+            '$queryfile'  ## quoted, like queryfile2, so the dataset path is passed as a single shell word
+            #if $queryfile2:
+                '$queryfile2'
+            #end if
+            2>&1 | awk '/^$/ && !f{f=1;next}1' | awk -v RS= '{print > ("output" NR ".tsv")}'
+        &&  ## first awk drops the first empty line; second awk writes each blank-line-separated record to output<N>.tsv
+        mv output1.tsv adjacencyMat.tsv &&
+        mv output2.tsv average1paths.tsv &&
+        mv output3.tsv adjacencyMatSquared.tsv &&
+        mv output4.tsv average2paths.tsv
+    ]]></command>
+    <inputs> <!-- datasets passed as positional arguments to proteinortho_summary.pl -->
+        <param name="queryfile" type="data" format="tabular" label="A orthology-pairs / RBH file"/> <!-- always placed on the command line -->
+        <param name="queryfile2" type="data" format="tabular" optional="true" label="(optional) A second orthology-pairs / RBH file" help="If you provide a second file, then difference is calculated (GRAPH - second GRAPH)"/> <!-- added to the command line only when a dataset is supplied -->
+    </inputs>
+    <outputs> <!-- each dataset is picked up from the working-directory file created by the mv steps in the command -->
+        <data name="adjacencyMat" format="tabular" label="${tool.name} on ${on_string}: Adjacency Matrix" from_work_dir="adjacencyMat.tsv"/> <!-- renamed from output1.tsv -->
+        <data name="average1paths" format="tabular" label="${tool.name} on ${on_string}: Average number of Edges" from_work_dir="average1paths.tsv"/> <!-- renamed from output2.tsv -->
+        <data name="adjacencyMatSquared" format="tabular" label="${tool.name} on ${on_string}: Matrix of 2-paths" from_work_dir="adjacencyMatSquared.tsv"/> <!-- renamed from output3.tsv -->
+        <data name="average2paths" format="tabular" label="${tool.name} on ${on_string}: Average number of 2-paths" from_work_dir="average2paths.tsv"/> <!-- renamed from output4.tsv -->
+    </outputs>
+    <tests>
+        <test expect_num_outputs="4"> <!-- single-input run: spot-checks text in all four outputs -->
+            <param name="queryfile" value="result.proteinortho-graph"/>
+            <output name="adjacencyMat">
+                <assert_contents>
+                    <has_text text="18"/>
+                    <has_text text="14"/>
+                </assert_contents>
+            </output>
+            <output name="average1paths">
+                <assert_contents>
+                    <has_text text="9.6"/>
+                    <has_text text="15"/>
+                </assert_contents>
+            </output>
+            <output name="adjacencyMatSquared">
+                <assert_contents>
+                    <has_text text="750"/>
+                    <has_text text="74"/>
+                </assert_contents>
+            </output>
+            <output name="average2paths">
+                <assert_contents>
+                    <has_text text="1088.8"/>
+                    <has_text text="1374.2"/>
+                </assert_contents>
+            </output>
+        </test>
+        <test expect_num_outputs="4"> <!-- two-input (difference) run: only average2paths content is asserted -->
+            <param name="queryfile" value="result.proteinortho-graph"/>
+            <param name="queryfile2" value="result.blast-graph"/>
+            <output name="average2paths">
+                <assert_contents>
+                    <has_text text="49.6"/>
+                    <has_text text="59.8"/>
+                </assert_contents>
+            </output>
+        </test>
+    </tests>
+    <help><![CDATA[proteinortho summary
+
+**What it does**
+
+proteinortho_summary : Summarizes the (orthology-pairs/RBH) file(s) to determine how well the species are connected to each other.
+
+ * **Adjacency Matrix** : How well are the species connected to each other directly.
+
+ * **Average number of Edges** : Averaged number of connections for each species.
+
+ * **Matrix of 2-paths** : The square of the adjacency matrix = The number of paths of length 2 between two species.
+
+ * **Average number of 2-paths** : The average number of 2-paths for each species. If a species is not well connected to all the other species, it will result in a low average.
+
+
+If you supply a second orthology-pairs/RBH file, then the difference is calculated for all 4 outputs.
+
+E.g. given the RBH and the orthology-pairs of the same run : The outputs show how much the clustering removed from the initial reciprocal best hit graph.
+Or given 2 orthology-pairs files from the same set of fasta files with different parameters (evalue,...) : The outputs show how the parameters change the connectivity of the output.
+
+**Other Proteinortho-Tools for downstream analysis**
+
+* `proteinortho grab proteins` : find proteins/genes in a given fasta file and retrieve their sequence(s). You can also use an orthology-groups file.
+
+More information can be found on GitLab: https://gitlab.com/paulklemm_PHD/proteinortho
+]]>
+    </help>
+    <expand macro="citations"/>
+</tool>
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/C.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/C.fasta Tue Feb 18 17:56:58 2020 -0500
b
b'@@ -0,0 +1,1006 @@\n+>C_10 asd asd\n+VVLCRYEIGGLAQVLDTQFDMYTNCHKMCSADSQVTYKEAANLTARVTTDRQKEPLTGGY\n+HGAKLGFLGCSLLRSRDYGYPEQNFHAKTDLFALPMGDHYCGDEGSGNAYLCDFDNQYGR\n+SVRSPLKKLLGFGYNPTYGKSALGDELRLGLVFREEFRKINKALLTGGANVVKAGVSYKD\n+SKKQGHKLLCDEMDNAVSLLKVLHPKLGCCVGDDNHSYGALSDFFVTCRRLIGKGHIEKE\n+RKSANECLAKSFQPFCSDLNLTGGGVRQHPGILHLKYAIKLLQATPMYMLLCLHAGKTKL\n+CDNAADSSEFCQLQDRDIVAEYVAVWKSKKPQSAPHVLKGPHNKKALVVSSCFAADFRIV\n+AFVVLDSSNDYSDAKASLDDAKLCIESCVFIYAPSLKADGTKGGKYCGKGSIPENCQLRE\n+HVVACDRAGSDCSGEPSSWSCACKFAIGANMRSLARNSDAATQTIHGTAIRDYTPAVGRS\n+SGTFVGPECPLSKFVSSYLFVAKDNGGKLFVWVPGGNYHSLWRSFTMNLCNIGLAELPLS\n+AYRNIKKKGYDGGKAGTLVTLMEFVAQGRVANALFDWGSCNEEGAGLSKQCSETVVGFLQ\n+QSSDYHRLFPKGYGEVPPRCTLGPFPAFHMLMQAALKGSFRTAQQPSVLFSCKCVKLKYS\n+SCKYAL\n+>C_11\n+PQKDTVVRHTRSDIFTLPEAVHYPDGTCQTMLGTVKATRYTASGAGAKSAGYKEGHLGIR\n+KKPHSPCSLAAKASPAGRKGAAAACPLLIGFLPLMFVRFTKTGAYVGDSLWSLKEGIQYY\n+VRHSVRALARSENASKRFVEVIGTKMAPVGRALKSFFTCAHKKPGFLGKADYVIPNHHHG\n+LQPPHYQGYTKKNAQNKTGKGDDLILAHTAVVAPLTKNKHFTHSVKGMEHSGCLGDCSGK\n+HQIASGTKSPVWGCNYLVPGHGDFLLFVRDPRRDIGKLNSNYGLKKEAPVHCGEQREAF\n+>C_12\n+AWEAFVKVNNCDDKSSKGNHNVKDKSLHTHAEFAGTETGCEFSSLLVVSKVHNGIVKDRP\n+RKKLISEKIYKDLGYVGKGACKGPDWWTWHLIPDLKGKVFFHLEPVTCGAAAVGKPQIGS\n+SVHVQLLLKGDGIKVSNYFKICKYQYALATLKKKVEECWADDGGGQHKAEAPLCQVTFDH\n+VASCYAAKLICGEGCERASKTDKGELGEKLLHVPRGLRFQAAGTVLAKKRQNVPDMAAGC\n+DNLSSNRVVHARETPMSDKRQHAHGESKHFGSGGKIHSSKLTEETGLSLFSPGELTCAKE\n+RGGIHTALPGNAGYDGGECALKTQTAAFYLQPYQGVLREKSVEKCGVFGRCFIRPAGFMF\n+GTLPPCYWGDRGCNLGDFLLIVGGQERVPFKSDDNNQVEPMGVSLVGEATCRLYLYQTNG\n+PKLKSRNAKKWANTGESQPDPGVNGLLKVHMEFDESFKTTNGMTFQFGFARCPKKPYLCK\n+PVGIYADSMGFIVNTFLAEEEGKSPIAEELIADGISGHIDGAKTQTANFNFEATLLRVKS\n+GGFYASFLPGSPNEPVYVQGRVALTKSKAKTHLPSAVNGKKLGLPSIGVFVKAFCCGLVK\n+VMCGITSKIYCGCSVALMGNDQCGYEGEPAGMQSYLTIGLYATVSDSNTKRRGPPGAPGG\n+TGKSAFTASSTGDCKGFKGSLFKAKPPLPMVGMIGAFLSKVKSIGAPGMGLVKLTRLTKY\n+QTPAIKCQDKKSNFVCYGVVKKHAIQCQAL\n+>C_21\n+FWDAFIKMDSCEARTSKGYHNVKDTSLLGRAEHAGEDTGCEFSSLLVLNKPHNGITSAKH\n+RKKTIGELIAKSIGFVGQGACCKGQDWWKHWHAVPDAKGKVFFHMQPSTCASAPAGKPQR\n+IGRSIH
VQILDKGDGIKVKTFSKTGAYVYGLLTLKKKVQDCWAADGKASSNKVNPPIPQV\n+TFDHIPSRYNTKHICGKGCEHNAKTDKGELGESLLHPRGLKFQFFGTVLQRKRQELPNMV\n+AGCDDLESNRVVVSRGVPTSHSRPEAHGESKFFGQLAGILSSKMTENTGFSLFPEGDTCG\n+KEVGSIHTHLPGAYQSEAKEKLGKAYDGGECALRLAAFYLHPYDGLLSERTFEKCSIFGR\n+CYIKPTGFSFVGLLPPCFWGDRGCHLGKFLLIINAKGRLALKWGDKNQVEPLGVDLMGEP\n+TCRLRLYQTNAFKLRSKSFLTWGKTGASQKSLRQGVHTKIHMEYEDSFKTPNGKTFQFGF\n+SRPQKPYEGVSIKYADSMGFIVHAFFADDEGQKSFTEELTAEYIQGSDTQTAHFDIKVTL\n+LITKSGGFYASFRQGSLAETVSVDFRASKAKSTSHLPAEPICPLFHKEGEALNAKELNLP\n+AMGVFVSGFCCGLVGVRCGITHKIYCGAGLVLRDHDQCGYDSGPANMQFYLTIGYTTVWD\n+GNTVRRGPNGLPLATGKGAFMCSGASTGECTGFEGCLFRQKGPPMVAQNGKYLTYFTAVF\n+TAFLERVKSIGASGMGLVELTRLSKYQTPAVCRAMSKFICLGVVKKNALETAAL\n+>C_13\n+DAVKREGSLCKVVGGCALNLTSDLAAGVVDVSEFDEAANAYAPALATTTDIYSGKLFSSA\n+VYATLGPKDILLDATVFSVCVVCCDICLVVEAELGVCPKICYSLKFKSYHCENLICKKNE\n+ARFTFKKADKDWILAVTTALVLIKKKCQKKPIVCTLFQEMYYAERGRYLMPFNDEPSNCP\n+ALLGVCEM\n+>C_14\n+PSGDLQDNSSLHFCHPHYLLTILGRQYIQNFGEDFVFCSERALFYDGDLMSKNQISVMFG\n+VSNAAVTSRQALHVTDCSDPQGPFGKGLKDPSGRFENQPKSAFLSKLAPYVEPRALQPKP\n+DNWVIAWAGRLNLAIPYQCKWIVQRGGGCCVGLVNTSARVFEQVADVHAHDHLRYIPWKC\n+SKGKWTGLTCKAGKSGKVFFKGKGTPVTRADTARPFSKADELCHGHAGTLTQAGAGDYFK\n+GTLKGLLGAHRRGLKAAKMRFLLQSSNFMKVLEAFAVGHNLRLLAKRNHWKGGRAASYAA\n+NIVKRTMENDAHLPFLVQCTQGHKLIFTGSCTIHEYNGQSKAKTFLPFGERSQQGADNYH\n+RADATSGKYLPADYANTTCKDANLKITISRQNACRNMHGWILSATGIEGVVAQEVKIKPI\n+KKKTDDVHEIKVGVEIDSIGVGLKGAQLWDNDKVCAVEYLADVSGNYLKSHYSLGSLSLM\n+GVSPIKVDKLSGRTLPKKHTVKSCLCRLKSLVKRGAQGCTPLQVCCCTNDKEFIPARGTE\n+CHVTDTSYEIKHLHQTESLKRLPITFAQGNLRNDLEVLNHLLTIPTGYRTCQVQHYLHLK\n+GSKPGQNPPTCALKQVHYVAKTRASDPEIPPHLLVSKNVQYALKGDLVTKEGRGPDVVIL\n+QSLLQLPVFVSSTNALEFLKAGPNPGEQKSQHVGDPCDIRCKSELMKMGDYGVDTPMNFD\n+LHGAEQDLDLGDADAKELKKAGEFAVPGPKAAIFNDKQLCHCNECGVGSTTDRRNSSMKF\n+ELVAGQKLTSVVGAIYHGTLTMNICNSLISDYFTSTAIQAIKYLY\n+>C_15\n+AKTSNYDQSFKTTMLHLHIKVRIPFYITTELGCKTCFLDISSSLMVYSTKAPTKLDAGLK\n+NGNDAEKLDDLQKEARVGSYLPARPKEKETPLRLKLKMRLSLAEQPIFEAHYYELNMPDV\n+GLICQVKHKGGLGGRKEHSSFVKTTCFIVGFYCELNYFFFGKVGAVFVIKKAASKPVFRT\n+VYGKTPLGTINATSENLRETQSEHTVYTVIGLIPTWHDL
GDMVLALSLAGIENVPQEDDQ\n+GCNKREWKKSLAQSYKDADIHEGDQRCYKHRLNRGTAYKGDPAHGSTLIE'..b'QNIPETALGSCLDKW\n+NGLKAKLDYACSSSPQKRGGPKSSQKGMTDAGPAEIAAPQSHHGPAEKVCRLQVSGPCLT\n+KLMLVSALCHGDGKDMPKIYVSAKNCGYNYVIPASLASAFMGSVTLLFKAIVRFRRTSTR\n+STVLAAEILKSKILCCAVTGALVSFPPVQTASTAEYLMSSDIQTTVPWSPRCSRVAITKS\n+IIFLNSSEEQQARSCPIAKAHSQIKSVFVGQHEAYHVLKCSREPKVPGGVEHPLKSVAPM\n+ASMACCGHMGDVQWAQHSFHSPIVGLSLPESVDGFFRKLIFCTDGQFIGVKRSAYHRSLR\n+AGMVDTLGCAAFAQEKLETVKLKFSEGVHCATRFPINTRNTASAYGQWCGGWYNKAHVKE\n+DKSPPLGGSVVVLGAGIFPTKPSTSLDKVLAQENLTEVEGAVDPVLTVWLGVGGGPAMQH\n+>C_248\n+LAFSWIGEYNMQIGLPRGTSKRSFYRDARKGVLKVTESLFLESQNLPDVSLGNCLDKWTG\n+ICAKLDYACSSPPQKRGGPKKSQKGVTDAGPAERCAPQSHNGGADKVCPLKVSGPCLTKH\n+LLVSVLCHGDGKDMPMIYVNAKDCGLNCRIPASLGTAFMGSLALLFKAIVRLRRTSDRSS\n+VLAAEILKSKVLCCEQPVTGGLVSFPPVQTASTAEYLMTSDIQSTRPWTPRCSRVNITKN\n+IIFLNSSEEQQAVERRCPIALPHSGIKSVFVGQHEGYHVVQCSREPKVPGDVEHPLQSVA\n+TMASMSCCGHMVDVNWIQHGFHAPIVGLALPESVEGIFRKLIFCTDGQFIGVKRTAYRRS\n+LRAGMVDALGCAAFAQEKLKTVKLKFAEGVHCSTAFPIDTRTTASGYGQFCGGWYNKAHV\n+KEDKSPLLGGSVTVLGAGTFPTKPSASLDKVFAQENLMEVEGSVDPVLTLWLGVGGGAAM\n+QH\n+>C_249\n+LAFSWIGECNLQINLRGASSQSWYRDARKGLPVLKVTTSLFLESQNIPDTSLGNCLDKWT\n+GLRAKLDYSCSSSPPKRGGPKSSQKGVTDAGPAEICAPQSHHGPANKVCRLEVSGQCLTK\n+LLLVSVLCHGDGKDMPKIYHSAKNCGYNCLTPASLATAFMGPLTLLFKAIVRVRRSGVLA\n+AEILKSKILCCAHPVTGAVVSFPPVQTASTAEYLMTSDIQTTRPRTPRCSRVNITKSFIF\n+LNSNEEQQARSCAIAKSHSQIKSVFVEQHPGYHVVHCSRAPKVPGGVNHPLKSCVPMVAM\n+ACCGHMGDVNWAQHGFHAPIIGLALPESVGGFFRKLIFCTDGQFIGVKRSAYRRSLRAGM\n+VDTLGCAAFVQEKLKTVNLKFAQGVHCSSAFPIDTRTTAGAYGQFCGGWYNKNHVKEDKS\n+GELGGSVVVLGAGIFPGKPSASLDKLFAQENLMEGEGSQDPVLTVWLGAGGGTAMQH\n+>C_250\n+LAYSWIGEYSMQINLPRGPSTQSFYRDDRKGLPVLKITVSLFLDSQNIPDTSLGNCLDKW\n+TGLRAKLDYACSSSPQKRGGPKVSQKGVTDAGPSEICAPQSHHGPADKACRLQVSGPCLT\n+KLLLVSVKCHGDGKDMPKINVAAKNCGYTCLIPGSLATAFFGTLTLQFKAIVQLRRYSTR\n+SSVLAAESLELKSKMLCCVQPITGALVSFPPVQTASTADYLMTSDIQTTRPWTPRCSRVN\n+ITKGFTFLNSSEEQQARSCPINKSHSQAKKVFVGQHEGYHVVQCSREPKVPGGVEHPLKS\n+VAPMASMACCGHMGDVNWAQNGFHAPIVSLALPESVDSFFRKLIFCTDGQFIGVKRSAYR\n+RSLRAVDTLACAAFTQAKLKTVKLKFAEGAHCSTGLCLVAFPIDTRT
TASAYGQFCGGWY\n+NKAQVKEEKSPLLGGSVVVFGAGMYPTRPSASLDKVFSQENLMEVEGVDPVLTVWLGVGG\n+ATAMQH\n+>C_251\n+LFSWIGGYNMQINLPIGPSTQSFYHDARKGLPVLKVTVSLFLESQNDPDTSLGNCLDKWI\n+GLRVKLDYACSSSSQKRGGPKSSQKGVTDDGPAEICAPQSHHGPVDKVCRLQVSGPCLTK\n+LLLVEVLCHGDGKDMPKIYVSGKNCGYNCLIPASLATAFMGSLTLLFKAIVRLRRTSTRS\n+SVLAAHPEILKSKVLCCVQPVTGALVSFPPVQTASTAEYLMKMTSGIQVTRPWTPRCSRV\n+NITKSFIFLNSSEEQQARSCPIAKSHSQIKSVFVGQHEGYHIVQCNREPKVPGGVEHPLK\n+SVAPMPSMACCGHMGNVNWAQHGFHGPIVGLALPESTDGFRKLIFCTDGQFIGVKRSAYR\n+RSLRAGLVDTLGCAAFAQEKLKTVKLKIAEGVHCSTAFAIDTRTANAYGQFCGGWFNKAH\n+VKENSSPLLGGGVVVLGSGILPTKPSASLDKVFAQENLMEVEGSVDPVLTVWLGVGGGTA\n+MQH\n+>C_252\n+LAFSWIGEYNMQVNLPRGPSTQSFYRDARKGLPVLKVTVSLFLESQNIPDTSIGNCLDKW\n+TALRAKLDYACSSSPQKRGGLKSSQKVVTDAGPAEICAPQSHHGPADKVCRLQVSGPCLT\n+KLVLVCVLCHGDGKNMPKIYVSAKNCGYNCLIPASLATAFMGSLTLLFKRIIRLRRTSTR\n+GSILACEILKSKVLCCTQPVTGALVSFPPVQTASTAEYLMTSDIQTTRPWTPRCSRVNVT\n+KSFIFLNTSEEQEVRSCPIAKDSHSQIKSVFVGQHEGYHVVECSRDPKVPGGVEHPLKSV\n+TPMASMACCGHLGDVNWAQHGFFAEIIGLALPEAVDGFFRKLIFCTDGQFIGVKRSAYRR\n+SLRAGLVDTLGCAEFAQEKLKTVKLKFEEGVHCNTAFPIETRTTASVYVQFCGGWYNTAH\n+VKEDKSPLLGGGVVVLGAGIFPTKPSASLDKVFMQENLMEVEGSVDPVLTVRLGVPGGTA\n+MQN\n+>C_253\n+LAIGEYNMHINLPKGPATQSFYRNARKALPVLKVTVSLFLASQNIPDTSLGNCLNKWTGL\n+RAKLDYACSSSPQKRSGPKSGQKGVTDAGPAEICAPQSHHGPADKVCRLQVSGPCLTKLL\n+LVSVLCHGDGKDMPKICVSAKNCGYKCLIPASLATAFMGTLTLLFKAIVRLRRTSTRSSV\n+LAAEILKSKVLCCTQPVTGALVSFPPVQTASTAEYLMTSDIQTTRPWTPRCSRLNITKSF\n+IYLNSAEEEQGRSCPIAKSHSQIKNVFVGQHEGNVTQCSREPKVPGTVEHPMKSVAPMAS\n+MACCGHMGDVDWAQHGFHPPIVGLALPESADGFFRKLIFCTEGQFIGVKRSAYRRSLRAG\n+MVDTLGCGAFAQEKLKLVKLKFAEGVHCSTAFPLDTRSTASAYGQFCGGWYNKAHVKEEK\n+SPLLGGSVVVMGEAGIFPTKPSASLDKVFAQENLMEVEGSVDPVLTVWLGVGGGTAMQQ\n+>C_254\n+LAFSWIGEYDMQINLPRGASTQSFYRDDKKGLPVLKVTVSLFLESQNIPDTSLTNCLNKW\n+TGLRAKLDYACSASPQKRGGPKSSQKGVTDAGPAEICAPGSHHGPADKICRLQVSGPCLT\n+KLLLVSVLCHGDGKDMPKIYVSAKNCGYNCLIPAGLATNFMGSLTLFFNAIVRLRRASTR\n+SSVLAAEILKSKVLCCTQPVTGARVSFPPVQTASTADYLMTSDIQTTRPWTPRCRRVNIT\n+KSIIFLNSNEEQQARSCPIAKSHSQIKSVFVGEHEGYHVVQCSRESKVPGGVEHPLKSVA\n+PKATMDCCGHMGDVNWAQHGFHAPIQGLALPESVDGFF
RKLIFCTNGQFIGVKRSAYRRS\n+LRAGMVDTLGCAAFAQEKTKSAKLKFAEGVHCSTSFPLDTRTTASAYGQFCGSWYTKAHV\n+KEDKSPLLGGSVVVLGAGIFPTKPSASLDKVFAQENLMEVEGSVDVLTAWLGVGGGSAMQ\n+H\n'
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/C.gff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/C.gff Tue Feb 18 17:56:58 2020 -0500
b
b'@@ -0,0 +1,308 @@\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t1\t1\t.\t+\t.\tID=C_1;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t2\t2\t.\t+\t.\tID=C_2;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t3\t3\t.\t+\t.\tID=C_162;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t4\t4\t.\t+\t.\tID=C_163;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t5\t5\t.\t+\t.\tID=C_164;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t6\t6\t.\t+\t.\tID=C_165;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t7\t7\t.\t-\t.\tID=C_180;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t8\t8\t.\t-\t.\tID=C_179;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t9\t9\t.\t-\t.\tID=C_178;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t10\t10\t.\t-\t.\tID=C_177;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t11\t11\t.\t-\t.\tID=C_176;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t12\t12\t.\t+\t.\tID=C_254;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t13\t13\t.\t+\t.\tID=C_255;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t14\t14\t.\t+\t.\tID=C_256;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t15\t15\t.\t+\t.\tID=C_257;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t16\t16\t.\t+\t.\tID=C_258;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t17\t17\t.\t+\t.\tID=C_259;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t18\t18\t.\t+\t.\tID=C_260;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t19\t19\t.\t+\t.\tID=C_261;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t20\t20\t.\t+\t.\tID=C_262;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t21\t21\t.\t+\t.\tID=C_263;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t22\t22\t.\t+\t.\tID=C_264;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t23\t23\t.\t+\t.\tID=C_265;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t24\t24\t.\t+\t.\tID=C_266;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t25\t25\t.\t+\t.\tID=C_267;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t26\t26\t.\t+\t.\tID=C_268;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t27\t27\t.\t+\t.\tID=C_269;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t28\t28\t.\t+\t.\tID=C_270;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t29\t29\t.\t+\t.\tID=C_271;\n
+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t30\t30\t.\t+\t.\tID=C_272;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t31\t31\t.\t+\t.\tID=C_273;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t32\t32\t.\t+\t.\tID=C_274;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t33\t33\t.\t+\t.\tID=C_275;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t34\t34\t.\t+\t.\tID=C_276;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t35\t35\t.\t+\t.\tID=C_277;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t36\t36\t.\t+\t.\tID=C_278;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t37\t37\t.\t+\t.\tID=C_279;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t38\t38\t.\t+\t.\tID=C_280;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t39\t39\t.\t+\t.\tID=C_281;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t40\t40\t.\t+\t.\tID=C_282;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t41\t41\t.\t+\t.\tID=C_283;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t42\t42\t.\t+\t.\tID=C_284;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t43\t43\t.\t-\t.\tID=C_252;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t44\t44\t.\t-\t.\tID=C_251;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t45\t45\t.\t-\t.\tID=C_250;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t46\t46\t.\t-\t.\tID=C_249;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t47\t47\t.\t-\t.\tID=C_248;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t48\t48\t.\t-\t.\tID=C_247;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t49\t49\t.\t-\t.\tID=C_246;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t50\t50\t.\t-\t.\tID=C_245;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t51\t51\t.\t-\t.\tID=C_244;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t52\t52\t.\t-\t.\tID=C_243;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t53\t53\t.\t-\t.\tID=C_242;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t54\t54\t.\t-\t.\tID=C_241;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t55\t55\t.\t-\t.\tID=C_240;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t56\t56\t.\t-\t.\tID=C_239;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t57\t57\t.\t-\t.\tID=C_238;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t58\t58\t.\t-\t.\tID=C_237;\
n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t59\t59\t.\t-\t.\tID=C_236;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t60\t60\t.\t-\t.\tID=C_235;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t61\t61\t.\t-\t.\tID=C_234;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t62\t62\t.\t-\t.\tID=C_233;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t63\t63\t.\t-\t.\tID=C_232;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t64\t64\t.\t-\t.\tID=C_122;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t65\t65\t.\t-\t.\tID=C_121;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t66\t66\t.\t-\t.\tID=C_120;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t67\t67'..b'91;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t244\t244\t.\t-\t.\tID=C_8;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t245\t245\t.\t-\t.\tID=C_161;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t246\t246\t.\t-\t.\tID=C_7;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t247\t247\t.\t-\t.\tID=C_60;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t248\t248\t.\t-\t.\tID=C_59;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t249\t249\t.\t-\t.\tID=C_58;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t250\t250\t.\t-\t.\tID=C_57;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t251\t251\t.\t-\t.\tID=C_56;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t252\t252\t.\t-\t.\tID=C_72;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t253\t253\t.\t-\t.\tID=C_71;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t254\t254\t.\t-\t.\tID=C_70;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t255\t255\t.\t-\t.\tID=C_69;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t256\t256\t.\t-\t.\tID=C_160;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t257\t257\t.\t-\t.\tID=C_159;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t258\t258\t.\t-\t.\tID=C_158;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t259\t259\t.\t-\t.\tID=C_157;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t260\t260\t.\t-\t.\tID=C_156;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t261\t261\t.\t-\t.\tID=C_155;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t262\t262\t.\t-\t.\tID=C_154;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t263\t263\t.\t
-\t.\tID=C_153;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t264\t264\t.\t-\t.\tID=C_152;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t265\t265\t.\t-\t.\tID=C_151;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t266\t266\t.\t-\t.\tID=C_150;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t267\t267\t.\t-\t.\tID=C_149;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t268\t268\t.\t-\t.\tID=C_148;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t269\t269\t.\t-\t.\tID=C_147;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t270\t270\t.\t-\t.\tID=C_146;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t271\t271\t.\t-\t.\tID=C_145;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t272\t272\t.\t-\t.\tID=C_144;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t273\t273\t.\t-\t.\tID=C_143;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t274\t274\t.\t-\t.\tID=C_142;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t275\t275\t.\t-\t.\tID=C_141;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t276\t276\t.\t-\t.\tID=C_140;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t277\t277\t.\t-\t.\tID=C_139;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t278\t278\t.\t-\t.\tID=C_138;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t279\t279\t.\t-\t.\tID=C_137;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t280\t280\t.\t-\t.\tID=C_136;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t281\t281\t.\t-\t.\tID=C_135;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t282\t282\t.\t-\t.\tID=C_134;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t283\t283\t.\t-\t.\tID=C_133;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t284\t284\t.\t-\t.\tID=C_132;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t285\t285\t.\t-\t.\tID=C_131;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t286\t286\t.\t-\t.\tID=C_68;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t287\t287\t.\t-\t.\tID=C_67;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t288\t288\t.\t-\t.\tID=C_66;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t289\t289\t.\t-\t.\tID=C_65;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t290\t290\t.\t-\t.\tID=C_55;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t291\t291\t.\t-\t.\tID=C_54;\n+
gi|12345678|ref|NC_012345.1|\tsim\tCDS\t292\t292\t.\t-\t.\tID=C_53;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t293\t293\t.\t-\t.\tID=C_130;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t294\t294\t.\t-\t.\tID=C_52;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t295\t295\t.\t-\t.\tID=C_51;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t296\t296\t.\t+\t.\tID=C_11;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t297\t297\t.\t+\t.\tID=C_12;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t298\t298\t.\t+\t.\tID=C_21;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t299\t299\t.\t+\t.\tID=C_13;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t300\t300\t.\t+\t.\tID=C_14;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t301\t301\t.\t+\t.\tID=C_15;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t302\t302\t.\t+\t.\tID=C_16;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t303\t303\t.\t+\t.\tID=C_17;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t304\t304\t.\t+\t.\tID=C_64;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t305\t305\t.\t+\t.\tID=C_19;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t306\t306\t.\t+\t.\tID=C_22;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t307\t307\t.\t+\t.\tID=C_63;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t308\t308\t.\t+\t.\tID=C_20;\n'
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/C2.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/C2.fasta Tue Feb 18 17:56:58 2020 -0500
b
@@ -0,0 +1,15 @@
+>C_10
+VVLCRYEIGGLAQVLDTQFDMYTNCHKMCSADSQVTYKEAANLTARVTTDRQKEPLTGGY
+HGAKLGFLGCSLLRSRDYGYPEQNFHAKTDLFALPMGDHYCGDEGSGNAYLCDFDNQYGR
+SVRSPLKKLLGFGYNPTYGKSALGDELRLGLVFREEFRKINKALLTGGANVVKAGVSYKD
+SKKQGHKLLCDEMDNAVSLLKVLHPKLGCCVGDDNHSYGALSDFFVTCRRLIGKGHIEKE
+RKSANECLAKSFQPFCSDLNLTGGGVRQHPGILHLKYAIKLLQATPMYMLLCLHAGKTKL
+CDNAADSSEFCQLQDRDIVAEYVAVWKSKKPQSAPHVLKGPHNKKALVVSSCFAADFRIV
+AFVVLDSSNDYSDAKASLDDAKLCIESCVFIYAPSLKADGTKGGKYCGKGSIPENCQLRE
+HVVACDRAGSDCSGEPSSWSCACKFAIGANMRSLARNSDAATQTIHGTAIRDYTPAVGRS
+SGTFVGPECPLSKFVSSYLFVAKDNGGKLFVWVPGGNYHSLWRSFTMNLCNIGLAELPLS
+AYRNIKKKGYDGGKAGTLVTLMEFVAQGRVANALFDWGSCNEEGAGLSKQCSETVVGFLQ
+QSSDYHRLFPKGYGEVPPRCTLGPFPAFHMLMQAALKGSFRTAQQPSVLFSCKCVKLKYS
+SCKYAL
+>C_11
+AAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAAA
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/C2.gff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/C2.gff Tue Feb 18 17:56:58 2020 -0500
b
@@ -0,0 +1,2 @@
+gi|12345678|ref|NC_012345.1| sim CDS 210 210 . + . ID=C_10;
+gi|12345678|ref|NC_012345.1| sim CDS 296 296 . + . ID=C_11;
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/E.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/E.fasta Tue Feb 18 17:56:58 2020 -0500
b
b'@@ -0,0 +1,1012 @@\n+>E_10\n+CVLDNYQIALLRNVLPKLFMTKNFIEGMCGGGGEENYKAMTRATAKSTTDNQNAPLSGGF\n+NDGKMGTGCLPSAAKNYKYPENAVSGASNLYALIVGESYCGDENDDKAYLCDVNQYAPNV\n+RQRPLKQLIGYGYSPEYLGDDLHLFKLLDLAILKADFKNGDAALLIGGAAAVRIVTEYIS\n+IQKQADKVLCDDLDDPVRIKALRPRLGCGVGFSYQAFGALSPFLTACKKIVAKAEVERSK\n+MAKRKCLAGSFPPLCPAVKLISYGVKEWPCLNLKCAIFLFQVQPLLYTLLSKYAGKPKFC\n+NFAPGTKQFIELHAHGQLNFQYVTGFPEVRQSGAAPILKGPHNKKAFYISMCLTAPFRVL\n+VMGVRDESCDYSSAKVCGRNRLCIHCIGWARKDAIVSAKGTHPAHCAKSAHVVACRPGKR\n+ASDSVTYTVQEPAIKDYSVGVGRAGGNIVGPECTLNAFLQSYVFHANEEGGKLIGWTGGG\n+CGSYHGLWRAFGVQTCRAGLAKLQHSFGYRLLVKKGYNSGTSGAFMVLLDFIVQGRLIYA\n+LFVWGECNNLVDGTHKACAESVVYLQQQANYRKMFPWGYGEVAPACSKSPFPNHTAHRPN\n+HCNFTL\n+>E_11\n+PKFDSAGRAKHSRNELLNDPDAVVYSSGNAQTMAVKAKHDGAGMTGGKIGNYKLGKPLPY\n+GAKDKSVNKRVSSTKGLARTGGVADCELFPGFVPLIFVRLFWQKLETGTYFADANWGLAQ\n+GIHYAKLASGTAKKYIDLIGDKIHELGRELKVFFSCDHKKAGYKPDFLVGTNPKSLQASN\n+PYAGFEKRNAKQKNGKSGIILAKKRSFALTKVKQFDHSGCLGDCSGKHEVGEIGIKNLAW\n+GCNYLVPKQHNLFLFLRNEPWREIGPLGQSYSLRGEASVGCGPKKDGF\n+>E_313\n+FWEAIIKLSNVEAENSKGNVNATEIALHTHADHPGTERGCVFTSFLVLKKAHKGITADRP\n+RKKLANARLPKGLPFVGSESCCGPKWWRLQPKACSGFGTASGKTLVGRIVLLLKGEGLML\n+GNYFHTGAYANDLMTLAKKVNECWTSEQAACKHKPNGALCDITFQSGPAFESKVLYAKGC\n+YSAAKTDGGQLSDSLLQAKDFKLAPFRLDVQGLPDALTGGGNLSSGACIVASESPVGTTQ\n+SHIHGLESKFYGSFGGVHVAKLTEAGFFLFPAANLTCKAEQLAAILTETLHTTIGGVPFS\n+ATVDAARRYGGEDCSFRTVEKCGVFGRVLTPSGYTIILKLDACFWPGDRGCQLGAFRLIV\n+GGKNRTPIDWDARSEVQPRGLDLVGEDNCKRLRVSLSDTSLLSSQTANNWDECGDSRSVE\n+KKSMGVSLQVGMTYGQSFKVVTPNGKMFQYGHSRPEKLYSGIYAEGLGFVQNVIATTTFD\n+VNDEVAAFFADDFGKLSVGDQLMAEAIKGHVDGPVSQSNKFEYDRKMAGQVGSKIVKSQC\n+LAEETLCVGPFYAAFRHHGAVNENIYVNTKSSNSKAATNLHSAVEAKGLAKARVGLFMNS\n+LHCGLIKLRCGILNRVYCKALMVLRENNQCGFEGDPAHMQFLKPGLFSTKTAGQDKRRGP\n+DTLPIDRVAKLLNGNHLPGATTKGATNDPGQGRLVPFKDTGACKGAGCLFSLRPKPSVAM\n+KGDFHDVIKIVGEPRMPLVALQRLTKYRTPSLCITMTGNFISKGAVRKKTLHANFY\n+>E_315\n+FWEAFISTNRVLHSHSEHEGTDTGCEFPTFLLNEEKGIANDRPRKKLVRQRLPKELAYVG\n+SRPCCRGPSHWDLQPGTCEGVALATGTAASAKPLTGRRVHLTLLLKAEGILLSHYFYTGD\n+YMTNITSLKKMHVEECWAADQSACNHKVDAALCNITFDTGPAYGRKLAYAVGCCSTANTD
\n+TGELSEKLLHPRFIKLQLSMLDIQNLPQMLSGCGSLSTASVIVAREEPVVTKQQHGHGLE\n+STFFFAQSGIHPSKLPQRGFSLYPGGEVTCMGQELAAILTESSHPEINEVRFSESRDAKG\n+YGGDNCSKRAVEKCGVHGRVLDPADFTILSKLPPCFWGGICGCVLGKFRLIVDAKEKVPF\n+KWDAKDQVDPNGLDLIGDDECRLQVYQANAFKLTSKVDEKNMGVTREIGMSYAETFKTPQ\n+GKTFQFGLSRPLKLYSAAGIYANSMGFIANAYFAQEIGNGCVADDLKAEGVSGNSDGADS\n+QSAHFDFNRKFDGYVKIVRSHCFADGHLCSVGFYLKSHDGAPTEHVFVDTRGSCAKPCAK\n+LPCVVNAKDLGAATVGAFMTKCCALVVKCGITRKIYCKTGIVLRDHDECGFEGDPTHMEK\n+YLNPSLIARAAGAPRRRGPPTLERGKEGKLNDGVHLSASGKGCTCKPQAGKSAFTERGQC\n+QGYNGCLTHLRPQPNVGMGGDFFDLSKVVRHPPMSDSLIALIRYAKYRCRPMKCPFVCAG\n+VNTCGL\n+>E_13\n+ASIESGGIECKVVPAITLTNIGSGVTDVDDFKESSGSYSSVKGATAALYNGSIFLSAGFP\n+ERVPHDILVDDTHYAVASGCCAICWHVAMEVPLAGQEKICATNDVSFPNCNQAKCRKEKS\n+RFNLQDPDRSRILVVETTMVLFKKKVRKTAAVCALYIEAEYYRERAHYLKSYAQEKGTGP\n+SPLVECQL\n+>E_14\n+PKLDMQKSSKEYCHAHTLLSFVGSPSLKFYGEGFHSCVARPPFYDGDLMGKNGIPLLFGT\n+DDPTKTSRQILHVTDCADFVEGPPVKGKDNVSRFDQDPFVSSTNGYYEPRAEQPKPKQLQ\n+ATWAGGHSLAVPYQMKWIGIRGAGCCIFGGVAKSAAVFETVSDMNGHGHVRYIRRGCTKA\n+KWVAQTCKSARSGRVFFSGRGTRAKKCCQITRAETTRPFASGNEGCHSQTGVFVNFFKAV\n+EPCATVKALPNRQGLGGADIRFLLQGTDFRAAFKAFTVEQNTDLLGKAHHWKGAQTEDDA\n+TITKTMPNENHLALLINSLAKSYKLVYTGKCSLIEYEAASKATSFLPFGKRTDQNFQDID\n+VRHSRHAYLSAHLTAGHITADEANVTCNEASLIVALTRQKTCRGMPGTVLEAGGESGIDG\n+VGMALNVNIKCVKKHTHDVRELKPNEKVNTGIGIKVAKLSICDVEYVEDLNAGAQRPSYL\n+HPSNTGNRLGLVGLCKIDKIANRTLFRPNPINKCLKCRLKTGIKRDARRCEKLAVCYCAN\n+HDDFAPARSVAFACHISDTCFEIRHLCTNDSKFRLCIGFEETSFRIEIEGQDHQYLYVPC\n+GFRRSKIQLFLLVKGPKNGQAPPKCVVTEGTGPEEAISQSLAQLPIFEWSGKSLELIKPG\n+PNPSERKSLRIADKCKVRCAKQRMGDYGVDSPTELILTSHQAAESDLNEADPKSLNRPGG\n+FFVREAAQKPGLKASIFNKQKFCHCEQYYVIGGKKKSALASDLIMRGVSKIGVLYQGGLA\n+MEVCQSLISKYYGAFQSVRPPKLY\n+>E_15\n+ANAETDYPESFKHINAVLHLELKKRFLALYVSTNLACSPYLDVAGYLKIYPFKAVTKLDS\n+SLKNGFANTDKVDEMQKQARVVGFLSTRPEKETTLRFELQKKLGVEASVFRAAYYDLMPE\n+SGMICEIKHGSPGLIELTEHSGLIYATCFQASYICELGYYFFSKVGATFPLKKAARRPVL\n+KSTFAMPAATSVVPVTDNLNGESVHSGYTHGKAHVVALVVCLHDLTSIVVACTLARLGHT\n+HQEEEKGCNKAWIKKLNLSYMESGVEKGPQQCYKLKLKRAVTYKHHAAHGSNLIDVFSLR\n+EKDGEAKHEIKTLGGSDKLNLFSYNLANNTAGIKHI
KCLAYSYHLLGGWATPTRPSGPRG\n+GIHLSPCALKSSIDGSGVTLKQNMVDLRNWFTGDAYFNGYIGYSGWLG'..b'LAPRSGSGGRFPPPRLSLLEALFLGTPNADTRLCKS\n+FITGGCELLPH\n+>E_482\n+AHPKGKVLDGCLTASQSQIVWFCCERKRWTKFEAFVRLAQGDGSDVASFAYTPVKEAVAP\n+HIQGEGEDKFGKIKYYVERDKFPEHKCSPGATASESGCHAGSGKQHQHNILVSVGLASRH\n+MQTLATPSGGVSATENIYAPVGSLLLIQAEAFRKGAISAECHKVVRKFAFLIEYACLRSD\n+NLGTTNQFPDLDYLNFAQTKALARLKSGRVRVLLDFEWINEGSIKVSNHLGCEDNLGKGL\n+RHAVYLSVNDALGGYYEVTKYRHVPSRSRPDRHNLGDHLIDYRVTHDFANYANGMAPMKL\n+SPDSLRLKEQDPCSEGRAAVQQYGMVLSGTLEASTGQLEADDTTSDYSFGDEGKKDWVGD\n+AEAAKIATKLRHESGIIKRLCFKICIEHTKCPLRPFYLSPFLRAAADDGVNLCNYDIGSS\n+LISAAGGNADNQKRFHHKASNAFVRNHVCKSIGDEFLVGRPICVLTCKEKFRDFQALYGH\n+GQCLGQCACVKDCAILQAYSGVTVLQNASELERFTRNDDVDELGEFARLAKTYALGTFEQ\n+PTFSSPGLWSLHLKDNLITQIGGQSEKRSARIHLADAAQVAFGVNCLGGYYLRLKDDDDF\n+DWPEHTGGKIFNSKRMGMKIEEQQTLKESLGLLEMEVLFATTWAAGCQLVKPQYAGHQRG\n+PKGKRRALAPRPGSGGRFPVVQLTLLEAAFLGQPNLEHADNCLCKSYITGGCELLQQ\n+>E_483\n+AHLAGMVLHKCLTASESQIIWFCCEGRKRWKGETFVHLAQGEGSAVASFVFTPLKETTAA\n+HIQGEREDDHCKLGKIRYYKDREKFRAHKCSSQSTASDAGCIAGSGQYKKLQLSILDTVG\n+LESTHMDSLATPAGAVKRAELKGPAPFVLDKPHKRAEAVILSKHQLVSYEAIVLPVYGDA\n+CAKSKFRHVLKSTLPGNCSKSSERIYTPVGALQSIAREAFAISPECHRVVKTFAFLIEYT\n+CMGSFPDLQSMKLCHTKRLSRLICGRLRVLLDDWFNNDSIKVSNHLGCENEDLGKGLRPS\n+VYLSVNDLGGYYEATKYGHVPSKSHPPEERHELGDYLIEYRVTQDFANYKNGVAKMKLSQ\n+DCLRDKEQEPCSEARSAVQVFGLVLAGTLDLSTGLNMWSRVWQMEGDNSNGDYNFADNLN\n+KDWVALANAESVVARLRHNTGILKRVPFEICVEHTKCDLQPYHLTPFLRVADDEGVGSCN\n+YDIGSNLLGAKLCTPGGHSDNQKLFHHKAAAALIRHHGTKNVGDELLVSRSCVATCSEKF\n+KDREFDCAVTRAYAGVTATQNASDLERFTRNNELEQLGNIALAKTYALGAYQQPTFSTPV\n+LWKLHLEDNLITDLGDQSEKRSGRINLAAGTQVAFGVNCLGGKYFRLKNDDDFDWPEHAG\n+GKVFKSFHFMMKRVGLKIAELNTLKETPGLLDMEVAVTWTGACQLVRPHAAGNQPGPKGK\n+RRSLAPKVGSGGRLPLPRLTLLEAAFLGQPNADNRLCKSYITGGCQLLPH\n+>E_484\n+AHPQGKTLDGCLTASQSQAVWMCCYGQKKWGFETFVKLTQGDGSDVASFVFKPLKETLAA\n+HIQGEATEEHTLGKVKYYVEREKFRAIHKCPSGSTESDGDCRAGSKHYKQHQHTILLSVG\n+LEPTHMQAFASPPGAVKSAELKAPASFISANPHKRAAAVILPKHQLLIFEVIVLPVYENG\n+CAKSKFRHALKKTLPGNCSSSSERVYGPNGALLLIQQQAFAIVAECHKVLRNFAFLIDYA\n+CLRSFPDLQSMHLSQSKLLARLKSGR
LRVLLDFEWINDGSIKVSNHLGCENDYGKGLRPT\n+VYLSADEALGGYYEEAHYGHVPSTAHPDHHALSQHSIEYRVSQDFANYKHGLAKMKLSPE\n+SLRDKEQGPCGAAPSAIPAYGLVSSGTSESSTGQMEGDESHGAYPFGDNLHKDFVTLADA\n+ESIDPKLRHISGIIKKLCFKICFEHTKCPLRPFPLTPFLRVAKDKVVGACNYDGEQLISA\n+ALCSPGGDADNQKRFHHNANSALVRHHVCKAVGADLLVGRPICVATCSEKFRDFQALGKP\n+YGHGQCLMQCGCVKDCEVTHSFSGETLLQNAAGLDRFTRKNELDEVGPFALAKTYGLGSF\n+EQPTFESPVLWSLHLKNNLITNIGDQWEKRSGRIHLVDGAQVAFGVACLGGFYLRLEDDD\n+DFEWSEHTGGIFKSFNFMINLVGLKVAEQKTQKETPGLLEMEVLVTWAGACQLVRPHISG\n+NQPGPKGKRKSLAPRSGSGGKFPVPRLTILEPAFLGQPNVDNRLCKSYCPGGCELLPH\n+>E_485\n+AHPQGKVLKYCLTASQSQVVWFCCEGRKRWDFKNFVRLNHGSGSDVAAFVFTPLKETLTA\n+HIQGSAEDEHCKLSKVKYYAKQQKRAARCSCLGTSSQAGCRAGSGHYKQHQHFILVSVGL\n+ASTSMQNLATPAVAVKSEELKPKASLVAAKAHKRAASVITPKHQLLSYEVVLHVYDNGCA\n+KSKRIYGPVGAILLIEQDAFAVSAECHKVTRKFSFLVEYACSRSFPDLQSMNLAQTRILS\n+RLKKGRLRVLLDFEWKNGGSVKVPNHLGCEDDLGRGLWPTVFLSGNDALGGYYGETKYGH\n+VPSKSHPDRHALGDHLIEYRVTQDFANYRNGMLKMKLEPDSLRNKGQEPCSNARRAVQVY\n+GLILSGTLEQSGGQVEGDDTDGDYAFGDPLYQDWVPTAEAEIDTKLRGNSIIRRLCAKIC\n+LEHTDCPLRAFHLNPFLRVADDDGIGSCNYDVGSSVISASLYSPGNNADNQKRFHHKASG\n+TLIRHHVCKNVCVATCADKFRDFQALGKPYGHGDCLMQCACVKDCAVLHGYSSVTVTQNE\n+SDLERFTFDTDLNNLGNFALAKTYALGSFEHPTFSSPVKLWSLHLKNNLVTNVGDQSEKR\n+SGRIHLADGGQVAFGVNCLGGYYLRQKDDDDSDRPENTGSKSFFMVKRAGLKIPEQKTLP\n+GLLGLEVLAAWAGGACQLVRTHAAGHQPGPNGKRRSLAYTRSGSGGRIPVPKLILLDASF\n+LEQPSSDNKMCKSYIVGGCALLPH\n+>E_486\n+AHPQGRPLVLDGCLTILKSIAQVCWFCCEGKKRWEFETFVWLAQGDGSDVASFVFTPLKE\n+TIAFAHIQGEAEEEHCRLGKAMYYTERNKGKAPKSSSGAEAPGAGCRAGSGGYKQHQHSI\n+LVSVGLDTTHMRTLATPAGAVKSAEFKPPAVWIFIAAEPHMRAAAIILAKHQLLSYEVLV\n+LPVYEDGCAKSKRIYGPVGLILLIQQSSFAITAECHKIVRTFKFLLEYACLRTFPDLQSM\n+TLDQTKILARLKAARTRILLNLEWINDGMIKVDNHLGCENDHGKGLRPTVYLCVSEAAGG\n+FYPEETKYGHVPSKCHPNRHALGDQLIEYRVTQKFAKYKNSMVTMNLEKDKLRAKEEEPC\n+SQARSAVQVYGLTLSGTLEPSKKPMEGDDSNGDYSFGDNQYKDWVSLAEPDSIDTKLRQN\n+STIIKRLCFKICIEHTKYPLRPPHMNPFFRVADDDGIGCCNYDVGSSSFSAALCPPAGCG\n+LYHRNKHYPGKTDNQKRFHHKASSALIRHNVCKDVCVAKCAEKFRDFQAQGKPYGHGQCV\n+MQCACIKDCAVTHGYSGVTVLQSASDLERFTRNNDLDELGKFNLANTYALGSFAHPTFSS\n+PVLWSLHLKEGLIADFGDQSEKRSGRSHLA
DDTLVSFGTDCIGGYTLRLKQDGDFDWPEH\n+TGGKIFKSFHFMVKRIGLKIGEQMTLKADPGLLEMEVLVVWTAACQLVRVHATGHQPQPK\n+AKKRKLAPRSGEGGKFPVERLTLLEAAILGQPDANVRLCKTFIVGGCEILQH\n'
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/E.gff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/E.gff Tue Feb 18 17:56:58 2020 -0500
b
b'@@ -0,0 +1,310 @@\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t1\t1\t.\t-\t.\tID=E_319;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t2\t2\t.\t-\t.\tID=E_317;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t3\t3\t.\t+\t.\tID=E_366;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t4\t4\t.\t+\t.\tID=E_367;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t5\t5\t.\t+\t.\tID=E_368;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t6\t6\t.\t+\t.\tID=E_369;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t7\t7\t.\t+\t.\tID=E_432;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t8\t8\t.\t+\t.\tID=E_433;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t9\t9\t.\t+\t.\tID=E_434;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t10\t10\t.\t+\t.\tID=E_435;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t11\t11\t.\t+\t.\tID=E_436;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t12\t12\t.\t+\t.\tID=E_437;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t13\t13\t.\t+\t.\tID=E_438;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t14\t14\t.\t+\t.\tID=E_439;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t15\t15\t.\t+\t.\tID=E_440;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t16\t16\t.\t+\t.\tID=E_441;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t17\t17\t.\t+\t.\tID=E_442;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t18\t18\t.\t+\t.\tID=E_443;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t19\t19\t.\t+\t.\tID=E_444;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t20\t20\t.\t+\t.\tID=E_445;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t21\t21\t.\t+\t.\tID=E_446;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t22\t22\t.\t+\t.\tID=E_447;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t23\t23\t.\t+\t.\tID=E_448;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t24\t24\t.\t+\t.\tID=E_449;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t25\t25\t.\t+\t.\tID=E_450;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t26\t26\t.\t+\t.\tID=E_451;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t27\t27\t.\t+\t.\tID=E_452;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t28\t28\t.\t+\t.\tID=E_453;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t29\t29\t.\t+\t.\tID=E_45
4;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t30\t30\t.\t+\t.\tID=E_455;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t31\t31\t.\t+\t.\tID=E_456;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t32\t32\t.\t+\t.\tID=E_457;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t33\t33\t.\t+\t.\tID=E_458;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t34\t34\t.\t+\t.\tID=E_459;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t35\t35\t.\t+\t.\tID=E_461;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t36\t36\t.\t+\t.\tID=E_462;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t37\t37\t.\t+\t.\tID=E_463;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t38\t38\t.\t+\t.\tID=E_464;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t39\t39\t.\t+\t.\tID=E_465;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t40\t40\t.\t+\t.\tID=E_466;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t41\t41\t.\t+\t.\tID=E_467;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t42\t42\t.\t+\t.\tID=E_468;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t43\t43\t.\t+\t.\tID=E_469;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t44\t44\t.\t-\t.\tID=E_594;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t45\t45\t.\t-\t.\tID=E_593;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t46\t46\t.\t-\t.\tID=E_592;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t47\t47\t.\t-\t.\tID=E_591;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t48\t48\t.\t-\t.\tID=E_590;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t49\t49\t.\t-\t.\tID=E_589;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t50\t50\t.\t+\t.\tID=E_540;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t51\t51\t.\t+\t.\tID=E_541;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t52\t52\t.\t+\t.\tID=E_542;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t53\t53\t.\t-\t.\tID=E_384;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t54\t54\t.\t-\t.\tID=E_383;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t55\t55\t.\t-\t.\tID=E_431;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t56\t56\t.\t-\t.\tID=E_382;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t57\t57\t.\t-\t.\tID=E_381;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t58\t58\t.\t-\t.\tID=E_3
80;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t59\t59\t.\t-\t.\tID=E_379;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t60\t60\t.\t-\t.\tID=E_378;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t61\t61\t.\t-\t.\tID=E_377;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t62\t62\t.\t-\t.\tID=E_376;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t63\t63\t.\t-\t.\tID=E_375;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t64\t64\t.\t-\t.\tID=E_374;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t65\t65\t.\t-\t.\tID=E_373;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t66\t66\t.\t-\t.\tID=E_372;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t6'..b'2345678|ref|NC_012345.1|\tsim\tCDS\t246\t246\t.\t-\t.\tID=E_419;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t247\t247\t.\t-\t.\tID=E_418;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t248\t248\t.\t-\t.\tID=E_417;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t249\t249\t.\t-\t.\tID=E_416;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t250\t250\t.\t-\t.\tID=E_415;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t251\t251\t.\t-\t.\tID=E_414;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t252\t252\t.\t-\t.\tID=E_413;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t253\t253\t.\t-\t.\tID=E_412;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t254\t254\t.\t-\t.\tID=E_411;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t255\t255\t.\t-\t.\tID=E_410;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t256\t256\t.\t-\t.\tID=E_409;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t257\t257\t.\t-\t.\tID=E_408;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t258\t258\t.\t-\t.\tID=E_407;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t259\t259\t.\t-\t.\tID=E_406;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t260\t260\t.\t-\t.\tID=E_405;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t261\t261\t.\t-\t.\tID=E_404;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t262\t262\t.\t-\t.\tID=E_403;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t263\t263\t.\t-\t.\tID=E_566;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t264\t264\t.\t-\t.\tID=E_402;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t265\t265\t.
\t-\t.\tID=E_401;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t266\t266\t.\t-\t.\tID=E_400;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t267\t267\t.\t-\t.\tID=E_399;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t268\t268\t.\t-\t.\tID=E_398;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t269\t269\t.\t-\t.\tID=E_397;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t270\t270\t.\t-\t.\tID=E_396;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t271\t271\t.\t-\t.\tID=E_395;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t272\t272\t.\t-\t.\tID=E_394;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t273\t273\t.\t-\t.\tID=E_393;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t274\t274\t.\t-\t.\tID=E_392;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t275\t275\t.\t-\t.\tID=E_391;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t276\t276\t.\t-\t.\tID=E_390;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t277\t277\t.\t-\t.\tID=E_389;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t278\t278\t.\t-\t.\tID=E_388;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t279\t279\t.\t-\t.\tID=E_387;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t280\t280\t.\t-\t.\tID=E_386;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t281\t281\t.\t-\t.\tID=E_339;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t282\t282\t.\t-\t.\tID=E_328;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t283\t283\t.\t-\t.\tID=E_327;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t284\t284\t.\t-\t.\tID=E_326;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t285\t285\t.\t-\t.\tID=E_323;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t286\t286\t.\t-\t.\tID=E_321;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t287\t287\t.\t-\t.\tID=E_337;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t288\t288\t.\t-\t.\tID=E_1;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t289\t289\t.\t-\t.\tID=E_430;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t290\t290\t.\t+\t.\tID=E_3;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t291\t291\t.\t+\t.\tID=E_4;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t292\t292\t.\t+\t.\tID=E_5;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t293\t293\t.\t+\t.\tID=E_6;\n+gi
|12345678|ref|NC_012345.1|\tsim\tCDS\t294\t294\t.\t+\t.\tID=E_7;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t295\t295\t.\t+\t.\tID=E_8;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t296\t296\t.\t+\t.\tID=E_340;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t297\t297\t.\t+\t.\tID=E_338;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t298\t298\t.\t+\t.\tID=E_9;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t299\t299\t.\t+\t.\tID=E_10;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t300\t300\t.\t+\t.\tID=E_11;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t301\t301\t.\t+\t.\tID=E_313;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t302\t302\t.\t+\t.\tID=E_315;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t303\t303\t.\t+\t.\tID=E_13;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t304\t304\t.\t+\t.\tID=E_14;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t305\t305\t.\t+\t.\tID=E_15;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t306\t306\t.\t+\t.\tID=E_16;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t307\t307\t.\t+\t.\tID=E_17;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t308\t308\t.\t+\t.\tID=E_18;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t309\t309\t.\t+\t.\tID=E_19;\n+gi|12345678|ref|NC_012345.1|\tsim\tCDS\t310\t310\t.\t+\t.\tID=E_20;\n'
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/L.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/L.fasta Tue Feb 18 17:56:58 2020 -0500
b
b'@@ -0,0 +1,506 @@\n+>L_10\n+CVLCKYEIAALGNVLNKLFMTKLEDKVCGGDSQVYYKADARLTPAKTSTDNANSPLAGGY\n+HDNKLAFMGCYPTSAKKYNYPQQTIKAQKTDIFTLTARDHYDENTAGSYYCSFESVYACD\n+TRRCTNKPVVRAVKKLLGYGYRAKHESPYGRSTLGDNLHNVKQFTAKFYLKLSVFRDDFR\n+SVPKKLLIGSAAVYRAVTDYKSVSVGEQYETLTKKGNKENLGGTYSPVCAARGIDVACAD\n+KDGSQRKQVLSPRLACCVVFDYTAFGAIGELLLTVMSLITKVEAAKEKEGTNKCLVGSFP\n+CAENTLSGAGVKDWPGCLSLKCTFTLIQVTPMLYLMLCKYAQKPKFCNLGSNTRAFHQLQ\n+SHQMVSEYVEAFKENKPVGADPVLKGPREEKALYVGHCVPLSFRILSKGAVGEETDYSSS\n+QMAKTSLDQEHLCVGCTPWDARKGAAYKCKGTQQEHSAKSANVVASKVGKPDCIKGRSAW\n+NCMCKFVIGKDRITRTGDAVARTHENAIKKYAVAVASGVGTIMGPECVISDFVLQAYLFV\n+AGGTGGNVISWTPAGCGTYQALWKKYGVNTCWSGLVGLPLESYRQQLQKGYNRDSGGLLH\n+IMMGFVVQGRLVSALFPWGECRADLIQLTQKLTAQGGGYLQQSVKYRKLFPPAQGPVPPP\n+CTIGTFLTFHNLVEQGLKGTFNTAKRPNSCAFTF\n+>L_11\n+PKFDSVVNKSRSDLFNAPEAVLFTNSECQTITVKAKNKGTGVAAEKVNGYNVSQPLEPYS\n+MSKKPVPNCGLEGSKELGRRNAAATCIFPGLIPLVFIRFQDTGTYLGDPSWALLEGVHYY\n+THHNVRDLAHKPNTHKSAKKYINIFGAKLRPAGKELKSFFDCKKAAIRLHNKAGFLGETD\n+DYILGTNTDALQAYHPFEGFANKNGKRKNGKGGVILARARAIALKAKRQFHSVTLNFIGP\n+IGDCSGKHHIGQGLAKAVWGCTYLVPSHADQILLLLMDTPYREVGPLGKNYSLGHLGCEE\n+KKDGF\n+>L_313\n+FWHGFDKLNPHGAKNSQSTLNVRNKSLTTVANHSGKETGCAFKAFLVLKSQHKDITADRP\n+RNKLVNPYVTSEEVHFSREKLPKDLGYVGARYCVSGPKWWHLQPTECGLSDSTKPLCGRK\n+VLLLKVIGIMLHNYFATGAYMDDLFTLKRQTQECLAVCDPNFQSGPNFEAKVEYKNGSFA\n+PAKTNAGQLGTKLLQPRGIKPLPFELNVQNLPDMLGGCGDLGSGHDGPVIIARDTAVLAK\n+AQNKHGLESKFFASMGGTHSELAEAGFFLFPAGNYLICAGEKLAILTQIYTLHAQAGGLR\n+FKLSATLKNQFGRVYGSEECSFHTLECGIFGRVLEPTSFTIVGKLPPCFWGGDRGCALVQ\n+YMLVTGGKGRHPIEWEARPQSADVVGDDTCERSPVYQSHAFKLTSENANNWDEIGDSQKM\n+MNVGRQFGMEYGEGIKTDNDKIFQFGLSRSQKLYSTVTIYDDSIGFTSAGFFPDQIVTPS\n+VAKALFASGVAGHFQGADAQSEGYEFESKEEGVISIAKSCLVEDTLSPGFYTDFHHGTPE\n+NGVYCDTRGSHTKASCSLPSAVQSKELGTGAVGLFMSAFCCGLVKIMCTVTSKALCKTGF\n+LVVRDNDQCGFEKSPAHMRTYLSTGKYTPRTDGATKREKPPTIPLTPKIAKLGAGDQMHS\n+ATAAGCTNKPGVGLSGFTDAGEETKGFESCMFRLRALPTLGIQGDFFGIVPVVGEPKMNL\n+VTLRRLTRYRPPAICRTVKIAKFICTGGVRDKLLHTHGN\n+>L_619\n+EAVKKECQVVAACTLELGCDLVDGVTDLRSKFKKSNGGYTPALDLTSSLFSGKAFASGGY\n+VIVRNKDIVNANQFACCMSCCNTGWQVVIE
APLASSEKVGYKAHVNFPNCEEIVCKTERS\n+RFNLNSPARPDTLVVADAMVLKKSCKKTPVVCTLYIQKYYADRVQYLKDYSQGKISIGCD\n+I\n+>L_621\n+DSVKRDEASCKVVGACTLNIGKSDLAGGVSDVSGLKQSEGGFSPALGTSSGLFNVKIFAE\n+AGYAVLQPKDILVEEAHFSVCMSCCAVAWQIAIDPPLAALEITGYTVHVKFPNCEQIVCR\n+KEGSRLDLNDPRPVTLVIAAAMVLKKACKKTPFVCALYKQKYYNDRGQYLKGYAQDKAKC\n+IGYRV\n+>L_623\n+DSVKKSIAQLAYNKRDGVCKVVGACTLHLGKSALADGVTDVDELKQSEGGFGPALGTTSG\n+HYNVKIYAAAGYAVVQPKDVLDATHFAVCMSCPAIGWQVAIEPPLAGTGTPGSTVHVGFP\n+NCEQIVCRKGRSRLNLHHPERPKTLIVAEAMVLKKACKKTPFVCALYIQKYYNDRGQYLK\n+SYCQEKAKCIGYQI\n+>L_14\n+PQADIQRKFCHANALLFVNAPRVENFGDGFEACVARAPFYEGNLAGKGGVLLLFGTNDPI\n+MTAHKAGQVTGCVEVKGPFFHGRDPTGRYDHQKKSRLEAFVSELKSYFKQRAEQSIPRQW\n+EATWVGKMSLAVPYNIKWLKVRAGGCVSYGLVSKSAAVFDQVAAKVHDEHGHIRYVVWKC\n+TNARRHALTCKAGRGGTVFFCGRGTRVKKCSSTRTDKNQPFSSANQLCQTETGVLLDYFN\n+GTLGALPAAQGLSAGDVRFLLLSTNYNGPIKIYAVGRNKELLAKHHKWKGAQTAGDATIK\n+KTAPNESFLPFLVRNQKSHKLVFTGKSSLKAYASLAKSRAILAFGPHPEQGRTIYNGARS\n+IGSRYSVNEAAESCAKANSIVALTRKKSYRNMHNRILELSGESGLDGVIALNWNIKSAKK\n+QDDDAHEIKPDALIDHTVAGIEGAKLWICQVEYLADLNASAPVADYLHSAYGNGLMGVCR\n+INKIASRTMPRQHDVNSCVTCRQKSGISGAKKCATRHVRYSTEHKEFFMARSTHFRCNRM\n+DTGSFEILHANQADARGNKRLCVSFAQASGRTSKAGQDNLYIYISIGFKRCQERRPKKCK\n+IRCGKKKVGEVDTPPNYVLNYSQGDADLQDLIPALNKPGDFFVRSATDKQSANASIFNEK\n+QFCNCNQSGVAAVVGKKSRALSSEQIVKGPSNVGGLYQDGTAMQVCEPLISNYGCGTYTS\n+IRPIKYLC\n+>L_15\n+PKGTNYQGFRTETLHLDAKTTFTPAFYVTKELACAPCYLHVEGFLMVYSLKEITKADEGP\n+LKNGKATAKVNDLQEEARVATFENRLKSELQKRLGVESADFQAQYYSLLNDVGLVCDSKY\n+KAGLIGHSNHKELIDAACFQCGYHCDAYIFFSRVGSQFPKRKAAGKGPFRGVFATPPAKA\n+VSTIHDHLSEGHWVHTIYTNGKAHVVALNPVWHDLGVLAVAVSLGPLAELDEGKNRGCGK\n+NWVKRLTLGYLESNIPYVEGTVKCYKVKLKRATAVGSHPNDGYVMANVYPLKMPSGVGAS\n+KHEVDAFGNSENLSLFETNLGNYTNGTKKEKCQDVEYRLWGGSNPPTKPAGARGGPHLCG\n+SSPTGATGVTEKENMEELRRFAAGDGFFKGYIQYGGWFGGLKDKAWLEKFREEFGVVSNG\n+RDKRTGELKHVECPIQVQKPYNNPLILHHEKDCGRKTRVHGSGGEKDVGPWRGDTNTKQD\n+KQKFGSGKL\n+>L_16\n+LDDDETQLSDIKDEECRLFDFPGKHVGGFGACASQAAAGLGQIFHCAVGTGRLGLVNVAD\n+VRNSSSTRAHHVKLTHDSGLGPSAFKILLVPQAIKLVSITDESSNPVDVADLPFHNPWND\n+ASYFAQRTHGKWENGVLKTATDKDASHLRFLTRNLYHQVSFIEIQT
LADESLHVSGISPR\n+YYHQSRAFDEYLSVPPAERRKLDECTSDYNGKQAKLAAQIVTRPFGIDSNIALLESAGNS\n+'..b'HGDASVAKSKELESLKVQGFEDSTTILGRGDGDVNEPVYDHTKFTLAVVGRLGQVLCST\n+ILTSQMPTVKGQTCDNVLISHYCLLMALPCQTLVVVKNHKRLKYQSYSNSFMGDARNEHY\n+GSPNSTAIKHVRVLSVCKNNFFEPCLHPTSVAGMKGVLAGACGEDRCKETQDQEPSTEPR\n+ECPGLKMVQHMRVSAGNLIAYNVSFFIKDTALSNANEAHTGGVASLRTATHTWGVTANRV\n+DYFNAVLKGYHTALVKTTRCGVGFLKGAILQFIPLVKCFVVTKVAHVCVRVDQKSGNDIR\n+DCRSWLGKAKGAQDDVTNFAKSPALENSKGKGANSRSPDGTAICMSSVAVEKCLGGRCVY\n+GKTEPEGLTNSEFEEPKGRAESYTDSVATLETLAQCGYAISDTAALPLFCLLLGAHDTQL\n+APFDRYGPESSKGIQLNELAYLEAYVSGNCQNKLSQKVGLDEGEFSLQKPIAVPAPYPKD\n+TCVGTMVSKSNSALVSNTHSETASQPFVCCGSKHLVLKVEACNLVVKNGTKKDIVTAEKE\n+PCQYNCGHGAVIAKLTTEDSQLYGPDVVCMKGPALCNSKKDIEPSKLPALVWSMGGKKCP\n+AENLELRYINFRLLYPEQAEPENSDLAHKSS\n+>L_5\n+NCESGNAEADESGSGNYAKCICSGFRREIWQLTMEADANIEHEHKGASEEPISPKGDNVN\n+VLGKDCEKPLVHQKSKDDLKASARLLIKCVSKNAWHNPLQGNSLPGYANKWGVALLNLIL\n+LYSFKALSRAIALRYTGGAKDSPPFINESVVFGAPAAHILVTSMSGNMHGEKHPQRSSVS\n+CAAVDRSKPDTKRAADPRKAQLEGIFDERLHKCVKVSTGEVVNGVHALYAKLYRTPPPVT\n+DAKCFVSKDKGAINEEGKLIGQKVGGVLAPIGRGHAHLFVGNKAAFPMPVNVACLSTGSG\n+MADTGEGTNGDDIAADKSANEQIKIVGALQNHGRPLEFNKGSGPFQLNDKLEEAYFYQCT\n+QHEHAAAHKHARVTSCANGAQTSIWGCQFALLFLPAGFKTTPGLQRFWEFGHAGHLDTQL\n+HGETCLMKAPKTCAHLVVVERWTYSLQLEPFATSQNKAVIFEKESSRSLFNCYPLKEKKN\n+SGVGDTKKTPEVGTFECVIKPYRWQILADAKKNKTLRGTSFAFCSALHLTSPVLRNQIAL\n+RCHTDKVSEETWQMPATFASSVFGVKVIFNERCVTHMSCSSEGEAGLHDLVKAGLQRAKN\n+PLSHPPVSYPLTIVYKVDAKNVGQLSAPCNRQAIQKEKMQSNGLVSKCCCTRTDTAPSTL\n+TKASEVFPLPISAVQVAGLAATHADEPYESFAWAMFTIGEYTQKVKNGQKADTGLGVPCL\n+VHEYGPAEAFDRHYRGSQDCDLRQGALWENASANLRVNVKPEAVANNTCGKTGGSDKGDH\n+DLVSVETVKETLNSANVAEVTAHFNQSIGCILCLKQLECGLSAQSIVKKQNGKKKIETPK\n+VQTVQAALKLKGRCSVRQHNVWAFTNSPVVVAGSQYAHKGIKLLEINAEEQVLIAGNAPR\n+FPGQLGTGSQF\n+>L_6\n+QLPFSWYFKPDVRLIIKEELACHTTAAQKMREPMLPLRRITDAEPAGFIEPLNGLIVKPH\n+DDHPVGDAFKPRIWCNTEYVLFQGYAGHHTAGHNLHKHFLARQERPNEYLTPMGMGPGDV\n+LKGRQGGGFFYVQKELPLWHAIGAGKVKKLKKAFYIRKADMRFHPSFKNHQCVELSIVDG\n+LLNAMATPGSPQLFLNRGDEDLRGEECNSVNTFADKLLRTTMDPCEASGYHASKTFGRES\n+IGDHPSYVLPGGLRMTWDTDEECMIMK
AYLIKAENYLLSKPKATTTMVSPYSFFDFARLH\n+HLLPPLGASATGLDCAVYDYVVTDTIFREHVKNQACPAVVYSVNGWSKELIHGKLSVGGG\n+WEQGLDGPFKYHHTQEPFEDKVDVKGAIPVDTKFKAGKFKKHKQSQLINGGGSLYKESCF\n+AHKMKRERNKTPDTGAKNGQGIVQANMSGFTVDGMRALQPEPAQSANVTAGVLAVAVAAV\n+SYFDRVQTTNCEVYASGFWPQAVRGKIKMNQAPPIAEAFFKLGKSELCDGEQFTIGADQP\n+DSKVLIGRASGLCHFLMTPPIEAGWLTTNISQYENDAGTHQDVAKDASVTANFFCEVTVV\n+GISITHGLSADKRSIFRGVISATQSGSVPLTGLALVPPVGLSPQTLTNRLAGLIGYGKLA\n+CLKCTVYKSTRRTLAIVLLEYRVSVWIAKEPRAKLVMNAKAHALHLTHRHSSDRMPFAFS\n+GRNCKAADQPGILTHNKMCQCGDFGLPHEKYGFAHLSRSSFGVSCTACSNPTIVSALHRA\n+ESIHRSGAWLNSQDSTETGTNLFGPTSKESRESICGNQFSVTATIGQLGYVTDVLAHGMV\n+LAFCDFAKTASAGPPKEKVNCDDGHGGLMLEANVFSEESDVRKHLGLSEKGYHCVLTSKT\n+LVKFLIKNQTFHCGAEGCVPTGSGAFGD\n+>L_8\n+CRLPGGVNERAFGHVNDKDLCMLPSPVFCTQKGKEHPPNKEYQMAGSKPPTWPAAQVVDC\n+RHELRTYTGQLPMRSATDLGPNVKSIYTVSERGFKVGQTNHAVCFEAGNVEDKKWKMCHG\n+KNYGRSESWLYFSMNEKANGHLKDLHPSAYQRPKKWTGMRDFGATTKTGLRLVAFSDPSG\n+ACVDMPYLSDCPRGKLSRPTIPPGAGLTVEFTAASARCNKLAEIANAAAKAQKFFTTGIM\n+TSAFLAAKSAVTPTHENKTNGLSLQHPNKSGEELKDYAVKPFGLVQSKLAGTAHAQMIYK\n+DPAGSGYFNNFVTNYPKITHDLIFCPKGGLEFTNGVPFGSPLAGCQLYKSTFPVKSLGKA\n+CEIFSLRRMALSQENKQHVNDHLTAKVGANGPSRGIDVQVGCAHEPNCGGPQLREDFFCL\n+TLGAAHGRFVKSLARDSLQLCFHADITPPLVISISTKILGKVVKLRGASGETVELASAQA\n+VASRPSKQAERARIGFCCGSFSIHADATLQSGSCTGGTDKKLALEQDDDPCVTARQGSGL\n+QRAGQPIKSRSHEACKADSLSDKAAPGQSWTMEIGVETYQVMQGNGPRRTSRSTLYAEGG\n+VIDWFKGAHNSYEFTGIVCSGIRDMLTPQDFQDIKEQTGDLSCMAVNCNAANDIHCSAGQ\n+VLPFKERLVCRHATSGKLINDLSGTSSKVGGMKLPLSSTHFLKLTINEGGPVRTGADSHC\n+SGFSCGCKALKLKDFIPSRQLGSVTGGKQVVTLPNKEGGDTTNLPKEYANTGGMCAVCPN\n+SAHGTGGMTVLSLGAFGYRYTCLVGVEDASKDLLVGNGLAFYHTLYVSLHGKVNHTDSPG\n+DWVSFGIHTSENKSTCTGNGCILHVSVHSQQFGDFLACKHGKQRVPDKERYYYDFAANAV\n+PGTTTPSGILLRTVRTAKSPAKFHFG\n+>L_9\n+LALHHDDACICTRAVGFFYTQFKQEAPVSCASVNKEFDHFSVDKKDPWAAIGLASAAGNN\n+GHNFVAKNKTKQYRSRQRYSRAGSGPIVRALFTAYATTIQNTHTFTTPLGKKRIVDNALR\n+DGSVSRACLPLELSPFVRIRCACSGGLAGAAGFFTVVVPLLLVLLQVNGSLKLTWLGAMY\n+AVFPVLDLRRVLLVVTADTGLETFRPAPNGRHSKDCAT\n+>L_648\n+LYLHHDDACICTRAVGFFYTKFHQEAAVACASVNKEFDHFSVDKKDPWAAIGLTGSTVGN\n+NHHNFVARDKTKQ
YHSRTEDQRYSRAGSGPIVRALPTAYATTIQNTHTFTTPLGKKRIVD\n+NALKDGSVSRECLPLELSPFVRIRCPCSGGLGAAAFFTVVVPLLAVLLQKSGSVKLKWLG\n+AMYAVFPVLDLRRVLLVVTADTGLETFRPSPNGRHPKDCAT\n'
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/L.gff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/L.gff Tue Feb 18 17:56:58 2020 -0500
b
@@ -0,0 +1,41 @@
+gi|12345678|ref|NC_012345.1| sim CDS 1 1 . - . ID=L_319;
+gi|12345678|ref|NC_012345.1| sim CDS 2 2 . - . ID=L_317;
+gi|12345678|ref|NC_012345.1| sim CDS 3 3 . + . ID=L_617;
+gi|12345678|ref|NC_012345.1| sim CDS 4 4 . + . ID=L_6;
+gi|12345678|ref|NC_012345.1| sim CDS 5 5 . + . ID=L_7;
+gi|12345678|ref|NC_012345.1| sim CDS 6 6 . + . ID=L_8;
+gi|12345678|ref|NC_012345.1| sim CDS 7 7 . + . ID=L_9;
+gi|12345678|ref|NC_012345.1| sim CDS 8 8 . + . ID=L_648;
+gi|12345678|ref|NC_012345.1| sim CDS 9 9 . + . ID=L_10;
+gi|12345678|ref|NC_012345.1| sim CDS 10 10 . + . ID=L_11;
+gi|12345678|ref|NC_012345.1| sim CDS 11 11 . + . ID=L_313;
+gi|12345678|ref|NC_012345.1| sim CDS 12 12 . - . ID=L_623;
+gi|12345678|ref|NC_012345.1| sim CDS 13 13 . + . ID=L_333;
+gi|12345678|ref|NC_012345.1| sim CDS 14 14 . + . ID=L_2;
+gi|12345678|ref|NC_012345.1| sim CDS 15 15 . + . ID=L_3;
+gi|12345678|ref|NC_012345.1| sim CDS 16 16 . + . ID=L_4;
+gi|12345678|ref|NC_012345.1| sim CDS 17 17 . + . ID=L_5;
+gi|12345678|ref|NC_012345.1| sim CDS 18 18 . - . ID=L_635;
+gi|12345678|ref|NC_012345.1| sim CDS 19 19 . - . ID=L_633;
+gi|12345678|ref|NC_012345.1| sim CDS 20 20 . - . ID=L_631;
+gi|12345678|ref|NC_012345.1| sim CDS 21 21 . - . ID=L_629;
+gi|12345678|ref|NC_012345.1| sim CDS 22 22 . - . ID=L_627;
+gi|12345678|ref|NC_012345.1| sim CDS 23 23 . + . ID=L_323;
+gi|12345678|ref|NC_012345.1| sim CDS 24 24 . + . ID=L_637;
+gi|12345678|ref|NC_012345.1| sim CDS 25 25 . + . ID=L_639;
+gi|12345678|ref|NC_012345.1| sim CDS 26 26 . + . ID=L_641;
+gi|12345678|ref|NC_012345.1| sim CDS 27 27 . + . ID=L_643;
+gi|12345678|ref|NC_012345.1| sim CDS 28 28 . + . ID=L_645;
+gi|12345678|ref|NC_012345.1| sim CDS 29 29 . + . ID=L_647;
+gi|12345678|ref|NC_012345.1| sim CDS 30 30 . + . ID=L_336;
+gi|12345678|ref|NC_012345.1| sim CDS 31 31 . + . ID=L_328;
+gi|12345678|ref|NC_012345.1| sim CDS 32 32 . + . ID=L_331;
+gi|12345678|ref|NC_012345.1| sim CDS 33 33 . - . ID=L_621;
+gi|12345678|ref|NC_012345.1| sim CDS 34 34 . - . ID=L_619;
+gi|12345678|ref|NC_012345.1| sim CDS 35 35 . + . ID=L_14;
+gi|12345678|ref|NC_012345.1| sim CDS 36 36 . + . ID=L_15;
+gi|12345678|ref|NC_012345.1| sim CDS 37 37 . + . ID=L_16;
+gi|12345678|ref|NC_012345.1| sim CDS 38 38 . + . ID=L_17;
+gi|12345678|ref|NC_012345.1| sim CDS 39 39 . + . ID=L_18;
+gi|12345678|ref|NC_012345.1| sim CDS 40 40 . + . ID=L_19;
+gi|12345678|ref|NC_012345.1| sim CDS 41 41 . + . ID=L_20;
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/M.fasta
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/M.fasta Tue Feb 18 17:56:58 2020 -0500
b
b'@@ -0,0 +1,512 @@\n+>M_10\n+CVLHKYEIAALGNVLNKLFMTKLEDKVCGGDSQVYYKAKSPLTAITSTDNANSPLAGGYH\n+DHKLAFMGCIPTSAKKYNYPEETIKAQKTDIFTLSFATARDHYDESSAKSYLCNFESVYA\n+CDTRRCTNKPSVRAVKKLLGYFGYRAKHESPYGRHTLGDNLHSVKQFTSKNYLKLSVFRD\n+DFRRVPKKLLIGGAAVYRVVSDYKSTKKGNKESLGGTYSPVCAARGVDVHCAKKDGPDRK\n+QVLSPKLKCCVVFDYTAFGAIGELLLTVMSLITTIEAAKEKEGTNKCLVGSFPCAEITLS\n+GAGIKDWPGCLSLKCTFTLFQVTPMLYLMLCKYAQKPKFCNLGSNTRSFCQLNSHQLVAE\n+YVETFKEKKPVGADPVLKGPREEKALYVGNCVPLSFRILSKGAVGEETDYSSSQMARTSL\n+DQDHLCVECTPWDARKGAKCKGTQQEHSAKSANVGGCKVGKPQCIKGRSAWNCMCKFVIG\n+SDRLARNGDAVARTHENAIKNYAVSVARGVGTIIGPECVISDLVLQEYLFVAGGTGGNVA\n+SWTPAGCGTYQALWKKFGVNTCWSGLVALPLESYRNQVKNGYNRESGGLHIMMGFIVQPR\n+LVSALFSWGECRADLIELTQKLDAESGGYLQQSVEYRKLFPPAQGPVPPSCTISTFLTFH\n+NLVEEGLKGTFNTAKRPNACTFT\n+>M_11\n+PKFDSVVNHSRSDLFNNPEAVLFTNSECQTISVKAKNKGTGVAAEKVDGYAVSQPLEPYS\n+MSKKPVPNCGLEGSKELGRRDAAATCIFPGLVPLVFIRFQDTGQYLGDPSWALLEGVHYY\n+ASHGVSDLARKPNTHKSAKKYINIFGAKLNPTGSELKSYFDCKKAAIRLHNRADFLGETN\n+DYILGTNTEALQAYHPFEGFANKDGKKKLGKGGVILARPRTIALKTKRQFHSVTGLNFIG\n+PTGDCSGKHHIGQGLAKAVWGCTYLVPSHADILLLLMDMAYREVGPLGKGYSLGHLGCEE\n+KKDGF\n+>M_313\n+FWRGFAKLNPHDAKNSQGTLNVKNKSLTTVANHSGTETGCAFKAFLVLKSAHKEITADRP\n+QNKLVNPYVTSEEVHFSREKLPKTLAYAGARNCVSGPKWWHLQPTECGLSDSTKPLCGRK\n+VLLLKVIGIMLSNYFATGAYADDLFTLKRQQERIATCDPSFQSGPNFEAKVVYKIGSFTP\n+AKTDAGQLGSKLLQPRGIKPLPFELNVQNLPDMLGGCGDLGSGHDGPVIIARDTAVLPKA\n+QNKHGLESKFFASMGGIHSELALDETGFNLFPAGNYLICAVEKLAILTQIYTLHAAGGLR\n+FKLSASNQFGRVYGGEECSFHTLECGIFGRVLEPTSFTIVGKLRPCFSGNDRGCALVQYL\n+LVVGGKGRHPIEWEARPQGADVVGEDTCERSPVYSHAFKLTSENANNWDEIGDSQKLMNV\n+GRQFGMEYGEGFKTDNNKIFQFGLSRCQKLYSTVGIYDDSIGFTSAVFFPDQIVTPSVAK\n+QLFASGVVGHFQGADAQQEGYEFESKEEGTISIATSCLVEDTLSPGGFYTDFHHGTPENG\n+IYCDTRGSNTKSSCNIPSAVQAKELGTGPVGLFMSAFCCGLVKILCGSKILTKTGFIVVR\n+DNDQCGFEKGPAHMRTYLSTGKYTPRTDGATKREKPPSFCTGTIPLAPKIAKLGAGDQMH\n+GATAAGCTNKPGTGLSGFTDTGEETKGFEGCMFRLRALPTLNMQGDFFGIVSVVGEPKMN\n+LVTLRRLTRYRPPAICRTVKIAKFACTGSVRKKLLHTHGN\n+>M_619\n+DGVKKECQVVGACTLQLGSDLVGGVTDVEKFKKSNGGYTPALNLTDSLFSGKAFAAAGYV\n+IVRPKDILVNENQFACCLSCCDTNWQVVVEAPLASSIRVG
YKVHVNFPNSEEIVCKKERS\n+RLSLGSPARPDTLVVADAMVLKKSCKKVPIVCTLYIMKYYADRQQYLKGYAQEKIHSIGC\n+DI\n+>M_621\n+DSVKRDDVSCKVVGACTLNIGKSDLAGGVSDVSELKQSEGGFSPALGTTSGLYNVKIFAA\n+AGYAVLQPKDILVDEAHFSVCMSCCAVAWQIAIHPPLAALEITGYTVHVKFPNCEQIVCR\n+KERSRLDLNDPERPITLVIAAAMVLKKQCKKTPFVCALYKQKYYNDRGQYLKGYAQEKAK\n+CIGYRV\n+>M_623\n+DSVKKSIAQLAYNKRDGICKVVGACTLHLGKSALADGVTDVDDLKQSEGGFGPALGTTSG\n+LYNVKIYAAAGYAVVQPKDVLDATHFSVCMSCPAIGWQVAIEPPLAGTGTPHSTVHVGFP\n+NCEQIVCRKGRSRLNLHHPERPKTLIVAAAMVLKKSCKKTPFACALYIQKYYNDRGQYLK\n+SYSQEKAKCIGYI\n+>M_14\n+PQANIQRKFCHDNALLAVNAPRVENFGDGFEACVARAPFYEGDLMGKGGVLLLFGTNEPI\n+MTAHKAGQVTGSSEVKGPFFHGRDPTGRYDHQKKSHLEVFVSELTSYFKQKAEQSIPRQW\n+EATWVGKMSLAVPYNIKWLKVRGGGCVSYGLVSKSAAVFDQVAAKVHEEHGHVRYVVWKC\n+TNARRHALTCKAARGGHVFFCGRGTRVKKCTSTKTDKNRPFSSANQLCQTETGVLLDYFK\n+GTLAALPAAQGLSAGDVRFLLLSTNYRGLIKAYAVGREKELLVKHHKWKGAQTAGDATNK\n+KTAPNESFLPFLVKGQKSHKLVFTGKSTLEMTRKEYASAAKSRSILGFGPHPEQGRTIYN\n+GARSIGSRYPVNEAAESCTKANSIVALTKKKSCRNMHNRILEASGENGLDGVIALNLNYK\n+CAKKETDDAHEIKPDALIDHTVVGIDGAKLWICQVEYLADLHASALVANYLHSTYGNGLM\n+GICRINKIASRTMPRQHTVQSCVTCRLKSGISGAKKCAPKHVRYTTEHKDFFMVRSTQFR\n+CNKMDEGSFEFLHANQNQPKLGSFGQHDHVESHNEPGKYIEKGHGPHHPIEDARGNKRLC\n+VSFTQASGRTSKAGQDNLYIYISIGFKRCQERRPKKCKIRCGKKKVGEVDTPPNYVLNYS\n+QGDADLEDLIPALNKSGDFFVRSATDKPGASASIFNEKRFCNCEQCNVAAVGGKKSRALS\n+SEEIVKGPSNVGGLYQGGTAMQVCEPLIPNYCGTYTSIRPVKYLC\n+>M_15\n+PKGTNYQGFRTETLHLDIKTTFTPAFYVTKELACSPCYLQVEGFLMVYSLREITKADEGP\n+LKNGKKATAKVNDLQEEARVSTFENRLKSELQKRLGVESADFQAQYYSLLNDVGLICDSK\n+YKAGLIGQADHRELIATACFQCQYHCDAYIFFSRVGSQFPKRKAAGKGPFRGVFATPPAK\n+AVSTIHDQLAEGHWVHTIYTNGKAHIVALAPVWHDLGVLAVAVPLGPLAALDAGSNRQCG\n+KNWVKRLTLGYLESNIPYVEGTVKCYEVKNKRATAVKSHPEHGSVMATIYPLKSGVGASK\n+HEVDAFGGSENLSLFSTNLGNYTDSTNSTKKEKCQDCEYRLWGGSNPPTKPAGARGGPHL\n+CGSAPTGSNTGTGVTEKENMAELRCFAAGDGFFKGYIQYGGWFGGLNDKAWLAKFREEFG\n+NVSNGRDKRTGELRHVECPIQVQKPYNNPILHHEKDCGGKTRVHGSGGEKDVGPWRTDTS\n+TKQDNQKFASGKL\n+>M_16\n+LEDDETQLSDIDDEECRLFDFPGKHVGGFGACASQAAAGLGQIFDCAVGTGRLGLVNVAD\n+VRSSSSTRAHVKLTHDSGLGPSNPVDVAALPFHDPWNDASYFAQRTHGKWENGVLKTATE\n+KDASHLRFLTKNLY
HQVSFIGIQTLADESLHVSGISPRYYHQSRAFDEYLSGVPPAEKRK\n+LDECTSDYNGHQFKLAAQIVTRPFGIDSNI'..b'ANLIAYNVGFMTKDTALSNANEAHTGGVASLRTATHT\n+WGVTANRVDYFNAVLKGYHTALVERCGVGFLKGAILEFIPLVKCFVVTKVAHVVRVDQKT\n+GNEIRDCRSWLGKAKGAQGDVSNFAKKPALENSKGKGANSRSPDGTAICMESVAVIKCLG\n+ERCVYGKSEPENLTNSEFEEPKGRAESYTDSIATLETLAQCGYAIADTAALPLFCLLLGA\n+EDTQLASFDERYGPEATSKGIQLNDVTYLEAYYSGNGQNKLGQQVGLDEGEFRLQKPIAV\n+PAPYPKDTCVGTMVSKSNSALVSDTHKATASQPFVCCGSKQLILKVEACDLVVKNGTKDD\n+IVTADTEPCQYNCGHGAVIAKLTTEDSQLYGPDVVCMKNPAKCNSKKDIEPSQLAALVWA\n+MGGKKCPAENLELMYINFKLLYSEQADAENSDLAHKGS\n+>M_5\n+NCESGNAEADESGSGNYAKSICAGFRREVWKLTMEADANIEHEHKGATEEPISPKGNNVN\n+VLGKGCEKPLVHQKSKDDLKAEAQLLIKCEAKNAWHKPLQGNSLPGYAPKWGVALLDLVL\n+LYSFKALARAIPLRYTGGAKDSPPFINESVVFGQPLEHILVTSRYEMSGNLHSEKHPQRS\n+KPDTKPADPRKAQLEGIFDERLHDCVKVSTGEVVNGNDNTTVHTLYAKLYRTPPPVNDAK\n+CFVSKDKGGINEEGKLIGQKVGGVLDPIARGHAHLFVGNKAAYPMKANVACLSTGSGTAD\n+SGDGTNGDDIAADKSANEDIKIVGALQNHGRPMEFNKGSGPFQLNHKLEEPYFYQCTQHD\n+HAKAHKNARVTSCANGQQSSVWGCQFSLLFLPAAFKTTPGLQRFWEFGHAAHLDTQLHPE\n+TCLMSAPKTCAHLVVVEKWTYTLQLEPFATSQNQSLIFEKNSSCSLFNCYPLKEKKNSGV\n+EADAVDQPGDTKKTPEIGTFECVILPYRWQILADAKKNKTMRGTSFAFCNALNLTSPVLR\n+NQIALRCHTDKVSEETSQMPATFASSVFGVKVIFNERCQSHMSCSEEGEAGVHDLVKAGL\n+QRAKNFPLSHPPISYPLTIVYKVNPKNVGHLSAPCNRQAIAKEKMQSNGLVSKCCCTRTG\n+TAPSTLTKASELFPLPISAVEVAGLAATHADEPYESFAWAMFTIGEYTQKVKNGQKAGSG\n+MGVPCLVHAYGPAEAFDRHYRGSQECDMRQGALWENASQELRVNTNPEAVANDTCGKTGG\n+SDKGDNDLVSVETVKETLNSARGSGYGVAEVTAHFNEAVARIGCILCLKQLECGLSAQSI\n+VKKHNGKKKIETPKVHTVQVALKLKGRCSVRQHNLPAFTNSPVVVAESQYAHKGIKLLEI\n+NDEEQVLITGNAPRFPGELGTGSQF\n+>M_6\n+QLPFSWYFKPDVRLEIKEELACHTTAAQKMKEPRRIEDAEPAGFTEPLNGLIVKPHDENP\n+VGDVFGPRIWCDTDYVLFAGYAGNHTAGHNLQKHFLAHQARPNEYLTPRQGGGFFYVQKE\n+LPLWHAIGAGKVKKNKKSFYIRKADMRFHPSFKNHQCVALSIVDGLLNAVATPGSPKLFL\n+NRGDGELRGEECNSVNTFADKLLRTTMQPCGASPFGRESIGDHPSYVLPGGLRMTWDTDE\n+ECMIMKAFLIKAENYLLSNPKATTTMVSPDGFFDFARLHHLLPPLAASATGLDCDVSVYD\n+YVVSDTIFREHVKNKACPAVVYSVNGWSKEIHGKLSVGGGWEQGLDGPFKYHHTQEPFED\n+KVDIKGAIPVDTMFKASMFKKHKQSQLVTGGGSLYKESCFKHKMKRERNKSADKGANLGQ\n+GILQTAMSGFTVDGMQALQPEPAQSANVT
AGVLAVAVAAVSYFDRVQTTNCEVYASGFWP\n+QAVRGNISVNQGPPFSEAFFKLGKPELCDGEQFTIGTDQPDSKVLIGRASGLCHFLMTPS\n+IEAGWLTTNVSQYENDAGTHPDVGAKDAGVTENFFCQEVTVIGISITHGLSADKRSIFRG\n+VISATQSGKVQLTGLALVPPVGLSPQTLTNRLAGLIGYGKLACLKCTVYKSTRRTLAIVL\n+LEYRVAVSVAKEPRAKLVMNAKLHTLYVTHRHSSDLMPFAFTGRNCKATNQPGILTHNKM\n+CQCAEAGLPHEKYGFAHLSRSSFGVSCTGCSDPTIVQALHRAESIHRSGAWLNSQNSTET\n+GAILFGPTSKETRDSICGNQAFSVAATIGQLGYIVDVLAHGMVLAFCDYAKTAGGSPPKE\n+KVSCDDGHGGLMLEANVFSEDDHVRKHLGLSENGYHCVLTSKTLVKFLIRHQTIHCGTEG\n+CVPTGSGDFSD\n+>M_7\n+SENNIKWPQLGGVALYGEDANMELGADGVPSLASLGMPWPVLFNANLSGKQCAQCRIFIV\n+CHLTQPHGCGAMQVGMSGDSEAKDQVKLNGGACKDKFRGRTLMAMYPFGRVLFATPSTVA\n+FDKFILKEGFGFLGRCAAKVAATQPLNGVTTAVQVVNKCCNKSKKSLEPLLTGRDHAAEG\n+CGYASAFTVALIKNSYHCDYYSDHAKYASKSYSKSSRALASYFLIQFISCTKGLCSESHE\n+CVKNEFLVKIWAGSKMGTSIPTDYTMLTDPGYPYECDDHQNNRHCSGEKMPKLQNHPSYS\n+AFTQRRKSFTKQLTPSKGERKFDKNAVHLDIGKVTPTASDEYVEALSLVHPTALNPAFGM\n+KAVYQYLKRAYKKGLLGLDVHVSKNNTEASKKDYHVVT\n+>M_8\n+CRLPGGVNERAFGHVNDKDLCMLPSAVFCTQKGKENPQNKEYQMAGSKPQTWPAAQVLDC\n+RHELRTYTGQLPLRAATDLGPDVKSIYTVSQRGFKVGQTNHAVCVFEAGNVADKKWKMCH\n+GKNYGRSESWIYFSLNEKANGHLKALHPSAFQKHKKWTGMRDFGATTKTGLRLVAFSDPT\n+GACAQVPYLSDCPRGKLSRPTIPPGAALTVEFTAASARCKKLAEIANADEPASSAKAQKF\n+FTTGAMASSFLAAKSAVTPTLENKTNGSSLQHPSKSGDQLKDYTVKPFSLVQPKLAGTAH\n+ALMIYKDPPGSGYFINFVTKYQKIKRFWGVPVKARPQNAKASFCTHDLIFCPKGGLEFLN\n+GVPFGSPLAGCQLERSTFPVKGLGKACAILSLSRVALSQENKQHVNDHHEAKVGANGPSR\n+AIDVQVGCAVEPNCGDTQLREDFFCYTLGAAHGRFVLSLARDTLQLCFHADITPPLVISI\n+STKILGSVVKLRGASGETVELASAQAVASKPLKQAERARIGFCRGSLAIHADATLQSGSC\n+TGGTDKKLELEQDNDPCVTAKQGSGLKRAGQPIKSRSHDACKADSLSDKAAPGRSWTMEI\n+GTETYPVMQGNGPRRASRSTLYAEGGVIDWFKGAHNSYEFTGITCSGVRDMLTPQDFEDI\n+KEQTGDLSCMAVNCNAANDCHCSAGLVLPFKETLVCRHATSGKLINDVSGPSVKVGGMKL\n+PLSSNHFLPLTINQGGPVRTGADSDCSGFCCGCKALKLKLAEFIPSRPLGSVTGGKEVVS\n+FPNKEGGDTTNLPKEYANTGGMCAVCPNGAHGTGGMTILSLGAFGYQYTCLVGVDGASKD\n+LLVGNGLEIYHALYVSLHKKVKHTDSPGQWVGFSIHTSEDKSTCTGNGCILHVSVHSQQF\n+GDFLACKHGKQRVPDKEKYYYDFAANPVPGTTTPSGLLLRTVRTAKTPTKFHFG\n+>M_9\n+LSYLHYDDACVVTRAVGFFYTQFKQEAPVSCANVNKEFDHFSVDKKDPWAAIGLTSATGN\n+RAHNFV
AADKTKHYRSRQRYARAGSGPIVRALFETAYATTIQNTHTFSTPLKRIVDNGLD\n+DGSVSRACLPLELAPFVRLRCACSGGLFFTGVVPLLTVLLQVNGSVKLTWLGAMYATFPV\n+LDLRRMLLVVTQDTGLATFRPSPNGRHPKDCAT\n'
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/M.gff
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/M.gff Tue Feb 18 17:56:58 2020 -0500
b
@@ -0,0 +1,40 @@
+gi|12345678|ref|NC_012345.1| sim CDS 1 1 . - . ID=M_319;
+gi|12345678|ref|NC_012345.1| sim CDS 2 2 . - . ID=M_317;
+gi|12345678|ref|NC_012345.1| sim CDS 3 3 . + . ID=M_617;
+gi|12345678|ref|NC_012345.1| sim CDS 4 4 . + . ID=M_6;
+gi|12345678|ref|NC_012345.1| sim CDS 5 5 . + . ID=M_7;
+gi|12345678|ref|NC_012345.1| sim CDS 6 6 . + . ID=M_8;
+gi|12345678|ref|NC_012345.1| sim CDS 7 7 . + . ID=M_9;
+gi|12345678|ref|NC_012345.1| sim CDS 8 8 . + . ID=M_10;
+gi|12345678|ref|NC_012345.1| sim CDS 9 9 . + . ID=M_11;
+gi|12345678|ref|NC_012345.1| sim CDS 10 10 . + . ID=M_313;
+gi|12345678|ref|NC_012345.1| sim CDS 11 11 . - . ID=M_623;
+gi|12345678|ref|NC_012345.1| sim CDS 12 12 . + . ID=M_333;
+gi|12345678|ref|NC_012345.1| sim CDS 13 13 . + . ID=M_2;
+gi|12345678|ref|NC_012345.1| sim CDS 14 14 . + . ID=M_3;
+gi|12345678|ref|NC_012345.1| sim CDS 15 15 . + . ID=M_4;
+gi|12345678|ref|NC_012345.1| sim CDS 16 16 . + . ID=M_5;
+gi|12345678|ref|NC_012345.1| sim CDS 17 17 . - . ID=M_323;
+gi|12345678|ref|NC_012345.1| sim CDS 18 18 . + . ID=M_627;
+gi|12345678|ref|NC_012345.1| sim CDS 19 19 . + . ID=M_630;
+gi|12345678|ref|NC_012345.1| sim CDS 20 20 . + . ID=M_632;
+gi|12345678|ref|NC_012345.1| sim CDS 21 21 . + . ID=M_634;
+gi|12345678|ref|NC_012345.1| sim CDS 22 22 . + . ID=M_636;
+gi|12345678|ref|NC_012345.1| sim CDS 23 23 . + . ID=M_638;
+gi|12345678|ref|NC_012345.1| sim CDS 24 24 . + . ID=M_640;
+gi|12345678|ref|NC_012345.1| sim CDS 25 25 . + . ID=M_649;
+gi|12345678|ref|NC_012345.1| sim CDS 26 26 . + . ID=M_642;
+gi|12345678|ref|NC_012345.1| sim CDS 27 27 . + . ID=M_644;
+gi|12345678|ref|NC_012345.1| sim CDS 28 28 . + . ID=M_646;
+gi|12345678|ref|NC_012345.1| sim CDS 29 29 . + . ID=M_336;
+gi|12345678|ref|NC_012345.1| sim CDS 30 30 . + . ID=M_328;
+gi|12345678|ref|NC_012345.1| sim CDS 31 31 . + . ID=M_331;
+gi|12345678|ref|NC_012345.1| sim CDS 32 32 . - . ID=M_621;
+gi|12345678|ref|NC_012345.1| sim CDS 33 33 . - . ID=M_619;
+gi|12345678|ref|NC_012345.1| sim CDS 34 34 . + . ID=M_14;
+gi|12345678|ref|NC_012345.1| sim CDS 35 35 . + . ID=M_15;
+gi|12345678|ref|NC_012345.1| sim CDS 36 36 . + . ID=M_16;
+gi|12345678|ref|NC_012345.1| sim CDS 37 37 . - . ID=M_20;
+gi|12345678|ref|NC_012345.1| sim CDS 38 38 . - . ID=M_19;
+gi|12345678|ref|NC_012345.1| sim CDS 39 39 . - . ID=M_18;
+gi|12345678|ref|NC_012345.1| sim CDS 40 40 . - . ID=M_17;
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/result.blast-graph
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/result.blast-graph Tue Feb 18 17:56:58 2020 -0500
b
@@ -0,0 +1,169 @@
+# file_a file_b
+# a b evalue_ab bitscore_ab evalue_ba bitscore_ba
+# E.fasta C.fasta
+# 1.90009e-124 442.2 1.4375e-126 444.9
+E_10 C_10 3.8e-124 434.9 2.8e-126 442.2
+E_11 C_11 5.9e-51 190.7 5.6e-50 187.6
+E_13 C_13 1.1e-26 109.4 1.7e-25 105.5
+E_14 C_14 9.4e-163 563.5 2.5e-161 558.9
+E_15 C_15 5.4e-100 354.4 3.3e-100 355.1
+E_16 C_16 2.7e-45 171.8 7.1e-47 177.2
+E_17 C_17 4.4e-183 631.3 5.0e-182 627.9
+E_18 C_64 6.7e-64 234.2 1.6e-63 233.0
+E_19 C_22 2.2e-30 121.3 5.2e-30 120.2
+E_19 C_63 3.0e-32 127.5 1.2e-31 125.6
+E_313 C_12 4.1e-131 458.4 1.0e-129 453.8
+E_315 C_12 1.8e-128 449.5 7.5e-128 447.6
+E_317 C_1 1.6e-136 476.5 1.8e-133 466.5
+E_366 C_1 9.4e-131 457.2 2.4e-130 456.1
+E_368 C_1 1.5e-134 469.9 4.4e-132 461.8
+E_437 C_1 1.0e-130 457.2 2.9e-128 449.1
+# L.fasta C.fasta
+# 2.95e-95 363.6 2.1e-95 364.35
+L_10 C_10 2.9e-128 448.7 1.6e-130 455.3
+L_11 C_11 1.8e-58 215.7 1.0e-57 212.2
+L_14 C_14 5.1e-123 431.4 7.9e-124 433.3
+L_15 C_15 2.3e-87 312.4 2.7e-87 311.2
+L_16 C_16 1.4e-41 159.5 2.3e-43 164.5
+L_17 C_17 7.1e-170 587.4 3.1e-169 584.3
+L_18 C_64 9.2e-66 240.4 1.8e-65 238.4
+L_19 C_63 7.2e-29 116.3 4.7e-29 115.9
+L_2 C_164 3.0e-94 335.1 1.0e-93 332.4
+L_2 C_166 1.2e-90 323.2 8.0e-91 322.8
+L_2 C_167 5.2e-91 324.3 3.9e-90 320.5
+L_2 C_2 5.9e-95 337.4 4.2e-95 337.0
+L_20 C_20 2.5e-172 595.5 2.2e-170 588.2
+L_313 C_12 1.4e-115 406.8 1.0e-114 402.9
+L_313 C_21 1.8e-110 389.8 2.5e-111 391.7
+L_323 C_1 1.2e-136 476.9 6.7e-134 466.8
+L_336 C_1 2.5e-134 469.2 6.9e-131 456.8
+L_621 C_13 3.3e-34 134.4 4.2e-33 129.8
+L_627 C_1 4.6e-136 474.9 5.1e-134 467.2
+L_631 C_1 1.5e-139 486.5 4.5e-138 480.7
+# C2.fasta C.fasta
+# 0 1391.7 0 1391.7
+C_10 C_10 0.0e+00 1391.7 0.0e+00 1391.7
+# C2.fasta E.fasta
+# 2.8e-126 442.2 5.4e-126 434.9
+C_10 E_10 2.8e-126 442.2 5.4e-126 434.9
+# M.fasta C.fasta
+# 3.5e-119 418.7 1e-117 412.9
+M_10 C_10 1.3e-128 449.9 1.3e-129 452.2
+M_11 C_11 2.0e-57 212.2 4.4e-56 206.8
+M_14 C_14 9.4e-128 447.2 2.6e-130 454.9
+M_15 C_15 1.2e-83 300.1 4.4e-85 303.9
+M_16 C_16 8.3e-36 140.2 9.6e-37 142.5
+M_17 C_17 7.6e-156 540.8 2.3e-156 541.6
+M_18 C_64 8.0e-70 253.8 1.1e-68 249.2
+M_19 C_63 6.3e-25 103.2 5.5e-25 102.4
+M_2 C_164 1.2e-92 329.7 1.2e-91 325.5
+M_2 C_166 5.1e-91 324.3 1.1e-90 322.4
+M_2 C_167 7.7e-95 337.0 1.0e-93 332.4
+M_2 C_2 8.5e-94 333.6 2.3e-93 331.3
+M_20 C_20 7.9e-174 600.5 1.3e-170 589.0
+M_313 C_12 3.5e-119 418.7 1.0e-117 412.9
+M_323 C_1 6.6e-135 471.1 4.8e-132 460.7
+M_331 C_1 2.0e-131 459.5 5.9e-130 453.8
+M_336 C_1 2.2e-135 472.6 2.0e-133 465.3
+M_621 C_13 6.4e-38 146.7 8.3e-37 142.1
+M_630 C_1 9.3e-129 450.7 2.8e-127 444.9
+M_632 C_1 3.3e-134 468.8 1.6e-130 455.7
+M_636 C_1 3.7e-130 455.3 1.1e-128 449.5
+# C2.fasta L.fasta
+# 1.6e-130 455.3 4.1e-130 448.7
+C_10 L_10 1.6e-130 455.3 4.1e-130 448.7
+# C2.fasta M.fasta
+# 1.3e-129 452.2 1.8e-130 449.9
+C_10 M_10 1.3e-129 452.2 1.8e-130 449.9
+# M.fasta L.fasta
+# 0 1374.8 0 1372.5
+M_10 L_10 0.0e+00 1223.0 0.0e+00 1218.4
+M_11 L_11 6.4e-164 565.1 4.2e-163 562.4
+M_14 L_14 0.0e+00 1300.8 0.0e+00 1302.0
+M_15 L_15 1.7e-262 893.3 2.6e-263 896.0
+M_16 L_16 1.8e-135 470.3 3.4e-135 469.5
+M_17 L_17 0.0e+00 1636.7 0.0e+00 1640.9
+M_18 L_18 3.1e-214 732.6 1.5e-213 730.3
+M_19 L_19 5.0e-74 265.4 5.1e-74 265.4
+M_2 L_2 3.2e-230 785.8 7.4e-230 784.6
+M_20 L_20 0.0e+00 1709.1 0.0e+00 1704.1
+M_3 L_3 6.1e-212 724.9 1.4e-211 723.8
+M_313 L_313 0.0e+00 1374.8 0.0e+00 1372.5
+M_317 L_317 0.0e+00 1416.0 0.0e+00 1416.4
+M_319 L_319 0.0e+00 1484.9 0.0e+00 1478.8
+M_323 L_323 0.0e+00 1548.9 0.0e+00 1549.3
+M_328 L_328 0.0e+00 1488.8 0.0e+00 1486.9
+M_331 L_331 0.0e+00 1570.8 0.0e+00 1571.2
+M_333 L_333 0.0e+00 1570.8 0.0e+00 1572.8
+M_336 L_336 0.0e+00 1474.9 0.0e+00 1480.7
+M_4 L_4 0.0e+00 1317.0 0.0e+00 1316.2
+M_5 L_5 0.0e+00 1607.4 0.0e+00 1611.7
+M_6 L_6 0.0e+00 1635.9 0.0e+00 1634.0
+M_617 L_617 0.0e+00 1493.4 0.0e+00 1491.1
+M_619 L_619 5.6e-83 295.4 1.7e-82 293.9
+M_621 L_621 2.6e-99 349.7 2.6e-99 349.7
+M_623 L_623 2.8e-109 382.9 3.8e-109 382.5
+M_627 L_627 0.0e+00 1325.8 0.0e+00 1327.8
+M_632 L_631 0.0e+00 1254.2 0.0e+00 1250.0
+M_632 L_633 0.0e+00 1239.2 0.0e+00 1234.2
+M_634 L_635 0.0e+00 1310.4 0.0e+00 1312.7
+M_636 L_635 0.0e+00 1350.9 0.0e+00 1350.9
+M_636 L_637 0.0e+00 1300.4 0.0e+00 1300.8
+M_638 L_637 0.0e+00 1350.9 0.0e+00 1347.0
+M_638 L_639 0.0e+00 1350.1 0.0e+00 1344.3
+M_640 L_641 0.0e+00 1493.0 0.0e+00 1490.7
+M_640 L_643 0.0e+00 1485.3 0.0e+00 1485.7
+M_642 L_641 0.0e+00 1503.4 0.0e+00 1499.6
+M_642 L_643 0.0e+00 1526.5 0.0e+00 1526.1
+M_644 L_645 0.0e+00 1695.2 0.0e+00 1694.9
+M_644 L_647 0.0e+00 1631.7 0.0e+00 1633.2
+M_646 L_645 0.0e+00 1704.1 0.0e+00 1703.7
+M_646 L_647 0.0e+00 1664.4 0.0e+00 1666.4
+M_649 L_641 0.0e+00 1446.8 0.0e+00 1445.6
+M_8 L_8 0.0e+00 1676.4 0.0e+00 1681.4
+M_9 L_9 5.2e-104 365.5 2.7e-103 363.2
+# L.fasta E.fasta
+# 1.4000000075e-147 526 1.000265e-151 531
+L_10 E_10 5.9e-127 444.5 3.9e-128 447.2
+L_11 E_11 6.2e-65 237.3 3.8e-65 236.9
+L_14 E_14 1.8e-163 565.8 1.1e-165 572.4
+L_15 E_15 3.8e-104 368.2 4.2e-104 367.1
+L_16 E_16 4.7e-59 217.6 1.0e-59 218.8
+L_17 E_17 8.2e-201 690.3 4.2e-201 690.3
+L_18 E_18 4.8e-81 291.2 6.3e-82 293.1
+L_19 E_19 3.7e-31 124.0 4.6e-32 125.9
+L_313 E_313 1.8e-177 612.5 8.9e-178 612.5
+L_317 E_437 1.5e-155 539.7 5.3e-155 537.0
+L_323 E_368 2.0e-182 629.0 6.4e-182 626.3
+L_617 E_432 2.8e-147 512.3 2.0e-151 525.0
+L_621 E_13 3.3e-37 144.4 4.8e-37 142.9
+L_623 E_13 1.1e-38 149.4 5.7e-38 146.0
+L_627 E_368 2.6e-185 638.6 5.6e-186 639.8
+L_631 E_317 2.6e-174 602.1 5.7e-175 603.2
+L_631 E_368 3.2e-180 621.7 2.7e-180 620.9
+L_635 E_317 6.9e-175 604.0 1.4e-176 608.6
+# M.fasta E.fasta
+# 1.4e-164 569.7 9.9e-167 575.9
+M_10 E_10 5.2e-128 448.0 1.1e-127 445.7
+M_11 E_11 4.5e-63 231.1 1.0e-62 228.8
+M_14 E_14 2.3e-164 568.9 9.7e-167 575.9
+M_15 E_15 7.2e-103 364.0 3.2e-104 367.5
+M_16 E_16 1.3e-50 189.5 1.1e-50 188.7
+M_17 E_17 2.2e-198 682.2 6.1e-200 686.4
+M_18 E_18 1.3e-81 293.1 1.1e-81 292.4
+M_19 E_19 4.5e-29 117.1 4.3e-30 119.4
+M_313 E_313 1.2e-178 616.3 3.1e-178 614.0
+M_319 E_367 2.8e-157 545.4 2.8e-158 547.7
+M_323 E_317 3.6e-171 591.7 6.6e-171 589.7
+M_323 E_368 6.3e-176 607.4 4.5e-175 603.6
+M_328 E_432 4.0e-156 541.6 1.6e-153 531.9
+M_331 E_368 1.3e-173 599.7 3.8e-174 600.5
+M_336 E_317 1.5e-166 576.2 2.6e-167 577.8
+M_336 E_366 3.6e-168 581.6 3.3e-167 577.4
+M_336 E_368 1.5e-174 602.8 7.6e-175 602.8
+M_621 E_13 4.5e-42 160.6 5.0e-42 159.5
+M_627 E_368 2.4e-180 622.1 1.4e-181 625.2
+M_632 E_368 2.3e-178 615.5 6.2e-177 609.8
+M_634 E_317 1.4e-164 569.7 9.9e-167 575.9
+M_636 E_317 1.4e-164 569.7 1.1e-165 572.4
+M_636 E_366 1.1e-159 553.5 2.5e-159 551.2
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/result.proteinortho-graph
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/result.proteinortho-graph Tue Feb 18 17:56:58 2020 -0500
b
@@ -0,0 +1,144 @@
+# file_a file_b
+# a b evalue_ab bitscore_ab evalue_ba bitscore_ba
+# E.fasta C.fasta
+# 1.90009e-124 442.2 1.4375e-126 444.9
+E_10 C_10 3.8e-124 434.9 2.8e-126 442.2
+E_11 C_11 5.9e-51 190.7 5.6e-50 187.6
+E_13 C_13 1.1e-26 109.4 1.7e-25 105.5
+E_14 C_14 9.4e-163 563.5 2.5e-161 558.9
+E_15 C_15 5.4e-100 354.4 3.3e-100 355.1
+E_16 C_16 2.7e-45 171.8 7.1e-47 177.2
+E_17 C_17 4.4e-183 631.3 5.0e-182 627.9
+E_18 C_64 6.7e-64 234.2 1.6e-63 233.0
+E_19 C_22 2.2e-30 121.3 5.2e-30 120.2
+E_19 C_63 3.0e-32 127.5 1.2e-31 125.6
+E_313 C_12 4.1e-131 458.4 1.0e-129 453.8
+E_315 C_12 1.8e-128 449.5 7.5e-128 447.6
+E_368 C_1 1.5e-134 469.9 4.4e-132 461.8
+# L.fasta C.fasta
+# 2.95e-95 363.6 2.1e-95 364.35
+L_10 C_10 2.9e-128 448.7 1.6e-130 455.3
+L_11 C_11 1.8e-58 215.7 1.0e-57 212.2
+L_14 C_14 5.1e-123 431.4 7.9e-124 433.3
+L_15 C_15 2.3e-87 312.4 2.7e-87 311.2
+L_16 C_16 1.4e-41 159.5 2.3e-43 164.5
+L_17 C_17 7.1e-170 587.4 3.1e-169 584.3
+L_18 C_64 9.2e-66 240.4 1.8e-65 238.4
+L_19 C_63 7.2e-29 116.3 4.7e-29 115.9
+L_2 C_164 3.0e-94 335.1 1.0e-93 332.4
+L_2 C_166 1.2e-90 323.2 8.0e-91 322.8
+L_2 C_167 5.2e-91 324.3 3.9e-90 320.5
+L_2 C_2 5.9e-95 337.4 4.2e-95 337.0
+L_20 C_20 2.5e-172 595.5 2.2e-170 588.2
+L_313 C_12 1.4e-115 406.8 1.0e-114 402.9
+L_313 C_21 1.8e-110 389.8 2.5e-111 391.7
+L_323 C_1 1.2e-136 476.9 6.7e-134 466.8
+L_621 C_13 3.3e-34 134.4 4.2e-33 129.8
+L_627 C_1 4.6e-136 474.9 5.1e-134 467.2
+# C2.fasta C.fasta
+# 0 1391.7 0 1391.7
+C_10 C_10 0.0e+00 1391.7 0.0e+00 1391.7
+# C2.fasta E.fasta
+# 2.8e-126 442.2 5.4e-126 434.9
+C_10 E_10 2.8e-126 442.2 5.4e-126 434.9
+# M.fasta C.fasta
+# 3.5e-119 418.7 1e-117 412.9
+M_10 C_10 1.3e-128 449.9 1.3e-129 452.2
+M_11 C_11 2.0e-57 212.2 4.4e-56 206.8
+M_14 C_14 9.4e-128 447.2 2.6e-130 454.9
+M_15 C_15 1.2e-83 300.1 4.4e-85 303.9
+M_16 C_16 8.3e-36 140.2 9.6e-37 142.5
+M_17 C_17 7.6e-156 540.8 2.3e-156 541.6
+M_18 C_64 8.0e-70 253.8 1.1e-68 249.2
+M_19 C_63 6.3e-25 103.2 5.5e-25 102.4
+M_2 C_164 1.2e-92 329.7 1.2e-91 325.5
+M_2 C_166 5.1e-91 324.3 1.1e-90 322.4
+M_2 C_167 7.7e-95 337.0 1.0e-93 332.4
+M_2 C_2 8.5e-94 333.6 2.3e-93 331.3
+M_20 C_20 7.9e-174 600.5 1.3e-170 589.0
+M_313 C_12 3.5e-119 418.7 1.0e-117 412.9
+M_621 C_13 6.4e-38 146.7 8.3e-37 142.1
+M_630 C_1 9.3e-129 450.7 2.8e-127 444.9
+# C2.fasta L.fasta
+# 1.6e-130 455.3 4.1e-130 448.7
+C_10 L_10 1.6e-130 455.3 4.1e-130 448.7
+# C2.fasta M.fasta
+# 1.3e-129 452.2 1.8e-130 449.9
+C_10 M_10 1.3e-129 452.2 1.8e-130 449.9
+# M.fasta L.fasta
+# 0 1374.8 0 1372.5
+M_10 L_10 0.0e+00 1223.0 0.0e+00 1218.4
+M_11 L_11 6.4e-164 565.1 4.2e-163 562.4
+M_14 L_14 0.0e+00 1300.8 0.0e+00 1302.0
+M_15 L_15 1.7e-262 893.3 2.6e-263 896.0
+M_16 L_16 1.8e-135 470.3 3.4e-135 469.5
+M_17 L_17 0.0e+00 1636.7 0.0e+00 1640.9
+M_18 L_18 3.1e-214 732.6 1.5e-213 730.3
+M_19 L_19 5.0e-74 265.4 5.1e-74 265.4
+M_2 L_2 3.2e-230 785.8 7.4e-230 784.6
+M_20 L_20 0.0e+00 1709.1 0.0e+00 1704.1
+M_3 L_3 6.1e-212 724.9 1.4e-211 723.8
+M_313 L_313 0.0e+00 1374.8 0.0e+00 1372.5
+M_317 L_317 0.0e+00 1416.0 0.0e+00 1416.4
+M_319 L_319 0.0e+00 1484.9 0.0e+00 1478.8
+M_328 L_328 0.0e+00 1488.8 0.0e+00 1486.9
+M_331 L_331 0.0e+00 1570.8 0.0e+00 1571.2
+M_333 L_333 0.0e+00 1570.8 0.0e+00 1572.8
+M_336 L_336 0.0e+00 1474.9 0.0e+00 1480.7
+M_4 L_4 0.0e+00 1317.0 0.0e+00 1316.2
+M_5 L_5 0.0e+00 1607.4 0.0e+00 1611.7
+M_6 L_6 0.0e+00 1635.9 0.0e+00 1634.0
+M_617 L_617 0.0e+00 1493.4 0.0e+00 1491.1
+M_619 L_619 5.6e-83 295.4 1.7e-82 293.9
+M_621 L_621 2.6e-99 349.7 2.6e-99 349.7
+M_623 L_623 2.8e-109 382.9 3.8e-109 382.5
+M_627 L_627 0.0e+00 1325.8 0.0e+00 1327.8
+M_632 L_631 0.0e+00 1254.2 0.0e+00 1250.0
+M_632 L_633 0.0e+00 1239.2 0.0e+00 1234.2
+M_636 L_635 0.0e+00 1350.9 0.0e+00 1350.9
+M_638 L_637 0.0e+00 1350.9 0.0e+00 1347.0
+M_638 L_639 0.0e+00 1350.1 0.0e+00 1344.3
+M_640 L_641 0.0e+00 1493.0 0.0e+00 1490.7
+M_640 L_643 0.0e+00 1485.3 0.0e+00 1485.7
+M_642 L_641 0.0e+00 1503.4 0.0e+00 1499.6
+M_642 L_643 0.0e+00 1526.5 0.0e+00 1526.1
+M_644 L_645 0.0e+00 1695.2 0.0e+00 1694.9
+M_644 L_647 0.0e+00 1631.7 0.0e+00 1633.2
+M_646 L_645 0.0e+00 1704.1 0.0e+00 1703.7
+M_646 L_647 0.0e+00 1664.4 0.0e+00 1666.4
+M_649 L_641 0.0e+00 1446.8 0.0e+00 1445.6
+M_8 L_8 0.0e+00 1676.4 0.0e+00 1681.4
+M_9 L_9 5.2e-104 365.5 2.7e-103 363.2
+# L.fasta E.fasta
+# 1.4000000075e-147 526 1.000265e-151 531
+L_10 E_10 5.9e-127 444.5 3.9e-128 447.2
+L_11 E_11 6.2e-65 237.3 3.8e-65 236.9
+L_14 E_14 1.8e-163 565.8 1.1e-165 572.4
+L_15 E_15 3.8e-104 368.2 4.2e-104 367.1
+L_16 E_16 4.7e-59 217.6 1.0e-59 218.8
+L_17 E_17 8.2e-201 690.3 4.2e-201 690.3
+L_18 E_18 4.8e-81 291.2 6.3e-82 293.1
+L_19 E_19 3.7e-31 124.0 4.6e-32 125.9
+L_313 E_313 1.8e-177 612.5 8.9e-178 612.5
+L_317 E_437 1.5e-155 539.7 5.3e-155 537.0
+L_323 E_368 2.0e-182 629.0 6.4e-182 626.3
+L_617 E_432 2.8e-147 512.3 2.0e-151 525.0
+L_621 E_13 3.3e-37 144.4 4.8e-37 142.9
+L_627 E_368 2.6e-185 638.6 5.6e-186 639.8
+# M.fasta E.fasta
+# 1.4e-164 569.7 9.9e-167 575.9
+M_10 E_10 5.2e-128 448.0 1.1e-127 445.7
+M_11 E_11 4.5e-63 231.1 1.0e-62 228.8
+M_14 E_14 2.3e-164 568.9 9.7e-167 575.9
+M_15 E_15 7.2e-103 364.0 3.2e-104 367.5
+M_16 E_16 1.3e-50 189.5 1.1e-50 188.7
+M_17 E_17 2.2e-198 682.2 6.1e-200 686.4
+M_18 E_18 1.3e-81 293.1 1.1e-81 292.4
+M_19 E_19 4.5e-29 117.1 4.3e-30 119.4
+M_313 E_313 1.2e-178 616.3 3.1e-178 614.0
+M_319 E_367 2.8e-157 545.4 2.8e-158 547.7
+M_323 E_317 3.6e-171 591.7 6.6e-171 589.7
+M_336 E_366 3.6e-168 581.6 3.3e-167 577.4
+M_621 E_13 4.5e-42 160.6 5.0e-42 159.5
+M_627 E_368 2.4e-180 622.1 1.4e-181 625.2
+M_634 E_317 1.4e-164 569.7 9.9e-167 575.9
b
diff -r 000000000000 -r 2e0e9c418a85 test-data/result.proteinortho.tsv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/result.proteinortho.tsv Tue Feb 18 17:56:58 2020 -0500
b
@@ -0,0 +1,35 @@
+# Species Genes Alg.-Conn. C.fasta C2.fasta E.fasta L.fasta M.fasta
+2 5 0.16 * * * L_641,L_643 M_640,M_642,M_649
+4 6 0.115 C_12,C_21 * E_313,E_315 L_313 M_313
+3 6 0.301 C_164,C_166,C_167,C_2 * * L_2 M_2
+2 4 0.489 * * * L_645,L_647 M_644,M_646
+3 3 0.312 * * E_367 L_319 M_319
+4 5 0.165 C_63,C_22 * E_19 L_19 M_19
+3 3 0.812 C_20 * * L_20 M_20
+2 2 1 * * * L_9 M_9
+2 2 1 * * * L_8 M_8
+2 2 1 * * * L_619 M_619
+2 2 1 * * * L_6 M_6
+2 2 1 * * * L_5 M_5
+2 2 1 * * * L_4 M_4
+2 2 1 * * * L_333 M_333
+2 2 1 * * * L_3 M_3
+5 5 0.714 C_10 C_10 E_10 L_10 M_10
+4 4 0.803 C_64 * E_18 L_18 M_18
+4 4 0.762 C_17 * E_17 L_17 M_17
+4 4 0.758 C_16 * E_16 L_16 M_16
+4 4 0.78 C_15 * E_15 L_15 M_15
+4 4 0.793 C_14 * E_14 L_14 M_14
+4 4 0.718 C_11 * E_11 L_11 M_11
+3 3 0.316 * * E_432 L_617 M_617
+4 4 0.725 C_13 * E_13 L_621 M_621
+2 2 1 * * * L_328 M_328
+2 2 1 * * * L_623 M_623
+3 3 0.331 * * E_437 L_317 M_317
+2 3 0.333 * * * L_637,L_639 M_638
+2 2 1 * * * L_635 M_636
+4 6 0.126 C_1 * E_368 L_627,L_323 M_627,M_630
+2 3 0.331 * * * L_631,L_633 M_632
+2 2 1 * * * L_331 M_331
+2 3 0.329 * * E_317 * M_634,M_323
+3 3 0.322 * * E_366 L_336 M_336