Repository 'orthofinder_onlygroups'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/orthofinder_onlygroups

Changeset 0:bfb20dbe1309 (2017-10-24)
Next changeset 1:918d141a166b (2017-12-03)
Commit message:
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/master/tools/orthofinder commit 2da91121887cc148ff398ddc2f56142490a8e22f
added:
orthofinder_only_groups.xml
test-data/inputs/blastfa/Species0.fa
test-data/inputs/blastfa/Species1.fa
test-data/inputs/blastfa/Species2.fa
test-data/inputs/blastfa/Species3.fa
test-data/inputs/blastids/SequenceIDs.txt
test-data/inputs/blastids/SpeciesIDs.txt
test-data/inputs/blastout/Blast0_0.txt
test-data/inputs/blastout/Blast0_1.txt
test-data/inputs/blastout/Blast0_2.txt
test-data/inputs/blastout/Blast0_3.txt
test-data/inputs/blastout/Blast1_0.txt
test-data/inputs/blastout/Blast1_1.txt
test-data/inputs/blastout/Blast1_2.txt
test-data/inputs/blastout/Blast1_3.txt
test-data/inputs/blastout/Blast2_0.txt
test-data/inputs/blastout/Blast2_1.txt
test-data/inputs/blastout/Blast2_2.txt
test-data/inputs/blastout/Blast2_3.txt
test-data/inputs/blastout/Blast3_0.txt
test-data/inputs/blastout/Blast3_1.txt
test-data/inputs/blastout/Blast3_2.txt
test-data/inputs/blastout/Blast3_3.txt
test-data/inputs/proteomes/Mycoplasma_agalactiae.faa
test-data/inputs/proteomes/Mycoplasma_gallisepticum.faa
test-data/inputs/proteomes/Mycoplasma_genitalium.faa
test-data/inputs/proteomes/Mycoplasma_hyopneumoniae.faa
test-data/results/Orthogroups.csv
test-data/results/Orthogroups.txt
test-data/results/Orthogroups_SpeciesOverlaps.csv
test-data/results/Orthogroups_UnassignedGenes.csv
test-data/results/Statistics_Overall.csv
test-data/results/Statistics_PerSpecies.csv
test-data/results_fromblast/Orthogroups.csv
test-data/results_fromblast/Orthogroups.txt
test-data/results_fromblast/Orthogroups_SpeciesOverlaps.csv
test-data/results_fromblast/Orthogroups_UnassignedGenes.csv
test-data/results_fromblast/Statistics_Overall.csv
test-data/results_fromblast/Statistics_PerSpecies.csv
b
diff -r 000000000000 -r bfb20dbe1309 orthofinder_only_groups.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/orthofinder_only_groups.xml Tue Oct 24 06:40:40 2017 -0400
[
b'@@ -0,0 +1,294 @@\n+<tool name="OrthoFinder OnlyGroups" id="orthofinder_onlygroups" version="1.1.4">\n+    <description>finds orthogroups in a set of proteomes</description>  \n+    <requirements>\n+        <requirement type="package" version="1.1.4">orthofinder</requirement>\n+    </requirements>\n+    <command>\n+    <![CDATA[\n+        ## prepare inputs\n+        #if $init.start=="fasta":\n+            #set $infiles = ""\n+            #for $input in $init.input_fasta\n+                ln -s \'$input\' \'$input.element_identifier\' &&\n+                #set $infiles = $infiles + str($input.element_identifier) + ","\n+            #end for\n+            #set $infiles = $infiles[:-1]\n+        #elif $init.start=="blast":\n+            #set $infilesbl = ""\n+            #for $input in $init.input_blast_out\n+                ln -s \'$input\' \'$input.element_identifier\' &&\n+                #set $infilesbl = $infilesbl + str($input.element_identifier) + ","\n+            #end for\n+            #set $infilesbl = $infilesbl[:-1]\n+            \n+            #set $infilesfa = ""\n+            #for $input in $init.input_blast_fa\n+                ln -s \'$input\' \'$input.element_identifier\' &&\n+                #set $infilesfa = $infilesfa + str($input.element_identifier) + ","\n+            #end for\n+            #set $infilesfa = $infilesfa[:-1]\n+\n+            ln -s $init.specIDs $init.specIDs.element_identifier &&\n+            ln -s $init.seqIDs $init.seqIDs.element_identifier &&\n+        #end if\n+\n+        ## start Orthofinder\n+        orthofinder\n+        #if $init.start=="fasta":\n+            -f .\n+        #elif $init.start=="blast":\n+            -b .\n+        #end if\n+\n+        -I $I -og -t \\${GALAXY_SLOTS:-1} -a \\${GALAXY_SLOTS:-1} &&\n+\n+        #if $init.start=="fasta":\n+            mv Results_* results\n+            #if $init.keepblastout=="yes":\n+                && mkdir -p results/WorkingDirectory/blast results/WorkingDirectory/fa &&\n+                mv results/WorkingDirectory/Blast* results/WorkingDirectory/blast/ &&\n+                mv results/WorkingDirectory/*.fa results/WorkingDirectory/fa/\n+            #end if\n+        #elif $init.start=="blast":\n+            mkdir results  &&\n+            mv *.csv results/ &&\n+            mv Orthogroups.txt results/\n+        #end if\n+       \n+    ]]> \n+    </command>\n+    <inputs>\n+        <!-- Control where Orthofinder starts -->\n+        <conditional name="init">\n+            <param name="start" type="select" label="Orthofinder starting point" help="OrthoFinder_OnlyGroups works in 2 steps. Choose \'From fasta proteomes\' to run OrthoFinder_OnlyGroups from scratch and \'From blast results\' if you have all the blast results from a previous OrthoFinder_OnlyGroups run.">\n+                <option value="fasta" selected="true">From fasta proteomes</option>\n+                <option value="blast">From blast results</option>\n+            </param>\n+\n+            <when value="fasta">\n+                <param name="input_fasta" type="data" format="fasta" multiple="true" label="Select input fasta proteomes" help="One fasta file per species; species and sequences names in the results will remain the same than in the input files."/>\n+                <param name="keepblastout" type="boolean" checked="true" truevalue="yes" falsevalue="no" label="Do you want to get the blast results ?" help="Used to re-run OrthoFinder_OnlyGroups from pre-computed blast results"/>   \n+            </when>\n+\n+            <when value="blast">\n+                <param name="input_blast_out" type="data_collection" collection_type="list" format="txt" label="Select the pre-computed blast files" help="blastX_Y.txt files from the blast output files of a previous OrthoFinder_OnlyGroups run." />\n+                <param name="input_blast_fa" type="data_collection" collection_type="list" format="fasta" label="Select the fasta files" help="= SpeciesX.fa files from the blast output files of a previous OrthoFinder_OnlyGroups run." />\n+                <param name="specIDs"'..b'"/>\n+                        <element name="Blast2_0.txt" value="inputs/blastout/Blast2_0.txt"/>\n+                        <element name="Blast2_1.txt" value="inputs/blastout/Blast2_1.txt"/>\n+                        <element name="Blast2_2.txt" value="inputs/blastout/Blast2_2.txt"/>\n+                        <element name="Blast2_3.txt" value="inputs/blastout/Blast2_3.txt"/>\n+                        <element name="Blast3_0.txt" value="inputs/blastout/Blast3_0.txt"/>\n+                        <element name="Blast3_1.txt" value="inputs/blastout/Blast3_1.txt"/>\n+                        <element name="Blast3_2.txt" value="inputs/blastout/Blast3_2.txt"/>\n+                        <element name="Blast3_3.txt" value="inputs/blastout/Blast3_3.txt"/>\n+                    </collection>\n+                </param>\n+                <param name="input_blast_fa">\n+                    <collection type="list">\n+                        <element name="Species0.fa" value="inputs/blastfa/Species0.fa"/>\n+                        <element name="Species1.fa" value="inputs/blastfa/Species1.fa"/>\n+                        <element name="Species2.fa" value="inputs/blastfa/Species2.fa"/>\n+                        <element name="Species3.fa" value="inputs/blastfa/Species3.fa"/>\n+                    </collection>\n+                </param>\n+                <param name="specIDs" ftype="txt" value="inputs/blastids/SpeciesIDs.txt"/>\n+                <param name="seqIDs" ftype="txt" value="inputs/blastids/SequenceIDs.txt"/>\n+            </conditional>\n+            <param name="inflation" value="1.5" />\n+            <output name="orthogroups1" value="results_fromblast/Orthogroups.txt"/>\n+            <output name="orthogroups2" value="results_fromblast/Orthogroups.csv"/>\n+            <output name="specs_overlap" value="results_fromblast/Orthogroups_SpeciesOverlaps.csv"/>\n+            <output name="unassigned_genes" value="results_fromblast/Orthogroups_UnassignedGenes.csv"/>\n+            <output name="stat_overall" value="results_fromblast/Statistics_Overall.csv" lines_diff="2"/>\n+            <output name="stat_specs" value="results_fromblast/Statistics_PerSpecies.csv"/>\n+        </test>\n+    </tests>    \n+    <help>\n+======================\n+OrthoFinder OnlyGroups\n+======================\n+\n+Full readme at https://github.com/davidemms/OrthoFinder/blob/master/README.md\n+Summary sketch at https://github.com/davidemms/OrthoFinder/blob/master/OrthoFinder-options.pdf\n+\n+OrthoFinder is a fast, accurate and comprehensive analysis tool for comparative genomics. It finds orthologues and orthogroups infers gene trees for all orthogroups and infers a rooted species tree for the species being analysed. OrthoFinder also provides comprehensive statistics for comparative genomic analyses. OrthoFinder is simple to use and all you need to run it is a set of protein sequence files (one per species) in FASTA format (Emms, D.M. and Kelly, S., 2015).\n+\n+.. class:: infomark\n+\n+This galaxy tool implements the first part of the Orthofinder program, e.g. the clustering of orthogroups of genes.\n+\n+If you have already ran OrthoFinder, the tool allows to re-run the analysis from the pre-computed blast-results.\n+\n+-----------\n+Input files\n+-----------\n+    - When using "from fasta" option (e.g Orthofinder from scratch) : the input files are a set of proteomes in fasta format (on file per species). Choose this option if you have no OrthoFinder results yet.\n+    - When using "from blast results" option : the input files are all the following files from of a previous OrthoFinder run (these files appear only if you have chosen to keep them while launching a previous run):\n+        - A dataset collection / multiple datasets for the blast outputs\n+        - A dataset collection / multiple datasets for .fa files\n+        - The SpeciesIDs.txt file\n+        - The SequencesIDs.txt file\n+\n+    </help>\n+    <citations>\n+        <citation type="doi">10.1186/s13059-015-0721-2</citation>\n+    </citations>\n+</tool>\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastfa/Species0.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastfa/Species0.fa Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,5439 @@\n+>0_0\n+MNINSPNDKEIALKSYTETFLDILRQELGDQMLYKNFFANFEIKDVSKIGHITIGTTNVTPNSQYVIRAY\n+ESSIQKSLDETFERKCTFSFVLLDSAVKKKVKRERKEAAIENIELSNREVDKTKTFENYVEGNFNKEAIR\n+IAKLIVEGEEDYNPIFIYGKSGIGKTHLLNAICNELLKKEVSVKYINANSFTRDISYFLQENDQRKLKQI\n+RNHFDNADIVMFDDFQSYGIGNKKATIELIFNILDSRINQKRTTIICSDRPIYSLQNSFDARLISRLSMG\n+LQLSIDEPQKADLLKILDYMIDINKMTPELWEDDAKNFIVKNYANSIRSLIGAVNRLRFYNSEIVKTNSR\n+YTLAIVNSILKDIQQVKEKVTPDVIIEYVAKYYKLSRSEILGKSRRKDVVLARHIAIWIVKKQLDLSLEQ\n+IGRFFGNRDHSTIINAVRKIEKETEQSDITFKRTISEISNEIFKKN\n+>0_1\n+MKIIINKNFLDDIIEVVSRFSDPISSLYGMRCIKITANHNFVKFEATNEITNIVKKIKVDDNKIIVEEDG\n+ELLVQANYFKNIIKKLNGFIEIKTYFNKMEIKQQDSVYTLTLNEISSFPQIDENINIKKFQINTEEFKKA\n+VKNVAFAASNGANLIYKCINFKSSGNKLNLAATDTFRLAYYTIKTNQILEDFDFSVNAKDVKELLPTDVP\n+KTVTMFYNSIKFGVEYDDTTITARITDLPYHNVEQLFNKAISETKHKITIEKSEFNNLLNKIWINSSADK\n+QNRIELKISNQEINVYTKIDELGDSNVRTAKFTLEGSPFVFDMNFNYLKDAISITEGETYILIDEKIQNI\n+VLFSKDNPNSKQIITPLRR\n+>0_2\n+MKPIYKYNVVFKDNNNPNENIIFCHGLNSTADRFDIFKNYWTKSNYYSLQFPASNLTPVLDGDEPSVFCF\n+AKLLVEFVEKNNLKNVTLIGHSLGGGTISLAYQLRPDLFKKLVYLAPMNKPALALYDRYKKDYFPKDYEG\n+FLDLMRSLYYDISKFTSDPNWVKEQKENFDPYLYNNPDIVKLGTPDMNVFNAIEETLKIVKVPTLLILGE\n+KDGVILREECIDYFKKYVKDVETHWIPKTGHMMYLEDWDSFIKILEPFLDK\n+>0_3\n+MNVIYKYDFVFKDNNNPDENIIFCHGFNSSPNSFKIFENYWTKSNYYALQFPGNNHTEIKEGDEATVECY\n+SDLLIKFIEDNKLKNIILIGHSMGGGTISLAYQKRPELFKKLIYLAPTNKSSQNVTEAFLRDYFPKTFDE\n+FIGFFKSLYYDVTKFTSNESWMRLVKNTFDPYDFNNPTIVGLGQYLISNYFHDKLELALQSVNVPALLIL\n+GEDDGVVDRDLCINYFKENVKGVQSLWMPKTGHMMFEEDWENFIKIVEEFINRSELASPKAL\n+>0_4\n+MNKYEQLFRPFKLGNYSLKNRFVLSPMTLSLATKDGKVTIEEEKYSARRADCAPLLISGGTYFDDFGQLF\n+EYGYSAKSDDDIESLKKLAKAMKSKGNIAILQLAHAGKFSKASLKKYGYLYGPSYEKNHIPVEHEVFELS\n+ISQIKQIVKDYASATKRAIAAGFDGIEISMAQRLLIQTFFSSIVNKRNDEYSSDSFENRSRLCLEIVEEI\n+RKMINQYADENFIFGFRATPEETYGAELGYSIIDFIQLIEEIIKKGKINYLAIASWGHDIYLNKVRSENE\n+YKGQLVNKVIYDKFKGILPIISSGGINTPQKCLDALEYSDLVGLSSVFVADPEFVQKIENDQEDKINLNI\n+SFSQLKDLAIPESSFKGIVEMFGFCETIPTESLKTLEENSKS\n+>0_5\n+MILVEPIRNGKYIKDGAYYLATQIWALSHLKFDEIVAFPAVLDPYVQIGYFQNPEVEVNFKYLKEHNIPI\n+VRRDTGGGAIYIDSNQMGVCYLIPYKDNESILGNYEKFLEPAIKIIKELGAKNVVQSGKNDLTIDGFKVS\n+GAAMALIGDTIYGGNTYIYKIDYDAMSQVLKPNRKKIEAKGIKSVRQRIAPLSDYFNEPYKNMDIFEFKD\n+LVVKKLFNVDDLSNVKRYVLTENDWKQIDELVNAKYKNWDWNYGLSPRYEYNRDARLAIGTINFSLAVKG\n+QRIERIKISGDFFAKADINELEKSLVGIKMDYDELSNAIKQANLEKYFFNEISVDDVVRTILSEDDNE\n+>0_6\n+MILVEPIRNGKYVKDGAYWLAIQIWAMNHLRLNEKIVFPGIAAPHIQLGYFQNPEVEVNFKYLKDHNLEV\n+VRRNTGGGAIYIDDNSVNVCYLIPYDEKDNILGNYDKFYEPTIKMLKELGAKDVVQSGKNDLTIDGRKVS\n+GAAMMLNGDVIYGGNSLLYKVDYDAMVDSLKPNRKKIEAKGVKSIRQRVAPLSDYFDEPYRNLDIFEFKD\n+LVIKKLFGVDDLSKVKRYELTEEDWAQVDELVNTKYKNWDWNYGLSPRYEYNRDARLAIGTINFSLAVEG\n+QRIEKIKISGDFFAKKDITELEKALVGTKMTYENLVKAFKDADLQSYFFNEIKAEEVAKIILDEE\n+>0_7\n+MHTLNSVKELDSLINEADAIVIGIGSGMTSADGIGYSGQRFVQNFKDFIDEFKFLDMLQASVYHFDDIQN\n+YWAFHSRFMKLNYFDQPASESFLKLKEYLKGKNYHIITTNSDNSLEAADFEEDKIFYIQGKYNLLQCSKM\n+CHNTLYSNDKAVYEMIEKQKDMKVPLELIPRCPKCNNFLEVNKRLKGKGMVEDKRFFEEKKMYEDFIYRH\n+KGQKILFWEIGVGFSTPTLIKFPFWEMTKEFSNSKYVAMNNKSYRTPQEIRQRTYVWTDDIKQTINKLLE\n+VKNDFSRAN\n+>0_8\n+MKKVVKYLVVEKLEGKDQFYLRFTPEMQDDIGTIGFIQYKNTDKKVLHKDDIFLNLEASKAILTLKMPFD\n+ATVVEINKEAMANPKLLSSPKDSENWVMILSDIDPKTLEQLEDF\n+>0_9\n+MKISILDHGLLTDQNNYEKAYKEVIELCQYVKDLNLYSFWISEQHNVNSLVISSPLILLDHLANSVSGIK\n+LGCGGIMLANYQAYNVAEQIQTLNLLHPERFIYGFGSNIGTKETIELLKPSLTSTEYQQKIIAVNEYLNN\n+KKKFDFKINPNINKPVDIVMLVTSEQSAIFAAQHKFKINYGWFLNPSKVYAENVINSYIETYKTAWNENP\n+PEVTFSVNVVSGIDYESSMRNHNLIAFYRSFADPNHFAYYPPYSEFEKFVFSEEQSKNFLRLHKSIFNVF\n+DDESMNKLNNLCEFLKINHLMILPTVADINDRKRAVKNVADFYVKRGKNEKSC\n+>0_10\n+MYNSDMENRLIENQNSSQNNFRRFENASSVASRKNAFLGASVGWFSYATAIAFISAIMLLLLFPKALDYL\n+QRNPFIGLGLALGLLVLIFIEFIVGPKMNFWAQLIIITLSMMLLGIVLLSFALVELLGTFATGASIKYLA\n+LAKTFGVILLPIVILSIMATLAYFDLIKIKFVYAIIIFLTISFFFIFILSAFIFNSWINALFPSIGFALM\n+ISYMAFDWWLITRYNKAFNATVSNHSTKKEFMKLTIYFGFKLAYDYIYALVYLIKLVRLAKN\n+>0_11\n+MKKNKFYLFLGAAPVLSVPLVAASCGDKYFKETEVDGVKTISTLAHITSRKGLKLREGLTVENAPKATFI\n+TDEGSVHDESFNQSGWEAVHKVSYELGLDKAQVSGNKNLRNKVYEPKKGQLLEAYKNAIDSGFKYIVLCG\n+FTHQAALVGLDANYIKKIKDNNIVFITVDFDLFTENDANVKTFIEKIGEGHLVPVIFDTKQAAYIAGRAL\n+ADYFSQVYKDQPEKRTIGAFGGIPYPAVSDFIAGTFQGIIDWNKEHPDVKTKSLNETIELNTLFTSGTPQ\n+ATTAINSVVKATASYPVAGSLSTDTAKEIKKLADKDKFIIGVDADQKNAL'..b'YGWAKKDQSLANISYVPTQFLSPRAELINDILATGKVDFLAEAIEKELLDSVLVKDEFISQENV\n+FQITKAVKKVLNSNNFANAFTSSKINRELLPKIGLDLLYELSHSDSGNIFKSILFSVFERVKAKLNEKGD\n+LENQKKYLVEEVNNIYSLITGLAGLDISKFLSAEELVYLSNDPKEVINAFQNIIGSIDVYNFSKLANEWY\n+KSEWKKQVEHNKEKYTNRLSSGLLIDWLFKSVDQKTLKTGLKAFINNLDFQKVLNLDDKNSLLYKKINES\n+VPSLIDGIKILLSKVSKDGKFDNVKEGLNSILQNIDFNVLSNYLSEHLTTNYFEYKKSDLDYESNKEKVL\n+REKVALKTIRPKDGMMALIYGLFYNPGTNREFKANLIKMFNLSDKVSTIKVENGSGSVVTPDSDEEKLSF\n+SDFLAFFPALLSADQSKTIFKNQQINNDISYAKEHILKVMSAKGNSVGLHELDIKALEILKKFNIITNEI\n+TIDKKVIEKLNKVQSFIVQTTTSLDEKTKIVSETNKTLADLIYDFNSFDEGDESWKVWKGVIGSYGQASV\n+VNKFSLGAQAFDLLIPWINMLTYSNNATQKEALQFVNDFLKLSIDKSILEEINKLAQDENLPNFNSTNFG\n+LSIALHRPEQVTVFNESNGKFTNAKVEELASKNPKFRRYLSSQKRSLIELLGLIGASQQYSKYDKQPAET\n+GKIYAPNGIYYETIKKAVDRYFSTKEFWEIKDIVLLIARSMQINFPIELLGLSRIIINPVLRSMYPQLMT\n+SFLSTQKQSLGKINGNLAYIVSNRIGNFEEIIRDNSKKLELEAYFEQIWSNKDTSLVPLDYSEEITLALD\n+GARVNKIFNEQTKKVTIFGIDFLNLAGRVVNGIVEPKELKDIVFNDINSYYAKVNYAYLSKNNKAIYNGE\n+LPRNNVEMESLLNTIDDKYILDVNGIKFLIVGEDTTVDYIYPVIDENHLQVNTQNQALVYLNNYGFSRIM\n+AAYQGNVVKKNLLVVNGSKNSNEVVKRNITNIVDSSISDANKLKRVFSYDELDPINPERALRITTIEGMI\n+NVISSSIIALMSLFIIMVSVAIIFIIRRYIANKAKVFGILLAQGYRPIEIAISLLPFAMVTSLIGGILGY\n+SIGFRTQILLQNVFSNYWTLPKSAIPFDFFSLFFNVFIPFLGMSLLIIVVALISLRKSSIDLITGVDDAP\n+RGKLFNKIKKKFINKKNVKKRFSFTLAYSGFWKLASFGGSVLLTSIATMFGLANYKTFNNTINDTYKNRD\n+YRFKIDLESPTTEGKYYSLYNPSELKDLIYTPIGSLNEGNRETADYFKPGKSSIINPDNKANGNPGEFAP\n+HLLSQFSVNVTVDAGVAADPWLIAYNGMPDSQKAKIDKIRDLVGHQLEWTQSLDENGKLITDPNKPIIKV\n+DSNGLMSYEDASGKKYDFFKYYKSPNDKQGSFRLAHWDAANKEYIMKTIKTGDSGGRNEYRDFLVKAYQK\n+NDIVRMQHEKLLAEGKELINPITNWKESRSDSDFWLVDKSDLDRQWVNDYFIGFGGILFDKHYDETYTYI\n+SGSYNNISSKIYGYRKPEDIKSAKVKLIDKNGENLYDALYNFKIENNVYPLVVNDVFAKKHKLGIDDQID\n+FVISNRVDRYRQKLLEKIYANNPIKQADLKKQYDQNIKTKFRIVGINPTYINDELITTHSAANLLVGLPD\n+NESSFNGVLTQNANPVQVTESAGLYSPSGYWAGLDGFDVSSLDQGTVKKMFDEIFKVSDIPEKGGVLQSQ\n+HGFTKDEIAKFLDPKAEKFSDSLYESAKNSAKAHIEDFSRIYENKLFIALSNSIDSRDIEVGFVVQVGHT\n+IEQISIFIIVINFVISLIILIIMSSIIVSENERNIAIWSILGYSQKEKLMMFFGAFIPFLVAALIISIPI\n+VIAMINVFGSFLLSSSSIALLLSLKWWHVLITSGLMLIIFAVTSISVWISINKMKPVDLLKGK\n+>0_816\n+MENERKQKIAKIVLWTILSAVILLIITLLLWNRFKPQVRQGNFQDFVNDIVAASKSVDDNTYLAEVKIDG\n+VQDIAKYTFVENGIAKLREVSLGKGIVEKTFILPDKFTIGDKTYNIADLLKHPGADANVLSTQWSTVGLV\n+LEKPNTFARIALSVLPTLLWIIILFWLYRSMMKRSMNMIGAIGDEKNPAQKIKSDKTFKDVAGNKEAVEE\n+IKEIVDYLKNPKKYEIAGARMPHGILLGGPPGTGKTLLAKATAGEANVPFYFISASNFVEMFVGLGAKRV\n+RTVVDEARKNAPAIIFIDELDAIGRTRGSGIGGGHDEREQTLNQLLVEMDGMKDNNGILFFAATNRTDVL\n+DPALTRPGRFDRTITVGLPDVKEREEILNLHAKGKRVSPNVNLAQVAKRTPGYSGAQLENVINEAGLLAV\n+RRDSEIIERDDIDEAIDRVMAGPAKKNRVITKSELTMVAYHEAGHAVVGIKMPGANKVQKITIIPRGQAG\n+GYNLMTPEEEKYNLTKKELIAMITSFMGGRAAEEIIYGKENVSTGASDDLHKATKIARKMVTEWGMSDLG\n+PIQYEQDEGSPFLGRDYLKSAQFSAQVAHEIDIEVRNIITEAEKKAKEIIEENRELHELIKTALLEKETI\n+VAEEIEYIAKNMKLPSESKEEKAENVNLTIDDILDGKSEEKGETM\n+>0_817\n+MILLGVSGGPDSMYLLDLISSQRSDIVVATVNYNVRHDSAYDAEIVRKFCEDKDIIFECLEIDQKARFKG\n+NFEKWAREQRFSFFKKIYEKYNCETLYLAHHKDDFLESYFMQKESKRQPDFFGIKTENYIYGMKVVRPLV\n+DKVFKNEILEALHNKKIKYANDYTNDLPIYTRNRIRIWLKSLSNSQKSKIFDDIQKENNELAVLAQDTVL\n+EYEHWKKAQFSQDEFLNLSNKERLVYKFVHENYVDIKLSNRKIKSIISFILSNNRTSQYLIKNNVFIQKK\n+HGKLVF\n+>0_818\n+MKLIVGLGNPGNEYRFTRHNAGFLAIDKICEKLNISLNKEKFNGEFVVSDGFILAKPLTYMNKSGDFVYS\n+IASFYKINPSDIIVIYDDLSFSIGQAAIKIGGSSAGHKGIDSLMSKFSSNDFKRIRVGIGVNSGTTIKDY\n+VLSLFTKDEMIVVEEVLEKVADAAISLVYNDVNFVMNKFNTDNKKRVI\n+>0_819\n+MFMSNESNSGAIRLKGKFLVVKWSGADNNIPRELWIFESSPERERFFIYTNKQELKSSCFYEIEVKLRAS\n+KRSKYQNSTYELLSFKIVSPDNDSDIEKMLVSNVAGLGVKGIQRIKSELGLSSIKELFDDVESAQNVLKT\n+AIYENLKAFINSFDQKDYDFFAENGLLKLYDKLRARFENNDFVSRYKNNGDPYELYVDHWIDFKLVDLFA\n+QCVNKNIEPYKIIRAFTYKILRTNFNNICTMYYDVLPFYKSLWNWYEDYRRDNSENSTLFEQSYVVSLLS\n+LLLQKRDISDDLIIESLNVMIQRGEVYFDSDSKRLSLNEVYEQELFVAKKLIKIRDSELKQQIIPLPSQK\n+LADEQKKAYASALNNPLSVITGYPGTGKSYLIAYIVETLLKDKHYKKKDIAVLTPTGRASTILAYKTGIE\n+ARTIHSFLKLSKSDEDDSFIESFEKENPIKVVVIDEFSMVSLPIMYELLKTCTSIERLILVGDRDQLPCI\n+GKGNLLEDIINSKKFPTFVLEEIHRTDKIDIFKHFIAINDNKVPKIDTENVKFIEQNGIQFLNNIVKIYE\n+EKVNKYSIDNVIILLPSYLELGQPGINEVNKRLQEWNIKRTGAKKNLSIHNNLTLFVGDRVIQTVNDYDK\n+NVFNGEIGIVEEINTDSKNTFIIVGFGQDKKVRYNRSEILENLTLAYAITVHKFQGSEASCVIFGILKNR\n+VEHMFTKKFMYTAVSRAKEELLLLGSKDLYIQKIQSRNADLKHYTNLKSLIEKEAK\n+\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastfa/Species1.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastfa/Species1.fa Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,5395 @@\n+>1_0\n+MIISFINNKGGVLKTTLATNICGVFSKFFPKSRSVIVDLDGQGNVSATFGQHPERLKNTLIDIFRGEKDI\n+DDCVLNVFPSIDILPSNHELSFVDMDVARKEYKLSVIKNLIEKLEEMYDFVFLDTPPAMSTIVSVSMHIS\n+DMIVIPFEPDQYSILGLLRVIDTIETFRERNEDLKVLVVPTKVNARTRLHNDVLNIVKTKLSKKNIPLSK\n+NIVSFTTKSSASVGYEKLPIVLINQRSKYQEEYIEITKEIINLLKDNKNNEK\n+>1_1\n+MKNKKAKKKERRFTDLSADLDEEVEKIDPEYEDFKEIKIEKNKDNQVIDKNDPFFYSESFEEARIQLIKD\n+KKVEVKKEEEKVQETTVKNKISEAKKEEAKDVYIDSSLEIASQEPLTKGMHFYTNSRIIRKVRECAKNKG\n+LSISRLITMILDKSIKEE\n+>1_2\n+MKTKLKRFLEEISVHFNEANSELLDAFVHSIDFVFEENDNIYIYFESPYFFNEFKNKLNHLINVENAVVF\n+NDYLSLEWKKIIKENKRVNLLNKKEADTLKEKLATLKKQEKYKINPLSKGIKEKYNFGNYLVFEFNKEAV\n+YLAKQIANKTTHSNWNPIIIEGKPGYGKSHLLQAIANERQKLFPEEKICVLSSDDFGSEFLKSVIAPDPT\n+HIESFKSKYKDYDLLMIDDVQIISNRPKTNETFFTIFNSLVDQKKTIVITLDCKIEEIQDKLTARMISRF\n+QKGINVRINQPNKNEIIQIFKQKFKENNLEKYMDDHVIEEISDFDEGDIRKIEGSVSTLVFMNQMYGSTK\n+TKDQILKSFIEKVTNRKNLILSKDPKYVFDKIKYHFNVSEDVLKSSKRKKEIVQARHICMYVLKNVYNKN\n+LSQIGKLLRKDHTTVRHGIDKVEEELENDPNLKSFLDLFKN\n+>1_3\n+MRVNIFERYQSFSVKNTDKFEKASVLTRMTTDINFIHQSIQSGRTAIRGMSVFLFSLVLMFVTS\n+>1_4\n+MPVIIGGILLVYRFVIGNYKKLFKQYDQLNNLAKESIAGARVVKSYHQQDNEIQKFNRVAGFIYKNFTKI\n+ERITALISPIVLFCIYALAIAIAWIGTNNIVDGKLDIGSLASVFAYAFQMLINLLLLSVVYVTIITAKPS\n+KDRIIEVLTEKIDIKDKKYAIDTVSDYEVEYKDVSFKYVDTNPHHNLEKINIKIKKGQTIGIIGSTGSGK\n+TSIVNLLTRLYECNEGQVLLNNIQLNNYSIKALRDAIAIVPQKSILYSGTIKDNILMGGNYSDEEVEKAI\n+TQAQAAEFINKLPNKLDSIVEQKWN\n+>1_5\n+MSHKKERNAQKKKYFKELLRFIWKNKKWHLLIAFFLIIISSITLVLVNNFIKDLIDDYIAPLLREKSTGK\n+PLDFSGLIKYLSIIGLIFILGVLSNIISGQIMAKATHATLFKLRNNMYVHMQGLPIKYFDTTKHGDIMSY\n+YTNDVDTVRNLIVQIIPQSFQALVQIVVIFVFMLQISIVLTLITVLLLLPMLIFFGFFGKKTRVNFVANQ\n+VEIANLNGVIQEYIETQMISNLFNYSDQVIHKFKLANNKQAAIMKKANVLASIVFPVIFNYSNVMYIVVA\n+IASVFLFESYQNKPILGQQITLRVIVSFVALVRAFVGPLANISENVNFFARSKAGAERIYTMLDEKLEEN\n+KGKIILDYIEKYENGNWRIANKWTKQIGWVINGEIKPFQGKVEFKNVNFSYDGKKQVLKNINISGYPGEK\n+IALIGKTGSGKTTIANLISRFYNVSDGEIYFDDIPISSVDINSIRKTVGMVLQSTELFSGSIRDNIAYGN\n+KEAKLEDIIEAAKLANAHDFIMALPNEYDTYITNNGEGLSQGQKQLLTIARVSSMNPTIMVLDEATSNID\n+SRTEKVIKESMDKLMQNQTTFAIAHRLSTIKNFNQILVIQEGEIVERGNHEQLMAKKGLYESFYHSSFSD\n+EMS\n+>1_6\n+MKRTYQPNKRKRAKTHGFRARMATASGRAVLAARKRKGRHILTVSDEAR\n+>1_7\n+MKRENSLKKITNFLELVKSKNKYYSNNYVIYAEKNRENKIKIGISVSKKLFAKAVIRNKIKREVRSFFDD\n+FTDWSKSLNILIKINNVNYLTNSYYLAKKEEFFDTYKKVVQKFKTI\n+>1_8\n+MNKVHSEIKTQSFNPFWNAATLKEKSRIDPNLKKALSYLWKFLKICVFLFLTVIGLWGCTQTYSEPWTVS\n+NPRIGVGLEIGYNYGVTGDYRYDLTSSNIGPYFSFANYQLSYGPFLAWFVWPASQIILPILYQTRVPLTQ\n+GIDYGLNTILAILILLFIIRLITIGITLNSTLNTERMGEVQGKIAEINAKYKNATDTQSKKMKQIEVMHI\n+YKKHKIKPAALFVQGFVTIPIFLIVYKMVSLTRPIKATILFGIWDLSVTPGTEIISDISRNWVYIFFVLL\n+VVPMQIVSQWLPQFWATRRNRNAKTTSQKGLEQLKKTRRIQWILIFVFALFPVITPSAVGLYWFLNSIFT\n+ILQSYITHVFIVKRRQRTKTISRLDQILNRELD\n+>1_9\n+MINKINKFFKNNEFSPSKQRGQNFLIDQNIINNVVEAVSKINPSKVLEIGPGLGAISEQLIKRFADNYYA\n+IELDKKLFHHLNERLLKDHILHADALEIDWKSIFDNLGDNPTMVGNLPYNISSKLIKKFILSTYRCAIIM\n+VQKEMGLRLLAKINSKDYSAFSALCQYSLSVSKIIEINETAFIPQPKVRSTLLFLEKKDIAFNEGYEKFL\n+KLIFLSRRKTILNNLKNNYDPKLIIQSLVSLGFKKTSRAQELSPTQLFSLYESLSKLC\n+>1_10\n+MVLKKHPELKSYHLPNCLAYMNHYRSYAKVNFYLKIKEYCPKVKKHKLESKLVLVKDLYDDLYLEKWNQT\n+KIKYFDQNNNSLTFSDDILVRTKKFLEDKLNQTFEFKAKVIKRIPTLSGLGSAPSNAAVLINWIYQEFGI\n+LNPVSYYEIATELGSDIPFFLSLHDCAIIKNFGDQVEQSILDGYETEKIIFNKQKPSTKKIFELLDYSQI\n+KKENLNDLEQPFFSLFPELLPSFNQLKNDSNHVVLAGAGSCFVVFRKLNEI\n+>1_11\n+MVFKKIKTQIDHALKQLNLPTDVEYLIQQTKNIQFGDFSSNVAMVLSKRQNKNPQEIAKQIIEQLNPNEF\n+EKITFSKPGFINFFLSNQDKLVVLKRLQETNYSVEKLPKEEQESINIEFVSANPTGFLHLGHVRNAYTGD\n+VLSNILRAVGHNVTKEYWINDLGNQVSLFALSTIIRYLQELGINKYELPDDSYHGKEPIFVAEEMIKDFG\n+NKYQDIKIEDNKIVDSKIANELTQYCTNKMLHFIKQDLESIGVKMDVWTSEKVVYQSNTLTELLNNQLKD\n+HIYEQDGAVWLRTTDGGDDKDRVIIKENKQPTYYGTDIANHYLKHKRGFDRLINVWGADHFGHILRTAYA\n+AELTGIKKGKFVVVLIEMVKLLKDNKEIKFSKRLGNAISIPDMLEFLSKDASRWFMLNQSWTSGIRIDVD\n+LTNKKDSSNPVYYVQYAHARIHKLLTKAEHIDLNKVNLSLLNSDVERTMVNYLASFEHYVHNVATTYEVN\n+KLLNFVYTLTQSFHSWYNSHEILNQKDEIKQTRLLLAKAIKNLINYLLSLFGIEAVEQM\n+>1_12\n+MRNRVRDKQNQNTRKKQVNNKRWIMWVLLLLLIILGVSAYFVINKFPPPKNDVPDSERTNDSQVTTPGTR\n+NETIPLNEQYKKVGDLRLMSWNTLNFGSRSEPTSNKFMNIIRTIQLSDADVVGLSEINYDDQLLAQRLND\n+ALGSSWSYTFSGKNFNENYPRSKESILILYKNQVVQPEVSKAINPNNIYTRPLWYTKFKIIGFDYSFITF\n+FGHFDAPGVNANNGETSAAGFSRQGSQEIKEAQAIATVFSDLKTQYPDTDIIGAADTNIRETN'..b'\n+MKYKLYDTHCHVNIEQLFPKHDELLKAFDQENIYINVVGTTLEDSILANDITKKYNNCSACIAVHPNDVQ\n+QHNLKEVRTTFEQMLSTPNNKIVGIGECGLDFYYTDQYKAIQYQFLDMHLELANKYKKPLMLHIRNAHKE\n+LVEYLNNKEILVPIIFHCFSQDIETYKLLEQLPTKIVRFYSIPGVVTFKNAKALQEVIPLIKNEQLLVET\n+DAPFLTPHPFRGKENNSLYLKYTIEKIAELKNVSVDQIKQLTFDNAYNLFKPKIKD\n+>1_755\n+MINKIMKKYETIYALATAPYNSAIHVIRLSGPDAFEIINKICDKQITKEGYRIQNARIVDNDQIIDDVLL\n+MKFVAPKSFTGEDSIEINCHGGLFVINKIMALLNKHGAHLARRGEFSKRSYINKKIDLNQATAIHDLIFA\n+KNNLSHSASIKALSGEFSKDIKNIQQEIFRLIGLVEIAIDYPEYEDEKKELTEEFKNLTNIRQKLQRIVN\n+KSLKLKQISEGIKIAIVGEPNAGKSSLLNALLNEQKAIVTNIPGTTRDTVEGQIVLNDELIINLIDTAGI\n+RKSSDQIEQIGINKSFKTIDKSDLVIYLIDLNKYQNYDKTNIYKYLINKKKQFVLVGNKVDEVDPTLNTG\n+EIQIKISAKNNDISDLIKYLEETSLAIFNDENKQDSIFQEEWQINLLQTALYNINLILNDPNQYHDLVIQ\n+HLNEANNSLLKVLSEYEDYNLIDEIFKNFCLGK\n+>1_756\n+MNLTNKYIPILLFENKGCYLKKYLEEYLINIVCTEANKPCKKCVWCSKIINNGYYDLIHVYPHNNVIRKQ\n+EIIDIQNKFNNTALESRGIKIYIIHQIEKANKESLNSLLKFLGEPKDNTIGILTTRKPYGVLDTIVSRCV\n+RYSTNSYEEKVEFKNKYKPKELELIKIMFYSYDDILQYESTKDIFKLLELIHLLELNNKKFDQIIKIRDL\n+FEKIDYYEISLVLNYLIFTGDFKRKSKLIPILNNLNLNLSKNAILISIID\n+>1_757\n+MKKGVFIVIEGVDGSGKSSFLKRMMNEHTMINSQPIIYSREPGGCDTSEAVRELIMKLSNSDPLTEALLF\n+CASRNEHLKKKILPALNENKIAICDRFVVSSWIYQGLIKNAGYEKVKKINEYVTDGLEPDLTILFDVDPE\n+IAAKRISERSTMNHLDAYTKERINKIRNAYLERLKDNKKAKIINASLDLDTVYDQVVNIITLFVKNHELN\n+>1_758\n+MLDKNLLKTNSKEIREQLKSRSFNLDWYDEFLRLEKQLSTLLRTIEKLNEQKNINAKKAATTESDAQRKK\n+LIQEGGLLRAELEKNEAKYNEIKEDFDYIYQRIPNLPTEDVPIGKDEKENVEMFKSRKPTFFDFKPLPHY\n+ELATKLEMIGLDVASKITGSRFSIYKKDGARLMRAIQQFCLYVNADKYEEYLPPVIVNKDSYYGSGQFPK\n+FVEDVFKLEGTNYYLASTAEVQLVNLHRNEILKEADLPKYYTASTACFRSEAGSAGKDTKGLIRQHQFYK\n+TELVKIVHPSTSKQEHEAMAKDAEKILELLELPYRRMVLCTGDMGFSATKTYDLEVWIPSENKYREISSI\n+SNCGDFQARRANIKFKDAISKKNLYVHTLNASALAHDRLFVAIVENYQQKDGSIKIPKALVKYFGKEYIK\n+>1_759\n+MNPNDKNNIKELLNKTVVKEASITKELETSFMEYAMSVIVSRALPESRDGLKPVHRRVLYGAYTSGLTHD\n+KPYRKSAQIVGHVMGKYHPHSDSAIYETMVRMAQPFSLRYMLIDGHGNFGSIDGDSAAAMRYTEARLSKI\n+SAEMLRNIDKDTVDFVDNYDASEQEPIVLPSLFPNLLANGSSGIAVGMATNIPPHNLSELIGGIKHLLVN\n+ENATIEELKEFIKGPDFPTAAEILGETGINEYFNTGRGSVSVRAKSEIEELANNKSNIVITQIPYMVNKA\n+NLINKIAELVKTEQIQGIADLRDESNREGIRIVIETKRDVIPEVLLNQLYKSTQLQTNFSVAMLALVNNQ\n+PKVLNLKEALQIYIDHQFDILLRKTNFELKKAKASAHIVEGLVIATNNIDDVIETIKNAKDNEDAKNTLM\n+TKYELSDLQAKAILDMRLRSLSGLERENLQKELAKLKELIKDLEEILQNKERRIKIISDQLDEIDHKFGD\n+ERRTKICYGLNSTIDNEQLIPVETVVITRSSKGYLKRIPISAYKVQHRGGVGVKGMNTYEDDDVESLIVC\n+STHSDLLFFTNYGKVYRIRAHQVPLGSRISKGIPAINLISIEKDEKLMSLLSINDYDSGYFFFSTKKGLV\n+KRVKASEFSRIQNNGKIAIKLTENDSLFKVIKTAGDEEIYIGVSSGLLVRFKEDVVRSMGRTAQGVIGVK\n+FKNPNDEVIGLSSSHEGSLLLAVCEKGVGKMTDREEYRMTNRGSKGVITIKVTPKTGNIINTQLVNGNEE\n+LLMISSTGKIVRVPLAEVSEQGRNTSGVKLISLNEKETLQSVAIFDVEQDDSQQVGSDNPDTELSSDDSN\n+QDQDKE\n+>1_760\n+MNNTKKDQYSSQSIKVLEGLSAVRKRPGMYIGSTDQKGLHHMIWEIIDNSVDEMMAGYGTTVKLTLKDNY\n+LVEVEDDGRGIPVDIHEKTNKSTVETVLTILHAGGKFDSDTYSMSGGLHGVGASVVNALSSSFKVWVNRD\n+YKIHYIEFKDGGVPLKPLEIIGTDSKKQGTRIQFVPDFSIMEQFEYDETIIADRIEQLAFLNKGIKFIFN\n+DERTDKKTKQEWLYEGGIKQYVENLNASKEPIIPQIIYGEKKTKVTLPKRNLEVTMLLEVAFQYTNGYYN\n+STYSFCNNIHTNQGGTHEEGFKNALYKIINRYALEKKFIKETDGKISKEDLSEGLTAIISIKHSEPQYQG\n+QTKDRLGNTEVREFTNSVVSELLERFFLENPEEAAKITAKAVSAMFSRKRSEAALESARKSPFESASLPG\n+KLADCTTKDMEISELYIVEGDSAGGSAKSGRDRFYQAILPLRGKVLNVEKANHEKIFKNEEIRTLITAIG\n+AGVNPEFSLDKIRYNKIIIMTDADVDGAHIRILLLTFFFRHMFPLIEKGHVYIAQPPLYRVSYNKQNKYI\n+YSDAQLEEWKNQNPNVRYELQRYKGLGEMDDVQLWETTMDPEKRTLLKVSINDAANADKTFSLLMGDEVS\n+PRRDFIEKNAKSVKNIDF\n+>1_761\n+MTLYELLEVDQNATLSEIKSSYKRLAKKYHPDVNKNGHDKFVQINNAYSILSDEVQREKYDFMLDHENSK\n+TFEFSADGLTYEYSGVEVWHENFTKNVSLTQQWDFNPSNYYYEEYNLYHKFDKISIDGLGAFLDFDISCA\n+FYELDTSFSLPNNLVKRLINRPDVIRYDISENELIEYLKHRYDFSSWLLLKKYFNIEAIIEVTQEEIDSQ\n+KIINIPIKIKVINLNRSFEIWHEELRNYAFIVPENTKTGDISEFFGKGNVALGWQGDLIVRFKVVPSVEK\n+RLKIFSSMLNNEKSSLWFLVPSENNKNPNTKIFNYKTYQFNN\n+>1_762\n+MKFFTSKSSFLEAIKFSSNFSSDNNFEQLLKNLYIKIDNKECKIYSSNGQVSSIYKIEDDIDVEEEGEVI\n+VNAKKLITIIQSIVSDNFTLAKLDNQLIIRAGKMQTSLNLEEDVSYPEIEIDDSNFSVIDVDSFLFAKSI\n+KKVIHSTSFQTTKNSISSAINFQKEADDMNIWITGSDAIKLSSCYYKVNDTEDALKAKFNFSVNALSLSY\n+VAAFLKDKDQLLLKISKKSDKVVLTNNKFVLYLRVENEPFPEFKKILNANKVVSSFVVDKDLISNNLHAL\n+TGVLSLSDQGKNNADANFEILKNTLRISTNSFDIASYNSEFDISEFQGEVKDINLNPFYLQEHIKMFESK\n+DIEFKLLLQSAISGCILKVCEKNNDQFKLKFVQVLAPSSTN\n+\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastfa/Species2.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastfa/Species2.fa Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,3212 @@\n+>2_0\n+MKILINKSELNKILKKMNNVIISNNKIKPHHSYFLIEAKEKEINFYANNEYFSVKCNLNKNIDILEQGSL\n+IVKGKIFNDLINGIKEEIITIQEKDQTLLVKTKKTSINLNTINVNEFPRIRFNEKNDLSEFNQFKINYSL\n+LVKGIKKIFHSVSNNREISSKFNGVNFNGSNGKEIFLEASDTYKLSVFEIKQETEPFDFILESNLLSFIN\n+SFNPEEDKSIVFYYRKDNKDSFSTEMLISMDNFMISYTSVNEKFPEVNYFFEFEPETKIVVQKNELKDAL\n+QRIQTLAQNERTFLCDMQINSSELKIRAIVNNIGNSLEEISCLKFEGYKLNISFNPSSLLDHIESFESNE\n+INFDFQGNSKYFLITSKSEPELKQILVPSR\n+>2_1\n+MNLYDLLELPTTASIKEIKIAYKRLAKRYHPDVNKLGSQTFVEINNAYSILSDPNQKEKYDSMLKVNDFQ\n+NRIKNLDISVRWHENFMEELELRKNWEFDFFSSDEDFFYSPFTKNKYASFLDKDVSLAFFQLYSKGKIDH\n+QLEKSLLKRRDVKEACQQNKNFIEVIKEQYNYFGWIEAKRYFNINVELELTQREIRDRDVVNLPLKIKVI\n+NNDFPNQLWYEIYKNYSFRLSWDIKNGEIAEFFNKGNRALGWKGDLIVRMKVVNKVNKRLRIFSSFFEND\n+KSKLWFLVPNDKQSNPNKGVFNYKTQHFID\n+>2_2\n+MEENNKANIYDSSSIKVLEGLEAVRKRPGMYIGSTGEEGLHHMIWEIVDNSIDEAMGGFASFVKLTLEDN\n+FVTRVEDDGRGIPVDIHPKTNRSTVETVFTVLHAGGKFDNDSYKVSGGLHGVGASVVNALSSSFKVWVFR\n+QNKKYFLSFSDGGKVIGDLVQEGNSEKEHGTIVEFVPDFSVMEKSDYKQTVIVSRLQQLAFLNKGIRIDF\n+VDNRKQNPQSFSWKYDGGLVEYIHHLNNEKEPLFNEVIADEKTETVKAVNRDENYTVKVEVAFQYNKTYN\n+QSIFSFCNNINTTEGGTHVEGFRNALVKIINRFAVENKFLKDSDEKINRDDVCEGLTAIISIKHPNPQYE\n+GQTKKKLGNTEVRPLVNSVVSEIFERFMLENPQEANAIIRKTLLAQEARRRSQEARELTRRKSPFDSGSL\n+PGKLADCTTRDPSISELYIVEGDSAGGTAKTGRDRYFQAILPLRGKILNVEKSNFEQIFNNAEISALVMA\n+IGCGIKPDFELEKLRYSKIVIMTDADVDGAHIRTLLLTFFFRFMYPLVEQGNIFIAQPPLYKVSYSHKDL\n+YMHTDVQLEQWKSQNPNVKFGLQRYKGLGEMDALQLWETTMDPKVRTLLKVTVEDASIADKAFSLLMGDE\n+VPPRREFIEKNARSVKNIDI\n+>2_3\n+MAKQQDQVDKIRENLDNSTVKSISLANELERSFMEYAMSVIVARALPDARDGLKPVHRRVLYGAYIGGMH\n+HDRPFKKSARIVGDVMSKFHPHGDMAIYDTMSRMAQDFSLRYLLIDGHGNFGSIDGDRPAAQRYTEARLS\n+KLAAELLKDIDKDTVDFIANYDGEEKEPTVLPAAFPNLLANGSSGIAVGMSTSIPSHNLSELIAGLIMLI\n+DNPQCTFQELLTVIKGPDFPTGANIIYTKGIESYFETGKGNVVIRSKVEIEQLQTRSALVVTEIPYMVNK\n+TTLIEKIVELVKAEEISGIADIRDESSREGIRLVIEVKRDTVPEVLLNQLFKSTRLQVRFPVNMLALVKG\n+APVLLNMKQALEVYLDHQIDVLVRKTKFVLNKQQERYHILSGLLIAALNIDEVVAIIKKSANNQEAINTL\n+NTKFKLDEIQAKAVLDMRLRSLSVLEVNKLQTEQKELKDSIEFCKKVLADQKLQLKIIKEELQKINDQFG\n+DERRSEILYDISEEIDDESLIKVENVVITMSTNGYLKRIGVDAYNLQHRGGVGVKGLTTYVDDSISQLLV\n+CSTHSDLLFFTDKGKVYRIRAHQIPYGFRTNKGIPAVNLIKIEKDERICSLLSVNNYDDGYFFFCTKNGI\n+VKRTSLNEFINILSNGKRAISFDDNDTLYSVIKTHGNDEIFIGSTNGFVVRFHENQLRVLSRTARGVFGI\n+SLNKGEFVNGLSTSSNGSLLLSVGQNGIGKLTSIDKYRLTKRNAKGVKTLRVTDRTGPVVTTTTVFGNED\n+LLMISSAGKIVRTSLQELSEQGKNTSGVKLIRLKDNERLERVTIFKEELEDKEMQLEDVGSKQITQ\n+>2_4\n+MLDPNKLRNNYDFFKKKLLERNVNEQLLNQFIQTDKLMRKNLQQLELANQKQSLLAKQVAKQKDNKKLLA\n+ESKELKQKIENLNNAYKDSQNISQDLLLNFPNIAHESVPVGKNESANLELLKEGRKPVFDFKPLPHRELC\n+EKLNLVAFDKATKISGTRFVAYTDKAAKLLRAITNLMIDLNKSKYQEWNLPVVINELSLRSTGQLPKFKD\n+DVFKLENTRYYLSPTLEVQLINLHANEIFNEEDLPKYYTATGINFRQEAGSAGKQTKGTIRLHQFQKTEL\n+VKFCKPENAINELEAMVRDAEQILKALKLPFRRLLLCTGDMGFSAEKTYDLEVWMAASNEYREVSSCSSC\n+GDFQARRAMIRYKDINNGKNSYVATLNGTALSIDRIFAAILENFQTKDGKILIPQALKKYLDFDTIK\n+>2_5\n+MNKGVFVVIEGVDGAGKTALIEGFKKLYPTKFLNYQLTYTREPGGTLLAEKIRQLLLNETMEPLTEAYLF\n+AAARTEHISKLIKPAIEKEQLVISDRFVFSSFAYQGLSKKIGIDTVKQINHHALRNMMPNFTFILDCNFK\n+EALQRMQKRGNDNLLDEFIKGKNDFDTVRSYYLSLVDKKNCFLINGDNKQEHLEKFIELLTRCLQQPTHY\n+>2_6\n+MLTTTHALLIIQRKGSFLKPFLDNYLTSIVCENKNGCKKCINCLEILNNKYNSLYWFDQINPFKRENALQ\n+LARIFNRERTSVNNKNIYLIEEIEKLSSNSINSLLRLVEDSPINSYGIFTTKNESLILSTFLSRVQKVVL\n+KKASKVPFKVSKNDQEIITSFFTVDEQIEAIENGSFNRFKIILDACLNKKTGTEQIYHAWQIFRDFSNSE\n+IAQLITLIINKTENIDKKSILFNCLKVLPYNPPKSTLFANLVSW\n+>2_7\n+MKSEINIFALATAPFNSALHIIRFSGPDVYEILNKITNKKITRKGMQIQRTWIVDENNKRIDDVLLFKFV\n+SPNSYTGEDLIEISCHGNMLIVNEICALLLKKGGVYAKPGEFTQRSFLNGKMSLQQASAVNKLILSPNLL\n+VKDIVLNNLAGEMDQQLEQIAQQVNQLVMQMEVNIDYPEYLDEQVELSTLNNKVKLIIEKLKRIIENSKQ\n+LKKLHDPFKIAIIGETNVGKSSLLNALLNQDKAIVSNIKGSTRDVVEGDFNLNGYLIKILDTAGIRKHKS\n+GLEKAGIKKSFESIKQANLVIYLLDATHPKKDLELISFFKKNKKDFFVFYNKKDLITNKFENSISAKQKD\n+IKELVDLLTKYINEFYKKIDQKIYLIENWQQILIEKIKEQLEQFLKQQKKYLFFDVLVTHLREAQQDILK\n+LLGKDVGFDLVNEIFNNFCLGK\n+>2_8\n+MEYFDAHCHLNCEPLLSEIEKSIANFKLINLKANVVGTDLDNSKIAVELAKKYPDLLKATIGIHPNDVHL\n+VDFKKTKKQLNELLINNRNFISCIGEYGFDYHYTTEFIELQNKFFEMQFEIAETNKLVHMLHIRDAHEKI\n+YEILTRLKPTQPVIFHCFSQDINIAKKLLSLKDLNIDIFFSIPGIVTFKNAQALHEALKIIPSELLLSET\n+DSPWLTPSPFRGKVNWPEYVVHTVSTVAEIKKIEIAEMKRIIVKNAKKLFWH\n+>2_9\n+MDVRTERLNELFFVYHKNLKNQSKSKYSRAVNYLKRRGFNLQDF'..b'KDFNSFFENLSPLLCGNIPYSITSPIINKFLESKLRSFVLMTQKEFANRLLA\n+KVNSSDYSAFGAFCQYYLTITTVFKIDRHAFKPKPKVDSTLILLEKNKSVSYDFKFGLFLKQCFNQRRKM\n+LINNLKHFFAVDYLLNIIQKQNLKTSIRAQELSPCQLFNLYQNICNGKN\n+>2_468\n+MPIKLAQTNKEIKTTFNPFWSAAVVNEKNNWKNFKKFSAIFIKVIKVFIFIFLTIVGLWGCTQTLAQPWT\n+GTNQVLGSGLEIGYKFGTTGDYRYDLISNNFGPYFTFSDYTLAYGPFYGWFVWPAAQIVLPIMYATRVPL\n+GSGVELGFNMILSLIVLLLLVRLITIVITLNSTLALEKMNEVQGKLAEINAKYKGAIDLQSKRNRQLEIM\n+SLYKKHNIKSSAAFVQVFVTLPIFLIIYRIVTTLRPIKAIILFNFWDLSKVPLTEIFSNFTTTGWPFIIF\n+LVIVLPVQFLSQKLPQVWASKRNENAKAHSQKSIEQLNKTKKMQLIFYFVFAAITAFSAAGVGVYWFLNA\n+LFTLLQSYLTHVFIVKRREKRKQNYSKLDLILERE\n+>2_469\n+MLNSRFPVSVKKSHSLRERKVFTTILQSKTRFFGTFINAYFIKNNHSTWRVAISIAKTKYKLAVQRNLIK\n+RQIRSIFQQISNNLEPWDILVIVNKGFIELTFKEKQKLFLQLLKRIKEVDAYQTSANK\n+>2_470\n+MKRTYQPSKLKRAKTHGFMARMATAQGRKVLRQRRFKNRAQLTVSSER\n+>2_471\n+MKKGNKTVWNECIDILDNVKSPSFSANFDDYFKKSKSKPPKKNKKVLNNIKKAELKLKKKANKKQKANTL\n+YIPPFAQQAKGIVITINKMWKNVHNDDSKQEISILSDVSLQIAYGEIVIILGSSGSGKTTLLNLIGGYDS\n+ISLGSCIVANCPLEKCTSEQLLTYRKNNLGYVYQRYNLIELLSAYDNIAISQNLIPKYQRRLDIEELAEK\n+LDIKEILYKFPYEMSGGQKQRVAIARAIIKEPKLLLCDEPTGALDSNSAENIINLLQTINKTYKQTILMV\n+THDVSLTRIANRIIKISDGKIVSNQLVRPLV\n+>2_472\n+MFSFFKQIFKSLKKFFFLLFGIIFVLFSIIFLETSIVQLSNNLVSTYTTLVSKTNSSDIVAPAILKEANP\n+VYIASLTNDSGYFSKIKIDDKKINYLFPYQENDFGSDSGQSNGSGDNQNKTIPRKGDVNEKDKLFLARKR\n+GILKAYGEANIAEKRIYKGLAVSFNNTDSFNGSDISDSITNRHIISDPQNLIYDASGNLLGYFADGLIKE\n+TISLRAGIARFPGDKGKSTGTQVKITQKQQTNNDPQKDSTVNSLYKTNNKDKVWFKSDETKADNTDISAN\n+YLFTGGNEAANWFPNLYANIPIDLEIDPGSQFWKDVNPFKEIVEEFQTQKESKDNQSFTLTFNLDISKLN\n+KLDNEQLKWLETNAKTIANNSSFGDWDLENKLKQLKKFELKINKDWLKKKVESEKDTILNSLPGFSDSDK\n+DTIFKTQNGMMVRNNNLSFQPSSNNLQLVQNQNSQASNGIADPNFSNVQTAYNKIHQSNNTPEKTLDAVY\n+AAVLDQWRSIFQEDLVKKTVDLLEKYRDHFLKATAFNNIDYSKQNIAIANNVSSAESASFLVSNKDEQRY\n+NDLSLIDGVDLKSWLFKPEQNESNPLDTIYGGQDANNGFLQKIDYEFKPSTSSGGMTASLKNTQALSPKS\n+TKFPIYPKLANIIAQAQLPEATNIPTTALDALKQWTNLDANGFNNLKEEDKRKAANNYLALLSYFTPAFQ\n+DPNELIETNRQMLEIPITVKNGVNPLILPTDQQNLVVQTPEAHGAVVSQQWLFRHNKEILPQEGEYAWKT\n+ALQTPNNFPNWLNDLPDRYKFSINGLTFAILGIGESVETGYPVLSLQSPLPNTQDEALIFVNDQAYRSIL\n+FAVPAANQENYYAFKSTDLKQHTDQDPVQFIANRLEGYLDVPRSDLAFNVKDISKFNYLTTARNYFPDLV\n+QSYLAIVSTVIAIFLIILALYLIILLIKSFIKKNQTEFSIIRAGGFSTTKFIVGMSVFAGIVAIVSSFLG\n+VLFAFLLEGQVKGIINRYWFIALPENSFNWLSFFGSFFITFFVFEFISWIAFKQLFSKPVNVLIDQGNET\n+KFSVLLHLLKHKSHTMSPLTKFRVSLIVSRFSRLFTYVGLSSVALLLIGIAGTIPQKFSAAQTSTSLNRN\n+FNYKLNLQTPTEQSGWYAIQPYSHFGVTDNNNGIKTLYNESVQANSQNEHPYKPSNLKLKNRQDQPIKAA\n+DGTELELGNLLLPSYGGAQQLNTDENFFRHASLSKWIIDFPIRVGGSNINPWEIVEKSIPKQITQLLSAS\n+SDQFLISVLTDDFFNNLNANGFLIRNPRTNQIQLDASRVLTTIDVFNPGGVKFNDSFLSFMLKVYGDFEL\n+AKQDSKLNFGIVPVDPAIEETYTYVEGPFGFQEDNLDENSPYTLTGINPESSFVNLIDGSGNSLRNLISS\n+DQEMNVIVNAGFQYANNINIGDYVYIKPKNTATRYSEKFLKAPLNNSTVAFKVVGVSTDAFGQELYINQH\n+IANNLLKLSGNQGRGIIRDVIKKTNGQSQSSDEYEIDYVKPNGYVPFNGVFSKELKPSLLNKALVLNSII\n+GVWGNFTDFGNNFQNLVRNKLDKVITSILPTDPEIINKLAQEKQIINTTSMNYESLRKELVNKYKTEWNS\n+VNLLSQNASSIFGNNIIAPVLNIDAAGTSAQIIRNNAEVLFNTVNQVDAFLLGTIIPFIFITCVVLGISM\n+LEEMKRIFISLKAIGYRDVQNLISLLTFFIPAFVLALLISIGVLAGVLIGIQAVVFNVAQVFLTNVFEFL\n+PYMVGIVLFGVTIFVIGSYFWIKLRSAELKEGF\n+>2_473\n+MVLKTKENKKFDIYLKSSDFAVSKKASKLIKKLNKKHPKRKSLNSFEAKKYDIYFKEVCKAVTNGINNQL\n+ICNHINLKILPGEFVVILGKSGSGKTSLLSLISALDRPTSGDSFVCGTNTICCSDAKLTALRNKNVGYIF\n+QQYGLLRDLDVDDNIKLALPLKKRFNNNLEELLERLELKEHRHKKVHKLSGGQQQRVAIARALIKEPKIL\n+FGDEPTGAVNIDISKKILQFFVEYNRDKGTTIVIVTHNEKIVELAKRVIKIHDGKIIVDYLNQNPKTIEQ\n+INWV\n+>2_474\n+MEQFNAFKSLLKKHYEKTIGFHDKYIKDINRFVFKNNVLLILLENEFARNSLNDNSEIIHLAESLYEGIK\n+SVNFVNEQDFFFNLAKLEENSRDTLYQNSGLSKNYTFQNFVISEGNKRAYEAGVRLAETQDNEFSPLFIY\n+GETGLGKTHLLQAIGNEKFRNFPNARVKYVVSSDFAQEVVDAFYQRDKGIEKLKKNYENLDLVLIDDTQI\n+FGRKEKTLEILFNIFNNLVLNKKQIVLVSDKAPDELIDIDARMISRFKSGLLLKIEKHNLSSLCEILTVK\n+LKEKDPNIQITNEARHDAAQISGNDVRALNGIATKLLFFAKTSKQNLINTENLKEILFEEFEKFHKKSFD\n+PYLLIENVCRRFNVPMDSVLSENRKAELVRVRDVCNYLLRQKYNMQFQQIGKIFKRSHSSVLMAVKRVAK\n+MIENDSSLRDVITSLVI\n+>2_475\n+MIISFVNNKGGVLKTTMATNVAGSLVKLCPERRKVILDLDGQGNVSASFGQNPERLNNTLIDILLKVPKF\n+SGSNNFIEIDDCLLSVYEGLDILPCNFELNFADIDISRKKYKASDIAEIVKQLAKRYEFVLLDTPPNMAT\n+LVSTAMSLSDVIVIPFEPDQYSMLGLMRIVETIDTFKEKNTNLKTILVPTKVNVRTRLHNEVIDLAKTKA\n+KKNNVAFSKNFVSLTSKSSAAVGYEKLPISLVSSPSKKYLNEYLEITKEILNLANYNVH\n+\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastfa/Species3.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastfa/Species3.fa Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,4765 @@\n+>3_0\n+MQTNKNNLKVRTQQIRQQIENLLNDRMLYNNFFSTIYVLNETETEIIIDFTDLIAKQEVISRWVDTVEKA\n+IKNLEISKILTFNNTNNYTINSKESQNFSIKNKYCSFNINNVLNKFTFRNFIKSSYNFQIFSIYDAIVAN\n+SRLNYSPIFISGPSGIGKTHFINAIGNLLVEKQKKVFYINDYKFISCVSSWMQNGQNEKISEFLNWLSQV\n+DAFLFDDIQGLANKQQTSIVALEILNRFIEEDKTVIITSDKSPSLLGGFEERFITRFSSGLHIKLNKPKK\n+EDFLRIFKHKLVEEKLEKHIWTNDAFEFLSKHFRNSIRELEGALKSIVFYIQTNKNKFENEIYFDKKKMF\n+EIFVEKYEIEQTITPDLIIEVVSKYYGVSILDIKSEKRGKNIVHARDIAIWLIKNILDLTHNSVGTFFNN\n+RRHSTIISTLKKIDTLKQSNNNELEIALNHIYKQLNWSFKQRK\n+>3_1\n+MKFTIEKKIIEWQIERMQSAILNNINSPLSSFFLKLTRSGLFIISTNSELSYKVFINKKDLIEIHDVGSC\n+LIDGVFLRDVIRKSDKQLSFHLIGSELKVFWEDALFSKTTRDSSFFPEINFEQKGIKLTVNAKNFKRAIK\n+NTAFATTNNPSQPILSAINLRSEAGFLHFSATDTSRFASEKIEISNKSRINISVSAKNLKDFIPPELDKD\n+IELNIESSKISYIYDNLTIQSRIFTIEYKDISNILPKDSEILYSLTINKRDILDLIDKTTIITPGKDNVI\n+NLSLSKNALKGYISQYDSGQSNVQTKNVLDFRFNPRFASDFRFDPELAQVNINYRYLKDAISVFDKVIDI\n+HINEKMNKMLIVSPEKPEICQLVGLVLV\n+>3_2\n+MSKKSKNSSIEFDAIVVGGGHAGIEAVYALLKKKLKVVLITLDKKKLASMPCNPAIGGPAKGIITREIDA\n+LGGVQGKFSDLAMIQIKYLNESKGPAVLAIRAQIDKEKYSKLILKDLKKQENLLIIEDLVSELLVEKNRV\n+FGLKTAKKQVFFSKTVIITTGTYMDSKVLRGSLAIPSGPDGQQTSNLLSNNLKRLGFELQRLKTGTPPRI\n+FTSSIDFSKVEKEVLPVYNINFSFQSKHKIKKQISCYLTYTTAKTHDIINKNLGKSSMYSGLISGVGPRY\n+CPSIEDKIVRFSEKPRHQIFFEPETKKQDIMYINGLSTSMPEDVQLEMVKTIPGLENAKIAKFGYAIEYD\n+ALNPLELKKSLETKKVKGLFMAGQINGTSGYEEAAAQGLVAGINAGQFVLGKKPVEILRNDGYIGVLIDD\n+LVTKGTKEPYRMLTSRAEYRLILRNDNADIRMAKYALKSGLISKKEYLKIKAKYAKIDRKILELSKEFVS\n+PKDELAKKYNLEKRISKLKLISWPNVNFKDILPDFEFGYELTVMARLKGYIQKQNSEAQKMIRLEKLLIP\n+GDLNYEKVANLSSEALDKFQKVRPKTIGEASRISGVNPADIQMLLFHIKVLKMQKVSKI\n+>3_3\n+MKISIISFGSSPREWLGLYKKEINKIKQFKYQIEFINLSEHSQENIELKKMLETKDILQKIPKNSSCYLF\n+TERGKTVTSKEFSQLLNFSNICFIIGGSYGVDEKLIAKSRPDIGFLSFGKLTFAHKIFKLIVLEQIYRGF\n+SIKFNRKYHHAD\n+>3_4\n+MKRKNYEKIIQNIENHDNIFIFHHIRPDGDCLGAQQGFGYAIAKRFPKKKVFFIGDNENIFNFLNFHFDN\n+ENLIQDEFFQNSLAITVDTADIKRIKKLDFFLNSNFKTRIKIDHHPDIFEEIYNEKWVDPTFSAASEMIG\n+YLLMEENWEINSEISKFIYLGILTDSGRFLFPSTTSRTFQVAAFLMKFNFDFAKLNWFLSNRTEQEVAFC\n+AEVLANYKKKDKVLWYFVSKEIQNKFKLRNDQLSAVNILANIGDARIWLFLIEMENGIRVRIRSNGPKVN\n+EIASEYGGGGHEYAAGINLEKSEKTKEISQEIIEKLVIQVKEFEQNE\n+>3_5\n+MSNIKIKEIIKLIENHDTIVIFHHIRPDGDCIGAQLGLKNLILDNFKNKKVFAVGNHKGSFSFLNAKTDS\n+IPDKLILKNSLAIIVDANFKNRIESVFLFDQFKFKTILRIDHHPNEDDFEQIYRWVDPSYVATCEQIADL\n+AYKAKWKISRKSATFIYLGIYTDSGRFLYKNTSARTHFLTGILFRTGFNFALIHEKLNQKKLSDIDFDSY\n+IFSVKKIYKNVIFYTLSMEEQKKLNKNPSNSVRPNLLANIENFRIWLCLVQEKENSWRVEFRSSGPNVQK\n+VAQNWGGGGHLNASGAIIESLDKLDLLIKDCQAEYESWFSQLK\n+>3_6\n+MEGINITNFLKYLFAYYYIDTGEREVYRTWVQKILWFTHWKFYRMYQIPFFSENFQSYKYGPISWTVLQT\n+QFFGIESFKNSQYNIDEILDFHQNNLVDEFKNRLKEDFLNDFNEDFGETFDENQIKGDLDLRWSCFVFVF\n+EKLKKFRPKDLINLSHSQKSFKIAAKNPHSKVIFNETILDDEEISILES\n+>3_7\n+MSFFRKIREKIFGTKQEKPANLDKYVAGLTKSRLSFFKQIVQLQKKHIKIDENFFEELEEILIMSDISPN\n+FVRTIIDSLKAEVRHHNLNNPDLIPEIIMDKMYTIYSNRSVVNTNLNIKDGRINVFLISGVNGSGKTTSI\n+AKVARKFIIEGKKVLIIAADTFRAAAVEQLEIWANRVGALILKPEANEKDPGSVVFRGLDFAIKEKTDLV\n+LIDTAGRLQNNVNLMQELKKINKIISQKVPNAPHESLLVIDATTGQNGVSQAANFAKITPVSGIILTKMD\n+GTSKGGIIFSIKDQLDISVKLVGLGEAMDDLQPFDLDLFIFAITKEVKNQYQV\n+>3_8\n+MAKISFFALGGQDENGKNCYILEIDDNIFIINSGAKIPLDSSVGVDTIIADFTYLEENQHKIRGVFITDA\n+KNESFSALPWLIMKLKKIKIYSSFFTKALIIERIHKYRLSESAFEVIPITSELKINEKISVSPFPVAGSM\n+PGTIGFCFHTEDGGIVFMANYVVGNLGVYGETNFELIKKISQNPKGILMFISDSGKSNLPGKAINKLFAK\n+NFLENFFLKADKNSRIVVSAYDEEMVSIQEIIDLSIKFNRQITAYGKKYDKLYDMIYKLDKLTTNKLKKL\n+PTFFDYKYANKQKNSVILITSSPERICYRFNRILENDDVYFKLKKSDYVIMLTPPINGMEQLYAKVLDQI\n+AKSTTSIVDISESDFGLARPYKEDISEMIQLLKPKYFLPIQGLYRYLIVASNIAVANKVKRQNIIVLQNK\n+RSANFIDGSLFSRKKISKGEEEIYVSGFGIGDVCFRVLKERDALSRNGLIIVSFLFDPIEKKIFSTPEIT\n+TYGILSRENREAYYDIIRKIIFNNFSNIKKINDKILKELQQKSQKNIKRKLLRIFDKEPSVSVLIHNIYP\n+EVKKMKKMLWKQAENELKTGVVYLEFAADWCNDCKMQEPVNEELSKYFKDRSDVKLIKVDAEESKLFRQK\n+GTKYEVLFVPTHFIFKDGQILFKQFNYVPAEVLIEKIEKALNS\n+>3_9\n+MPKLDSKKEKYLKQIVENFIKTGESIGSLNLKQSYGIKKSPSYLRAIMNQLEKEGFLEKSHSSSGRIPTL\n+QGFQYYAEFLSFDENENLANKLKDLFARRRINIENTISEAVKLISESVGTTLIATTNNENERLMSINLTQ\n+ISQNEGIIVVVSSSGNVENKKITFSEQIPRQDVKIAIRLFQERLINTPLLEISSKLAILKQELEKQIKHS\n+DELLHHFMEKIFNFQVQNKSNIYNKNSLILDKEISRAKLVDLLYIIEKKSIWEMLEDRTTKDDDTLKISI\n+KSPEVSFISKKFEKFLPIKEISMVGAAKKINYSAARTGIKLLEDFLSNKSKIRKG\n+>3_10\n+MVFG'..b'FSMLIFYFSD\n+IIKWIIYEILYLKTNWAINLTLEKTAKKIL\n+>3_666\n+MPRLTNMKISFVAIFISIAVIMLIIGVRLAPFAILPNFRLSIIGLPIKITGFIFGPIVGFLTGLLADLIT\n+FLFIPGVYSWYYTLHLSLAGFIPGIFFWFFVIKGKKWFEKKSILTRLDQKIFEQKQKIFDFTYYRIANNQ\n+KDENLERKMKQKLLFLQKKVKRVESWQEEKSLLNFYWIASNLILISIVVTTIYVVMFSSSIDFSQSRFIS\n+SKLSFLILTLFGTVSMIIFLLLARFINFFRKNERYLTIAPIVVFSALHEPIASIIGARGDVQSGALNNFD\n+TAFLSHIIVSPVKIWINLSVIYFTAKAVVPLVYKKFSYSIT\n+>3_667\n+MTNLHQEKRKKLLFHNIKNKYWNYFSLELEANQGSFIYSSDKNFFNEFKKILEDENSYNGFILENNEPYE\n+YQKNTCFSDFLTKKFFEKNKNKLVIEVLLSLWRIEPFKIKTNTTRRYIQYLSIKNVENFLKMFENELNYL\n+LENRAQAFKFIEKIAKIKEEYQILNKNFYNLYLKTELKPNIEQEKLNEKLKLSIPYPETKFENLKFSQTY\n+AQIALQTIKNDIKNVINHHNSLINSFDSDPYKIKIFITGYNCFLDLIKRSDNFRWLSSLQIYEIYFKFEQ\n+WLIKLLNQKALENILGTQNFFNNTFAEEFWGFWKQNSQQKILEERNKKAQKHFKVKKINSFHKENPYYQN\n+LKTNSKTLLRANILWQHEVIKMEKKLRNKNFQNSFFIKRIWVSSIENKLKKLKEKISKVEYENHFIFLKD\n+ALSDLKNFFYLKNLKKIDVFLKKNQFFIFCFDNKINFDILYKKYGVLTNDDLFFLETKKMQMGNYSRFLF\n+DEYSFLLETNYKQKLFQHFFNNGENSAQLFIYSRRTIKPIRDFSIIFIENGTLVEYIREIDLPLTPKTSF\n+GKFFYQNGTFERTNLPLLETQLYKQLQNEVFQNNSGGIKNNFESFINSWIPIKEFKLEFDSENKKYSLKK\n+DILVIDL\n+>3_668\n+MKNKYDFKLVEEKRNEKWQKKGFFIAPKQTKKPFSIISPPPNVTGQLHLGHSWNAFIQDSLVRYHKLQGF\n+DVLLLPSVDHAGIATQVKVEEDLAKKGIKKSDLKREEFIKKCYHWKEKQYLKIKEQWDKLGICYDFSKER\n+FTLDQDAQIAVSDFFIKLWEKNLIYRGQKAINWDIKLQTAISNIEVINKPVEQKMYYLKYFLENSNEFLT\n+VATTRIETISSDVALAINPKDKRYLHLVGKKVVHPLTKKLIIIIADSNVSSDFGSGIMKVSAHSILDFEI\n+MEKHNLESKDCIDNYGNLNHEVPEFQGQNRFFARDLIAKKLEKEGFLAKIETVISNVGFSQRSDEIVEIL\n+KKPQWFVKMDELAKSLISHLNSKDKIKFYPKNFEKNLRKWFEKIHDWTISRQLWWGHRIPVWCKNDEFKV\n+QIDSPGQGWIQDEDVLDTWFSSGISAFAFLGWPQNFDLIKSYFPTSLLVTGWDILFFWVARMYFSSLFIM\n+KQKPFEKVLLHGLIRDEIGRKMSKSLGNGLDPMEIIEKYGSDTLRQALIFNSSPGKDIKFNIEKLNTAWN\n+LNNKIWNIAKYIADLDTFFAKPDLIDLWMENKIYILKRQIVKNIKKYNFSVIGTEINNFIYGDFSSRYIE\n+LIKTRKNGFYARKLLRKVLIILHPFLPFLTDFLMEKIFKMEILEQKMPRIRQFKENQKVENILEIIDNLR\n+TYREKFQISKKIILEYCIINDKFSNAEIDIINKLTFGKWLENKELVIKTKNFEIAIKVPEELKKEQKGRE\n+LKEIQFLKSEILRAEKILTNKGFLEKAPREKIDLERTKLEKLKEKLVFYEKK\n+>3_669\n+MKKLKIYKNLNYFLPSFVFLGGAFFVLVSCGSTHFGLNISRESQTGIENAKKLKKIVNSPNLIELSPENN\n+EKIYEDKDAKFFLFDLNSAVNGGKNLELMPEFTTKFSPKTEITYLNFINRYYNTRQLQQKKKSLNQDSNS\n+IYIPHVDEKFKDFWYVFMIPTSIGFSALELNGKKTVIDREKTKLPSTLIPYSSVEVKILKKGIISADKKN\n+YLQINVNQMINSFAFREKKSNEPNSSEINVFGFQDNKAYPNYKLIFDSLDSSKKIIKFKLHRKNDNLHEE\n+RSAKNKLNSYISVMNFIYKAKEYKQNLNPDDFFEKNTEQKDKNSEYPFVRFYTQTFIVPFEGKEEVFDSD\n+FSILIEKSE\n+>3_670\n+MKNKITPCIWSLISNTHLRKAESLEILIRALLLNNEEINQNFKNKWLKIYKNKNWKPIGDLNEHLKLAAQ\n+LGVTKTDILTPGQQKINILAKLVNSGIIKIREYISIILFNLVSFINYEYRHIFKMTLELLKKQNNSPVSV\n+DEIFQNFNFGEPVCAEFNIKLLRYNLKQKDHIFYILISGVFFEVLSSRGKNQQYNINFFKIKLYDHWYSR\n+IDELIKRCNNQLESYNFEKASLIRLDSEKWSNYLTQNSQANYDYIVDVLMQKESNNLDEKNDNTINFKAS\n+INHLENQVQKNLENSLQETQINQDISTTISNNPEKVDIELEAILENSQENKVDLSELPANFNDKDQAESH\n+QISLENADLTSTNSVEKLEIEEKIQEKQSDIRIISNNLEQNCCPEQNVVEKEIEKTYEDNIEKNSFYSNF\n+YQDQFERDFNKISEPSGEKNLQDNAQSEICAAEKCCNHIQLEKENLEHIDSSKQEKVVKINSNYLNKGEK\n+NNSNTNKKVPSLPLLYQAKQEMQREISKYPISKSVNSKEHYYNYFIHKINKLFNFSLENMLNKTNFKQNF\n+FNILDFHKKNHEIILKPKKTIIKSGKNLLLISPSANLIYSKIKNELCKTEISEKNYEIVTFFDDYNPESF\n+IGYNDFVLGSKEKLNFIPGPFARILHKAYWNPEKKYCLILENIDNDAAKITLAPLKPLFIRGENGESLLG\n+ISQFDLSFYIFSHPEEKNFIPGNLTIIGTVNSNLDRDFVDLYPDFLENWEIKYLERDNLYSHITKYQICD\n+TGLSWKHFSEKLNSLLESENLNNKWFLPNQIETKILENPRIFVDKVLFSLWNFTSPEKRKIIFRSNSYSV\n+MVKEFLETKGSKRLNIFKFDYEKIKNI\n+>3_671\n+MKNRKIRPKAFDYFQSQNNQNKKTFKFKGFFKFLKIFFYTIIFGISLTGCIQSMVVKTSYNPGEALEFYN\n+SKEEITPNYTIFRESKNKDLPGIDIVTKNNNFLVSADNKKVNQEKILNALRKQIKNENAEFGEFSSLIMF\n+QKGENEFEYLKGDKNNEFIFFSSSENSIEQKTNWTEIKIPSPKYFSLKSDKQYFEKLRDVKSLPINTYSF\n+DKSSSENAAISEKIDSYFFNLDNKIPPVNRSYAIFARDVFQVIYNKLILLPQFSQGKLEKAIAEFEQKSG\n+KDVSPETEKILSGYANLVKKLVFPTNFSRIDIQNKTYSWNNNDESAAKNIAFQNKIPAFPIVSWAESWKL\n+GPFYAIFVYPLSKIILWVTASQSLYEWSGWITILSILAVVVFTKIISFIFRFKTIFGQNKQMELQLKKAK\n+IDAKYENYKKNKVMQQRHRQEIVDLYKKNNFSPFSPFSQILVTMPIFIAVWRALQGIPSFKVTYFLGLEL\n+AATSYQKLFEGYWIYLPIIIVTVLVQALQQIIPKILNKKKSNRIMNVQENETLKKQQKTQRIVSIIFIFF\n+GVIFQASLQIYWIIGGIWEILQTLGIFYLQKSNFYREKMRPWLERKKWV\n+>3_672\n+MQKIRSIKKNWEFQAIINKKNQIVTNYLIFYYVKSDFFEIGISVPKKFANAVKRNYYKRQIKNALYILWK\n+KGEIFLNFRVVLIARKNFLPLSFETKYQKLAKIFKELKRNEK\n+>3_673\n+MKRTYQPNKRKHLKTHGFRARMSTADGRKILAARRAKGRKRLTVSDK\n+\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastids/SequenceIDs.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastids/SequenceIDs.txt Tue Oct 24 06:40:40 2017 -0400
[
b'@@ -0,0 +1,2733 @@\n+0_0: gi|290752267|emb|CBH40238.1| Chromosomal replication initiator protein DnaA [Mycoplasma agalactiae]\n+0_1: gi|290752268|emb|CBH40239.1| DNA polymerase III, beta chain [Mycoplasma agalactiae]\n+0_2: gi|290752269|emb|CBH40240.1| Esterase/lipase [Mycoplasma agalactiae]\n+0_3: gi|290752270|emb|CBH40241.1| Esterase/lipase [Mycoplasma agalactiae]\n+0_4: gi|290752271|emb|CBH40242.1| NADH dependent flavin oxidoreductase [Mycoplasma agalactiae]\n+0_5: gi|290752272|emb|CBH40243.1| Lipoate protein ligase A [Mycoplasma agalactiae]\n+0_6: gi|290752273|emb|CBH40244.1| Lipoate protein ligase A [Mycoplasma agalactiae]\n+0_7: gi|290752274|emb|CBH40245.1| Conserved hypothetical protein [Mycoplasma agalactiae]\n+0_8: gi|290752275|emb|CBH40246.1| Glycine cleavage system H protein [Mycoplasma agalactiae]\n+0_9: gi|290752276|emb|CBH40247.1| Conserved hypothetical protein [Mycoplasma agalactiae]\n+0_10: gi|290752277|emb|CBH40248.1| Hypothetical protein MAGa0130 [Mycoplasma agalactiae]\n+0_11: gi|290752278|emb|CBH40249.1| Conserved hypothetical protein, predicted lipoprotein, P48 [Mycoplasma agalactiae]\n+0_12: gi|290752279|emb|CBH40250.1| Hypothetical protein MAGa0150 [Mycoplasma agalactiae]\n+0_13: gi|290752280|emb|CBH40251.1| ABC transporter, ATP binding protein, P59 [Mycoplasma agalactiae]\n+0_14: gi|290752281|emb|CBH40252.1| Sugar ABC transporter Permease [Mycoplasma agalactiae]\n+0_15: gi|290752282|emb|CBH40253.1| Sugar ABC transporter permease protein [Mycoplasma agalactiae]\n+0_16: gi|290752283|emb|CBH40254.1| Deoxyguanosine kinase [Mycoplasma agalactiae]\n+0_17: gi|290752284|emb|CBH40255.1| Deoxyguanosine kinase [Mycoplasma agalactiae]\n+0_18: gi|290752285|emb|CBH40256.1| Conserved hypothetical protein, predicted lipoprotein [Mycoplasma agalactiae]\n+0_19: gi|290752286|emb|CBH40257.1| Hypothetical protein, predicted lipoprotein, DUF285 family [Mycoplasma agalactiae]\n+0_20: gi|290752287|emb|CBH40258.1| Conserved hypothetical protein, DUF285 family [Mycoplasma agalactiae]\n+0_21: gi|290752288|emb|CBH40259.1| Transposase [Mycoplasma agalactiae]\n+0_22: gi|290752289|emb|CBH40260.1| Hypothetical protein, predicted lipoprotein, DUF285 family [Mycoplasma agalactiae]\n+0_23: gi|290752290|emb|CBH40261.1| Conserved hypothetical protein YeiN [Mycoplasma agalactiae]\n+0_24: gi|290752291|emb|CBH40262.1| Conserved hypothetical protein YeiC [Mycoplasma agalactiae]\n+0_25: gi|290752292|emb|CBH40263.1| Hydrolase of the HAD superfamily [Mycoplasma agalactiae]\n+0_26: gi|290752293|emb|CBH40264.1| Conserved hypothetical protein [Mycoplasma agalactiae]\n+0_27: gi|290752294|emb|CBH40265.1| Hypothetical ABC transporter, ATP binding protein [Mycoplasma agalactiae]\n+0_28: gi|290752295|emb|CBH40266.1| Hypothetical protein MAGa0310 [Mycoplasma agalactiae]\n+0_29: gi|290752296|emb|CBH40267.1| Hypothetical protein MAGa0320 [Mycoplasma agalactiae]\n+0_30: gi|290752297|emb|CBH40268.1| Hypothetical protein MAGa0330 [Mycoplasma agalactiae]\n+0_31: gi|290752298|emb|CBH40269.1| Oligopeptide ABC transporter, ATP binding protein (OppF) [Mycoplasma agalactiae]\n+0_32: gi|290752299|emb|CBH40270.1| Oligopeptide ABC transporter, ATP binding protein (OppD) [Mycoplasma agalactiae]\n+0_33: gi|290752300|emb|CBH40271.1| Oligopeptide ABC transporter, permease protein(OppC) [Mycoplasma agalactiae]\n+0_34: gi|290752301|emb|CBH40272.1| Oligopeptide ABC transporter, permease protein(OppB) [Mycoplasma agalactiae]\n+0_35: gi|290752302|emb|CBH40273.1| Oligopeptide ABC transporter, substrate bindingprotein (OppA), predicted lipoprotein [Mycoplasma agalactiae]\n+0_36: gi|290752303|emb|CBH40274.1| Conserved hypothetical protein [Mycoplasma agalactiae]\n+0_37: gi|290752304|emb|CBH40275.1| Cysteinyl tRNA synthetase (Cysteine tRNA ligase) [Mycoplasma agalactiae]\n+0_38: gi|290752305|emb|CBH40276.1| tRNA/rRNA methyltransferase [Mycoplasma agalactiae]\n+0_39: gi|290752306|emb|CBH40277.1| Hypothetical protein MAGa0420 [Mycoplasma agalactiae]\n+0_40: gi|290752307|emb|CBH40278.1| 50S ribosomal protein L33 [Mycoplasma'..b'ae J]\n+3_632: gi|144227736|gb|AAZ44718.2| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+3_633: gi|144227737|gb|ABO93485.1| hypothetical protein MHJ_0699 [Mycoplasma hyopneumoniae J]\n+3_634: gi|71852111|gb|AAZ44719.1| O-sialoglycoprotein endopeptidase [Mycoplasma hyopneumoniae J]\n+3_635: gi|71852112|gb|AAZ44720.1| transcription antitermination protein [Mycoplasma hyopneumoniae J]\n+3_636: gi|144227738|gb|AAZ44721.2| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+3_637: gi|71852114|gb|AAZ44722.1| hypothetical protein MHJ_0639 [Mycoplasma hyopneumoniae J]\n+3_638: gi|71852115|gb|AAZ44723.1| putative tRNA/rRNA methyltransferase [Mycoplasma hyopneumoniae J]\n+3_639: gi|144227739|gb|AAZ44724.2| cysteinyl-tRNA synthetase [Mycoplasma hyopneumoniae J]\n+3_640: gi|144227740|gb|AAZ44725.2| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+3_641: gi|71852118|gb|AAZ44726.1| putative hemolysin C [Mycoplasma hyopneumoniae J]\n+3_642: gi|71852119|gb|AAZ44727.1| replicative DNA helicase [Mycoplasma hyopneumoniae J]\n+3_643: gi|71852120|gb|AAZ44728.1| 50S ribosomal protein L9 [Mycoplasma hyopneumoniae J]\n+3_644: gi|71852121|gb|AAZ44729.1| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+3_645: gi|71852122|gb|AAZ44730.1| leucyl-tRNA synthetase [Mycoplasma hyopneumoniae J]\n+3_646: gi|144227741|gb|AAZ44731.2| excinuclease ABC subunit B [Mycoplasma hyopneumoniae J]\n+3_647: gi|71852124|gb|AAZ44732.1| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+3_648: gi|71852125|gb|AAZ44733.1| 30S ribosomal protein S9 [Mycoplasma hyopneumoniae J]\n+3_649: gi|71852126|gb|AAZ44734.1| 50S ribosomal protein L13 [Mycoplasma hyopneumoniae J]\n+3_650: gi|144227742|gb|AAZ44735.2| dimethyladenosine transferase [Mycoplasma hyopneumoniae J]\n+3_651: gi|144227743|gb|AAZ44736.2| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+3_652: gi|144227744|gb|AAZ44737.2| ribose-phosphate pyrophosphokinase [Mycoplasma hyopneumoniae J]\n+3_653: gi|71852130|gb|AAZ44738.1| glucose inhibited division protein B [Mycoplasma hyopneumoniae J]\n+3_654: gi|71852131|gb|AAZ44739.1| putative prolipoprotein p65 [Mycoplasma hyopneumoniae J]\n+3_655: gi|71852132|gb|AAZ44740.1| putative ABC transporter ATP-binding protein P115-like protein [Mycoplasma hyopneumoniae J]\n+3_656: gi|71852133|gb|AAZ44741.1| 50S ribosomal protein L33 [Mycoplasma hyopneumoniae J]\n+3_657: gi|71852134|gb|AAZ44742.1| XAA-PRO aminopeptidase [Mycoplasma hyopneumoniae J]\n+3_658: gi|144227745|gb|AAZ44743.2| hypothetical protein MHJ_0660 [Mycoplasma hyopneumoniae J]\n+3_659: gi|144227746|gb|AAZ44744.2| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+3_660: gi|144227747|gb|AAZ44745.2| hypothetical protein MHJ_0662 [Mycoplasma hyopneumoniae J]\n+3_661: gi|71852138|gb|AAZ44746.1| putative adhesin like-protein P146 [Mycoplasma hyopneumoniae J]\n+3_662: gi|71852139|gb|AAZ44747.1| putative ABC transporter ATP-binding - Pr1 [Mycoplasma hyopneumoniae J]\n+3_663: gi|71852141|gb|AAZ44749.1| hypothetical protein MHJ_0666 [Mycoplasma hyopneumoniae J]\n+3_664: gi|71852142|gb|AAZ44750.1| transcription elongation factor [Mycoplasma hyopneumoniae J]\n+3_665: gi|144227748|gb|AAZ44751.2| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+3_666: gi|71852144|gb|AAZ44752.1| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+3_667: gi|71852145|gb|AAZ44753.1| hypothetical protein MHJ_0670 [Mycoplasma hyopneumoniae J]\n+3_668: gi|71852146|gb|AAZ44754.1| valyl-tRNA synthetase [Mycoplasma hyopneumoniae J]\n+3_669: gi|144227749|gb|AAZ44755.2| hypothetical protein MHJ_0672 [Mycoplasma hyopneumoniae J]\n+3_670: gi|144227750|gb|AAZ44756.2| hypothetical protein MHJ_0673 [Mycoplasma hyopneumoniae J]\n+3_671: gi|71852149|gb|AAZ44757.1| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+3_672: gi|71852150|gb|AAZ44758.1| ribonuclease P protein component [Mycoplasma hyopneumoniae J]\n+3_673: gi|71852151|gb|AAZ44759.1| 50S ribosomal protein L34 [Mycoplasma hyopneumoniae J]\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastids/SpeciesIDs.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastids/SpeciesIDs.txt Tue Oct 24 06:40:40 2017 -0400
b
@@ -0,0 +1,4 @@
+0: Mycoplasma_agalactiae.faa
+1: Mycoplasma_gallisepticum.faa
+2: Mycoplasma_genitalium.faa
+3: Mycoplasma_hyopneumoniae.faa
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast0_0.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast0_0.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,3999 @@\n+0_0\t0_0\t100.00\t466\t0\t0\t1\t466\t1\t466\t0.0\t 941\n+0_0\t0_720\t27.36\t106\t70\t3\t155\t258\t153\t253\t1e-07\t48.1\n+0_1\t0_1\t100.00\t369\t0\t0\t1\t369\t1\t369\t0.0\t 734\n+0_2\t0_2\t100.00\t261\t0\t0\t1\t261\t1\t261\t0.0\t 531\n+0_2\t0_499\t64.62\t260\t90\t1\t4\t261\t5\t264\t8e-121\t 345\n+0_2\t0_3\t57.03\t263\t111\t1\t1\t261\t1\t263\t3e-111\t 321\n+0_2\t0_223\t49.04\t261\t132\t1\t2\t261\t3\t263\t1e-88\t 263\n+0_2\t0_147\t38.40\t263\t158\t3\t2\t261\t5\t266\t1e-54\t 176\n+0_2\t0_718\t29.51\t122\t81\t3\t10\t130\t15\t132\t2e-08\t48.9\n+0_3\t0_3\t100.00\t272\t0\t0\t1\t272\t1\t272\t0.0\t 560\n+0_3\t0_499\t58.78\t262\t108\t0\t2\t263\t3\t264\t1e-118\t 340\n+0_3\t0_2\t57.03\t263\t111\t1\t1\t263\t1\t261\t4e-111\t 321\n+0_3\t0_223\t49.04\t261\t132\t1\t3\t263\t4\t263\t1e-89\t 266\n+0_3\t0_147\t37.02\t262\t163\t2\t3\t263\t6\t266\t2e-56\t 181\n+0_3\t0_718\t26.32\t228\t142\t5\t10\t228\t15\t225\t1e-12\t62.0\n+0_3\t0_60\t21.91\t251\t171\t12\t9\t246\t14\t252\t1e-06\t43.9\n+0_4\t0_4\t100.00\t392\t0\t0\t1\t392\t1\t392\t0.0\t 797\n+0_5\t0_5\t100.00\t348\t0\t0\t1\t348\t1\t348\t0.0\t 702\n+0_5\t0_6\t74.49\t345\t88\t0\t1\t345\t1\t345\t0.0\t 548\n+0_5\t0_59\t30.85\t295\t192\t6\t48\t342\t43\t325\t1e-41\t 145\n+0_6\t0_6\t100.00\t345\t0\t0\t1\t345\t1\t345\t0.0\t 699\n+0_6\t0_5\t74.49\t345\t88\t0\t1\t345\t1\t345\t0.0\t 548\n+0_6\t0_59\t31.00\t300\t195\t6\t43\t342\t38\t325\t2e-41\t 145\n+0_7\t0_7\t100.00\t289\t0\t0\t1\t289\t1\t289\t0.0\t 603\n+0_8\t0_8\t100.00\t114\t0\t0\t1\t114\t1\t114\t4e-80\t 230\n+0_8\t0_389\t37.72\t114\t71\t0\t1\t114\t1\t114\t2e-23\t85.5\n+0_9\t0_9\t100.00\t333\t0\t0\t1\t333\t1\t333\t0.0\t 684\n+0_10\t0_10\t100.00\t272\t0\t0\t1\t272\t1\t272\t0.0\t 531\n+0_11\t0_11\t100.00\t465\t0\t0\t1\t465\t1\t465\t0.0\t 946\n+0_11\t0_155\t75.68\t440\t106\t1\t27\t465\t163\t602\t0.0\t 674\n+0_12\t0_12\t100.00\t149\t0\t0\t1\t149\t1\t149\t1e-103\t 292\n+0_12\t0_397\t32.61\t138\t77\t7\t10\t140\t4\t132\t1e-09\t48.9\n+0_13\t0_13\t100.00\t534\t0\t0\t1\t534\t1\t534\t0.0\t1084\n+0_13\t0_27\t31.53\t203\t124\t5\t25\t224\t1\t191\t2e-20\t86.7\n+0_13\t0_476\t28.85\t208\t133\t5\t20\t224\t19\t214\t6e-17\t75.9\n+0_13\t0_535\t27.23\t213\t135\t7\t21\t226\t18\t217\t5e-15\t70.5\n+0_13\t0_535\t21.54\t246\t150\t9\t279\t515\t18\t229\t5e-06\t43.1\n+0_13\t0_157\t29.13\t230\t139\t6\t7\t231\t4\t214\t9e-15\t69.3\n+0_13\t0_814\t23.74\t198\t139\t3\t10\t203\t128\t317\t2e-13\t66.6\n+0_13\t0_814\t23.48\t247\t151\t9\t263\t501\t120\t336\t2e-10\t57.4\n+0_13\t0_624\t24.61\t508\t307\t26\t7\t462\t2\t485\t1e-11\t61.6\n+0_13\t0_534\t23.68\t228\t165\t6\t279\t502\t22\t244\t2e-10\t57.4\n+0_13\t0_534\t23.55\t242\t145\t9\t19\t229\t20\t252\t8e-09\t52.0\n+0_13\t0_32\t27.31\t216\t134\t8\t26\t224\t118\t327\t2e-10\t57.4\n+0_13\t0_32\t22.83\t254\t158\t10\t264\t503\t99\t328\t6e-06\t43.5\n+0_13\t0_520\t34.02\t97\t61\t1\t6\t102\t45\t138\t4e-10\t57.0\n+0_13\t0_520\t25.58\t86\t63\t1\t139\t223\t468\t553\t7e-04\t37.0\n+0_13\t0_324\t29.61\t206\t128\t10\t24\t223\t385\t579\t1e-09\t55.5\n+0_13\t0_324\t40.85\t71\t39\t2\t264\t331\t365\t435\t1e-07\t48.9\n+0_13\t0_627\t27.27\t198\t136\t6\t21\t218\t373\t562\t1e-07\t49.3\n+0_13\t0_124\t22.58\t310\t154\t9\t5\t231\t10\t316\t1e-07\t48.9\n+0_13\t0_124\t28.92\t83\t50\t2\t424\t501\t231\t309\t2e-05\t42.0\n+0_13\t0_626\t25.00\t240\t132\t10\t11\t224\t369\t586\t1e-06\t45.4\n+0_13\t0_626\t24.28\t243\t156\t9\t264\t503\t370\t587\t1e-05\t42.4\n+0_13\t0_259\t29.91\t107\t66\t3\t142\t242\t200\t303\t3e-06\t44.3\n+0_13\t0_259\t35.42\t48\t31\t0\t23\t70\t23\t70\t2e-04\t38.1\n+0_13\t0_401\t29.41\t102\t65\t3\t117\t211\t798\t899\t7e-06\t43.5\n+0_13\t0_31\t30.34\t89\t53\t2\t424\t507\t282\t366\t1e-05\t42.4\n+0_13\t0_31\t30.77\t78\t47\t3\t151\t224\t287\t361\t8e-04\t36.6\n+0_13\t0_712\t37.21\t43\t27\t0\t29\t71\t36\t78\t7e-05\t40.0\n+0_13\t0_712\t26.97\t89\t58\t2\t139\t223\t207\t292\t3e-04\t38.1\n+0_13\t0_712\t24.71\t85\t63\t1\t418\t501\t208\t292\t6e-04\t37.0\n+0_13\t0_224\t23.65\t148\t107\t4\t378\t520\t162\t308\t1e-04\t39.3\n+0_13\t0_325\t24.51\t253\t135\t11\t264\t501\t357\t568\t1e-04\t39.7\n+0_13\t0_325\t24.89\t229\t143\t9\t7\t223\t357\t568\t4e-04\t37.7\n+0_13\t0_106\t43.18\t44\t25\t0\t20\t63\t28\t71\t2e-04\t39.3\n+0_13\t0_106\t26.19\t84\t55\t3\t424\t503\t624\t704\t3e-04\t38.5\n+0_13\t0_106\t30.95\t84\t51\t3\t151\t230\t629\t709\t3e-04\t38.1\n+0_14\t0_14\t100.00\t662\t0\t0\t1\t662\t1\t662\t0.0\t1321\n+0_15\t0_15\t100.00\t325\t0\t0\t1\t325\t1\t325\t0.0\t 648\n+0_16\t0_16\t100.00\t220\t0\t0\t1\t220\t1\t220\t1e-162\t 447\n+0_16\t0_17\t50.70\t213\t104\t1\t1\t213\t1\t212\t7e-73\t 219\n+0_17\t0_17\t100.00\t217\t0\t0\t1\t217\t1\t217\t4e-159\t 439\n+0_17\t0_16\t50.70\t213\t104\t1\t1\t212\t1\t213\t6e-73\t 219\n+0_18\t0_18\t100.00\t621\t0\t0\t1\t621\t1\t621\t0.0\t1241\n+0_18\t0_604\t34.90\t576\t343\t14\t63\t620\t127\t688\t1e-91\t 296\n+0_18\t0_603\t31.33\t517\t315\t11\t110\t619\t54\t537\t6e-64\t 220\n+0_18\t0_250\t23.33\t493\t274\t19\t192\t588\t113\t597\t4e-18\t82.8\n+0_18\t0_242\t27.95\t161\t93\t3\t4'..b'131\t340\t63\t306\t1e-30\t 116\n+0_797\t0_707\t37.76\t143\t88\t1\t183\t325\t274\t415\t4e-23\t94.7\n+0_797\t0_707\t40.54\t74\t44\t0\t180\t253\t345\t418\t2e-10\t56.6\n+0_797\t0_350\t46.05\t152\t77\t3\t143\t291\t172\t321\t1e-28\t 109\n+0_797\t0_350\t47.95\t73\t38\t0\t231\t303\t209\t281\t6e-16\t73.2\n+0_797\t0_350\t41.67\t84\t49\t0\t259\t342\t212\t295\t5e-12\t61.2\n+0_797\t0_236\t31.77\t192\t101\t3\t75\t266\t106\t267\t5e-19\t81.3\n+0_797\t0_236\t40.00\t75\t45\t0\t239\t313\t190\t264\t2e-12\t62.0\n+0_797\t0_20\t52.86\t70\t33\t0\t246\t315\t2\t71\t2e-18\t75.9\n+0_797\t0_20\t50.75\t67\t33\t0\t220\t286\t1\t67\t5e-15\t66.6\n+0_797\t0_20\t43.75\t64\t36\t0\t196\t259\t2\t65\t4e-12\t58.2\n+0_797\t0_20\t49.15\t59\t30\t0\t270\t328\t1\t59\t1e-11\t57.0\n+0_797\t0_20\t34.67\t75\t49\t0\t181\t255\t12\t86\t1e-09\t51.2\n+0_798\t0_798\t100.00\t73\t0\t0\t1\t73\t1\t73\t7e-50\t 150\n+0_798\t0_235\t64.00\t25\t9\t0\t3\t27\t2\t26\t3e-06\t38.5\n+0_798\t0_155\t35.71\t56\t32\t2\t7\t60\t2\t55\t1e-04\t34.3\n+0_798\t0_423\t48.57\t35\t16\t1\t1\t33\t1\t35\t2e-04\t33.1\n+0_798\t0_773\t38.64\t44\t26\t1\t3\t45\t2\t45\t6e-04\t31.6\n+0_798\t0_421\t46.88\t32\t16\t1\t3\t33\t2\t33\t0.001\t31.2\n+0_799\t0_799\t100.00\t376\t0\t0\t1\t376\t1\t376\t0.0\t 761\n+0_800\t0_800\t100.00\t112\t0\t0\t1\t112\t1\t112\t2e-78\t 225\n+0_801\t0_801\t100.00\t411\t0\t0\t1\t411\t1\t411\t0.0\t 832\n+0_802\t0_802\t100.00\t200\t0\t0\t1\t200\t1\t200\t7e-147\t 406\n+0_803\t0_803\t100.00\t300\t0\t0\t1\t300\t1\t300\t0.0\t 615\n+0_803\t0_311\t23.71\t291\t204\t6\t2\t281\t5\t288\t1e-14\t67.8\n+0_804\t0_804\t100.00\t77\t0\t0\t1\t77\t1\t77\t3e-48\t 146\n+0_805\t0_805\t100.00\t240\t0\t0\t1\t240\t1\t240\t3e-176\t 484\n+0_805\t0_197\t24.32\t148\t95\t5\t66\t205\t40\t178\t2e-06\t43.1\n+0_805\t0_170\t33.72\t86\t50\t3\t76\t157\t43\t125\t4e-05\t38.1\n+0_806\t0_806\t100.00\t358\t0\t0\t1\t358\t1\t358\t0.0\t 720\n+0_807\t0_807\t100.00\t473\t0\t0\t1\t473\t1\t473\t0.0\t 950\n+0_807\t0_109\t23.84\t432\t270\t5\t48\t467\t10\t394\t1e-36\t 135\n+0_807\t0_430\t22.28\t395\t254\t13\t94\t464\t76\t441\t4e-04\t37.4\n+0_808\t0_808\t100.00\t655\t0\t0\t1\t655\t1\t655\t0.0\t1357\n+0_808\t0_173\t46.06\t647\t326\t9\t11\t649\t2\t633\t0.0\t 552\n+0_809\t0_809\t100.00\t104\t0\t0\t1\t104\t1\t104\t2e-75\t 217\n+0_810\t0_810\t100.00\t147\t0\t0\t1\t147\t1\t147\t4e-104\t 293\n+0_811\t0_811\t100.00\t319\t0\t0\t1\t319\t1\t319\t0.0\t 653\n+0_812\t0_812\t100.00\t131\t0\t0\t1\t131\t1\t131\t1e-90\t 258\n+0_813\t0_813\t100.00\t902\t0\t0\t1\t902\t1\t902\t0.0\t1827\n+0_813\t0_453\t30.33\t755\t425\t21\t39\t730\t10\t726\t4e-80\t 275\n+0_814\t0_814\t100.00\t357\t0\t0\t1\t357\t1\t357\t0.0\t 722\n+0_814\t0_535\t29.70\t202\t133\t4\t139\t336\t18\t214\t1e-18\t79.7\n+0_814\t0_105\t26.58\t237\t150\t7\t134\t348\t51\t285\t3e-18\t80.1\n+0_814\t0_157\t30.91\t220\t133\t8\t120\t336\t3\t206\t5e-17\t74.7\n+0_814\t0_259\t26.17\t256\t126\t3\t139\t331\t21\t276\t5e-16\t72.8\n+0_814\t0_32\t28.26\t230\t145\t7\t139\t348\t113\t342\t5e-15\t70.9\n+0_814\t0_534\t25.34\t221\t141\t4\t142\t338\t25\t245\t1e-14\t68.9\n+0_814\t0_31\t29.37\t126\t83\t3\t229\t348\t251\t376\t4e-14\t68.2\n+0_814\t0_31\t27.91\t129\t80\t4\t120\t237\t37\t163\t8e-04\t35.8\n+0_814\t0_13\t23.74\t198\t139\t3\t128\t317\t10\t203\t2e-13\t66.6\n+0_814\t0_13\t24.08\t245\t152\t10\t120\t336\t263\t501\t1e-10\t57.8\n+0_814\t0_106\t32.56\t129\t73\t5\t235\t356\t605\t726\t3e-13\t65.9\n+0_814\t0_106\t32.26\t93\t62\t1\t119\t210\t9\t101\t9e-07\t45.4\n+0_814\t0_476\t24.00\t200\t140\t3\t120\t317\t4\t193\t6e-12\t59.7\n+0_814\t0_325\t29.05\t210\t131\t6\t139\t339\t371\t571\t4e-11\t58.9\n+0_814\t0_712\t26.47\t102\t74\t1\t238\t338\t193\t294\t6e-11\t58.2\n+0_814\t0_712\t38.46\t52\t29\t1\t142\t190\t28\t79\t7e-05\t39.3\n+0_814\t0_520\t30.10\t103\t71\t1\t238\t339\t454\t556\t7e-11\t58.5\n+0_814\t0_520\t34.48\t87\t51\t1\t137\t223\t58\t138\t4e-10\t56.2\n+0_814\t0_624\t25.54\t231\t120\t10\t120\t318\t1\t211\t3e-10\t56.2\n+0_814\t0_124\t30.68\t88\t55\t1\t139\t226\t26\t107\t5e-10\t55.5\n+0_814\t0_124\t30.34\t89\t61\t1\t257\t344\t229\t317\t2e-07\t47.4\n+0_814\t0_324\t25.55\t227\t146\t7\t121\t336\t365\t579\t2e-09\t53.5\n+0_814\t0_626\t28.70\t230\t136\t8\t121\t336\t370\t585\t1e-08\t51.6\n+0_814\t0_627\t27.81\t187\t118\t6\t121\t298\t354\t532\t1e-08\t51.2\n+0_814\t0_224\t28.09\t89\t63\t1\t252\t339\t204\t292\t4e-08\t49.3\n+0_814\t0_27\t32.84\t67\t44\t1\t251\t317\t105\t170\t3e-06\t43.1\n+0_815\t0_815\t100.00\t2723\t0\t0\t1\t2723\t1\t2723\t0.0\t5445\n+0_816\t0_816\t100.00\t675\t0\t0\t1\t675\t1\t675\t0.0\t1368\n+0_816\t0_210\t27.33\t150\t93\t6\t236\t380\t106\t244\t9e-08\t49.3\n+0_816\t0_217\t27.52\t109\t64\t2\t197\t305\t10\t103\t4e-05\t41.2\n+0_817\t0_817\t100.00\t286\t0\t0\t1\t286\t1\t286\t0.0\t 583\n+0_818\t0_818\t100.00\t188\t0\t0\t1\t188\t1\t188\t1e-134\t 374\n+0_819\t0_819\t100.00\t756\t0\t0\t1\t756\t1\t756\t0.0\t1533\n+0_819\t0_208\t34.65\t228\t116\t8\t314\t518\t279\t496\t1e-16\t78.6\n+0_819\t0_205\t42.86\t70\t40\t0\t671\t740\t43\t112\t8e-11\t56.6\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast0_1.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast0_1.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1292 @@\n+0_0\t1_2\t29.27\t328\t217\t8\t126\t445\t127\t447\t4e-37\t 137\n+0_1\t1_762\t28.95\t152\t95\t8\t58\t198\t56\t205\t5e-05\t39.7\n+0_2\t1_226\t27.09\t251\t169\t8\t16\t259\t24\t267\t7e-23\t90.5\n+0_2\t1_347\t32.90\t231\t135\t10\t20\t241\t21\t240\t5e-22\t87.8\n+0_2\t1_650\t27.41\t270\t170\t10\t9\t260\t47\t308\t8e-16\t70.9\n+0_3\t1_226\t24.33\t263\t163\t7\t16\t261\t24\t267\t1e-22\t90.1\n+0_3\t1_347\t30.00\t250\t159\t6\t20\t263\t21\t260\t2e-21\t86.7\n+0_3\t1_650\t26.20\t271\t174\t9\t12\t265\t50\t311\t2e-18\t78.2\n+0_5\t1_503\t30.42\t309\t204\t6\t21\t328\t17\t315\t3e-38\t 136\n+0_6\t1_503\t30.34\t323\t215\t5\t21\t343\t17\t329\t2e-40\t 142\n+0_11\t1_630\t22.25\t346\t196\t14\t32\t328\t4\t325\t1e-05\t42.7\n+0_13\t1_619\t44.70\t557\t255\t9\t3\t521\t4\t545\t2e-145\t 429\n+0_13\t1_619\t23.87\t243\t169\t7\t20\t249\t312\t551\t7e-09\t52.8\n+0_13\t1_101\t32.86\t213\t121\t4\t20\t226\t20\t216\t2e-24\t98.2\n+0_13\t1_101\t26.25\t80\t59\t0\t423\t502\t135\t214\t5e-04\t36.6\n+0_13\t1_395\t30.63\t271\t165\t8\t23\t283\t25\t282\t1e-19\t85.1\n+0_13\t1_395\t31.33\t83\t50\t2\t424\t502\t138\t217\t3e-06\t44.3\n+0_13\t1_301\t27.61\t268\t152\t11\t20\t260\t30\t282\t1e-14\t70.5\n+0_13\t1_301\t22.40\t250\t141\t8\t272\t507\t24\t234\t3e-07\t47.4\n+0_13\t1_608\t24.88\t213\t148\t4\t21\t224\t41\t250\t4e-13\t65.1\n+0_13\t1_608\t20.87\t254\t181\t6\t266\t515\t27\t264\t8e-07\t45.8\n+0_13\t1_609\t23.90\t205\t141\t4\t24\t224\t26\t219\t4e-12\t62.0\n+0_13\t1_609\t34.92\t63\t41\t0\t259\t321\t3\t65\t2e-06\t44.3\n+0_13\t1_385\t27.60\t221\t131\t8\t21\t228\t373\t577\t4e-12\t63.2\n+0_13\t1_385\t24.90\t261\t139\t11\t259\t503\t353\t572\t1e-08\t52.0\n+0_13\t1_234\t23.41\t205\t154\t2\t23\t224\t25\t229\t4e-11\t58.2\n+0_13\t1_234\t25.29\t261\t161\t9\t264\t515\t7\t242\t2e-10\t56.2\n+0_13\t1_261\t24.65\t288\t162\t12\t268\t515\t12\t284\t5e-11\t59.3\n+0_13\t1_261\t24.00\t175\t108\t7\t139\t308\t191\t345\t7e-04\t37.0\n+0_13\t1_270\t22.28\t202\t147\t3\t24\t224\t19\t211\t1e-10\t56.6\n+0_13\t1_270\t22.69\t238\t156\t5\t272\t509\t9\t218\t1e-09\t53.5\n+0_13\t1_543\t25.46\t216\t138\t6\t26\t224\t83\t292\t6e-10\t55.8\n+0_13\t1_543\t22.09\t249\t166\t9\t264\t503\t64\t293\t1e-05\t42.0\n+0_13\t1_21\t23.48\t230\t149\t7\t4\t221\t263\t477\t1e-09\t55.1\n+0_13\t1_21\t21.86\t247\t162\t8\t260\t501\t261\t481\t4e-06\t44.3\n+0_13\t1_33\t31.96\t97\t63\t1\t6\t102\t31\t124\t2e-09\t54.7\n+0_13\t1_33\t33.90\t59\t39\t0\t276\t334\t43\t101\t4e-05\t40.8\n+0_13\t1_33\t28.57\t98\t55\t3\t138\t226\t356\t447\t8e-05\t40.0\n+0_13\t1_40\t24.30\t214\t139\t6\t24\t224\t96\t299\t3e-09\t53.5\n+0_13\t1_40\t24.10\t83\t62\t1\t421\t503\t219\t300\t8e-05\t39.7\n+0_13\t1_491\t29.09\t110\t66\t3\t1\t105\t1\t103\t2e-06\t45.1\n+0_13\t1_491\t25.00\t100\t73\t2\t414\t511\t275\t374\t8e-05\t40.0\n+0_13\t1_491\t29.23\t65\t46\t0\t263\t327\t6\t70\t3e-04\t38.1\n+0_13\t1_4\t33.33\t66\t41\t1\t4\t66\t166\t231\t4e-06\t43.5\n+0_13\t1_535\t32.88\t73\t46\t1\t21\t93\t39\t108\t6e-06\t43.9\n+0_13\t1_535\t30.12\t83\t55\t2\t151\t231\t686\t767\t2e-05\t42.0\n+0_13\t1_535\t23.91\t92\t63\t3\t416\t503\t673\t761\t4e-05\t41.2\n+0_13\t1_542\t30.23\t86\t51\t2\t424\t504\t295\t376\t1e-05\t42.7\n+0_13\t1_542\t28.43\t102\t57\t4\t127\t224\t285\t374\t1e-04\t39.3\n+0_13\t1_86\t28.71\t101\t65\t3\t119\t213\t808\t907\t4e-05\t41.2\n+0_13\t1_384\t31.65\t79\t51\t3\t153\t231\t89\t164\t1e-04\t38.5\n+0_14\t1_618\t27.19\t342\t218\t11\t90\t415\t81\t407\t3e-24\t 102\n+0_15\t1_617\t34.37\t323\t186\t8\t9\t325\t8\t310\t6e-40\t 140\n+0_15\t1_618\t25.11\t231\t143\t8\t14\t228\t75\t291\t0.001\t35.4\n+0_16\t1_512\t49.77\t213\t107\t0\t1\t213\t1\t213\t1e-73\t 221\n+0_16\t1_513\t43.13\t211\t112\t2\t1\t211\t1\t203\t1e-57\t 180\n+0_17\t1_512\t41.67\t216\t119\t2\t1\t212\t1\t213\t2e-57\t 180\n+0_17\t1_513\t39.15\t212\t122\t2\t1\t212\t1\t205\t3e-43\t 143\n+0_25\t1_267\t21.88\t256\t198\t2\t17\t271\t26\t280\t4e-16\t71.2\n+0_25\t1_579\t21.76\t262\t186\t6\t8\t256\t11\t266\t3e-08\t48.9\n+0_27\t1_101\t54.64\t194\t85\t2\t1\t193\t25\t216\t5e-70\t 215\n+0_27\t1_395\t45.19\t208\t110\t3\t1\t206\t27\t232\t1e-60\t 194\n+0_27\t1_301\t30.48\t269\t176\t8\t1\t261\t35\t300\t1e-26\t 102\n+0_27\t1_619\t26.00\t200\t140\t4\t1\t193\t28\t226\t5e-18\t79.0\n+0_27\t1_619\t21.72\t221\t152\t6\t1\t201\t317\t536\t4e-07\t45.8\n+0_27\t1_608\t25.94\t212\t138\t3\t1\t195\t45\t254\t5e-17\t74.7\n+0_27\t1_609\t23.79\t248\t180\t5\t1\t243\t27\t270\t2e-13\t63.9\n+0_27\t1_491\t29.37\t143\t97\t3\t56\t197\t231\t370\t3e-12\t61.2\n+0_27\t1_491\t26.83\t82\t58\t1\t1\t80\t26\t107\t2e-06\t43.1\n+0_27\t1_535\t27.42\t124\t89\t1\t87\t209\t655\t778\t4e-12\t61.2\n+0_27\t1_40\t24.23\t227\t148\t7\t1\t209\t97\t317\t3e-10\t55.1\n+0_27\t1_33\t28.70\t108\t73\t3\t105\t209\t356\t462\t3e-09\t52.4\n+0_27\t1_33\t36.11\t72\t38\t2\t1\t64\t50\t121\t2e-08\t49.7\n+0_27\t1_542\t29.01\t131\t90\t2\t80\t209\t264\t392\t5e-09\t51.6\n+0_27\t1_542\t48.78\t41\t21\t0\t1\t41\t71\t111\t1e-06\t43.9\n+0_27\t1_21\t26.44\t174\t118\t5\t1\t167\t288\t458\t8e-09\t50.8\n+0_27\t1_'..b'_790\t1_421\t34.62\t182\t118\t1\t5\t185\t107\t288\t1e-30\t 110\n+0_791\t1_422\t28.63\t241\t153\t8\t14\t236\t176\t415\t2e-17\t76.6\n+0_792\t1_423\t31.78\t236\t139\t7\t24\t246\t31\t257\t7e-28\t 104\n+0_793\t1_424\t34.62\t78\t50\t1\t5\t81\t4\t81\t2e-09\t47.0\n+0_794\t1_160\t38.39\t435\t258\t4\t6\t432\t4\t436\t2e-103\t 314\n+0_794\t1_160\t29.94\t177\t110\t5\t172\t346\t2\t166\t2e-11\t60.5\n+0_794\t1_755\t37.78\t135\t80\t2\t168\t301\t218\t349\t7e-21\t89.7\n+0_794\t1_755\t35.54\t121\t75\t3\t6\t124\t224\t343\t1e-13\t67.4\n+0_794\t1_654\t31.37\t102\t62\t4\t168\t269\t111\t204\t1e-07\t47.8\n+0_794\t1_654\t33.87\t62\t38\t1\t6\t67\t117\t175\t2e-05\t40.8\n+0_794\t1_583\t28.26\t92\t62\t2\t250\t341\t92\t179\t1e-04\t38.9\n+0_794\t1_113\t23.37\t184\t114\t7\t5\t171\t122\t295\t2e-04\t38.5\n+0_794\t1_599\t28.68\t129\t88\t3\t3\t129\t19\t145\t4e-04\t36.2\n+0_794\t1_412\t27.61\t134\t89\t4\t1\t129\t1\t131\t5e-04\t36.6\n+0_794\t1_412\t24.55\t167\t119\t4\t176\t340\t9\t170\t9e-04\t35.8\n+0_795\t1_161\t38.77\t227\t125\t8\t1\t221\t1\t219\t1e-41\t 139\n+0_795\t1_86\t23.81\t126\t84\t4\t102\t216\t332\t456\t1e-04\t37.4\n+0_799\t1_150\t32.63\t377\t221\t10\t2\t355\t3\t369\t2e-50\t 172\n+0_799\t1_155\t49.53\t107\t46\t3\t2\t106\t3\t103\t4e-27\t 100\n+0_799\t1_348\t45.79\t107\t49\t4\t4\t104\t12\t115\t3e-19\t84.7\n+0_799\t1_348\t24.49\t196\t126\t6\t132\t324\t856\t1032\t2e-07\t47.8\n+0_799\t1_75\t44.79\t96\t52\t1\t4\t98\t8\t103\t2e-17\t78.2\n+0_799\t1_75\t37.88\t66\t40\t1\t4\t69\t143\t207\t1e-04\t38.5\n+0_799\t1_298\t47.62\t63\t33\t0\t5\t67\t8\t70\t8e-14\t67.4\n+0_799\t1_298\t34.25\t73\t48\t0\t3\t75\t94\t166\t1e-09\t54.3\n+0_799\t1_761\t48.33\t60\t29\t1\t7\t66\t4\t61\t1e-11\t60.1\n+0_799\t1_300\t44.23\t52\t29\t0\t7\t58\t244\t295\t9e-10\t54.3\n+0_800\t1_114\t38.18\t110\t66\t1\t5\t112\t4\t113\t2e-16\t67.0\n+0_801\t1_305\t41.85\t411\t226\t6\t1\t403\t1\t406\t1e-101\t 308\n+0_802\t1_381\t26.32\t95\t64\t2\t88\t176\t43\t137\t1e-04\t37.4\n+0_803\t1_324\t24.41\t295\t197\t10\t2\t279\t8\t293\t8e-16\t71.2\n+0_803\t1_242\t26.32\t304\t173\t12\t2\t275\t3\t285\t7e-15\t68.6\n+0_804\t1_240\t36.59\t41\t26\t0\t28\t68\t28\t68\t4e-05\t33.5\n+0_805\t1_138\t28.16\t206\t141\t2\t32\t235\t69\t269\t2e-21\t85.9\n+0_806\t1_137\t47.89\t355\t178\t6\t3\t354\t5\t355\t9e-103\t 306\n+0_807\t1_655\t27.55\t421\t274\t9\t65\t471\t25\t428\t2e-54\t 186\n+0_808\t1_760\t52.38\t651\t300\t6\t11\t655\t2\t648\t0.0\t 680\n+0_808\t1_439\t45.54\t639\t331\t7\t16\t649\t3\t629\t6e-180\t 525\n+0_809\t1_665\t36.84\t76\t47\t1\t26\t100\t24\t99\t2e-16\t66.2\n+0_810\t1_465\t38.89\t144\t83\t3\t1\t141\t1\t142\t4e-23\t86.3\n+0_813\t1_253\t31.14\t713\t436\t15\t40\t719\t7\t697\t3e-78\t 270\n+0_814\t1_21\t48.91\t229\t117\t0\t117\t345\t262\t490\t3e-74\t 237\n+0_814\t1_270\t32.42\t182\t117\t3\t138\t318\t15\t191\t5e-28\t 105\n+0_814\t1_234\t27.92\t197\t132\t4\t142\t329\t26\t221\t1e-22\t90.9\n+0_814\t1_301\t29.56\t203\t132\t3\t138\t335\t30\t226\t4e-21\t87.8\n+0_814\t1_609\t30.36\t224\t141\t6\t120\t338\t7\t220\t7e-20\t83.2\n+0_814\t1_543\t29.79\t235\t137\t8\t138\t348\t77\t307\t2e-18\t80.9\n+0_814\t1_40\t27.16\t232\t145\t10\t120\t336\t76\t298\t4e-17\t76.3\n+0_814\t1_619\t24.12\t199\t139\t3\t143\t334\t28\t221\t4e-16\t74.3\n+0_814\t1_619\t23.47\t213\t126\t7\t143\t329\t317\t518\t4e-10\t55.8\n+0_814\t1_101\t26.67\t210\t125\t7\t120\t318\t3\t194\t2e-14\t67.0\n+0_814\t1_542\t32.38\t105\t66\t2\t249\t348\t285\t389\t3e-14\t68.6\n+0_814\t1_542\t27.59\t87\t51\t1\t115\t189\t31\t117\t8e-04\t35.8\n+0_814\t1_535\t35.09\t114\t65\t4\t250\t356\t672\t783\t6e-14\t68.2\n+0_814\t1_536\t33.06\t121\t76\t2\t233\t348\t201\t321\t1e-13\t67.0\n+0_814\t1_608\t27.49\t211\t136\t5\t140\t336\t42\t249\t2e-13\t65.5\n+0_814\t1_491\t37.93\t87\t53\t1\t254\t339\t280\t366\t9e-13\t63.9\n+0_814\t1_491\t26.85\t108\t70\t3\t119\t226\t5\t103\t1e-09\t54.3\n+0_814\t1_385\t25.38\t264\t153\t10\t91\t336\t333\t570\t1e-12\t63.9\n+0_814\t1_33\t31.37\t102\t69\t1\t239\t339\t344\t445\t3e-12\t62.8\n+0_814\t1_33\t33.70\t92\t55\t1\t137\t228\t44\t129\t9e-11\t57.8\n+0_814\t1_5\t27.96\t211\t128\t7\t138\t336\t406\t604\t2e-11\t59.7\n+0_814\t1_395\t23.04\t230\t145\t7\t120\t336\t6\t216\t9e-11\t57.4\n+0_814\t1_261\t23.25\t271\t129\t7\t139\t340\t20\t280\t1e-10\t57.4\n+0_814\t1_293\t24.77\t214\t139\t7\t138\t336\t17\t223\t9e-09\t50.8\n+0_814\t1_384\t30.61\t98\t66\t2\t247\t344\t70\t165\t3e-08\t48.1\n+0_814\t1_86\t28.95\t76\t50\t2\t257\t329\t836\t910\t2e-04\t38.1\n+0_815\t1_20\t26.01\t469\t315\t8\t1692\t2138\t373\t831\t3e-41\t 162\n+0_815\t1_20\t24.63\t402\t254\t10\t2337\t2715\t978\t1353\t3e-22\t 100\n+0_815\t1_20\t27.39\t157\t105\t4\t2570\t2721\t487\t639\t1e-04\t42.0\n+0_816\t1_25\t54.04\t483\t208\t3\t172\t645\t239\t716\t9e-165\t 491\n+0_816\t1_715\t28.99\t169\t102\t7\t235\t393\t100\t260\t1e-06\t45.8\n+0_816\t1_551\t28.72\t94\t58\t2\t230\t322\t40\t125\t2e-06\t45.1\n+0_817\t1_701\t34.39\t285\t172\t6\t3\t284\t10\t282\t4e-38\t 134\n+0_818\t1_700\t45.90\t183\t97\t1\t1\t181\t1\t183\t2e-53\t 167\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast0_2.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast0_2.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1018 @@\n+0_0\t2_474\t27.54\t334\t229\t10\t117\t445\t98\t423\t1e-38\t 141\n+0_1\t2_0\t23.60\t394\t261\t14\t1\t368\t1\t380\t3e-10\t55.5\n+0_2\t2_350\t24.80\t246\t173\t4\t19\t260\t28\t265\t3e-20\t82.0\n+0_2\t2_332\t24.17\t240\t170\t6\t7\t241\t10\t242\t1e-13\t63.5\n+0_2\t2_314\t21.31\t244\t187\t4\t21\t260\t23\t265\t1e-12\t60.8\n+0_3\t2_332\t28.89\t270\t168\t8\t2\t262\t7\t261\t4e-21\t85.1\n+0_3\t2_350\t29.12\t261\t155\t10\t19\t267\t28\t270\t5e-21\t84.7\n+0_3\t2_314\t22.00\t250\t176\t5\t21\t260\t23\t263\t1e-13\t63.9\n+0_5\t2_274\t26.26\t297\t203\t9\t21\t312\t18\t303\t6e-27\t 103\n+0_6\t2_274\t30.09\t329\t212\t10\t21\t343\t18\t334\t9e-37\t 132\n+0_13\t2_119\t42.58\t573\t255\t7\t6\t519\t5\t562\t7e-141\t 417\n+0_13\t2_119\t26.91\t249\t148\t6\t262\t502\t2\t224\t2e-12\t63.2\n+0_13\t2_180\t28.32\t226\t145\t4\t4\t224\t6\t219\t1e-18\t80.9\n+0_13\t2_180\t24.05\t237\t144\t8\t280\t511\t24\t229\t3e-12\t61.6\n+0_13\t2_181\t27.83\t212\t141\t4\t19\t224\t34\t239\t4e-16\t73.6\n+0_13\t2_181\t23.33\t240\t153\t9\t269\t502\t25\t239\t4e-09\t52.4\n+0_13\t2_188\t31.31\t99\t65\t1\t6\t104\t7\t102\t2e-10\t57.4\n+0_13\t2_188\t28.81\t59\t42\t0\t276\t334\t19\t77\t1e-04\t38.9\n+0_13\t2_188\t27.84\t97\t55\t3\t139\t226\t361\t451\t1e-04\t38.9\n+0_13\t2_14\t26.12\t268\t148\t12\t250\t504\t337\t567\t2e-10\t57.4\n+0_13\t2_14\t27.10\t214\t123\t8\t25\t224\t371\t565\t9e-09\t52.0\n+0_13\t2_308\t27.05\t207\t137\t7\t23\t227\t20\t214\t2e-10\t56.2\n+0_13\t2_64\t23.65\t203\t142\t3\t25\t223\t255\t448\t3e-10\t56.2\n+0_13\t2_64\t21.83\t252\t163\t6\t259\t504\t228\t451\t5e-07\t46.2\n+0_13\t2_419\t25.47\t212\t139\t8\t24\t224\t101\t304\t4e-10\t55.8\n+0_13\t2_419\t19.37\t284\t162\t8\t245\t503\t64\t305\t5e-08\t48.9\n+0_13\t2_471\t20.38\t211\t145\t6\t24\t225\t107\t303\t4e-10\t55.5\n+0_13\t2_471\t20.92\t239\t161\t7\t266\t502\t90\t302\t3e-07\t46.6\n+0_13\t2_39\t29.66\t118\t65\t4\t1\t110\t1\t108\t1e-08\t51.6\n+0_13\t2_39\t29.07\t86\t60\t1\t418\t502\t342\t427\t7e-08\t49.3\n+0_13\t2_39\t42.00\t50\t29\t0\t278\t327\t21\t70\t6e-07\t46.2\n+0_13\t2_39\t26.54\t162\t101\t5\t88\t232\t281\t441\t1e-05\t42.0\n+0_13\t2_473\t24.78\t226\t131\t7\t283\t502\t75\t267\t3e-08\t49.3\n+0_13\t2_473\t21.70\t235\t159\t7\t4\t227\t50\t270\t4e-08\t48.9\n+0_13\t2_13\t26.83\t164\t105\t6\t24\t176\t385\t544\t6e-08\t49.3\n+0_13\t2_307\t25.61\t246\t146\t9\t266\t502\t74\t291\t3e-06\t43.5\n+0_13\t2_307\t23.04\t204\t140\t7\t29\t224\t97\t291\t5e-06\t42.7\n+0_13\t2_78\t24.00\t250\t135\t9\t25\t224\t44\t288\t5e-06\t42.7\n+0_13\t2_78\t25.56\t90\t58\t2\t419\t503\t204\t289\t5e-04\t36.6\n+0_13\t2_79\t36.00\t75\t42\t2\t19\t88\t27\t100\t3e-05\t40.8\n+0_13\t2_293\t22.02\t218\t148\t5\t1\t206\t1\t208\t5e-05\t39.3\n+0_13\t2_427\t32.31\t65\t40\t2\t152\t213\t844\t907\t6e-04\t36.6\n+0_14\t2_120\t28.28\t343\t201\t14\t90\t412\t86\t403\t2e-20\t89.4\n+0_15\t2_121\t33.33\t324\t183\t11\t10\t325\t8\t306\t8e-38\t 134\n+0_15\t2_120\t23.56\t208\t141\t5\t20\t218\t89\t287\t2e-05\t40.4\n+0_16\t2_272\t30.30\t198\t123\t5\t2\t194\t16\t203\t6e-22\t85.9\n+0_17\t2_272\t29.74\t195\t125\t5\t3\t193\t17\t203\t8e-21\t82.4\n+0_25\t2_269\t23.32\t283\t185\t10\t9\t274\t6\t273\t5e-08\t47.4\n+0_25\t2_125\t25.78\t256\t164\t10\t22\t260\t19\t265\t9e-07\t43.5\n+0_27\t2_181\t25.37\t205\t140\t2\t2\t195\t41\t243\t2e-20\t83.6\n+0_27\t2_119\t29.76\t205\t128\t6\t1\t193\t26\t226\t2e-19\t82.8\n+0_27\t2_180\t29.21\t202\t129\t7\t1\t194\t27\t222\t1e-15\t69.3\n+0_27\t2_307\t30.50\t200\t117\t7\t15\t199\t107\t299\t7e-13\t62.4\n+0_27\t2_14\t23.74\t219\t145\t6\t1\t206\t371\t580\t5e-12\t60.1\n+0_27\t2_308\t29.56\t203\t118\t11\t1\t191\t22\t211\t2e-11\t57.4\n+0_27\t2_188\t28.66\t157\t94\t6\t106\t259\t361\t502\t2e-11\t58.2\n+0_27\t2_188\t30.51\t59\t40\t1\t1\t58\t26\t84\t1e-04\t37.4\n+0_27\t2_39\t34.07\t91\t59\t1\t110\t199\t345\t435\t1e-10\t55.8\n+0_27\t2_39\t37.50\t64\t36\t1\t1\t64\t26\t85\t8e-09\t50.4\n+0_27\t2_78\t22.92\t253\t141\t7\t1\t199\t44\t296\t2e-10\t55.1\n+0_27\t2_471\t24.00\t200\t138\t5\t1\t191\t108\t302\t7e-10\t53.1\n+0_27\t2_79\t24.59\t122\t91\t1\t79\t199\t651\t772\t1e-09\t53.1\n+0_27\t2_293\t25.00\t196\t122\t6\t1\t178\t25\t213\t1e-08\t48.9\n+0_27\t2_419\t21.05\t209\t149\t7\t1\t195\t102\t308\t2e-08\t48.5\n+0_27\t2_64\t25.85\t147\t99\t3\t5\t144\t259\t402\t4e-06\t42.0\n+0_27\t2_473\t28.57\t175\t104\t7\t8\t170\t82\t247\t8e-06\t40.4\n+0_27\t2_13\t24.00\t175\t101\t4\t1\t151\t386\t552\t1e-05\t40.4\n+0_31\t2_79\t56.92\t130\t56\t0\t261\t390\t664\t793\t2e-43\t 158\n+0_31\t2_79\t34.43\t122\t72\t2\t34\t155\t7\t120\t4e-17\t78.2\n+0_31\t2_78\t29.49\t373\t189\t10\t35\t399\t19\t325\t2e-37\t 136\n+0_31\t2_39\t31.07\t177\t100\t5\t217\t373\t265\t439\t2e-19\t84.7\n+0_31\t2_39\t33.33\t66\t41\t1\t35\t100\t4\t66\t4e-07\t46.2\n+0_31\t2_188\t34.86\t109\t71\t0\t274\t382\t360\t468\t2e-18\t81.6\n+0_31\t2_188\t31.15\t61\t38\t1\t38\t98\t8\t64\t6e-05\t39.3\n+0_31\t2_471\t39.33\t89\t53\t1\t274\t362\t216\t303\t2e-17\t77.0\n+0_31\t2_419\t35.45\t110\t69\t1\t275\t384\t220\t327\t4e-15\t70.5\n+0_31\t2_419\t'..b'\n+0_754\t2_334\t30.08\t123\t74\t3\t117\t227\t183\t305\t2e-05\t41.2\n+0_754\t2_339\t26.40\t125\t73\t6\t113\t223\t21\t140\t0.001\t35.0\n+0_756\t2_140\t25.38\t331\t204\t12\t75\t393\t91\t390\t2e-16\t76.3\n+0_758\t2_31\t46.63\t178\t89\t4\t8\t180\t13\t189\t1e-41\t 137\n+0_759\t2_400\t49.18\t305\t154\t1\t148\t452\t136\t439\t3e-94\t 290\n+0_760\t2_97\t35.38\t65\t34\t2\t53\t113\t91\t151\t4e-05\t39.3\n+0_782\t2_138\t38.95\t552\t329\t4\t3\t550\t15\t562\t2e-122\t 372\n+0_782\t2_429\t22.38\t496\t356\t11\t1\t483\t1\t480\t2e-26\t 107\n+0_784\t2_374\t37.89\t95\t55\t3\t676\t768\t569\t661\t5e-10\t57.0\n+0_784\t2_374\t34.69\t98\t58\t3\t447\t539\t439\t535\t2e-09\t55.5\n+0_786\t2_99\t38.64\t484\t269\t9\t1\t469\t1\t471\t1e-99\t 306\n+0_787\t2_98\t38.79\t428\t239\t10\t27\t432\t46\t472\t1e-83\t 263\n+0_788\t2_97\t26.67\t90\t62\t2\t5\t94\t390\t475\t3e-06\t38.9\n+0_789\t2_208\t27.24\t257\t170\t8\t30\t272\t27\t280\t8e-18\t76.3\n+0_789\t2_378\t25.68\t296\t185\t13\t2\t267\t5\t295\t1e-14\t67.4\n+0_790\t2_216\t34.97\t163\t105\t1\t8\t169\t27\t189\t7e-30\t 106\n+0_791\t2_215\t31.52\t92\t62\t1\t7\t97\t143\t234\t6e-06\t40.8\n+0_792\t2_214\t29.50\t261\t160\t6\t2\t246\t11\t263\t2e-31\t 113\n+0_793\t2_213\t32.50\t80\t49\t3\t6\t81\t5\t83\t2e-09\t45.8\n+0_794\t2_334\t37.53\t437\t262\t4\t6\t432\t4\t439\t1e-98\t 301\n+0_794\t2_334\t30.77\t182\t110\t6\t172\t349\t2\t171\t9e-14\t67.0\n+0_794\t2_7\t35.10\t208\t109\t8\t172\t363\t218\t415\t1e-19\t85.1\n+0_794\t2_7\t37.93\t87\t54\t0\t6\t92\t220\t306\t5e-12\t61.6\n+0_794\t2_339\t30.16\t126\t78\t4\t6\t126\t23\t143\t3e-08\t48.1\n+0_794\t2_142\t25.00\t168\t102\t6\t5\t158\t124\t281\t1e-05\t41.6\n+0_794\t2_142\t25.70\t179\t107\t8\t174\t344\t125\t285\t6e-05\t39.3\n+0_794\t2_447\t45.95\t37\t20\t0\t172\t208\t117\t153\t3e-05\t39.7\n+0_794\t2_447\t35.94\t64\t34\t2\t6\t67\t119\t177\t4e-05\t39.3\n+0_794\t2_396\t29.27\t82\t57\t1\t172\t252\t4\t85\t2e-04\t37.4\n+0_795\t2_335\t33.94\t221\t126\t6\t7\t219\t5\t213\t3e-34\t 119\n+0_799\t2_16\t31.02\t374\t229\t10\t4\t357\t6\t370\t7e-46\t 159\n+0_799\t2_199\t45.65\t92\t47\t2\t4\t94\t6\t95\t7e-17\t76.6\n+0_799\t2_1\t50.00\t60\t28\t1\t7\t66\t4\t61\t1e-11\t59.3\n+0_800\t2_143\t35.24\t105\t66\t1\t9\t111\t8\t112\t3e-11\t51.6\n+0_801\t2_459\t31.88\t414\t255\t8\t2\t411\t4\t394\t2e-67\t 217\n+0_803\t2_331\t21.82\t307\t194\t12\t2\t279\t3\t292\t3e-09\t51.2\n+0_803\t2_454\t24.88\t209\t135\t10\t1\t194\t1\t202\t8e-06\t40.8\n+0_804\t2_291\t37.50\t40\t25\t0\t29\t68\t32\t71\t2e-04\t31.2\n+0_805\t2_262\t35.44\t158\t95\t3\t33\t189\t69\t220\t6e-23\t91.7\n+0_806\t2_261\t43.54\t356\t194\t6\t1\t353\t3\t354\t6e-97\t 291\n+0_807\t2_448\t28.23\t418\t246\t12\t63\t470\t21\t394\t5e-53\t 181\n+0_807\t2_438\t28.40\t405\t247\t10\t67\t467\t17\t382\t3e-42\t 150\n+0_808\t2_2\t50.23\t653\t314\t6\t10\t655\t2\t650\t0.0\t 663\n+0_808\t2_202\t43.75\t640\t341\t8\t16\t649\t3\t629\t1e-180\t 526\n+0_809\t2_124\t32.39\t71\t41\t2\t26\t92\t25\t92\t9e-12\t52.8\n+0_810\t2_58\t40.44\t136\t76\t3\t1\t133\t1\t134\t3e-20\t78.2\n+0_813\t2_70\t28.95\t708\t418\t19\t45\t714\t9\t669\t3e-71\t 248\n+0_814\t2_64\t44.83\t232\t128\t0\t120\t351\t232\t463\t9e-64\t 208\n+0_814\t2_471\t37.89\t227\t139\t1\t112\t336\t75\t301\t4e-51\t 170\n+0_814\t2_473\t36.93\t287\t170\t5\t70\t353\t5\t283\t4e-48\t 162\n+0_814\t2_180\t28.57\t210\t128\t6\t139\t338\t23\t220\t1e-20\t84.7\n+0_814\t2_419\t28.57\t259\t154\t12\t96\t336\t58\t303\t3e-20\t84.3\n+0_814\t2_181\t29.86\t211\t133\t8\t138\t338\t35\t240\t9e-18\t77.4\n+0_814\t2_119\t27.54\t207\t135\t6\t119\t317\t4\t203\t8e-17\t75.9\n+0_814\t2_119\t23.44\t209\t141\t8\t143\t336\t340\t544\t3e-09\t52.4\n+0_814\t2_79\t33.93\t112\t69\t2\t250\t356\t676\t787\t3e-15\t71.6\n+0_814\t2_78\t31.93\t119\t76\t2\t235\t348\t185\t303\t2e-14\t68.6\n+0_814\t2_39\t33.61\t119\t71\t4\t230\t346\t321\t433\t2e-13\t65.1\n+0_814\t2_39\t28.04\t107\t68\t3\t120\t226\t6\t103\t4e-11\t58.5\n+0_814\t2_308\t26.25\t240\t158\t9\t120\t354\t1\t226\t7e-13\t62.4\n+0_814\t2_293\t27.89\t190\t123\t4\t139\t318\t21\t206\t2e-12\t60.8\n+0_814\t2_307\t25.46\t216\t147\t9\t130\t336\t80\t290\t3e-12\t61.2\n+0_814\t2_13\t27.17\t173\t104\t6\t140\t295\t383\t550\t4e-10\t55.1\n+0_814\t2_188\t29.70\t101\t70\t1\t240\t339\t349\t449\t5e-10\t55.1\n+0_814\t2_188\t27.91\t86\t48\t2\t142\t223\t25\t100\t7e-08\t48.1\n+0_814\t2_14\t22.12\t208\t140\t6\t140\t336\t368\t564\t8e-09\t51.2\n+0_814\t2_427\t32.43\t74\t46\t2\t259\t329\t838\t910\t5e-04\t36.2\n+0_815\t2_63\t27.84\t431\t277\t13\t1634\t2044\t288\t704\t3e-29\t 122\n+0_815\t2_63\t24.58\t419\t270\t12\t2307\t2715\t941\t1323\t1e-14\t74.7\n+0_815\t2_472\t21.66\t434\t299\t11\t1640\t2049\t723\t1139\t3e-14\t73.6\n+0_815\t2_472\t20.75\t482\t301\t15\t2289\t2722\t1334\t1782\t7e-09\t55.5\n+0_816\t2_461\t52.73\t550\t239\t7\t110\t647\t135\t675\t3e-168\t 498\n+0_816\t2_366\t23.98\t221\t137\t7\t191\t401\t4\t203\t2e-05\t41.2\n+0_817\t2_83\t33.33\t288\t179\t6\t3\t286\t8\t286\t1e-42\t 145\n+0_818\t2_82\t34.76\t164\t104\t2\t2\t162\t5\t168\t9e-32\t 110\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast0_3.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast0_3.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1528 @@\n+0_0\t3_0\t33.88\t425\t257\t11\t28\t441\t23\t434\t5e-64\t 212\n+0_1\t3_1\t27.34\t384\t248\t12\t1\t364\t1\t373\t6e-30\t 114\n+0_2\t3_130\t38.55\t262\t152\t5\t7\t261\t13\t272\t4e-53\t 172\n+0_2\t3_246\t29.36\t109\t70\t5\t12\t119\t19\t121\t4e-07\t44.7\n+0_3\t3_130\t36.19\t268\t164\t4\t2\t264\t8\t273\t1e-54\t 176\n+0_3\t3_246\t33.93\t112\t67\t5\t9\t119\t16\t121\t8e-10\t53.1\n+0_4\t3_301\t47.68\t388\t197\t4\t6\t391\t4\t387\t9e-124\t 362\n+0_5\t3_302\t51.31\t343\t167\t0\t1\t343\t1\t343\t9e-129\t 372\n+0_5\t3_247\t32.34\t269\t152\t9\t72\t328\t67\t317\t4e-26\t 102\n+0_6\t3_302\t55.10\t343\t154\t0\t1\t343\t1\t343\t3e-136\t 390\n+0_6\t3_247\t29.79\t235\t138\t7\t72\t296\t67\t284\t2e-23\t93.6\n+0_7\t3_303\t54.51\t277\t126\t0\t4\t280\t9\t285\t6e-112\t 324\n+0_8\t3_304\t39.47\t114\t65\t2\t1\t114\t1\t110\t1e-26\t93.2\n+0_10\t3_602\t22.41\t116\t89\t1\t153\t267\t147\t262\t6e-05\t38.1\n+0_11\t3_604\t28.51\t449\t260\t17\t2\t425\t3\t415\t4e-37\t 137\n+0_13\t3_605\t49.05\t524\t241\t7\t1\t520\t2\t503\t5e-163\t 473\n+0_13\t3_508\t31.43\t509\t321\t8\t1\t501\t1\t489\t2e-61\t 208\n+0_13\t3_508\t27.51\t229\t153\t6\t24\t243\t285\t509\t6e-11\t59.3\n+0_13\t3_226\t28.95\t487\t309\t9\t25\t501\t1\t460\t2e-58\t 199\n+0_13\t3_226\t24.30\t251\t150\t10\t283\t521\t1\t223\t5e-08\t50.1\n+0_13\t3_462\t28.00\t200\t132\t3\t25\t223\t2\t190\t9e-17\t75.1\n+0_13\t3_462\t29.11\t79\t56\t0\t423\t501\t112\t190\t1e-05\t41.6\n+0_13\t3_256\t29.44\t214\t129\t8\t22\t228\t22\t220\t7e-15\t70.1\n+0_13\t3_256\t24.14\t232\t140\t8\t276\t502\t16\t216\t3e-07\t47.0\n+0_13\t3_257\t28.23\t248\t154\t7\t19\t249\t20\t260\t7e-15\t70.1\n+0_13\t3_257\t24.47\t237\t145\t10\t279\t502\t22\t237\t3e-08\t50.4\n+0_13\t3_333\t23.85\t218\t152\t4\t7\t224\t2\t205\t4e-14\t69.7\n+0_13\t3_333\t27.47\t91\t65\t1\t424\t514\t128\t217\t5e-06\t43.9\n+0_13\t3_445\t24.89\t225\t152\t8\t7\t223\t61\t276\t6e-13\t64.3\n+0_13\t3_445\t23.11\t251\t162\t8\t256\t501\t52\t276\t4e-06\t43.5\n+0_13\t3_379\t24.44\t225\t135\t5\t7\t220\t2\t202\t4e-12\t63.5\n+0_13\t3_379\t23.97\t242\t128\t9\t263\t493\t1\t197\t9e-05\t39.7\n+0_13\t3_19\t23.55\t259\t172\t7\t23\t274\t18\t257\t6e-12\t62.8\n+0_13\t3_19\t24.34\t267\t141\t10\t263\t514\t1\t221\t5e-04\t37.4\n+0_13\t3_307\t22.61\t345\t227\t11\t7\t349\t2\t308\t1e-11\t62.0\n+0_13\t3_307\t24.57\t232\t140\t7\t271\t501\t8\t205\t6e-05\t40.4\n+0_13\t3_206\t21.70\t530\t292\t19\t7\t460\t2\t484\t6e-11\t59.3\n+0_13\t3_206\t21.83\t229\t165\t5\t276\t501\t13\t230\t1e-05\t42.4\n+0_13\t3_210\t27.52\t218\t131\t9\t31\t228\t153\t363\t7e-11\t58.9\n+0_13\t3_210\t22.96\t257\t154\t10\t264\t503\t129\t358\t7e-07\t46.2\n+0_13\t3_17\t23.50\t217\t152\t4\t7\t223\t2\t204\t9e-11\t58.9\n+0_13\t3_17\t24.79\t242\t125\t9\t263\t493\t1\t196\t8e-05\t40.0\n+0_13\t3_365\t36.78\t87\t52\t1\t6\t92\t38\t121\t1e-10\t58.9\n+0_13\t3_365\t29.35\t92\t62\t2\t138\t226\t500\t591\t5e-05\t40.4\n+0_13\t3_365\t28.81\t59\t42\t0\t276\t334\t50\t108\t1e-04\t39.7\n+0_13\t3_297\t22.00\t200\t141\t4\t25\t223\t20\t205\t3e-09\t54.3\n+0_13\t3_297\t23.08\t234\t141\t6\t271\t501\t8\t205\t1e-06\t45.8\n+0_13\t3_541\t29.08\t141\t92\t4\t96\t231\t180\t317\t6e-09\t52.8\n+0_13\t3_541\t27.78\t108\t72\t3\t398\t501\t205\t310\t8e-07\t46.2\n+0_13\t3_541\t29.69\t64\t45\t0\t4\t67\t8\t71\t4e-05\t40.4\n+0_13\t3_626\t28.57\t203\t121\t8\t23\t218\t352\t537\t1e-08\t52.0\n+0_13\t3_626\t33.33\t75\t48\t2\t263\t336\t335\t408\t4e-04\t37.7\n+0_13\t3_306\t24.52\t208\t144\t4\t7\t214\t2\t196\t3e-08\t50.8\n+0_13\t3_306\t30.95\t84\t49\t2\t414\t493\t119\t197\t2e-05\t42.0\n+0_13\t3_18\t24.48\t192\t121\t5\t37\t223\t32\t204\t4e-08\t50.4\n+0_13\t3_357\t23.01\t226\t161\t7\t23\t242\t28\t246\t1e-07\t48.1\n+0_13\t3_357\t23.62\t271\t178\t9\t260\t523\t6\t254\t7e-06\t42.7\n+0_13\t3_623\t28.65\t192\t109\t8\t23\t206\t351\t522\t4e-07\t47.4\n+0_13\t3_623\t28.70\t223\t118\t11\t280\t497\t350\t536\t9e-06\t42.7\n+0_13\t3_211\t31.87\t91\t53\t2\t424\t509\t281\t367\t1e-06\t45.8\n+0_13\t3_211\t32.10\t81\t52\t1\t254\t331\t34\t114\t1e-06\t45.8\n+0_13\t3_211\t28.69\t122\t68\t5\t107\t224\t254\t360\t4e-06\t43.9\n+0_13\t3_211\t40.91\t44\t26\t0\t24\t67\t65\t108\t4e-05\t40.8\n+0_13\t3_494\t39.29\t56\t34\t0\t10\t65\t12\t67\t2e-06\t45.1\n+0_13\t3_494\t33.77\t77\t46\t2\t151\t224\t622\t696\t4e-06\t43.9\n+0_13\t3_494\t21.14\t123\t85\t4\t389\t503\t579\t697\t4e-04\t37.7\n+0_13\t3_495\t23.85\t239\t147\t8\t7\t224\t17\t241\t2e-06\t44.3\n+0_13\t3_495\t22.22\t252\t158\t9\t264\t503\t17\t242\t9e-06\t42.4\n+0_13\t3_375\t25.60\t125\t88\t3\t102\t224\t76\t197\t3e-05\t40.8\n+0_13\t3_281\t24.41\t127\t83\t3\t138\t258\t14\t133\t9e-05\t39.7\n+0_13\t3_281\t28.21\t78\t55\t1\t407\t484\t5\t81\t6e-04\t37.0\n+0_13\t3_298\t26.09\t115\t72\t3\t418\t524\t80\t189\t2e-04\t38.9\n+0_13\t3_298\t23.42\t158\t111\t3\t67\t223\t14\t162\t3e-04\t38.1\n+0_13\t3_90\t26.88\t93\t64\t2\t124\t213\t812\t903\t2e-04\t38.9\n+0_13\t3_625\t25.95\t185\t117\t9\t35\t214\t363\t532\t3e-04\t38.1\n+0_14\t3_606\t29.36\t579\t316\t17\t10\t525\t7\t555\t7e-53\t 187\n+0_15'..b'\t437\t2e-135\t 395\n+0_788\t3_22\t31.25\t96\t62\t3\t6\t100\t3\t95\t7e-07\t39.3\n+0_789\t3_14\t42.51\t287\t155\t5\t1\t284\t1\t280\t5e-70\t 217\n+0_789\t3_451\t30.00\t280\t150\t11\t15\t267\t21\t281\t9e-23\t90.9\n+0_790\t3_631\t47.12\t191\t98\t3\t1\t188\t1\t191\t1e-59\t 184\n+0_791\t3_630\t40.57\t244\t141\t2\t9\t248\t2\t245\t3e-60\t 189\n+0_792\t3_629\t27.23\t213\t146\t5\t3\t210\t2\t210\t2e-20\t82.4\n+0_792\t3_99\t39.29\t56\t31\t2\t120\t172\t205\t260\t4e-04\t36.2\n+0_794\t3_66\t52.10\t428\t205\t0\t3\t430\t2\t429\t5e-163\t 466\n+0_794\t3_205\t35.40\t113\t69\t2\t154\t266\t200\t308\t3e-15\t72.4\n+0_794\t3_205\t29.07\t86\t61\t0\t7\t92\t220\t305\t4e-08\t49.7\n+0_794\t3_442\t31.40\t121\t75\t2\t7\t122\t41\t158\t4e-08\t48.1\n+0_794\t3_442\t25.79\t190\t115\t6\t159\t339\t25\t197\t1e-04\t37.7\n+0_794\t3_152\t27.64\t123\t85\t2\t174\t296\t9\t127\t1e-06\t44.7\n+0_794\t3_152\t23.89\t113\t86\t0\t6\t118\t9\t121\t2e-06\t43.9\n+0_794\t3_85\t27.62\t181\t106\t6\t83\t251\t24\t191\t7e-05\t39.3\n+0_794\t3_85\t38.36\t73\t37\t4\t8\t80\t124\t188\t1e-04\t38.1\n+0_794\t3_582\t26.47\t170\t98\t5\t174\t335\t116\t266\t1e-04\t39.3\n+0_795\t3_65\t44.13\t213\t119\t0\t4\t216\t5\t217\t5e-62\t 192\n+0_799\t3_64\t36.46\t384\t223\t8\t1\t373\t1\t374\t3e-65\t 210\n+0_800\t3_581\t33.33\t78\t52\t0\t35\t112\t31\t108\t1e-09\t47.4\n+0_801\t3_59\t51.44\t383\t170\t8\t4\t380\t10\t382\t1e-117\t 348\n+0_802\t3_267\t31.91\t94\t57\t2\t84\t174\t38\t127\t1e-06\t43.1\n+0_805\t3_136\t44.78\t230\t118\t6\t6\t233\t9\t231\t1e-46\t 153\n+0_806\t3_135\t62.71\t354\t131\t1\t1\t353\t1\t354\t1e-155\t 441\n+0_808\t3_107\t56.65\t639\t272\t4\t18\t655\t5\t639\t0.0\t 718\n+0_808\t3_29\t41.94\t651\t348\t11\t17\t653\t2\t636\t4e-170\t 500\n+0_809\t3_380\t29.67\t91\t59\t3\t12\t97\t10\t100\t9e-11\t50.4\n+0_809\t3_8\t35.00\t80\t45\t3\t24\t96\t584\t663\t1e-07\t43.5\n+0_810\t3_262\t41.50\t147\t82\t3\t1\t146\t1\t144\t5e-29\t 101\n+0_813\t3_261\t27.37\t771\t460\t21\t43\t765\t31\t749\t1e-60\t 217\n+0_814\t3_445\t56.50\t223\t97\t0\t115\t337\t55\t277\t7e-92\t 276\n+0_814\t3_379\t31.28\t195\t122\t4\t139\t331\t16\t200\t1e-24\t 100\n+0_814\t3_17\t31.94\t216\t126\t9\t120\t331\t1\t199\t1e-23\t97.8\n+0_814\t3_19\t34.52\t197\t112\t8\t139\t331\t16\t199\t2e-23\t97.1\n+0_814\t3_357\t28.63\t255\t162\t8\t116\t357\t5\t252\t5e-23\t92.0\n+0_814\t3_333\t31.02\t216\t128\t8\t120\t331\t1\t199\t9e-23\t94.7\n+0_814\t3_256\t32.73\t220\t140\t6\t120\t336\t1\t215\t1e-22\t90.9\n+0_814\t3_18\t31.00\t200\t117\t6\t138\t331\t15\t199\t3e-22\t92.8\n+0_814\t3_297\t30.73\t205\t124\t6\t139\t338\t16\t207\t1e-21\t90.9\n+0_814\t3_306\t28.02\t207\t137\t4\t139\t343\t16\t212\t2e-21\t90.5\n+0_814\t3_307\t30.73\t205\t124\t7\t139\t338\t16\t207\t2e-20\t87.0\n+0_814\t3_210\t30.12\t259\t146\t9\t119\t348\t120\t372\t5e-19\t82.8\n+0_814\t3_257\t28.18\t220\t133\t5\t138\t336\t21\t236\t4e-18\t78.6\n+0_814\t3_495\t26.00\t250\t157\t8\t119\t348\t15\t256\t7e-18\t78.6\n+0_814\t3_508\t26.46\t223\t148\t5\t139\t346\t282\t503\t3e-16\t74.3\n+0_814\t3_508\t30.43\t207\t126\t9\t140\t335\t22\t221\t4e-14\t68.2\n+0_814\t3_226\t23.89\t247\t152\t8\t112\t337\t230\t461\t2e-15\t72.0\n+0_814\t3_226\t27.27\t187\t119\t5\t143\t317\t1\t182\t2e-13\t65.9\n+0_814\t3_211\t35.29\t102\t61\t2\t252\t348\t274\t375\t5e-15\t70.5\n+0_814\t3_211\t24.44\t180\t114\t6\t106\t268\t18\t192\t8e-06\t42.0\n+0_814\t3_494\t32.08\t106\t67\t2\t253\t353\t611\t716\t8e-15\t70.5\n+0_814\t3_494\t25.69\t109\t72\t3\t119\t223\t3\t106\t1e-04\t38.5\n+0_814\t3_298\t28.19\t188\t110\t6\t166\t345\t1\t171\t2e-14\t69.3\n+0_814\t3_281\t36.61\t112\t63\t4\t249\t354\t12\t121\t2e-13\t65.9\n+0_814\t3_375\t28.16\t174\t105\t7\t186\t345\t42\t209\t3e-12\t61.6\n+0_814\t3_605\t26.29\t213\t139\t6\t142\t338\t276\t486\t1e-11\t60.5\n+0_814\t3_365\t31.37\t102\t69\t1\t239\t339\t488\t589\t2e-11\t60.1\n+0_814\t3_365\t31.03\t87\t54\t1\t137\t223\t51\t131\t2e-10\t56.6\n+0_814\t3_541\t29.73\t111\t71\t2\t138\t247\t24\t128\t1e-10\t57.0\n+0_814\t3_541\t32.53\t83\t55\t1\t257\t338\t230\t312\t7e-09\t51.6\n+0_814\t3_623\t26.04\t192\t112\t10\t138\t318\t348\t520\t2e-10\t56.6\n+0_814\t3_206\t24.68\t231\t122\t8\t120\t318\t1\t211\t4e-10\t55.5\n+0_814\t3_462\t24.37\t197\t134\t7\t145\t336\t4\t190\t2e-08\t48.9\n+0_814\t3_156\t22.10\t181\t114\t7\t150\t318\t495\t660\t2e-08\t50.4\n+0_814\t3_622\t28.99\t207\t118\t11\t137\t331\t347\t536\t7e-08\t48.5\n+0_814\t3_626\t24.34\t189\t121\t6\t138\t318\t348\t522\t1e-07\t47.8\n+0_814\t3_625\t29.44\t231\t119\t12\t116\t318\t307\t521\t3e-06\t43.5\n+0_815\t3_446\t30.06\t1407\t810\t29\t1385\t2723\t1350\t2650\t1e-149\t 518\n+0_815\t3_446\t24.27\t754\t488\t27\t556\t1258\t469\t1190\t3e-23\t 103\n+0_815\t3_446\t23.55\t310\t192\t10\t1\t309\t1\t266\t2e-07\t51.6\n+0_816\t3_202\t66.73\t532\t172\t3\t144\t674\t175\t702\t0.0\t 665\n+0_816\t3_414\t22.13\t253\t162\t8\t197\t439\t11\t238\t5e-05\t40.4\n+0_817\t3_201\t32.71\t269\t178\t2\t3\t271\t12\t277\t3e-45\t 152\n+0_818\t3_200\t43.78\t185\t102\t1\t1\t185\t1\t183\t2e-51\t 162\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast1_0.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast1_0.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1297 @@\n+1_0\t0_652\t41.86\t43\t23\t1\t4\t46\t5\t45\t8e-04\t35.0\n+1_0\t0_472\t41.86\t43\t23\t1\t4\t46\t5\t45\t8e-04\t35.0\n+1_0\t0_294\t41.86\t43\t23\t1\t4\t46\t5\t45\t8e-04\t35.0\n+1_2\t0_0\t29.27\t328\t217\t8\t127\t447\t126\t445\t4e-37\t 137\n+1_4\t0_627\t28.47\t288\t199\t4\t20\t302\t203\t488\t3e-28\t 110\n+1_4\t0_325\t27.72\t303\t187\t7\t19\t303\t202\t490\t7e-23\t94.0\n+1_4\t0_626\t24.00\t300\t205\t7\t19\t301\t210\t503\t2e-20\t86.3\n+1_4\t0_324\t24.41\t295\t202\t6\t15\t293\t201\t490\t4e-17\t76.6\n+1_4\t0_535\t27.36\t106\t68\t2\t169\t274\t2\t98\t1e-09\t52.8\n+1_4\t0_13\t33.33\t66\t41\t1\t166\t231\t4\t66\t2e-06\t43.5\n+1_4\t0_534\t31.08\t74\t47\t2\t168\t237\t2\t75\t6e-06\t42.0\n+1_4\t0_712\t28.24\t131\t78\t5\t173\t301\t15\t131\t1e-05\t41.2\n+1_4\t0_106\t33.93\t56\t37\t0\t190\t245\t33\t88\t1e-05\t41.2\n+1_4\t0_124\t31.40\t86\t50\t2\t187\t268\t27\t107\t1e-05\t40.8\n+1_4\t0_27\t29.85\t67\t44\t1\t190\t256\t1\t64\t2e-05\t40.4\n+1_4\t0_520\t25.95\t131\t69\t5\t132\t256\t11\t119\t4e-04\t36.6\n+1_4\t0_401\t50.00\t32\t16\t0\t184\t215\t621\t652\t5e-04\t36.6\n+1_4\t0_476\t28.57\t70\t47\t1\t187\t256\t21\t87\t7e-04\t35.0\n+1_4\t0_259\t30.65\t62\t42\t1\t169\t230\t5\t65\t9e-04\t35.0\n+1_4\t0_624\t31.82\t44\t30\t0\t187\t230\t17\t60\t9e-04\t35.4\n+1_5\t0_626\t28.84\t631\t390\t14\t16\t629\t22\t610\t1e-77\t 257\n+1_5\t0_324\t29.95\t561\t346\t10\t80\t630\t82\t605\t2e-65\t 223\n+1_5\t0_325\t27.08\t565\t341\t14\t83\t626\t76\t590\t2e-45\t 165\n+1_5\t0_627\t25.56\t622\t401\t15\t27\t628\t13\t592\t6e-38\t 143\n+1_5\t0_535\t25.85\t236\t155\t7\t392\t617\t2\t227\t4e-20\t86.3\n+1_5\t0_534\t25.52\t239\t140\t8\t407\t614\t22\t253\t1e-11\t60.8\n+1_5\t0_814\t27.96\t211\t128\t7\t406\t604\t138\t336\t5e-11\t59.3\n+1_5\t0_32\t24.07\t241\t139\t8\t404\t614\t110\t336\t8e-10\t56.2\n+1_5\t0_105\t24.11\t253\t145\t10\t391\t613\t43\t278\t2e-09\t55.1\n+1_5\t0_476\t25.94\t239\t139\t9\t401\t625\t14\t228\t3e-09\t53.1\n+1_5\t0_124\t34.34\t99\t61\t3\t392\t489\t12\t107\t2e-08\t51.6\n+1_5\t0_520\t31.63\t98\t63\t3\t392\t488\t46\t140\t2e-07\t48.9\n+1_5\t0_624\t24.18\t182\t120\t3\t405\t568\t14\t195\t1e-06\t46.2\n+1_5\t0_106\t39.06\t64\t34\t1\t416\t474\t38\t101\t3e-06\t45.1\n+1_5\t0_27\t20.92\t196\t141\t6\t418\t608\t8\t194\t2e-05\t41.6\n+1_5\t0_157\t25.58\t258\t144\t12\t392\t630\t4\t232\t3e-05\t40.8\n+1_5\t0_259\t34.18\t79\t50\t2\t529\t605\t204\t282\t5e-04\t37.4\n+1_6\t0_56\t75.56\t45\t11\t0\t3\t47\t4\t48\t2e-18\t68.2\n+1_7\t0_57\t42.42\t66\t35\t2\t1\t66\t1\t63\t2e-08\t43.9\n+1_8\t0_58\t28.84\t215\t147\t4\t160\t373\t503\t712\t7e-20\t86.7\n+1_9\t0_49\t31.41\t277\t155\t10\t7\t264\t7\t267\t4e-30\t 111\n+1_11\t0_503\t32.06\t549\t353\t10\t6\t549\t6\t539\t6e-93\t 293\n+1_12\t0_618\t27.70\t343\t186\t18\t85\t380\t70\t397\t1e-12\t63.9\n+1_13\t0_441\t36.33\t256\t124\t9\t7\t235\t6\t249\t2e-38\t 132\n+1_14\t0_440\t59.33\t504\t201\t3\t4\t506\t2\t502\t0.0\t 643\n+1_16\t0_326\t37.37\t570\t287\t20\t177\t727\t116\t634\t2e-93\t 303\n+1_19\t0_782\t37.21\t551\t340\t5\t14\t560\t3\t551\t5e-126\t 382\n+1_19\t0_736\t21.49\t563\t405\t13\t17\t560\t6\t550\t1e-32\t 127\n+1_20\t0_815\t25.80\t469\t316\t8\t373\t831\t1692\t2138\t3e-39\t 155\n+1_20\t0_815\t24.32\t403\t254\t11\t978\t1353\t2337\t2715\t1e-12\t67.8\n+1_21\t0_814\t48.91\t229\t117\t0\t262\t490\t117\t345\t4e-74\t 237\n+1_21\t0_535\t32.37\t207\t121\t6\t284\t481\t18\t214\t5e-21\t88.2\n+1_21\t0_157\t31.82\t220\t131\t7\t265\t481\t3\t206\t5e-17\t75.9\n+1_21\t0_534\t28.78\t205\t119\t7\t284\t463\t22\t224\t7e-16\t73.6\n+1_21\t0_124\t39.47\t114\t57\t4\t264\t376\t10\t112\t8e-16\t74.7\n+1_21\t0_124\t32.54\t126\t76\t4\t373\t493\t197\t318\t1e-11\t61.6\n+1_21\t0_105\t28.83\t222\t128\t8\t265\t463\t36\t250\t3e-15\t72.4\n+1_21\t0_325\t28.35\t261\t154\t11\t245\t489\t333\t576\t3e-15\t72.8\n+1_21\t0_520\t38.46\t104\t54\t2\t265\t368\t45\t138\t7e-15\t72.0\n+1_21\t0_520\t39.51\t81\t49\t0\t383\t463\t454\t534\t1e-11\t62.0\n+1_21\t0_627\t26.27\t236\t135\t9\t239\t462\t340\t548\t2e-14\t70.5\n+1_21\t0_259\t25.52\t286\t136\t5\t265\t481\t4\t281\t2e-13\t65.9\n+1_21\t0_32\t27.80\t223\t142\t7\t284\t488\t113\t334\t3e-13\t66.6\n+1_21\t0_476\t26.47\t204\t134\t5\t263\t462\t2\t193\t7e-13\t63.2\n+1_21\t0_712\t28.57\t133\t94\t1\t351\t482\t161\t293\t9e-13\t64.7\n+1_21\t0_712\t36.14\t83\t41\t1\t290\t372\t34\t104\t3e-06\t43.9\n+1_21\t0_224\t32.08\t106\t71\t1\t381\t485\t188\t293\t9e-12\t61.6\n+1_21\t0_224\t32.53\t83\t44\t1\t290\t372\t36\t106\t7e-04\t36.6\n+1_21\t0_31\t29.20\t113\t78\t2\t374\t484\t251\t363\t3e-11\t60.1\n+1_21\t0_31\t35.19\t54\t35\t0\t265\t318\t37\t90\t8e-05\t39.7\n+1_21\t0_106\t34.38\t96\t61\t2\t388\t481\t607\t702\t5e-10\t56.6\n+1_21\t0_106\t27.47\t91\t65\t1\t265\t354\t10\t100\t2e-05\t42.0\n+1_21\t0_624\t22.49\t249\t154\t9\t265\t487\t1\t236\t5e-10\t56.2\n+1_21\t0_624\t20.81\t197\t139\t4\t284\t477\t335\t517\t5e-04\t37.4\n+1_21\t0_13\t23.48\t230\t149\t7\t263\t477\t4\t221\t1e-09\t55.1\n+1_21\t0_13\t21.86\t247\t162\t8\t261\t481\t260\t501\t4e-06\t44.3\n+1_21\t0_626\t25.56\t2'..b'27\t234\t11\t19\t430\t2\t408\t4e-86\t 268\n+1_714\t0_211\t44.01\t784\t386\t19\t1\t761\t1\t754\t0.0\t 558\n+1_715\t0_210\t54.86\t350\t150\t4\t1\t345\t1\t347\t7e-131\t 377\n+1_715\t0_816\t28.99\t169\t102\t7\t100\t260\t235\t393\t6e-07\t45.8\n+1_715\t0_382\t27.22\t158\t86\t6\t104\t241\t560\t708\t7e-04\t36.2\n+1_716\t0_593\t37.25\t910\t514\t19\t1\t875\t5\t892\t0.0\t 558\n+1_716\t0_599\t36.54\t903\t530\t16\t1\t875\t5\t892\t0.0\t 546\n+1_717\t0_592\t28.71\t209\t115\t8\t20\t202\t8\t208\t2e-13\t63.5\n+1_717\t0_592\t28.50\t214\t102\t9\t20\t202\t216\t409\t2e-10\t54.3\n+1_717\t0_595\t27.23\t202\t126\t6\t20\t202\t144\t343\t2e-10\t54.7\n+1_717\t0_595\t37.31\t67\t39\t1\t139\t202\t70\t136\t2e-07\t45.8\n+1_717\t0_598\t29.26\t188\t126\t5\t20\t202\t209\t394\t6e-10\t52.8\n+1_717\t0_598\t27.57\t214\t104\t9\t20\t202\t8\t201\t1e-08\t48.9\n+1_718\t0_598\t26.57\t207\t123\t7\t4\t194\t202\t395\t2e-14\t65.9\n+1_718\t0_598\t44.07\t59\t33\t0\t136\t194\t144\t202\t4e-11\t56.2\n+1_718\t0_592\t27.54\t207\t120\t5\t13\t194\t8\t209\t2e-13\t63.2\n+1_718\t0_592\t45.76\t59\t32\t0\t136\t194\t352\t410\t4e-11\t56.2\n+1_718\t0_595\t27.49\t211\t130\t8\t4\t194\t137\t344\t1e-10\t55.1\n+1_718\t0_595\t41.79\t67\t36\t2\t131\t194\t71\t137\t2e-10\t53.9\n+1_719\t0_597\t34.79\t983\t521\t33\t8\t929\t5\t928\t2e-129\t 418\n+1_727\t0_298\t35.93\t359\t195\t9\t274\t601\t324\t678\t9e-55\t 196\n+1_727\t0_272\t26.40\t712\t376\t24\t2\t601\t1\t676\t2e-47\t 173\n+1_727\t0_299\t32.86\t353\t204\t9\t266\t590\t341\t688\t1e-43\t 162\n+1_729\t0_273\t31.65\t417\t228\t18\t401\t790\t464\t850\t4e-39\t 150\n+1_729\t0_273\t29.82\t171\t102\t7\t63\t218\t146\t313\t1e-09\t56.2\n+1_729\t0_273\t43.18\t44\t24\t1\t226\t268\t414\t457\t4e-04\t38.5\n+1_733\t0_271\t35.07\t710\t389\t13\t7\t711\t4\t646\t4e-109\t 344\n+1_734\t0_327\t49.06\t159\t76\t3\t1\t159\t1\t154\t4e-46\t 151\n+1_737\t0_298\t29.14\t429\t253\t14\t257\t653\t321\t730\t8e-33\t 130\n+1_737\t0_299\t34.20\t269\t151\t10\t289\t538\t377\t638\t1e-31\t 126\n+1_737\t0_299\t29.09\t165\t95\t7\t2\t153\t3\t158\t3e-04\t38.5\n+1_737\t0_272\t31.27\t275\t167\t9\t282\t539\t344\t613\t2e-27\t 113\n+1_737\t0_603\t35.62\t73\t30\t2\t66\t138\t533\t588\t1e-04\t39.7\n+1_739\t0_272\t39.08\t87\t50\t2\t2\t86\t436\t521\t4e-14\t63.5\n+1_739\t0_299\t35.53\t76\t47\t1\t4\t77\t463\t538\t9e-12\t56.6\n+1_739\t0_298\t34.62\t78\t49\t1\t2\t77\t437\t514\t5e-11\t54.3\n+1_740\t0_298\t53.12\t32\t12\t1\t3\t34\t356\t384\t2e-05\t36.2\n+1_740\t0_299\t32.86\t70\t40\t3\t1\t68\t378\t442\t3e-04\t33.1\n+1_742\t0_300\t35.24\t403\t229\t13\t405\t790\t468\t855\t7e-52\t 189\n+1_742\t0_273\t29.90\t408\t245\t13\t401\t788\t464\t850\t9e-39\t 149\n+1_742\t0_273\t27.87\t183\t98\t9\t63\t222\t146\t317\t1e-05\t43.5\n+1_742\t0_273\t45.71\t35\t18\t1\t238\t271\t426\t460\t0.001\t37.4\n+1_742\t0_326\t30.91\t110\t61\t5\t205\t307\t187\t288\t7e-04\t37.7\n+1_743\t0_298\t34.72\t360\t199\t9\t38\t366\t324\t678\t1e-51\t 181\n+1_743\t0_272\t30.85\t402\t236\t11\t2\t366\t280\t676\t6e-48\t 171\n+1_743\t0_299\t33.82\t346\t196\t8\t38\t355\t348\t688\t1e-44\t 162\n+1_745\t0_299\t35.71\t280\t156\t10\t291\t553\t368\t640\t4e-36\t 140\n+1_745\t0_298\t28.90\t429\t242\t17\t272\t664\t324\t725\t8e-31\t 124\n+1_745\t0_272\t31.32\t281\t166\t9\t291\t552\t341\t613\t3e-30\t 122\n+1_746\t0_298\t29.48\t458\t253\t19\t183\t599\t242\t670\t2e-35\t 138\n+1_746\t0_272\t24.97\t733\t410\t36\t2\t631\t1\t696\t7e-32\t 127\n+1_746\t0_299\t31.29\t278\t168\t9\t288\t546\t367\t640\t2e-29\t 119\n+1_749\t0_605\t43.00\t493\t241\t16\t1\t487\t1\t459\t4e-118\t 355\n+1_750\t0_135\t25.38\t264\t181\t8\t16\t272\t22\t276\t2e-20\t83.6\n+1_751\t0_90\t29.41\t306\t171\t8\t1\t299\t16\t283\t2e-33\t 123\n+1_752\t0_89\t33.68\t291\t187\t4\t3\t289\t6\t294\t2e-48\t 162\n+1_754\t0_50\t27.97\t261\t177\t4\t1\t261\t1\t250\t5e-26\t99.8\n+1_755\t0_51\t39.25\t456\t251\t10\t10\t453\t4\t445\t4e-87\t 272\n+1_755\t0_794\t37.78\t135\t80\t2\t218\t349\t168\t301\t7e-21\t89.7\n+1_755\t0_794\t35.54\t121\t75\t3\t224\t343\t6\t124\t1e-13\t67.4\n+1_755\t0_116\t36.67\t90\t56\t1\t224\t313\t6\t94\t4e-11\t58.9\n+1_755\t0_139\t28.12\t192\t111\t8\t205\t372\t1\t189\t2e-06\t43.1\n+1_755\t0_404\t30.48\t105\t55\t3\t221\t309\t2\t104\t5e-06\t43.1\n+1_755\t0_87\t38.03\t71\t37\t3\t218\t286\t123\t188\t1e-05\t42.0\n+1_755\t0_525\t29.21\t89\t60\t3\t224\t312\t160\t245\t6e-04\t36.6\n+1_756\t0_739\t34.21\t152\t87\t6\t59\t203\t60\t205\t1e-11\t58.5\n+1_756\t0_743\t41.51\t53\t31\t0\t90\t142\t119\t171\t8e-06\t41.6\n+1_757\t0_740\t36.82\t201\t117\t6\t5\t197\t1\t199\t4e-36\t 124\n+1_758\t0_54\t42.76\t428\t228\t8\t1\t419\t1\t420\t1e-107\t 323\n+1_759\t0_591\t50.87\t804\t389\t4\t23\t822\t80\t881\t0.0\t 791\n+1_759\t0_174\t32.57\t786\t511\t12\t1\t779\t1\t774\t4e-125\t 396\n+1_760\t0_808\t52.38\t651\t300\t6\t2\t648\t11\t655\t0.0\t 671\n+1_760\t0_173\t47.72\t658\t315\t12\t1\t648\t1\t639\t0.0\t 550\n+1_761\t0_799\t48.33\t60\t29\t1\t4\t61\t7\t66\t1e-11\t59.7\n+1_762\t0_1\t28.95\t152\t95\t8\t56\t205\t58\t198\t5e-05\t39.7\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast1_1.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast1_1.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,5235 @@\n+1_0\t1_0\t100.00\t262\t0\t0\t1\t262\t1\t262\t0.0\t 526\n+1_1\t1_1\t100.00\t158\t0\t0\t1\t158\t1\t158\t3e-109\t 307\n+1_2\t1_2\t100.00\t461\t0\t0\t1\t461\t1\t461\t0.0\t 926\n+1_3\t1_3\t100.00\t64\t0\t0\t1\t64\t1\t64\t7e-42\t 129\n+1_4\t1_4\t100.00\t305\t0\t0\t1\t305\t1\t305\t0.0\t 611\n+1_4\t1_5\t30.57\t193\t103\t3\t137\t300\t332\t522\t1e-22\t93.6\n+1_4\t1_385\t31.11\t135\t90\t2\t169\t302\t358\t490\t2e-16\t74.7\n+1_4\t1_384\t35.21\t71\t45\t1\t228\t297\t2\t72\t3e-09\t51.2\n+1_4\t1_40\t30.68\t88\t54\t1\t185\t265\t92\t179\t2e-06\t43.5\n+1_4\t1_619\t32.10\t81\t53\t2\t190\t268\t28\t108\t8e-06\t42.0\n+1_4\t1_619\t21.74\t92\t67\t2\t181\t267\t308\t399\t8e-04\t35.4\n+1_4\t1_234\t28.38\t74\t47\t1\t177\t244\t8\t81\t2e-05\t40.0\n+1_4\t1_21\t25.20\t127\t85\t3\t187\t303\t285\t411\t3e-05\t40.0\n+1_4\t1_101\t27.78\t90\t62\t1\t167\t256\t2\t88\t4e-05\t39.3\n+1_4\t1_609\t28.57\t84\t58\t1\t169\t252\t8\t89\t5e-05\t38.9\n+1_4\t1_33\t29.03\t93\t62\t3\t187\t278\t47\t136\t1e-04\t38.5\n+1_4\t1_535\t37.78\t45\t28\t0\t187\t231\t40\t84\t2e-04\t37.7\n+1_4\t1_395\t30.77\t65\t42\t1\t190\t254\t27\t88\t4e-04\t36.2\n+1_4\t1_491\t26.25\t80\t56\t2\t190\t268\t26\t103\t5e-04\t36.2\n+1_4\t1_301\t31.43\t70\t47\t1\t187\t256\t32\t100\t9e-04\t35.4\n+1_5\t1_5\t100.00\t633\t0\t0\t1\t633\t1\t633\t0.0\t1280\n+1_5\t1_385\t29.56\t548\t351\t6\t77\t620\t70\t586\t4e-64\t 220\n+1_5\t1_609\t32.34\t235\t139\t7\t392\t617\t8\t231\t5e-29\t 113\n+1_5\t1_40\t29.18\t233\t156\t4\t393\t616\t78\t310\t7e-23\t95.5\n+1_5\t1_4\t30.57\t193\t103\t3\t332\t522\t137\t300\t2e-22\t93.6\n+1_5\t1_384\t31.49\t181\t113\t3\t454\t626\t2\t179\t4e-21\t88.2\n+1_5\t1_21\t30.32\t188\t110\t6\t406\t583\t283\t459\t7e-14\t69.3\n+1_5\t1_234\t29.85\t201\t129\t6\t410\t600\t26\t224\t2e-13\t65.5\n+1_5\t1_608\t26.76\t213\t125\t9\t422\t613\t56\t258\t4e-11\t59.7\n+1_5\t1_301\t23.53\t238\t152\t8\t396\t616\t15\t239\t2e-10\t57.4\n+1_5\t1_543\t22.31\t251\t156\t7\t392\t614\t62\t301\t4e-10\t57.0\n+1_5\t1_270\t25.81\t217\t128\t10\t405\t606\t14\t212\t1e-08\t50.8\n+1_5\t1_293\t24.88\t217\t149\t8\t404\t609\t15\t228\t2e-08\t50.8\n+1_5\t1_619\t27.94\t204\t133\t8\t411\t606\t28\t225\t5e-08\t50.4\n+1_5\t1_261\t38.64\t88\t45\t3\t391\t478\t7\t85\t1e-07\t48.9\n+1_5\t1_415\t25.11\t223\t128\t8\t392\t603\t471\t665\t3e-07\t48.5\n+1_5\t1_491\t27.27\t99\t69\t2\t392\t489\t7\t103\t5e-07\t47.4\n+1_5\t1_101\t25.43\t232\t148\t7\t392\t612\t4\t221\t8e-07\t45.8\n+1_5\t1_535\t32.14\t84\t54\t2\t529\t609\t681\t764\t5e-06\t44.3\n+1_5\t1_395\t22.22\t225\t155\t9\t407\t623\t23\t235\t8e-05\t39.7\n+1_5\t1_383\t20.83\t264\t199\t5\t84\t346\t58\t312\t3e-04\t38.1\n+1_5\t1_33\t27.66\t94\t63\t3\t403\t493\t42\t133\t4e-04\t38.1\n+1_5\t1_536\t31.17\t77\t48\t2\t392\t465\t22\t96\t4e-04\t38.1\n+1_6\t1_6\t100.00\t49\t0\t0\t1\t49\t1\t49\t6e-30\t97.8\n+1_7\t1_7\t100.00\t116\t0\t0\t1\t116\t1\t116\t2e-76\t 221\n+1_8\t1_8\t100.00\t383\t0\t0\t1\t383\t1\t383\t0.0\t 776\n+1_9\t1_9\t100.00\t268\t0\t0\t1\t268\t1\t268\t0.0\t 539\n+1_10\t1_10\t100.00\t261\t0\t0\t1\t261\t1\t261\t0.0\t 530\n+1_11\t1_11\t100.00\t549\t0\t0\t1\t549\t1\t549\t0.0\t1125\n+1_12\t1_12\t100.00\t389\t0\t0\t1\t389\t1\t389\t0.0\t 792\n+1_13\t1_13\t100.00\t243\t0\t0\t1\t243\t1\t243\t2e-177\t 487\n+1_14\t1_14\t100.00\t508\t0\t0\t1\t508\t1\t508\t0.0\t1042\n+1_15\t1_15\t100.00\t396\t0\t0\t1\t396\t1\t396\t0.0\t 809\n+1_16\t1_16\t100.00\t750\t0\t0\t1\t750\t1\t750\t0.0\t1533\n+1_16\t1_568\t26.58\t617\t358\t31\t1\t573\t1\t566\t6e-28\t 115\n+1_17\t1_17\t100.00\t170\t0\t0\t1\t170\t1\t170\t2e-126\t 352\n+1_18\t1_18\t100.00\t275\t0\t0\t1\t275\t1\t275\t0.0\t 546\n+1_19\t1_19\t100.00\t566\t0\t0\t1\t566\t1\t566\t0.0\t1164\n+1_19\t1_82\t22.42\t504\t353\t12\t11\t493\t17\t503\t7e-22\t94.4\n+1_20\t1_20\t100.00\t1361\t0\t0\t1\t1361\t1\t1361\t0.0\t2726\n+1_21\t1_21\t100.00\t499\t0\t0\t1\t499\t1\t499\t0.0\t1016\n+1_21\t1_270\t37.43\t187\t109\t6\t279\t463\t11\t191\t1e-30\t 114\n+1_21\t1_301\t34.48\t203\t122\t4\t281\t477\t28\t225\t2e-22\t93.6\n+1_21\t1_234\t31.89\t185\t117\t2\t287\t463\t26\t209\t1e-20\t86.7\n+1_21\t1_40\t31.56\t244\t116\t11\t263\t481\t74\t291\t3e-20\t86.7\n+1_21\t1_609\t31.86\t204\t124\t7\t265\t463\t7\t200\t5e-20\t85.5\n+1_21\t1_261\t28.21\t280\t110\t8\t284\t488\t20\t283\t7e-19\t83.6\n+1_21\t1_619\t28.89\t225\t144\t7\t263\t478\t5\t222\t3e-16\t76.3\n+1_21\t1_619\t22.64\t265\t177\t8\t246\t488\t280\t538\t2e-09\t54.3\n+1_21\t1_543\t31.12\t196\t120\t7\t283\t463\t77\t272\t6e-16\t74.7\n+1_21\t1_491\t33.33\t111\t69\t2\t381\t486\t258\t368\t4e-14\t69.3\n+1_21\t1_491\t36.04\t111\t62\t3\t266\t376\t7\t108\t2e-13\t67.0\n+1_21\t1_5\t30.32\t188\t110\t6\t283\t459\t406\t583\t4e-14\t69.3\n+1_21\t1_536\t38.00\t100\t58\t2\t386\t481\t206\t305\t2e-12\t63.5\n+1_21\t1_536\t24.58\t118\t78\t4\t260\t372\t16\t127\t5e-04\t37.4\n+1_21\t1_33\t32.00\t125\t78\t2\t361\t484\t327\t445\t4e-12\t63.2\n+1_21\t1_33\t39.08\t87\t47\t2\t282\t368\t44\t124\t1e-11\t61.6\n+1_21\t1_608\t29.44\t197\t122\t8\t299\t481\t56\t249\t7e-12\t61.2\n+1_21\t1_101\t24.75\t202\t141\t5\t264\t463'..b'1_741\t100.00\t192\t0\t0\t1\t192\t1\t192\t2e-143\t 397\n+1_741\t1_746\t55.15\t194\t83\t2\t2\t192\t99\t291\t4e-68\t 218\n+1_741\t1_745\t52.78\t180\t80\t3\t16\t192\t118\t295\t3e-52\t 174\n+1_741\t1_737\t32.56\t172\t98\t6\t25\t189\t119\t279\t6e-18\t77.4\n+1_742\t1_742\t100.00\t791\t0\t0\t1\t791\t1\t791\t0.0\t1609\n+1_742\t1_729\t72.29\t794\t214\t4\t1\t790\t1\t792\t0.0\t1186\n+1_742\t1_693\t28.64\t618\t277\t24\t193\t790\t206\t679\t2e-48\t 177\n+1_742\t1_692\t31.44\t353\t161\t15\t430\t775\t332\t610\t1e-25\t 107\n+1_742\t1_692\t28.24\t170\t100\t6\t124\t271\t111\t280\t6e-11\t60.5\n+1_742\t1_568\t38.67\t75\t39\t4\t204\t274\t222\t293\t5e-06\t44.7\n+1_742\t1_312\t32.38\t105\t42\t5\t189\t272\t45\t141\t2e-05\t42.7\n+1_743\t1_743\t100.00\t439\t0\t0\t1\t439\t1\t439\t0.0\t 900\n+1_743\t1_727\t82.23\t439\t77\t1\t1\t439\t237\t674\t0.0\t 749\n+1_743\t1_737\t30.69\t378\t229\t12\t17\t373\t244\t609\t8e-44\t 158\n+1_743\t1_745\t29.66\t354\t221\t10\t12\t348\t253\t595\t9e-40\t 147\n+1_743\t1_746\t28.81\t420\t259\t16\t20\t411\t250\t657\t1e-36\t 137\n+1_743\t1_739\t29.73\t74\t52\t0\t148\t221\t1\t74\t1e-10\t54.7\n+1_744\t1_744\t100.00\t243\t0\t0\t1\t243\t1\t243\t3e-177\t 487\n+1_744\t1_727\t56.95\t223\t91\t3\t1\t220\t1\t221\t2e-67\t 218\n+1_744\t1_745\t60.64\t94\t36\t1\t1\t94\t1\t93\t2e-25\t 100\n+1_744\t1_746\t43.88\t139\t72\t4\t1\t134\t1\t138\t8e-24\t96.3\n+1_744\t1_737\t52.00\t100\t44\t4\t1\t99\t1\t97\t6e-23\t93.6\n+1_745\t1_745\t100.00\t705\t0\t0\t1\t705\t1\t705\t0.0\t1429\n+1_745\t1_746\t53.66\t710\t309\t9\t1\t704\t1\t696\t0.0\t 724\n+1_745\t1_737\t49.22\t709\t330\t16\t1\t704\t1\t684\t0.0\t 603\n+1_745\t1_727\t29.30\t628\t366\t26\t1\t595\t1\t583\t7e-58\t 204\n+1_745\t1_741\t52.31\t195\t87\t4\t103\t295\t2\t192\t3e-57\t 190\n+1_745\t1_739\t78.16\t87\t19\t0\t388\t474\t2\t88\t3e-42\t 145\n+1_745\t1_743\t29.66\t354\t221\t10\t253\t595\t12\t348\t2e-39\t 146\n+1_745\t1_738\t83.12\t77\t12\t1\t557\t633\t1\t76\t1e-38\t 134\n+1_745\t1_744\t57.65\t85\t36\t0\t1\t85\t1\t85\t5e-25\t 100\n+1_745\t1_740\t49.30\t71\t35\t1\t302\t371\t1\t71\t8e-18\t75.9\n+1_746\t1_746\t100.00\t701\t0\t0\t1\t701\t1\t701\t0.0\t1437\n+1_746\t1_745\t53.24\t710\t312\t9\t1\t696\t1\t704\t0.0\t 669\n+1_746\t1_737\t47.35\t716\t336\t14\t1\t701\t1\t690\t0.0\t 594\n+1_746\t1_741\t55.15\t194\t83\t2\t99\t291\t2\t192\t1e-67\t 218\n+1_746\t1_739\t91.21\t91\t8\t0\t383\t473\t1\t91\t4e-53\t 175\n+1_746\t1_727\t31.40\t363\t220\t13\t302\t657\t306\t646\t5e-37\t 142\n+1_746\t1_727\t75.00\t84\t20\t1\t1\t84\t1\t83\t3e-32\t 127\n+1_746\t1_743\t28.81\t420\t259\t16\t250\t657\t20\t411\t2e-36\t 137\n+1_746\t1_740\t64.79\t71\t25\t0\t299\t369\t1\t71\t6e-27\t 101\n+1_746\t1_744\t50.59\t85\t41\t1\t1\t84\t1\t85\t1e-17\t79.0\n+1_746\t1_738\t51.43\t70\t34\t0\t550\t619\t1\t70\t6e-17\t73.6\n+1_746\t1_452\t63.16\t19\t7\t0\t88\t106\t34\t52\t0.001\t34.7\n+1_747\t1_747\t100.00\t472\t0\t0\t1\t472\t1\t472\t0.0\t 969\n+1_747\t1_135\t24.45\t409\t286\t10\t34\t427\t74\t474\t5e-29\t 114\n+1_748\t1_748\t100.00\t447\t0\t0\t1\t447\t1\t447\t0.0\t 917\n+1_749\t1_749\t100.00\t498\t0\t0\t1\t498\t1\t498\t0.0\t1021\n+1_750\t1_750\t100.00\t283\t0\t0\t1\t283\t1\t283\t0.0\t 561\n+1_751\t1_751\t100.00\t369\t0\t0\t1\t369\t1\t369\t0.0\t 734\n+1_752\t1_752\t100.00\t310\t0\t0\t1\t310\t1\t310\t0.0\t 627\n+1_753\t1_753\t100.00\t299\t0\t0\t1\t299\t1\t299\t0.0\t 600\n+1_754\t1_754\t100.00\t266\t0\t0\t1\t266\t1\t266\t0.0\t 543\n+1_755\t1_755\t100.00\t453\t0\t0\t1\t453\t1\t453\t0.0\t 903\n+1_755\t1_160\t40.45\t89\t49\t2\t225\t310\t179\t266\t1e-16\t76.6\n+1_755\t1_160\t34.02\t97\t63\t1\t222\t318\t2\t97\t4e-11\t59.3\n+1_755\t1_472\t29.68\t155\t91\t8\t224\t366\t162\t310\t6e-07\t46.2\n+1_755\t1_696\t28.10\t121\t67\t5\t222\t326\t2\t118\t8e-06\t42.4\n+1_755\t1_412\t34.38\t64\t41\t1\t224\t287\t7\t69\t1e-05\t41.6\n+1_755\t1_654\t31.25\t96\t49\t4\t198\t280\t78\t169\t0.001\t35.8\n+1_756\t1_756\t100.00\t260\t0\t0\t1\t260\t1\t260\t0.0\t 511\n+1_756\t1_633\t28.57\t105\t69\t2\t40\t142\t71\t171\t2e-05\t40.0\n+1_757\t1_757\t100.00\t210\t0\t0\t1\t210\t1\t210\t2e-156\t 431\n+1_758\t1_758\t100.00\t420\t0\t0\t1\t420\t1\t420\t0.0\t 865\n+1_758\t1_236\t23.01\t239\t159\t8\t186\t413\t63\t287\t4e-06\t43.5\n+1_759\t1_759\t100.00\t846\t0\t0\t1\t846\t1\t846\t0.0\t1719\n+1_759\t1_438\t37.99\t708\t414\t11\t13\t711\t1\t692\t4e-139\t 431\n+1_760\t1_760\t100.00\t648\t0\t0\t1\t648\t1\t648\t0.0\t1338\n+1_760\t1_439\t43.73\t638\t338\t8\t9\t640\t5\t627\t3e-177\t 518\n+1_761\t1_761\t100.00\t322\t0\t0\t1\t322\t1\t322\t0.0\t 654\n+1_761\t1_348\t33.85\t130\t52\t4\t4\t128\t15\t115\t1e-14\t69.7\n+1_761\t1_298\t48.57\t70\t34\t1\t4\t71\t10\t79\t5e-14\t67.0\n+1_761\t1_298\t32.88\t73\t47\t1\t4\t74\t98\t170\t1e-05\t41.2\n+1_761\t1_150\t44.16\t77\t40\t2\t4\t78\t8\t83\t4e-13\t64.3\n+1_761\t1_155\t42.31\t78\t42\t2\t4\t79\t8\t84\t5e-13\t61.2\n+1_761\t1_75\t50.77\t65\t29\t2\t4\t65\t11\t75\t3e-12\t61.6\n+1_761\t1_300\t42.59\t54\t29\t1\t4\t55\t244\t297\t8e-08\t47.8\n+1_762\t1_762\t100.00\t391\t0\t0\t1\t391\t1\t391\t0.0\t 768\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast1_2.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast1_2.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1158 @@\n+1_0\t2_475\t60.30\t267\t96\t3\t1\t257\t1\t267\t1e-115\t 332\n+1_2\t2_474\t33.14\t338\t214\t5\t120\t453\t100\t429\t2e-53\t 182\n+1_4\t2_14\t34.41\t186\t106\t5\t121\t303\t313\t485\t1e-27\t 107\n+1_4\t2_13\t28.44\t327\t202\t7\t1\t302\t190\t509\t4e-24\t97.4\n+1_4\t2_64\t27.89\t147\t93\t6\t169\t303\t233\t378\t6e-08\t47.8\n+1_4\t2_308\t31.43\t70\t41\t2\t169\t235\t2\t67\t3e-06\t42.0\n+1_4\t2_181\t28.97\t107\t69\t2\t169\t268\t19\t125\t3e-06\t42.0\n+1_4\t2_419\t28.68\t136\t81\t4\t145\t268\t56\t187\t7e-06\t41.2\n+1_4\t2_39\t33.75\t80\t50\t2\t190\t268\t26\t103\t7e-06\t41.6\n+1_4\t2_473\t29.91\t117\t71\t4\t163\t268\t42\t158\t2e-05\t39.3\n+1_4\t2_180\t25.00\t140\t93\t4\t173\t303\t13\t149\t3e-05\t38.9\n+1_4\t2_119\t31.88\t69\t45\t2\t202\t268\t38\t106\t7e-05\t38.1\n+1_4\t2_119\t31.48\t54\t37\t0\t188\t241\t338\t391\t1e-04\t37.7\n+1_4\t2_188\t33.33\t45\t30\t0\t187\t231\t23\t67\t2e-04\t37.0\n+1_5\t2_14\t34.31\t545\t321\t6\t85\t627\t78\t587\t1e-96\t 306\n+1_5\t2_13\t25.58\t563\t358\t13\t86\t626\t88\t611\t8e-35\t 134\n+1_5\t2_180\t30.26\t228\t140\t7\t389\t608\t6\t222\t4e-27\t 106\n+1_5\t2_419\t32.64\t239\t139\t6\t393\t616\t84\t315\t7e-27\t 107\n+1_5\t2_181\t26.24\t221\t141\t8\t422\t633\t51\t258\t5e-15\t70.9\n+1_5\t2_471\t29.60\t223\t130\t9\t398\t605\t92\t302\t2e-14\t68.6\n+1_5\t2_308\t25.62\t242\t158\t8\t392\t624\t2\t230\t5e-14\t67.0\n+1_5\t2_64\t27.56\t225\t133\t9\t407\t617\t251\t459\t5e-12\t62.4\n+1_5\t2_307\t25.56\t223\t144\t8\t397\t607\t81\t293\t2e-08\t50.4\n+1_5\t2_293\t26.49\t185\t126\t6\t384\t563\t2\t181\t3e-08\t49.7\n+1_5\t2_473\t26.09\t207\t135\t7\t407\t605\t71\t267\t5e-08\t49.3\n+1_5\t2_39\t30.30\t99\t66\t2\t392\t489\t7\t103\t2e-07\t47.8\n+1_5\t2_39\t25.87\t143\t88\t5\t471\t609\t303\t431\t4e-06\t43.9\n+1_5\t2_79\t30.00\t90\t60\t2\t529\t615\t685\t774\t2e-06\t45.1\n+1_5\t2_119\t24.37\t238\t141\t11\t391\t605\t3\t224\t3e-06\t44.3\n+1_5\t2_188\t25.29\t87\t62\t2\t392\t478\t8\t91\t2e-04\t38.1\n+1_5\t2_399\t24.19\t186\t108\t7\t412\t588\t481\t642\t0.001\t36.2\n+1_6\t2_470\t72.34\t47\t13\t0\t1\t47\t1\t47\t4e-17\t63.9\n+1_7\t2_469\t29.41\t85\t60\t0\t1\t85\t10\t94\t3e-08\t43.5\n+1_8\t2_468\t57.70\t383\t158\t4\t1\t381\t5\t385\t2e-153\t 437\n+1_9\t2_467\t41.63\t257\t144\t4\t12\t265\t2\t255\t2e-63\t 198\n+1_11\t2_386\t35.45\t536\t319\t11\t22\t549\t21\t537\t2e-94\t 297\n+1_13\t2_30\t38.19\t254\t121\t8\t8\t238\t13\t253\t2e-45\t 150\n+1_14\t2_35\t62.94\t510\t183\t4\t1\t506\t1\t508\t0.0\t 668\n+1_15\t2_36\t47.88\t378\t193\t3\t20\t393\t4\t381\t6e-113\t 334\n+1_16\t2_67\t35.82\t67\t32\t3\t251\t314\t55\t113\t3e-04\t38.1\n+1_19\t2_138\t61.27\t568\t205\t6\t1\t559\t1\t562\t0.0\t 699\n+1_19\t2_429\t22.64\t477\t354\t8\t16\t485\t5\t473\t2e-34\t 131\n+1_20\t2_63\t35.88\t1416\t766\t25\t1\t1360\t1\t1330\t0.0\t 769\n+1_20\t2_472\t21.92\t1104\t725\t34\t328\t1356\t740\t1781\t4e-42\t 163\n+1_21\t2_64\t49.29\t420\t178\t8\t87\t498\t73\t465\t2e-112\t 339\n+1_21\t2_473\t41.16\t277\t159\t3\t224\t498\t9\t283\t1e-63\t 206\n+1_21\t2_471\t45.00\t200\t110\t0\t284\t483\t104\t303\t5e-50\t 171\n+1_21\t2_419\t32.06\t262\t136\t14\t243\t481\t54\t296\t2e-21\t89.7\n+1_21\t2_180\t28.65\t185\t120\t5\t284\t463\t23\t200\t2e-18\t79.7\n+1_21\t2_181\t27.08\t240\t159\t10\t253\t481\t4\t238\t4e-18\t79.3\n+1_21\t2_119\t28.57\t224\t136\t8\t268\t477\t8\t221\t5e-16\t74.7\n+1_21\t2_119\t22.12\t217\t148\t4\t288\t488\t340\t551\t2e-05\t41.2\n+1_21\t2_39\t37.21\t86\t54\t0\t378\t463\t322\t407\t1e-15\t73.9\n+1_21\t2_39\t33.64\t107\t62\t3\t265\t371\t6\t103\t7e-12\t61.6\n+1_21\t2_14\t27.88\t208\t128\t7\t285\t481\t368\t564\t2e-15\t73.2\n+1_21\t2_78\t27.09\t251\t127\t8\t284\t481\t40\t287\t7e-15\t70.5\n+1_21\t2_293\t28.95\t190\t121\t4\t284\t463\t21\t206\t1e-14\t68.2\n+1_21\t2_307\t28.37\t208\t135\t8\t283\t481\t88\t290\t1e-12\t63.5\n+1_21\t2_13\t26.19\t210\t130\t6\t246\t436\t343\t546\t1e-12\t63.9\n+1_21\t2_188\t33.65\t104\t59\t2\t265\t368\t7\t100\t3e-12\t62.8\n+1_21\t2_188\t34.48\t87\t56\t1\t399\t484\t363\t449\t8e-11\t58.2\n+1_21\t2_79\t31.07\t103\t69\t2\t381\t481\t661\t763\t3e-11\t60.1\n+1_21\t2_79\t26.60\t94\t62\t2\t265\t354\t10\t100\t7e-04\t36.2\n+1_21\t2_308\t26.48\t219\t139\t8\t284\t495\t18\t221\t6e-10\t54.3\n+1_21\t2_427\t62.96\t27\t10\t0\t285\t311\t23\t49\t2e-04\t38.1\n+1_21\t2_427\t44.74\t38\t19\t1\t285\t320\t632\t669\t3e-04\t37.4\n+1_21\t2_427\t31.58\t95\t60\t3\t387\t477\t820\t913\t3e-04\t37.4\n+1_23\t2_463\t24.85\t169\t111\t9\t1\t155\t1\t167\t1e-07\t43.1\n+1_24\t2_462\t48.19\t166\t86\t0\t8\t173\t3\t168\t3e-56\t 173\n+1_25\t2_461\t57.61\t696\t251\t8\t26\t720\t25\t677\t0.0\t 756\n+1_25\t2_366\t32.86\t70\t39\t2\t310\t379\t41\t102\t2e-04\t37.7\n+1_25\t2_242\t25.28\t178\t108\t7\t289\t452\t357\t523\t3e-04\t38.1\n+1_28\t2_38\t42.05\t88\t51\t0\t1\t88\t1\t88\t3e-21\t77.4\n+1_29\t2_65\t34.66\t652\t390\t15\t14\t644\t10\t646\t1e-114\t 356\n+1_30\t2_71\t62.64\t803\t290\t3\t2\t801\t3\t798\t0.0\t1030\n+1_31\t2_263\t31.59\t801\t436\t20\t1\t735\t1\t755\t8e-108\t 344\n+1_31\t2_186\t30.36\t774\t434\t23'..b'7\t2_450\t53.45\t232\t101\t3\t1\t232\t1\t225\t1e-83\t 248\n+1_658\t2_451\t58.14\t86\t34\t1\t1\t84\t1\t86\t2e-31\t 103\n+1_659\t2_179\t60.83\t120\t47\t0\t1\t120\t1\t120\t2e-47\t 148\n+1_660\t2_178\t48.14\t322\t162\t2\t16\t332\t1\t322\t2e-108\t 319\n+1_661\t2_177\t57.02\t121\t52\t0\t1\t121\t1\t121\t1e-50\t 155\n+1_662\t2_176\t73.39\t124\t33\t0\t1\t124\t1\t124\t5e-63\t 187\n+1_663\t2_175\t81.08\t37\t7\t0\t1\t37\t1\t37\t4e-17\t63.2\n+1_664\t2_174\t56.52\t69\t30\t0\t1\t69\t1\t69\t2e-24\t84.3\n+1_665\t2_124\t41.76\t91\t53\t0\t9\t99\t10\t100\t3e-26\t90.9\n+1_666\t2_122\t46.65\t716\t342\t12\t8\t703\t5\t700\t0.0\t 611\n+1_668\t2_112\t43.60\t211\t114\t3\t2\t211\t3\t209\t8e-54\t 169\n+1_669\t2_111\t47.90\t428\t216\t4\t1\t426\t7\t429\t5e-139\t 404\n+1_670\t2_110\t38.55\t249\t140\t8\t29\t270\t35\t277\t4e-45\t 151\n+1_671\t2_109\t38.81\t402\t222\t10\t18\t414\t2\t384\t2e-89\t 275\n+1_672\t2_108\t37.05\t251\t142\t6\t12\t258\t16\t254\t3e-49\t 161\n+1_673\t2_107\t47.28\t184\t96\t1\t9\t191\t2\t185\t9e-52\t 163\n+1_674\t2_106\t52.17\t184\t87\t1\t5\t188\t3\t185\t7e-68\t 204\n+1_675\t2_60\t33.70\t540\t277\t16\t12\t492\t2\t519\t6e-72\t 237\n+1_676\t2_387\t56.95\t604\t258\t2\t6\t608\t7\t609\t0.0\t 657\n+1_677\t2_388\t32.42\t182\t110\t5\t27\t207\t9\t178\t3e-23\t89.4\n+1_680\t2_51\t40.20\t204\t113\t4\t6\t206\t7\t204\t2e-40\t 139\n+1_681\t2_52\t35.78\t109\t67\t2\t22\t128\t15\t122\t2e-12\t55.5\n+1_682\t2_53\t55.32\t47\t21\t0\t1\t47\t1\t47\t4e-15\t58.5\n+1_682\t2_330\t41.46\t41\t23\t1\t7\t46\t9\t49\t7e-05\t30.8\n+1_690\t2_410\t42.28\t298\t165\t4\t115\t407\t135\t430\t5e-73\t 238\n+1_690\t2_408\t24.34\t341\t217\t13\t86\t409\t103\t419\t2e-13\t66.2\n+1_691\t2_408\t38.68\t455\t264\t6\t3\t449\t10\t457\t5e-108\t 327\n+1_691\t2_410\t23.99\t271\t192\t7\t59\t322\t81\t344\t2e-09\t53.9\n+1_692\t2_66\t23.91\t389\t211\t20\t269\t594\t122\t488\t2e-04\t38.5\n+1_693\t2_67\t23.19\t457\t221\t21\t262\t658\t72\t458\t2e-07\t47.8\n+1_693\t2_404\t22.62\t367\t207\t16\t262\t601\t113\t429\t1e-04\t39.3\n+1_694\t2_19\t39.86\t138\t77\t2\t3\t134\t7\t144\t7e-26\t92.4\n+1_695\t2_20\t63.76\t287\t104\t0\t4\t290\t2\t288\t2e-130\t 371\n+1_696\t2_21\t52.15\t372\t167\t5\t1\t367\t1\t366\t6e-123\t 358\n+1_696\t2_392\t36.89\t103\t48\t1\t1\t103\t159\t244\t4e-17\t76.6\n+1_696\t2_396\t28.57\t112\t64\t3\t1\t111\t3\t99\t2e-04\t37.0\n+1_696\t2_334\t35.06\t77\t32\t2\t1\t76\t1\t60\t2e-04\t37.0\n+1_697\t2_31\t45.41\t207\t108\t3\t6\t211\t7\t209\t2e-63\t 194\n+1_698\t2_80\t72.79\t136\t36\t1\t4\t139\t1\t135\t9e-67\t 198\n+1_699\t2_81\t62.78\t223\t83\t0\t3\t225\t2\t224\t1e-101\t 293\n+1_700\t2_82\t41.62\t185\t104\t3\t2\t183\t5\t188\t5e-44\t 142\n+1_701\t2_83\t37.86\t280\t164\t2\t4\t276\t2\t278\t1e-63\t 200\n+1_702\t2_61\t30.11\t641\t394\t17\t20\t621\t10\t635\t7e-70\t 238\n+1_712\t2_254\t50.41\t244\t114\t6\t16\t256\t2\t241\t1e-73\t 223\n+1_712\t2_352\t22.45\t147\t108\t4\t111\t253\t6\t150\t6e-04\t33.9\n+1_713\t2_255\t41.67\t432\t244\t3\t5\t435\t4\t428\t3e-117\t 348\n+1_715\t2_362\t26.30\t308\t173\t12\t1\t273\t369\t657\t3e-07\t46.2\n+1_715\t2_461\t28.67\t150\t91\t6\t101\t239\t268\t412\t2e-05\t40.8\n+1_729\t2_404\t26.96\t115\t73\t2\t648\t752\t365\t478\t4e-04\t37.7\n+1_733\t2_256\t41.67\t708\t357\t7\t9\t713\t4\t658\t3e-179\t 526\n+1_734\t2_417\t52.83\t159\t73\t1\t2\t160\t1\t157\t6e-60\t 181\n+1_735\t2_15\t35.53\t833\t503\t13\t288\t1107\t219\t1030\t1e-143\t 457\n+1_748\t2_465\t40.06\t347\t199\t4\t10\t352\t5\t346\t3e-82\t 258\n+1_749\t2_466\t49.19\t492\t237\t4\t1\t492\t1\t479\t6e-170\t 488\n+1_750\t2_12\t30.25\t281\t178\t7\t3\t280\t1\t266\t8e-39\t 134\n+1_751\t2_85\t42.82\t362\t184\t10\t12\t360\t5\t356\t3e-80\t 249\n+1_752\t2_84\t43.43\t297\t166\t2\t3\t299\t4\t298\t2e-86\t 261\n+1_754\t2_8\t42.02\t257\t147\t2\t6\t260\t4\t260\t4e-65\t 202\n+1_755\t2_7\t44.40\t455\t233\t7\t6\t453\t1\t442\t5e-112\t 336\n+1_755\t2_334\t35.79\t95\t57\t2\t222\t313\t179\t272\t3e-12\t62.4\n+1_755\t2_334\t28.90\t173\t106\t4\t224\t382\t4\t173\t1e-11\t60.8\n+1_755\t2_392\t26.11\t180\t104\t7\t208\t378\t149\t308\t6e-08\t48.5\n+1_755\t2_447\t38.20\t89\t45\t5\t204\t291\t103\t182\t1e-06\t43.9\n+1_755\t2_21\t28.71\t101\t54\t3\t225\t309\t5\t103\t9e-05\t38.5\n+1_755\t2_396\t27.56\t127\t72\t3\t222\t332\t4\t126\t1e-04\t37.7\n+1_756\t2_6\t29.41\t255\t169\t8\t9\t260\t7\t253\t7e-20\t80.9\n+1_756\t2_426\t28.04\t107\t67\t3\t40\t142\t72\t172\t9e-04\t34.7\n+1_757\t2_5\t39.68\t189\t107\t5\t1\t185\t1\t186\t5e-41\t 136\n+1_758\t2_4\t49.29\t420\t210\t1\t1\t420\t1\t417\t4e-142\t 411\n+1_759\t2_3\t60.34\t817\t322\t2\t7\t823\t9\t823\t0.0\t1009\n+1_759\t2_203\t31.62\t718\t461\t10\t20\t727\t10\t707\t2e-120\t 381\n+1_760\t2_2\t64.55\t646\t228\t1\t3\t647\t4\t649\t0.0\t 887\n+1_760\t2_202\t45.37\t648\t330\t10\t6\t645\t2\t633\t0.0\t 536\n+1_761\t2_1\t45.99\t324\t155\t5\t1\t320\t1\t308\t6e-88\t 265\n+1_761\t2_16\t35.71\t84\t45\t2\t4\t79\t9\t91\t1e-10\t56.6\n+1_761\t2_199\t41.77\t79\t40\t4\t4\t77\t9\t86\t1e-09\t53.1\n+1_762\t2_0\t25.45\t330\t224\t8\t35\t354\t36\t353\t3e-16\t73.9\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast1_3.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast1_3.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1475 @@\n+1_2\t3_0\t26.35\t334\t218\t9\t124\t443\t115\t434\t3e-30\t 117\n+1_4\t3_622\t25.11\t235\t159\t8\t41\t273\t218\t437\t2e-10\t56.6\n+1_4\t3_625\t23.20\t181\t132\t4\t115\t288\t273\t453\t1e-09\t53.5\n+1_4\t3_256\t25.76\t132\t83\t2\t169\t300\t2\t118\t1e-08\t50.1\n+1_4\t3_494\t57.78\t45\t18\t1\t190\t233\t27\t71\t1e-08\t50.4\n+1_4\t3_365\t31.46\t89\t56\t2\t169\t257\t39\t122\t1e-06\t44.3\n+1_4\t3_541\t28.05\t82\t58\t1\t187\t268\t26\t106\t1e-06\t43.9\n+1_4\t3_605\t31.82\t110\t68\t4\t166\t272\t5\t110\t2e-06\t43.5\n+1_4\t3_17\t27.68\t112\t72\t3\t187\t296\t17\t121\t2e-05\t40.4\n+1_4\t3_226\t24.17\t120\t72\t4\t190\t291\t1\t119\t3e-05\t39.7\n+1_4\t3_462\t30.77\t65\t42\t2\t192\t256\t4\t65\t6e-05\t38.1\n+1_4\t3_206\t30.30\t66\t43\t1\t169\t234\t2\t64\t7e-05\t38.9\n+1_4\t3_156\t30.08\t123\t75\t5\t131\t250\t432\t546\t8e-05\t38.5\n+1_4\t3_257\t38.10\t42\t26\t0\t187\t228\t23\t64\t1e-04\t37.7\n+1_4\t3_19\t23.58\t123\t73\t4\t187\t301\t17\t126\t1e-04\t38.1\n+1_4\t3_445\t34.78\t46\t30\t0\t190\t235\t83\t128\t2e-04\t36.6\n+1_4\t3_18\t23.58\t123\t73\t4\t187\t301\t17\t126\t6e-04\t36.2\n+1_4\t3_626\t25.93\t135\t86\t4\t172\t301\t339\t464\t6e-04\t35.8\n+1_5\t3_256\t28.39\t236\t158\t4\t392\t621\t2\t232\t8e-24\t97.4\n+1_5\t3_625\t27.83\t212\t132\t6\t381\t587\t327\t522\t8e-17\t78.6\n+1_5\t3_17\t30.73\t218\t122\t10\t407\t612\t16\t216\t1e-14\t71.6\n+1_5\t3_622\t27.59\t203\t130\t7\t390\t587\t332\t522\t4e-14\t70.1\n+1_5\t3_257\t28.96\t259\t137\t11\t391\t615\t2\t247\t4e-14\t68.2\n+1_5\t3_156\t25.40\t189\t131\t3\t421\t609\t497\t675\t1e-13\t68.6\n+1_5\t3_18\t30.37\t214\t128\t9\t402\t607\t11\t211\t2e-13\t68.2\n+1_5\t3_297\t29.67\t209\t127\t8\t417\t616\t25\t222\t2e-13\t67.8\n+1_5\t3_19\t30.24\t205\t124\t10\t405\t604\t14\t204\t7e-13\t66.2\n+1_5\t3_307\t28.38\t222\t140\t8\t417\t629\t25\t236\t1e-12\t65.5\n+1_5\t3_333\t25.00\t240\t164\t5\t392\t628\t2\t228\t5e-12\t63.5\n+1_5\t3_210\t23.83\t256\t151\t8\t392\t614\t122\t366\t7e-12\t62.8\n+1_5\t3_379\t26.01\t223\t138\t9\t403\t613\t12\t219\t2e-11\t61.6\n+1_5\t3_306\t30.85\t188\t115\t7\t403\t587\t12\t187\t3e-10\t57.8\n+1_5\t3_495\t23.11\t251\t153\t8\t392\t613\t10\t249\t5e-10\t56.2\n+1_5\t3_357\t25.85\t236\t135\t11\t392\t602\t10\t230\t5e-10\t55.5\n+1_5\t3_541\t38.64\t88\t51\t2\t403\t489\t21\t106\t6e-10\t56.2\n+1_5\t3_226\t27.67\t206\t137\t7\t411\t606\t1\t204\t7e-10\t56.2\n+1_5\t3_445\t27.51\t189\t112\t6\t392\t567\t61\t237\t4e-09\t53.1\n+1_5\t3_626\t24.06\t212\t143\t7\t392\t597\t336\t535\t4e-09\t53.9\n+1_5\t3_508\t24.14\t203\t142\t7\t418\t612\t32\t230\t6e-08\t50.1\n+1_5\t3_508\t25.42\t236\t135\t11\t407\t614\t282\t504\t7e-06\t43.5\n+1_5\t3_623\t26.70\t206\t118\t9\t395\t588\t338\t522\t5e-07\t47.0\n+1_5\t3_298\t29.89\t87\t60\t1\t527\t612\t84\t170\t6e-07\t47.0\n+1_5\t3_281\t29.89\t87\t57\t1\t519\t605\t16\t98\t1e-06\t46.2\n+1_5\t3_206\t21.86\t183\t125\t2\t405\t569\t14\t196\t3e-06\t45.1\n+1_5\t3_494\t28.28\t99\t68\t2\t520\t615\t608\t706\t4e-06\t44.3\n+1_5\t3_494\t31.88\t69\t42\t1\t411\t474\t27\t95\t2e-04\t38.9\n+1_5\t3_365\t29.70\t101\t63\t4\t392\t489\t39\t134\t5e-06\t43.9\n+1_5\t3_211\t33.82\t68\t39\t2\t388\t449\t37\t104\t7e-05\t40.0\n+1_5\t3_462\t23.42\t222\t139\t9\t422\t631\t13\t215\t7e-05\t39.3\n+1_6\t3_673\t76.60\t47\t11\t0\t1\t47\t1\t47\t4e-20\t72.4\n+1_7\t3_672\t37.88\t66\t38\t2\t1\t66\t1\t63\t6e-04\t32.0\n+1_8\t3_671\t29.15\t247\t156\t7\t113\t354\t351\t583\t2e-18\t81.6\n+1_9\t3_650\t31.53\t222\t128\t7\t16\t225\t6\t215\t1e-23\t92.8\n+1_11\t3_11\t35.92\t554\t325\t15\t4\t549\t3\t534\t3e-101\t 315\n+1_12\t3_578\t27.39\t387\t238\t19\t21\t385\t5\t370\t7e-18\t79.3\n+1_13\t3_354\t42.32\t241\t122\t5\t8\t235\t6\t242\t1e-51\t 166\n+1_14\t3_355\t63.69\t504\t180\t2\t4\t505\t7\t509\t0.0\t 681\n+1_15\t3_585\t44.35\t363\t196\t4\t19\t377\t8\t368\t3e-90\t 276\n+1_16\t3_627\t35.20\t588\t308\t22\t180\t749\t69\t601\t8e-81\t 268\n+1_19\t3_91\t36.55\t550\t347\t2\t14\t563\t7\t554\t2e-129\t 397\n+1_19\t3_8\t24.04\t495\t356\t9\t18\t500\t7\t493\t3e-45\t 165\n+1_20\t3_446\t27.49\t411\t284\t4\t379\t786\t1673\t2072\t5e-40\t 157\n+1_20\t3_446\t26.65\t394\t236\t10\t998\t1360\t2278\t2649\t4e-16\t79.0\n+1_21\t3_445\t45.26\t232\t125\t1\t250\t481\t47\t276\t2e-67\t 217\n+1_21\t3_333\t35.82\t201\t111\t7\t265\t463\t1\t185\t1e-24\t 102\n+1_21\t3_379\t32.02\t203\t117\t5\t265\t463\t1\t186\t4e-24\t 100\n+1_21\t3_19\t33.03\t218\t125\t6\t281\t492\t13\t215\t3e-23\t98.6\n+1_21\t3_17\t32.42\t219\t131\t7\t265\t481\t1\t204\t8e-23\t97.1\n+1_21\t3_307\t31.96\t219\t133\t6\t265\t481\t1\t205\t2e-22\t95.5\n+1_21\t3_18\t34.10\t217\t120\t7\t284\t492\t16\t217\t2e-22\t95.5\n+1_21\t3_306\t28.50\t207\t136\t4\t284\t488\t16\t212\t3e-22\t95.1\n+1_21\t3_357\t26.75\t228\t150\t6\t264\t479\t8\t230\t8e-22\t90.5\n+1_21\t3_297\t32.02\t203\t117\t6\t265\t463\t1\t186\t7e-21\t90.9\n+1_21\t3_256\t31.00\t229\t132\t6\t265\t481\t1\t215\t9e-19\t81.3\n+1_21\t3_257\t30.41\t217\t130\t7\t266\t463\t3\t217\t2e-18\t80.9\n+1_21\t3_495\t28.57\t217\t133\t7\t265\t463\t9\t221\t2e-17\t78.6\n+1_21\t3'..b'+1_692\t3_611\t35.22\t301\t156\t9\t341\t610\t509\t801\t7e-39\t 147\n+1_692\t3_611\t27.27\t165\t102\t4\t133\t285\t250\t408\t3e-07\t47.8\n+1_693\t3_611\t29.82\t664\t367\t27\t78\t675\t184\t814\t6e-48\t 176\n+1_693\t3_620\t26.91\t628\t332\t23\t132\t679\t238\t818\t4e-45\t 167\n+1_695\t3_13\t55.21\t288\t127\t1\t3\t290\t2\t287\t1e-106\t 311\n+1_695\t3_571\t32.63\t285\t175\t8\t4\t283\t3\t275\t1e-37\t 132\n+1_696\t3_285\t47.25\t364\t189\t2\t2\t364\t3\t364\t1e-115\t 340\n+1_696\t3_37\t24.40\t250\t150\t7\t1\t246\t156\t370\t3e-15\t71.6\n+1_696\t3_85\t50.00\t34\t17\t0\t2\t35\t120\t153\t7e-04\t35.8\n+1_697\t3_608\t44.02\t184\t97\t1\t11\t194\t7\t184\t1e-49\t 159\n+1_698\t3_453\t52.70\t148\t70\t0\t4\t151\t1\t148\t1e-49\t 155\n+1_699\t3_452\t46.49\t228\t118\t2\t3\t226\t2\t229\t2e-71\t 216\n+1_700\t3_200\t44.72\t161\t82\t2\t1\t156\t1\t159\t2e-47\t 152\n+1_701\t3_201\t42.16\t185\t103\t3\t5\t187\t7\t189\t6e-42\t 144\n+1_702\t3_485\t46.33\t667\t335\t10\t12\t668\t1\t654\t0.0\t 592\n+1_704\t3_487\t33.99\t303\t182\t13\t24\t316\t16\t310\t3e-47\t 159\n+1_706\t3_87\t26.75\t329\t174\t17\t36\t342\t257\t540\t1e-14\t70.9\n+1_706\t3_332\t25.29\t514\t242\t22\t34\t428\t301\t791\t2e-13\t67.4\n+1_712\t3_638\t29.54\t237\t151\t8\t26\t260\t7\t229\t4e-23\t90.5\n+1_712\t3_140\t31.61\t155\t84\t6\t112\t257\t110\t251\t7e-11\t55.8\n+1_713\t3_639\t39.23\t418\t228\t7\t14\t429\t6\t399\t2e-87\t 271\n+1_714\t3_87\t27.61\t163\t96\t7\t360\t504\t286\t444\t8e-04\t37.4\n+1_715\t3_202\t28.15\t135\t88\t4\t101\t229\t266\t397\t5e-04\t36.6\n+1_716\t3_624\t24.66\t292\t156\t14\t153\t416\t237\t492\t2e-07\t48.9\n+1_727\t3_619\t29.11\t426\t253\t11\t247\t639\t395\t804\t1e-43\t 163\n+1_727\t3_612\t33.77\t302\t188\t8\t249\t546\t249\t542\t1e-43\t 161\n+1_727\t3_432\t26.89\t621\t337\t27\t6\t548\t7\t588\t2e-27\t 113\n+1_729\t3_620\t34.63\t387\t191\t14\t438\t792\t462\t818\t2e-43\t 164\n+1_729\t3_620\t33.74\t163\t83\t6\t138\t276\t236\t397\t4e-15\t73.9\n+1_729\t3_611\t31.59\t364\t168\t16\t438\t784\t509\t808\t6e-21\t92.8\n+1_729\t3_611\t30.43\t184\t98\t7\t120\t274\t224\t406\t5e-10\t57.8\n+1_733\t3_259\t34.16\t729\t407\t14\t4\t710\t2\t679\t2e-111\t 351\n+1_737\t3_612\t33.33\t300\t183\t10\t242\t534\t251\t540\t8e-43\t 159\n+1_737\t3_619\t33.33\t348\t193\t16\t257\t578\t409\t743\t2e-39\t 150\n+1_737\t3_432\t27.46\t397\t231\t19\t295\t645\t342\t727\t2e-22\t97.1\n+1_739\t3_619\t47.83\t69\t36\t0\t5\t73\t529\t597\t5e-17\t72.0\n+1_739\t3_612\t44.16\t77\t42\t1\t2\t77\t383\t459\t6e-17\t71.6\n+1_739\t3_432\t43.28\t67\t33\t2\t14\t77\t436\t500\t1e-10\t52.8\n+1_740\t3_612\t28.79\t66\t44\t2\t3\t68\t302\t364\t4e-05\t35.0\n+1_740\t3_619\t31.88\t69\t41\t3\t1\t67\t442\t506\t2e-04\t33.5\n+1_742\t3_620\t33.76\t394\t198\t12\t433\t790\t452\t818\t9e-46\t 171\n+1_742\t3_620\t30.34\t234\t122\t11\t138\t348\t236\t451\t2e-13\t68.6\n+1_742\t3_611\t28.09\t356\t189\t16\t438\t782\t509\t808\t3e-13\t68.2\n+1_742\t3_611\t31.90\t163\t84\t4\t137\t272\t242\t404\t7e-13\t67.0\n+1_742\t3_627\t35.62\t73\t42\t3\t202\t271\t124\t194\t5e-04\t37.7\n+1_743\t3_612\t33.11\t305\t191\t8\t11\t311\t247\t542\t1e-44\t 160\n+1_743\t3_619\t27.91\t412\t239\t11\t14\t389\t398\t787\t2e-40\t 150\n+1_743\t3_432\t31.91\t329\t180\t17\t13\t313\t276\t588\t2e-26\t 107\n+1_745\t3_612\t27.44\t554\t327\t22\t72\t588\t87\t602\t3e-42\t 158\n+1_745\t3_619\t31.23\t269\t163\t9\t301\t553\t441\t703\t2e-30\t 122\n+1_745\t3_432\t24.32\t407\t246\t17\t297\t658\t330\t719\t3e-18\t83.6\n+1_746\t3_612\t29.43\t418\t255\t15\t263\t652\t265\t670\t3e-44\t 164\n+1_746\t3_619\t31.81\t349\t202\t13\t274\t597\t418\t755\t5e-35\t 137\n+1_746\t3_432\t29.49\t312\t181\t15\t259\t541\t284\t585\t1e-20\t91.3\n+1_747\t3_220\t21.96\t428\t305\t11\t22\t431\t46\t462\t6e-19\t84.3\n+1_749\t3_137\t43.23\t495\t238\t9\t3\t487\t2\t463\t1e-119\t 358\n+1_751\t3_96\t28.25\t315\t174\t12\t30\t333\t32\t305\t4e-21\t87.8\n+1_754\t3_651\t30.11\t269\t172\t5\t2\t263\t150\t409\t2e-28\t 107\n+1_755\t3_205\t40.44\t455\t244\t13\t10\t453\t4\t442\t8e-78\t 248\n+1_755\t3_66\t31.55\t206\t119\t5\t222\t412\t171\t369\t2e-22\t94.0\n+1_755\t3_66\t27.12\t118\t85\t1\t224\t341\t5\t121\t2e-10\t57.4\n+1_755\t3_152\t36.56\t93\t52\t3\t224\t313\t9\t97\t7e-07\t45.4\n+1_755\t3_85\t34.09\t132\t64\t8\t202\t317\t93\t217\t2e-06\t43.9\n+1_755\t3_442\t28.99\t169\t91\t10\t223\t371\t39\t198\t3e-04\t36.6\n+1_756\t3_253\t33.33\t90\t60\t0\t67\t156\t62\t151\t2e-08\t48.5\n+1_756\t3_249\t33.04\t115\t70\t4\t31\t143\t66\t175\t4e-07\t45.4\n+1_757\t3_252\t31.90\t210\t131\t6\t5\t207\t1\t205\t2e-25\t95.9\n+1_758\t3_244\t41.36\t411\t236\t4\t6\t414\t5\t412\t3e-102\t 309\n+1_759\t3_526\t45.27\t804\t434\t5\t23\t823\t51\t851\t0.0\t 704\n+1_759\t3_28\t33.70\t727\t452\t12\t13\t725\t1\t711\t6e-114\t 366\n+1_760\t3_107\t49.38\t640\t312\t5\t9\t644\t5\t636\t0.0\t 617\n+1_760\t3_29\t43.73\t638\t337\t8\t9\t640\t3\t624\t1e-179\t 524\n+1_761\t3_64\t43.28\t67\t30\t1\t3\t61\t6\t72\t8e-11\t57.0\n+1_762\t3_1\t23.73\t354\t210\t16\t24\t348\t23\t345\t9e-06\t42.0\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast2_0.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast2_0.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,986 @@\n+2_0\t0_1\t23.60\t394\t261\t14\t1\t380\t1\t368\t5e-10\t55.5\n+2_1\t0_799\t50.00\t60\t28\t1\t4\t61\t7\t66\t2e-11\t59.3\n+2_2\t0_808\t50.23\t653\t314\t6\t2\t650\t10\t655\t0.0\t 657\n+2_2\t0_173\t44.70\t642\t325\t12\t10\t641\t9\t630\t2e-180\t 527\n+2_3\t0_591\t49.94\t801\t395\t4\t23\t818\t78\t877\t0.0\t 759\n+2_3\t0_174\t32.91\t787\t507\t9\t11\t792\t17\t787\t3e-129\t 407\n+2_4\t0_54\t41.31\t426\t234\t7\t1\t416\t1\t420\t5e-102\t 309\n+2_4\t0_353\t23.59\t195\t139\t4\t130\t320\t177\t365\t5e-07\t46.6\n+2_5\t0_740\t30.69\t189\t122\t5\t5\t186\t1\t187\t3e-25\t95.1\n+2_6\t0_743\t37.50\t64\t40\t0\t81\t144\t114\t177\t5e-07\t45.4\n+2_7\t0_51\t37.56\t442\t259\t7\t11\t442\t11\t445\t1e-80\t 255\n+2_7\t0_794\t35.10\t208\t109\t8\t218\t415\t172\t363\t4e-22\t93.2\n+2_7\t0_794\t36.29\t124\t76\t2\t220\t341\t6\t128\t3e-13\t66.2\n+2_7\t0_116\t42.86\t84\t48\t0\t220\t303\t6\t89\t8e-14\t66.6\n+2_7\t0_139\t29.81\t161\t99\t5\t213\t365\t16\t170\t3e-06\t42.7\n+2_8\t0_50\t35.32\t201\t116\t4\t61\t260\t62\t249\t2e-36\t 127\n+2_9\t0_255\t34.43\t61\t38\t1\t111\t171\t256\t314\t3e-04\t36.2\n+2_12\t0_135\t33.06\t248\t146\t8\t26\t258\t34\t276\t3e-29\t 109\n+2_13\t0_627\t30.34\t613\t398\t8\t4\t612\t4\t591\t9e-79\t 259\n+2_13\t0_325\t32.17\t544\t327\t13\t88\t613\t73\t592\t4e-69\t 233\n+2_13\t0_626\t28.46\t527\t327\t15\t108\t612\t110\t608\t2e-42\t 156\n+2_13\t0_324\t27.34\t534\t365\t7\t83\t608\t80\t598\t3e-41\t 153\n+2_13\t0_535\t30.87\t230\t130\t6\t381\t601\t17\t226\t2e-20\t87.0\n+2_13\t0_814\t27.15\t221\t137\t7\t383\t596\t140\t343\t4e-12\t62.8\n+2_13\t0_124\t29.03\t186\t108\t6\t426\t594\t136\t314\t6e-12\t62.8\n+2_13\t0_124\t31.88\t69\t44\t2\t398\t465\t42\t108\t9e-04\t37.0\n+2_13\t0_224\t38.10\t84\t49\t1\t514\t594\t211\t294\t3e-10\t57.4\n+2_13\t0_534\t24.69\t243\t131\t10\t381\t590\t21\t244\t4e-10\t56.2\n+2_13\t0_712\t31.63\t98\t64\t1\t504\t598\t204\t301\t7e-10\t56.2\n+2_13\t0_712\t28.92\t83\t50\t3\t397\t478\t43\t117\t5e-05\t40.8\n+2_13\t0_13\t26.36\t220\t131\t9\t385\t591\t24\t225\t1e-09\t55.8\n+2_13\t0_105\t27.90\t276\t147\t14\t342\t590\t20\t270\t1e-09\t55.1\n+2_13\t0_157\t27.46\t244\t147\t10\t362\t601\t1\t218\t2e-09\t53.9\n+2_13\t0_624\t28.00\t200\t111\t9\t365\t545\t2\t187\t2e-09\t54.7\n+2_13\t0_520\t33.00\t100\t56\t3\t514\t609\t475\t567\t2e-08\t52.0\n+2_13\t0_520\t28.00\t125\t84\t3\t360\t483\t41\t160\t4e-08\t50.8\n+2_13\t0_31\t32.61\t92\t57\t3\t514\t601\t282\t372\t2e-08\t51.2\n+2_13\t0_32\t28.27\t191\t104\t8\t377\t549\t108\t283\t8e-08\t49.7\n+2_13\t0_106\t33.33\t99\t54\t4\t496\t590\t613\t703\t1e-07\t49.7\n+2_13\t0_106\t28.05\t82\t54\t1\t372\t448\t19\t100\t6e-04\t37.7\n+2_13\t0_476\t24.77\t218\t130\t9\t383\t590\t21\t214\t3e-06\t43.9\n+2_13\t0_27\t24.00\t175\t101\t4\t386\t552\t1\t151\t4e-05\t40.4\n+2_13\t0_259\t36.08\t97\t53\t5\t513\t604\t203\t295\t3e-04\t38.1\n+2_14\t0_626\t37.26\t518\t319\t4\t75\t586\t90\t607\t4e-106\t 331\n+2_14\t0_324\t33.54\t492\t325\t1\t100\t589\t113\t604\t2e-85\t 277\n+2_14\t0_325\t27.14\t538\t348\t13\t71\t586\t75\t590\t1e-46\t 169\n+2_14\t0_627\t26.88\t506\t321\t14\t107\t589\t114\t593\t2e-40\t 150\n+2_14\t0_535\t27.65\t217\t130\t6\t371\t574\t22\t224\t5e-18\t79.7\n+2_14\t0_27\t23.74\t219\t145\t6\t371\t580\t1\t206\t2e-11\t60.1\n+2_14\t0_13\t26.12\t268\t148\t12\t337\t567\t250\t504\t3e-10\t57.4\n+2_14\t0_13\t27.10\t214\t123\t8\t371\t565\t25\t224\t2e-08\t52.0\n+2_14\t0_124\t32.41\t108\t66\t4\t343\t449\t6\t107\t6e-09\t53.1\n+2_14\t0_814\t22.12\t208\t140\t6\t368\t564\t140\t336\t1e-08\t52.0\n+2_14\t0_476\t22.94\t170\t104\t4\t361\t520\t14\t166\t7e-07\t45.8\n+2_14\t0_534\t22.27\t238\t151\t7\t371\t579\t26\t258\t1e-06\t45.4\n+2_14\t0_157\t25.75\t233\t145\t10\t352\t575\t4\t217\t3e-06\t43.5\n+2_14\t0_712\t31.15\t61\t38\t2\t352\t409\t11\t70\t8e-06\t43.1\n+2_14\t0_32\t21.79\t234\t145\t7\t368\t574\t114\t336\t8e-06\t43.5\n+2_14\t0_106\t24.66\t73\t50\t1\t367\t434\t29\t101\t9e-06\t43.5\n+2_14\t0_106\t31.82\t88\t49\t3\t489\t569\t624\t707\t8e-05\t40.0\n+2_14\t0_520\t25.47\t106\t74\t2\t482\t582\t468\t573\t4e-05\t41.2\n+2_14\t0_31\t33.33\t90\t55\t3\t489\t574\t282\t370\t2e-04\t38.9\n+2_14\t0_259\t29.51\t61\t42\t1\t352\t411\t5\t65\t3e-04\t38.1\n+2_16\t0_799\t31.02\t374\t229\t10\t6\t370\t4\t357\t1e-45\t 159\n+2_17\t0_69\t38.87\t283\t168\t3\t9\t290\t16\t294\t6e-64\t 203\n+2_18\t0_196\t35.66\t488\t300\t4\t2\t480\t3\t485\t1e-99\t 309\n+2_18\t0_383\t28.12\t128\t90\t1\t1\t126\t31\t158\t1e-09\t55.8\n+2_18\t0_383\t27.37\t95\t58\t3\t241\t329\t480\t569\t7e-04\t37.0\n+2_18\t0_134\t29.23\t130\t71\t3\t9\t118\t42\t170\t7e-09\t53.1\n+2_18\t0_134\t24.22\t322\t198\t19\t155\t451\t357\t657\t6e-08\t50.1\n+2_18\t0_213\t29.70\t165\t92\t6\t12\t161\t61\t216\t1e-06\t45.8\n+2_18\t0_213\t46.15\t39\t21\t0\t287\t325\t579\t617\t3e-06\t44.7\n+2_20\t0_77\t51.90\t289\t133\t2\t1\t287\t6\t290\t3e-101\t 297\n+2_21\t0_404\t49.59\t367\t177\t4\t2\t364\t3\t365\t6e-118\t 346\n+2_21\t0_525\t35.88\t131\t59\t2\t1\t131\t157\t262\t1e-18\t81.6\n+2_22\t0_55\t26.47\t102\t71\t3\t8\t107\t20\t'..b'396\t0.0\t 583\n+2_455\t0_496\t29.67\t246\t146\t11\t7\t247\t2\t225\t1e-17\t79.7\n+2_455\t0_754\t35.12\t168\t80\t7\t15\t177\t115\t258\t6e-17\t77.4\n+2_455\t0_620\t32.87\t143\t91\t3\t1\t141\t1\t140\t8e-13\t64.7\n+2_457\t0_451\t41.44\t292\t165\t4\t1\t288\t1\t290\t7e-63\t 199\n+2_459\t0_801\t31.88\t414\t255\t8\t4\t394\t2\t411\t3e-67\t 217\n+2_461\t0_816\t52.42\t557\t244\t7\t135\t682\t110\t654\t3e-172\t 508\n+2_461\t0_210\t27.55\t196\t116\t8\t271\t451\t109\t293\t2e-07\t48.5\n+2_461\t0_720\t25.14\t175\t85\t8\t240\t399\t127\t270\t2e-04\t38.5\n+2_461\t0_217\t34.29\t70\t38\t2\t267\t336\t41\t102\t0.001\t36.6\n+2_462\t0_406\t37.87\t169\t104\t1\t6\t173\t12\t180\t2e-41\t 135\n+2_464\t0_505\t27.50\t280\t200\t2\t5\t281\t3\t282\t2e-35\t 127\n+2_466\t0_605\t42.18\t486\t248\t9\t1\t477\t1\t462\t8e-121\t 361\n+2_467\t0_49\t34.52\t252\t150\t7\t8\t251\t20\t264\t1e-34\t 123\n+2_468\t0_58\t29.89\t261\t166\t7\t115\t372\t462\t708\t9e-22\t92.0\n+2_470\t0_56\t65.22\t46\t16\t0\t3\t48\t4\t49\t7e-15\t58.5\n+2_471\t0_814\t35.38\t277\t161\t4\t28\t301\t75\t336\t2e-51\t 172\n+2_471\t0_535\t29.85\t201\t132\t4\t108\t304\t22\t217\t2e-23\t92.4\n+2_471\t0_534\t28.27\t237\t128\t9\t101\t304\t19\t246\t8e-20\t82.8\n+2_471\t0_476\t28.57\t203\t131\t6\t105\t302\t21\t214\t1e-19\t81.3\n+2_471\t0_105\t27.98\t218\t139\t6\t102\t302\t54\t270\t6e-18\t78.6\n+2_471\t0_31\t39.77\t88\t52\t1\t216\t302\t274\t361\t9e-18\t78.6\n+2_471\t0_259\t29.17\t264\t120\t8\t104\t302\t21\t282\t2e-17\t76.3\n+2_471\t0_106\t32.00\t125\t84\t1\t181\t304\t581\t705\t2e-17\t78.2\n+2_471\t0_712\t42.00\t100\t57\t1\t203\t301\t193\t292\t2e-17\t77.4\n+2_471\t0_712\t33.64\t110\t58\t3\t82\t191\t9\t103\t9e-07\t44.7\n+2_471\t0_224\t43.00\t100\t56\t1\t203\t301\t190\t289\t4e-17\t76.3\n+2_471\t0_32\t29.68\t219\t130\t6\t104\t302\t113\t327\t7e-17\t75.9\n+2_471\t0_520\t38.53\t109\t64\t2\t203\t310\t454\t560\t7e-15\t70.1\n+2_471\t0_520\t38.89\t90\t49\t2\t101\t190\t57\t140\t5e-11\t58.5\n+2_471\t0_627\t27.06\t218\t121\t7\t105\t303\t372\t570\t1e-14\t69.3\n+2_471\t0_157\t27.88\t208\t127\t6\t104\t304\t18\t209\t2e-13\t63.9\n+2_471\t0_325\t28.64\t206\t131\t8\t104\t301\t371\t568\t8e-12\t60.8\n+2_471\t0_626\t27.27\t209\t111\t7\t115\t302\t398\t586\t9e-12\t60.5\n+2_471\t0_124\t44.26\t61\t34\t0\t223\t283\t230\t290\t1e-11\t60.1\n+2_471\t0_124\t29.91\t107\t61\t2\t104\t202\t26\t126\t7e-09\t51.2\n+2_471\t0_13\t20.38\t211\t145\t6\t107\t303\t24\t225\t5e-10\t55.1\n+2_471\t0_13\t20.92\t239\t161\t7\t90\t302\t266\t502\t6e-07\t45.4\n+2_471\t0_624\t25.70\t214\t134\t7\t104\t296\t16\t225\t6e-10\t55.1\n+2_471\t0_624\t23.01\t326\t188\t11\t1\t300\t232\t520\t5e-09\t52.0\n+2_471\t0_27\t24.00\t200\t138\t5\t108\t302\t1\t191\t2e-09\t52.8\n+2_471\t0_324\t23.11\t212\t135\t7\t104\t301\t382\t579\t7e-08\t48.5\n+2_471\t0_401\t31.71\t82\t47\t4\t224\t299\t831\t909\t6e-05\t39.3\n+2_472\t0_815\t20.87\t599\t399\t18\t723\t1304\t1640\t2180\t1e-21\t98.2\n+2_472\t0_815\t21.19\t420\t257\t12\t1337\t1728\t2292\t2665\t6e-05\t42.7\n+2_473\t0_814\t37.28\t287\t169\t5\t5\t283\t70\t353\t5e-54\t 177\n+2_473\t0_535\t31.16\t199\t128\t4\t75\t268\t22\t216\t1e-20\t84.3\n+2_473\t0_157\t29.79\t235\t132\t6\t59\t278\t6\t222\t2e-20\t83.6\n+2_473\t0_534\t31.60\t231\t118\t10\t72\t269\t23\t246\t3e-20\t83.6\n+2_473\t0_712\t31.19\t109\t74\t1\t159\t266\t184\t292\t5e-16\t72.4\n+2_473\t0_712\t31.71\t82\t44\t1\t77\t158\t34\t103\t4e-04\t36.2\n+2_473\t0_520\t40.22\t92\t55\t0\t159\t250\t445\t536\t2e-15\t70.9\n+2_473\t0_520\t37.63\t93\t50\t2\t70\t162\t59\t143\t5e-12\t60.8\n+2_473\t0_124\t37.17\t113\t61\t2\t51\t163\t10\t112\t6e-15\t69.3\n+2_473\t0_124\t36.67\t90\t56\t1\t178\t266\t220\t309\t9e-12\t60.1\n+2_473\t0_106\t35.16\t91\t58\t1\t178\t267\t613\t703\t1e-14\t68.9\n+2_473\t0_224\t25.00\t256\t123\t6\t77\t269\t36\t285\t3e-14\t67.4\n+2_473\t0_259\t26.81\t276\t132\t7\t71\t280\t21\t292\t3e-14\t66.6\n+2_473\t0_476\t24.51\t204\t132\t5\t74\t267\t23\t214\t8e-14\t64.7\n+2_473\t0_32\t27.00\t237\t147\t6\t52\t267\t96\t327\t8e-14\t66.2\n+2_473\t0_105\t24.45\t229\t142\t8\t64\t267\t48\t270\t3e-12\t61.2\n+2_473\t0_31\t33.33\t81\t53\t1\t188\t267\t281\t361\t1e-11\t59.7\n+2_473\t0_325\t29.82\t171\t105\t5\t60\t220\t360\t525\t1e-11\t59.7\n+2_473\t0_13\t22.13\t235\t158\t7\t50\t270\t4\t227\t3e-10\t55.5\n+2_473\t0_13\t25.40\t248\t143\t8\t53\t267\t264\t502\t7e-10\t54.3\n+2_473\t0_324\t25.76\t229\t141\t9\t53\t266\t365\t579\t4e-10\t55.5\n+2_473\t0_626\t24.38\t201\t127\t5\t81\t267\t397\t586\t2e-09\t52.8\n+2_473\t0_627\t26.40\t197\t111\t7\t50\t227\t351\t532\t1e-07\t47.4\n+2_473\t0_27\t28.49\t172\t108\t7\t82\t247\t8\t170\t5e-07\t45.1\n+2_473\t0_401\t32.05\t78\t45\t3\t189\t261\t831\t905\t3e-04\t37.0\n+2_473\t0_624\t22.28\t193\t136\t5\t69\t259\t333\t513\t9e-04\t35.4\n+2_474\t0_0\t27.54\t334\t229\t10\t98\t423\t117\t445\t1e-38\t 141\n+2_475\t0_652\t42.22\t45\t24\t1\t2\t46\t3\t45\t5e-05\t38.5\n+2_475\t0_472\t42.22\t45\t24\t1\t2\t46\t3\t45\t5e-05\t38.5\n+2_475\t0_294\t42.22\t45\t24\t1\t2\t46\t3\t45\t5e-05\t38.5\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast2_1.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast2_1.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1141 @@\n+2_0\t1_762\t25.45\t330\t224\t8\t36\t353\t35\t354\t5e-16\t73.9\n+2_1\t1_761\t44.75\t324\t159\t4\t1\t308\t1\t320\t5e-78\t 240\n+2_1\t1_298\t48.10\t79\t35\t2\t2\t78\t8\t82\t5e-12\t60.8\n+2_1\t1_348\t47.54\t61\t29\t1\t4\t61\t15\t75\t3e-11\t59.3\n+2_1\t1_150\t40.98\t61\t34\t1\t4\t62\t8\t68\t2e-09\t53.1\n+2_1\t1_75\t42.86\t63\t34\t1\t1\t61\t8\t70\t3e-09\t52.4\n+2_1\t1_155\t36.51\t63\t38\t1\t2\t62\t6\t68\t3e-09\t49.7\n+2_1\t1_300\t44.44\t54\t28\t1\t2\t53\t242\t295\t2e-07\t46.6\n+2_2\t1_760\t64.55\t646\t228\t1\t4\t649\t3\t647\t0.0\t 887\n+2_2\t1_439\t43.97\t639\t336\t9\t10\t642\t5\t627\t2e-178\t 521\n+2_3\t1_759\t60.34\t817\t322\t2\t9\t823\t7\t823\t0.0\t1016\n+2_3\t1_438\t37.01\t708\t431\t7\t15\t717\t1\t698\t3e-139\t 431\n+2_4\t1_758\t49.29\t420\t210\t1\t1\t417\t1\t420\t7e-142\t 411\n+2_5\t1_757\t39.68\t189\t107\t5\t1\t186\t1\t185\t9e-41\t 136\n+2_6\t1_756\t32.53\t166\t106\t4\t7\t166\t9\t174\t4e-19\t79.3\n+2_6\t1_633\t28.07\t114\t79\t2\t34\t145\t66\t178\t1e-04\t37.7\n+2_7\t1_755\t44.40\t455\t233\t7\t1\t442\t6\t453\t1e-115\t 346\n+2_7\t1_160\t40.00\t90\t51\t1\t221\t307\t179\t268\t5e-17\t77.8\n+2_7\t1_160\t32.56\t86\t58\t0\t218\t303\t2\t87\t5e-09\t52.8\n+2_7\t1_412\t30.17\t179\t97\t8\t220\t380\t7\t175\t8e-09\t51.6\n+2_7\t1_654\t33.68\t95\t54\t3\t182\t275\t83\t169\t1e-04\t38.5\n+2_8\t1_754\t42.02\t257\t147\t2\t4\t260\t6\t260\t7e-65\t 202\n+2_9\t1_409\t30.47\t128\t81\t4\t50\t171\t210\t335\t4e-12\t59.7\n+2_12\t1_750\t30.25\t281\t178\t7\t1\t266\t3\t280\t1e-38\t 134\n+2_13\t1_385\t26.02\t561\t373\t11\t68\t614\t63\t595\t1e-41\t 154\n+2_13\t1_384\t39.29\t196\t107\t2\t424\t618\t2\t186\t6e-39\t 138\n+2_13\t1_5\t25.09\t558\t367\t9\t88\t611\t86\t626\t1e-36\t 140\n+2_13\t1_4\t28.44\t327\t202\t7\t190\t509\t1\t302\t4e-25\t 102\n+2_13\t1_609\t31.17\t231\t135\t7\t365\t590\t8\t219\t2e-20\t87.8\n+2_13\t1_301\t28.91\t211\t129\t7\t383\t588\t32\t226\t9e-15\t70.9\n+2_13\t1_608\t28.93\t242\t137\t9\t383\t606\t42\t266\t7e-14\t68.2\n+2_13\t1_21\t27.00\t237\t146\t8\t343\t571\t246\t463\t3e-13\t67.0\n+2_13\t1_234\t29.30\t215\t132\t8\t383\t588\t24\t227\t1e-12\t63.2\n+2_13\t1_383\t23.43\t239\t162\t5\t114\t345\t85\t309\t4e-12\t62.8\n+2_13\t1_542\t37.36\t91\t52\t3\t515\t601\t296\t385\t5e-12\t63.2\n+2_13\t1_40\t24.36\t234\t156\t6\t366\t590\t78\t299\t1e-11\t61.6\n+2_13\t1_33\t36.78\t87\t52\t1\t506\t589\t356\t442\t2e-11\t61.2\n+2_13\t1_33\t31.91\t94\t61\t2\t383\t475\t47\t138\t7e-08\t50.1\n+2_13\t1_491\t38.55\t83\t40\t2\t514\t589\t285\t363\t7e-10\t56.2\n+2_13\t1_543\t26.34\t243\t141\t11\t380\t600\t76\t302\t2e-09\t54.3\n+2_13\t1_270\t25.00\t224\t146\t7\t372\t590\t5\t211\t3e-09\t52.8\n+2_13\t1_261\t32.14\t84\t54\t1\t513\t593\t197\t280\t4e-09\t53.5\n+2_13\t1_101\t25.00\t248\t162\t10\t365\t608\t4\t231\t5e-09\t52.4\n+2_13\t1_535\t32.26\t93\t56\t3\t514\t601\t681\t771\t4e-08\t51.2\n+2_13\t1_535\t27.88\t104\t69\t2\t351\t448\t7\t110\t3e-05\t42.0\n+2_13\t1_619\t28.97\t214\t126\t8\t385\t590\t29\t224\t8e-08\t49.7\n+2_13\t1_395\t23.56\t225\t136\t7\t377\t590\t18\t217\t7e-06\t43.1\n+2_13\t1_536\t34.18\t79\t49\t2\t515\t590\t228\t306\t4e-05\t41.2\n+2_14\t1_5\t34.31\t545\t321\t6\t78\t587\t85\t627\t7e-93\t 297\n+2_14\t1_385\t30.15\t544\t346\t7\t63\t588\t67\t594\t4e-71\t 238\n+2_14\t1_4\t34.41\t186\t106\t5\t313\t485\t121\t303\t5e-27\t 107\n+2_14\t1_609\t28.14\t231\t158\t4\t352\t579\t8\t233\t7e-21\t88.6\n+2_14\t1_384\t28.18\t181\t130\t0\t409\t589\t2\t182\t1e-17\t77.8\n+2_14\t1_619\t35.50\t200\t110\t7\t369\t556\t26\t218\t2e-17\t80.1\n+2_14\t1_619\t26.60\t282\t180\t8\t321\t575\t255\t536\t1e-11\t61.6\n+2_14\t1_40\t29.66\t236\t132\t8\t362\t576\t88\t310\t1e-15\t73.2\n+2_14\t1_21\t27.88\t208\t128\t7\t368\t564\t285\t481\t3e-15\t73.2\n+2_14\t1_270\t28.50\t200\t122\t6\t359\t548\t5\t193\t9e-15\t69.3\n+2_14\t1_608\t28.38\t222\t138\t10\t368\t573\t42\t258\t5e-10\t56.2\n+2_14\t1_101\t24.00\t225\t145\t6\t363\t575\t14\t224\t5e-10\t55.1\n+2_14\t1_301\t26.29\t213\t148\t6\t365\t573\t29\t236\t4e-09\t53.5\n+2_14\t1_234\t22.82\t241\t153\t8\t350\t569\t5\t233\t1e-08\t50.8\n+2_14\t1_33\t32.50\t80\t51\t2\t368\t446\t47\t124\t1e-07\t49.7\n+2_14\t1_33\t27.00\t100\t66\t3\t489\t582\t364\t462\t5e-04\t37.4\n+2_14\t1_535\t35.11\t94\t50\t3\t489\t575\t681\t770\t1e-07\t49.3\n+2_14\t1_395\t21.97\t223\t158\t6\t366\t582\t22\t234\t1e-07\t48.5\n+2_14\t1_293\t25.53\t235\t123\t8\t365\t569\t16\t228\t5e-07\t46.6\n+2_14\t1_261\t34.92\t63\t40\t1\t352\t414\t6\t67\t5e-07\t47.0\n+2_14\t1_261\t36.25\t80\t47\t2\t482\t561\t191\t266\t1e-04\t39.3\n+2_14\t1_383\t22.77\t202\t149\t2\t102\t298\t86\t285\t9e-07\t45.8\n+2_14\t1_543\t25.11\t227\t148\t9\t368\t575\t79\t302\t1e-06\t45.8\n+2_14\t1_536\t22.02\t277\t144\t12\t367\t573\t40\t314\t6e-06\t43.5\n+2_14\t1_491\t27.27\t99\t69\t2\t352\t449\t7\t103\t8e-06\t43.5\n+2_14\t1_491\t30.53\t95\t57\t3\t489\t580\t285\t373\t2e-04\t39.3\n+2_14\t1_415\t22.05\t195\t133\t7\t352\t545\t471\t647\t3e-05\t41.6\n+2_14\t1_542\t31.46\t89\t58\t2\t490\t575\t296\t384\t3e-05\t41.2\n+2_15\t1_735\t35.53\t833\t50'..b'\t1_559\t35.16\t128\t80\t2\t14\t139\t12\t138\t2e-12\t63.9\n+2_456\t1_584\t35.60\t250\t141\t6\t21\t257\t14\t256\t2e-32\t 117\n+2_456\t1_585\t30.65\t261\t158\t6\t8\t248\t1\t258\t1e-24\t95.5\n+2_456\t1_586\t31.98\t222\t138\t6\t18\t229\t10\t228\t7e-22\t87.4\n+2_458\t1_303\t37.14\t140\t84\t4\t19\t155\t5\t143\t2e-27\t97.8\n+2_459\t1_305\t31.96\t413\t243\t8\t9\t391\t7\t411\t9e-63\t 206\n+2_461\t1_25\t57.99\t688\t245\t8\t39\t683\t40\t726\t0.0\t 750\n+2_461\t1_551\t32.39\t71\t41\t2\t262\t332\t40\t103\t1e-05\t43.1\n+2_461\t1_715\t28.67\t150\t91\t6\t268\t412\t101\t239\t6e-05\t40.8\n+2_462\t1_24\t48.19\t166\t86\t0\t3\t168\t8\t173\t5e-56\t 173\n+2_463\t1_23\t24.85\t169\t111\t9\t1\t167\t1\t155\t8e-07\t42.0\n+2_464\t1_72\t32.81\t317\t200\t6\t5\t309\t3\t318\t3e-51\t 170\n+2_465\t1_748\t40.06\t347\t199\t4\t5\t346\t10\t352\t5e-82\t 258\n+2_466\t1_749\t49.19\t492\t237\t4\t1\t479\t1\t492\t1e-169\t 488\n+2_467\t1_9\t41.63\t257\t144\t4\t2\t255\t12\t265\t2e-63\t 198\n+2_468\t1_8\t57.70\t383\t158\t4\t5\t385\t1\t381\t3e-152\t 435\n+2_469\t1_7\t29.41\t85\t60\t0\t10\t94\t1\t85\t5e-08\t43.5\n+2_470\t1_6\t72.34\t47\t13\t0\t1\t47\t1\t47\t7e-17\t63.9\n+2_471\t1_21\t45.00\t200\t110\t0\t104\t303\t284\t483\t3e-50\t 171\n+2_471\t1_270\t36.17\t188\t110\t4\t104\t288\t16\t196\t2e-32\t 117\n+2_471\t1_234\t32.02\t203\t126\t4\t108\t300\t27\t227\t2e-24\t95.5\n+2_471\t1_609\t29.70\t202\t134\t4\t104\t302\t23\t219\t4e-22\t89.4\n+2_471\t1_40\t29.11\t213\t133\t7\t105\t304\t94\t301\t2e-20\t84.7\n+2_471\t1_301\t30.00\t200\t131\t3\t105\t300\t32\t226\t3e-20\t84.3\n+2_471\t1_543\t27.65\t217\t137\t5\t104\t302\t78\t292\t9e-18\t78.2\n+2_471\t1_535\t39.33\t89\t53\t1\t215\t302\t672\t760\t2e-17\t77.4\n+2_471\t1_542\t35.23\t88\t56\t1\t216\t302\t287\t374\t3e-17\t77.0\n+2_471\t1_261\t40.37\t109\t62\t2\t204\t311\t178\t284\t1e-16\t74.7\n+2_471\t1_261\t38.46\t91\t40\t2\t104\t191\t20\t97\t1e-09\t53.5\n+2_471\t1_536\t38.71\t93\t56\t1\t211\t302\t214\t306\t1e-16\t74.7\n+2_471\t1_33\t40.21\t97\t57\t1\t206\t301\t346\t442\t2e-16\t74.7\n+2_471\t1_33\t33.33\t90\t54\t1\t101\t190\t43\t126\t8e-09\t51.2\n+2_471\t1_101\t26.73\t202\t135\t6\t107\t304\t24\t216\t4e-16\t71.6\n+2_471\t1_491\t41.30\t92\t51\t2\t219\t309\t280\t369\t1e-15\t72.4\n+2_471\t1_491\t27.38\t84\t55\t1\t105\t188\t23\t100\t5e-06\t42.7\n+2_471\t1_619\t25.51\t196\t137\t4\t92\t282\t12\t203\t3e-14\t67.8\n+2_471\t1_619\t23.36\t214\t135\t7\t106\t297\t315\t521\t0.001\t35.4\n+2_471\t1_5\t29.60\t223\t130\t9\t92\t302\t398\t605\t4e-14\t67.8\n+2_471\t1_608\t25.11\t235\t145\t9\t91\t304\t28\t252\t2e-13\t65.1\n+2_471\t1_395\t21.03\t214\t135\t7\t104\t302\t23\t217\t9e-11\t57.0\n+2_471\t1_385\t26.76\t213\t126\t7\t105\t302\t374\t571\t2e-10\t56.6\n+2_471\t1_384\t31.00\t100\t63\t3\t204\t302\t64\t158\t7e-08\t47.0\n+2_471\t1_293\t23.56\t208\t151\t5\t104\t303\t18\t225\t2e-07\t46.6\n+2_471\t1_86\t27.50\t80\t50\t3\t223\t297\t837\t913\t4e-05\t40.0\n+2_471\t1_415\t22.58\t186\t126\t4\t104\t288\t485\t653\t8e-05\t38.9\n+2_472\t1_20\t21.92\t1104\t725\t34\t740\t1781\t328\t1356\t9e-51\t 192\n+2_473\t1_21\t42.60\t277\t155\t3\t9\t283\t224\t498\t4e-69\t 221\n+2_473\t1_270\t35.03\t197\t113\t7\t66\t257\t11\t197\t9e-28\t 104\n+2_473\t1_234\t30.29\t208\t133\t4\t72\t268\t24\t230\t8e-21\t84.7\n+2_473\t1_301\t31.82\t220\t137\t6\t72\t284\t32\t245\t1e-20\t85.1\n+2_473\t1_609\t29.21\t202\t133\t5\t71\t267\t23\t219\t1e-19\t81.6\n+2_473\t1_535\t39.60\t101\t56\t2\t180\t275\t672\t772\t8e-18\t78.6\n+2_473\t1_619\t27.02\t248\t158\t9\t46\t281\t1\t237\t1e-17\t77.4\n+2_473\t1_619\t22.66\t203\t136\t6\t75\t258\t317\t517\t1e-06\t44.3\n+2_473\t1_40\t28.87\t239\t141\t9\t44\t267\t75\t299\t9e-17\t73.9\n+2_473\t1_33\t30.67\t150\t96\t2\t125\t266\t293\t442\t5e-15\t70.1\n+2_473\t1_33\t33.70\t92\t53\t2\t70\t161\t45\t128\t2e-09\t52.8\n+2_473\t1_101\t27.00\t200\t129\t6\t75\t267\t25\t214\t5e-13\t62.4\n+2_473\t1_608\t28.71\t209\t134\t7\t73\t267\t43\t250\t8e-13\t62.8\n+2_473\t1_542\t32.10\t81\t54\t1\t188\t267\t294\t374\t1e-12\t62.8\n+2_473\t1_543\t27.57\t214\t129\t6\t76\t267\t83\t292\t3e-12\t61.2\n+2_473\t1_491\t31.78\t107\t68\t2\t161\t266\t261\t363\t2e-11\t58.9\n+2_473\t1_491\t29.91\t107\t66\t2\t53\t159\t7\t104\t7e-09\t51.2\n+2_473\t1_261\t30.69\t101\t69\t1\t167\t266\t176\t276\t1e-10\t56.2\n+2_473\t1_261\t32.97\t91\t51\t2\t69\t159\t18\t98\t3e-07\t45.8\n+2_473\t1_385\t25.12\t215\t135\t7\t67\t267\t369\t571\t2e-10\t56.2\n+2_473\t1_536\t31.71\t82\t55\t1\t187\t267\t225\t306\t3e-10\t55.5\n+2_473\t1_5\t26.76\t213\t126\t9\t71\t267\t407\t605\t7e-10\t54.3\n+2_473\t1_395\t22.33\t206\t149\t3\t67\t268\t19\t217\t6e-09\t50.8\n+2_473\t1_384\t28.30\t106\t63\t4\t165\t267\t63\t158\t2e-06\t42.4\n+2_473\t1_86\t30.38\t79\t47\t3\t188\t261\t837\t912\t3e-05\t40.0\n+2_473\t1_293\t22.05\t263\t145\t8\t58\t284\t5\t243\t3e-05\t39.3\n+2_473\t1_4\t29.91\t117\t71\t4\t42\t158\t163\t268\t4e-05\t39.3\n+2_474\t1_2\t33.14\t338\t214\t5\t100\t429\t120\t453\t4e-53\t 182\n+2_475\t1_0\t60.30\t267\t96\t3\t1\t267\t1\t257\t2e-115\t 332\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast2_2.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast2_2.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1021 @@\n+2_0\t2_0\t100.00\t380\t0\t0\t1\t380\t1\t380\t0.0\t 741\n+2_1\t2_1\t100.00\t310\t0\t0\t1\t310\t1\t310\t0.0\t 626\n+2_1\t2_199\t41.67\t60\t33\t1\t4\t61\t9\t68\t9e-09\t50.4\n+2_1\t2_16\t37.88\t66\t33\t1\t4\t61\t9\t74\t2e-08\t48.9\n+2_2\t2_2\t100.00\t650\t0\t0\t1\t650\t1\t650\t0.0\t1344\n+2_2\t2_202\t45.43\t645\t329\t9\t10\t647\t5\t633\t0.0\t 543\n+2_3\t2_3\t100.00\t836\t0\t0\t1\t836\t1\t836\t0.0\t1699\n+2_3\t2_203\t34.37\t678\t423\t10\t32\t702\t20\t682\t6e-124\t 390\n+2_4\t2_4\t100.00\t417\t0\t0\t1\t417\t1\t417\t0.0\t 851\n+2_5\t2_5\t100.00\t210\t0\t0\t1\t210\t1\t210\t1e-157\t 434\n+2_6\t2_6\t100.00\t254\t0\t0\t1\t254\t1\t254\t0.0\t 509\n+2_6\t2_426\t37.93\t58\t36\t0\t85\t142\t119\t176\t1e-04\t37.0\n+2_7\t2_7\t100.00\t442\t0\t0\t1\t442\t1\t442\t0.0\t 880\n+2_7\t2_334\t35.51\t107\t62\t2\t206\t309\t171\t273\t3e-15\t72.0\n+2_7\t2_334\t32.31\t130\t74\t4\t218\t342\t2\t122\t3e-10\t56.2\n+2_7\t2_447\t47.37\t38\t20\t0\t218\t255\t117\t154\t3e-05\t39.7\n+2_7\t2_396\t44.12\t34\t19\t0\t219\t252\t5\t38\t4e-04\t36.2\n+2_8\t2_8\t100.00\t262\t0\t0\t1\t262\t1\t262\t0.0\t 535\n+2_9\t2_9\t100.00\t218\t0\t0\t1\t218\t1\t218\t5e-159\t 438\n+2_9\t2_252\t26.90\t145\t101\t3\t62\t202\t216\t359\t3e-13\t62.4\n+2_10\t2_10\t100.00\t287\t0\t0\t1\t287\t1\t287\t0.0\t 566\n+2_10\t2_11\t25.81\t124\t90\t2\t125\t247\t140\t262\t4e-05\t38.5\n+2_11\t2_11\t100.00\t287\t0\t0\t1\t287\t1\t287\t0.0\t 582\n+2_12\t2_12\t100.00\t273\t0\t0\t1\t273\t1\t273\t0.0\t 551\n+2_13\t2_13\t100.00\t623\t0\t0\t1\t623\t1\t623\t0.0\t1249\n+2_13\t2_14\t25.71\t560\t351\t16\t79\t611\t65\t586\t6e-40\t 148\n+2_13\t2_180\t31.50\t254\t142\t8\t361\t600\t1\t236\t6e-25\t 100\n+2_13\t2_181\t30.31\t254\t152\t8\t365\t607\t17\t256\t8e-21\t88.2\n+2_13\t2_119\t34.15\t205\t116\t9\t396\t593\t36\t228\t4e-15\t72.4\n+2_13\t2_119\t22.78\t237\t150\t8\t372\t592\t328\t547\t4e-05\t40.4\n+2_13\t2_419\t28.21\t234\t148\t8\t365\t590\t83\t304\t8e-15\t70.5\n+2_13\t2_64\t28.14\t199\t119\t6\t398\t589\t267\t448\t2e-14\t69.7\n+2_13\t2_308\t26.52\t230\t145\t7\t365\t590\t2\t211\t4e-14\t67.0\n+2_13\t2_471\t27.78\t216\t100\t7\t398\t590\t120\t302\t4e-13\t64.7\n+2_13\t2_473\t25.86\t232\t145\t7\t367\t590\t55\t267\t5e-13\t64.3\n+2_13\t2_39\t37.78\t90\t45\t2\t508\t590\t342\t427\t4e-11\t59.7\n+2_13\t2_39\t27.53\t178\t94\t7\t398\t565\t38\t190\t4e-05\t40.4\n+2_13\t2_188\t32.91\t79\t50\t1\t514\t589\t368\t446\t2e-09\t54.7\n+2_13\t2_188\t24.50\t151\t97\t5\t365\t504\t8\t152\t5e-07\t46.6\n+2_13\t2_79\t37.04\t81\t46\t3\t514\t590\t685\t764\t1e-08\t52.4\n+2_13\t2_79\t32.76\t58\t34\t1\t396\t448\t43\t100\t5e-04\t37.0\n+2_13\t2_293\t23.39\t248\t175\t6\t363\t606\t5\t241\t1e-08\t50.4\n+2_13\t2_78\t37.50\t80\t47\t2\t514\t590\t209\t288\t9e-06\t42.4\n+2_14\t2_14\t100.00\t589\t0\t0\t1\t589\t1\t589\t0.0\t1197\n+2_14\t2_13\t25.04\t607\t379\t18\t27\t586\t34\t611\t3e-36\t 137\n+2_14\t2_180\t30.25\t238\t135\t8\t345\t568\t2\t222\t9e-22\t90.5\n+2_14\t2_419\t31.20\t250\t144\t7\t342\t573\t73\t312\t3e-17\t77.8\n+2_14\t2_64\t24.17\t211\t132\t6\t368\t564\t252\t448\t1e-13\t67.4\n+2_14\t2_119\t25.98\t254\t160\t10\t341\t576\t313\t556\t3e-12\t63.2\n+2_14\t2_119\t29.90\t194\t124\t7\t380\t565\t35\t224\t2e-11\t60.8\n+2_14\t2_181\t23.90\t205\t141\t6\t372\t566\t41\t240\t6e-12\t61.2\n+2_14\t2_471\t25.47\t212\t130\t8\t368\t565\t105\t302\t7e-12\t60.8\n+2_14\t2_473\t25.25\t202\t135\t5\t371\t565\t75\t267\t1e-09\t53.9\n+2_14\t2_308\t29.38\t177\t103\t6\t352\t520\t2\t164\t1e-09\t53.5\n+2_14\t2_39\t34.52\t84\t52\t2\t367\t449\t22\t103\t1e-08\t51.6\n+2_14\t2_39\t30.34\t89\t55\t3\t486\t569\t345\t431\t2e-06\t44.7\n+2_14\t2_293\t21.92\t219\t134\t6\t352\t549\t7\t209\t6e-08\t48.5\n+2_14\t2_78\t25.98\t254\t128\t10\t370\t568\t43\t291\t2e-07\t47.8\n+2_14\t2_188\t29.67\t91\t59\t3\t349\t438\t5\t91\t2e-07\t47.8\n+2_14\t2_188\t27.10\t107\t71\t3\t482\t582\t361\t466\t3e-06\t43.9\n+2_14\t2_79\t30.68\t88\t58\t2\t489\t573\t685\t772\t4e-06\t43.9\n+2_14\t2_79\t35.14\t74\t43\t3\t368\t436\t30\t103\t2e-05\t41.6\n+2_14\t2_307\t22.53\t253\t152\t10\t333\t566\t65\t292\t8e-06\t42.4\n+2_14\t2_399\t21.86\t183\t126\t4\t372\t553\t481\t647\t0.001\t35.8\n+2_15\t2_15\t100.00\t1031\t0\t0\t1\t1031\t1\t1031\t0.0\t2080\n+2_16\t2_16\t100.00\t389\t0\t0\t1\t389\t1\t389\t0.0\t 795\n+2_16\t2_199\t47.12\t104\t44\t3\t1\t103\t1\t94\t6e-21\t89.0\n+2_16\t2_199\t24.19\t186\t113\t8\t211\t388\t399\t564\t3e-04\t37.0\n+2_16\t2_1\t37.88\t66\t33\t1\t9\t74\t4\t61\t3e-08\t48.9\n+2_17\t2_17\t100.00\t308\t0\t0\t1\t308\t1\t308\t0.0\t 639\n+2_18\t2_18\t100.00\t512\t0\t0\t1\t512\t1\t512\t0.0\t1057\n+2_18\t2_351\t30.00\t140\t89\t6\t288\t424\t577\t710\t6e-08\t49.3\n+2_18\t2_351\t34.92\t63\t39\t1\t12\t74\t58\t118\t7e-06\t42.7\n+2_18\t2_338\t26.37\t201\t131\t5\t283\t478\t495\t683\t3e-07\t47.0\n+2_18\t2_338\t26.36\t129\t77\t3\t9\t119\t44\t172\t2e-04\t38.1\n+2_18\t2_270\t33.75\t80\t42\t3\t254\t329\t525\t597\t1e-06\t45.1\n+2_18\t2_270\t25.23\t107\t78\t1\t11\t115\t40\t146\t6e-06\t42.7\n+2_19\t2_19\t100.00\t145\t0\t0\t1\t145\t1\t145\t5e-104\t 293\n+2_20'..b'5\t7e-06\t41.2\n+2_447\t2_339\t32.79\t61\t40\t1\t118\t178\t22\t81\t3e-04\t35.0\n+2_448\t2_448\t100.00\t395\t0\t0\t1\t395\t1\t395\t0.0\t 783\n+2_448\t2_438\t34.36\t390\t245\t6\t10\t394\t2\t385\t4e-72\t 229\n+2_449\t2_449\t100.00\t119\t0\t0\t1\t119\t1\t119\t3e-83\t 238\n+2_450\t2_450\t100.00\t231\t0\t0\t1\t231\t1\t231\t2e-174\t 478\n+2_451\t2_451\t100.00\t95\t0\t0\t1\t95\t1\t95\t2e-67\t 196\n+2_452\t2_452\t100.00\t547\t0\t0\t1\t547\t1\t547\t0.0\t1077\n+2_453\t2_453\t100.00\t150\t0\t0\t1\t150\t1\t150\t1e-112\t 315\n+2_454\t2_454\t100.00\t290\t0\t0\t1\t290\t1\t290\t0.0\t 589\n+2_454\t2_331\t24.16\t298\t198\t9\t2\t284\t3\t287\t7e-16\t70.9\n+2_455\t2_455\t100.00\t394\t0\t0\t1\t394\t1\t394\t0.0\t 804\n+2_455\t2_137\t26.69\t266\t171\t9\t14\t273\t8\t255\t2e-17\t78.6\n+2_455\t2_88\t36.72\t128\t78\t2\t14\t139\t12\t138\t2e-13\t65.9\n+2_455\t2_142\t31.74\t167\t86\t8\t15\t176\t125\t268\t3e-09\t53.1\n+2_456\t2_456\t100.00\t261\t0\t0\t1\t261\t1\t261\t0.0\t 512\n+2_456\t2_132\t28.18\t220\t124\t7\t37\t224\t28\t245\t6e-12\t58.5\n+2_457\t2_457\t100.00\t292\t0\t0\t1\t292\t1\t292\t0.0\t 590\n+2_458\t2_458\t100.00\t155\t0\t0\t1\t155\t1\t155\t2e-113\t 317\n+2_459\t2_459\t100.00\t396\t0\t0\t1\t396\t1\t396\t0.0\t 800\n+2_460\t2_460\t100.00\t334\t0\t0\t1\t334\t1\t334\t0.0\t 671\n+2_461\t2_461\t100.00\t702\t0\t0\t1\t702\t1\t702\t0.0\t1429\n+2_461\t2_366\t28.42\t95\t54\t3\t245\t336\t19\t102\t7e-05\t39.3\n+2_461\t2_242\t27.22\t180\t102\t8\t246\t409\t357\t523\t1e-04\t39.3\n+2_462\t2_462\t100.00\t175\t0\t0\t1\t175\t1\t175\t2e-126\t 352\n+2_463\t2_463\t100.00\t169\t0\t0\t1\t169\t1\t169\t1e-124\t 347\n+2_464\t2_464\t100.00\t312\t0\t0\t1\t312\t1\t312\t0.0\t 629\n+2_465\t2_465\t100.00\t425\t0\t0\t1\t425\t1\t425\t0.0\t 876\n+2_466\t2_466\t100.00\t484\t0\t0\t1\t484\t1\t484\t0.0\t 991\n+2_467\t2_467\t100.00\t259\t0\t0\t1\t259\t1\t259\t0.0\t 519\n+2_468\t2_468\t100.00\t385\t0\t0\t1\t385\t1\t385\t0.0\t 776\n+2_469\t2_469\t100.00\t128\t0\t0\t1\t128\t1\t128\t3e-90\t 256\n+2_470\t2_470\t100.00\t48\t0\t0\t1\t48\t1\t48\t9e-30\t96.3\n+2_471\t2_471\t100.00\t311\t0\t0\t1\t311\t1\t311\t0.0\t 625\n+2_471\t2_64\t37.59\t274\t164\t3\t34\t303\t180\t450\t7e-48\t 164\n+2_471\t2_473\t36.20\t279\t160\t4\t28\t306\t11\t271\t7e-44\t 149\n+2_471\t2_181\t29.60\t223\t136\t9\t93\t302\t25\t239\t2e-22\t89.4\n+2_471\t2_79\t44.44\t90\t49\t1\t214\t302\t675\t764\t2e-21\t89.4\n+2_471\t2_307\t30.90\t233\t132\t8\t89\t307\t79\t296\t3e-21\t87.0\n+2_471\t2_419\t31.13\t212\t128\t8\t104\t302\t98\t304\t4e-20\t83.2\n+2_471\t2_293\t30.59\t219\t135\t5\t104\t310\t21\t234\t7e-20\t81.6\n+2_471\t2_180\t26.44\t208\t145\t4\t98\t302\t17\t219\t1e-19\t81.3\n+2_471\t2_39\t31.25\t144\t97\t2\t161\t303\t286\t428\t6e-17\t75.5\n+2_471\t2_39\t33.33\t114\t59\t3\t105\t207\t23\t130\t4e-11\t57.8\n+2_471\t2_188\t43.30\t97\t54\t1\t206\t301\t350\t446\t1e-16\t74.3\n+2_471\t2_188\t29.07\t86\t55\t2\t105\t190\t23\t102\t2e-05\t40.0\n+2_471\t2_78\t26.29\t251\t135\t7\t108\t308\t44\t294\t8e-16\t71.6\n+2_471\t2_119\t26.21\t206\t140\t5\t107\t304\t25\t226\t1e-15\t71.6\n+2_471\t2_119\t23.42\t222\t129\t9\t108\t303\t340\t546\t9e-07\t44.3\n+2_471\t2_14\t25.47\t212\t130\t8\t105\t302\t368\t565\t1e-11\t59.3\n+2_471\t2_308\t23.11\t212\t142\t5\t99\t302\t13\t211\t2e-11\t58.2\n+2_471\t2_13\t27.65\t217\t101\t7\t120\t303\t398\t591\t2e-11\t58.9\n+2_471\t2_399\t24.23\t194\t130\t7\t105\t298\t479\t655\t2e-04\t36.6\n+2_472\t2_472\t100.00\t1783\t0\t0\t1\t1783\t1\t1783\t0.0\t3586\n+2_472\t2_63\t22.76\t1160\t702\t41\t707\t1779\t272\t1324\t3e-36\t 144\n+2_473\t2_473\t100.00\t284\t0\t0\t1\t284\t1\t284\t0.0\t 573\n+2_473\t2_64\t46.61\t236\t120\t2\t53\t284\t233\t466\t2e-64\t 207\n+2_473\t2_471\t42.36\t203\t115\t1\t71\t271\t104\t306\t8e-49\t 162\n+2_473\t2_180\t29.61\t206\t135\t5\t67\t267\t19\t219\t4e-22\t87.8\n+2_473\t2_419\t28.03\t239\t142\t10\t44\t267\t81\t304\t6e-20\t82.4\n+2_473\t2_79\t34.78\t115\t69\t3\t167\t275\t662\t776\t6e-17\t75.1\n+2_473\t2_181\t28.42\t190\t125\t6\t87\t267\t52\t239\t2e-16\t72.0\n+2_473\t2_293\t26.85\t216\t141\t3\t71\t273\t21\t232\t3e-16\t70.9\n+2_473\t2_119\t29.38\t194\t123\t7\t87\t270\t38\t227\t6e-16\t72.0\n+2_473\t2_119\t21.33\t211\t143\t5\t75\t267\t340\t545\t1e-05\t40.8\n+2_473\t2_39\t33.01\t103\t68\t1\t166\t267\t325\t427\t5e-14\t66.2\n+2_473\t2_39\t40.00\t85\t45\t1\t75\t159\t26\t104\t5e-11\t57.4\n+2_473\t2_307\t28.68\t265\t164\t11\t20\t267\t35\t291\t6e-14\t65.5\n+2_473\t2_188\t31.78\t107\t72\t1\t161\t266\t340\t446\t2e-13\t64.7\n+2_473\t2_188\t33.33\t87\t52\t1\t73\t159\t24\t104\t2e-09\t52.4\n+2_473\t2_308\t25.73\t206\t132\t4\t71\t267\t18\t211\t3e-13\t62.8\n+2_473\t2_13\t28.12\t160\t91\t5\t87\t227\t398\t552\t3e-12\t60.8\n+2_473\t2_14\t25.74\t202\t134\t6\t75\t267\t371\t565\t3e-11\t58.2\n+2_473\t2_78\t33.33\t81\t53\t1\t188\t267\t208\t288\t2e-09\t52.0\n+2_473\t2_427\t31.58\t76\t48\t3\t189\t261\t838\t912\t2e-04\t37.0\n+2_474\t2_474\t100.00\t437\t0\t0\t1\t437\t1\t437\t0.0\t 879\n+2_475\t2_475\t100.00\t269\t0\t0\t1\t269\t1\t269\t0.0\t 541\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast2_3.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast2_3.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1096 @@\n+2_1\t3_64\t39.71\t68\t33\t1\t2\t61\t5\t72\t9e-08\t47.8\n+2_2\t3_107\t49.69\t644\t312\t6\t10\t650\t5\t639\t0.0\t 631\n+2_2\t3_29\t41.06\t643\t348\t9\t10\t642\t3\t624\t2e-166\t 491\n+2_3\t3_526\t44.68\t808\t441\t5\t20\t823\t46\t851\t0.0\t 691\n+2_3\t3_28\t33.77\t690\t446\t7\t29\t713\t17\t700\t4e-115\t 369\n+2_4\t3_244\t41.16\t413\t225\t9\t9\t411\t8\t412\t9e-94\t 287\n+2_5\t3_252\t34.18\t196\t120\t5\t5\t193\t1\t194\t1e-28\t 104\n+2_6\t3_253\t36.00\t50\t32\t0\t87\t136\t86\t135\t9e-06\t40.8\n+2_6\t3_249\t29.13\t103\t44\t3\t35\t137\t100\t173\t6e-04\t35.4\n+2_7\t3_205\t36.85\t445\t264\t10\t7\t442\t6\t442\t5e-71\t 229\n+2_7\t3_66\t43.65\t126\t62\t5\t218\t336\t171\t294\t4e-20\t87.0\n+2_7\t3_66\t27.34\t128\t84\t2\t220\t345\t5\t125\t4e-09\t52.8\n+2_7\t3_152\t33.33\t93\t56\t2\t220\t309\t9\t98\t6e-07\t45.8\n+2_8\t3_651\t31.39\t274\t154\t12\t2\t260\t152\t406\t5e-23\t92.4\n+2_9\t3_55\t30.67\t163\t98\t7\t60\t216\t211\t364\t3e-06\t42.0\n+2_13\t3_256\t32.23\t242\t142\t7\t365\t601\t2\t226\t8e-22\t91.3\n+2_13\t3_333\t28.14\t231\t143\t5\t376\t604\t10\t219\t2e-15\t74.7\n+2_13\t3_625\t28.36\t268\t165\t9\t315\t577\t283\t528\t2e-14\t71.2\n+2_13\t3_297\t29.68\t219\t131\t6\t374\t589\t7\t205\t5e-14\t69.7\n+2_13\t3_622\t28.26\t184\t112\t5\t359\t541\t328\t492\t8e-14\t68.9\n+2_13\t3_623\t28.85\t208\t125\t7\t368\t574\t338\t523\t3e-13\t67.0\n+2_13\t3_379\t28.52\t256\t153\t9\t365\t613\t2\t234\t6e-13\t66.6\n+2_13\t3_19\t28.57\t210\t125\t5\t398\t603\t32\t220\t3e-12\t64.3\n+2_13\t3_307\t27.75\t209\t123\t6\t386\t589\t20\t205\t7e-12\t62.8\n+2_13\t3_541\t36.36\t88\t53\t1\t514\t598\t232\t319\t1e-11\t61.6\n+2_13\t3_541\t30.56\t72\t47\t2\t398\t468\t41\t110\t6e-04\t37.0\n+2_13\t3_17\t26.53\t245\t151\t7\t383\t619\t17\t240\t1e-11\t62.0\n+2_13\t3_18\t29.00\t200\t119\t5\t392\t589\t26\t204\t2e-11\t61.2\n+2_13\t3_210\t29.46\t241\t131\t10\t349\t568\t109\t331\t6e-11\t59.7\n+2_13\t3_226\t27.24\t257\t128\t12\t390\t607\t3\t239\t9e-11\t58.9\n+2_13\t3_226\t26.22\t267\t137\t12\t363\t600\t241\t476\t4e-07\t47.4\n+2_13\t3_357\t27.57\t243\t138\t11\t364\t588\t9\t231\t1e-10\t57.0\n+2_13\t3_211\t38.04\t92\t52\t3\t514\t601\t281\t371\t2e-10\t58.2\n+2_13\t3_211\t29.13\t103\t63\t4\t363\t459\t42\t140\t1e-04\t39.7\n+2_13\t3_257\t27.73\t220\t123\t8\t397\t595\t37\t241\t4e-10\t56.2\n+2_13\t3_375\t28.71\t101\t61\t2\t508\t601\t112\t208\t2e-09\t54.3\n+2_13\t3_626\t27.45\t204\t127\t7\t385\t585\t353\t538\t3e-09\t54.3\n+2_13\t3_365\t33.33\t99\t57\t2\t514\t609\t508\t600\t5e-09\t53.5\n+2_13\t3_365\t26.67\t135\t93\t3\t359\t492\t33\t162\t2e-07\t48.5\n+2_13\t3_306\t24.26\t235\t146\t8\t385\t607\t19\t233\t2e-08\t52.0\n+2_13\t3_445\t25.25\t198\t124\t6\t400\t590\t97\t277\t2e-08\t50.8\n+2_13\t3_206\t25.56\t270\t163\t10\t365\t614\t2\t253\t2e-08\t51.6\n+2_13\t3_494\t34.52\t84\t44\t3\t514\t590\t617\t696\t3e-08\t51.6\n+2_13\t3_495\t26.77\t254\t157\t11\t353\t590\t1\t241\t1e-07\t48.9\n+2_13\t3_508\t27.57\t272\t157\t13\t341\t591\t239\t491\t2e-07\t48.5\n+2_13\t3_508\t23.18\t233\t156\t10\t383\t606\t22\t240\t2e-04\t38.9\n+2_13\t3_462\t30.70\t114\t71\t4\t507\t614\t102\t213\t5e-07\t45.8\n+2_13\t3_281\t29.89\t87\t60\t1\t505\t590\t13\t99\t5e-05\t40.8\n+2_13\t3_298\t22.07\t222\t127\t7\t411\t609\t3\t201\t1e-04\t39.7\n+2_13\t3_605\t31.11\t45\t31\t0\t386\t430\t26\t70\t5e-04\t37.4\n+2_14\t3_333\t30.70\t228\t140\t9\t352\t575\t2\t215\t9e-19\t85.1\n+2_14\t3_622\t26.64\t229\t143\t6\t326\t547\t312\t522\t1e-17\t81.3\n+2_14\t3_297\t29.85\t201\t129\t4\t368\t566\t17\t207\t4e-17\t79.3\n+2_14\t3_256\t26.79\t224\t153\t4\t352\t569\t2\t220\t1e-16\t75.1\n+2_14\t3_17\t30.21\t192\t116\t4\t364\t551\t13\t190\t8e-16\t75.5\n+2_14\t3_18\t29.66\t236\t138\t8\t364\t588\t13\t231\t2e-15\t74.3\n+2_14\t3_19\t30.93\t194\t110\t6\t365\t551\t14\t190\t4e-15\t73.2\n+2_14\t3_623\t28.51\t221\t139\t8\t333\t548\t316\t522\t1e-14\t71.6\n+2_14\t3_626\t28.10\t210\t136\t7\t343\t547\t324\t523\t3e-14\t70.5\n+2_14\t3_445\t27.64\t246\t141\t10\t339\t564\t48\t276\t5e-14\t68.2\n+2_14\t3_625\t24.54\t216\t148\t6\t336\t547\t318\t522\t9e-14\t68.6\n+2_14\t3_508\t30.14\t219\t131\t10\t367\t572\t21\t230\t2e-13\t67.8\n+2_14\t3_508\t24.85\t169\t103\t7\t372\t524\t287\t447\t4e-05\t40.8\n+2_14\t3_307\t26.39\t216\t148\t5\t352\t566\t2\t207\t8e-13\t65.9\n+2_14\t3_379\t23.98\t221\t142\t7\t368\t577\t17\t222\t5e-11\t60.1\n+2_14\t3_226\t27.60\t221\t118\t11\t371\t566\t1\t204\t3e-10\t57.4\n+2_14\t3_226\t31.87\t91\t60\t2\t489\t577\t383\t473\t3e-04\t37.7\n+2_14\t3_306\t28.04\t189\t109\t6\t370\t549\t19\t189\t4e-10\t57.4\n+2_14\t3_495\t26.64\t229\t136\t12\t368\t573\t30\t249\t1e-09\t55.1\n+2_14\t3_541\t35.63\t87\t53\t2\t364\t449\t22\t106\t1e-09\t55.1\n+2_14\t3_281\t41.10\t73\t39\t1\t479\t551\t16\t84\t2e-09\t55.1\n+2_14\t3_462\t25.63\t238\t120\t10\t375\t587\t6\t211\t2e-08\t49.7\n+2_14\t3_357\t25.68\t222\t132\t8\t363\t563\t22\t231\t3e-08\t50.1\n+2_14\t3_257\t23.62\t254\t163\t9\t352\t579\t3\t251\t7e-08\t49.3\n+2_14\t3_206\t23.47\t196\t108\t7\t364\t529\t13\t196\t2e-07\t48.5\n'..b'69\t3_672\t25.23\t111\t77\t3\t10\t117\t1\t108\t2e-04\t33.5\n+2_470\t3_673\t65.96\t47\t16\t0\t1\t47\t1\t47\t7e-16\t61.2\n+2_471\t3_445\t39.50\t200\t121\t0\t104\t303\t79\t278\t3e-53\t 174\n+2_471\t3_357\t27.85\t219\t149\t3\t91\t300\t13\t231\t3e-25\t97.8\n+2_471\t3_333\t35.50\t200\t104\t5\t103\t294\t15\t197\t9e-25\t 100\n+2_471\t3_17\t37.56\t197\t106\t6\t104\t296\t16\t199\t1e-24\t99.8\n+2_471\t3_307\t35.47\t203\t113\t6\t104\t301\t16\t205\t2e-24\t99.0\n+2_471\t3_19\t36.55\t197\t110\t5\t103\t296\t15\t199\t1e-23\t96.7\n+2_471\t3_297\t34.00\t200\t120\t5\t104\t301\t16\t205\t5e-23\t94.4\n+2_471\t3_306\t31.98\t197\t122\t5\t104\t298\t16\t202\t9e-23\t94.4\n+2_471\t3_257\t29.69\t229\t140\t7\t93\t302\t11\t237\t1e-21\t87.8\n+2_471\t3_18\t35.15\t202\t114\t6\t104\t301\t16\t204\t3e-21\t89.7\n+2_471\t3_256\t29.56\t203\t136\t4\t104\t303\t19\t217\t7e-20\t82.4\n+2_471\t3_494\t43.68\t87\t48\t1\t218\t303\t611\t697\t8e-20\t84.7\n+2_471\t3_379\t29.53\t193\t124\t5\t104\t294\t16\t198\t4e-19\t82.8\n+2_471\t3_495\t25.44\t228\t136\t6\t99\t302\t24\t241\t2e-18\t79.7\n+2_471\t3_375\t40.19\t107\t63\t1\t197\t302\t91\t197\t4e-18\t77.8\n+2_471\t3_211\t39.77\t88\t52\t1\t216\t302\t273\t360\t1e-17\t78.2\n+2_471\t3_211\t27.18\t103\t68\t3\t104\t201\t62\t162\t2e-04\t37.4\n+2_471\t3_210\t27.65\t217\t137\t6\t104\t302\t143\t357\t1e-17\t78.2\n+2_471\t3_298\t34.33\t134\t84\t3\t172\t303\t33\t164\t7e-16\t73.2\n+2_471\t3_365\t42.11\t95\t54\t1\t208\t301\t492\t586\t3e-14\t68.2\n+2_471\t3_365\t37.23\t94\t53\t2\t108\t201\t57\t144\t1e-10\t57.0\n+2_471\t3_541\t39.02\t82\t49\t1\t223\t303\t231\t312\t8e-13\t63.2\n+2_471\t3_541\t31.87\t91\t56\t1\t104\t194\t25\t109\t3e-09\t52.4\n+2_471\t3_508\t25.00\t212\t137\t7\t105\t303\t22\t224\t1e-11\t60.1\n+2_471\t3_508\t29.03\t217\t135\t9\t104\t306\t282\t493\t1e-10\t57.0\n+2_471\t3_281\t42.42\t66\t36\t1\t223\t288\t21\t84\t3e-11\t58.9\n+2_471\t3_226\t25.20\t246\t141\t10\t89\t311\t244\t469\t3e-11\t58.5\n+2_471\t3_226\t23.91\t184\t129\t4\t108\t282\t1\t182\t4e-10\t55.1\n+2_471\t3_462\t26.73\t202\t123\t10\t110\t301\t4\t190\t4e-11\t56.6\n+2_471\t3_206\t24.09\t220\t142\t6\t103\t301\t15\t230\t1e-09\t53.5\n+2_471\t3_206\t31.71\t82\t51\t2\t225\t305\t449\t526\t5e-07\t45.4\n+2_471\t3_605\t23.56\t208\t139\t5\t108\t304\t26\t224\t3e-07\t46.2\n+2_471\t3_605\t26.48\t219\t127\t10\t107\t301\t276\t484\t7e-05\t38.9\n+2_471\t3_156\t26.92\t156\t84\t6\t120\t260\t499\t639\t5e-07\t45.4\n+2_471\t3_90\t31.17\t77\t49\t2\t224\t297\t834\t909\t1e-06\t44.7\n+2_471\t3_626\t25.41\t185\t119\t7\t104\t282\t350\t521\t3e-06\t43.1\n+2_471\t3_623\t23.68\t190\t121\t6\t104\t285\t349\t522\t4e-06\t42.7\n+2_472\t3_446\t23.25\t400\t284\t7\t785\t1176\t1670\t2054\t9e-19\t88.2\n+2_473\t3_445\t35.47\t265\t166\t3\t6\t266\t13\t276\t6e-45\t 152\n+2_473\t3_307\t32.41\t216\t118\t6\t62\t266\t7\t205\t6e-22\t90.9\n+2_473\t3_256\t29.00\t231\t151\t6\t53\t278\t2\t224\t1e-21\t87.4\n+2_473\t3_357\t29.38\t211\t128\t8\t71\t265\t26\t231\t2e-21\t86.3\n+2_473\t3_297\t27.43\t226\t136\t5\t62\t276\t7\t215\t3e-20\t85.5\n+2_473\t3_17\t32.02\t228\t140\t7\t59\t282\t4\t220\t4e-20\t85.5\n+2_473\t3_257\t30.28\t218\t131\t5\t72\t269\t23\t239\t5e-20\t82.8\n+2_473\t3_333\t31.03\t203\t121\t6\t59\t257\t4\t191\t4e-19\t82.4\n+2_473\t3_226\t29.27\t205\t131\t5\t75\t267\t1\t203\t2e-18\t79.3\n+2_473\t3_226\t24.19\t215\t136\t7\t72\t266\t253\t460\t1e-13\t65.5\n+2_473\t3_19\t31.94\t216\t126\t8\t71\t279\t16\t217\t3e-18\t79.7\n+2_473\t3_306\t29.15\t199\t125\t5\t62\t257\t7\t192\t7e-18\t78.6\n+2_473\t3_494\t37.36\t91\t56\t1\t178\t267\t606\t696\t1e-17\t77.8\n+2_473\t3_18\t32.12\t193\t114\t7\t68\t257\t13\t191\t7e-17\t75.5\n+2_473\t3_379\t27.31\t227\t141\t8\t59\t281\t4\t210\t8e-17\t75.1\n+2_473\t3_365\t34.86\t109\t70\t1\t159\t266\t478\t586\t2e-14\t67.8\n+2_473\t3_365\t36.63\t101\t58\t1\t59\t159\t41\t135\t2e-13\t65.1\n+2_473\t3_541\t32.08\t106\t71\t1\t162\t266\t205\t310\t3e-14\t67.0\n+2_473\t3_541\t37.07\t116\t65\t3\t71\t185\t25\t133\t7e-12\t60.1\n+2_473\t3_211\t38.27\t81\t49\t1\t188\t267\t280\t360\t5e-14\t66.6\n+2_473\t3_375\t30.33\t122\t80\t2\t162\t278\t91\t212\t9e-14\t65.1\n+2_473\t3_495\t27.10\t214\t138\t8\t71\t267\t29\t241\t2e-13\t64.3\n+2_473\t3_508\t30.00\t220\t128\t8\t66\t266\t277\t489\t2e-12\t62.0\n+2_473\t3_508\t27.01\t211\t142\t8\t79\t280\t28\t235\t3e-11\t58.5\n+2_473\t3_298\t29.03\t186\t108\t8\t98\t279\t1\t166\t5e-11\t57.8\n+2_473\t3_623\t27.27\t198\t128\t7\t71\t262\t349\t536\t5e-10\t54.7\n+2_473\t3_281\t40.51\t79\t42\t2\t179\t257\t12\t85\t7e-10\t54.3\n+2_473\t3_210\t32.93\t82\t54\t1\t187\t267\t276\t357\t3e-09\t52.0\n+2_473\t3_206\t22.71\t207\t145\t5\t64\t267\t329\t523\t1e-07\t47.4\n+2_473\t3_626\t24.34\t189\t124\t7\t66\t247\t345\t521\t3e-07\t46.2\n+2_473\t3_90\t35.44\t79\t41\t4\t189\t261\t834\t908\t3e-06\t43.1\n+2_473\t3_625\t29.10\t189\t111\t8\t68\t247\t346\t520\t4e-06\t42.4\n+2_473\t3_462\t22.70\t185\t132\t5\t86\t266\t13\t190\t1e-04\t37.4\n+2_474\t3_0\t27.91\t326\t215\t8\t105\t418\t116\t433\t8e-32\t 121\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast3_0.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast3_0.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1500 @@\n+3_0\t0_0\t33.33\t441\t268\t11\t8\t434\t13\t441\t2e-63\t 211\n+3_1\t0_1\t27.34\t384\t248\t12\t1\t373\t1\t364\t6e-30\t 114\n+3_2\t0_166\t61.44\t599\t230\t1\t12\t609\t5\t603\t0.0\t 749\n+3_2\t0_144\t29.13\t127\t88\t2\t292\t417\t248\t373\t3e-10\t57.4\n+3_3\t0_167\t38.16\t152\t85\t4\t2\t149\t3\t149\t4e-23\t86.7\n+3_4\t0_437\t41.72\t326\t172\t6\t1\t317\t1\t317\t2e-84\t 257\n+3_4\t0_438\t37.58\t314\t189\t3\t13\t325\t13\t320\t4e-66\t 209\n+3_5\t0_438\t49.19\t307\t156\t0\t12\t318\t12\t318\t1e-107\t 317\n+3_5\t0_437\t42.04\t314\t179\t3\t7\t318\t7\t319\t1e-78\t 242\n+3_5\t0_229\t22.64\t318\t219\t9\t1\t297\t329\t640\t4e-10\t55.5\n+3_7\t0_194\t55.01\t349\t134\t3\t1\t327\t1\t348\t8e-126\t 364\n+3_7\t0_609\t34.54\t194\t114\t4\t125\t314\t101\t285\t3e-25\t 100\n+3_8\t0_736\t42.68\t560\t305\t7\t1\t553\t1\t551\t3e-146\t 437\n+3_8\t0_782\t23.21\t504\t363\t11\t1\t493\t1\t491\t5e-34\t 132\n+3_8\t0_515\t24.78\t113\t80\t1\t565\t672\t1\t113\t2e-09\t52.0\n+3_8\t0_809\t35.00\t80\t45\t3\t584\t663\t24\t96\t1e-06\t43.5\n+3_9\t0_587\t39.31\t318\t188\t5\t12\t327\t17\t331\t8e-75\t 233\n+3_10\t0_586\t32.17\t115\t69\t3\t132\t238\t178\t291\t6e-12\t59.7\n+3_11\t0_503\t43.27\t513\t280\t7\t25\t530\t27\t535\t3e-142\t 421\n+3_12\t0_76\t36.14\t83\t47\t2\t1\t77\t1\t83\t1e-10\t49.7\n+3_13\t0_77\t57.04\t284\t122\t0\t3\t286\t7\t290\t8e-111\t 322\n+3_14\t0_789\t42.51\t287\t155\t5\t1\t280\t1\t284\t5e-70\t 217\n+3_14\t0_730\t25.43\t232\t152\t7\t46\t259\t44\t272\t6e-14\t65.9\n+3_17\t0_814\t31.94\t216\t126\t9\t1\t199\t120\t331\t2e-23\t98.2\n+3_17\t0_157\t32.08\t212\t128\t6\t1\t204\t3\t206\t2e-15\t72.4\n+3_17\t0_325\t30.73\t192\t120\t5\t2\t181\t357\t547\t3e-14\t71.2\n+3_17\t0_259\t39.62\t106\t60\t2\t124\t228\t200\t302\t3e-14\t69.3\n+3_17\t0_534\t26.58\t222\t128\t6\t17\t204\t23\t243\t3e-14\t69.3\n+3_17\t0_324\t27.48\t222\t141\t6\t13\t217\t379\t597\t5e-14\t70.1\n+3_17\t0_624\t25.33\t225\t114\t5\t1\t185\t1\t211\t2e-13\t68.2\n+3_17\t0_535\t27.96\t186\t121\t6\t17\t191\t19\t202\t3e-12\t62.8\n+3_17\t0_627\t27.41\t197\t122\t5\t2\t181\t354\t546\t7e-12\t63.5\n+3_17\t0_626\t29.76\t205\t121\t8\t27\t217\t398\t593\t2e-11\t62.0\n+3_17\t0_124\t37.96\t108\t60\t3\t1\t102\t11\t117\t9e-11\t59.7\n+3_17\t0_124\t29.89\t87\t57\t2\t122\t205\t225\t310\t2e-04\t39.3\n+3_17\t0_13\t23.50\t217\t152\t4\t2\t204\t7\t223\t1e-10\t59.3\n+3_17\t0_13\t24.79\t242\t125\t9\t1\t196\t263\t493\t1e-04\t40.0\n+3_17\t0_476\t29.38\t194\t124\t6\t20\t204\t24\t213\t1e-10\t57.0\n+3_17\t0_520\t35.80\t81\t50\t1\t121\t199\t468\t548\t1e-09\t56.2\n+3_17\t0_520\t31.58\t95\t58\t2\t2\t91\t46\t138\t5e-07\t47.8\n+3_17\t0_712\t37.80\t82\t49\t1\t121\t200\t207\t288\t3e-09\t54.7\n+3_17\t0_712\t36.84\t76\t39\t2\t22\t94\t34\t103\t4e-05\t41.2\n+3_17\t0_32\t28.38\t229\t127\t9\t5\t198\t102\t328\t5e-09\t53.9\n+3_17\t0_27\t25.86\t174\t112\t6\t33\t195\t14\t181\t1e-07\t49.3\n+3_17\t0_106\t30.17\t116\t77\t2\t90\t201\t586\t701\t1e-07\t49.7\n+3_17\t0_224\t38.16\t76\t43\t2\t125\t197\t208\t282\t2e-07\t48.9\n+3_17\t0_31\t33.33\t81\t50\t2\t127\t204\t281\t360\t8e-07\t47.0\n+3_17\t0_401\t34.48\t87\t52\t3\t120\t202\t823\t908\t3e-05\t42.4\n+3_17\t0_105\t34.72\t72\t43\t2\t128\t196\t191\t261\t4e-05\t41.6\n+3_18\t0_814\t31.16\t199\t116\t6\t16\t199\t139\t331\t4e-22\t93.6\n+3_18\t0_325\t30.99\t213\t130\t7\t6\t205\t361\t569\t2e-16\t77.8\n+3_18\t0_324\t30.43\t207\t129\t7\t11\t205\t377\t580\t2e-14\t71.2\n+3_18\t0_624\t27.98\t193\t99\t3\t1\t159\t1\t187\t2e-13\t68.6\n+3_18\t0_627\t29.65\t226\t136\t9\t20\t228\t375\t594\t5e-13\t67.0\n+3_18\t0_157\t30.29\t208\t123\t6\t1\t197\t3\t199\t5e-13\t64.7\n+3_18\t0_259\t41.46\t82\t47\t1\t124\t204\t200\t281\t7e-13\t65.1\n+3_18\t0_626\t31.07\t206\t116\t9\t10\t197\t381\t578\t8e-13\t66.6\n+3_18\t0_535\t28.86\t201\t130\t6\t1\t189\t1\t200\t5e-12\t62.0\n+3_18\t0_712\t34.88\t129\t81\t2\t79\t205\t166\t293\t3e-11\t60.8\n+3_18\t0_712\t35.53\t76\t40\t2\t22\t94\t34\t103\t1e-05\t43.1\n+3_18\t0_534\t23.75\t261\t145\t9\t20\t231\t26\t281\t3e-11\t60.1\n+3_18\t0_476\t27.10\t214\t142\t7\t1\t204\t4\t213\t2e-10\t57.0\n+3_18\t0_27\t26.82\t179\t104\t6\t33\t195\t14\t181\t3e-09\t53.5\n+3_18\t0_124\t30.60\t134\t81\t3\t1\t123\t11\t143\t2e-08\t52.4\n+3_18\t0_124\t26.98\t126\t86\t4\t90\t212\t195\t317\t6e-04\t37.7\n+3_18\t0_13\t24.48\t192\t121\t5\t32\t204\t37\t223\t6e-08\t50.8\n+3_18\t0_520\t29.29\t99\t64\t2\t109\t205\t460\t554\t3e-07\t48.9\n+3_18\t0_520\t34.25\t73\t41\t2\t24\t91\t68\t138\t1e-04\t39.7\n+3_18\t0_224\t31.25\t112\t69\t3\t96\t205\t185\t290\t4e-07\t47.8\n+3_18\t0_32\t27.32\t205\t125\t7\t8\t189\t106\t309\t6e-07\t47.4\n+3_18\t0_106\t35.06\t77\t46\t2\t127\t199\t623\t699\t5e-05\t41.2\n+3_18\t0_31\t31.11\t90\t57\t3\t127\t213\t281\t368\t1e-04\t40.0\n+3_18\t0_401\t36.90\t84\t48\t3\t120\t199\t823\t905\t2e-04\t39.7\n+3_18\t0_105\t34.72\t72\t43\t2\t128\t196\t191\t261\t3e-04\t38.5\n+3_19\t0_814\t34.52\t197\t112\t8\t16\t199\t139\t331\t3e-23\t97.1\n+3_19\t0_624\t27.20\t239\t120\t5\t1\t199\t1\t225\t2e-16\t77.8\n+3_19\t0_624\t28.24\t85\t59\t1\t118\t'..b'6\t3e-06\t44.7\n+3_625\t0_814\t29.44\t231\t119\t12\t307\t521\t116\t318\t4e-06\t43.9\n+3_625\t0_13\t25.95\t185\t117\t9\t363\t532\t35\t214\t4e-04\t37.7\n+3_625\t0_259\t30.16\t126\t67\t4\t332\t447\t3\t117\t7e-04\t36.6\n+3_625\t0_31\t32.67\t101\t57\t5\t334\t424\t38\t137\t8e-04\t36.6\n+3_626\t0_324\t25.70\t502\t335\t21\t44\t525\t81\t564\t3e-20\t89.4\n+3_626\t0_535\t31.18\t186\t118\t6\t354\t531\t22\t205\t1e-17\t78.2\n+3_626\t0_157\t32.34\t201\t117\t7\t333\t525\t1\t190\t2e-14\t68.2\n+3_626\t0_476\t31.35\t185\t108\t6\t353\t527\t23\t198\t3e-12\t61.6\n+3_626\t0_624\t26.61\t218\t127\t7\t335\t524\t1\t213\t3e-11\t60.5\n+3_626\t0_627\t26.90\t197\t131\t5\t336\t521\t354\t548\t2e-10\t58.2\n+3_626\t0_325\t23.61\t432\t288\t14\t122\t538\t160\t564\t3e-10\t57.4\n+3_626\t0_13\t28.57\t203\t121\t8\t352\t537\t23\t218\t2e-08\t51.6\n+3_626\t0_13\t33.33\t75\t48\t2\t335\t408\t263\t336\t4e-04\t37.7\n+3_626\t0_27\t30.73\t192\t98\t8\t354\t527\t1\t175\t3e-08\t50.1\n+3_626\t0_626\t23.24\t185\t126\t5\t353\t525\t390\t570\t4e-08\t50.4\n+3_626\t0_814\t24.34\t189\t121\t6\t348\t522\t138\t318\t7e-08\t49.3\n+3_626\t0_124\t33.80\t71\t46\t1\t335\t405\t11\t80\t2e-06\t45.1\n+3_626\t0_124\t33.33\t117\t67\t4\t413\t525\t184\t293\t5e-05\t40.4\n+3_626\t0_106\t35.59\t59\t35\t1\t466\t521\t624\t682\t2e-06\t45.1\n+3_626\t0_520\t33.33\t75\t46\t2\t466\t537\t475\t548\t1e-05\t42.4\n+3_626\t0_712\t29.89\t87\t53\t2\t438\t521\t191\t272\t4e-05\t40.8\n+3_627\t0_326\t39.89\t559\t288\t13\t60\t600\t117\t645\t2e-117\t 362\n+3_627\t0_310\t30.49\t82\t47\t4\t127\t202\t361\t438\t2e-04\t38.9\n+3_628\t0_619\t38.34\t712\t370\t22\t1\t689\t1\t666\t4e-149\t 449\n+3_629\t0_792\t27.69\t195\t134\t4\t20\t210\t19\t210\t4e-20\t82.0\n+3_630\t0_791\t40.57\t244\t141\t2\t2\t245\t9\t248\t3e-60\t 189\n+3_631\t0_790\t47.12\t191\t98\t3\t1\t191\t1\t188\t1e-59\t 184\n+3_632\t0_686\t24.92\t317\t210\t8\t452\t743\t416\t729\t1e-25\t 108\n+3_633\t0_686\t26.32\t95\t52\t2\t24\t106\t806\t894\t2e-07\t44.3\n+3_634\t0_337\t51.70\t323\t140\t7\t1\t320\t1\t310\t3e-107\t 315\n+3_635\t0_42\t44.62\t195\t91\t6\t1\t182\t1\t191\t2e-46\t 150\n+3_636\t0_41\t32.73\t55\t37\t0\t18\t72\t19\t73\t3e-08\t42.4\n+3_638\t0_38\t47.32\t224\t115\t2\t4\t224\t5\t228\t2e-68\t 209\n+3_638\t0_85\t28.80\t191\t109\t7\t42\t222\t63\t236\t8e-18\t74.7\n+3_639\t0_37\t41.67\t408\t221\t6\t11\t401\t2\t409\t8e-98\t 297\n+3_640\t0_403\t37.50\t72\t41\t1\t148\t215\t181\t252\t1e-08\t49.3\n+3_641\t0_232\t35.01\t397\t241\t6\t1\t381\t1\t396\t6e-55\t 186\n+3_642\t0_231\t35.32\t470\t260\t10\t4\t442\t14\t470\t3e-72\t 234\n+3_643\t0_230\t41.78\t146\t80\t1\t1\t141\t1\t146\t3e-25\t92.0\n+3_644\t0_229\t33.83\t668\t404\t16\t15\t665\t20\t666\t6e-98\t 313\n+3_644\t0_437\t23.85\t239\t137\t10\t322\t554\t6\t205\t6e-04\t37.4\n+3_645\t0_383\t32.34\t835\t456\t28\t3\t788\t5\t779\t4e-110\t 352\n+3_645\t0_213\t24.93\t349\t180\t13\t396\t700\t449\t759\t3e-20\t90.5\n+3_645\t0_213\t29.73\t148\t90\t3\t35\t169\t57\t203\t4e-09\t54.7\n+3_645\t0_134\t20.78\t818\t411\t29\t5\t725\t15\t692\t1e-17\t82.4\n+3_645\t0_196\t29.36\t109\t75\t1\t29\t137\t2\t108\t9e-08\t50.1\n+3_645\t0_196\t30.69\t101\t61\t3\t513\t612\t263\t355\t7e-05\t40.8\n+3_645\t0_37\t24.32\t185\t124\t5\t511\t693\t198\t368\t0.001\t37.0\n+3_646\t0_400\t53.12\t657\t299\t4\t10\t658\t4\t659\t0.0\t 724\n+3_647\t0_445\t41.72\t151\t86\t2\t136\t286\t3\t151\t5e-38\t 129\n+3_648\t0_449\t67.72\t127\t41\t0\t6\t132\t9\t135\t3e-52\t 160\n+3_649\t0_448\t65.28\t144\t50\t0\t1\t144\t1\t144\t2e-70\t 207\n+3_650\t0_49\t41.87\t246\t140\t2\t3\t246\t15\t259\t9e-53\t 171\n+3_651\t0_50\t29.34\t259\t170\t5\t152\t408\t4\t251\t2e-41\t 144\n+3_652\t0_179\t53.27\t321\t149\t1\t8\t328\t5\t324\t2e-120\t 349\n+3_653\t0_178\t38.81\t134\t77\t4\t18\t147\t19\t151\t1e-18\t76.3\n+3_654\t0_644\t29.52\t332\t179\t11\t39\t349\t88\t385\t2e-25\t 107\n+3_655\t0_431\t43.86\t1010\t499\t17\t1\t974\t1\t978\t0.0\t 757\n+3_656\t0_191\t70.00\t50\t15\t0\t1\t50\t1\t50\t2e-21\t75.9\n+3_656\t0_40\t48.00\t50\t25\t1\t1\t50\t1\t49\t3e-09\t43.9\n+3_657\t0_117\t53.31\t347\t158\t2\t1\t343\t1\t347\t6e-129\t 372\n+3_657\t0_541\t27.88\t208\t128\t4\t122\t314\t4\t204\t3e-18\t78.2\n+3_664\t0_407\t39.61\t154\t91\t2\t6\t157\t6\t159\t1e-31\t 109\n+3_666\t0_760\t34.69\t320\t194\t6\t2\t315\t19\t329\t4e-40\t 141\n+3_666\t0_481\t31.88\t69\t36\t2\t51\t117\t88\t147\t6e-04\t35.8\n+3_668\t0_134\t49.63\t816\t406\t4\t11\t822\t14\t828\t0.0\t 804\n+3_668\t0_213\t23.97\t701\t436\t15\t16\t633\t32\t718\t3e-46\t 173\n+3_668\t0_383\t29.86\t211\t118\t6\t1\t199\t1\t193\t4e-16\t77.8\n+3_668\t0_383\t21.64\t402\t250\t15\t394\t746\t379\t764\t6e-14\t70.5\n+3_668\t0_196\t40.68\t59\t35\t0\t497\t555\t292\t350\t1e-06\t47.0\n+3_668\t0_196\t26.81\t138\t83\t4\t31\t168\t2\t121\t7e-06\t43.9\n+3_671\t0_58\t35.85\t463\t240\t12\t185\t607\t269\t714\t1e-66\t 228\n+3_671\t0_58\t41.25\t80\t46\t1\t4\t82\t2\t81\t4e-13\t67.4\n+3_672\t0_57\t44.55\t110\t58\t1\t1\t110\t1\t107\t7e-24\t85.9\n+3_673\t0_56\t79.55\t44\t9\t0\t3\t46\t4\t47\t3e-20\t72.8\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast3_1.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast3_1.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1460 @@\n+3_0\t1_2\t26.35\t334\t218\t9\t115\t434\t124\t443\t3e-30\t 117\n+3_1\t1_762\t23.73\t354\t210\t16\t23\t345\t24\t348\t1e-05\t42.0\n+3_2\t1_676\t47.27\t605\t308\t3\t15\t609\t5\t608\t0.0\t 530\n+3_4\t1_36\t38.11\t328\t189\t6\t1\t323\t1\t319\t1e-69\t 218\n+3_4\t1_521\t33.11\t305\t189\t8\t6\t303\t8\t304\t2e-41\t 144\n+3_5\t1_36\t48.43\t318\t161\t2\t6\t321\t6\t322\t3e-105\t 310\n+3_5\t1_521\t31.58\t304\t194\t6\t13\t309\t15\t311\t1e-35\t 129\n+3_7\t1_173\t47.52\t322\t162\t2\t11\t332\t30\t344\t9e-97\t 290\n+3_7\t1_304\t31.16\t276\t162\t9\t51\t314\t31\t290\t3e-30\t 115\n+3_8\t1_82\t27.98\t579\t365\t15\t1\t547\t18\t576\t2e-59\t 207\n+3_8\t1_19\t24.04\t495\t356\t9\t7\t493\t18\t500\t3e-45\t 165\n+3_8\t1_665\t30.95\t84\t52\t2\t582\t665\t20\t97\t6e-10\t53.5\n+3_8\t1_84\t27.52\t109\t77\t1\t565\t671\t1\t109\t2e-07\t46.2\n+3_9\t1_373\t29.17\t312\t215\t4\t3\t308\t17\t328\t2e-35\t 129\n+3_10\t1_349\t28.03\t157\t108\t2\t88\t241\t112\t266\t2e-13\t64.3\n+3_11\t1_11\t35.92\t554\t325\t15\t3\t534\t4\t549\t4e-101\t 315\n+3_13\t1_695\t55.21\t288\t127\t1\t2\t287\t3\t290\t8e-112\t 324\n+3_14\t1_519\t29.29\t297\t154\t15\t31\t281\t32\t318\t9e-17\t73.9\n+3_14\t1_221\t26.56\t241\t150\t12\t40\t260\t40\t273\t4e-12\t60.8\n+3_16\t1_270\t37.50\t64\t40\t0\t14\t77\t74\t137\t3e-07\t41.2\n+3_17\t1_270\t45.63\t206\t106\t1\t1\t200\t1\t206\t1e-47\t 164\n+3_17\t1_619\t35.61\t205\t113\t7\t20\t207\t28\t230\t7e-23\t98.2\n+3_17\t1_619\t25.22\t226\t111\t8\t18\t202\t315\t523\t2e-06\t45.8\n+3_17\t1_21\t32.42\t219\t131\t7\t1\t204\t265\t481\t1e-22\t97.1\n+3_17\t1_234\t34.65\t202\t113\t6\t17\t200\t24\t224\t2e-16\t74.7\n+3_17\t1_608\t30.14\t209\t124\t6\t17\t204\t42\t249\t7e-16\t74.3\n+3_17\t1_385\t24.45\t229\t153\t6\t14\t230\t371\t591\t9e-15\t72.8\n+3_17\t1_301\t30.73\t205\t126\t6\t9\t201\t24\t224\t1e-14\t71.2\n+3_17\t1_5\t30.73\t218\t122\t10\t16\t216\t407\t612\t2e-14\t71.6\n+3_17\t1_40\t29.47\t207\t111\t8\t17\t197\t94\t291\t4e-13\t66.2\n+3_17\t1_395\t29.33\t208\t130\t6\t1\t196\t6\t208\t4e-13\t65.9\n+3_17\t1_101\t29.17\t216\t136\t6\t1\t204\t3\t213\t5e-13\t64.3\n+3_17\t1_543\t26.39\t216\t124\t8\t16\t197\t78\t292\t8e-10\t56.2\n+3_17\t1_261\t36.46\t96\t58\t2\t111\t204\t182\t276\t1e-09\t55.8\n+3_17\t1_261\t32.98\t94\t62\t1\t1\t94\t5\t97\t8e-09\t53.1\n+3_17\t1_609\t27.07\t181\t122\t5\t16\t187\t23\t202\t2e-09\t54.7\n+3_17\t1_33\t27.18\t195\t130\t5\t4\t194\t34\t220\t2e-09\t55.8\n+3_17\t1_33\t34.18\t79\t50\t1\t128\t204\t364\t442\t1e-08\t53.1\n+3_17\t1_491\t33.67\t98\t59\t3\t2\t94\t7\t103\t8e-09\t53.5\n+3_17\t1_491\t32.22\t90\t59\t1\t118\t205\t275\t364\t2e-06\t46.2\n+3_17\t1_542\t32.56\t86\t54\t2\t114\t196\t281\t365\t1e-06\t46.6\n+3_17\t1_86\t32.22\t90\t56\t3\t120\t205\t830\t918\t4e-06\t45.1\n+3_17\t1_535\t27.16\t81\t57\t1\t126\t204\t679\t759\t1e-05\t43.5\n+3_17\t1_293\t27.96\t211\t122\t7\t4\t191\t6\t209\t3e-05\t41.6\n+3_17\t1_4\t27.68\t112\t72\t3\t17\t121\t187\t296\t8e-05\t40.0\n+3_17\t1_536\t29.11\t79\t54\t1\t120\t196\t219\t297\t1e-04\t40.0\n+3_17\t1_271\t29.25\t106\t70\t4\t639\t742\t399\t501\t1e-04\t40.0\n+3_17\t1_384\t28.57\t105\t69\t2\t86\t184\t34\t138\t1e-04\t38.9\n+3_17\t1_415\t24.75\t202\t132\t6\t2\t196\t471\t659\t6e-04\t37.7\n+3_18\t1_270\t48.10\t210\t103\t1\t1\t204\t1\t210\t3e-50\t 172\n+3_18\t1_21\t34.10\t217\t120\t7\t16\t217\t284\t492\t3e-22\t96.3\n+3_18\t1_619\t38.30\t188\t101\t6\t20\t194\t28\t213\t1e-21\t94.7\n+3_18\t1_619\t27.87\t244\t113\t10\t19\t219\t316\t539\t7e-07\t47.0\n+3_18\t1_301\t31.40\t207\t121\t6\t1\t189\t10\t213\t2e-16\t76.6\n+3_18\t1_234\t30.56\t216\t124\t6\t20\t210\t27\t241\t1e-15\t72.8\n+3_18\t1_261\t25.91\t274\t131\t5\t1\t204\t5\t276\t7e-15\t72.0\n+3_18\t1_608\t27.01\t211\t132\t6\t15\t204\t40\t249\t2e-14\t70.1\n+3_18\t1_5\t30.37\t214\t128\t9\t11\t211\t402\t607\t2e-13\t68.2\n+3_18\t1_385\t28.09\t178\t105\t6\t24\t184\t381\t552\t4e-11\t61.2\n+3_18\t1_40\t28.43\t204\t123\t7\t14\t197\t91\t291\t4e-11\t60.1\n+3_18\t1_395\t26.15\t218\t140\t6\t1\t204\t6\t216\t2e-10\t57.8\n+3_18\t1_101\t26.89\t212\t136\t7\t1\t198\t3\t209\t3e-10\t55.8\n+3_18\t1_491\t34.69\t98\t58\t3\t2\t94\t7\t103\t1e-08\t52.8\n+3_18\t1_491\t26.50\t117\t79\t3\t95\t205\t249\t364\t2e-05\t42.4\n+3_18\t1_609\t29.49\t156\t101\t4\t12\t159\t19\t173\t2e-07\t48.1\n+3_18\t1_33\t28.75\t80\t55\t1\t128\t205\t364\t443\t6e-07\t47.4\n+3_18\t1_33\t37.31\t67\t39\t1\t28\t91\t58\t124\t5e-06\t44.7\n+3_18\t1_543\t23.50\t217\t141\t5\t5\t196\t67\t283\t2e-06\t45.4\n+3_18\t1_271\t27.03\t111\t80\t1\t635\t744\t399\t509\t9e-06\t43.5\n+3_18\t1_86\t34.09\t88\t53\t3\t120\t203\t830\t916\t4e-05\t42.0\n+3_18\t1_86\t48.89\t45\t21\t1\t10\t52\t625\t669\t7e-04\t37.7\n+3_18\t1_415\t28.49\t186\t121\t5\t14\t196\t483\t659\t4e-05\t41.6\n+3_18\t1_542\t28.28\t99\t66\t3\t127\t222\t294\t390\t1e-04\t40.0\n+3_18\t1_536\t30.23\t86\t57\t2\t113\t196\t213\t297\t2e-04\t38.9\n+3_18\t1_384\t28.48\t151\t97\t5\t86\t226\t34\t183\t6e-04\t36.6\n+3_19\t1_270\t48.10\t210\t103\t1\t1\t204\t1\t210\t1e-50\t 173\n+3_19\t1_619\t36.59\t205\t113\t5\t20\t208\t'..b'4\t464\t1e-07\t48.9\n+3_625\t1_608\t26.47\t238\t144\t9\t321\t534\t12\t242\t2e-07\t47.8\n+3_625\t1_535\t32.20\t118\t62\t6\t318\t425\t4\t113\t9e-06\t43.1\n+3_625\t1_491\t36.07\t61\t39\t0\t334\t394\t7\t67\t2e-05\t42.4\n+3_625\t1_33\t38.10\t63\t38\t1\t330\t392\t28\t89\t1e-04\t39.3\n+3_625\t1_542\t28.07\t114\t63\t5\t304\t400\t8\t119\t1e-04\t38.9\n+3_625\t1_395\t25.36\t209\t132\t8\t338\t533\t11\t208\t2e-04\t38.5\n+3_625\t1_234\t27.14\t199\t128\t7\t351\t534\t25\t221\t8e-04\t36.2\n+3_625\t1_301\t23.28\t232\t119\t9\t325\t522\t4\t210\t0.001\t36.2\n+3_626\t1_270\t30.54\t203\t120\t7\t335\t525\t1\t194\t5e-18\t79.0\n+3_626\t1_385\t25.46\t436\t271\t15\t119\t525\t145\t555\t3e-16\t76.6\n+3_626\t1_395\t29.33\t208\t124\t5\t343\t538\t16\t212\t5e-15\t71.2\n+3_626\t1_619\t31.18\t186\t108\t6\t352\t523\t26\t205\t1e-12\t64.7\n+3_626\t1_101\t31.43\t210\t113\t10\t335\t527\t3\t198\t3e-12\t61.6\n+3_626\t1_415\t30.30\t198\t124\t5\t336\t530\t471\t657\t7e-10\t56.2\n+3_626\t1_5\t24.26\t202\t137\t6\t336\t525\t392\t589\t4e-09\t53.9\n+3_626\t1_609\t27.03\t222\t142\t7\t329\t538\t1\t214\t5e-09\t52.4\n+3_626\t1_301\t26.11\t226\t147\t6\t326\t535\t1\t222\t8e-09\t52.4\n+3_626\t1_33\t36.00\t75\t44\t2\t466\t537\t364\t437\t3e-07\t47.8\n+3_626\t1_21\t24.34\t189\t118\t7\t350\t522\t284\t463\t1e-06\t45.8\n+3_626\t1_40\t27.86\t201\t121\t8\t340\t521\t83\t278\t6e-06\t43.1\n+3_626\t1_491\t39.13\t69\t40\t2\t336\t403\t7\t74\t5e-05\t40.8\n+3_626\t1_491\t28.48\t158\t97\t7\t388\t537\t209\t358\t2e-04\t38.5\n+3_626\t1_234\t28.26\t184\t96\t9\t336\t497\t12\t181\t7e-05\t39.3\n+3_626\t1_542\t38.98\t59\t33\t1\t466\t521\t295\t353\t2e-04\t38.9\n+3_626\t1_608\t25.58\t215\t122\t8\t351\t538\t42\t245\t2e-04\t38.5\n+3_626\t1_261\t31.67\t60\t38\t1\t465\t521\t197\t256\t4e-04\t37.7\n+3_627\t1_16\t35.19\t591\t310\t22\t66\t601\t177\t749\t6e-81\t 268\n+3_627\t1_568\t29.41\t510\t281\t20\t118\t580\t214\t691\t3e-28\t 115\n+3_627\t1_312\t29.86\t144\t81\t5\t110\t235\t44\t185\t6e-06\t43.9\n+3_627\t1_742\t35.62\t73\t42\t3\t124\t194\t202\t271\t4e-04\t38.1\n+3_630\t1_422\t22.89\t249\t170\t6\t4\t234\t173\t417\t3e-10\t54.7\n+3_631\t1_421\t35.11\t188\t113\t3\t5\t191\t107\t286\t6e-28\t 103\n+3_634\t1_487\t37.35\t324\t182\t7\t3\t316\t6\t318\t3e-59\t 191\n+3_635\t1_680\t31.06\t132\t64\t2\t5\t109\t8\t139\t1e-16\t70.9\n+3_638\t1_712\t29.54\t237\t151\t8\t7\t229\t26\t260\t4e-23\t90.5\n+3_638\t1_520\t30.26\t152\t104\t2\t83\t233\t126\t276\t1e-15\t68.9\n+3_639\t1_713\t39.23\t418\t228\t7\t6\t399\t14\t429\t2e-90\t 279\n+3_639\t1_159\t29.09\t110\t69\t3\t3\t104\t1\t109\t6e-08\t49.3\n+3_640\t1_292\t24.77\t214\t133\t7\t19\t217\t33\t233\t1e-10\t55.1\n+3_641\t1_511\t35.38\t325\t198\t6\t5\t318\t25\t348\t3e-42\t 151\n+3_642\t1_643\t36.45\t299\t139\t9\t183\t442\t248\t534\t2e-42\t 154\n+3_643\t1_644\t36.24\t149\t85\t5\t1\t143\t1\t145\t5e-18\t72.4\n+3_644\t1_36\t25.14\t350\t201\t15\t326\t656\t10\t317\t6e-09\t53.1\n+3_645\t1_456\t43.97\t812\t424\t14\t1\t788\t1\t805\t0.0\t 686\n+3_645\t1_333\t21.58\t695\t353\t25\t7\t601\t29\t631\t6e-18\t83.6\n+3_645\t1_598\t22.87\t328\t178\t14\t400\t701\t408\t686\t9e-13\t66.6\n+3_645\t1_598\t22.11\t398\t222\t17\t3\t387\t14\t336\t6e-11\t60.8\n+3_645\t1_159\t28.57\t126\t85\t3\t18\t141\t2\t124\t1e-05\t43.5\n+3_645\t1_159\t41.86\t43\t25\t0\t549\t591\t318\t360\t2e-05\t42.4\n+3_646\t1_37\t47.56\t656\t335\t5\t8\t658\t4\t655\t0.0\t 609\n+3_647\t1_139\t36.94\t111\t61\t2\t137\t247\t20\t121\t5e-14\t64.3\n+3_648\t1_309\t54.33\t127\t58\t0\t6\t132\t4\t130\t8e-42\t 134\n+3_649\t1_308\t43.41\t129\t73\t0\t14\t142\t16\t144\t3e-35\t 118\n+3_650\t1_9\t31.53\t222\t128\t7\t6\t215\t16\t225\t1e-23\t92.8\n+3_651\t1_754\t30.11\t269\t172\t5\t150\t409\t2\t263\t3e-28\t 107\n+3_652\t1_605\t42.47\t332\t180\t5\t6\t329\t4\t332\t3e-76\t 236\n+3_652\t1_24\t38.89\t54\t28\t1\t202\t250\t74\t127\t4e-04\t35.8\n+3_653\t1_677\t24.14\t145\t102\t3\t16\t154\t22\t164\t2e-06\t42.4\n+3_655\t1_172\t32.30\t997\t631\t13\t3\t976\t4\t979\t1e-150\t 471\n+3_655\t1_395\t34.44\t90\t53\t3\t879\t968\t140\t223\t0.001\t37.0\n+3_656\t1_468\t45.83\t48\t26\t0\t3\t50\t4\t51\t2e-10\t47.4\n+3_656\t1_682\t32.61\t46\t30\t1\t3\t48\t2\t46\t9e-04\t28.5\n+3_657\t1_467\t35.48\t341\t217\t3\t6\t345\t13\t351\t1e-66\t 212\n+3_657\t1_71\t27.74\t137\t85\t4\t185\t312\t72\t203\t2e-07\t46.2\n+3_664\t1_194\t41.18\t153\t88\t2\t8\t158\t6\t158\t2e-32\t 111\n+3_666\t1_589\t33.71\t89\t53\t2\t9\t96\t79\t162\t8e-07\t44.7\n+3_666\t1_594\t32.58\t89\t54\t2\t9\t96\t41\t124\t2e-06\t43.9\n+3_668\t1_598\t38.92\t848\t479\t12\t1\t816\t9\t849\t0.0\t 556\n+3_668\t1_333\t25.33\t679\t407\t19\t40\t633\t58\t721\t2e-41\t 158\n+3_668\t1_456\t21.89\t845\t501\t36\t5\t746\t2\t790\t5e-19\t87.0\n+3_668\t1_159\t27.10\t214\t121\t9\t347\t549\t181\t370\t2e-07\t49.3\n+3_668\t1_159\t31.48\t54\t37\t0\t36\t89\t19\t72\t9e-05\t40.4\n+3_671\t1_8\t29.15\t247\t156\t7\t351\t583\t113\t354\t3e-16\t75.9\n+3_672\t1_7\t37.88\t66\t38\t2\t1\t63\t1\t66\t7e-04\t32.0\n+3_673\t1_6\t76.60\t47\t11\t0\t1\t47\t1\t47\t4e-20\t72.4\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast3_2.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast3_2.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1109 @@\n+3_0\t2_474\t27.91\t326\t215\t8\t116\t433\t105\t418\t6e-32\t 121\n+3_2\t2_387\t45.41\t610\t306\t4\t10\t601\t1\t601\t5e-170\t 497\n+3_4\t2_191\t36.16\t318\t200\t2\t1\t317\t1\t316\t6e-70\t 219\n+3_4\t2_379\t30.79\t315\t197\t6\t4\t310\t10\t311\t1e-38\t 136\n+3_5\t2_191\t47.59\t311\t163\t0\t1\t311\t1\t311\t1e-101\t 300\n+3_5\t2_379\t31.29\t310\t200\t7\t6\t309\t9\t311\t4e-36\t 129\n+3_7\t2_301\t43.92\t296\t165\t1\t25\t320\t38\t332\t9e-83\t 253\n+3_7\t2_45\t31.37\t204\t125\t5\t115\t314\t91\t283\t5e-25\t99.0\n+3_8\t2_429\t29.46\t577\t362\t15\t1\t555\t1\t554\t4e-67\t 227\n+3_8\t2_138\t25.10\t494\t350\t11\t7\t493\t19\t499\t5e-38\t 143\n+3_8\t2_124\t25.00\t84\t57\t2\t582\t665\t21\t98\t4e-05\t38.1\n+3_9\t2_204\t29.48\t268\t186\t3\t1\t265\t1\t268\t4e-34\t 124\n+3_10\t2_200\t25.35\t213\t129\t7\t60\t244\t4\t214\t4e-10\t52.8\n+3_11\t2_386\t32.62\t564\t316\t21\t1\t534\t8\t537\t6e-67\t 223\n+3_13\t2_20\t52.96\t287\t133\t1\t3\t287\t2\t288\t4e-99\t 291\n+3_14\t2_378\t27.65\t293\t175\t12\t3\t262\t6\t294\t1e-12\t61.6\n+3_14\t2_208\t26.64\t229\t147\t8\t30\t243\t27\t249\t5e-11\t56.6\n+3_17\t2_471\t37.13\t202\t110\t6\t16\t204\t104\t301\t8e-25\t 100\n+3_17\t2_64\t33.63\t223\t123\t8\t1\t204\t232\t448\t1e-23\t99.4\n+3_17\t2_119\t32.31\t195\t105\t6\t20\t194\t26\t213\t1e-19\t87.4\n+3_17\t2_473\t30.26\t228\t144\t5\t4\t220\t59\t282\t2e-18\t80.9\n+3_17\t2_14\t30.21\t192\t116\t4\t13\t190\t364\t551\t6e-16\t75.5\n+3_17\t2_181\t28.65\t192\t117\t8\t27\t201\t47\t235\t1e-15\t72.4\n+3_17\t2_419\t29.33\t208\t118\t6\t13\t197\t95\t296\t7e-15\t70.9\n+3_17\t2_307\t27.14\t210\t130\t3\t13\t204\t86\t290\t5e-13\t65.5\n+3_17\t2_180\t25.82\t182\t123\t6\t16\t187\t23\t202\t3e-11\t58.9\n+3_17\t2_293\t23.30\t206\t132\t6\t16\t200\t21\t221\t1e-09\t53.9\n+3_17\t2_13\t26.21\t248\t148\t8\t17\t240\t383\t619\t2e-09\t54.7\n+3_17\t2_308\t30.04\t223\t124\t11\t1\t204\t1\t210\t4e-09\t52.8\n+3_17\t2_39\t37.37\t99\t56\t3\t1\t94\t6\t103\t6e-09\t53.1\n+3_17\t2_39\t37.33\t75\t43\t2\t126\t197\t346\t419\t2e-07\t48.1\n+3_17\t2_188\t31.91\t94\t61\t1\t2\t92\t8\t101\t7e-09\t53.1\n+3_17\t2_188\t32.91\t79\t51\t1\t121\t197\t361\t439\t2e-08\t51.2\n+3_17\t2_78\t33.73\t83\t53\t1\t114\t194\t195\t277\t3e-07\t47.8\n+3_17\t2_79\t32.10\t81\t53\t1\t126\t204\t683\t763\t1e-06\t45.8\n+3_17\t2_427\t31.71\t82\t51\t3\t128\t205\t838\t918\t6e-04\t37.4\n+3_18\t2_471\t35.15\t202\t114\t6\t16\t204\t104\t301\t1e-21\t91.3\n+3_18\t2_119\t33.33\t201\t107\t6\t20\t200\t26\t219\t2e-19\t86.7\n+3_18\t2_119\t27.27\t198\t122\t7\t20\t196\t340\t536\t4e-05\t40.8\n+3_18\t2_64\t31.22\t205\t120\t7\t16\t205\t251\t449\t2e-19\t86.3\n+3_18\t2_14\t29.66\t236\t138\t8\t13\t231\t364\t588\t2e-15\t73.9\n+3_18\t2_473\t31.61\t193\t115\t6\t13\t191\t68\t257\t2e-14\t68.9\n+3_18\t2_181\t28.80\t191\t114\t9\t27\t199\t47\t233\t2e-13\t65.9\n+3_18\t2_307\t27.70\t213\t131\t4\t10\t204\t83\t290\t2e-12\t63.9\n+3_18\t2_293\t27.14\t210\t133\t7\t16\t207\t21\t228\t1e-11\t59.7\n+3_18\t2_419\t26.29\t213\t132\t6\t13\t204\t95\t303\t1e-11\t60.8\n+3_18\t2_180\t26.56\t192\t128\t6\t16\t197\t23\t211\t8e-11\t57.8\n+3_18\t2_13\t28.00\t200\t121\t5\t26\t204\t392\t589\t8e-09\t52.8\n+3_18\t2_39\t30.88\t136\t86\t4\t1\t129\t6\t140\t2e-08\t51.6\n+3_18\t2_39\t30.14\t73\t49\t1\t127\t197\t347\t419\t4e-04\t37.7\n+3_18\t2_188\t32.89\t76\t48\t1\t20\t92\t26\t101\t1e-06\t45.8\n+3_18\t2_188\t46.15\t39\t21\t0\t121\t159\t361\t399\t4e-06\t44.3\n+3_18\t2_78\t32.53\t83\t54\t1\t114\t194\t195\t277\t8e-06\t42.7\n+3_18\t2_308\t28.49\t186\t111\t10\t32\t204\t34\t210\t3e-05\t40.4\n+3_18\t2_79\t31.51\t73\t48\t1\t127\t197\t684\t756\t9e-05\t39.7\n+3_18\t2_427\t62.07\t29\t11\t0\t17\t45\t632\t660\t1e-04\t39.3\n+3_18\t2_427\t36.84\t76\t43\t3\t128\t199\t838\t912\t7e-04\t37.0\n+3_19\t2_471\t36.14\t202\t114\t5\t15\t204\t103\t301\t6e-24\t98.6\n+3_19\t2_119\t32.03\t231\t127\t8\t4\t212\t8\t230\t6e-22\t94.7\n+3_19\t2_119\t27.88\t208\t128\t7\t18\t204\t338\t544\t4e-07\t47.4\n+3_19\t2_64\t31.07\t206\t123\t6\t13\t204\t248\t448\t5e-20\t88.2\n+3_19\t2_473\t31.48\t216\t127\t7\t16\t217\t71\t279\t7e-16\t73.2\n+3_19\t2_181\t26.79\t224\t137\t10\t1\t201\t16\t235\t1e-15\t72.4\n+3_19\t2_14\t30.93\t194\t110\t6\t14\t190\t365\t551\t3e-15\t73.2\n+3_19\t2_419\t27.39\t230\t126\t7\t5\t197\t71\t296\t2e-14\t69.7\n+3_19\t2_307\t29.06\t203\t121\t4\t24\t208\t97\t294\t4e-14\t68.9\n+3_19\t2_180\t28.98\t176\t112\t6\t32\t197\t39\t211\t1e-12\t63.2\n+3_19\t2_293\t25.91\t220\t143\t7\t11\t212\t16\t233\t4e-12\t61.2\n+3_19\t2_13\t27.62\t210\t127\t5\t32\t220\t398\t603\t1e-09\t55.1\n+3_19\t2_39\t33.94\t109\t66\t3\t1\t104\t6\t113\t6e-08\t50.1\n+3_19\t2_39\t34.25\t73\t46\t1\t127\t197\t347\t419\t6e-06\t43.5\n+3_19\t2_188\t32.91\t79\t51\t1\t121\t197\t361\t439\t3e-07\t48.1\n+3_19\t2_188\t26.55\t177\t106\t7\t18\t184\t24\t186\t3e-07\t47.8\n+3_19\t2_78\t25.21\t234\t116\t9\t20\t194\t44\t277\t3e-07\t47.8\n+3_19\t2_308\t26.15\t218\t139\t10\t1\t204\t1\t210\t8e-07\t45.4\n+3_19\t2_79\t31.25\t80\t53\t1\t127\t204\t684\t763\t8e-06\t43.5\n+3_19\t2_427\t3'..b'2_399\t26.46\t257\t158\t8\t280\t522\t403\t642\t2e-06\t44.3\n+3_623\t2_79\t34.38\t64\t39\t1\t462\t522\t683\t746\t4e-04\t37.4\n+3_623\t2_293\t23.74\t198\t117\t9\t349\t522\t21\t208\t6e-04\t35.8\n+3_625\t2_13\t28.28\t198\t122\t5\t314\t492\t345\t541\t3e-14\t69.7\n+3_625\t2_14\t24.54\t216\t148\t6\t318\t522\t336\t547\t5e-14\t68.9\n+3_625\t2_180\t27.64\t199\t120\t10\t338\t522\t13\t201\t2e-10\t55.8\n+3_625\t2_181\t27.23\t202\t120\t7\t340\t522\t27\t220\t6e-10\t54.7\n+3_625\t2_308\t28.99\t207\t110\t8\t334\t520\t2\t191\t4e-09\t52.0\n+3_625\t2_119\t28.11\t185\t110\t10\t363\t531\t36\t213\t7e-09\t52.4\n+3_625\t2_419\t27.40\t219\t132\t9\t336\t534\t85\t296\t4e-08\t49.3\n+3_625\t2_64\t26.59\t173\t102\t7\t365\t521\t267\t430\t4e-06\t43.1\n+3_625\t2_188\t29.65\t172\t90\t10\t333\t485\t7\t166\t9e-06\t42.4\n+3_625\t2_399\t26.46\t189\t125\t7\t318\t505\t447\t622\t1e-04\t38.5\n+3_625\t2_473\t26.06\t188\t118\t7\t346\t520\t68\t247\t2e-04\t37.4\n+3_625\t2_39\t33.33\t66\t34\t2\t334\t394\t7\t67\t8e-04\t36.2\n+3_626\t2_14\t28.10\t210\t136\t7\t324\t523\t343\t547\t2e-14\t70.1\n+3_626\t2_180\t28.23\t209\t133\t8\t340\t538\t13\t214\t5e-12\t60.8\n+3_626\t2_119\t31.43\t175\t94\t8\t368\t524\t40\t206\t2e-10\t57.0\n+3_626\t2_13\t27.47\t182\t114\t5\t351\t515\t383\t563\t2e-09\t53.9\n+3_626\t2_64\t26.19\t168\t105\t7\t368\t522\t269\t430\t4e-09\t53.1\n+3_626\t2_293\t29.69\t128\t76\t5\t406\t524\t86\t208\t1e-08\t50.1\n+3_626\t2_308\t27.70\t213\t124\t7\t335\t530\t1\t200\t1e-07\t47.8\n+3_626\t2_471\t25.95\t185\t118\t7\t350\t521\t104\t282\t5e-07\t45.8\n+3_626\t2_79\t38.98\t59\t33\t1\t466\t521\t685\t743\t2e-06\t44.7\n+3_626\t2_188\t35.62\t73\t46\t1\t334\t406\t6\t77\t2e-06\t44.3\n+3_626\t2_188\t29.55\t88\t58\t2\t453\t537\t355\t441\t4e-06\t43.5\n+3_626\t2_39\t34.07\t91\t56\t2\t451\t538\t333\t422\t2e-06\t44.3\n+3_626\t2_39\t37.68\t69\t41\t2\t334\t401\t5\t72\t2e-04\t38.1\n+3_626\t2_399\t36.25\t80\t48\t2\t336\t415\t464\t540\t3e-06\t43.9\n+3_626\t2_419\t24.44\t225\t148\t10\t316\t521\t62\t283\t1e-05\t41.6\n+3_626\t2_307\t27.03\t185\t114\t7\t368\t537\t107\t285\t3e-04\t37.4\n+3_626\t2_473\t23.66\t186\t129\t6\t345\t521\t66\t247\t4e-04\t36.6\n+3_627\t2_67\t24.69\t401\t173\t19\t165\t524\t72\t384\t6e-06\t43.1\n+3_630\t2_215\t25.37\t272\t166\t10\t3\t249\t146\t405\t1e-07\t46.2\n+3_631\t2_216\t35.50\t169\t103\t3\t6\t171\t25\t190\t3e-26\t96.7\n+3_634\t2_43\t37.46\t323\t178\t8\t1\t316\t5\t310\t2e-61\t 196\n+3_635\t2_51\t40.98\t61\t33\t1\t58\t115\t86\t146\t1e-09\t50.8\n+3_638\t2_254\t34.38\t192\t119\t4\t41\t225\t50\t241\t3e-23\t90.1\n+3_639\t2_255\t38.41\t414\t231\t9\t8\t401\t15\t424\t2e-81\t 254\n+3_641\t2_146\t29.31\t331\t217\t6\t1\t318\t8\t334\t8e-29\t 111\n+3_642\t2_93\t39.31\t290\t161\t6\t160\t442\t174\t455\t7e-51\t 176\n+3_643\t2_92\t37.62\t101\t54\t4\t1\t96\t1\t97\t1e-10\t50.8\n+3_644\t2_379\t28.71\t209\t111\t11\t327\t531\t14\t188\t1e-11\t60.8\n+3_644\t2_191\t23.75\t320\t209\t10\t326\t640\t10\t299\t4e-06\t43.1\n+3_645\t2_270\t46.16\t795\t417\t8\t1\t788\t1\t791\t0.0\t 716\n+3_645\t2_338\t21.74\t506\t255\t15\t306\t723\t248\t700\t1e-22\t97.8\n+3_645\t2_338\t25.33\t150\t95\t4\t36\t168\t42\t191\t7e-06\t43.5\n+3_645\t2_351\t25.84\t387\t204\t18\t385\t725\t434\t783\t4e-16\t76.6\n+3_645\t2_351\t30.63\t111\t69\t5\t8\t115\t24\t129\t3e-08\t51.2\n+3_645\t2_18\t29.01\t131\t90\t2\t29\t159\t2\t129\t2e-07\t48.1\n+3_645\t2_18\t43.48\t46\t25\t1\t546\t591\t285\t329\t2e-05\t42.0\n+3_646\t2_72\t43.40\t652\t357\t5\t10\t661\t11\t650\t0.0\t 559\n+3_647\t2_262\t36.36\t154\t79\t7\t141\t286\t294\t436\t4e-15\t69.3\n+3_648\t2_424\t52.34\t128\t59\t1\t7\t132\t5\t132\t3e-35\t 116\n+3_649\t2_425\t34.03\t144\t93\t1\t1\t142\t1\t144\t4e-31\t 106\n+3_650\t2_467\t31.05\t248\t151\t5\t6\t243\t6\t243\t8e-25\t95.5\n+3_651\t2_8\t31.39\t274\t154\t12\t152\t406\t2\t260\t5e-23\t92.4\n+3_652\t2_57\t42.77\t325\t174\t7\t1\t318\t3\t322\t9e-81\t 247\n+3_653\t2_388\t30.22\t139\t86\t6\t17\t151\t5\t136\t6e-11\t53.9\n+3_655\t2_302\t31.28\t1007\t613\t21\t10\t976\t11\t978\t5e-138\t 437\n+3_656\t2_330\t46.51\t43\t23\t0\t8\t50\t9\t51\t2e-08\t41.2\n+3_656\t2_53\t30.43\t46\t31\t1\t3\t48\t2\t46\t3e-04\t29.3\n+3_657\t2_329\t39.17\t337\t197\t4\t13\t344\t19\t352\t4e-69\t 218\n+3_657\t2_173\t27.61\t134\t89\t5\t185\t312\t72\t203\t2e-08\t48.9\n+3_664\t2_286\t42.68\t157\t86\t2\t7\t159\t4\t160\t1e-35\t 119\n+3_666\t2_97\t37.14\t70\t44\t0\t26\t95\t81\t150\t2e-08\t49.3\n+3_666\t2_317\t39.29\t56\t34\t0\t40\t95\t42\t97\t1e-05\t40.4\n+3_668\t2_338\t39.71\t836\t459\t17\t5\t817\t11\t824\t0.0\t 555\n+3_668\t2_351\t26.25\t701\t372\t22\t40\t633\t56\t718\t9e-40\t 152\n+3_668\t2_270\t21.77\t519\t269\t20\t242\t704\t310\t747\t4e-15\t73.6\n+3_668\t2_270\t25.81\t186\t118\t4\t5\t187\t2\t170\t2e-07\t48.9\n+3_668\t2_18\t22.22\t261\t145\t8\t320\t560\t128\t350\t1e-07\t48.9\n+3_671\t2_468\t26.94\t245\t165\t7\t351\t583\t115\t357\t1e-16\t76.6\n+3_672\t2_469\t25.23\t111\t77\t3\t1\t108\t10\t117\t1e-04\t33.5\n+3_673\t2_470\t65.96\t47\t16\t0\t1\t47\t1\t47\t4e-16\t61.2\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/blastout/Blast3_3.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/blastout/Blast3_3.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,2473 @@\n+3_0\t3_0\t100.00\t463\t0\t0\t1\t463\t1\t463\t0.0\t 925\n+3_1\t3_1\t100.00\t378\t0\t0\t1\t378\t1\t378\t0.0\t 754\n+3_2\t3_2\t100.00\t619\t0\t0\t1\t619\t1\t619\t0.0\t1245\n+3_3\t3_3\t100.00\t152\t0\t0\t1\t152\t1\t152\t4e-109\t 306\n+3_4\t3_4\t100.00\t327\t0\t0\t1\t327\t1\t327\t0.0\t 664\n+3_4\t3_5\t42.52\t294\t160\t5\t15\t304\t15\t303\t4e-68\t 214\n+3_4\t3_644\t24.93\t353\t216\t15\t9\t326\t325\t663\t8e-11\t57.8\n+3_5\t3_5\t100.00\t323\t0\t0\t1\t323\t1\t323\t0.0\t 661\n+3_5\t3_4\t42.72\t302\t164\t5\t7\t303\t7\t304\t1e-70\t 221\n+3_5\t3_644\t26.72\t363\t205\t16\t2\t317\t314\t662\t5e-14\t67.4\n+3_6\t3_6\t100.00\t189\t0\t0\t1\t189\t1\t189\t7e-139\t 385\n+3_7\t3_7\t100.00\t333\t0\t0\t1\t333\t1\t333\t0.0\t 667\n+3_7\t3_53\t31.34\t284\t164\t9\t45\t314\t17\t283\t2e-27\t 106\n+3_8\t3_8\t100.00\t673\t0\t0\t1\t673\t1\t673\t0.0\t1355\n+3_8\t3_91\t23.31\t519\t368\t12\t6\t512\t10\t510\t3e-31\t 125\n+3_9\t3_9\t100.00\t335\t0\t0\t1\t335\t1\t335\t0.0\t 664\n+3_10\t3_10\t100.00\t248\t0\t0\t1\t248\t1\t248\t2e-175\t 482\n+3_11\t3_11\t100.00\t534\t0\t0\t1\t534\t1\t534\t0.0\t1054\n+3_12\t3_12\t100.00\t81\t0\t0\t1\t81\t1\t81\t1e-55\t 165\n+3_13\t3_13\t100.00\t287\t0\t0\t1\t287\t1\t287\t0.0\t 578\n+3_13\t3_571\t36.25\t240\t140\t7\t1\t234\t1\t233\t8e-30\t 110\n+3_14\t3_14\t100.00\t281\t0\t0\t1\t281\t1\t281\t0.0\t 558\n+3_14\t3_451\t30.38\t260\t145\t10\t32\t265\t34\t283\t5e-22\t88.6\n+3_15\t3_15\t100.00\t120\t0\t0\t1\t120\t1\t120\t1e-74\t 216\n+3_16\t3_16\t100.00\t77\t0\t0\t1\t77\t1\t77\t2e-48\t 146\n+3_16\t3_18\t90.91\t66\t6\t0\t12\t77\t66\t131\t1e-33\t 117\n+3_16\t3_19\t90.91\t66\t6\t0\t12\t77\t66\t131\t1e-33\t 117\n+3_16\t3_17\t78.79\t66\t14\t0\t12\t77\t66\t131\t7e-27\t99.0\n+3_16\t3_298\t51.47\t68\t33\t0\t10\t77\t22\t89\t1e-16\t70.1\n+3_16\t3_297\t48.53\t68\t35\t0\t10\t77\t65\t132\t1e-15\t66.6\n+3_16\t3_306\t44.00\t75\t40\t1\t3\t77\t60\t132\t3e-14\t62.8\n+3_16\t3_307\t41.56\t77\t43\t1\t1\t77\t58\t132\t1e-13\t60.8\n+3_16\t3_379\t45.31\t64\t35\t0\t14\t77\t69\t132\t7e-13\t58.9\n+3_16\t3_333\t48.44\t64\t33\t0\t14\t77\t68\t131\t8e-12\t55.8\n+3_17\t3_17\t100.00\t755\t0\t0\t1\t755\t1\t755\t0.0\t1469\n+3_17\t3_18\t57.55\t742\t306\t7\t1\t740\t1\t735\t0.0\t 759\n+3_17\t3_19\t49.31\t793\t345\t13\t1\t755\t1\t774\t0.0\t 646\n+3_17\t3_306\t41.77\t802\t390\t21\t1\t755\t1\t772\t3e-163\t 490\n+3_17\t3_333\t38.32\t796\t446\t10\t1\t755\t1\t792\t5e-155\t 470\n+3_17\t3_298\t40.27\t745\t386\t13\t43\t755\t1\t718\t5e-151\t 457\n+3_17\t3_307\t48.87\t485\t232\t7\t1\t476\t1\t478\t7e-137\t 418\n+3_17\t3_307\t45.86\t181\t98\t0\t575\t755\t466\t646\t2e-37\t 144\n+3_17\t3_297\t50.11\t441\t212\t4\t1\t435\t1\t439\t3e-128\t 395\n+3_17\t3_297\t40.00\t185\t108\t2\t572\t755\t464\t646\t1e-30\t 123\n+3_17\t3_379\t34.30\t790\t460\t17\t1\t755\t1\t766\t5e-104\t 335\n+3_17\t3_281\t34.01\t691\t381\t17\t109\t755\t3\t662\t1e-88\t 291\n+3_17\t3_16\t78.79\t66\t14\t0\t66\t131\t12\t77\t8e-26\t99.0\n+3_17\t3_445\t34.20\t193\t112\t7\t20\t200\t83\t272\t1e-22\t94.4\n+3_17\t3_257\t29.03\t217\t122\t7\t17\t204\t23\t236\t1e-16\t76.6\n+3_17\t3_508\t26.76\t213\t143\t6\t1\t200\t6\t218\t4e-16\t76.6\n+3_17\t3_508\t26.52\t230\t141\t8\t11\t217\t277\t501\t3e-09\t54.7\n+3_17\t3_626\t27.40\t208\t137\t7\t1\t199\t335\t537\t7e-14\t69.7\n+3_17\t3_625\t30.23\t215\t121\t9\t2\t199\t334\t536\t2e-13\t68.2\n+3_17\t3_622\t30.57\t193\t120\t5\t16\t199\t349\t536\t5e-13\t66.6\n+3_17\t3_206\t25.50\t251\t133\t8\t1\t212\t1\t236\t9e-12\t62.8\n+3_17\t3_206\t28.44\t109\t73\t2\t98\t203\t415\t521\t2e-05\t42.0\n+3_17\t3_605\t33.17\t199\t116\t6\t2\t186\t8\t203\t2e-11\t61.6\n+3_17\t3_365\t39.78\t93\t53\t1\t2\t91\t39\t131\t4e-11\t60.8\n+3_17\t3_365\t37.04\t81\t49\t1\t121\t199\t501\t581\t4e-10\t57.8\n+3_17\t3_226\t26.60\t188\t115\t6\t20\t187\t1\t185\t5e-11\t60.1\n+3_17\t3_226\t26.04\t96\t70\t1\t114\t208\t369\t464\t2e-06\t45.4\n+3_17\t3_541\t36.73\t98\t57\t2\t1\t94\t10\t106\t9e-11\t59.3\n+3_17\t3_541\t36.71\t79\t44\t3\t126\t200\t230\t306\t2e-05\t42.4\n+3_17\t3_256\t28.72\t195\t127\t6\t13\t197\t16\t208\t3e-10\t56.6\n+3_17\t3_623\t29.58\t213\t123\t9\t2\t199\t335\t535\t7e-10\t56.6\n+3_17\t3_462\t29.47\t190\t124\t5\t22\t204\t4\t190\t1e-08\t51.2\n+3_17\t3_357\t27.03\t222\t136\t8\t1\t199\t9\t227\t1e-08\t51.2\n+3_17\t3_211\t32.98\t94\t59\t2\t114\t204\t267\t359\t7e-08\t50.1\n+3_17\t3_494\t32.43\t74\t48\t1\t126\t197\t615\t688\t2e-07\t48.9\n+3_17\t3_375\t31.40\t86\t57\t1\t121\t204\t111\t196\t6e-07\t46.6\n+3_17\t3_210\t21.92\t219\t132\t8\t15\t197\t142\t357\t6e-06\t43.9\n+3_17\t3_90\t33.33\t90\t55\t3\t120\t205\t826\t914\t2e-05\t42.7\n+3_17\t3_90\t34.15\t82\t50\t3\t121\t199\t486\t566\t3e-04\t38.9\n+3_17\t3_495\t25.23\t214\t117\t8\t16\t196\t29\t232\t5e-05\t40.8\n+3_17\t3_156\t37.93\t58\t32\t1\t119\t176\t594\t647\t1e-04\t39.7\n+3_18\t3_18\t100.00\t746\t0\t0\t1\t746\t1\t746\t0.0\t1466\n+3_18\t3_17\t57.68\t742\t305\t7\t1\t735\t1\t740\t0.0\t 775\n+3_18\t3_19\t48.02\t781\t360\t12\t1\t746\t1\t770\t0.0\t 610\n+3_18\t3_333\t37.94\t796\t436\t15\t1\t746\t1\t788\t5e-144\t 441\n+3'..b'9\t1\t249\t0.0\t 497\n+3_631\t3_631\t100.00\t195\t0\t0\t1\t195\t1\t195\t3e-142\t 394\n+3_632\t3_632\t100.00\t758\t0\t0\t1\t758\t1\t758\t0.0\t1486\n+3_633\t3_633\t100.00\t144\t0\t0\t1\t144\t1\t144\t5e-101\t 285\n+3_634\t3_634\t100.00\t322\t0\t0\t1\t322\t1\t322\t0.0\t 649\n+3_635\t3_635\t100.00\t190\t0\t0\t1\t190\t1\t190\t1e-141\t 392\n+3_636\t3_636\t100.00\t74\t0\t0\t1\t74\t1\t74\t7e-49\t 147\n+3_637\t3_637\t100.00\t184\t0\t0\t1\t184\t1\t184\t6e-135\t 374\n+3_638\t3_638\t100.00\t233\t0\t0\t1\t233\t1\t233\t2e-169\t 466\n+3_638\t3_140\t26.78\t239\t129\t11\t7\t225\t36\t248\t2e-06\t42.7\n+3_639\t3_639\t100.00\t406\t0\t0\t1\t406\t1\t406\t0.0\t 812\n+3_640\t3_640\t100.00\t227\t0\t0\t1\t227\t1\t227\t4e-163\t 449\n+3_641\t3_641\t100.00\t410\t0\t0\t1\t410\t1\t410\t0.0\t 811\n+3_642\t3_642\t100.00\t463\t0\t0\t1\t463\t1\t463\t0.0\t 934\n+3_643\t3_643\t100.00\t145\t0\t0\t1\t145\t1\t145\t5e-99\t 280\n+3_644\t3_644\t100.00\t665\t0\t0\t1\t665\t1\t665\t0.0\t1342\n+3_644\t3_5\t26.74\t344\t195\t15\t333\t662\t17\t317\t1e-12\t64.7\n+3_644\t3_4\t24.93\t353\t216\t15\t325\t663\t9\t326\t2e-10\t57.8\n+3_645\t3_645\t100.00\t790\t0\t0\t1\t790\t1\t790\t0.0\t1612\n+3_645\t3_668\t22.37\t854\t418\t29\t3\t759\t6\t711\t2e-25\t 107\n+3_645\t3_27\t23.36\t351\t176\t16\t400\t701\t447\t753\t7e-12\t63.5\n+3_645\t3_27\t26.44\t174\t115\t5\t8\t169\t27\t199\t5e-10\t57.4\n+3_645\t3_404\t36.26\t91\t55\t2\t29\t118\t3\t91\t2e-08\t52.0\n+3_645\t3_404\t32.32\t99\t57\t3\t515\t612\t266\t355\t2e-05\t42.4\n+3_646\t3_646\t100.00\t661\t0\t0\t1\t661\t1\t661\t0.0\t1327\n+3_647\t3_647\t100.00\t287\t0\t0\t1\t287\t1\t287\t0.0\t 564\n+3_648\t3_648\t100.00\t132\t0\t0\t1\t132\t1\t132\t2e-93\t 265\n+3_649\t3_649\t100.00\t144\t0\t0\t1\t144\t1\t144\t4e-106\t 298\n+3_650\t3_650\t100.00\t259\t0\t0\t1\t259\t1\t259\t0.0\t 513\n+3_651\t3_651\t100.00\t415\t0\t0\t1\t415\t1\t415\t0.0\t 834\n+3_652\t3_652\t100.00\t330\t0\t0\t1\t330\t1\t330\t0.0\t 658\n+3_653\t3_653\t100.00\t202\t0\t0\t1\t202\t1\t202\t2e-143\t 397\n+3_654\t3_654\t100.00\t627\t0\t0\t1\t627\t1\t627\t0.0\t1255\n+3_654\t3_520\t33.01\t409\t232\t8\t27\t422\t57\t436\t3e-53\t 194\n+3_654\t3_61\t29.46\t516\t282\t19\t6\t494\t3\t463\t3e-37\t 143\n+3_655\t3_655\t100.00\t979\t0\t0\t1\t979\t1\t979\t0.0\t1941\n+3_656\t3_656\t100.00\t50\t0\t0\t1\t50\t1\t50\t2e-30\t99.0\n+3_657\t3_657\t100.00\t345\t0\t0\t1\t345\t1\t345\t0.0\t 705\n+3_657\t3_170\t31.03\t203\t129\t4\t121\t314\t3\t203\t5e-18\t77.4\n+3_658\t3_658\t100.00\t561\t0\t0\t1\t561\t1\t561\t0.0\t1095\n+3_658\t3_659\t36.93\t566\t300\t18\t1\t555\t1\t520\t9e-88\t 280\n+3_658\t3_433\t25.31\t399\t254\t18\t185\t556\t158\t539\t2e-18\t83.2\n+3_659\t3_659\t100.00\t521\t0\t0\t1\t521\t1\t521\t0.0\t1025\n+3_659\t3_658\t36.93\t566\t300\t18\t1\t520\t1\t555\t5e-89\t 283\n+3_659\t3_433\t28.18\t369\t228\t13\t173\t520\t186\t538\t9e-24\t99.8\n+3_660\t3_660\t100.00\t1201\t0\t0\t1\t1201\t1\t1201\t0.0\t2432\n+3_660\t3_264\t23.91\t368\t237\t11\t11\t377\t11\t336\t2e-19\t89.0\n+3_660\t3_105\t25.10\t251\t164\t5\t14\t255\t4\t239\t9e-18\t83.6\n+3_660\t3_195\t23.00\t387\t238\t10\t14\t387\t4\t343\t9e-13\t67.4\n+3_660\t3_99\t31.65\t79\t51\t2\t287\t364\t260\t336\t4e-05\t42.4\n+3_661\t3_661\t100.00\t1303\t0\t0\t1\t1303\t1\t1303\t0.0\t2632\n+3_661\t3_194\t32.78\t299\t193\t4\t1\t296\t1\t294\t9e-40\t 155\n+3_661\t3_194\t28.22\t202\t103\t9\t738\t911\t532\t719\t3e-08\t53.1\n+3_661\t3_106\t29.05\t327\t215\t6\t15\t326\t17\t341\t3e-35\t 140\n+3_661\t3_106\t28.50\t200\t120\t7\t726\t916\t530\t715\t6e-12\t64.7\n+3_661\t3_265\t30.67\t313\t208\t6\t5\t315\t12\t317\t1e-32\t 132\n+3_661\t3_265\t32.95\t176\t100\t4\t738\t903\t541\t708\t1e-17\t83.6\n+3_661\t3_369\t26.72\t232\t153\t6\t6\t235\t21\t237\t4e-18\t85.1\n+3_661\t3_369\t28.19\t149\t84\t5\t1009\t1153\t718\t847\t2e-05\t43.5\n+3_661\t3_489\t28.09\t235\t151\t5\t3\t235\t2\t220\t7e-13\t68.2\n+3_661\t3_98\t24.83\t286\t182\t10\t15\t296\t31\t287\t2e-10\t59.7\n+3_661\t3_98\t25.55\t227\t136\t9\t1045\t1238\t864\t1090\t3e-04\t39.7\n+3_662\t3_662\t100.00\t284\t0\t0\t1\t284\t1\t284\t0.0\t 546\n+3_662\t3_622\t26.21\t206\t142\t5\t20\t217\t20\t223\t4e-07\t45.4\n+3_663\t3_663\t100.00\t204\t0\t0\t1\t204\t1\t204\t3e-144\t 400\n+3_664\t3_664\t100.00\t160\t0\t0\t1\t160\t1\t160\t3e-110\t 310\n+3_665\t3_665\t100.00\t520\t0\t0\t1\t520\t1\t520\t0.0\t1018\n+3_666\t3_666\t100.00\t321\t0\t0\t1\t321\t1\t321\t0.0\t 632\n+3_667\t3_667\t100.00\t637\t0\t0\t1\t637\t1\t637\t0.0\t1248\n+3_668\t3_668\t100.00\t822\t0\t0\t1\t822\t1\t822\t0.0\t1656\n+3_668\t3_27\t24.63\t735\t438\t16\t18\t657\t34\t747\t8e-50\t 184\n+3_668\t3_645\t22.37\t854\t418\t29\t6\t711\t3\t759\t3e-25\t 107\n+3_668\t3_404\t24.08\t191\t112\t7\t30\t220\t2\t159\t2e-06\t45.8\n+3_669\t3_669\t100.00\t359\t0\t0\t1\t359\t1\t359\t0.0\t 716\n+3_670\t3_670\t100.00\t867\t0\t0\t1\t867\t1\t867\t0.0\t1732\n+3_671\t3_671\t100.00\t609\t0\t0\t1\t609\t1\t609\t0.0\t1212\n+3_672\t3_672\t100.00\t112\t0\t0\t1\t112\t1\t112\t4e-75\t 217\n+3_673\t3_673\t100.00\t47\t0\t0\t1\t47\t1\t47\t1e-28\t94.0\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/proteomes/Mycoplasma_agalactiae.faa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/proteomes/Mycoplasma_agalactiae.faa Tue Oct 24 06:40:40 2017 -0400
[
b'@@ -0,0 +1,5438 @@\n+>gi|290752267|emb|CBH40238.1| Chromosomal replication initiator protein DnaA [Mycoplasma agalactiae]\n+MNINSPNDKEIALKSYTETFLDILRQELGDQMLYKNFFANFEIKDVSKIGHITIGTTNVTPNSQYVIRAY\n+ESSIQKSLDETFERKCTFSFVLLDSAVKKKVKRERKEAAIENIELSNREVDKTKTFENYVEGNFNKEAIR\n+IAKLIVEGEEDYNPIFIYGKSGIGKTHLLNAICNELLKKEVSVKYINANSFTRDISYFLQENDQRKLKQI\n+RNHFDNADIVMFDDFQSYGIGNKKATIELIFNILDSRINQKRTTIICSDRPIYSLQNSFDARLISRLSMG\n+LQLSIDEPQKADLLKILDYMIDINKMTPELWEDDAKNFIVKNYANSIRSLIGAVNRLRFYNSEIVKTNSR\n+YTLAIVNSILKDIQQVKEKVTPDVIIEYVAKYYKLSRSEILGKSRRKDVVLARHIAIWIVKKQLDLSLEQ\n+IGRFFGNRDHSTIINAVRKIEKETEQSDITFKRTISEISNEIFKKN\n+>gi|290752268|emb|CBH40239.1| DNA polymerase III, beta chain [Mycoplasma agalactiae]\n+MKIIINKNFLDDIIEVVSRFSDPISSLYGMRCIKITANHNFVKFEATNEITNIVKKIKVDDNKIIVEEDG\n+ELLVQANYFKNIIKKLNGFIEIKTYFNKMEIKQQDSVYTLTLNEISSFPQIDENINIKKFQINTEEFKKA\n+VKNVAFAASNGANLIYKCINFKSSGNKLNLAATDTFRLAYYTIKTNQILEDFDFSVNAKDVKELLPTDVP\n+KTVTMFYNSIKFGVEYDDTTITARITDLPYHNVEQLFNKAISETKHKITIEKSEFNNLLNKIWINSSADK\n+QNRIELKISNQEINVYTKIDELGDSNVRTAKFTLEGSPFVFDMNFNYLKDAISITEGETYILIDEKIQNI\n+VLFSKDNPNSKQIITPLRR\n+>gi|290752269|emb|CBH40240.1| Esterase/lipase [Mycoplasma agalactiae]\n+MKPIYKYNVVFKDNNNPNENIIFCHGLNSTADRFDIFKNYWTKSNYYSLQFPASNLTPVLDGDEPSVFCF\n+AKLLVEFVEKNNLKNVTLIGHSLGGGTISLAYQLRPDLFKKLVYLAPMNKPALALYDRYKKDYFPKDYEG\n+FLDLMRSLYYDISKFTSDPNWVKEQKENFDPYLYNNPDIVKLGTPDMNVFNAIEETLKIVKVPTLLILGE\n+KDGVILREECIDYFKKYVKDVETHWIPKTGHMMYLEDWDSFIKILEPFLDK\n+>gi|290752270|emb|CBH40241.1| Esterase/lipase [Mycoplasma agalactiae]\n+MNVIYKYDFVFKDNNNPDENIIFCHGFNSSPNSFKIFENYWTKSNYYALQFPGNNHTEIKEGDEATVECY\n+SDLLIKFIEDNKLKNIILIGHSMGGGTISLAYQKRPELFKKLIYLAPTNKSSQNVTEAFLRDYFPKTFDE\n+FIGFFKSLYYDVTKFTSNESWMRLVKNTFDPYDFNNPTIVGLGQYLISNYFHDKLELALQSVNVPALLIL\n+GEDDGVVDRDLCINYFKENVKGVQSLWMPKTGHMMFEEDWENFIKIVEEFINRSELASPKAL\n+>gi|290752271|emb|CBH40242.1| NADH dependent flavin oxidoreductase [Mycoplasma agalactiae]\n+MNKYEQLFRPFKLGNYSLKNRFVLSPMTLSLATKDGKVTIEEEKYSARRADCAPLLISGGTYFDDFGQLF\n+EYGYSAKSDDDIESLKKLAKAMKSKGNIAILQLAHAGKFSKASLKKYGYLYGPSYEKNHIPVEHEVFELS\n+ISQIKQIVKDYASATKRAIAAGFDGIEISMAQRLLIQTFFSSIVNKRNDEYSSDSFENRSRLCLEIVEEI\n+RKMINQYADENFIFGFRATPEETYGAELGYSIIDFIQLIEEIIKKGKINYLAIASWGHDIYLNKVRSENE\n+YKGQLVNKVIYDKFKGILPIISSGGINTPQKCLDALEYSDLVGLSSVFVADPEFVQKIENDQEDKINLNI\n+SFSQLKDLAIPESSFKGIVEMFGFCETIPTESLKTLEENSKS\n+>gi|290752272|emb|CBH40243.1| Lipoate protein ligase A [Mycoplasma agalactiae]\n+MILVEPIRNGKYIKDGAYYLATQIWALSHLKFDEIVAFPAVLDPYVQIGYFQNPEVEVNFKYLKEHNIPI\n+VRRDTGGGAIYIDSNQMGVCYLIPYKDNESILGNYEKFLEPAIKIIKELGAKNVVQSGKNDLTIDGFKVS\n+GAAMALIGDTIYGGNTYIYKIDYDAMSQVLKPNRKKIEAKGIKSVRQRIAPLSDYFNEPYKNMDIFEFKD\n+LVVKKLFNVDDLSNVKRYVLTENDWKQIDELVNAKYKNWDWNYGLSPRYEYNRDARLAIGTINFSLAVKG\n+QRIERIKISGDFFAKADINELEKSLVGIKMDYDELSNAIKQANLEKYFFNEISVDDVVRTILSEDDNE\n+>gi|290752273|emb|CBH40244.1| Lipoate protein ligase A [Mycoplasma agalactiae]\n+MILVEPIRNGKYVKDGAYWLAIQIWAMNHLRLNEKIVFPGIAAPHIQLGYFQNPEVEVNFKYLKDHNLEV\n+VRRNTGGGAIYIDDNSVNVCYLIPYDEKDNILGNYDKFYEPTIKMLKELGAKDVVQSGKNDLTIDGRKVS\n+GAAMMLNGDVIYGGNSLLYKVDYDAMVDSLKPNRKKIEAKGVKSIRQRVAPLSDYFDEPYRNLDIFEFKD\n+LVIKKLFGVDDLSKVKRYELTEEDWAQVDELVNTKYKNWDWNYGLSPRYEYNRDARLAIGTINFSLAVEG\n+QRIEKIKISGDFFAKKDITELEKALVGTKMTYENLVKAFKDADLQSYFFNEIKAEEVAKIILDEE\n+>gi|290752274|emb|CBH40245.1| Conserved hypothetical protein [Mycoplasma agalactiae]\n+MHTLNSVKELDSLINEADAIVIGIGSGMTSADGIGYSGQRFVQNFKDFIDEFKFLDMLQASVYHFDDIQN\n+YWAFHSRFMKLNYFDQPASESFLKLKEYLKGKNYHIITTNSDNSLEAADFEEDKIFYIQGKYNLLQCSKM\n+CHNTLYSNDKAVYEMIEKQKDMKVPLELIPRCPKCNNFLEVNKRLKGKGMVEDKRFFEEKKMYEDFIYRH\n+KGQKILFWEIGVGFSTPTLIKFPFWEMTKEFSNSKYVAMNNKSYRTPQEIRQRTYVWTDDIKQTINKLLE\n+VKNDFSRAN\n+>gi|290752275|emb|CBH40246.1| Glycine cleavage system H protein [Mycoplasma agalactiae]\n+MKKVVKYLVVEKLEGKDQFYLRFTPEMQDDIGTIGFIQYKNTDKKVLHKDDIFLNLEASKAILTLKMPFD\n+ATVVEINKEAMANPKLLSSPKDSENWVMILSDIDPKTLEQLEDF\n+>gi|290752276|emb|CBH40247.1| Conserved hypothetical protein [Mycoplasma agalactiae]\n+MKISILDHGLLTDQNNYEKAYKEVIELCQYVKDLNLYSFWISEQHNVNSLVISSPLILLDHLANSVSGIK\n+LGCGGIMLANYQAYNVAEQIQTLNLLHPERFIYGFGSNIGTKETIELLKPSLTSTEYQQKIIAVNEYLNN\n+KKKFDFKINPNINKPVDIVMLVTSEQSAIFAAQHKFKINYGWFLNPSK'..b'SILQNIDFNVLSNYLSEHLTTNYFEYKKSDLDYESNKEKVL\n+REKVALKTIRPKDGMMALIYGLFYNPGTNREFKANLIKMFNLSDKVSTIKVENGSGSVVTPDSDEEKLSF\n+SDFLAFFPALLSADQSKTIFKNQQINNDISYAKEHILKVMSAKGNSVGLHELDIKALEILKKFNIITNEI\n+TIDKKVIEKLNKVQSFIVQTTTSLDEKTKIVSETNKTLADLIYDFNSFDEGDESWKVWKGVIGSYGQASV\n+VNKFSLGAQAFDLLIPWINMLTYSNNATQKEALQFVNDFLKLSIDKSILEEINKLAQDENLPNFNSTNFG\n+LSIALHRPEQVTVFNESNGKFTNAKVEELASKNPKFRRYLSSQKRSLIELLGLIGASQQYSKYDKQPAET\n+GKIYAPNGIYYETIKKAVDRYFSTKEFWEIKDIVLLIARSMQINFPIELLGLSRIIINPVLRSMYPQLMT\n+SFLSTQKQSLGKINGNLAYIVSNRIGNFEEIIRDNSKKLELEAYFEQIWSNKDTSLVPLDYSEEITLALD\n+GARVNKIFNEQTKKVTIFGIDFLNLAGRVVNGIVEPKELKDIVFNDINSYYAKVNYAYLSKNNKAIYNGE\n+LPRNNVEMESLLNTIDDKYILDVNGIKFLIVGEDTTVDYIYPVIDENHLQVNTQNQALVYLNNYGFSRIM\n+AAYQGNVVKKNLLVVNGSKNSNEVVKRNITNIVDSSISDANKLKRVFSYDELDPINPERALRITTIEGMI\n+NVISSSIIALMSLFIIMVSVAIIFIIRRYIANKAKVFGILLAQGYRPIEIAISLLPFAMVTSLIGGILGY\n+SIGFRTQILLQNVFSNYWTLPKSAIPFDFFSLFFNVFIPFLGMSLLIIVVALISLRKSSIDLITGVDDAP\n+RGKLFNKIKKKFINKKNVKKRFSFTLAYSGFWKLASFGGSVLLTSIATMFGLANYKTFNNTINDTYKNRD\n+YRFKIDLESPTTEGKYYSLYNPSELKDLIYTPIGSLNEGNRETADYFKPGKSSIINPDNKANGNPGEFAP\n+HLLSQFSVNVTVDAGVAADPWLIAYNGMPDSQKAKIDKIRDLVGHQLEWTQSLDENGKLITDPNKPIIKV\n+DSNGLMSYEDASGKKYDFFKYYKSPNDKQGSFRLAHWDAANKEYIMKTIKTGDSGGRNEYRDFLVKAYQK\n+NDIVRMQHEKLLAEGKELINPITNWKESRSDSDFWLVDKSDLDRQWVNDYFIGFGGILFDKHYDETYTYI\n+SGSYNNISSKIYGYRKPEDIKSAKVKLIDKNGENLYDALYNFKIENNVYPLVVNDVFAKKHKLGIDDQID\n+FVISNRVDRYRQKLLEKIYANNPIKQADLKKQYDQNIKTKFRIVGINPTYINDELITTHSAANLLVGLPD\n+NESSFNGVLTQNANPVQVTESAGLYSPSGYWAGLDGFDVSSLDQGTVKKMFDEIFKVSDIPEKGGVLQSQ\n+HGFTKDEIAKFLDPKAEKFSDSLYESAKNSAKAHIEDFSRIYENKLFIALSNSIDSRDIEVGFVVQVGHT\n+IEQISIFIIVINFVISLIILIIMSSIIVSENERNIAIWSILGYSQKEKLMMFFGAFIPFLVAALIISIPI\n+VIAMINVFGSFLLSSSSIALLLSLKWWHVLITSGLMLIIFAVTSISVWISINKMKPVDLLKGK\n+>gi|290753083|emb|CBH41059.1| Cell division protein ftsH homolog [Mycoplasma agalactiae]\n+MENERKQKIAKIVLWTILSAVILLIITLLLWNRFKPQVRQGNFQDFVNDIVAASKSVDDNTYLAEVKIDG\n+VQDIAKYTFVENGIAKLREVSLGKGIVEKTFILPDKFTIGDKTYNIADLLKHPGADANVLSTQWSTVGLV\n+LEKPNTFARIALSVLPTLLWIIILFWLYRSMMKRSMNMIGAIGDEKNPAQKIKSDKTFKDVAGNKEAVEE\n+IKEIVDYLKNPKKYEIAGARMPHGILLGGPPGTGKTLLAKATAGEANVPFYFISASNFVEMFVGLGAKRV\n+RTVVDEARKNAPAIIFIDELDAIGRTRGSGIGGGHDEREQTLNQLLVEMDGMKDNNGILFFAATNRTDVL\n+DPALTRPGRFDRTITVGLPDVKEREEILNLHAKGKRVSPNVNLAQVAKRTPGYSGAQLENVINEAGLLAV\n+RRDSEIIERDDIDEAIDRVMAGPAKKNRVITKSELTMVAYHEAGHAVVGIKMPGANKVQKITIIPRGQAG\n+GYNLMTPEEEKYNLTKKELIAMITSFMGGRAAEEIIYGKENVSTGASDDLHKATKIARKMVTEWGMSDLG\n+PIQYEQDEGSPFLGRDYLKSAQFSAQVAHEIDIEVRNIITEAEKKAKEIIEENRELHELIKTALLEKETI\n+VAEEIEYIAKNMKLPSESKEEKAENVNLTIDDILDGKSEEKGETM\n+>gi|290753084|emb|CBH41060.1| Conserved hypothetical protein [Mycoplasma agalactiae]\n+MILLGVSGGPDSMYLLDLISSQRSDIVVATVNYNVRHDSAYDAEIVRKFCEDKDIIFECLEIDQKARFKG\n+NFEKWAREQRFSFFKKIYEKYNCETLYLAHHKDDFLESYFMQKESKRQPDFFGIKTENYIYGMKVVRPLV\n+DKVFKNEILEALHNKKIKYANDYTNDLPIYTRNRIRIWLKSLSNSQKSKIFDDIQKENNELAVLAQDTVL\n+EYEHWKKAQFSQDEFLNLSNKERLVYKFVHENYVDIKLSNRKIKSIISFILSNNRTSQYLIKNNVFIQKK\n+HGKLVF\n+>gi|290753085|emb|CBH41061.1| Peptidyl tRNA hydrolase [Mycoplasma agalactiae]\n+MKLIVGLGNPGNEYRFTRHNAGFLAIDKICEKLNISLNKEKFNGEFVVSDGFILAKPLTYMNKSGDFVYS\n+IASFYKINPSDIIVIYDDLSFSIGQAAIKIGGSSAGHKGIDSLMSKFSSNDFKRIRVGIGVNSGTTIKDY\n+VLSLFTKDEMIVVEEVLEKVADAAISLVYNDVNFVMNKFNTDNKKRVI\n+>gi|290753086|emb|CBH41062.1| Exodeoxyribonuclease V alpha chain [Mycoplasma agalactiae]\n+MFMSNESNSGAIRLKGKFLVVKWSGADNNIPRELWIFESSPERERFFIYTNKQELKSSCFYEIEVKLRAS\n+KRSKYQNSTYELLSFKIVSPDNDSDIEKMLVSNVAGLGVKGIQRIKSELGLSSIKELFDDVESAQNVLKT\n+AIYENLKAFINSFDQKDYDFFAENGLLKLYDKLRARFENNDFVSRYKNNGDPYELYVDHWIDFKLVDLFA\n+QCVNKNIEPYKIIRAFTYKILRTNFNNICTMYYDVLPFYKSLWNWYEDYRRDNSENSTLFEQSYVVSLLS\n+LLLQKRDISDDLIIESLNVMIQRGEVYFDSDSKRLSLNEVYEQELFVAKKLIKIRDSELKQQIIPLPSQK\n+LADEQKKAYASALNNPLSVITGYPGTGKSYLIAYIVETLLKDKHYKKKDIAVLTPTGRASTILAYKTGIE\n+ARTIHSFLKLSKSDEDDSFIESFEKENPIKVVVIDEFSMVSLPIMYELLKTCTSIERLILVGDRDQLPCI\n+GKGNLLEDIINSKKFPTFVLEEIHRTDKIDIFKHFIAINDNKVPKIDTENVKFIEQNGIQFLNNIVKIYE\n+EKVNKYSIDNVIILLPSYLELGQPGINEVNKRLQEWNIKRTGAKKNLSIHNNLTLFVGDRVIQTVNDYDK\n+NVFNGEIGIVEEINTDSKNTFIIVGFGQDKKVRYNRSEILENLTLAYAITVHKFQGSEASCVIFGILKNR\n+VEHMFTKKFMYTAVSRAKEELLLLGSKDLYIQKIQSRNADLKHYTNLKSLIEKEAK\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/proteomes/Mycoplasma_gallisepticum.faa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/proteomes/Mycoplasma_gallisepticum.faa Tue Oct 24 06:40:40 2017 -0400
[
b'@@ -0,0 +1,5394 @@\n+>gi|284811831|gb|AAP56351.2| ParA/Soj family protein [Mycoplasma gallisepticum str. R(low)]\n+MIISFINNKGGVLKTTLATNICGVFSKFFPKSRSVIVDLDGQGNVSATFGQHPERLKNTLIDIFRGEKDI\n+DDCVLNVFPSIDILPSNHELSFVDMDVARKEYKLSVIKNLIEKLEEMYDFVFLDTPPAMSTIVSVSMHIS\n+DMIVIPFEPDQYSILGLLRVIDTIETFRERNEDLKVLVVPTKVNARTRLHNDVLNIVKTKLSKKNIPLSK\n+NIVSFTTKSSASVGYEKLPIVLINQRSKYQEEYIEITKEIINLLKDNKNNEK\n+>gi|284811832|gb|AAP56352.2| unique hypothetical protein [Mycoplasma gallisepticum str. R(low)]\n+MKNKKAKKKERRFTDLSADLDEEVEKIDPEYEDFKEIKIEKNKDNQVIDKNDPFFYSESFEEARIQLIKD\n+KKVEVKKEEEKVQETTVKNKISEAKKEEAKDVYIDSSLEIASQEPLTKGMHFYTNSRIIRKVRECAKNKG\n+LSISRLITMILDKSIKEE\n+>gi|31541051|gb|AAP56353.1| chromosomal replication initiator protein DnaA [Mycoplasma gallisepticum str. R(low)]\n+MKTKLKRFLEEISVHFNEANSELLDAFVHSIDFVFEENDNIYIYFESPYFFNEFKNKLNHLINVENAVVF\n+NDYLSLEWKKIIKENKRVNLLNKKEADTLKEKLATLKKQEKYKINPLSKGIKEKYNFGNYLVFEFNKEAV\n+YLAKQIANKTTHSNWNPIIIEGKPGYGKSHLLQAIANERQKLFPEEKICVLSSDDFGSEFLKSVIAPDPT\n+HIESFKSKYKDYDLLMIDDVQIISNRPKTNETFFTIFNSLVDQKKTIVITLDCKIEEIQDKLTARMISRF\n+QKGINVRINQPNKNEIIQIFKQKFKENNLEKYMDDHVIEEISDFDEGDIRKIEGSVSTLVFMNQMYGSTK\n+TKDQILKSFIEKVTNRKNLILSKDPKYVFDKIKYHFNVSEDVLKSSKRKKEIVQARHICMYVLKNVYNKN\n+LSQIGKLLRKDHTTVRHGIDKVEEELENDPNLKSFLDLFKN\n+>gi|284811833|gb|AAP56354.2| ABC transporter component domain protein [Mycoplasma gallisepticum str. R(low)]\n+MRVNIFERYQSFSVKNTDKFEKASVLTRMTTDINFIHQSIQSGRTAIRGMSVFLFSLVLMFVTS\n+>gi|284811834|gb|AAP56355.2| ABC-type multidrug/protein/lipid (MdlB-like) transport system component domain protein [Mycoplasma gallisepticum str. R(low)]\n+MPVIIGGILLVYRFVIGNYKKLFKQYDQLNNLAKESIAGARVVKSYHQQDNEIQKFNRVAGFIYKNFTKI\n+ERITALISPIVLFCIYALAIAIAWIGTNNIVDGKLDIGSLASVFAYAFQMLINLLLLSVVYVTIITAKPS\n+KDRIIEVLTEKIDIKDKKYAIDTVSDYEVEYKDVSFKYVDTNPHHNLEKINIKIKKGQTIGIIGSTGSGK\n+TSIVNLLTRLYECNEGQVLLNNIQLNNYSIKALRDAIAIVPQKSILYSGTIKDNILMGGNYSDEEVEKAI\n+TQAQAAEFINKLPNKLDSIVEQKWN\n+>gi|284811835|gb|AAP56356.2| ABC-type multidrug/protein/lipid (MdlB-like) transport system component [Mycoplasma gallisepticum str. R(low)]\n+MSHKKERNAQKKKYFKELLRFIWKNKKWHLLIAFFLIIISSITLVLVNNFIKDLIDDYIAPLLREKSTGK\n+PLDFSGLIKYLSIIGLIFILGVLSNIISGQIMAKATHATLFKLRNNMYVHMQGLPIKYFDTTKHGDIMSY\n+YTNDVDTVRNLIVQIIPQSFQALVQIVVIFVFMLQISIVLTLITVLLLLPMLIFFGFFGKKTRVNFVANQ\n+VEIANLNGVIQEYIETQMISNLFNYSDQVIHKFKLANNKQAAIMKKANVLASIVFPVIFNYSNVMYIVVA\n+IASVFLFESYQNKPILGQQITLRVIVSFVALVRAFVGPLANISENVNFFARSKAGAERIYTMLDEKLEEN\n+KGKIILDYIEKYENGNWRIANKWTKQIGWVINGEIKPFQGKVEFKNVNFSYDGKKQVLKNINISGYPGEK\n+IALIGKTGSGKTTIANLISRFYNVSDGEIYFDDIPISSVDINSIRKTVGMVLQSTELFSGSIRDNIAYGN\n+KEAKLEDIIEAAKLANAHDFIMALPNEYDTYITNNGEGLSQGQKQLLTIARVSSMNPTIMVLDEATSNID\n+SRTEKVIKESMDKLMQNQTTFAIAHRLSTIKNFNQILVIQEGEIVERGNHEQLMAKKGLYESFYHSSFSD\n+EMS\n+>gi|31541055|gb|AAP56357.1| 50S ribosomal protein L34 [Mycoplasma gallisepticum str. R(low)]\n+MKRTYQPNKRKRAKTHGFRARMATASGRAVLAARKRKGRHILTVSDEAR\n+>gi|284811836|gb|AAP56358.2| ribonuclease P protein component [Mycoplasma gallisepticum str. R(low)]\n+MKRENSLKKITNFLELVKSKNKYYSNNYVIYAEKNRENKIKIGISVSKKLFAKAVIRNKIKREVRSFFDD\n+FTDWSKSLNILIKINNVNYLTNSYYLAKKEEFFDTYKKVVQKFKTI\n+>gi|31541057|gb|AAP56359.1| putative inner membrane protein translocase component YidC [Mycoplasma gallisepticum str. R(low)]\n+MNKVHSEIKTQSFNPFWNAATLKEKSRIDPNLKKALSYLWKFLKICVFLFLTVIGLWGCTQTYSEPWTVS\n+NPRIGVGLEIGYNYGVTGDYRYDLTSSNIGPYFSFANYQLSYGPFLAWFVWPASQIILPILYQTRVPLTQ\n+GIDYGLNTILAILILLFIIRLITIGITLNSTLNTERMGEVQGKIAEINAKYKNATDTQSKKMKQIEVMHI\n+YKKHKIKPAALFVQGFVTIPIFLIVYKMVSLTRPIKATILFGIWDLSVTPGTEIISDISRNWVYIFFVLL\n+VVPMQIVSQWLPQFWATRRNRNAKTTSQKGLEQLKKTRRIQWILIFVFALFPVITPSAVGLYWFLNSIFT\n+ILQSYITHVFIVKRRQRTKTISRLDQILNRELD\n+>gi|284811837|gb|AAP56360.2| dimethyladenosine transferase [Mycoplasma gallisepticum str. R(low)]\n+MINKINKFFKNNEFSPSKQRGQNFLIDQNIINNVVEAVSKINPSKVLEIGPGLGAISEQLIKRFADNYYA\n+IELDKKLFHHLNERLLKDHILHADALEIDWKSIFDNLGDNPTMVGNLPYNISSKLIKKFILSTYRCAIIM\n+VQKEMGLRLLAKINSKDYSAFSALCQYSLSVSKIIEINETAFIPQPKVRSTLLFLEKKDIAFNEGYEKFL\n+KLIFLSRRKTILNNLKNNYDPKLIIQSLVSLGFKKTSRAQELSPTQLFSLYESLSKLC\n+>gi|31541059|gb|AAP56361.1| diphosphocytidyl-2C-methyl-D-ery'..b"NYDKTNIYKYLINKKKQFVLVGNKVDEVDPTLNTG\n+EIQIKISAKNNDISDLIKYLEETSLAIFNDENKQDSIFQEEWQINLLQTALYNINLILNDPNQYHDLVIQ\n+HLNEANNSLLKVLSEYEDYNLIDEIFKNFCLGK\n+>gi|284812297|gb|AAP57070.2| DNA polymerase III subunit delta' [Mycoplasma gallisepticum str. R(low)]\n+MNLTNKYIPILLFENKGCYLKKYLEEYLINIVCTEANKPCKKCVWCSKIINNGYYDLIHVYPHNNVIRKQ\n+EIIDIQNKFNNTALESRGIKIYIIHQIEKANKESLNSLLKFLGEPKDNTIGILTTRKPYGVLDTIVSRCV\n+RYSTNSYEEKVEFKNKYKPKELELIKIMFYSYDDILQYESTKDIFKLLELIHLLELNNKKFDQIIKIRDL\n+FEKIDYYEISLVLNYLIFTGDFKRKSKLIPILNNLNLNLSKNAILISIID\n+>gi|284812298|gb|AAP57071.2| Thymidylate kinase [Mycoplasma gallisepticum str. R(low)]\n+MKKGVFIVIEGVDGSGKSSFLKRMMNEHTMINSQPIIYSREPGGCDTSEAVRELIMKLSNSDPLTEALLF\n+CASRNEHLKKKILPALNENKIAICDRFVVSSWIYQGLIKNAGYEKVKKINEYVTDGLEPDLTILFDVDPE\n+IAAKRISERSTMNHLDAYTKERINKIRNAYLERLKDNKKAKIINASLDLDTVYDQVVNIITLFVKNHELN\n+>gi|284812299|gb|AAP57072.2| Seryl-tRNA synthetase [Mycoplasma gallisepticum str. R(low)]\n+MLDKNLLKTNSKEIREQLKSRSFNLDWYDEFLRLEKQLSTLLRTIEKLNEQKNINAKKAATTESDAQRKK\n+LIQEGGLLRAELEKNEAKYNEIKEDFDYIYQRIPNLPTEDVPIGKDEKENVEMFKSRKPTFFDFKPLPHY\n+ELATKLEMIGLDVASKITGSRFSIYKKDGARLMRAIQQFCLYVNADKYEEYLPPVIVNKDSYYGSGQFPK\n+FVEDVFKLEGTNYYLASTAEVQLVNLHRNEILKEADLPKYYTASTACFRSEAGSAGKDTKGLIRQHQFYK\n+TELVKIVHPSTSKQEHEAMAKDAEKILELLELPYRRMVLCTGDMGFSATKTYDLEVWIPSENKYREISSI\n+SNCGDFQARRANIKFKDAISKKNLYVHTLNASALAHDRLFVAIVENYQQKDGSIKIPKALVKYFGKEYIK\n+>gi|31541774|gb|AAP57073.1| DNA gyrase subunit A [Mycoplasma gallisepticum str. R(low)]\n+MNPNDKNNIKELLNKTVVKEASITKELETSFMEYAMSVIVSRALPESRDGLKPVHRRVLYGAYTSGLTHD\n+KPYRKSAQIVGHVMGKYHPHSDSAIYETMVRMAQPFSLRYMLIDGHGNFGSIDGDSAAAMRYTEARLSKI\n+SAEMLRNIDKDTVDFVDNYDASEQEPIVLPSLFPNLLANGSSGIAVGMATNIPPHNLSELIGGIKHLLVN\n+ENATIEELKEFIKGPDFPTAAEILGETGINEYFNTGRGSVSVRAKSEIEELANNKSNIVITQIPYMVNKA\n+NLINKIAELVKTEQIQGIADLRDESNREGIRIVIETKRDVIPEVLLNQLYKSTQLQTNFSVAMLALVNNQ\n+PKVLNLKEALQIYIDHQFDILLRKTNFELKKAKASAHIVEGLVIATNNIDDVIETIKNAKDNEDAKNTLM\n+TKYELSDLQAKAILDMRLRSLSGLERENLQKELAKLKELIKDLEEILQNKERRIKIISDQLDEIDHKFGD\n+ERRTKICYGLNSTIDNEQLIPVETVVITRSSKGYLKRIPISAYKVQHRGGVGVKGMNTYEDDDVESLIVC\n+STHSDLLFFTNYGKVYRIRAHQVPLGSRISKGIPAINLISIEKDEKLMSLLSINDYDSGYFFFSTKKGLV\n+KRVKASEFSRIQNNGKIAIKLTENDSLFKVIKTAGDEEIYIGVSSGLLVRFKEDVVRSMGRTAQGVIGVK\n+FKNPNDEVIGLSSSHEGSLLLAVCEKGVGKMTDREEYRMTNRGSKGVITIKVTPKTGNIINTQLVNGNEE\n+LLMISSTGKIVRVPLAEVSEQGRNTSGVKLISLNEKETLQSVAIFDVEQDDSQQVGSDNPDTELSSDDSN\n+QDQDKE\n+>gi|31541775|gb|AAP57074.1| DNA gyrase subunit B [Mycoplasma gallisepticum str. R(low)]\n+MNNTKKDQYSSQSIKVLEGLSAVRKRPGMYIGSTDQKGLHHMIWEIIDNSVDEMMAGYGTTVKLTLKDNY\n+LVEVEDDGRGIPVDIHEKTNKSTVETVLTILHAGGKFDSDTYSMSGGLHGVGASVVNALSSSFKVWVNRD\n+YKIHYIEFKDGGVPLKPLEIIGTDSKKQGTRIQFVPDFSIMEQFEYDETIIADRIEQLAFLNKGIKFIFN\n+DERTDKKTKQEWLYEGGIKQYVENLNASKEPIIPQIIYGEKKTKVTLPKRNLEVTMLLEVAFQYTNGYYN\n+STYSFCNNIHTNQGGTHEEGFKNALYKIINRYALEKKFIKETDGKISKEDLSEGLTAIISIKHSEPQYQG\n+QTKDRLGNTEVREFTNSVVSELLERFFLENPEEAAKITAKAVSAMFSRKRSEAALESARKSPFESASLPG\n+KLADCTTKDMEISELYIVEGDSAGGSAKSGRDRFYQAILPLRGKVLNVEKANHEKIFKNEEIRTLITAIG\n+AGVNPEFSLDKIRYNKIIIMTDADVDGAHIRILLLTFFFRHMFPLIEKGHVYIAQPPLYRVSYNKQNKYI\n+YSDAQLEEWKNQNPNVRYELQRYKGLGEMDDVQLWETTMDPEKRTLLKVSINDAANADKTFSLLMGDEVS\n+PRRDFIEKNAKSVKNIDF\n+>gi|284812300|gb|AAP57075.2| DnaJ-like molecular chaperone [Mycoplasma gallisepticum str. R(low)]\n+MTLYELLEVDQNATLSEIKSSYKRLAKKYHPDVNKNGHDKFVQINNAYSILSDEVQREKYDFMLDHENSK\n+TFEFSADGLTYEYSGVEVWHENFTKNVSLTQQWDFNPSNYYYEEYNLYHKFDKISIDGLGAFLDFDISCA\n+FYELDTSFSLPNNLVKRLINRPDVIRYDISENELIEYLKHRYDFSSWLLLKKYFNIEAIIEVTQEEIDSQ\n+KIINIPIKIKVINLNRSFEIWHEELRNYAFIVPENTKTGDISEFFGKGNVALGWQGDLIVRFKVVPSVEK\n+RLKIFSSMLNNEKSSLWFLVPSENNKNPNTKIFNYKTYQFNN\n+>gi|284812301|gb|AAP57076.2| DNA polymerase III beta subunit DnaN [Mycoplasma gallisepticum str. R(low)]\n+MKFFTSKSSFLEAIKFSSNFSSDNNFEQLLKNLYIKIDNKECKIYSSNGQVSSIYKIEDDIDVEEEGEVI\n+VNAKKLITIIQSIVSDNFTLAKLDNQLIIRAGKMQTSLNLEEDVSYPEIEIDDSNFSVIDVDSFLFAKSI\n+KKVIHSTSFQTTKNSISSAINFQKEADDMNIWITGSDAIKLSSCYYKVNDTEDALKAKFNFSVNALSLSY\n+VAAFLKDKDQLLLKISKKSDKVVLTNNKFVLYLRVENEPFPEFKKILNANKVVSSFVVDKDLISNNLHAL\n+TGVLSLSDQGKNNADANFEILKNTLRISTNSFDIASYNSEFDISEFQGEVKDINLNPFYLQEHIKMFESK\n+DIEFKLLLQSAISGCILKVCEKNNDQFKLKFVQVLAPSSTN\n"
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/proteomes/Mycoplasma_genitalium.faa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/proteomes/Mycoplasma_genitalium.faa Tue Oct 24 06:40:40 2017 -0400
[
b'@@ -0,0 +1,3211 @@\n+>gi|84626162|gb|AAC71217.2| DNA polymerase III, beta subunit [Mycoplasma genitalium G37]\n+MKILINKSELNKILKKMNNVIISNNKIKPHHSYFLIEAKEKEINFYANNEYFSVKCNLNKNIDILEQGSL\n+IVKGKIFNDLINGIKEEIITIQEKDQTLLVKTKKTSINLNTINVNEFPRIRFNEKNDLSEFNQFKINYSL\n+LVKGIKKIFHSVSNNREISSKFNGVNFNGSNGKEIFLEASDTYKLSVFEIKQETEPFDFILESNLLSFIN\n+SFNPEEDKSIVFYYRKDNKDSFSTEMLISMDNFMISYTSVNEKFPEVNYFFEFEPETKIVVQKNELKDAL\n+QRIQTLAQNERTFLCDMQINSSELKIRAIVNNIGNSLEEISCLKFEGYKLNISFNPSSLLDHIESFESNE\n+INFDFQGNSKYFLITSKSEPELKQILVPSR\n+>gi|84626152|gb|AAC71218.2| DnaJ domain protein [Mycoplasma genitalium G37]\n+MNLYDLLELPTTASIKEIKIAYKRLAKRYHPDVNKLGSQTFVEINNAYSILSDPNQKEKYDSMLKVNDFQ\n+NRIKNLDISVRWHENFMEELELRKNWEFDFFSSDEDFFYSPFTKNKYASFLDKDVSLAFFQLYSKGKIDH\n+QLEKSLLKRRDVKEACQQNKNFIEVIKEQYNYFGWIEAKRYFNINVELELTQREIRDRDVVNLPLKIKVI\n+NNDFPNQLWYEIYKNYSFRLSWDIKNGEIAEFFNKGNRALGWKGDLIVRMKVVNKVNKRLRIFSSFFEND\n+KSKLWFLVPNDKQSNPNKGVFNYKTQHFID\n+>gi|1045671|gb|AAC71219.1| DNA gyrase, B subunit [Mycoplasma genitalium G37]\n+MEENNKANIYDSSSIKVLEGLEAVRKRPGMYIGSTGEEGLHHMIWEIVDNSIDEAMGGFASFVKLTLEDN\n+FVTRVEDDGRGIPVDIHPKTNRSTVETVFTVLHAGGKFDNDSYKVSGGLHGVGASVVNALSSSFKVWVFR\n+QNKKYFLSFSDGGKVIGDLVQEGNSEKEHGTIVEFVPDFSVMEKSDYKQTVIVSRLQQLAFLNKGIRIDF\n+VDNRKQNPQSFSWKYDGGLVEYIHHLNNEKEPLFNEVIADEKTETVKAVNRDENYTVKVEVAFQYNKTYN\n+QSIFSFCNNINTTEGGTHVEGFRNALVKIINRFAVENKFLKDSDEKINRDDVCEGLTAIISIKHPNPQYE\n+GQTKKKLGNTEVRPLVNSVVSEIFERFMLENPQEANAIIRKTLLAQEARRRSQEARELTRRKSPFDSGSL\n+PGKLADCTTRDPSISELYIVEGDSAGGTAKTGRDRYFQAILPLRGKILNVEKSNFEQIFNNAEISALVMA\n+IGCGIKPDFELEKLRYSKIVIMTDADVDGAHIRTLLLTFFFRFMYPLVEQGNIFIAQPPLYKVSYSHKDL\n+YMHTDVQLEQWKSQNPNVKFGLQRYKGLGEMDALQLWETTMDPKVRTLLKVTVEDASIADKAFSLLMGDE\n+VPPRREFIEKNARSVKNIDI\n+>gi|1045672|gb|AAC71220.1| DNA gyrase, A subunit [Mycoplasma genitalium G37]\n+MAKQQDQVDKIRENLDNSTVKSISLANELERSFMEYAMSVIVARALPDARDGLKPVHRRVLYGAYIGGMH\n+HDRPFKKSARIVGDVMSKFHPHGDMAIYDTMSRMAQDFSLRYLLIDGHGNFGSIDGDRPAAQRYTEARLS\n+KLAAELLKDIDKDTVDFIANYDGEEKEPTVLPAAFPNLLANGSSGIAVGMSTSIPSHNLSELIAGLIMLI\n+DNPQCTFQELLTVIKGPDFPTGANIIYTKGIESYFETGKGNVVIRSKVEIEQLQTRSALVVTEIPYMVNK\n+TTLIEKIVELVKAEEISGIADIRDESSREGIRLVIEVKRDTVPEVLLNQLFKSTRLQVRFPVNMLALVKG\n+APVLLNMKQALEVYLDHQIDVLVRKTKFVLNKQQERYHILSGLLIAALNIDEVVAIIKKSANNQEAINTL\n+NTKFKLDEIQAKAVLDMRLRSLSVLEVNKLQTEQKELKDSIEFCKKVLADQKLQLKIIKEELQKINDQFG\n+DERRSEILYDISEEIDDESLIKVENVVITMSTNGYLKRIGVDAYNLQHRGGVGVKGLTTYVDDSISQLLV\n+CSTHSDLLFFTDKGKVYRIRAHQIPYGFRTNKGIPAVNLIKIEKDERICSLLSVNNYDDGYFFFCTKNGI\n+VKRTSLNEFINILSNGKRAISFDDNDTLYSVIKTHGNDEIFIGSTNGFVVRFHENQLRVLSRTARGVFGI\n+SLNKGEFVNGLSTSSNGSLLLSVGQNGIGKLTSIDKYRLTKRNAKGVKTLRVTDRTGPVVTTTTVFGNED\n+LLMISSAGKIVRTSLQELSEQGKNTSGVKLIRLKDNERLERVTIFKEELEDKEMQLEDVGSKQITQ\n+>gi|1045673|gb|AAC71221.1| seryl-tRNA synthetase [Mycoplasma genitalium G37]\n+MLDPNKLRNNYDFFKKKLLERNVNEQLLNQFIQTDKLMRKNLQQLELANQKQSLLAKQVAKQKDNKKLLA\n+ESKELKQKIENLNNAYKDSQNISQDLLLNFPNIAHESVPVGKNESANLELLKEGRKPVFDFKPLPHRELC\n+EKLNLVAFDKATKISGTRFVAYTDKAAKLLRAITNLMIDLNKSKYQEWNLPVVINELSLRSTGQLPKFKD\n+DVFKLENTRYYLSPTLEVQLINLHANEIFNEEDLPKYYTATGINFRQEAGSAGKQTKGTIRLHQFQKTEL\n+VKFCKPENAINELEAMVRDAEQILKALKLPFRRLLLCTGDMGFSAEKTYDLEVWMAASNEYREVSSCSSC\n+GDFQARRAMIRYKDINNGKNSYVATLNGTALSIDRIFAAILENFQTKDGKILIPQALKKYLDFDTIK\n+>gi|1045674|gb|AAC71222.1| thymidylate kinase [Mycoplasma genitalium G37]\n+MNKGVFVVIEGVDGAGKTALIEGFKKLYPTKFLNYQLTYTREPGGTLLAEKIRQLLLNETMEPLTEAYLF\n+AAARTEHISKLIKPAIEKEQLVISDRFVFSSFAYQGLSKKIGIDTVKQINHHALRNMMPNFTFILDCNFK\n+EALQRMQKRGNDNLLDEFIKGKNDFDTVRSYYLSLVDKKNCFLINGDNKQEHLEKFIELLTRCLQQPTHY\n+>gi|1045675|gb|AAC71223.1| DNA polymerase III delta prime subunit, putative [Mycoplasma genitalium G37]\n+MLTTTHALLIIQRKGSFLKPFLDNYLTSIVCENKNGCKKCINCLEILNNKYNSLYWFDQINPFKRENALQ\n+LARIFNRERTSVNNKNIYLIEEIEKLSSNSINSLLRLVEDSPINSYGIFTTKNESLILSTFLSRVQKVVL\n+KKASKVPFKVSKNDQEIITSFFTVDEQIEAIENGSFNRFKIILDACLNKKTGTEQIYHAWQIFRDFSNSE\n+IAQLITLIINKTENIDKKSILFNCLKVLPYNPPKSTLFANLVSW\n+>gi|1045676|gb|AAC71224.1| tRNA modification GTPase TrmE [Mycoplasma genitalium G37]\n+MKSEINIFALATAPFNSALHIIRFSGPDVYEILNKITNKKITRKGMQIQRTWIVDENNKRIDDVLLFKFV\n+SPNSYTGEDLIEISCHGNMLIVNEICALLLKKGGVYAKPGEFTQRSFLNGKMSLQQASAVNKLILSPNLL\n+VKDIVLNNLAGEMDQQLEQ'..b'060|gb|AAC72485.1| ribonuclease P protein component [Mycoplasma genitalium G37]\n+MLNSRFPVSVKKSHSLRERKVFTTILQSKTRFFGTFINAYFIKNNHSTWRVAISIAKTKYKLAVQRNLIK\n+RQIRSIFQQISNNLEPWDILVIVNKGFIELTFKEKQKLFLQLLKRIKEVDAYQTSANK\n+>gi|3845061|gb|AAC72486.1| ribosomal protein L34 [Mycoplasma genitalium G37]\n+MKRTYQPSKLKRAKTHGFMARMATAQGRKVLRQRRFKNRAQLTVSSER\n+>gi|3845062|gb|AAC72487.1| ABC transporter, ATP-binding protein [Mycoplasma genitalium G37]\n+MKKGNKTVWNECIDILDNVKSPSFSANFDDYFKKSKSKPPKKNKKVLNNIKKAELKLKKKANKKQKANTL\n+YIPPFAQQAKGIVITINKMWKNVHNDDSKQEISILSDVSLQIAYGEIVIILGSSGSGKTTLLNLIGGYDS\n+ISLGSCIVANCPLEKCTSEQLLTYRKNNLGYVYQRYNLIELLSAYDNIAISQNLIPKYQRRLDIEELAEK\n+LDIKEILYKFPYEMSGGQKQRVAIARAIIKEPKLLLCDEPTGALDSNSAENIINLLQTINKTYKQTILMV\n+THDVSLTRIANRIIKISDGKIVSNQLVRPLV\n+>gi|3845063|gb|AAC72488.1| ABC transporter, permease protein [Mycoplasma genitalium G37]\n+MFSFFKQIFKSLKKFFFLLFGIIFVLFSIIFLETSIVQLSNNLVSTYTTLVSKTNSSDIVAPAILKEANP\n+VYIASLTNDSGYFSKIKIDDKKINYLFPYQENDFGSDSGQSNGSGDNQNKTIPRKGDVNEKDKLFLARKR\n+GILKAYGEANIAEKRIYKGLAVSFNNTDSFNGSDISDSITNRHIISDPQNLIYDASGNLLGYFADGLIKE\n+TISLRAGIARFPGDKGKSTGTQVKITQKQQTNNDPQKDSTVNSLYKTNNKDKVWFKSDETKADNTDISAN\n+YLFTGGNEAANWFPNLYANIPIDLEIDPGSQFWKDVNPFKEIVEEFQTQKESKDNQSFTLTFNLDISKLN\n+KLDNEQLKWLETNAKTIANNSSFGDWDLENKLKQLKKFELKINKDWLKKKVESEKDTILNSLPGFSDSDK\n+DTIFKTQNGMMVRNNNLSFQPSSNNLQLVQNQNSQASNGIADPNFSNVQTAYNKIHQSNNTPEKTLDAVY\n+AAVLDQWRSIFQEDLVKKTVDLLEKYRDHFLKATAFNNIDYSKQNIAIANNVSSAESASFLVSNKDEQRY\n+NDLSLIDGVDLKSWLFKPEQNESNPLDTIYGGQDANNGFLQKIDYEFKPSTSSGGMTASLKNTQALSPKS\n+TKFPIYPKLANIIAQAQLPEATNIPTTALDALKQWTNLDANGFNNLKEEDKRKAANNYLALLSYFTPAFQ\n+DPNELIETNRQMLEIPITVKNGVNPLILPTDQQNLVVQTPEAHGAVVSQQWLFRHNKEILPQEGEYAWKT\n+ALQTPNNFPNWLNDLPDRYKFSINGLTFAILGIGESVETGYPVLSLQSPLPNTQDEALIFVNDQAYRSIL\n+FAVPAANQENYYAFKSTDLKQHTDQDPVQFIANRLEGYLDVPRSDLAFNVKDISKFNYLTTARNYFPDLV\n+QSYLAIVSTVIAIFLIILALYLIILLIKSFIKKNQTEFSIIRAGGFSTTKFIVGMSVFAGIVAIVSSFLG\n+VLFAFLLEGQVKGIINRYWFIALPENSFNWLSFFGSFFITFFVFEFISWIAFKQLFSKPVNVLIDQGNET\n+KFSVLLHLLKHKSHTMSPLTKFRVSLIVSRFSRLFTYVGLSSVALLLIGIAGTIPQKFSAAQTSTSLNRN\n+FNYKLNLQTPTEQSGWYAIQPYSHFGVTDNNNGIKTLYNESVQANSQNEHPYKPSNLKLKNRQDQPIKAA\n+DGTELELGNLLLPSYGGAQQLNTDENFFRHASLSKWIIDFPIRVGGSNINPWEIVEKSIPKQITQLLSAS\n+SDQFLISVLTDDFFNNLNANGFLIRNPRTNQIQLDASRVLTTIDVFNPGGVKFNDSFLSFMLKVYGDFEL\n+AKQDSKLNFGIVPVDPAIEETYTYVEGPFGFQEDNLDENSPYTLTGINPESSFVNLIDGSGNSLRNLISS\n+DQEMNVIVNAGFQYANNINIGDYVYIKPKNTATRYSEKFLKAPLNNSTVAFKVVGVSTDAFGQELYINQH\n+IANNLLKLSGNQGRGIIRDVIKKTNGQSQSSDEYEIDYVKPNGYVPFNGVFSKELKPSLLNKALVLNSII\n+GVWGNFTDFGNNFQNLVRNKLDKVITSILPTDPEIINKLAQEKQIINTTSMNYESLRKELVNKYKTEWNS\n+VNLLSQNASSIFGNNIIAPVLNIDAAGTSAQIIRNNAEVLFNTVNQVDAFLLGTIIPFIFITCVVLGISM\n+LEEMKRIFISLKAIGYRDVQNLISLLTFFIPAFVLALLISIGVLAGVLIGIQAVVFNVAQVFLTNVFEFL\n+PYMVGIVLFGVTIFVIGSYFWIKLRSAELKEGF\n+>gi|3845064|gb|AAC72489.1| ABC transporter, ATP-binding protein [Mycoplasma genitalium G37]\n+MVLKTKENKKFDIYLKSSDFAVSKKASKLIKKLNKKHPKRKSLNSFEAKKYDIYFKEVCKAVTNGINNQL\n+ICNHINLKILPGEFVVILGKSGSGKTSLLSLISALDRPTSGDSFVCGTNTICCSDAKLTALRNKNVGYIF\n+QQYGLLRDLDVDDNIKLALPLKKRFNNNLEELLERLELKEHRHKKVHKLSGGQQQRVAIARALIKEPKIL\n+FGDEPTGAVNIDISKKILQFFVEYNRDKGTTIVIVTHNEKIVELAKRVIKIHDGKIIVDYLNQNPKTIEQ\n+INWV\n+>gi|3845066|gb|AAC72490.1| chromosomal replication initiator protein DnaA [Mycoplasma genitalium G37]\n+MEQFNAFKSLLKKHYEKTIGFHDKYIKDINRFVFKNNVLLILLENEFARNSLNDNSEIIHLAESLYEGIK\n+SVNFVNEQDFFFNLAKLEENSRDTLYQNSGLSKNYTFQNFVISEGNKRAYEAGVRLAETQDNEFSPLFIY\n+GETGLGKTHLLQAIGNEKFRNFPNARVKYVVSSDFAQEVVDAFYQRDKGIEKLKKNYENLDLVLIDDTQI\n+FGRKEKTLEILFNIFNNLVLNKKQIVLVSDKAPDELIDIDARMISRFKSGLLLKIEKHNLSSLCEILTVK\n+LKEKDPNIQITNEARHDAAQISGNDVRALNGIATKLLFFAKTSKQNLINTENLKEILFEEFEKFHKKSFD\n+PYLLIENVCRRFNVPMDSVLSENRKAELVRVRDVCNYLLRQKYNMQFQQIGKIFKRSHSSVLMAVKRVAK\n+MIENDSSLRDVITSLVI\n+>gi|3845067|gb|AAC72491.1| CobQ/CobB/MinD/ParA nucleotide binding domain [Mycoplasma genitalium G37]\n+MIISFVNNKGGVLKTTMATNVAGSLVKLCPERRKVILDLDGQGNVSASFGQNPERLNNTLIDILLKVPKF\n+SGSNNFIEIDDCLLSVYEGLDILPCNFELNFADIDISRKKYKASDIAEIVKQLAKRYEFVLLDTPPNMAT\n+LVSTAMSLSDVIVIPFEPDQYSMLGLMRIVETIDTFKEKNTNLKTILVPTKVNVRTRLHNEVIDLAKTKA\n+KKNNVAFSKNFVSLTSKSSAAVGYEKLPISLVSSPSKKYLNEYLEITKEILNLANYNVH\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/inputs/proteomes/Mycoplasma_hyopneumoniae.faa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/inputs/proteomes/Mycoplasma_hyopneumoniae.faa Tue Oct 24 06:40:40 2017 -0400
[
b'@@ -0,0 +1,4764 @@\n+>gi|144227417|gb|AAZ44095.2| chromosomal replication initiator protein [Mycoplasma hyopneumoniae J]\n+MQTNKNNLKVRTQQIRQQIENLLNDRMLYNNFFSTIYVLNETETEIIIDFTDLIAKQEVISRWVDTVEKA\n+IKNLEISKILTFNNTNNYTINSKESQNFSIKNKYCSFNINNVLNKFTFRNFIKSSYNFQIFSIYDAIVAN\n+SRLNYSPIFISGPSGIGKTHFINAIGNLLVEKQKKVFYINDYKFISCVSSWMQNGQNEKISEFLNWLSQV\n+DAFLFDDIQGLANKQQTSIVALEILNRFIEEDKTVIITSDKSPSLLGGFEERFITRFSSGLHIKLNKPKK\n+EDFLRIFKHKLVEEKLEKHIWTNDAFEFLSKHFRNSIRELEGALKSIVFYIQTNKNKFENEIYFDKKKMF\n+EIFVEKYEIEQTITPDLIIEVVSKYYGVSILDIKSEKRGKNIVHARDIAIWLIKNILDLTHNSVGTFFNN\n+RRHSTIISTLKKIDTLKQSNNNELEIALNHIYKQLNWSFKQRK\n+>gi|71851488|gb|AAZ44096.1| DNA polymerase III beta subunit [Mycoplasma hyopneumoniae J]\n+MKFTIEKKIIEWQIERMQSAILNNINSPLSSFFLKLTRSGLFIISTNSELSYKVFINKKDLIEIHDVGSC\n+LIDGVFLRDVIRKSDKQLSFHLIGSELKVFWEDALFSKTTRDSSFFPEINFEQKGIKLTVNAKNFKRAIK\n+NTAFATTNNPSQPILSAINLRSEAGFLHFSATDTSRFASEKIEISNKSRINISVSAKNLKDFIPPELDKD\n+IELNIESSKISYIYDNLTIQSRIFTIEYKDISNILPKDSEILYSLTINKRDILDLIDKTTIITPGKDNVI\n+NLSLSKNALKGYISQYDSGQSNVQTKNVLDFRFNPRFASDFRFDPELAQVNINYRYLKDAISVFDKVIDI\n+HINEKMNKMLIVSPEKPEICQLVGLVLV\n+>gi|144227418|gb|AAZ44097.2| glucose inhibited division protein A [Mycoplasma hyopneumoniae J]\n+MSKKSKNSSIEFDAIVVGGGHAGIEAVYALLKKKLKVVLITLDKKKLASMPCNPAIGGPAKGIITREIDA\n+LGGVQGKFSDLAMIQIKYLNESKGPAVLAIRAQIDKEKYSKLILKDLKKQENLLIIEDLVSELLVEKNRV\n+FGLKTAKKQVFFSKTVIITTGTYMDSKVLRGSLAIPSGPDGQQTSNLLSNNLKRLGFELQRLKTGTPPRI\n+FTSSIDFSKVEKEVLPVYNINFSFQSKHKIKKQISCYLTYTTAKTHDIINKNLGKSSMYSGLISGVGPRY\n+CPSIEDKIVRFSEKPRHQIFFEPETKKQDIMYINGLSTSMPEDVQLEMVKTIPGLENAKIAKFGYAIEYD\n+ALNPLELKKSLETKKVKGLFMAGQINGTSGYEEAAAQGLVAGINAGQFVLGKKPVEILRNDGYIGVLIDD\n+LVTKGTKEPYRMLTSRAEYRLILRNDNADIRMAKYALKSGLISKKEYLKIKAKYAKIDRKILELSKEFVS\n+PKDELAKKYNLEKRISKLKLISWPNVNFKDILPDFEFGYELTVMARLKGYIQKQNSEAQKMIRLEKLLIP\n+GDLNYEKVANLSSEALDKFQKVRPKTIGEASRISGVNPADIQMLLFHIKVLKMQKVSKI\n+>gi|144227419|gb|AAZ44098.2| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+MKISIISFGSSPREWLGLYKKEINKIKQFKYQIEFINLSEHSQENIELKKMLETKDILQKIPKNSSCYLF\n+TERGKTVTSKEFSQLLNFSNICFIIGGSYGVDEKLIAKSRPDIGFLSFGKLTFAHKIFKLIVLEQIYRGF\n+SIKFNRKYHHAD\n+>gi|71851491|gb|AAZ44099.1| putative MgpA like-protein [Mycoplasma hyopneumoniae J]\n+MKRKNYEKIIQNIENHDNIFIFHHIRPDGDCLGAQQGFGYAIAKRFPKKKVFFIGDNENIFNFLNFHFDN\n+ENLIQDEFFQNSLAITVDTADIKRIKKLDFFLNSNFKTRIKIDHHPDIFEEIYNEKWVDPTFSAASEMIG\n+YLLMEENWEINSEISKFIYLGILTDSGRFLFPSTTSRTFQVAAFLMKFNFDFAKLNWFLSNRTEQEVAFC\n+AEVLANYKKKDKVLWYFVSKEIQNKFKLRNDQLSAVNILANIGDARIWLFLIEMENGIRVRIRSNGPKVN\n+EIASEYGGGGHEYAAGINLEKSEKTKEISQEIIEKLVIQVKEFEQNE\n+>gi|144227420|gb|AAZ44100.2| putative DHH family phosphoesterase [Mycoplasma hyopneumoniae J]\n+MSNIKIKEIIKLIENHDTIVIFHHIRPDGDCIGAQLGLKNLILDNFKNKKVFAVGNHKGSFSFLNAKTDS\n+IPDKLILKNSLAIIVDANFKNRIESVFLFDQFKFKTILRIDHHPNEDDFEQIYRWVDPSYVATCEQIADL\n+AYKAKWKISRKSATFIYLGIYTDSGRFLYKNTSARTHFLTGILFRTGFNFALIHEKLNQKKLSDIDFDSY\n+IFSVKKIYKNVIFYTLSMEEQKKLNKNPSNSVRPNLLANIENFRIWLCLVQEKENSWRVEFRSSGPNVQK\n+VAQNWGGGGHLNASGAIIESLDKLDLLIKDCQAEYESWFSQLK\n+>gi|144227421|gb|AAZ44101.2| hypothetical protein MHJ_0007 [Mycoplasma hyopneumoniae J]\n+MEGINITNFLKYLFAYYYIDTGEREVYRTWVQKILWFTHWKFYRMYQIPFFSENFQSYKYGPISWTVLQT\n+QFFGIESFKNSQYNIDEILDFHQNNLVDEFKNRLKEDFLNDFNEDFGETFDENQIKGDLDLRWSCFVFVF\n+EKLKKFRPKDLINLSHSQKSFKIAAKNPHSKVIFNETILDDEEISILES\n+>gi|71851494|gb|AAZ44102.1| cell division protein ftsY [Mycoplasma hyopneumoniae J]\n+MSFFRKIREKIFGTKQEKPANLDKYVAGLTKSRLSFFKQIVQLQKKHIKIDENFFEELEEILIMSDISPN\n+FVRTIIDSLKAEVRHHNLNNPDLIPEIIMDKMYTIYSNRSVVNTNLNIKDGRINVFLISGVNGSGKTTSI\n+AKVARKFIIEGKKVLIIAADTFRAAAVEQLEIWANRVGALILKPEANEKDPGSVVFRGLDFAIKEKTDLV\n+LIDTAGRLQNNVNLMQELKKINKIISQKVPNAPHESLLVIDATTGQNGVSQAANFAKITPVSGIILTKMD\n+GTSKGGIIFSIKDQLDISVKLVGLGEAMDDLQPFDLDLFIFAITKEVKNQYQV\n+>gi|144227422|gb|AAZ44103.2| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+MAKISFFALGGQDENGKNCYILEIDDNIFIINSGAKIPLDSSVGVDTIIADFTYLEENQHKIRGVFITDA\n+KNESFSALPWLIMKLKKIKIYSSFFTKALIIERIHKYRLSESAFEVIPITSELKINEKISVSPFPVAGSM\n+PGTIGFCFHTEDGGIVFMANYVVGNLGVYGETNFELIKKISQNPKGILMFISDSGKSNLPGKAINKLFAK\n+NFLENFFLKADKNSRIVVSAYDEEMVSIQEIIDLSIKFNRQITAYGKKYDKLYDMIYKLDKLTTNKLKKL\n+'..b'FLTKKFFEKNKNKLVIEVLLSLWRIEPFKIKTNTTRRYIQYLSIKNVENFLKMFENELNYL\n+LENRAQAFKFIEKIAKIKEEYQILNKNFYNLYLKTELKPNIEQEKLNEKLKLSIPYPETKFENLKFSQTY\n+AQIALQTIKNDIKNVINHHNSLINSFDSDPYKIKIFITGYNCFLDLIKRSDNFRWLSSLQIYEIYFKFEQ\n+WLIKLLNQKALENILGTQNFFNNTFAEEFWGFWKQNSQQKILEERNKKAQKHFKVKKINSFHKENPYYQN\n+LKTNSKTLLRANILWQHEVIKMEKKLRNKNFQNSFFIKRIWVSSIENKLKKLKEKISKVEYENHFIFLKD\n+ALSDLKNFFYLKNLKKIDVFLKKNQFFIFCFDNKINFDILYKKYGVLTNDDLFFLETKKMQMGNYSRFLF\n+DEYSFLLETNYKQKLFQHFFNNGENSAQLFIYSRRTIKPIRDFSIIFIENGTLVEYIREIDLPLTPKTSF\n+GKFFYQNGTFERTNLPLLETQLYKQLQNEVFQNNSGGIKNNFESFINSWIPIKEFKLEFDSENKKYSLKK\n+DILVIDL\n+>gi|71852146|gb|AAZ44754.1| valyl-tRNA synthetase [Mycoplasma hyopneumoniae J]\n+MKNKYDFKLVEEKRNEKWQKKGFFIAPKQTKKPFSIISPPPNVTGQLHLGHSWNAFIQDSLVRYHKLQGF\n+DVLLLPSVDHAGIATQVKVEEDLAKKGIKKSDLKREEFIKKCYHWKEKQYLKIKEQWDKLGICYDFSKER\n+FTLDQDAQIAVSDFFIKLWEKNLIYRGQKAINWDIKLQTAISNIEVINKPVEQKMYYLKYFLENSNEFLT\n+VATTRIETISSDVALAINPKDKRYLHLVGKKVVHPLTKKLIIIIADSNVSSDFGSGIMKVSAHSILDFEI\n+MEKHNLESKDCIDNYGNLNHEVPEFQGQNRFFARDLIAKKLEKEGFLAKIETVISNVGFSQRSDEIVEIL\n+KKPQWFVKMDELAKSLISHLNSKDKIKFYPKNFEKNLRKWFEKIHDWTISRQLWWGHRIPVWCKNDEFKV\n+QIDSPGQGWIQDEDVLDTWFSSGISAFAFLGWPQNFDLIKSYFPTSLLVTGWDILFFWVARMYFSSLFIM\n+KQKPFEKVLLHGLIRDEIGRKMSKSLGNGLDPMEIIEKYGSDTLRQALIFNSSPGKDIKFNIEKLNTAWN\n+LNNKIWNIAKYIADLDTFFAKPDLIDLWMENKIYILKRQIVKNIKKYNFSVIGTEINNFIYGDFSSRYIE\n+LIKTRKNGFYARKLLRKVLIILHPFLPFLTDFLMEKIFKMEILEQKMPRIRQFKENQKVENILEIIDNLR\n+TYREKFQISKKIILEYCIINDKFSNAEIDIINKLTFGKWLENKELVIKTKNFEIAIKVPEELKKEQKGRE\n+LKEIQFLKSEILRAEKILTNKGFLEKAPREKIDLERTKLEKLKEKLVFYEKK\n+>gi|144227749|gb|AAZ44755.2| hypothetical protein MHJ_0672 [Mycoplasma hyopneumoniae J]\n+MKKLKIYKNLNYFLPSFVFLGGAFFVLVSCGSTHFGLNISRESQTGIENAKKLKKIVNSPNLIELSPENN\n+EKIYEDKDAKFFLFDLNSAVNGGKNLELMPEFTTKFSPKTEITYLNFINRYYNTRQLQQKKKSLNQDSNS\n+IYIPHVDEKFKDFWYVFMIPTSIGFSALELNGKKTVIDREKTKLPSTLIPYSSVEVKILKKGIISADKKN\n+YLQINVNQMINSFAFREKKSNEPNSSEINVFGFQDNKAYPNYKLIFDSLDSSKKIIKFKLHRKNDNLHEE\n+RSAKNKLNSYISVMNFIYKAKEYKQNLNPDDFFEKNTEQKDKNSEYPFVRFYTQTFIVPFEGKEEVFDSD\n+FSILIEKSE\n+>gi|144227750|gb|AAZ44756.2| hypothetical protein MHJ_0673 [Mycoplasma hyopneumoniae J]\n+MKNKITPCIWSLISNTHLRKAESLEILIRALLLNNEEINQNFKNKWLKIYKNKNWKPIGDLNEHLKLAAQ\n+LGVTKTDILTPGQQKINILAKLVNSGIIKIREYISIILFNLVSFINYEYRHIFKMTLELLKKQNNSPVSV\n+DEIFQNFNFGEPVCAEFNIKLLRYNLKQKDHIFYILISGVFFEVLSSRGKNQQYNINFFKIKLYDHWYSR\n+IDELIKRCNNQLESYNFEKASLIRLDSEKWSNYLTQNSQANYDYIVDVLMQKESNNLDEKNDNTINFKAS\n+INHLENQVQKNLENSLQETQINQDISTTISNNPEKVDIELEAILENSQENKVDLSELPANFNDKDQAESH\n+QISLENADLTSTNSVEKLEIEEKIQEKQSDIRIISNNLEQNCCPEQNVVEKEIEKTYEDNIEKNSFYSNF\n+YQDQFERDFNKISEPSGEKNLQDNAQSEICAAEKCCNHIQLEKENLEHIDSSKQEKVVKINSNYLNKGEK\n+NNSNTNKKVPSLPLLYQAKQEMQREISKYPISKSVNSKEHYYNYFIHKINKLFNFSLENMLNKTNFKQNF\n+FNILDFHKKNHEIILKPKKTIIKSGKNLLLISPSANLIYSKIKNELCKTEISEKNYEIVTFFDDYNPESF\n+IGYNDFVLGSKEKLNFIPGPFARILHKAYWNPEKKYCLILENIDNDAAKITLAPLKPLFIRGENGESLLG\n+ISQFDLSFYIFSHPEEKNFIPGNLTIIGTVNSNLDRDFVDLYPDFLENWEIKYLERDNLYSHITKYQICD\n+TGLSWKHFSEKLNSLLESENLNNKWFLPNQIETKILENPRIFVDKVLFSLWNFTSPEKRKIIFRSNSYSV\n+MVKEFLETKGSKRLNIFKFDYEKIKNI\n+>gi|71852149|gb|AAZ44757.1| conserved hypothetical protein [Mycoplasma hyopneumoniae J]\n+MKNRKIRPKAFDYFQSQNNQNKKTFKFKGFFKFLKIFFYTIIFGISLTGCIQSMVVKTSYNPGEALEFYN\n+SKEEITPNYTIFRESKNKDLPGIDIVTKNNNFLVSADNKKVNQEKILNALRKQIKNENAEFGEFSSLIMF\n+QKGENEFEYLKGDKNNEFIFFSSSENSIEQKTNWTEIKIPSPKYFSLKSDKQYFEKLRDVKSLPINTYSF\n+DKSSSENAAISEKIDSYFFNLDNKIPPVNRSYAIFARDVFQVIYNKLILLPQFSQGKLEKAIAEFEQKSG\n+KDVSPETEKILSGYANLVKKLVFPTNFSRIDIQNKTYSWNNNDESAAKNIAFQNKIPAFPIVSWAESWKL\n+GPFYAIFVYPLSKIILWVTASQSLYEWSGWITILSILAVVVFTKIISFIFRFKTIFGQNKQMELQLKKAK\n+IDAKYENYKKNKVMQQRHRQEIVDLYKKNNFSPFSPFSQILVTMPIFIAVWRALQGIPSFKVTYFLGLEL\n+AATSYQKLFEGYWIYLPIIIVTVLVQALQQIIPKILNKKKSNRIMNVQENETLKKQQKTQRIVSIIFIFF\n+GVIFQASLQIYWIIGGIWEILQTLGIFYLQKSNFYREKMRPWLERKKWV\n+>gi|71852150|gb|AAZ44758.1| ribonuclease P protein component [Mycoplasma hyopneumoniae J]\n+MQKIRSIKKNWEFQAIINKKNQIVTNYLIFYYVKSDFFEIGISVPKKFANAVKRNYYKRQIKNALYILWK\n+KGEIFLNFRVVLIARKNFLPLSFETKYQKLAKIFKELKRNEK\n+>gi|71852151|gb|AAZ44759.1| 50S ribosomal protein L34 [Mycoplasma hyopneumoniae J]\n+MKRTYQPNKRKHLKTHGFRARMSTADGRKILAARRAKGRKRLTVSDK\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results/Orthogroups.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results/Orthogroups.csv Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,537 @@\n+\tMycoplasma_agalactiae\tMycoplasma_gallisepticum\tMycoplasma_genitalium\tMycoplasma_hyopneumoniae\r\n+OG0000000\t\tgi|284811953|gb|ADB96857.1|, gi|284811954|gb|ADB96858.1|, gi|284811955|gb|AAP56548.2|, gi|284811956|gb|ADB96859.1|, gi|284811957|gb|ADB96860.1|, gi|284811958|gb|ADB96861.1|, gi|284811959|gb|ADB96862.1|, gi|284811960|gb|ADB96863.1|, gi|284811961|gb|ADB96864.1|, gi|284811962|gb|ADB96865.1|, gi|284812039|gb|AAP56686.2|, gi|284812040|gb|ADB96873.1|, gi|284812041|gb|ADB96874.1|, gi|284812042|gb|ADB96875.1|, gi|284812103|gb|ADB96879.1|, gi|284812104|gb|ADB96880.1|, gi|284812105|gb|AAP56776.2|, gi|284812107|gb|ADB96881.1|, gi|284812108|gb|ADB96882.1|, gi|284812128|gb|AAP56805.2|, gi|284812129|gb|AAP56806.2|, gi|284812217|gb|ADB96891.1|, gi|284812218|gb|ADB96892.1|, gi|284812219|gb|AAP56940.2|, gi|31541243|gb|AAP56545.1|, gi|31541245|gb|AAP56547.1|, gi|31541247|gb|AAP56549.1|, gi|31541248|gb|AAP56550.1|, gi|31541249|gb|AAP56551.1|, gi|31541250|gb|AAP56552.1|, gi|31541251|gb|AAP56553.1|, gi|31541252|gb|AAP56554.1|, gi|31541253|gb|AAP56555.1|, gi|31541386|gb|AAP56687.1|, gi|31541387|gb|AAP56688.1|, gi|31541388|gb|AAP56689.1|, gi|31541389|gb|AAP56690.1|, gi|31541390|gb|AAP56691.1|, gi|31541391|gb|AAP56692.1|, gi|31541392|gb|AAP56693.1|, gi|31541393|gb|AAP56694.1|, gi|31541394|gb|AAP56695.1|, gi|31541395|gb|AAP56696.1|, gi|31541396|gb|AAP56697.1|, gi|31541398|gb|AAP56699.1|, gi|31541472|gb|AAP56773.1|, gi|31541473|gb|AAP56774.1|, gi|31541474|gb|AAP56775.1|, gi|31541478|gb|AAP56779.1|, gi|31541641|gb|AAP56941.1|, gi|31541642|gb|AAP56942.1|, gi|31541643|gb|AAP56943.1|, gi|31541644|gb|AAP56944.1|, gi|31541645|gb|AAP56945.1|, gi|31541646|gb|AAP56946.1|, gi|31541647|gb|AAP56947.1|\t\t\r\n+OG0000001\tgi|290752501|emb|CBH40473.1|, gi|290752503|emb|CBH40475.1|, gi|290752692|emb|CBH40666.1|, gi|290752693|emb|CBH40667.1|, gi|290752812|emb|CBH40787.1|, gi|290752813|emb|CBH40788.1|, gi|290752814|emb|CBH40789.1|, gi|290752815|emb|CBH40790.1|, gi|290752816|emb|CBH40791.1|, gi|290752817|emb|CBH40792.1|, gi|290752818|emb|CBH40793.1|, gi|290753029|emb|CBH41005.1|, gi|290753030|emb|CBH41006.1|, gi|290753031|emb|CBH41007.1|, gi|290753032|emb|CBH41008.1|, gi|290753033|emb|CBH41009.1|, gi|290753034|emb|CBH41010.1|, gi|290753035|emb|CBH41011.1|, gi|290753036|emb|CBH41012.1|, gi|290753037|emb|CBH41013.1|, gi|290753040|emb|CBH41016.1|, gi|290753041|emb|CBH41017.1|, gi|290753042|emb|CBH41018.1|, gi|290753043|emb|CBH41019.1|, gi|290753044|emb|CBH41020.1|, gi|290753045|emb|CBH41021.1|, gi|290753046|emb|CBH41022.1|\t\t\t\r\n+OG0000002\tgi|290752269|emb|CBH40240.1|, gi|290752270|emb|CBH40241.1|, gi|290752414|emb|CBH40385.1|, gi|290752490|emb|CBH40462.1|, gi|290752766|emb|CBH40741.1|\tgi|31541260|gb|AAP56562.1|, gi|31541382|gb|AAP56683.1|\tgi|1046010|gb|AAC71532.1|, gi|3844907|gb|AAC71551.1|, gi|3844927|gb|AAC71569.1|\tgi|144227478|gb|AAZ44221.2|\r\n+OG0000003\tgi|290753066|emb|CBH41042.1|\tgi|284811924|gb|AAP56500.2|, gi|284811927|gb|ADB96855.1|, gi|284811928|gb|ADB96856.1|, gi|284812192|gb|AAP56901.2|, gi|31541553|gb|AAP56853.1|\tgi|1046012|gb|AAC71534.1|, gi|3844628|gb|AAC71235.1|, gi|3844797|gb|AAC71418.1|, gi|3844975|gb|AAC71613.1|\tgi|71851550|gb|AAZ44158.1|\r\n+OG0000004\tgi|290752526|emb|CBH40498.1|, gi|290753081|emb|CBH41057.1|\tgi|31541070|gb|AAP56372.1|, gi|31541268|gb|AAP56569.1|\tgi|1045740|gb|AAC71283.1|, gi|1045987|gb|AAC71511.1|, gi|3845062|gb|AAC72487.1|, gi|3845064|gb|AAC72489.1|\tgi|144227640|gb|AAZ44535.2|, gi|71851837|gb|AAZ44445.1|\r\n+OG0000005\tgi|290752591|emb|CBH40563.1|, gi|290752592|emb|CBH40564.1|, gi|290752893|emb|CBH40868.1|, gi|290752894|emb|CBH40869.1|\tgi|284811835|gb|AAP56356.2|, gi|284812058|gb|AAP56715.2|, gi|31541415|gb|AAP56716.1|\tgi|1045683|gb|AAC71230.1|, gi|1045684|gb|AAC71231.1|\t\r\n+OG0000006\t\tgi|31541304|gb|AAP56605.1|\t\tgi|71851504|gb|AAZ44112.1|, gi|71851505|gb|AAZ44113.1|, gi|71851506|gb|AAZ44114.1|, gi|71851779|gb|AAZ44387.1|, gi|71851788|gb|AAZ44396.1|, gi|71851789|gb|AAZ44397.1|, gi|71851814|gb|AAZ44422.1|, gi|71851859|gb|AA'..b'\tgi|284811949|gb|AAP56536.2|\tgi|1045973|gb|AAC71500.1|\t\r\n+OG0000478\t\tgi|284811950|gb|AAP56538.2|\tgi|1045972|gb|AAC71499.1|\t\r\n+OG0000479\t\tgi|31541239|gb|AAP56541.1|\tgi|3844896|gb|AAC71541.1|\t\r\n+OG0000480\t\tgi|284811951|gb|AAP56544.2|\t\tgi|144227642|gb|AAZ44540.2|\r\n+OG0000481\t\tgi|284811972|gb|AAP56572.2|\tgi|1045980|gb|AAC71506.1|\t\r\n+OG0000482\t\tgi|31541272|gb|AAP56573.1|\tgi|1045981|gb|AAC71507.1|\t\r\n+OG0000483\t\tgi|284811973|gb|AAP56574.2|\tgi|1045982|gb|AAC71508.1|\t\r\n+OG0000484\t\tgi|284811978|gb|AAP56579.2|\tgi|3845040|gb|AAC72467.1|\t\r\n+OG0000485\t\tgi|31541293|gb|AAP56594.1|\tgi|1045977|gb|AAC71503.1|\t\r\n+OG0000486\t\tgi|284811990|gb|AAP56599.2|\t\tgi|144227563|gb|AAZ44390.2|\r\n+OG0000487\t\tgi|284811995|gb|AAP56607.2|\t\tgi|144227427|gb|AAZ44116.2|\r\n+OG0000488\t\tgi|284812002|gb|AAP56617.2|\tgi|3844925|gb|AAC71567.1|\t\r\n+OG0000489\t\tgi|284812013|gb|AAP56637.2|\tgi|3845048|gb|AAC72474.1|\t\r\n+OG0000490\t\tgi|31541356|gb|AAP56657.1|\tgi|3844990|gb|AAC71626.1|\t\r\n+OG0000491\t\tgi|31541362|gb|AAP56663.1|\t\tgi|71851833|gb|AAZ44441.1|\r\n+OG0000492\t\tgi|284812025|gb|AAP56664.2|\tgi|3844809|gb|AAC71429.1|\t\r\n+OG0000493\t\tgi|31541364|gb|AAP56665.1|\tgi|84626132|gb|ABC59631.1|\t\r\n+OG0000494\t\tgi|31541370|gb|AAP56671.1|\tgi|3844818|gb|AAC71437.1|\t\r\n+OG0000495\t\tgi|31541380|gb|AAP56681.1|\tgi|1045963|gb|AAC71491.1|\t\r\n+OG0000496\t\tgi|284812060|gb|AAP56718.2|\tgi|3844837|gb|AAC71454.1|\t\r\n+OG0000497\t\tgi|284812061|gb|AAP56721.2|\tgi|3844840|gb|AAC71457.1|\t\r\n+OG0000498\t\tgi|284812062|gb|AAP56722.2|\tgi|3844841|gb|AAC71458.1|\t\r\n+OG0000499\t\tgi|284812074|gb|AAP56734.2|\tgi|3844846|gb|AAC71463.1|\t\r\n+OG0000500\t\tgi|284812077|gb|AAP56738.2|\tgi|1045939|gb|AAC71468.1|\t\r\n+OG0000501\t\tgi|31541448|gb|AAP56749.1|\tgi|3844826|gb|AAC71444.1|\t\r\n+OG0000502\t\tgi|284812091|gb|AAP56756.2|\tgi|3844811|gb|AAC71430.1|\t\r\n+OG0000503\t\tgi|31541465|gb|AAP56766.1|\t\tgi|144227651|gb|AAZ44558.2|\r\n+OG0000504\t\tgi|31541498|gb|AAP56798.1|\tgi|3844971|gb|AAC71609.1|\t\r\n+OG0000505\t\tgi|284812125|gb|AAP56801.2|\tgi|3844978|gb|AAC71616.1|\t\r\n+OG0000506\t\tgi|31541512|gb|AAP56812.1|\tgi|3844689|gb|AAC71319.1|\t\r\n+OG0000507\t\tgi|284812140|gb|AAP56821.2|\tgi|3844721|gb|AAC71348.1|\t\r\n+OG0000508\t\tgi|284812145|gb|AAP56827.2|\tgi|84626131|gb|AAC71620.2|\t\r\n+OG0000509\t\tgi|31541528|gb|AAP56828.1|\tgi|3844984|gb|AAC71621.1|\t\r\n+OG0000510\t\tgi|31541549|gb|AAP56849.1|\tgi|3844959|gb|AAC71598.1|\t\r\n+OG0000511\t\tgi|31541558|gb|AAP56858.1|\tgi|3844638|gb|AAC71244.1|\t\r\n+OG0000512\t\tgi|284812164|gb|AAP56866.2|\tgi|3844898|gb|AAC71543.1|\t\r\n+OG0000513\t\tgi|284812171|gb|AAP56875.2|\tgi|84626128|gb|AAC71502.2|\t\r\n+OG0000514\t\tgi|284812173|gb|AAP56879.2|\tgi|3845020|gb|AAC72448.1|\t\r\n+OG0000515\t\tgi|31541590|gb|AAP56890.1|\tgi|3844885|gb|AAC71528.1|\t\r\n+OG0000516\t\tgi|31541595|gb|AAP56895.1|\tgi|3844719|gb|AAC71346.1|\t\r\n+OG0000517\t\tgi|284812188|gb|AAP56896.2|\tgi|3844718|gb|AAC71345.1|\t\r\n+OG0000518\t\tgi|284812202|gb|AAP56917.2|\tgi|3844893|gb|AAC71538.1|\t\r\n+OG0000519\t\tgi|284812208|gb|AAP56924.2|\tgi|1045731|gb|AAC71274.1|\t\r\n+OG0000520\t\tgi|284812210|gb|AAP56926.2|\tgi|3844778|gb|AAC71401.1|\t\r\n+OG0000521\t\tgi|31541648|gb|AAP56948.1|\tgi|1045712|gb|AAC71256.1|\t\r\n+OG0000522\t\tgi|31541655|gb|AAP56955.1|\tgi|3844989|gb|AAC71625.1|\t\r\n+OG0000523\t\tgi|284812225|gb|AAP56960.2|\tgi|3844682|gb|AAC71313.1|\t\r\n+OG0000524\t\tgi|284812227|gb|AAP56967.2|\tgi|3844647|gb|AAC71253.1|\t\r\n+OG0000525\t\tgi|284812245|gb|AAP56998.2|\tgi|1045728|gb|AAC71271.1|\t\r\n+OG0000526\t\tgi|284812254|gb|AAP57010.2|\tgi|3844631|gb|AAC71238.1|\t\r\n+OG0000527\t\tgi|31541720|gb|AAP57020.1|\t\tgi|144227662|gb|AAZ44577.2|\r\n+OG0000528\t\tgi|284812276|gb|AAP57047.2|, gi|284812287|gb|AAP57056.2|\t\t\r\n+OG0000529\t\tgi|284812281|gb|AAP57051.2|\tgi|3845001|gb|AAC71636.1|\t\r\n+OG0000530\t\tgi|284812282|gb|AAP57052.2|\tgi|84626126|gb|AAC71234.2|\t\r\n+OG0000531\t\tgi|31541763|gb|AAP57062.1|\tgi|84626158|gb|AAC72481.2|\t\r\n+OG0000532\t\tgi|284812300|gb|AAP57075.2|\tgi|84626152|gb|AAC71218.2|\t\r\n+OG0000533\t\t\tgi|84626147|gb|AAC71280.2|\tgi|71851703|gb|AAZ44311.1|\r\n+OG0000534\t\t\tgi|3844705|gb|AAC71333.1|\tgi|71851627|gb|AAZ44235.1|\r\n+OG0000535\t\t\tgi|3844873|gb|AAC71515.1|\tgi|71851777|gb|AAZ44385.1|\r\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results/Orthogroups.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results/Orthogroups.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1331 @@\n+OG0000000: gi|284811953|gb|ADB96857.1| gi|284811954|gb|ADB96858.1| gi|284811955|gb|AAP56548.2| gi|284811956|gb|ADB96859.1| gi|284811957|gb|ADB96860.1| gi|284811958|gb|ADB96861.1| gi|284811959|gb|ADB96862.1| gi|284811960|gb|ADB96863.1| gi|284811961|gb|ADB96864.1| gi|284811962|gb|ADB96865.1| gi|284812039|gb|AAP56686.2| gi|284812040|gb|ADB96873.1| gi|284812041|gb|ADB96874.1| gi|284812042|gb|ADB96875.1| gi|284812103|gb|ADB96879.1| gi|284812104|gb|ADB96880.1| gi|284812105|gb|AAP56776.2| gi|284812107|gb|ADB96881.1| gi|284812108|gb|ADB96882.1| gi|284812128|gb|AAP56805.2| gi|284812129|gb|AAP56806.2| gi|284812217|gb|ADB96891.1| gi|284812218|gb|ADB96892.1| gi|284812219|gb|AAP56940.2| gi|31541243|gb|AAP56545.1| gi|31541245|gb|AAP56547.1| gi|31541247|gb|AAP56549.1| gi|31541248|gb|AAP56550.1| gi|31541249|gb|AAP56551.1| gi|31541250|gb|AAP56552.1| gi|31541251|gb|AAP56553.1| gi|31541252|gb|AAP56554.1| gi|31541253|gb|AAP56555.1| gi|31541386|gb|AAP56687.1| gi|31541387|gb|AAP56688.1| gi|31541388|gb|AAP56689.1| gi|31541389|gb|AAP56690.1| gi|31541390|gb|AAP56691.1| gi|31541391|gb|AAP56692.1| gi|31541392|gb|AAP56693.1| gi|31541393|gb|AAP56694.1| gi|31541394|gb|AAP56695.1| gi|31541395|gb|AAP56696.1| gi|31541396|gb|AAP56697.1| gi|31541398|gb|AAP56699.1| gi|31541472|gb|AAP56773.1| gi|31541473|gb|AAP56774.1| gi|31541474|gb|AAP56775.1| gi|31541478|gb|AAP56779.1| gi|31541641|gb|AAP56941.1| gi|31541642|gb|AAP56942.1| gi|31541643|gb|AAP56943.1| gi|31541644|gb|AAP56944.1| gi|31541645|gb|AAP56945.1| gi|31541646|gb|AAP56946.1| gi|31541647|gb|AAP56947.1|\n+OG0000001: gi|290752501|emb|CBH40473.1| gi|290752503|emb|CBH40475.1| gi|290752692|emb|CBH40666.1| gi|290752693|emb|CBH40667.1| gi|290752812|emb|CBH40787.1| gi|290752813|emb|CBH40788.1| gi|290752814|emb|CBH40789.1| gi|290752815|emb|CBH40790.1| gi|290752816|emb|CBH40791.1| gi|290752817|emb|CBH40792.1| gi|290752818|emb|CBH40793.1| gi|290753029|emb|CBH41005.1| gi|290753030|emb|CBH41006.1| gi|290753031|emb|CBH41007.1| gi|290753032|emb|CBH41008.1| gi|290753033|emb|CBH41009.1| gi|290753034|emb|CBH41010.1| gi|290753035|emb|CBH41011.1| gi|290753036|emb|CBH41012.1| gi|290753037|emb|CBH41013.1| gi|290753040|emb|CBH41016.1| gi|290753041|emb|CBH41017.1| gi|290753042|emb|CBH41018.1| gi|290753043|emb|CBH41019.1| gi|290753044|emb|CBH41020.1| gi|290753045|emb|CBH41021.1| gi|290753046|emb|CBH41022.1|\n+OG0000002: gi|1046010|gb|AAC71532.1| gi|144227478|gb|AAZ44221.2| gi|290752269|emb|CBH40240.1| gi|290752270|emb|CBH40241.1| gi|290752414|emb|CBH40385.1| gi|290752490|emb|CBH40462.1| gi|290752766|emb|CBH40741.1| gi|31541260|gb|AAP56562.1| gi|31541382|gb|AAP56683.1| gi|3844907|gb|AAC71551.1| gi|3844927|gb|AAC71569.1|\n+OG0000003: gi|1046012|gb|AAC71534.1| gi|284811924|gb|AAP56500.2| gi|284811927|gb|ADB96855.1| gi|284811928|gb|ADB96856.1| gi|284812192|gb|AAP56901.2| gi|290753066|emb|CBH41042.1| gi|31541553|gb|AAP56853.1| gi|3844628|gb|AAC71235.1| gi|3844797|gb|AAC71418.1| gi|3844975|gb|AAC71613.1| gi|71851550|gb|AAZ44158.1|\n+OG0000004: gi|1045740|gb|AAC71283.1| gi|1045987|gb|AAC71511.1| gi|144227640|gb|AAZ44535.2| gi|290752526|emb|CBH40498.1| gi|290753081|emb|CBH41057.1| gi|31541070|gb|AAP56372.1| gi|31541268|gb|AAP56569.1| gi|3845062|gb|AAC72487.1| gi|3845064|gb|AAC72489.1| gi|71851837|gb|AAZ44445.1|\n+OG0000005: gi|1045683|gb|AAC71230.1| gi|1045684|gb|AAC71231.1| gi|284811835|gb|AAP56356.2| gi|284812058|gb|AAP56715.2| gi|290752591|emb|CBH40563.1| gi|290752592|emb|CBH40564.1| gi|290752893|emb|CBH40868.1| gi|290752894|emb|CBH40869.1| gi|31541415|gb|AAP56716.1|\n+OG0000006: gi|31541304|gb|AAP56605.1| gi|71851504|gb|AAZ44112.1| gi|71851505|gb|AAZ44113.1| gi|71851506|gb|AAZ44114.1| gi|71851779|gb|AAZ44387.1| gi|71851788|gb|AAZ44396.1| gi|71851789|gb|AAZ44397.1| gi|71851814|gb|AAZ44422.1| gi|71851859|gb|AAZ44467.1|\n+OG0000007: gi|31541315|gb|AAP56616.1| gi|71851791|gb|AAZ44399.1| gi|71851810|gb|AAZ44418.1| gi|71851917|gb|AAZ44525.1| gi|71851970|gb|AAZ44578.1| gi|71851995|gb|AAZ44603.1| gi|71852017|gb|AAZ44625.1| gi|7185'..b'01230: gi|144227613|gb|AAZ44488.2|\n+OG0001231: gi|71851881|gb|AAZ44489.1|\n+OG0001232: gi|144227616|gb|AAZ44498.2|\n+OG0001233: gi|144227617|gb|AAZ44499.2|\n+OG0001234: gi|144227618|gb|AAZ44501.2|\n+OG0001235: gi|71851895|gb|AAZ44503.1|\n+OG0001236: gi|71851899|gb|AAZ44507.1|\n+OG0001237: gi|71851900|gb|AAZ44508.1|\n+OG0001238: gi|71851902|gb|AAZ44510.1|\n+OG0001239: gi|144227625|gb|AAZ44516.2|\n+OG0001240: gi|71851909|gb|AAZ44517.1|\n+OG0001241: gi|144227629|gb|AAZ44523.2|\n+OG0001242: gi|144227630|gb|AAZ44524.2|\n+OG0001243: gi|144227631|gb|AAZ44526.2|\n+OG0001244: gi|144227632|gb|AAZ44527.2|\n+OG0001245: gi|144227633|gb|ABO93479.1|\n+OG0001246: gi|144227634|gb|AAZ44528.2|\n+OG0001247: gi|71851921|gb|AAZ44529.1|\n+OG0001248: gi|144227635|gb|AAZ44530.2|\n+OG0001249: gi|144227636|gb|AAZ44531.2|\n+OG0001250: gi|71851929|gb|AAZ44537.1|\n+OG0001251: gi|71851936|gb|AAZ44544.1|\n+OG0001252: gi|144227644|gb|AAZ44545.2|\n+OG0001253: gi|144227645|gb|AAZ44546.2|\n+OG0001254: gi|144227647|gb|AAZ44549.2|\n+OG0001255: gi|144227650|gb|AAZ44554.2|\n+OG0001256: gi|71851956|gb|AAZ44564.1|\n+OG0001257: gi|144227656|gb|AAZ44567.2|\n+OG0001258: gi|144227660|gb|AAZ44572.2|\n+OG0001259: gi|71851966|gb|AAZ44574.1|\n+OG0001260: gi|144227661|gb|AAZ44576.2|\n+OG0001261: gi|71851971|gb|AAZ44579.1|\n+OG0001262: gi|71851972|gb|AAZ44580.1|\n+OG0001263: gi|71851985|gb|AAZ44593.1|\n+OG0001264: gi|71851986|gb|AAZ44594.1|\n+OG0001265: gi|144227667|gb|AAZ44595.2|\n+OG0001266: gi|71851988|gb|AAZ44596.1|\n+OG0001267: gi|71851989|gb|AAZ44597.1|\n+OG0001268: gi|144227668|gb|AAZ44598.2|\n+OG0001269: gi|71851991|gb|AAZ44599.1|\n+OG0001270: gi|144227669|gb|AAZ44600.2|\n+OG0001271: gi|144227670|gb|AAZ44601.2|\n+OG0001272: gi|144227671|gb|AAZ44602.2|\n+OG0001273: gi|144227672|gb|AAZ44604.2|\n+OG0001274: gi|144227673|gb|AAZ44605.2|\n+OG0001275: gi|144227674|gb|AAZ44606.2|\n+OG0001276: gi|144227675|gb|AAZ44607.2|\n+OG0001277: gi|144227676|gb|ABO93480.1|\n+OG0001278: gi|144227681|gb|AAZ44617.2|\n+OG0001279: gi|144227683|gb|AAZ44623.2|\n+OG0001280: gi|144227688|gb|ABO93481.1|\n+OG0001281: gi|144227689|gb|AAZ44632.2|\n+OG0001282: gi|71852025|gb|AAZ44633.1|\n+OG0001283: gi|144227690|gb|AAZ44637.2|\n+OG0001284: gi|71852030|gb|AAZ44638.1|\n+OG0001285: gi|144227691|gb|AAZ44639.2|\n+OG0001286: gi|71852032|gb|AAZ44640.1|\n+OG0001287: gi|71852034|gb|AAZ44642.1|\n+OG0001288: gi|71852035|gb|AAZ44643.1|\n+OG0001289: gi|144227693|gb|AAZ44644.2|\n+OG0001290: gi|144227694|gb|ABO93482.1|\n+OG0001291: gi|144227695|gb|AAZ44645.2|\n+OG0001292: gi|71852038|gb|AAZ44646.1|\n+OG0001293: gi|144227696|gb|AAZ44647.2|\n+OG0001294: gi|71852040|gb|AAZ44648.1|\n+OG0001295: gi|144227697|gb|AAZ44650.2|\n+OG0001296: gi|71852043|gb|AAZ44651.1|\n+OG0001297: gi|144227698|gb|ABO93483.1|\n+OG0001298: gi|144227699|gb|AAZ44652.2|\n+OG0001299: gi|144227700|gb|AAZ44653.2|\n+OG0001300: gi|144227701|gb|AAZ44654.2|\n+OG0001301: gi|71852048|gb|AAZ44656.1|\n+OG0001302: gi|144227703|gb|AAZ44657.2|\n+OG0001303: gi|144227704|gb|AAZ44658.2|\n+OG0001304: gi|71852052|gb|AAZ44660.1|\n+OG0001305: gi|144227707|gb|AAZ44671.2|\n+OG0001306: gi|144227709|gb|ABO93484.1|\n+OG0001307: gi|144227715|gb|AAZ44680.2|\n+OG0001308: gi|144227716|gb|AAZ44681.2|\n+OG0001309: gi|144227717|gb|AAZ44682.2|\n+OG0001310: gi|71852075|gb|AAZ44683.1|\n+OG0001311: gi|144227718|gb|AAZ44684.2|\n+OG0001312: gi|71852077|gb|AAZ44685.1|\n+OG0001313: gi|144227719|gb|AAZ44686.2|\n+OG0001314: gi|144227725|gb|AAZ44696.2|\n+OG0001315: gi|144227730|gb|AAZ44708.2|\n+OG0001316: gi|71852101|gb|AAZ44709.1|\n+OG0001317: gi|144227731|gb|AAZ44711.2|\n+OG0001318: gi|144227732|gb|AAZ44712.2|\n+OG0001319: gi|144227736|gb|AAZ44718.2|\n+OG0001320: gi|71852114|gb|AAZ44722.1|\n+OG0001321: gi|144227745|gb|AAZ44743.2|\n+OG0001322: gi|144227746|gb|AAZ44744.2|\n+OG0001323: gi|144227747|gb|AAZ44745.2|\n+OG0001324: gi|71852138|gb|AAZ44746.1|\n+OG0001325: gi|71852139|gb|AAZ44747.1|\n+OG0001326: gi|71852141|gb|AAZ44749.1|\n+OG0001327: gi|144227748|gb|AAZ44751.2|\n+OG0001328: gi|71852145|gb|AAZ44753.1|\n+OG0001329: gi|144227749|gb|AAZ44755.2|\n+OG0001330: gi|144227750|gb|AAZ44756.2|\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results/Orthogroups_SpeciesOverlaps.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results/Orthogroups_SpeciesOverlaps.csv Tue Oct 24 06:40:40 2017 -0400
b
@@ -0,0 +1,5 @@
+ Mycoplasma_agalactiae Mycoplasma_gallisepticum Mycoplasma_genitalium Mycoplasma_hyopneumoniae
+Mycoplasma_agalactiae 432 363 305 391
+Mycoplasma_gallisepticum 363 462 385 346
+Mycoplasma_genitalium 305 385 394 296
+Mycoplasma_hyopneumoniae 391 346 296 416
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results/Orthogroups_UnassignedGenes.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results/Orthogroups_UnassignedGenes.csv Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,796 @@\n+\tMycoplasma_agalactiae\tMycoplasma_gallisepticum\tMycoplasma_genitalium\tMycoplasma_hyopneumoniae\r\n+OG0000536\tgi|290752272|emb|CBH40243.1|\t\t\t\r\n+OG0000537\tgi|290752276|emb|CBH40247.1|\t\t\t\r\n+OG0000538\tgi|290752279|emb|CBH40250.1|\t\t\t\r\n+OG0000539\tgi|290752285|emb|CBH40256.1|\t\t\t\r\n+OG0000540\tgi|290752286|emb|CBH40257.1|\t\t\t\r\n+OG0000541\tgi|290752287|emb|CBH40258.1|\t\t\t\r\n+OG0000542\tgi|290752288|emb|CBH40259.1|\t\t\t\r\n+OG0000543\tgi|290752289|emb|CBH40260.1|\t\t\t\r\n+OG0000544\tgi|290752290|emb|CBH40261.1|\t\t\t\r\n+OG0000545\tgi|290752291|emb|CBH40262.1|\t\t\t\r\n+OG0000546\tgi|290752293|emb|CBH40264.1|\t\t\t\r\n+OG0000547\tgi|290752294|emb|CBH40265.1|\t\t\t\r\n+OG0000548\tgi|290752295|emb|CBH40266.1|\t\t\t\r\n+OG0000549\tgi|290752296|emb|CBH40267.1|\t\t\t\r\n+OG0000550\tgi|290752297|emb|CBH40268.1|\t\t\t\r\n+OG0000551\tgi|290752306|emb|CBH40277.1|\t\t\t\r\n+OG0000552\tgi|290752310|emb|CBH40281.1|\t\t\t\r\n+OG0000553\tgi|290752313|emb|CBH40284.1|\t\t\t\r\n+OG0000554\tgi|290752314|emb|CBH40285.1|\t\t\t\r\n+OG0000555\tgi|290752319|emb|CBH40290.1|\t\t\t\r\n+OG0000556\tgi|290752342|emb|CBH40313.1|\t\t\t\r\n+OG0000557\tgi|290752345|emb|CBH40316.1|\t\t\t\r\n+OG0000558\tgi|290752348|emb|CBH40319.1|\t\t\t\r\n+OG0000559\tgi|290752349|emb|CBH40320.1|\t\t\t\r\n+OG0000560\tgi|290752350|emb|CBH40321.1|\t\t\t\r\n+OG0000561\tgi|290752353|emb|CBH40324.1|\t\t\t\r\n+OG0000562\tgi|290752355|emb|CBH40326.1|\t\t\t\r\n+OG0000563\tgi|290752359|emb|CBH40330.1|\t\t\t\r\n+OG0000564\tgi|290752362|emb|CBH40333.1|\t\t\t\r\n+OG0000565\tgi|290752367|emb|CBH40338.1|\t\t\t\r\n+OG0000566\tgi|290752368|emb|CBH40339.1|\t\t\t\r\n+OG0000567\tgi|290752374|emb|CBH40345.1|\t\t\t\r\n+OG0000568\tgi|290752375|emb|CBH40346.1|\t\t\t\r\n+OG0000569\tgi|290752377|emb|CBH40348.1|\t\t\t\r\n+OG0000570\tgi|290752380|emb|CBH40351.1|\t\t\t\r\n+OG0000571\tgi|290752387|emb|CBH40358.1|\t\t\t\r\n+OG0000572\tgi|290752389|emb|CBH40360.1|\t\t\t\r\n+OG0000573\tgi|290752396|emb|CBH40367.1|\t\t\t\r\n+OG0000574\tgi|290752398|emb|CBH40369.1|\t\t\t\r\n+OG0000575\tgi|290752399|emb|CBH40370.1|\t\t\t\r\n+OG0000576\tgi|290752400|emb|CBH40371.1|\t\t\t\r\n+OG0000577\tgi|290752405|emb|CBH40376.1|\t\t\t\r\n+OG0000578\tgi|290752407|emb|CBH40378.1|\t\t\t\r\n+OG0000579\tgi|290752409|emb|CBH40380.1|\t\t\t\r\n+OG0000580\tgi|290752411|emb|CBH40382.1|\t\t\t\r\n+OG0000581\tgi|290752412|emb|CBH40383.1|\t\t\t\r\n+OG0000582\tgi|290752413|emb|CBH40384.1|\t\t\t\r\n+OG0000583\tgi|290752415|emb|CBH40386.1|\t\t\t\r\n+OG0000584\tgi|290752417|emb|CBH40388.1|\t\t\t\r\n+OG0000585\tgi|290752419|emb|CBH40390.1|\t\t\t\r\n+OG0000586\tgi|290752421|emb|CBH40392.1|\t\t\t\r\n+OG0000587\tgi|290752423|emb|CBH40394.1|\t\t\t\r\n+OG0000588\tgi|290752424|emb|CBH40395.1|\t\t\t\r\n+OG0000589\tgi|290752425|emb|CBH40396.1|\t\t\t\r\n+OG0000590\tgi|290752428|emb|CBH40399.1|\t\t\t\r\n+OG0000591\tgi|290752429|emb|CBH40400.1|\t\t\t\r\n+OG0000592\tgi|290752430|emb|CBH40401.1|\t\t\t\r\n+OG0000593\tgi|290752432|emb|CBH40403.1|\t\t\t\r\n+OG0000594\tgi|290752436|emb|CBH40407.1|\t\t\t\r\n+OG0000595\tgi|290752439|emb|CBH40410.1|\t\t\t\r\n+OG0000596\tgi|290752444|emb|CBH40415.1|\t\t\t\r\n+OG0000597\tgi|290752447|emb|CBH40418.1|\t\t\t\r\n+OG0000598\tgi|290752448|emb|CBH40420.1|\t\t\t\r\n+OG0000599\tgi|290752449|emb|CBH40421.1|\t\t\t\r\n+OG0000600\tgi|290752453|emb|CBH40425.1|\t\t\t\r\n+OG0000601\tgi|290752457|emb|CBH40429.1|\t\t\t\r\n+OG0000602\tgi|290752462|emb|CBH40434.1|\t\t\t\r\n+OG0000603\tgi|290752466|emb|CBH40438.1|\t\t\t\r\n+OG0000604\tgi|290752472|emb|CBH40444.1|\t\t\t\r\n+OG0000605\tgi|290752473|emb|CBH40445.1|\t\t\t\r\n+OG0000606\tgi|290752474|emb|CBH40446.1|\t\t\t\r\n+OG0000607\tgi|290752475|emb|CBH40447.1|\t\t\t\r\n+OG0000608\tgi|290752476|emb|CBH40448.1|\t\t\t\r\n+OG0000609\tgi|290752495|emb|CBH40467.1|\t\t\t\r\n+OG0000610\tgi|290752500|emb|CBH40472.1|\t\t\t\r\n+OG0000611\tgi|290752502|emb|CBH40474.1|\t\t\t\r\n+OG0000612\tgi|290752505|emb|CBH40477.1|\t\t\t\r\n+OG0000613\tgi|290752506|emb|CBH40478.1|\t\t\t\r\n+OG0000614\tgi|290752507|emb|CBH40479.1|\t\t\t\r\n+OG0000615\tgi|290752509|emb|CBH40481.1|\t\t\t\r\n+OG0000616\tgi|290752510|emb|CBH40482.1|\t\t\t\r\n+OG0000617\tgi|290752511|emb|CBH40483.1|\t\t\t\r\n+OG0000618\tgi|290752512|emb|CBH40484.1|\t\t\t\r\n+OG0000619\tgi|290752514|emb|CBH40486.1|\t\t\t\r\n+OG0000620\tgi|290752517|emb|CBH40489.1|\t\t\t\r\n+OG0000621\tgi|290752524|emb|CBH40496.1|\t\t\t\r\n+OG0000622\tgi|290752528|emb|CBH40500.1|\t\t\t\r\n+OG0000623\tgi|290752537|emb|CBH40509.1|\t\t\t\r\n+OG0000624\tg'..b'\t\t\t\tgi|71851900|gb|AAZ44508.1|\r\n+OG0001238\t\t\t\tgi|71851902|gb|AAZ44510.1|\r\n+OG0001239\t\t\t\tgi|144227625|gb|AAZ44516.2|\r\n+OG0001240\t\t\t\tgi|71851909|gb|AAZ44517.1|\r\n+OG0001241\t\t\t\tgi|144227629|gb|AAZ44523.2|\r\n+OG0001242\t\t\t\tgi|144227630|gb|AAZ44524.2|\r\n+OG0001243\t\t\t\tgi|144227631|gb|AAZ44526.2|\r\n+OG0001244\t\t\t\tgi|144227632|gb|AAZ44527.2|\r\n+OG0001245\t\t\t\tgi|144227633|gb|ABO93479.1|\r\n+OG0001246\t\t\t\tgi|144227634|gb|AAZ44528.2|\r\n+OG0001247\t\t\t\tgi|71851921|gb|AAZ44529.1|\r\n+OG0001248\t\t\t\tgi|144227635|gb|AAZ44530.2|\r\n+OG0001249\t\t\t\tgi|144227636|gb|AAZ44531.2|\r\n+OG0001250\t\t\t\tgi|71851929|gb|AAZ44537.1|\r\n+OG0001251\t\t\t\tgi|71851936|gb|AAZ44544.1|\r\n+OG0001252\t\t\t\tgi|144227644|gb|AAZ44545.2|\r\n+OG0001253\t\t\t\tgi|144227645|gb|AAZ44546.2|\r\n+OG0001254\t\t\t\tgi|144227647|gb|AAZ44549.2|\r\n+OG0001255\t\t\t\tgi|144227650|gb|AAZ44554.2|\r\n+OG0001256\t\t\t\tgi|71851956|gb|AAZ44564.1|\r\n+OG0001257\t\t\t\tgi|144227656|gb|AAZ44567.2|\r\n+OG0001258\t\t\t\tgi|144227660|gb|AAZ44572.2|\r\n+OG0001259\t\t\t\tgi|71851966|gb|AAZ44574.1|\r\n+OG0001260\t\t\t\tgi|144227661|gb|AAZ44576.2|\r\n+OG0001261\t\t\t\tgi|71851971|gb|AAZ44579.1|\r\n+OG0001262\t\t\t\tgi|71851972|gb|AAZ44580.1|\r\n+OG0001263\t\t\t\tgi|71851985|gb|AAZ44593.1|\r\n+OG0001264\t\t\t\tgi|71851986|gb|AAZ44594.1|\r\n+OG0001265\t\t\t\tgi|144227667|gb|AAZ44595.2|\r\n+OG0001266\t\t\t\tgi|71851988|gb|AAZ44596.1|\r\n+OG0001267\t\t\t\tgi|71851989|gb|AAZ44597.1|\r\n+OG0001268\t\t\t\tgi|144227668|gb|AAZ44598.2|\r\n+OG0001269\t\t\t\tgi|71851991|gb|AAZ44599.1|\r\n+OG0001270\t\t\t\tgi|144227669|gb|AAZ44600.2|\r\n+OG0001271\t\t\t\tgi|144227670|gb|AAZ44601.2|\r\n+OG0001272\t\t\t\tgi|144227671|gb|AAZ44602.2|\r\n+OG0001273\t\t\t\tgi|144227672|gb|AAZ44604.2|\r\n+OG0001274\t\t\t\tgi|144227673|gb|AAZ44605.2|\r\n+OG0001275\t\t\t\tgi|144227674|gb|AAZ44606.2|\r\n+OG0001276\t\t\t\tgi|144227675|gb|AAZ44607.2|\r\n+OG0001277\t\t\t\tgi|144227676|gb|ABO93480.1|\r\n+OG0001278\t\t\t\tgi|144227681|gb|AAZ44617.2|\r\n+OG0001279\t\t\t\tgi|144227683|gb|AAZ44623.2|\r\n+OG0001280\t\t\t\tgi|144227688|gb|ABO93481.1|\r\n+OG0001281\t\t\t\tgi|144227689|gb|AAZ44632.2|\r\n+OG0001282\t\t\t\tgi|71852025|gb|AAZ44633.1|\r\n+OG0001283\t\t\t\tgi|144227690|gb|AAZ44637.2|\r\n+OG0001284\t\t\t\tgi|71852030|gb|AAZ44638.1|\r\n+OG0001285\t\t\t\tgi|144227691|gb|AAZ44639.2|\r\n+OG0001286\t\t\t\tgi|71852032|gb|AAZ44640.1|\r\n+OG0001287\t\t\t\tgi|71852034|gb|AAZ44642.1|\r\n+OG0001288\t\t\t\tgi|71852035|gb|AAZ44643.1|\r\n+OG0001289\t\t\t\tgi|144227693|gb|AAZ44644.2|\r\n+OG0001290\t\t\t\tgi|144227694|gb|ABO93482.1|\r\n+OG0001291\t\t\t\tgi|144227695|gb|AAZ44645.2|\r\n+OG0001292\t\t\t\tgi|71852038|gb|AAZ44646.1|\r\n+OG0001293\t\t\t\tgi|144227696|gb|AAZ44647.2|\r\n+OG0001294\t\t\t\tgi|71852040|gb|AAZ44648.1|\r\n+OG0001295\t\t\t\tgi|144227697|gb|AAZ44650.2|\r\n+OG0001296\t\t\t\tgi|71852043|gb|AAZ44651.1|\r\n+OG0001297\t\t\t\tgi|144227698|gb|ABO93483.1|\r\n+OG0001298\t\t\t\tgi|144227699|gb|AAZ44652.2|\r\n+OG0001299\t\t\t\tgi|144227700|gb|AAZ44653.2|\r\n+OG0001300\t\t\t\tgi|144227701|gb|AAZ44654.2|\r\n+OG0001301\t\t\t\tgi|71852048|gb|AAZ44656.1|\r\n+OG0001302\t\t\t\tgi|144227703|gb|AAZ44657.2|\r\n+OG0001303\t\t\t\tgi|144227704|gb|AAZ44658.2|\r\n+OG0001304\t\t\t\tgi|71852052|gb|AAZ44660.1|\r\n+OG0001305\t\t\t\tgi|144227707|gb|AAZ44671.2|\r\n+OG0001306\t\t\t\tgi|144227709|gb|ABO93484.1|\r\n+OG0001307\t\t\t\tgi|144227715|gb|AAZ44680.2|\r\n+OG0001308\t\t\t\tgi|144227716|gb|AAZ44681.2|\r\n+OG0001309\t\t\t\tgi|144227717|gb|AAZ44682.2|\r\n+OG0001310\t\t\t\tgi|71852075|gb|AAZ44683.1|\r\n+OG0001311\t\t\t\tgi|144227718|gb|AAZ44684.2|\r\n+OG0001312\t\t\t\tgi|71852077|gb|AAZ44685.1|\r\n+OG0001313\t\t\t\tgi|144227719|gb|AAZ44686.2|\r\n+OG0001314\t\t\t\tgi|144227725|gb|AAZ44696.2|\r\n+OG0001315\t\t\t\tgi|144227730|gb|AAZ44708.2|\r\n+OG0001316\t\t\t\tgi|71852101|gb|AAZ44709.1|\r\n+OG0001317\t\t\t\tgi|144227731|gb|AAZ44711.2|\r\n+OG0001318\t\t\t\tgi|144227732|gb|AAZ44712.2|\r\n+OG0001319\t\t\t\tgi|144227736|gb|AAZ44718.2|\r\n+OG0001320\t\t\t\tgi|71852114|gb|AAZ44722.1|\r\n+OG0001321\t\t\t\tgi|144227745|gb|AAZ44743.2|\r\n+OG0001322\t\t\t\tgi|144227746|gb|AAZ44744.2|\r\n+OG0001323\t\t\t\tgi|144227747|gb|AAZ44745.2|\r\n+OG0001324\t\t\t\tgi|71852138|gb|AAZ44746.1|\r\n+OG0001325\t\t\t\tgi|71852139|gb|AAZ44747.1|\r\n+OG0001326\t\t\t\tgi|71852141|gb|AAZ44749.1|\r\n+OG0001327\t\t\t\tgi|144227748|gb|AAZ44751.2|\r\n+OG0001328\t\t\t\tgi|71852145|gb|AAZ44753.1|\r\n+OG0001329\t\t\t\tgi|144227749|gb|AAZ44755.2|\r\n+OG0001330\t\t\t\tgi|144227750|gb|AAZ44756.2|\r\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results/Statistics_Overall.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results/Statistics_Overall.csv Tue Oct 24 06:40:40 2017 -0400
b
@@ -0,0 +1,51 @@
+Number of genes 2733
+Number of genes in orthogroups 1938
+Number of unassigned genes 795
+Percentage of genes in orthogroups 70.9
+Percentage of unassigned genes 29.1
+Number of orthogroups 536
+Number of species-specific orthogroups 6
+Number of genes in species-specific orthogroups 97
+Percentage of genes in species-specific orthogroups 3.5
+Mean orthogroup size 3.6
+Median orthogroup size 4.0
+G50 (assigned genes) 4
+G50 (all genes) 4
+O50 (assigned genes) 200
+O50 (all genes) 299
+Number of orthogroups with all species present 280
+Number of single-copy orthogroups 254
+Date 2017-06-06
+Orthogroups file Orthogroups.csv
+Unassigned genes file Orthogroups_UnassignedGenes.csv
+Per-species statistics Statistics_PerSpecies.csv
+Overall statistics Statistics_Overall.csv
+Orthogroups shared between species Orthogroups_SpeciesOverlaps.csv
+
+Average number of genes per-species in orthogroup Number of orthogroups Percentage of orthogroups Number of genes Percentage of genes
+<1 222 41.4 510 26.3
+'1 304 56.7 1270 65.5
+'2 8 1.5 75 3.9
+'3 0 0.0 0 0.0
+'4 0 0.0 0 0.0
+'5 0 0.0 0 0.0
+'6 1 0.2 27 1.4
+'7 0 0.0 0 0.0
+'8 0 0.0 0 0.0
+'9 0 0.0 0 0.0
+'10 0 0.0 0 0.0
+11-15 1 0.2 56 2.9
+16-20 0 0.0 0 0.0
+21-50 0 0.0 0 0.0
+51-100 0 0.0 0 0.0
+101-150 0 0.0 0 0.0
+151-200 0 0.0 0 0.0
+201-500 0 0.0 0 0.0
+501-1000 0 0.0 0 0.0
+'1001+ 0 0.0 0 0.0
+
+Number of species in orthogroup Number of orthogroups
+1 6
+2 172
+3 78
+4 280
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results/Statistics_PerSpecies.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results/Statistics_PerSpecies.csv Tue Oct 24 06:40:40 2017 -0400
b
@@ -0,0 +1,100 @@
+ Mycoplasma_agalactiae Mycoplasma_gallisepticum Mycoplasma_genitalium Mycoplasma_hyopneumoniae
+Number of genes 820 763 476 674
+Number of genes in orthogroups 503 561 429 445
+Number of unassigned genes 317 202 47 229
+Percentage of genes in orthogroups 61.3 73.5 90.1 66.0
+Percentage of unassigned genes 38.7 26.5 9.9 34.0
+Number of orthogroups containing species 432 462 394 416
+Percentage of orthogroups containing species 80.6 86.2 73.5 77.6
+Number of species-specific orthogroups 2 3 0 1
+Number of genes in species-specific orthogroups 29 63 0 5
+Percentage of genes in species-specific orthogroups 3.5 8.3 0.0 0.7
+
+
+Number of genes per-species in orthogroup Number of orthogroups Number of orthogroups Number of orthogroups Number of orthogroups
+'0 104 74 142 120
+'1 400 429 368 403
+'2 22 24 19 9
+'3 6 6 5 1
+'4 1 0 2 0
+'5 2 2 0 1
+'6 0 0 0 0
+'7 0 0 0 0
+'8 0 0 0 2
+'9 0 0 0 0
+'10 0 0 0 0
+11-15 0 0 0 0
+16-20 0 0 0 0
+21-50 1 0 0 0
+51-100 0 1 0 0
+101-150 0 0 0 0
+151-200 0 0 0 0
+201-500 0 0 0 0
+501-1000 0 0 0 0
+'1001+ 0 0 0 0
+
+Number of genes per-species in orthogroup Percentage of orthogroups Percentage of orthogroups Percentage of orthogroups Percentage of orthogroups
+'0 19.4 13.8 26.5 22.4
+'1 74.6 80.0 68.7 75.2
+'2 4.1 4.5 3.5 1.7
+'3 1.1 1.1 0.9 0.2
+'4 0.2 0.0 0.4 0.0
+'5 0.4 0.4 0.0 0.2
+'6 0.0 0.0 0.0 0.0
+'7 0.0 0.0 0.0 0.0
+'8 0.0 0.0 0.0 0.4
+'9 0.0 0.0 0.0 0.0
+'10 0.0 0.0 0.0 0.0
+11-15 0.0 0.0 0.0 0.0
+16-20 0.0 0.0 0.0 0.0
+21-50 0.2 0.0 0.0 0.0
+51-100 0.0 0.2 0.0 0.0
+101-150 0.0 0.0 0.0 0.0
+151-200 0.0 0.0 0.0 0.0
+201-500 0.0 0.0 0.0 0.0
+501-1000 0.0 0.0 0.0 0.0
+'1001+ 0.0 0.0 0.0 0.0
+
+Number of genes per-species in orthogroup Number of genes Number of genes Number of genes Number of genes
+'0 0 0 0 0
+'1 400 429 368 403
+'2 44 48 38 18
+'3 18 18 15 3
+'4 4 0 8 0
+'5 10 10 0 5
+'6 0 0 0 0
+'7 0 0 0 0
+'8 0 0 0 16
+'9 0 0 0 0
+'10 0 0 0 0
+11-15 0 0 0 0
+16-20 0 0 0 0
+21-50 27 0 0 0
+51-100 0 56 0 0
+101-150 0 0 0 0
+151-200 0 0 0 0
+201-500 0 0 0 0
+501-1000 0 0 0 0
+'1001+ 0 0 0 0
+
+Number of genes per-species in orthogroup Percentage of genes Percentage of genes Percentage of genes Percentage of genes
+'0 0.0 0.0 0.0 0.0
+'1 48.8 56.2 77.3 59.8
+'2 5.4 6.3 8.0 2.7
+'3 2.2 2.4 3.2 0.4
+'4 0.5 0.0 1.7 0.0
+'5 1.2 1.3 0.0 0.7
+'6 0.0 0.0 0.0 0.0
+'7 0.0 0.0 0.0 0.0
+'8 0.0 0.0 0.0 2.4
+'9 0.0 0.0 0.0 0.0
+'10 0.0 0.0 0.0 0.0
+11-15 0.0 0.0 0.0 0.0
+16-20 0.0 0.0 0.0 0.0
+21-50 3.3 0.0 0.0 0.0
+51-100 0.0 7.3 0.0 0.0
+101-150 0.0 0.0 0.0 0.0
+151-200 0.0 0.0 0.0 0.0
+201-500 0.0 0.0 0.0 0.0
+501-1000 0.0 0.0 0.0 0.0
+'1001+ 0.0 0.0 0.0 0.0
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results_fromblast/Orthogroups.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results_fromblast/Orthogroups.csv Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,537 @@\n+\tMycoplasma_agalactiae\tMycoplasma_gallisepticum\tMycoplasma_genitalium\tMycoplasma_hyopneumoniae\r\n+OG0000000\t\tgi|284811953|gb|ADB96857.1|, gi|284811954|gb|ADB96858.1|, gi|284811955|gb|AAP56548.2|, gi|284811956|gb|ADB96859.1|, gi|284811957|gb|ADB96860.1|, gi|284811958|gb|ADB96861.1|, gi|284811959|gb|ADB96862.1|, gi|284811960|gb|ADB96863.1|, gi|284811961|gb|ADB96864.1|, gi|284811962|gb|ADB96865.1|, gi|284812039|gb|AAP56686.2|, gi|284812040|gb|ADB96873.1|, gi|284812041|gb|ADB96874.1|, gi|284812042|gb|ADB96875.1|, gi|284812103|gb|ADB96879.1|, gi|284812104|gb|ADB96880.1|, gi|284812105|gb|AAP56776.2|, gi|284812107|gb|ADB96881.1|, gi|284812108|gb|ADB96882.1|, gi|284812128|gb|AAP56805.2|, gi|284812129|gb|AAP56806.2|, gi|284812217|gb|ADB96891.1|, gi|284812218|gb|ADB96892.1|, gi|284812219|gb|AAP56940.2|, gi|31541243|gb|AAP56545.1|, gi|31541245|gb|AAP56547.1|, gi|31541247|gb|AAP56549.1|, gi|31541248|gb|AAP56550.1|, gi|31541249|gb|AAP56551.1|, gi|31541250|gb|AAP56552.1|, gi|31541251|gb|AAP56553.1|, gi|31541252|gb|AAP56554.1|, gi|31541253|gb|AAP56555.1|, gi|31541386|gb|AAP56687.1|, gi|31541387|gb|AAP56688.1|, gi|31541388|gb|AAP56689.1|, gi|31541389|gb|AAP56690.1|, gi|31541390|gb|AAP56691.1|, gi|31541391|gb|AAP56692.1|, gi|31541392|gb|AAP56693.1|, gi|31541393|gb|AAP56694.1|, gi|31541394|gb|AAP56695.1|, gi|31541395|gb|AAP56696.1|, gi|31541396|gb|AAP56697.1|, gi|31541398|gb|AAP56699.1|, gi|31541472|gb|AAP56773.1|, gi|31541473|gb|AAP56774.1|, gi|31541474|gb|AAP56775.1|, gi|31541478|gb|AAP56779.1|, gi|31541641|gb|AAP56941.1|, gi|31541642|gb|AAP56942.1|, gi|31541643|gb|AAP56943.1|, gi|31541644|gb|AAP56944.1|, gi|31541645|gb|AAP56945.1|, gi|31541646|gb|AAP56946.1|, gi|31541647|gb|AAP56947.1|\t\t\r\n+OG0000001\tgi|290752501|emb|CBH40473.1|, gi|290752503|emb|CBH40475.1|, gi|290752692|emb|CBH40666.1|, gi|290752693|emb|CBH40667.1|, gi|290752812|emb|CBH40787.1|, gi|290752813|emb|CBH40788.1|, gi|290752814|emb|CBH40789.1|, gi|290752815|emb|CBH40790.1|, gi|290752816|emb|CBH40791.1|, gi|290752817|emb|CBH40792.1|, gi|290752818|emb|CBH40793.1|, gi|290753029|emb|CBH41005.1|, gi|290753030|emb|CBH41006.1|, gi|290753031|emb|CBH41007.1|, gi|290753032|emb|CBH41008.1|, gi|290753033|emb|CBH41009.1|, gi|290753034|emb|CBH41010.1|, gi|290753035|emb|CBH41011.1|, gi|290753036|emb|CBH41012.1|, gi|290753037|emb|CBH41013.1|, gi|290753040|emb|CBH41016.1|, gi|290753041|emb|CBH41017.1|, gi|290753042|emb|CBH41018.1|, gi|290753043|emb|CBH41019.1|, gi|290753044|emb|CBH41020.1|, gi|290753045|emb|CBH41021.1|, gi|290753046|emb|CBH41022.1|\t\t\t\r\n+OG0000002\tgi|290752526|emb|CBH40498.1|, gi|290752801|emb|CBH40776.1|, gi|290752802|emb|CBH40777.1|, gi|290753081|emb|CBH41057.1|\tgi|31541070|gb|AAP56372.1|, gi|31541268|gb|AAP56569.1|, gi|31541628|gb|AAP56928.1|, gi|31541629|gb|AAP56929.1|\tgi|1045740|gb|AAC71283.1|, gi|1045987|gb|AAC71511.1|, gi|3844775|gb|AAC71398.1|, gi|3844776|gb|AAC71399.1|, gi|3844882|gb|AAC71525.1|, gi|3845062|gb|AAC72487.1|, gi|3845064|gb|AAC72489.1|, gi|84626133|gb|AAC71526.2|\tgi|144227640|gb|AAZ44535.2|, gi|71851738|gb|AAZ44346.1|, gi|71851739|gb|AAZ44347.1|, gi|71851837|gb|AAZ44445.1|\r\n+OG0000003\tgi|290752269|emb|CBH40240.1|, gi|290752270|emb|CBH40241.1|, gi|290752414|emb|CBH40385.1|, gi|290752490|emb|CBH40462.1|, gi|290752766|emb|CBH40741.1|\tgi|31541260|gb|AAP56562.1|, gi|31541382|gb|AAP56683.1|\tgi|1046010|gb|AAC71532.1|, gi|3844907|gb|AAC71551.1|, gi|3844927|gb|AAC71569.1|\tgi|144227478|gb|AAZ44221.2|\r\n+OG0000004\tgi|290753066|emb|CBH41042.1|\tgi|284811924|gb|AAP56500.2|, gi|284811927|gb|ADB96855.1|, gi|284811928|gb|ADB96856.1|, gi|284812192|gb|AAP56901.2|, gi|31541553|gb|AAP56853.1|\tgi|1046012|gb|AAC71534.1|, gi|3844628|gb|AAC71235.1|, gi|3844797|gb|AAC71418.1|, gi|3844975|gb|AAC71613.1|\tgi|71851550|gb|AAZ44158.1|\r\n+OG0000005\tgi|290752591|emb|CBH40563.1|, gi|290752592|emb|CBH40564.1|, gi|290752893|emb|CBH40868.1|, gi|290752894|emb|CBH40869.1|\tgi|284811835|gb|AAP56356.2|, gi|284812058|gb|AAP56715.2|, gi|31541415|gb|AAP56716.1|\tgi|1045683|gb|AAC71230.1|, '..b'477\t\tgi|284811945|gb|AAP56529.2|\tgi|3844895|gb|AAC71540.1|\t\r\n+OG0000478\t\tgi|284811949|gb|AAP56536.2|\tgi|1045973|gb|AAC71500.1|\t\r\n+OG0000479\t\tgi|284811950|gb|AAP56538.2|\tgi|1045972|gb|AAC71499.1|\t\r\n+OG0000480\t\tgi|31541239|gb|AAP56541.1|\tgi|3844896|gb|AAC71541.1|\t\r\n+OG0000481\t\tgi|284811951|gb|AAP56544.2|\t\tgi|144227642|gb|AAZ44540.2|\r\n+OG0000482\t\tgi|284811972|gb|AAP56572.2|\tgi|1045980|gb|AAC71506.1|\t\r\n+OG0000483\t\tgi|31541272|gb|AAP56573.1|\tgi|1045981|gb|AAC71507.1|\t\r\n+OG0000484\t\tgi|284811973|gb|AAP56574.2|\tgi|1045982|gb|AAC71508.1|\t\r\n+OG0000485\t\tgi|284811978|gb|AAP56579.2|\tgi|3845040|gb|AAC72467.1|\t\r\n+OG0000486\t\tgi|31541293|gb|AAP56594.1|\tgi|1045977|gb|AAC71503.1|\t\r\n+OG0000487\t\tgi|284811990|gb|AAP56599.2|\t\tgi|144227563|gb|AAZ44390.2|\r\n+OG0000488\t\tgi|284811995|gb|AAP56607.2|\t\tgi|144227427|gb|AAZ44116.2|\r\n+OG0000489\t\tgi|284812002|gb|AAP56617.2|\tgi|3844925|gb|AAC71567.1|\t\r\n+OG0000490\t\tgi|284812013|gb|AAP56637.2|\tgi|3845048|gb|AAC72474.1|\t\r\n+OG0000491\t\tgi|31541356|gb|AAP56657.1|\tgi|3844990|gb|AAC71626.1|\t\r\n+OG0000492\t\tgi|31541362|gb|AAP56663.1|\t\tgi|71851833|gb|AAZ44441.1|\r\n+OG0000493\t\tgi|284812025|gb|AAP56664.2|\tgi|3844809|gb|AAC71429.1|\t\r\n+OG0000494\t\tgi|31541364|gb|AAP56665.1|\tgi|84626132|gb|ABC59631.1|\t\r\n+OG0000495\t\tgi|31541370|gb|AAP56671.1|\tgi|3844818|gb|AAC71437.1|\t\r\n+OG0000496\t\tgi|31541380|gb|AAP56681.1|\tgi|1045963|gb|AAC71491.1|\t\r\n+OG0000497\t\tgi|284812060|gb|AAP56718.2|\tgi|3844837|gb|AAC71454.1|\t\r\n+OG0000498\t\tgi|284812061|gb|AAP56721.2|\tgi|3844840|gb|AAC71457.1|\t\r\n+OG0000499\t\tgi|284812062|gb|AAP56722.2|\tgi|3844841|gb|AAC71458.1|\t\r\n+OG0000500\t\tgi|284812074|gb|AAP56734.2|\tgi|3844846|gb|AAC71463.1|\t\r\n+OG0000501\t\tgi|284812077|gb|AAP56738.2|\tgi|1045939|gb|AAC71468.1|\t\r\n+OG0000502\t\tgi|31541448|gb|AAP56749.1|\tgi|3844826|gb|AAC71444.1|\t\r\n+OG0000503\t\tgi|284812091|gb|AAP56756.2|\tgi|3844811|gb|AAC71430.1|\t\r\n+OG0000504\t\tgi|31541465|gb|AAP56766.1|\t\tgi|144227651|gb|AAZ44558.2|\r\n+OG0000505\t\tgi|31541498|gb|AAP56798.1|\tgi|3844971|gb|AAC71609.1|\t\r\n+OG0000506\t\tgi|284812125|gb|AAP56801.2|\tgi|3844978|gb|AAC71616.1|\t\r\n+OG0000507\t\tgi|31541512|gb|AAP56812.1|\tgi|3844689|gb|AAC71319.1|\t\r\n+OG0000508\t\tgi|284812140|gb|AAP56821.2|\tgi|3844721|gb|AAC71348.1|\t\r\n+OG0000509\t\tgi|284812145|gb|AAP56827.2|\tgi|84626131|gb|AAC71620.2|\t\r\n+OG0000510\t\tgi|31541528|gb|AAP56828.1|\tgi|3844984|gb|AAC71621.1|\t\r\n+OG0000511\t\tgi|31541549|gb|AAP56849.1|\tgi|3844959|gb|AAC71598.1|\t\r\n+OG0000512\t\tgi|31541558|gb|AAP56858.1|\tgi|3844638|gb|AAC71244.1|\t\r\n+OG0000513\t\tgi|284812164|gb|AAP56866.2|\tgi|3844898|gb|AAC71543.1|\t\r\n+OG0000514\t\tgi|284812171|gb|AAP56875.2|\tgi|84626128|gb|AAC71502.2|\t\r\n+OG0000515\t\tgi|284812173|gb|AAP56879.2|\tgi|3845020|gb|AAC72448.1|\t\r\n+OG0000516\t\tgi|31541590|gb|AAP56890.1|\tgi|3844885|gb|AAC71528.1|\t\r\n+OG0000517\t\tgi|31541595|gb|AAP56895.1|\tgi|3844719|gb|AAC71346.1|\t\r\n+OG0000518\t\tgi|284812188|gb|AAP56896.2|\tgi|3844718|gb|AAC71345.1|\t\r\n+OG0000519\t\tgi|284812202|gb|AAP56917.2|\tgi|3844893|gb|AAC71538.1|\t\r\n+OG0000520\t\tgi|284812208|gb|AAP56924.2|\tgi|1045731|gb|AAC71274.1|\t\r\n+OG0000521\t\tgi|284812210|gb|AAP56926.2|\tgi|3844778|gb|AAC71401.1|\t\r\n+OG0000522\t\tgi|31541648|gb|AAP56948.1|\tgi|1045712|gb|AAC71256.1|\t\r\n+OG0000523\t\tgi|31541655|gb|AAP56955.1|\tgi|3844989|gb|AAC71625.1|\t\r\n+OG0000524\t\tgi|284812225|gb|AAP56960.2|\tgi|3844682|gb|AAC71313.1|\t\r\n+OG0000525\t\tgi|284812227|gb|AAP56967.2|\tgi|3844647|gb|AAC71253.1|\t\r\n+OG0000526\t\tgi|284812245|gb|AAP56998.2|\tgi|1045728|gb|AAC71271.1|\t\r\n+OG0000527\t\tgi|284812254|gb|AAP57010.2|\tgi|3844631|gb|AAC71238.1|\t\r\n+OG0000528\t\tgi|31541720|gb|AAP57020.1|\t\tgi|144227662|gb|AAZ44577.2|\r\n+OG0000529\t\tgi|284812281|gb|AAP57051.2|\tgi|3845001|gb|AAC71636.1|\t\r\n+OG0000530\t\tgi|284812282|gb|AAP57052.2|\tgi|84626126|gb|AAC71234.2|\t\r\n+OG0000531\t\tgi|31541763|gb|AAP57062.1|\tgi|84626158|gb|AAC72481.2|\t\r\n+OG0000532\t\tgi|284812300|gb|AAP57075.2|\tgi|84626152|gb|AAC71218.2|\t\r\n+OG0000533\t\t\tgi|84626147|gb|AAC71280.2|\tgi|71851703|gb|AAZ44311.1|\r\n+OG0000534\t\t\tgi|3844705|gb|AAC71333.1|\tgi|71851627|gb|AAZ44235.1|\r\n+OG0000535\t\t\tgi|3844873|gb|AAC71515.1|\tgi|71851777|gb|AAZ44385.1|\r\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results_fromblast/Orthogroups.txt
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results_fromblast/Orthogroups.txt Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,1331 @@\n+OG0000000: gi|284811953|gb|ADB96857.1| gi|284811954|gb|ADB96858.1| gi|284811955|gb|AAP56548.2| gi|284811956|gb|ADB96859.1| gi|284811957|gb|ADB96860.1| gi|284811958|gb|ADB96861.1| gi|284811959|gb|ADB96862.1| gi|284811960|gb|ADB96863.1| gi|284811961|gb|ADB96864.1| gi|284811962|gb|ADB96865.1| gi|284812039|gb|AAP56686.2| gi|284812040|gb|ADB96873.1| gi|284812041|gb|ADB96874.1| gi|284812042|gb|ADB96875.1| gi|284812103|gb|ADB96879.1| gi|284812104|gb|ADB96880.1| gi|284812105|gb|AAP56776.2| gi|284812107|gb|ADB96881.1| gi|284812108|gb|ADB96882.1| gi|284812128|gb|AAP56805.2| gi|284812129|gb|AAP56806.2| gi|284812217|gb|ADB96891.1| gi|284812218|gb|ADB96892.1| gi|284812219|gb|AAP56940.2| gi|31541243|gb|AAP56545.1| gi|31541245|gb|AAP56547.1| gi|31541247|gb|AAP56549.1| gi|31541248|gb|AAP56550.1| gi|31541249|gb|AAP56551.1| gi|31541250|gb|AAP56552.1| gi|31541251|gb|AAP56553.1| gi|31541252|gb|AAP56554.1| gi|31541253|gb|AAP56555.1| gi|31541386|gb|AAP56687.1| gi|31541387|gb|AAP56688.1| gi|31541388|gb|AAP56689.1| gi|31541389|gb|AAP56690.1| gi|31541390|gb|AAP56691.1| gi|31541391|gb|AAP56692.1| gi|31541392|gb|AAP56693.1| gi|31541393|gb|AAP56694.1| gi|31541394|gb|AAP56695.1| gi|31541395|gb|AAP56696.1| gi|31541396|gb|AAP56697.1| gi|31541398|gb|AAP56699.1| gi|31541472|gb|AAP56773.1| gi|31541473|gb|AAP56774.1| gi|31541474|gb|AAP56775.1| gi|31541478|gb|AAP56779.1| gi|31541641|gb|AAP56941.1| gi|31541642|gb|AAP56942.1| gi|31541643|gb|AAP56943.1| gi|31541644|gb|AAP56944.1| gi|31541645|gb|AAP56945.1| gi|31541646|gb|AAP56946.1| gi|31541647|gb|AAP56947.1|\n+OG0000001: gi|290752501|emb|CBH40473.1| gi|290752503|emb|CBH40475.1| gi|290752692|emb|CBH40666.1| gi|290752693|emb|CBH40667.1| gi|290752812|emb|CBH40787.1| gi|290752813|emb|CBH40788.1| gi|290752814|emb|CBH40789.1| gi|290752815|emb|CBH40790.1| gi|290752816|emb|CBH40791.1| gi|290752817|emb|CBH40792.1| gi|290752818|emb|CBH40793.1| gi|290753029|emb|CBH41005.1| gi|290753030|emb|CBH41006.1| gi|290753031|emb|CBH41007.1| gi|290753032|emb|CBH41008.1| gi|290753033|emb|CBH41009.1| gi|290753034|emb|CBH41010.1| gi|290753035|emb|CBH41011.1| gi|290753036|emb|CBH41012.1| gi|290753037|emb|CBH41013.1| gi|290753040|emb|CBH41016.1| gi|290753041|emb|CBH41017.1| gi|290753042|emb|CBH41018.1| gi|290753043|emb|CBH41019.1| gi|290753044|emb|CBH41020.1| gi|290753045|emb|CBH41021.1| gi|290753046|emb|CBH41022.1|\n+OG0000002: gi|1045740|gb|AAC71283.1| gi|1045987|gb|AAC71511.1| gi|144227640|gb|AAZ44535.2| gi|290752526|emb|CBH40498.1| gi|290752801|emb|CBH40776.1| gi|290752802|emb|CBH40777.1| gi|290753081|emb|CBH41057.1| gi|31541070|gb|AAP56372.1| gi|31541268|gb|AAP56569.1| gi|31541628|gb|AAP56928.1| gi|31541629|gb|AAP56929.1| gi|3844775|gb|AAC71398.1| gi|3844776|gb|AAC71399.1| gi|3844882|gb|AAC71525.1| gi|3845062|gb|AAC72487.1| gi|3845064|gb|AAC72489.1| gi|71851738|gb|AAZ44346.1| gi|71851739|gb|AAZ44347.1| gi|71851837|gb|AAZ44445.1| gi|84626133|gb|AAC71526.2|\n+OG0000003: gi|1046010|gb|AAC71532.1| gi|144227478|gb|AAZ44221.2| gi|290752269|emb|CBH40240.1| gi|290752270|emb|CBH40241.1| gi|290752414|emb|CBH40385.1| gi|290752490|emb|CBH40462.1| gi|290752766|emb|CBH40741.1| gi|31541260|gb|AAP56562.1| gi|31541382|gb|AAP56683.1| gi|3844907|gb|AAC71551.1| gi|3844927|gb|AAC71569.1|\n+OG0000004: gi|1046012|gb|AAC71534.1| gi|284811924|gb|AAP56500.2| gi|284811927|gb|ADB96855.1| gi|284811928|gb|ADB96856.1| gi|284812192|gb|AAP56901.2| gi|290753066|emb|CBH41042.1| gi|31541553|gb|AAP56853.1| gi|3844628|gb|AAC71235.1| gi|3844797|gb|AAC71418.1| gi|3844975|gb|AAC71613.1| gi|71851550|gb|AAZ44158.1|\n+OG0000005: gi|1045683|gb|AAC71230.1| gi|1045684|gb|AAC71231.1| gi|284811835|gb|AAP56356.2| gi|284812058|gb|AAP56715.2| gi|290752591|emb|CBH40563.1| gi|290752592|emb|CBH40564.1| gi|290752893|emb|CBH40868.1| gi|290752894|emb|CBH40869.1| gi|31541415|gb|AAP56716.1|\n+OG0000006: gi|31541304|gb|AAP56605.1| gi|71851504|gb|AAZ44112.1| gi|71851505|gb|AAZ44113.1| gi|71851506|gb|AAZ44114.1| gi|71851779|gb|AAZ44387.1| gi|71851788|gb|AAZ44396.1| gi|71851789|gb|AAZ'..b'01230: gi|144227613|gb|AAZ44488.2|\n+OG0001231: gi|71851881|gb|AAZ44489.1|\n+OG0001232: gi|144227616|gb|AAZ44498.2|\n+OG0001233: gi|144227617|gb|AAZ44499.2|\n+OG0001234: gi|144227618|gb|AAZ44501.2|\n+OG0001235: gi|71851895|gb|AAZ44503.1|\n+OG0001236: gi|71851899|gb|AAZ44507.1|\n+OG0001237: gi|71851900|gb|AAZ44508.1|\n+OG0001238: gi|71851902|gb|AAZ44510.1|\n+OG0001239: gi|144227625|gb|AAZ44516.2|\n+OG0001240: gi|71851909|gb|AAZ44517.1|\n+OG0001241: gi|144227629|gb|AAZ44523.2|\n+OG0001242: gi|144227630|gb|AAZ44524.2|\n+OG0001243: gi|144227631|gb|AAZ44526.2|\n+OG0001244: gi|144227632|gb|AAZ44527.2|\n+OG0001245: gi|144227633|gb|ABO93479.1|\n+OG0001246: gi|144227634|gb|AAZ44528.2|\n+OG0001247: gi|71851921|gb|AAZ44529.1|\n+OG0001248: gi|144227635|gb|AAZ44530.2|\n+OG0001249: gi|144227636|gb|AAZ44531.2|\n+OG0001250: gi|71851929|gb|AAZ44537.1|\n+OG0001251: gi|71851936|gb|AAZ44544.1|\n+OG0001252: gi|144227644|gb|AAZ44545.2|\n+OG0001253: gi|144227645|gb|AAZ44546.2|\n+OG0001254: gi|144227647|gb|AAZ44549.2|\n+OG0001255: gi|144227650|gb|AAZ44554.2|\n+OG0001256: gi|71851956|gb|AAZ44564.1|\n+OG0001257: gi|144227656|gb|AAZ44567.2|\n+OG0001258: gi|144227660|gb|AAZ44572.2|\n+OG0001259: gi|71851966|gb|AAZ44574.1|\n+OG0001260: gi|144227661|gb|AAZ44576.2|\n+OG0001261: gi|71851971|gb|AAZ44579.1|\n+OG0001262: gi|71851972|gb|AAZ44580.1|\n+OG0001263: gi|71851985|gb|AAZ44593.1|\n+OG0001264: gi|71851986|gb|AAZ44594.1|\n+OG0001265: gi|144227667|gb|AAZ44595.2|\n+OG0001266: gi|71851988|gb|AAZ44596.1|\n+OG0001267: gi|71851989|gb|AAZ44597.1|\n+OG0001268: gi|144227668|gb|AAZ44598.2|\n+OG0001269: gi|71851991|gb|AAZ44599.1|\n+OG0001270: gi|144227669|gb|AAZ44600.2|\n+OG0001271: gi|144227670|gb|AAZ44601.2|\n+OG0001272: gi|144227671|gb|AAZ44602.2|\n+OG0001273: gi|144227672|gb|AAZ44604.2|\n+OG0001274: gi|144227673|gb|AAZ44605.2|\n+OG0001275: gi|144227674|gb|AAZ44606.2|\n+OG0001276: gi|144227675|gb|AAZ44607.2|\n+OG0001277: gi|144227676|gb|ABO93480.1|\n+OG0001278: gi|144227681|gb|AAZ44617.2|\n+OG0001279: gi|144227683|gb|AAZ44623.2|\n+OG0001280: gi|144227688|gb|ABO93481.1|\n+OG0001281: gi|144227689|gb|AAZ44632.2|\n+OG0001282: gi|71852025|gb|AAZ44633.1|\n+OG0001283: gi|144227690|gb|AAZ44637.2|\n+OG0001284: gi|71852030|gb|AAZ44638.1|\n+OG0001285: gi|144227691|gb|AAZ44639.2|\n+OG0001286: gi|71852032|gb|AAZ44640.1|\n+OG0001287: gi|71852034|gb|AAZ44642.1|\n+OG0001288: gi|71852035|gb|AAZ44643.1|\n+OG0001289: gi|144227693|gb|AAZ44644.2|\n+OG0001290: gi|144227694|gb|ABO93482.1|\n+OG0001291: gi|144227695|gb|AAZ44645.2|\n+OG0001292: gi|71852038|gb|AAZ44646.1|\n+OG0001293: gi|144227696|gb|AAZ44647.2|\n+OG0001294: gi|71852040|gb|AAZ44648.1|\n+OG0001295: gi|144227697|gb|AAZ44650.2|\n+OG0001296: gi|71852043|gb|AAZ44651.1|\n+OG0001297: gi|144227698|gb|ABO93483.1|\n+OG0001298: gi|144227699|gb|AAZ44652.2|\n+OG0001299: gi|144227700|gb|AAZ44653.2|\n+OG0001300: gi|144227701|gb|AAZ44654.2|\n+OG0001301: gi|71852048|gb|AAZ44656.1|\n+OG0001302: gi|144227703|gb|AAZ44657.2|\n+OG0001303: gi|144227704|gb|AAZ44658.2|\n+OG0001304: gi|71852052|gb|AAZ44660.1|\n+OG0001305: gi|144227707|gb|AAZ44671.2|\n+OG0001306: gi|144227709|gb|ABO93484.1|\n+OG0001307: gi|144227715|gb|AAZ44680.2|\n+OG0001308: gi|144227716|gb|AAZ44681.2|\n+OG0001309: gi|144227717|gb|AAZ44682.2|\n+OG0001310: gi|71852075|gb|AAZ44683.1|\n+OG0001311: gi|144227718|gb|AAZ44684.2|\n+OG0001312: gi|71852077|gb|AAZ44685.1|\n+OG0001313: gi|144227719|gb|AAZ44686.2|\n+OG0001314: gi|144227725|gb|AAZ44696.2|\n+OG0001315: gi|144227730|gb|AAZ44708.2|\n+OG0001316: gi|71852101|gb|AAZ44709.1|\n+OG0001317: gi|144227731|gb|AAZ44711.2|\n+OG0001318: gi|144227732|gb|AAZ44712.2|\n+OG0001319: gi|144227736|gb|AAZ44718.2|\n+OG0001320: gi|71852114|gb|AAZ44722.1|\n+OG0001321: gi|144227745|gb|AAZ44743.2|\n+OG0001322: gi|144227746|gb|AAZ44744.2|\n+OG0001323: gi|144227747|gb|AAZ44745.2|\n+OG0001324: gi|71852138|gb|AAZ44746.1|\n+OG0001325: gi|71852139|gb|AAZ44747.1|\n+OG0001326: gi|71852141|gb|AAZ44749.1|\n+OG0001327: gi|144227748|gb|AAZ44751.2|\n+OG0001328: gi|71852145|gb|AAZ44753.1|\n+OG0001329: gi|144227749|gb|AAZ44755.2|\n+OG0001330: gi|144227750|gb|AAZ44756.2|\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results_fromblast/Orthogroups_SpeciesOverlaps.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results_fromblast/Orthogroups_SpeciesOverlaps.csv Tue Oct 24 06:40:40 2017 -0400
b
@@ -0,0 +1,5 @@
+ Mycoplasma_agalactiae Mycoplasma_gallisepticum Mycoplasma_genitalium Mycoplasma_hyopneumoniae
+Mycoplasma_agalactiae 430 358 302 389
+Mycoplasma_gallisepticum 358 459 383 344
+Mycoplasma_genitalium 302 383 392 294
+Mycoplasma_hyopneumoniae 389 344 294 416
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results_fromblast/Orthogroups_UnassignedGenes.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results_fromblast/Orthogroups_UnassignedGenes.csv Tue Oct 24 06:40:40 2017 -0400
b
b'@@ -0,0 +1,796 @@\n+\tMycoplasma_agalactiae\tMycoplasma_gallisepticum\tMycoplasma_genitalium\tMycoplasma_hyopneumoniae\r\n+OG0000536\tgi|290752272|emb|CBH40243.1|\t\t\t\r\n+OG0000537\tgi|290752276|emb|CBH40247.1|\t\t\t\r\n+OG0000538\tgi|290752279|emb|CBH40250.1|\t\t\t\r\n+OG0000539\tgi|290752285|emb|CBH40256.1|\t\t\t\r\n+OG0000540\tgi|290752286|emb|CBH40257.1|\t\t\t\r\n+OG0000541\tgi|290752287|emb|CBH40258.1|\t\t\t\r\n+OG0000542\tgi|290752288|emb|CBH40259.1|\t\t\t\r\n+OG0000543\tgi|290752289|emb|CBH40260.1|\t\t\t\r\n+OG0000544\tgi|290752290|emb|CBH40261.1|\t\t\t\r\n+OG0000545\tgi|290752291|emb|CBH40262.1|\t\t\t\r\n+OG0000546\tgi|290752293|emb|CBH40264.1|\t\t\t\r\n+OG0000547\tgi|290752294|emb|CBH40265.1|\t\t\t\r\n+OG0000548\tgi|290752295|emb|CBH40266.1|\t\t\t\r\n+OG0000549\tgi|290752296|emb|CBH40267.1|\t\t\t\r\n+OG0000550\tgi|290752297|emb|CBH40268.1|\t\t\t\r\n+OG0000551\tgi|290752306|emb|CBH40277.1|\t\t\t\r\n+OG0000552\tgi|290752310|emb|CBH40281.1|\t\t\t\r\n+OG0000553\tgi|290752313|emb|CBH40284.1|\t\t\t\r\n+OG0000554\tgi|290752314|emb|CBH40285.1|\t\t\t\r\n+OG0000555\tgi|290752319|emb|CBH40290.1|\t\t\t\r\n+OG0000556\tgi|290752342|emb|CBH40313.1|\t\t\t\r\n+OG0000557\tgi|290752345|emb|CBH40316.1|\t\t\t\r\n+OG0000558\tgi|290752348|emb|CBH40319.1|\t\t\t\r\n+OG0000559\tgi|290752349|emb|CBH40320.1|\t\t\t\r\n+OG0000560\tgi|290752350|emb|CBH40321.1|\t\t\t\r\n+OG0000561\tgi|290752353|emb|CBH40324.1|\t\t\t\r\n+OG0000562\tgi|290752355|emb|CBH40326.1|\t\t\t\r\n+OG0000563\tgi|290752359|emb|CBH40330.1|\t\t\t\r\n+OG0000564\tgi|290752362|emb|CBH40333.1|\t\t\t\r\n+OG0000565\tgi|290752367|emb|CBH40338.1|\t\t\t\r\n+OG0000566\tgi|290752368|emb|CBH40339.1|\t\t\t\r\n+OG0000567\tgi|290752374|emb|CBH40345.1|\t\t\t\r\n+OG0000568\tgi|290752375|emb|CBH40346.1|\t\t\t\r\n+OG0000569\tgi|290752377|emb|CBH40348.1|\t\t\t\r\n+OG0000570\tgi|290752380|emb|CBH40351.1|\t\t\t\r\n+OG0000571\tgi|290752387|emb|CBH40358.1|\t\t\t\r\n+OG0000572\tgi|290752389|emb|CBH40360.1|\t\t\t\r\n+OG0000573\tgi|290752396|emb|CBH40367.1|\t\t\t\r\n+OG0000574\tgi|290752398|emb|CBH40369.1|\t\t\t\r\n+OG0000575\tgi|290752399|emb|CBH40370.1|\t\t\t\r\n+OG0000576\tgi|290752400|emb|CBH40371.1|\t\t\t\r\n+OG0000577\tgi|290752405|emb|CBH40376.1|\t\t\t\r\n+OG0000578\tgi|290752407|emb|CBH40378.1|\t\t\t\r\n+OG0000579\tgi|290752409|emb|CBH40380.1|\t\t\t\r\n+OG0000580\tgi|290752411|emb|CBH40382.1|\t\t\t\r\n+OG0000581\tgi|290752412|emb|CBH40383.1|\t\t\t\r\n+OG0000582\tgi|290752413|emb|CBH40384.1|\t\t\t\r\n+OG0000583\tgi|290752415|emb|CBH40386.1|\t\t\t\r\n+OG0000584\tgi|290752417|emb|CBH40388.1|\t\t\t\r\n+OG0000585\tgi|290752419|emb|CBH40390.1|\t\t\t\r\n+OG0000586\tgi|290752421|emb|CBH40392.1|\t\t\t\r\n+OG0000587\tgi|290752423|emb|CBH40394.1|\t\t\t\r\n+OG0000588\tgi|290752424|emb|CBH40395.1|\t\t\t\r\n+OG0000589\tgi|290752425|emb|CBH40396.1|\t\t\t\r\n+OG0000590\tgi|290752428|emb|CBH40399.1|\t\t\t\r\n+OG0000591\tgi|290752429|emb|CBH40400.1|\t\t\t\r\n+OG0000592\tgi|290752430|emb|CBH40401.1|\t\t\t\r\n+OG0000593\tgi|290752432|emb|CBH40403.1|\t\t\t\r\n+OG0000594\tgi|290752436|emb|CBH40407.1|\t\t\t\r\n+OG0000595\tgi|290752439|emb|CBH40410.1|\t\t\t\r\n+OG0000596\tgi|290752444|emb|CBH40415.1|\t\t\t\r\n+OG0000597\tgi|290752447|emb|CBH40418.1|\t\t\t\r\n+OG0000598\tgi|290752448|emb|CBH40420.1|\t\t\t\r\n+OG0000599\tgi|290752449|emb|CBH40421.1|\t\t\t\r\n+OG0000600\tgi|290752453|emb|CBH40425.1|\t\t\t\r\n+OG0000601\tgi|290752457|emb|CBH40429.1|\t\t\t\r\n+OG0000602\tgi|290752462|emb|CBH40434.1|\t\t\t\r\n+OG0000603\tgi|290752466|emb|CBH40438.1|\t\t\t\r\n+OG0000604\tgi|290752472|emb|CBH40444.1|\t\t\t\r\n+OG0000605\tgi|290752473|emb|CBH40445.1|\t\t\t\r\n+OG0000606\tgi|290752474|emb|CBH40446.1|\t\t\t\r\n+OG0000607\tgi|290752475|emb|CBH40447.1|\t\t\t\r\n+OG0000608\tgi|290752476|emb|CBH40448.1|\t\t\t\r\n+OG0000609\tgi|290752495|emb|CBH40467.1|\t\t\t\r\n+OG0000610\tgi|290752500|emb|CBH40472.1|\t\t\t\r\n+OG0000611\tgi|290752502|emb|CBH40474.1|\t\t\t\r\n+OG0000612\tgi|290752505|emb|CBH40477.1|\t\t\t\r\n+OG0000613\tgi|290752506|emb|CBH40478.1|\t\t\t\r\n+OG0000614\tgi|290752507|emb|CBH40479.1|\t\t\t\r\n+OG0000615\tgi|290752509|emb|CBH40481.1|\t\t\t\r\n+OG0000616\tgi|290752510|emb|CBH40482.1|\t\t\t\r\n+OG0000617\tgi|290752511|emb|CBH40483.1|\t\t\t\r\n+OG0000618\tgi|290752512|emb|CBH40484.1|\t\t\t\r\n+OG0000619\tgi|290752514|emb|CBH40486.1|\t\t\t\r\n+OG0000620\tgi|290752517|emb|CBH40489.1|\t\t\t\r\n+OG0000621\tgi|290752524|emb|CBH40496.1|\t\t\t\r\n+OG0000622\tgi|290752528|emb|CBH40500.1|\t\t\t\r\n+OG0000623\tgi|290752537|emb|CBH40509.1|\t\t\t\r\n+OG0000624\tg'..b'\t\t\t\tgi|71851900|gb|AAZ44508.1|\r\n+OG0001238\t\t\t\tgi|71851902|gb|AAZ44510.1|\r\n+OG0001239\t\t\t\tgi|144227625|gb|AAZ44516.2|\r\n+OG0001240\t\t\t\tgi|71851909|gb|AAZ44517.1|\r\n+OG0001241\t\t\t\tgi|144227629|gb|AAZ44523.2|\r\n+OG0001242\t\t\t\tgi|144227630|gb|AAZ44524.2|\r\n+OG0001243\t\t\t\tgi|144227631|gb|AAZ44526.2|\r\n+OG0001244\t\t\t\tgi|144227632|gb|AAZ44527.2|\r\n+OG0001245\t\t\t\tgi|144227633|gb|ABO93479.1|\r\n+OG0001246\t\t\t\tgi|144227634|gb|AAZ44528.2|\r\n+OG0001247\t\t\t\tgi|71851921|gb|AAZ44529.1|\r\n+OG0001248\t\t\t\tgi|144227635|gb|AAZ44530.2|\r\n+OG0001249\t\t\t\tgi|144227636|gb|AAZ44531.2|\r\n+OG0001250\t\t\t\tgi|71851929|gb|AAZ44537.1|\r\n+OG0001251\t\t\t\tgi|71851936|gb|AAZ44544.1|\r\n+OG0001252\t\t\t\tgi|144227644|gb|AAZ44545.2|\r\n+OG0001253\t\t\t\tgi|144227645|gb|AAZ44546.2|\r\n+OG0001254\t\t\t\tgi|144227647|gb|AAZ44549.2|\r\n+OG0001255\t\t\t\tgi|144227650|gb|AAZ44554.2|\r\n+OG0001256\t\t\t\tgi|71851956|gb|AAZ44564.1|\r\n+OG0001257\t\t\t\tgi|144227656|gb|AAZ44567.2|\r\n+OG0001258\t\t\t\tgi|144227660|gb|AAZ44572.2|\r\n+OG0001259\t\t\t\tgi|71851966|gb|AAZ44574.1|\r\n+OG0001260\t\t\t\tgi|144227661|gb|AAZ44576.2|\r\n+OG0001261\t\t\t\tgi|71851971|gb|AAZ44579.1|\r\n+OG0001262\t\t\t\tgi|71851972|gb|AAZ44580.1|\r\n+OG0001263\t\t\t\tgi|71851985|gb|AAZ44593.1|\r\n+OG0001264\t\t\t\tgi|71851986|gb|AAZ44594.1|\r\n+OG0001265\t\t\t\tgi|144227667|gb|AAZ44595.2|\r\n+OG0001266\t\t\t\tgi|71851988|gb|AAZ44596.1|\r\n+OG0001267\t\t\t\tgi|71851989|gb|AAZ44597.1|\r\n+OG0001268\t\t\t\tgi|144227668|gb|AAZ44598.2|\r\n+OG0001269\t\t\t\tgi|71851991|gb|AAZ44599.1|\r\n+OG0001270\t\t\t\tgi|144227669|gb|AAZ44600.2|\r\n+OG0001271\t\t\t\tgi|144227670|gb|AAZ44601.2|\r\n+OG0001272\t\t\t\tgi|144227671|gb|AAZ44602.2|\r\n+OG0001273\t\t\t\tgi|144227672|gb|AAZ44604.2|\r\n+OG0001274\t\t\t\tgi|144227673|gb|AAZ44605.2|\r\n+OG0001275\t\t\t\tgi|144227674|gb|AAZ44606.2|\r\n+OG0001276\t\t\t\tgi|144227675|gb|AAZ44607.2|\r\n+OG0001277\t\t\t\tgi|144227676|gb|ABO93480.1|\r\n+OG0001278\t\t\t\tgi|144227681|gb|AAZ44617.2|\r\n+OG0001279\t\t\t\tgi|144227683|gb|AAZ44623.2|\r\n+OG0001280\t\t\t\tgi|144227688|gb|ABO93481.1|\r\n+OG0001281\t\t\t\tgi|144227689|gb|AAZ44632.2|\r\n+OG0001282\t\t\t\tgi|71852025|gb|AAZ44633.1|\r\n+OG0001283\t\t\t\tgi|144227690|gb|AAZ44637.2|\r\n+OG0001284\t\t\t\tgi|71852030|gb|AAZ44638.1|\r\n+OG0001285\t\t\t\tgi|144227691|gb|AAZ44639.2|\r\n+OG0001286\t\t\t\tgi|71852032|gb|AAZ44640.1|\r\n+OG0001287\t\t\t\tgi|71852034|gb|AAZ44642.1|\r\n+OG0001288\t\t\t\tgi|71852035|gb|AAZ44643.1|\r\n+OG0001289\t\t\t\tgi|144227693|gb|AAZ44644.2|\r\n+OG0001290\t\t\t\tgi|144227694|gb|ABO93482.1|\r\n+OG0001291\t\t\t\tgi|144227695|gb|AAZ44645.2|\r\n+OG0001292\t\t\t\tgi|71852038|gb|AAZ44646.1|\r\n+OG0001293\t\t\t\tgi|144227696|gb|AAZ44647.2|\r\n+OG0001294\t\t\t\tgi|71852040|gb|AAZ44648.1|\r\n+OG0001295\t\t\t\tgi|144227697|gb|AAZ44650.2|\r\n+OG0001296\t\t\t\tgi|71852043|gb|AAZ44651.1|\r\n+OG0001297\t\t\t\tgi|144227698|gb|ABO93483.1|\r\n+OG0001298\t\t\t\tgi|144227699|gb|AAZ44652.2|\r\n+OG0001299\t\t\t\tgi|144227700|gb|AAZ44653.2|\r\n+OG0001300\t\t\t\tgi|144227701|gb|AAZ44654.2|\r\n+OG0001301\t\t\t\tgi|71852048|gb|AAZ44656.1|\r\n+OG0001302\t\t\t\tgi|144227703|gb|AAZ44657.2|\r\n+OG0001303\t\t\t\tgi|144227704|gb|AAZ44658.2|\r\n+OG0001304\t\t\t\tgi|71852052|gb|AAZ44660.1|\r\n+OG0001305\t\t\t\tgi|144227707|gb|AAZ44671.2|\r\n+OG0001306\t\t\t\tgi|144227709|gb|ABO93484.1|\r\n+OG0001307\t\t\t\tgi|144227715|gb|AAZ44680.2|\r\n+OG0001308\t\t\t\tgi|144227716|gb|AAZ44681.2|\r\n+OG0001309\t\t\t\tgi|144227717|gb|AAZ44682.2|\r\n+OG0001310\t\t\t\tgi|71852075|gb|AAZ44683.1|\r\n+OG0001311\t\t\t\tgi|144227718|gb|AAZ44684.2|\r\n+OG0001312\t\t\t\tgi|71852077|gb|AAZ44685.1|\r\n+OG0001313\t\t\t\tgi|144227719|gb|AAZ44686.2|\r\n+OG0001314\t\t\t\tgi|144227725|gb|AAZ44696.2|\r\n+OG0001315\t\t\t\tgi|144227730|gb|AAZ44708.2|\r\n+OG0001316\t\t\t\tgi|71852101|gb|AAZ44709.1|\r\n+OG0001317\t\t\t\tgi|144227731|gb|AAZ44711.2|\r\n+OG0001318\t\t\t\tgi|144227732|gb|AAZ44712.2|\r\n+OG0001319\t\t\t\tgi|144227736|gb|AAZ44718.2|\r\n+OG0001320\t\t\t\tgi|71852114|gb|AAZ44722.1|\r\n+OG0001321\t\t\t\tgi|144227745|gb|AAZ44743.2|\r\n+OG0001322\t\t\t\tgi|144227746|gb|AAZ44744.2|\r\n+OG0001323\t\t\t\tgi|144227747|gb|AAZ44745.2|\r\n+OG0001324\t\t\t\tgi|71852138|gb|AAZ44746.1|\r\n+OG0001325\t\t\t\tgi|71852139|gb|AAZ44747.1|\r\n+OG0001326\t\t\t\tgi|71852141|gb|AAZ44749.1|\r\n+OG0001327\t\t\t\tgi|144227748|gb|AAZ44751.2|\r\n+OG0001328\t\t\t\tgi|71852145|gb|AAZ44753.1|\r\n+OG0001329\t\t\t\tgi|144227749|gb|AAZ44755.2|\r\n+OG0001330\t\t\t\tgi|144227750|gb|AAZ44756.2|\r\n'
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results_fromblast/Statistics_Overall.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results_fromblast/Statistics_Overall.csv Tue Oct 24 06:40:40 2017 -0400
b
@@ -0,0 +1,51 @@
+Number of genes 2733
+Number of genes in orthogroups 1938
+Number of unassigned genes 795
+Percentage of genes in orthogroups 70.9
+Percentage of unassigned genes 29.1
+Number of orthogroups 536
+Number of species-specific orthogroups 6
+Number of genes in species-specific orthogroups 100
+Percentage of genes in species-specific orthogroups 3.7
+Mean orthogroup size 3.6
+Median orthogroup size 4.0
+G50 (assigned genes) 4
+G50 (all genes) 4
+O50 (assigned genes) 199
+O50 (all genes) 299
+Number of orthogroups with all species present 278
+Number of single-copy orthogroups 254
+Date 2017-06-08
+Orthogroups file Orthogroups.csv
+Unassigned genes file Orthogroups_UnassignedGenes.csv
+Per-species statistics Statistics_PerSpecies.csv
+Overall statistics Statistics_Overall.csv
+Orthogroups shared between species Orthogroups_SpeciesOverlaps.csv
+
+Average number of genes per-species in orthogroup Number of orthogroups Percentage of orthogroups Number of genes Percentage of genes
+<1 224 41.8 516 26.6
+'1 302 56.3 1254 64.7
+'2 7 1.3 65 3.4
+'3 0 0.0 0 0.0
+'4 0 0.0 0 0.0
+'5 1 0.2 20 1.0
+'6 1 0.2 27 1.4
+'7 0 0.0 0 0.0
+'8 0 0.0 0 0.0
+'9 0 0.0 0 0.0
+'10 0 0.0 0 0.0
+11-15 1 0.2 56 2.9
+16-20 0 0.0 0 0.0
+21-50 0 0.0 0 0.0
+51-100 0 0.0 0 0.0
+101-150 0 0.0 0 0.0
+151-200 0 0.0 0 0.0
+201-500 0 0.0 0 0.0
+501-1000 0 0.0 0 0.0
+'1001+ 0 0.0 0 0.0
+
+Number of species in orthogroup Number of orthogroups
+1 6
+2 177
+3 75
+4 278
b
diff -r 000000000000 -r bfb20dbe1309 test-data/results_fromblast/Statistics_PerSpecies.csv
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/results_fromblast/Statistics_PerSpecies.csv Tue Oct 24 06:40:40 2017 -0400
b
@@ -0,0 +1,100 @@
+ Mycoplasma_agalactiae Mycoplasma_gallisepticum Mycoplasma_genitalium Mycoplasma_hyopneumoniae
+Number of genes 820 763 476 674
+Number of genes in orthogroups 503 561 429 445
+Number of unassigned genes 317 202 47 229
+Percentage of genes in orthogroups 61.3 73.5 90.1 66.0
+Percentage of unassigned genes 38.7 26.5 9.9 34.0
+Number of orthogroups containing species 430 459 392 416
+Percentage of orthogroups containing species 80.2 85.6 73.1 77.6
+Number of species-specific orthogroups 3 2 0 1
+Number of genes in species-specific orthogroups 34 61 0 5
+Percentage of genes in species-specific orthogroups 4.1 8.0 0.0 0.7
+
+
+Number of genes per-species in orthogroup Number of orthogroups Number of orthogroups Number of orthogroups Number of orthogroups
+'0 106 77 144 120
+'1 398 427 368 405
+'2 21 21 17 6
+'3 6 6 5 1
+'4 2 2 1 1
+'5 2 2 0 1
+'6 0 0 0 0
+'7 0 0 0 0
+'8 0 0 1 2
+'9 0 0 0 0
+'10 0 0 0 0
+11-15 0 0 0 0
+16-20 0 0 0 0
+21-50 1 0 0 0
+51-100 0 1 0 0
+101-150 0 0 0 0
+151-200 0 0 0 0
+201-500 0 0 0 0
+501-1000 0 0 0 0
+'1001+ 0 0 0 0
+
+Number of genes per-species in orthogroup Percentage of orthogroups Percentage of orthogroups Percentage of orthogroups Percentage of orthogroups
+'0 19.8 14.4 26.9 22.4
+'1 74.3 79.7 68.7 75.6
+'2 3.9 3.9 3.2 1.1
+'3 1.1 1.1 0.9 0.2
+'4 0.4 0.4 0.2 0.2
+'5 0.4 0.4 0.0 0.2
+'6 0.0 0.0 0.0 0.0
+'7 0.0 0.0 0.0 0.0
+'8 0.0 0.0 0.2 0.4
+'9 0.0 0.0 0.0 0.0
+'10 0.0 0.0 0.0 0.0
+11-15 0.0 0.0 0.0 0.0
+16-20 0.0 0.0 0.0 0.0
+21-50 0.2 0.0 0.0 0.0
+51-100 0.0 0.2 0.0 0.0
+101-150 0.0 0.0 0.0 0.0
+151-200 0.0 0.0 0.0 0.0
+201-500 0.0 0.0 0.0 0.0
+501-1000 0.0 0.0 0.0 0.0
+'1001+ 0.0 0.0 0.0 0.0
+
+Number of genes per-species in orthogroup Number of genes Number of genes Number of genes Number of genes
+'0 0 0 0 0
+'1 398 427 368 405
+'2 42 42 34 12
+'3 18 18 15 3
+'4 8 8 4 4
+'5 10 10 0 5
+'6 0 0 0 0
+'7 0 0 0 0
+'8 0 0 8 16
+'9 0 0 0 0
+'10 0 0 0 0
+11-15 0 0 0 0
+16-20 0 0 0 0
+21-50 27 0 0 0
+51-100 0 56 0 0
+101-150 0 0 0 0
+151-200 0 0 0 0
+201-500 0 0 0 0
+501-1000 0 0 0 0
+'1001+ 0 0 0 0
+
+Number of genes per-species in orthogroup Percentage of genes Percentage of genes Percentage of genes Percentage of genes
+'0 0.0 0.0 0.0 0.0
+'1 48.5 56.0 77.3 60.1
+'2 5.1 5.5 7.1 1.8
+'3 2.2 2.4 3.2 0.4
+'4 1.0 1.0 0.8 0.6
+'5 1.2 1.3 0.0 0.7
+'6 0.0 0.0 0.0 0.0
+'7 0.0 0.0 0.0 0.0
+'8 0.0 0.0 1.7 2.4
+'9 0.0 0.0 0.0 0.0
+'10 0.0 0.0 0.0 0.0
+11-15 0.0 0.0 0.0 0.0
+16-20 0.0 0.0 0.0 0.0
+21-50 3.3 0.0 0.0 0.0
+51-100 0.0 7.3 0.0 0.0
+101-150 0.0 0.0 0.0 0.0
+151-200 0.0 0.0 0.0 0.0
+201-500 0.0 0.0 0.0 0.0
+501-1000 0.0 0.0 0.0 0.0
+'1001+ 0.0 0.0 0.0 0.0