Repository 'funannotate_predict'
hg clone https://toolshed.g2.bx.psu.edu/repos/iuc/funannotate_predict

Changeset 7:51b6ee65ef7f (2023-04-13)
Previous changeset 6:7abc5f6dd595 (2023-01-22) Next changeset 8:f31125bb85ea (2023-04-25)
Commit message:
planemo upload for repository https://github.com/galaxyproject/tools-iuc/tree/main/tools/funannotate commit 2589d2785ca90160a22a5fe14e03311e189ea51d
modified:
funannotate_predict.xml
macros.xml
test-data/genome_masked.fa
test-data/predict_scratch/Genus_species.discrepency.report.txt
test-data/predict_scratch/Genus_species.error.summary.txt
test-data/predict_scratch/Genus_species.stats.json
test-data/predict_scratch/Genus_species.validation.txt
added:
test-data/funannotate_db/insecta/hmms/EOG090W00C1.hmm
test-data/funannotate_db/insecta/hmms/EOG090W01M6.hmm
test-data/funannotate_db/insecta/hmms/EOG090W02B6.hmm
test-data/funannotate_db/insecta/hmms/EOG090W02CW.hmm
test-data/funannotate_db/insecta/hmms/EOG090W04UC.hmm
test-data/funannotate_db/insecta/hmms/EOG090W06CL.hmm
test-data/funannotate_db/insecta/hmms/EOG090W06HU.hmm
test-data/funannotate_db/insecta/hmms/EOG090W06OE.hmm
test-data/funannotate_db/insecta/hmms/EOG090W07NX.hmm
test-data/funannotate_db/insecta/hmms/EOG090W08R7.hmm
test-data/funannotate_db/insecta/hmms/EOG090W09HB.hmm
test-data/funannotate_db/insecta/hmms/EOG090W0CIU.hmm
test-data/funannotate_db/insecta/hmms/EOG090W0DGR.hmm
test-data/funannotate_db/insecta/hmms/EOG090W0E07.hmm
test-data/funannotate_db/insecta/hmms/EOG090W0EOF.hmm
test-data/funannotate_db/insecta/hmms/EOG090W0IVU.hmm
test-data/funannotate_db/insecta/hmms/EOG090W0MBV.hmm
test-data/funannotate_db/insecta/prfl/EOG090W00C1.prfl
test-data/funannotate_db/insecta/prfl/EOG090W01M6.prfl
test-data/funannotate_db/insecta/prfl/EOG090W02B6.prfl
test-data/funannotate_db/insecta/prfl/EOG090W02CW.prfl
test-data/funannotate_db/insecta/prfl/EOG090W04UC.prfl
test-data/funannotate_db/insecta/prfl/EOG090W06CL.prfl
test-data/funannotate_db/insecta/prfl/EOG090W06HU.prfl
test-data/funannotate_db/insecta/prfl/EOG090W06OE.prfl
test-data/funannotate_db/insecta/prfl/EOG090W07NX.prfl
test-data/funannotate_db/insecta/prfl/EOG090W08R7.prfl
test-data/funannotate_db/insecta/prfl/EOG090W09HB.prfl
test-data/funannotate_db/insecta/prfl/EOG090W0CIU.prfl
test-data/funannotate_db/insecta/prfl/EOG090W0DGR.prfl
test-data/funannotate_db/insecta/prfl/EOG090W0E07.prfl
test-data/funannotate_db/insecta/prfl/EOG090W0EOF.prfl
test-data/funannotate_db/insecta/prfl/EOG090W0IVU.prfl
test-data/funannotate_db/insecta/prfl/EOG090W0MBV.prfl
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f funannotate_predict.xml
--- a/funannotate_predict.xml Sun Jan 22 17:30:57 2023 +0000
+++ b/funannotate_predict.xml Thu Apr 13 17:16:35 2023 +0000
b
@@ -371,7 +371,7 @@
                 <not_has_text text="Found 16 alignments, wrote GFF3 and Augustus hints to file"/>
                 <not_has_text text="Extracting hints from RNA-seq BAM file using bam2hints"/>
                 <has_text text="Mapping 13 proteins to genome using diamond and exonerate"/>
-                <has_text text="Found 4 preliminary alignments --> aligning with exonerate"/>
+                <has_text text="Found 4 preliminary alignments with diamond"/>
             </assert_stderr>
         </test>
 
@@ -436,7 +436,7 @@
                 <not_has_text text="Found 16 alignments, wrote GFF3 and Augustus hints to file"/>
                 <not_has_text text="Extracting hints from RNA-seq BAM file using bam2hints"/>
                 <has_text text="Mapping 13 proteins to genome using diamond and exonerate"/>
-                <has_text text="Found 4 preliminary alignments --> aligning with exonerate"/>
+                <has_text text="Found 4 preliminary alignments with diamond"/>
             </assert_stderr>
         </test>
 
@@ -509,7 +509,7 @@
                 <has_text text="Found 16 alignments, wrote GFF3 and Augustus hints to file"/>
                 <has_text text="Extracting hints from RNA-seq BAM file using bam2hints"/>
                 <has_text text="Mapping 16 proteins to genome using diamond and exonerate"/>
-                <has_text text="Found 21 preliminary alignments --> aligning with exonerate"/>
+                <has_text text="Found 21 preliminary alignments with diamond"/>
             </assert_stderr>
             <assert_command>
                 <has_text text="--protein_evidence"/>
@@ -583,7 +583,7 @@
                 <not_has_text text="Found 16 alignments, wrote GFF3 and Augustus hints to file"/>
                 <not_has_text text="Extracting hints from RNA-seq BAM file using bam2hints"/>
                 <has_text text="Mapping 16 proteins to genome using diamond and exonerate"/>
-                <has_text text="Found 21 preliminary alignments --> aligning with exonerate"/>
+                <has_text text="Found 21 preliminary alignments with diamond"/>
             </assert_stderr>
             <assert_command>
                 <has_text text="--protein_evidence"/>
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f macros.xml
--- a/macros.xml Sun Jan 22 17:30:57 2023 +0000
+++ b/macros.xml Thu Apr 13 17:16:35 2023 +0000
b
@@ -1,7 +1,7 @@
 <?xml version="1.0"?>
 <macros>
-    <token name="@TOOL_VERSION@">1.8.9</token>
-    <token name="@VERSION_SUFFIX@">3</token>
+    <token name="@TOOL_VERSION@">1.8.15</token>
+    <token name="@VERSION_SUFFIX@">0</token>
 
     <xml name="requirements">
         <requirement type="package" version="@TOOL_VERSION@">funannotate</requirement>
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W00C1.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W00C1.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,4084 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W00C1\n+LENG  1354\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:04:56 2016\n+NSEQ  42\n+EFFN  0.679321\n+CKSUM 1578165604\n+STATS LOCAL MSV      -13.1616  0.69495\n+STATS LOCAL VITERBI  -14.4353  0.69495\n+STATS LOCAL FORWARD   -7.3499  0.69495\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.57441  4.16262  2.99810  2.76343  3.12186  3.07323  3.77318  2.63927  2.72202  2.29429  3.49996  3.17298  3.46979  3.15717  2.99681  2.73779  2.88211  2.52749  4.25091  3.39827\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.18691  3.94363  1.88981  0.61958  0.77255  0.00000        *\n+      1   2.62911  5.02950  2.23384  1.74344  4.30054  3.23321  3.61266  3.74901  2.45053  3.31684  4.14230  2.72854  3.75026  2.76878  2.97863  2.48083  2.93986  3.38757  5.52131  3.88237      1 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03412  3.79084  4.51318  0.61958  0.77255  0.61585  0.77693\n+      2   2.43849  4.61681  2.63603  2.35102  4.06046  3.12134  3.67576  3.47583  2.53742  3.03286  3.92976  2.75939  3.30297  2.85668  2.98387  2.02088  2.75212  3.11813  5.34660  4.02240      2 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03412  3.79084  4.51318  0.61958  0.77255  0.61585  0.77693\n+      3   2.50819  4.48365  2.98156  2.41390  3.80268  3.29727  3.59860  3.02388  2.52519  2.84922  3.71772  3.00896  3.77828  2.90867  2.90855  2.40606  2.16579  2.86980  5.14860  3.86479      3 t - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.07774  3.79084  2.95237  0.61958  0.77255  0.61585  0.77693\n+      4   2.45303  4.37393  3.07931  2.72005  3.70829  3.19950  3.80755  3.07532  2.65557  2.68670  3.75206  3.10400  2.14831  3.06767  2.98981  2.59842  2.66818  2.80090  5.14532  3.67841      4 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.04667  3.74871  3.81451  0.61958  0.77255  0.62985  0.76073\n+      5   2.75504  4.34975  3.79706  3.25081  3.15934  3.77200  4.05264  2.27308  3.08422  1.49815  3.03425  3.60378  3.76830  3.42870  3.36275  3.07338  3.00031  2.21884  4.88384  3.52906      5 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03555  3.75041  4.47276  0.61958  0.77255  0.47303  0.97580\n+      6   2.25342  4.27458  3.16843  2.78774  4.05998  3.04638  3.91183  3.34636  2.80219  3.12786  3.96791  3.02231  3.16694  3.14084  3.16963  1.58118  2.48814  3.02484  5.39240  4.13410      6 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03104  3.88369  4.60603  0.61958  0.77255  0.52553  0.89464\n+      7   2.66779  4.73943  3.05029  2.55470  3.99433  3.42397  3.64278  3.37958  2.28142  2.76413  3.86631  3.02514  3.85273  1.94903 '..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03351  3.80855  4.53090  0.61958  0.77255  0.60255  0.79278\n+   1347   1.78718  4.36979  2.94274  2.64009  4.06671  2.37848  3.83409  3.42660  2.44894  3.11541  3.97246  3.02705  3.70228  3.05479  3.04232  2.50156  2.75898  3.03630  5.37914  4.11032   1369 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03351  3.80855  4.53090  0.61958  0.77255  0.60255  0.79278\n+   1348   3.25348  4.65911  4.13591  3.74882  1.78664  4.05293  3.44366  3.03935  3.62290  2.45193  3.67986  3.77565  4.40523  3.76463  3.78558  3.41116  3.49132  2.94536  3.67172  1.24793   1370 y - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03351  3.80855  4.53090  0.61958  0.77255  0.60255  0.79278\n+   1349   2.66660  4.93953  2.32159  1.68255  4.23414  3.24129  3.64228  3.61752  2.50956  3.25217  4.09859  2.77191  3.76344  2.80723  2.98966  2.60105  2.93387  2.96375  5.48690  4.10293   1371 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.07884  3.80855  2.92561  0.61958  0.77255  0.60255  0.79278\n+   1350   2.55513  4.70512  2.41241  2.30976  4.21639  3.09898  3.72846  3.71655  2.62129  3.33495  4.19107  1.78795  3.52911  2.92777  3.05544  2.47846  2.90213  3.31322  5.49974  4.12160   1372 n - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03503  3.76475  4.48709  0.61958  0.77255  0.57673  0.82492\n+   1351   2.52713  4.62036  2.56122  2.41652  4.10662  3.14853  3.73925  3.57717  2.59682  3.20295  4.06169  2.89157  3.73752  2.66602  3.00490  1.70059  2.86458  3.20147  5.40649  4.06301   1373 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03351  3.80855  4.53090  0.61958  0.77255  0.60255  0.79278\n+   1352   3.04848  4.47189  4.38464  3.83047  3.11050  4.22028  4.54319  2.00917  3.67891  1.20443  2.65686  4.14524  4.49014  3.92405  3.89627  3.54955  3.28587  1.90435  5.09032  3.94632   1374 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03351  3.80855  4.53090  0.61958  0.77255  0.60255  0.79278\n+   1353   2.72695  4.82964  3.03308  2.56132  4.22330  3.39753  3.59981  3.63509  2.06912  3.18733  4.04291  2.74424  3.55341  2.76055  1.68769  2.76304  2.96834  3.30390  5.32788  4.07028   1375 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03351  3.80855  4.53090  0.61958  0.77255  0.60255  0.79278\n+   1354   3.10963  4.51643  4.44664  3.89372  3.06332  4.28824  4.57784  1.92985  3.72053  1.12396  2.63392  4.20864  4.53435  3.96293  3.92409  3.62298  3.34172  2.09521  5.07467  3.92677   1376 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02268  3.79772        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W01M6.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W01M6.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,1321 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W01M6\n+LENG  433\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:16:53 2016\n+NSEQ  42\n+EFFN  0.817749\n+CKSUM 1517915722\n+STATS LOCAL MSV      -11.7026  0.69878\n+STATS LOCAL VITERBI  -12.4285  0.69878\n+STATS LOCAL FORWARD   -6.2533  0.69878\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.64874  4.34739  2.98352  2.65645  3.14500  2.96619  3.72043  2.73609  2.68309  2.41542  3.60690  3.11777  3.42799  3.03591  2.92095  2.69183  2.89496  2.57229  4.49671  3.27303\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.06129  4.04908  3.16980  0.61958  0.77255  0.00000        *\n+      1   2.99274  5.09177  3.40159  2.75925  4.44771  3.64963  3.61478  3.83310  1.82846  3.31408  4.18253  3.17539  4.01658  2.63225  1.30281  3.00178  3.16599  3.52787  5.39574  3.95109      1 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02717  4.01496  4.73730  0.61958  0.77255  0.49600  0.93894\n+      2   3.09259  4.47438  4.59558  4.02195  3.02431  4.29636  4.59996  1.96958  3.90086  1.27647  1.96237  4.27854  4.54463  4.05677  4.05908  3.61501  3.15485  2.21126  5.05857  3.95696      2 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02676  4.03003  4.75237  0.61958  0.77255  0.50611  0.92340\n+      3   2.90822  4.34399  3.90187  3.78087  3.52703  4.08102  4.55961  1.20233  3.69527  2.21790  3.40804  4.06087  4.45939  3.98732  3.94445  3.43195  3.17445  1.59809  5.29076  4.06076      3 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02676  4.03003  4.75237  0.61958  0.77255  0.50611  0.92340\n+      4   2.97332  4.70169  3.59796  3.46161  4.43906  3.38041  4.52404  4.02760  3.53290  3.63629  4.69454  3.75125  0.58063  3.91685  3.75846  3.14630  3.42778  3.65456  5.57990  4.56267      4 P - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02676  4.03003  4.75237  0.61958  0.77255  0.50611  0.92340\n+      5   2.29186  4.22425  3.42579  3.15083  4.18543  3.01052  4.20902  3.53954  3.15355  3.30374  4.19981  3.32764  3.74763  3.49306  3.44945  1.06659  2.68453  2.90158  5.58065  4.31467      5 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02676  4.03003  4.75237  0.61958  0.77255  0.50611  0.92340\n+      6   3.11159  4.65104  4.04171  3.63940  3.16523  4.01857  4.36268  2.48797  3.36516  0.90497  3.15961  3.95399  4.41614  3.48231  3.57004  3.45253  3.38016  2.54465  5.02595  3.74647      6 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02676  4.03003  4.75237  0.61958  0.77255  0.50611  0.92340\n+      7   2.54458  4.34339  2.91937  2.45854  4.08786  3.20552  3.65445  3.50865  2.44550  3.10751  3.91732  2.53639  3.78512  2.80685  '..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02628  4.04778  4.77013  0.61958  0.77255  0.49635  0.93841\n+    426   2.55894  4.14542  3.69639  3.12141  2.63958  3.59921  3.87253  2.37837  2.90589  2.16923  3.25283  3.44670  3.97349  3.15974  3.22053  2.62367  2.75493  2.32656  4.73704  3.16014    431 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02628  4.04778  4.77013  0.61958  0.77255  0.49635  0.93841\n+    427   2.55921  4.74833  2.87125  2.36394  4.04304  1.91156  3.70695  3.16737  2.45040  3.06704  3.91319  2.98250  3.84701  2.75078  2.91826  2.70307  2.90557  3.12369  5.32960  4.01937    432 g - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.04143  4.04778  3.76696  0.61958  0.77255  0.49635  0.93841\n+    428   2.79931  4.24337  4.20599  3.48514  3.41808  3.96864  4.34339  1.55570  3.53651  2.10011  3.33161  3.91999  4.32467  3.81500  3.76746  3.10134  3.04508  1.52243  5.07226  3.86457    433 v - - -\n+          2.68618  4.42208  2.77520  2.73123  3.46354  2.40513  3.72495  3.29354  2.67741  2.69355  4.24690  2.90347  2.73740  3.18146  2.89801  2.37887  2.77520  2.98518  4.58477  3.61503\n+          0.04048  3.47164  4.75538  0.56309  0.84268  0.51199  0.91455\n+    429   2.68305  4.81487  3.13781  2.54430  3.79426  3.49021  3.62089  3.45643  1.83175  3.04450  3.71755  3.03085  3.86880  2.77967  2.03846  2.72553  2.90022  3.07049  5.26264  3.69930    435 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02668  4.03303  4.75538  0.61958  0.77255  0.51199  0.91455\n+    430   1.75213  4.42239  3.27734  2.74457  3.68986  3.41527  3.78451  2.91366  2.67908  2.67746  3.41247  3.17153  3.86464  2.85205  3.05846  2.42970  2.81028  2.75526  5.08698  3.82553    436 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02668  4.03303  4.75538  0.61958  0.77255  0.51199  0.91455\n+    431   2.83104  5.11951  2.92240  2.42867  4.48496  3.51299  3.48461  3.88659  1.91361  3.36989  4.18577  3.00288  3.90690  2.55663  1.61155  2.81100  3.03328  3.52942  5.47900  4.19917    437 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02668  4.03303  4.75538  0.61958  0.77255  0.51199  0.91455\n+    432   2.27231  4.54307  3.08274  2.47455  3.84795  3.23327  3.73904  3.20775  2.59916  2.51551  3.74651  3.06809  2.41509  2.94951  3.01005  2.66174  2.72587  2.91634  5.19570  3.91173    438 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02668  4.03303  4.75538  0.61958  0.77255  0.51199  0.91455\n+    433   2.55221  4.56809  3.04831  2.64140  4.00030  3.30168  3.53618  3.42810  2.58672  3.00053  3.92179  3.07915  1.82207  2.99651  2.89740  2.51926  2.66257  3.09058  5.31364  4.01905    439 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01804  4.02439        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W02B6.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W02B6.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,799 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W02B6\n+LENG  259\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:06:43 2016\n+NSEQ  41\n+EFFN  0.573059\n+CKSUM 71403834\n+STATS LOCAL MSV      -10.7412  0.70258\n+STATS LOCAL VITERBI  -11.8067  0.70258\n+STATS LOCAL FORWARD   -5.3626  0.70258\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.58551  3.95142  2.93538  2.65555  3.19899  2.68147  3.73109  2.86853  2.68910  2.53366  3.70254  2.99935  3.47440  3.10133  3.03761  2.69046  2.91059  2.66720  4.14923  3.24922\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.05385  3.91683  3.42582  0.61958  0.77255  0.00000        *\n+      1   2.57563  4.29816  3.42874  2.87971  3.42655  3.42999  3.78252  2.74851  2.59874  1.89027  3.03797  3.27284  3.91669  3.03711  3.02132  2.66738  2.81332  2.53821  4.87996  3.64362      1 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03073  3.89371  4.61606  0.61958  0.77255  0.50735  0.92153\n+      2   3.28512  4.68059  4.26785  3.98622  0.97760  3.97024  3.88627  2.80601  3.89268  2.17109  3.53292  4.04299  4.42823  4.05476  4.00717  3.55407  3.58620  2.79830  4.12875  2.49298      2 f - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03073  3.89371  4.61606  0.61958  0.77255  0.50735  0.92153\n+      3   2.52699  4.84771  2.60918  2.20896  4.11201  3.28400  3.32154  3.43124  2.30734  3.06800  3.91257  2.76498  3.75293  2.69515  2.74350  2.47454  2.72876  3.13962  5.33073  3.70604      3 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03073  3.89371  4.61606  0.61958  0.77255  0.50735  0.92153\n+      4   2.61780  5.07635  2.30159  2.00832  4.37269  3.15166  3.49552  3.83577  2.16309  3.26651  4.14614  2.55311  3.75789  2.71350  2.87941  2.61338  2.79178  3.44361  5.53209  4.13014      4 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03073  3.89371  4.61606  0.61958  0.77255  0.50735  0.92153\n+      5   3.28512  4.68059  4.26785  3.98622  0.97760  3.97024  3.88627  2.80601  3.89268  2.17109  3.53292  4.04299  4.42823  4.05476  4.00717  3.55407  3.58620  2.79830  4.12875  2.49298      5 f - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03073  3.89371  4.61606  0.61958  0.77255  0.50735  0.92153\n+      6   2.52574  4.29845  3.38725  2.81673  3.43274  3.51672  3.75806  2.58616  2.58097  2.26866  3.07537  3.23232  3.89498  2.82155  3.02013  2.76287  2.69813  2.35902  4.87883  3.64302      6 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03073  3.89371  4.61606  0.61958  0.77255  0.50735  0.92153\n+      7   2.49438  4.59633  3.00250  2.46963  3.79998  3.35856  3.45953  2.94077  2.28801  2.75200  3.68084  2.91052  3.79975  2.75316  2.7'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.04215  3.91412  3.84848  0.61958  0.77255  0.49619  0.93865\n+    252   2.72228  4.85214  3.33547  2.71103  4.17224  3.54395  3.61290  3.51379  1.95762  3.01720  3.79275  3.13151  3.93412  2.77418  1.52439  2.86875  3.02350  3.23081  5.28280  4.05793    253 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03046  3.90243  4.62478  0.61958  0.77255  0.50708  0.92193\n+    253   2.89180  4.31740  4.28033  3.72995  3.07498  4.07258  4.37817  1.89583  3.62162  1.87913  3.17915  4.00435  4.39351  3.87003  3.84989  3.38725  3.13313  1.34821  4.99368  3.51638    254 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03046  3.90243  4.62478  0.61958  0.77255  0.50708  0.92193\n+    254   2.99605  4.54939  3.85523  3.38631  2.26082  3.87705  3.58635  2.81264  3.24695  2.45320  3.57902  3.60461  4.24492  3.30523  3.49280  3.18900  3.23184  2.80947  3.98835  1.38310    255 y - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.04779  3.90243  3.63170  0.61958  0.77255  0.50708  0.92193\n+    255   2.86895  4.79868  3.35393  2.87800  4.27248  3.16102  3.77328  3.75286  2.20798  3.30302  4.22462  3.25529  3.94230  2.97090  1.13271  2.94613  3.14746  3.42765  5.33779  4.16294    256 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03098  3.88563  4.60797  0.61958  0.77255  0.52231  0.89930\n+    256   2.39495  4.29242  3.23272  3.00632  4.01335  1.24309  4.10420  3.13144  3.04981  3.16602  4.12473  3.27155  3.75853  3.41004  3.34616  2.56561  2.84496  3.02378  5.39536  4.12823    257 g - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03098  3.88563  4.60797  0.61958  0.77255  0.52231  0.89930\n+    257   2.85254  5.30913  1.31568  2.03440  4.62051  3.17606  3.72287  4.10485  2.63785  3.65833  4.51978  2.66736  3.79471  2.89706  3.27864  2.66124  3.14816  3.70481  5.83674  4.36108    258 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03098  3.88563  4.60797  0.61958  0.77255  0.52231  0.89930\n+    258   2.57543  4.72763  2.41079  2.35700  4.35200  1.79355  3.80871  3.83835  2.74701  3.44104  4.28482  2.23390  3.74808  3.00510  3.21046  2.61543  2.93841  3.40418  5.61727  4.25444    259 g - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03098  3.88563  4.60797  0.61958  0.77255  0.52231  0.89930\n+    259   2.37183  4.27895  3.26612  2.85389  3.88471  3.15333  3.90665  3.14295  2.68120  2.92493  3.81418  3.18256  3.75809  3.16151  3.11452  2.30927  1.70984  2.64002  5.26583  4.01708    260 t - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02096  3.87561        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W02CW.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W02CW.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,934 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W02CW\n+LENG  304\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:02:17 2016\n+NSEQ  42\n+EFFN  0.612671\n+CKSUM 955681691\n+STATS LOCAL MSV      -11.4617  0.70115\n+STATS LOCAL VITERBI  -11.9236  0.70115\n+STATS LOCAL FORWARD   -4.9460  0.70115\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.59865  4.32362  2.92347  2.71276  3.28259  2.77543  3.65001  2.84542  2.60536  2.37332  3.59908  3.17474  3.50206  3.05463  2.76450  2.74314  2.97461  2.60191  4.47674  3.47706\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.10081  3.94306  2.57042  0.61958  0.77255  0.00000        *\n+      1   2.35557  4.29472  3.19763  2.84224  3.88559  3.09543  3.91480  3.31420  2.79125  3.04108  3.56516  3.05924  3.73536  3.17891  3.12118  1.44315  2.75694  2.94505  5.27902  3.96543      1 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03136  3.87362  4.59596  0.61958  0.77255  0.54943  0.86104\n+      2   2.56222  4.93545  2.48547  1.53546  4.24250  3.27700  3.67324  3.58742  2.50194  3.24171  3.90393  2.82409  3.79767  2.83943  2.95126  2.69128  2.96218  3.25991  5.49628  4.12507      2 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03136  3.87362  4.59596  0.61958  0.77255  0.54943  0.86104\n+      3   2.99070  5.11937  0.91641  2.33541  4.49650  3.21142  3.93186  4.08490  3.01617  3.69299  4.67105  2.89187  3.86428  3.17096  3.53260  2.95288  3.32927  3.72394  5.66490  4.36911      3 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03136  3.87362  4.59596  0.61958  0.77255  0.54943  0.86104\n+      4   3.15648  4.61836  4.19136  3.83114  3.13602  3.98365  4.48651  2.34004  3.59888  0.87378  3.15847  4.10651  4.41876  3.96694  3.77479  3.55454  3.45065  2.37769  5.01580  3.73941      4 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03136  3.87362  4.59596  0.61958  0.77255  0.54943  0.86104\n+      5   3.15648  4.61836  4.19136  3.83114  3.13602  3.98365  4.48651  2.34004  3.59888  0.87378  3.15847  4.10651  4.41876  3.96694  3.77479  3.55454  3.45065  2.37769  5.01580  3.73941      5 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03136  3.87362  4.59596  0.61958  0.77255  0.54943  0.86104\n+      6   2.88150  4.86740  2.90352  2.65818  4.03614  3.36669  3.81653  3.66699  2.47887  3.16924  4.19698  3.11796  3.92011  1.23200  2.76306  2.92916  3.17843  3.39657  5.30791  4.00170      6 q - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03136  3.87362  4.59596  0.61958  0.77255  0.54943  0.86104\n+      7   2.19930  4.30360  3.15462  2.93901  4.10942  3.03826  4.08460  3.44832  2.99567  3.16960  4.13205  3.22489  1.40669  3.36265  3.'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03221  3.84729  4.56964  0.61958  0.77255  0.55175  0.85788\n+    297   2.68949  4.34463  3.62863  3.06645  3.34280  3.69463  3.95942  2.32509  2.93148  1.97487  3.17913  3.45835  4.05972  2.74751  3.24757  2.96678  2.92553  1.91454  4.95587  3.73141    297 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03221  3.84729  4.56964  0.61958  0.77255  0.55175  0.85788\n+    298   3.03374  4.42596  4.46767  3.93972  3.21929  4.23727  4.62910  1.36024  3.77485  1.69960  2.54182  4.21800  4.53431  4.04124  3.97796  3.59172  3.28311  1.87773  5.17235  3.99921    298 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03221  3.84729  4.56964  0.61958  0.77255  0.55175  0.85788\n+    299   2.96308  5.08661  0.95484  2.32029  4.46038  3.19207  3.90968  4.04294  2.98917  3.65590  4.63377  2.87526  3.84312  3.14901  3.50171  2.92851  3.30123  3.68492  5.63386  4.33785    299 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03221  3.84729  4.56964  0.61958  0.77255  0.55175  0.85788\n+    300   2.96308  5.08661  0.95484  2.32029  4.46038  3.19207  3.90968  4.04294  2.98917  3.65590  4.63377  2.87526  3.84312  3.14901  3.50171  2.92851  3.30123  3.68492  5.63386  4.33785    300 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03221  3.84729  4.56964  0.61958  0.77255  0.55175  0.85788\n+    301   2.86927  5.37796  1.57081  1.58824  4.66400  3.16503  3.70363  4.16174  2.70706  3.69223  4.55352  2.64091  3.78111  2.87391  3.28282  2.76564  3.15740  3.75564  5.85198  4.37248    301 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03221  3.84729  4.56964  0.61958  0.77255  0.55175  0.85788\n+    302   2.70309  4.69830  2.69534  2.57844  4.05793  3.16750  3.90157  3.76319  2.80333  3.41302  4.36866  1.20343  3.81828  3.17454  3.15690  2.77141  3.08429  3.38794  5.36678  4.00828    302 n - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03221  3.84729  4.56964  0.61958  0.77255  0.55175  0.85788\n+    303   2.59653  4.29323  4.15219  3.68818  3.52695  3.83220  4.51291  1.88381  3.55248  2.14129  3.39925  3.93128  4.30928  3.88987  3.80505  3.22122  3.08690  1.22269  5.32169  4.08447    303 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03221  3.84729  4.56964  0.61958  0.77255  0.55175  0.85788\n+    304   2.30315  4.22304  3.18507  3.00000  4.05139  2.95342  4.11039  3.57074  3.07206  3.29304  4.22146  3.22860  3.69021  3.42341  3.35865  1.12966  2.78146  3.11137  5.42596  4.13486    304 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02180  3.83687        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W04UC.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W04UC.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,1129 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W04UC\n+LENG  369\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:07:47 2016\n+NSEQ  42\n+EFFN  0.443481\n+CKSUM 170555600\n+STATS LOCAL MSV      -11.2713  0.69978\n+STATS LOCAL VITERBI  -12.3283  0.69978\n+STATS LOCAL FORWARD   -5.7536  0.69978\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.60051  4.05562  2.90441  2.79768  3.08045  2.77920  3.55934  2.78516  2.81025  2.41855  3.62471  3.09461  3.33994  3.22268  3.06952  2.70345  2.92429  2.55458  4.70343  3.12090\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.04083  3.82855  4.00248  0.61958  0.77255  0.00000        *\n+      1   2.76756  4.32554  4.05291  3.71545  3.51346  3.66934  4.52645  2.05651  3.58240  2.21023  3.48752  3.91327  4.23345  3.94639  3.79969  3.17043  3.13084  1.09282  5.28881  4.01675      1 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03309  3.82081  4.54315  0.61958  0.77255  0.49248  0.94445\n+      2   2.25729  4.30656  3.23421  2.78256  3.22793  3.26075  3.79747  2.99870  2.76328  2.72160  3.63924  3.15826  3.79182  3.09658  3.12698  1.86250  2.75869  2.72140  4.99482  3.51028      2 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03309  3.82081  4.54315  0.61958  0.77255  0.49248  0.94445\n+      3   3.17437  4.68428  3.76277  3.48336  2.29772  3.77057  3.59738  3.19097  3.34237  2.65801  3.87166  3.66117  4.24608  3.66082  3.53629  3.31589  3.46107  3.05922  3.93918  1.05625      3 y - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03309  3.82081  4.54315  0.61958  0.77255  0.49248  0.94445\n+      4   2.66097  4.42738  3.94606  3.58114  1.47146  3.73176  3.93337  2.54648  3.50029  2.06955  3.35070  3.75822  4.21413  3.74292  3.70618  3.15795  3.18490  2.47569  4.36458  2.79775      4 f - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03309  3.82081  4.54315  0.61958  0.77255  0.49248  0.94445\n+      5   3.27992  4.66981  4.17848  3.79374  1.73939  4.07994  3.44095  3.05466  3.66683  2.45979  3.69015  3.79922  4.42680  3.79300  3.81949  3.43694  3.51569  2.96273  3.65885  1.24017      5 y - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03309  3.82081  4.54315  0.61958  0.77255  0.49248  0.94445\n+      6   2.50783  4.06219  2.64489  2.40708  4.03475  3.23700  3.65926  3.46162  2.49744  3.08273  3.91169  2.14579  3.73822  2.77243  2.94060  2.37612  2.79729  3.11075  5.31881  3.98749      6 n - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03309  3.82081  4.54315  0.61958  0.77255  0.49248  0.94445\n+      7   2.24564  4.39159  2.90457  2.62505  4.04043  2.86201  3.61183  3.48392  2.70096  3.13638  3.99576  3.01901  1.96306  3.06297  3'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03329  3.81507  4.53741  0.61958  0.77255  0.49740  0.93677\n+    362   2.89657  4.34002  4.33540  3.86273  3.43409  4.04249  4.64277  1.70131  3.72059  2.00918  3.30382  4.11271  4.45492  4.04177  3.95704  3.43375  3.19082  1.20150  5.32051  4.07504    362 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03329  3.81507  4.53741  0.61958  0.77255  0.49740  0.93677\n+    363   2.83261  5.18882  2.09783  1.32798  4.49241  3.18246  3.70804  3.95203  2.65147  3.53766  4.42002  2.70351  3.78384  2.88868  3.15837  2.76639  3.12143  3.58451  5.69627  4.28281    363 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03329  3.81507  4.53741  0.61958  0.77255  0.49740  0.93677\n+    364   2.12952  4.40848  2.93902  2.62267  4.04684  3.11452  3.81059  3.40224  2.49786  3.08898  3.95484  3.02254  2.15104  3.02656  2.99350  2.48412  2.77720  3.02948  5.36130  4.08386    364 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03329  3.81507  4.53741  0.61958  0.77255  0.49740  0.93677\n+    365   2.22784  4.64487  2.89320  2.45699  4.05088  3.19517  3.64426  3.44617  2.02999  3.06441  3.89730  2.77162  3.41346  2.81515  2.78575  2.59254  2.74884  3.04422  5.30201  3.99898    365 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03329  3.81507  4.53741  0.61958  0.77255  0.49740  0.93677\n+    366   2.55256  4.59631  2.76318  2.52687  3.90914  3.17834  3.76371  3.46646  2.58622  3.15645  3.85746  1.66698  3.77587  2.99977  2.94417  2.59089  2.90158  3.12277  5.28065  3.87771    366 n - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03329  3.81507  4.53741  0.61958  0.77255  0.49740  0.93677\n+    367   2.90522  5.00113  2.46727  1.11001  4.34053  3.23867  3.82214  3.78306  2.69558  3.41004  4.38792  2.90405  3.84092  3.03986  3.09745  2.89431  3.20947  3.47334  5.52306  4.24672    367 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03329  3.81507  4.53741  0.61958  0.77255  0.49740  0.93677\n+    368   3.25513  4.62909  4.23937  3.85121  1.29318  4.09308  3.49584  2.93028  3.72181  2.30942  3.56696  3.84598  4.43324  3.83335  3.85715  3.45289  3.49099  2.86788  3.71009  1.77181    368 f - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03329  3.81507  4.53741  0.61958  0.77255  0.49740  0.93677\n+    369   3.25721  4.66570  4.13098  3.74599  1.81001  4.05255  3.44699  3.04758  3.61945  2.46129  3.68955  3.77574  4.40704  3.76496  3.78364  3.41279  3.49599  2.95277  3.67635  1.22702    369 y - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02253  3.80431        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W06CL.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W06CL.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,886 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W06CL\n+LENG  288\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:05:51 2016\n+NSEQ  41\n+EFFN  0.858337\n+CKSUM 1720946982\n+STATS LOCAL MSV      -10.9811  0.70162\n+STATS LOCAL VITERBI  -11.8379  0.70162\n+STATS LOCAL FORWARD   -5.5881  0.70162\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.61753  4.04645  3.15863  2.73171  3.16702  3.19559  3.69289  2.64376  2.74411  2.33857  3.58831  3.17207  3.20968  3.10720  3.00118  2.70592  2.76070  2.48372  4.43931  3.42879\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.04574  4.06079  3.59464  0.61958  0.77255  0.00000        *\n+      1   3.10981  4.63359  4.23476  3.84405  3.29252  3.96224  4.54017  2.48548  3.60195  1.86439  1.08751  4.09974  4.42645  3.97425  3.78680  3.47514  3.41985  2.51057  5.15408  3.92927      1 m - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02645  4.04150  4.76385  0.61958  0.77255  0.50660  0.92266\n+      2   3.19211  4.51590  4.78050  4.26748  3.05949  4.48093  4.83165  1.07047  4.13244  1.72918  3.17306  4.49829  4.74370  4.34191  4.30224  3.85076  3.43940  1.84939  5.23419  3.97542      2 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02645  4.04150  4.76385  0.61958  0.77255  0.50660  0.92266\n+      3   2.91714  5.38936  2.11318  1.14636  4.69931  3.25984  3.77880  4.18666  2.74180  3.72557  4.57777  2.74555  3.86482  2.94610  3.28751  2.73065  3.20499  3.78233  5.89247  4.42366      3 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02645  4.04150  4.76385  0.61958  0.77255  0.50660  0.92266\n+      4   3.03423  4.42875  4.80618  4.28130  3.49737  4.47157  4.96105  1.18069  4.16726  1.83128  3.29963  4.51322  4.74980  4.40543  4.35651  3.83719  3.36939  1.46582  5.45725  4.28251      4 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02645  4.04150  4.76385  0.61958  0.77255  0.50660  0.92266\n+      5   2.56296  4.77906  2.89850  2.43626  4.04409  3.40031  3.62834  3.37994  2.24585  3.06019  3.87751  2.81546  3.80779  2.74094  2.76577  2.39483  2.14824  3.08322  5.30058  3.97283      5 t - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02645  4.04150  4.76385  0.61958  0.77255  0.50660  0.92266\n+      6   0.95678  4.20526  3.67847  3.41066  4.09347  3.07992  4.37649  3.13401  3.37735  3.05737  4.07942  3.49944  3.82532  3.70361  3.62925  2.55531  2.82454  2.67221  5.58723  4.35795      6 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02645  4.04150  4.76385  0.61958  0.77255  0.50660  0.92266\n+      7   2.95841  5.13032  3.22273  2.67758  4.55993  3.58718  3.63425  3.93858  1.20293  3.41027  4.26019  2.94602  3.99001  2.77094  2'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02513  4.09193  4.81428  0.61958  0.77255  0.50576  0.92394\n+    281   3.18281  4.46400  4.95398  4.43523  3.54302  4.59037  5.10053  1.19078  4.32711  1.85851  3.33524  4.65262  4.84696  4.55240  4.50242  3.96721  3.43389  1.31901  5.54085  4.36499    283 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02513  4.09193  4.81428  0.61958  0.77255  0.50576  0.92394\n+    282   2.60692  5.01807  2.94034  2.39203  4.33316  3.42648  3.07643  3.77183  2.02698  3.29410  4.07696  2.70731  3.81977  2.33719  2.51894  2.59697  2.52383  3.39489  5.45443  4.10371    284 k - - -\n+          2.68614  4.42225  2.77520  2.73123  3.46354  2.40513  3.72495  3.29354  2.67741  2.69355  4.24690  2.90347  2.73740  3.18146  2.89801  2.37887  2.77520  2.98518  4.58477  3.61503\n+          0.04031  3.46099  4.81428  0.55464  0.85397  0.50576  0.92394\n+    283   3.24128  4.54389  4.90725  4.39054  3.38468  4.58002  5.02129  1.07847  4.23685  1.58278  3.19896  4.62532  4.82728  4.45924  4.39995  3.95995  3.48982  1.77762  5.42054  4.25040    286 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02513  4.09193  4.81428  0.61958  0.77255  0.50576  0.92394\n+    284   3.45407  4.84059  4.32542  3.90811  1.84015  4.24835  2.66412  3.40230  3.77598  2.64543  3.97515  3.90240  4.57391  3.89322  3.93864  3.56926  3.67336  3.25812  3.71823  1.04470    287 y - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02513  4.09193  4.81428  0.61958  0.77255  0.50576  0.92394\n+    285   2.09980  4.29816  3.32746  3.00342  4.30311  3.05112  4.13214  3.70000  3.05959  3.37928  4.20816  3.26123  1.59195  3.37140  3.41124  1.92597  2.66897  3.20150  5.62932  4.38955    288 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02513  4.09193  4.81428  0.61958  0.77255  0.50576  0.92394\n+    286   1.90896  4.20989  3.54911  3.19585  4.20963  3.03827  4.22013  3.52525  3.19270  3.28184  4.13273  3.36322  3.75956  3.49737  3.50523  2.07725  1.35091  3.06394  5.57967  4.36808    289 t - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02513  4.09193  4.81428  0.61958  0.77255  0.50576  0.92394\n+    287   2.40894  4.35769  3.40750  2.84606  3.52338  3.54694  3.81847  2.60986  2.79726  2.26730  3.29937  2.67864  3.93761  3.11672  3.16682  2.79476  2.29316  2.48906  4.96665  3.72263    290 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02513  4.09193  4.81428  0.61958  0.77255  0.50576  0.92394\n+    288   2.43194  4.35496  3.46257  3.01310  3.89035  3.29079  4.03812  2.83216  2.94091  2.85074  3.81103  3.33284  1.58849  3.30077  3.28019  2.66481  2.59961  2.63176  5.33350  4.08739    291 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01699  4.08379        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W06HU.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W06HU.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,1024 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W06HU\n+LENG  334\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:01:40 2016\n+NSEQ  41\n+EFFN  0.663147\n+CKSUM 2945484408\n+STATS LOCAL MSV      -10.8149  0.70043\n+STATS LOCAL VITERBI  -12.0742  0.70043\n+STATS LOCAL FORWARD   -5.4175  0.70043\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.63031  4.47982  2.79854  2.52974  3.24472  3.19301  3.71740  2.84057  2.58980  2.52570  3.68457  3.08117  3.29060  3.05690  2.80023  2.70795  2.87610  2.63826  4.71613  3.25094\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.15217  3.98708  2.09876  0.61958  0.77255  0.00000        *\n+      1   2.66832  4.35615  3.64662  3.20149  3.36774  3.53917  4.06915  2.59203  3.03439  2.13150  1.72249  3.52005  3.38042  3.42122  3.30239  2.92926  2.97616  2.48604  5.01745  3.78143      1 m - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03159  3.86650  4.58884  0.61958  0.77255  0.59581  0.80099\n+      2   1.92729  4.24641  3.31164  2.86160  3.84623  3.14054  3.90715  2.95833  2.82152  2.87610  3.77160  3.18542  2.32168  3.16267  3.17665  2.44399  2.71592  2.64738  5.24420  3.99424      2 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03159  3.86650  4.58884  0.61958  0.77255  0.59581  0.80099\n+      3   2.74355  4.50190  3.35008  3.18824  4.18395  3.18975  4.26620  3.72782  3.24503  3.35531  4.40490  3.49555  0.83881  3.63400  3.49125  2.91085  3.18465  3.37387  5.37215  4.30453      3 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03159  3.86650  4.58884  0.61958  0.77255  0.59581  0.80099\n+      4   2.40950  4.25456  3.42279  3.17451  3.96360  3.09404  4.19229  3.09000  3.11737  2.95371  4.00461  3.38485  3.79732  3.51249  3.37635  2.61070  1.18207  2.78562  5.40193  4.18023      4 t - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03159  3.86650  4.58884  0.61958  0.77255  0.59581  0.80099\n+      5   3.00478  4.38062  4.54528  4.05830  3.42418  4.24293  4.79787  1.24775  3.92306  1.93576  3.25876  4.30322  4.59359  4.21091  4.13789  3.63000  3.28001  1.48578  5.37263  4.15888      5 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03159  3.86650  4.58884  0.61958  0.77255  0.52405  0.89678\n+      6   2.74493  5.11509  2.26624  1.52551  4.37159  3.27806  3.65344  3.82063  2.50850  3.06571  4.21808  2.76627  3.79751  2.73233  2.99730  2.70241  3.00090  3.45979  5.58384  4.17649      6 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03005  3.91569  4.63804  0.61958  0.77255  0.55394  0.85491\n+      7   2.60258  4.19140  3.19038  2.58983  4.13934  3.46125  3.60690  3.51353  1.81406  3.09578  3.93737  3.04717  3.86196  2.76192  '..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03089  3.88858  4.61093  0.61958  0.77255  0.56841  0.83569\n+    327   2.48944  4.43102  3.09193  2.75296  3.78634  3.20988  3.59700  3.30513  2.70249  2.95587  3.89188  3.13303  1.75399  3.11415  3.03647  2.62394  2.84808  2.76384  5.19486  3.85305    329 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03089  3.88858  4.61093  0.61958  0.77255  0.56841  0.83569\n+    328   2.12764  4.42872  3.03425  2.66101  3.92205  3.18896  3.45835  3.34706  2.65613  3.00940  3.88154  3.06641  2.08208  3.03337  3.02585  2.56815  2.79248  2.93121  5.27253  3.97494    330 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03089  3.88858  4.61093  0.61958  0.77255  0.56841  0.83569\n+    329   2.46471  4.07375  3.06072  2.59933  3.90224  2.11908  3.73240  3.19026  2.56496  2.96251  3.81029  2.73601  3.76490  2.71767  2.95849  2.57287  2.77334  2.97466  5.22900  3.93889    331 g - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03089  3.88858  4.61093  0.61958  0.77255  0.56841  0.83569\n+    330   2.80101  5.24208  1.97452  1.44647  4.52988  3.21549  3.68531  3.98370  2.61745  3.54603  4.39104  2.70041  3.78984  2.84603  3.15226  2.72956  3.07674  3.44418  5.73437  4.28559    332 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03089  3.88858  4.61093  0.61958  0.77255  0.54797  0.86305\n+    331   2.83789  5.33712  1.95196  1.41332  4.62636  3.20897  3.68944  4.11192  2.55869  3.63394  4.47043  2.67763  3.79476  2.84863  3.17939  2.67787  3.11334  3.70718  5.80633  4.34010    333 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03047  3.90218  4.62453  0.61958  0.77255  0.55664  0.85128\n+    332   2.69087  5.21194  1.84664  1.63227  4.50161  3.23437  3.66546  3.75115  2.57386  3.50539  4.33383  2.71405  3.78485  2.81752  3.10594  2.70308  3.03472  3.56132  5.69787  4.25690    334 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03047  3.90218  4.62453  0.61958  0.77255  0.55664  0.85128\n+    333   2.82042  5.27238  1.96160  1.42217  4.54654  3.22268  3.69152  4.01345  2.62453  3.41485  4.41338  2.70311  3.79827  2.85273  3.15952  2.74403  3.09452  3.62800  5.74655  4.29565    335 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03047  3.90218  4.62453  0.61958  0.77255  0.55664  0.85128\n+    334   2.64628  5.04557  2.30949  1.54019  4.32335  3.27746  3.65448  3.59114  2.50907  3.22767  4.16828  2.78206  3.79157  2.80941  2.99628  2.68478  2.97214  3.36960  5.55179  4.15383    336 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02061  3.89233        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W06OE.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W06OE.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,1006 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W06OE\n+LENG  328\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:05:48 2016\n+NSEQ  42\n+EFFN  0.515259\n+CKSUM 4035949497\n+STATS LOCAL MSV      -11.1747  0.70061\n+STATS LOCAL VITERBI  -11.8897  0.70061\n+STATS LOCAL FORWARD   -5.4671  0.70061\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.53280  4.21132  2.88026  2.65781  3.29259  2.95408  3.81492  2.77567  2.75151  2.41709  3.65418  3.04753  3.29178  3.11705  2.87688  2.66825  2.87156  2.58939  4.63567  3.47445\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.08261  3.88316  2.83526  0.61958  0.77255  0.00000        *\n+      1   2.93920  4.49442  4.00763  3.59867  3.19191  3.80484  4.34292  2.36364  3.36868  1.79301  1.45527  3.88084  4.26570  3.75344  3.57850  3.28396  3.24399  2.36507  5.02718  3.78518      1 m - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03268  3.83323  4.55558  0.61958  0.77255  0.52974  0.88858\n+      2   1.32562  4.08881  3.31778  3.06494  4.10491  2.88832  4.13058  3.39004  3.10682  3.19213  4.07742  3.22812  3.63208  3.42187  3.39859  1.99615  2.65156  2.93336  5.49334  4.26175      2 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03268  3.83323  4.55558  0.61958  0.77255  0.52974  0.88858\n+      3   3.08726  4.48401  4.48146  3.94881  3.14474  4.28155  4.63760  1.79098  3.78462  1.18394  2.98597  4.24309  4.55760  4.03604  3.98893  3.63294  3.33306  1.88417  5.14300  3.96959      3 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03268  3.83323  4.55558  0.61958  0.77255  0.52974  0.88858\n+      4   2.91261  5.02058  3.24448  2.65988  4.40325  3.55125  3.55547  3.77445  1.78955  3.25883  4.12780  3.08476  3.93677  2.45174  1.54332  2.91993  3.09507  3.46445  5.35088  4.14913      4 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03268  3.83323  4.55558  0.61958  0.77255  0.52974  0.88858\n+      5   2.39279  4.23756  3.39442  3.14538  3.93534  3.07793  4.16555  3.05773  3.08757  2.92259  3.97618  3.36061  3.77884  3.48453  3.34775  2.59369  1.24022  2.75691  5.37663  4.15216      5 t - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03268  3.83323  4.55558  0.61958  0.77255  0.52974  0.88858\n+      6   3.24711  4.68364  4.06653  3.69391  1.93421  4.01960  3.46898  3.07151  3.56283  2.49801  3.72552  3.75491  4.39260  3.74248  3.74010  3.39540  3.49376  2.97063  3.71522  1.16348      6 y - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03268  3.83323  4.55558  0.61958  0.77255  0.52974  0.88858\n+      7   2.61789  4.39646  3.28355  3.17836  4.31997  0.79231  4.30043  3.91061  3.35422  3.56954  4.54548  3.44802  3.78633  3.68159  '..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03337  3.81249  4.53483  0.61958  0.77255  0.54684  0.86459\n+    321   2.94005  4.78087  3.42481  2.95019  4.12027  3.43787  3.78477  3.65890  2.21901  3.18587  4.18887  3.31389  3.94450  3.00918  1.07425  3.02785  3.21084  3.38576  5.22841  4.06193    323 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03337  3.81249  4.53483  0.61958  0.77255  0.54684  0.86459\n+    322   2.78150  4.36743  3.80905  3.15743  3.24953  3.79043  4.11700  2.18465  3.10360  1.91677  1.96643  3.64133  4.16808  3.47401  3.37107  3.11257  3.03242  2.21898  4.97925  3.76254    324 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03337  3.81249  4.53483  0.61958  0.77255  0.54684  0.86459\n+    323   2.88081  4.86310  3.27884  2.75819  4.03236  3.49009  3.37723  3.66585  2.03082  3.17179  4.09580  3.15414  3.93349  2.81824  1.35806  2.92933  3.10723  3.37348  5.18398  3.90214    325 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03337  3.81249  4.53483  0.61958  0.77255  0.54684  0.86459\n+    324   2.87740  4.86209  3.21296  2.62034  4.22148  3.46288  3.65494  3.64103  2.06161  3.18870  4.11769  3.14358  3.92284  2.83482  1.33342  2.92717  3.11194  3.35014  5.29589  4.08996    326 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03337  3.81249  4.53483  0.61958  0.77255  0.53183  0.88559\n+    325   3.08478  4.55133  4.27027  3.81128  3.05380  4.11507  4.47013  2.08774  3.56432  1.04741  3.01389  4.09739  4.46780  3.90699  3.76348  3.52472  3.35429  2.17353  5.00429  3.72314    327 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03301  3.82325  4.54560  0.61958  0.77255  0.53805  0.87680\n+    326   1.34269  4.19846  3.47430  3.14345  3.40325  3.13812  4.10996  2.81685  3.11878  2.67982  3.75194  3.36541  3.80337  3.45073  3.41033  2.58669  2.79414  2.56102  5.21829  3.91412    328 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03301  3.82325  4.54560  0.61958  0.77255  0.53805  0.87680\n+    327   2.55893  4.62827  2.60101  2.46693  4.08551  3.09997  3.81758  3.71165  2.69548  3.36926  4.26923  1.51117  3.75254  3.05656  3.07077  2.52248  2.94259  3.30516  5.42443  4.01949    329 n - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03301  3.82325  4.54560  0.61958  0.77255  0.53805  0.87680\n+    328   2.39904  4.28648  3.26107  2.93909  3.90566  3.11537  3.97581  3.14500  2.79431  2.92252  3.90231  3.22946  3.76496  3.24867  2.91649  2.57341  1.47200  2.83062  5.30729  4.05471    330 t - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02234  3.81258        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W07NX.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W07NX.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,766 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W07NX\n+LENG  248\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:06:01 2016\n+NSEQ  41\n+EFFN  0.573059\n+CKSUM 3514167566\n+STATS LOCAL MSV      -10.8240  0.70299\n+STATS LOCAL VITERBI  -11.6806  0.70299\n+STATS LOCAL FORWARD   -5.0886  0.70299\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.60313  4.37196  3.01014  2.72928  3.10909  2.88768  3.58848  2.82785  2.74596  2.41420  3.69554  3.21181  3.31694  3.12638  2.84641  2.67578  2.83774  2.58052  4.29270  3.27269\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03992  3.92507  3.94280  0.61958  0.77255  0.00000        *\n+      1   2.91061  5.00125  3.38240  2.72048  4.36052  3.59601  3.58290  3.56424  1.65099  3.16294  4.10010  3.13741  3.96454  2.72738  1.55148  2.93085  3.09333  3.41531  5.34487  4.13946      1 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03006  3.91522  4.63756  0.61958  0.77255  0.47993  0.96450\n+      2   3.19055  4.61459  4.46602  3.98945  3.07618  4.27425  4.61488  2.07550  3.74977  0.93264  2.99065  4.26791  4.58510  4.04956  3.93075  3.67699  3.44957  2.20665  5.07680  3.83710      2 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02977  3.92507  4.64742  0.61958  0.77255  0.48576  0.95510\n+      3   1.55569  4.25328  3.77152  3.30242  3.63320  3.45289  4.21115  2.14909  3.21200  2.43569  3.54099  3.56406  4.01341  3.54065  3.51029  2.83185  2.89773  2.07150  5.24671  4.01545      3 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02977  3.92507  4.64742  0.61958  0.77255  0.48576  0.95510\n+      4   2.74672  4.96378  2.50073  1.38447  4.35527  3.26183  3.75089  3.68038  2.58355  3.34495  4.24013  2.85545  3.82985  2.92714  3.01508  2.74691  2.63171  3.34490  5.59986  4.23534      4 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02977  3.92507  4.64742  0.61958  0.77255  0.48576  0.95510\n+      5   2.92753  4.37606  4.35966  3.85886  3.39618  4.06680  4.60027  1.93543  3.70358  1.96609  2.78599  4.11245  4.45792  4.00952  3.92947  3.43920  3.20915  1.17812  5.26334  4.05100      5 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02977  3.92507  4.64742  0.61958  0.77255  0.48576  0.95510\n+      6   1.96352  4.20608  3.21750  3.05023  4.31965  1.24616  4.21510  3.69015  3.20854  3.43261  4.30821  3.25514  3.69174  3.50237  3.50919  2.44427  2.76621  3.17192  5.64406  4.43956      6 g - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02977  3.92507  4.64742  0.61958  0.77255  0.48576  0.95510\n+      7   2.89161  5.08227  3.18026  2.61094  4.48827  3.54332  3.57708  3.86753  1.55425  3.34199  4.18492  2.69780  3.93299  2.71081  1'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03028  3.90810  4.63044  0.61958  0.77255  0.49268  0.94414\n+    241   2.79843  4.55009  3.40941  3.25341  4.24591  3.23557  4.32812  3.80026  3.31372  3.42333  4.47455  3.55663  0.76399  3.70142  3.55540  2.96699  3.24275  3.44160  5.42291  4.36699    245 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03028  3.90810  4.63044  0.61958  0.77255  0.49268  0.94414\n+    242   2.79843  4.55009  3.40941  3.25341  4.24591  3.23557  4.32812  3.80026  3.31372  3.42333  4.47455  3.55663  0.76399  3.70142  3.55540  2.96699  3.24275  3.44160  5.42291  4.36699    246 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03028  3.90810  4.63044  0.61958  0.77255  0.49268  0.94414\n+    243   3.30348  4.69474  4.28756  4.00868  0.95519  3.98521  3.89275  2.82262  3.91477  2.18439  3.54741  4.05923  4.44289  4.07290  4.02571  3.57168  3.60457  2.81596  4.13100  2.49344    247 f - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03028  3.90810  4.63044  0.61958  0.77255  0.49268  0.94414\n+    244   2.07430  4.17351  3.24977  3.03077  4.19574  2.92555  4.14861  3.57668  3.10417  3.32498  4.20575  3.22863  3.67255  3.42932  3.40523  1.19096  2.71628  3.08462  5.56731  4.30854    248 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03028  3.90810  4.63044  0.61958  0.77255  0.49268  0.94414\n+    245   3.19505  4.64665  4.24672  3.88655  3.14904  4.02747  4.53110  2.35484  3.65395  0.83256  3.16054  4.15859  4.45658  4.01376  3.82427  3.60222  3.48761  2.40145  5.04145  3.77305    249 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03028  3.90810  4.63044  0.61958  0.77255  0.49268  0.94414\n+    246   2.98262  5.10141  2.50220  0.97579  4.45204  3.29680  3.88643  3.91300  2.77142  3.52431  4.49656  2.95270  3.90301  3.10122  3.18410  2.96127  3.28706  3.59309  5.61690  4.33892    250 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03028  3.90810  4.63044  0.61958  0.77255  0.49268  0.94414\n+    247   2.33232  4.25329  3.23715  3.05436  4.11166  2.98250  4.16333  3.63899  3.13052  3.35640  4.27938  3.27359  3.72420  3.47702  3.41561  1.03861  2.81508  3.16630  5.48126  4.19532    251 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03028  3.90810  4.63044  0.61958  0.77255  0.49268  0.94414\n+    248   2.59291  4.86673  3.04888  2.65111  4.31784  3.41353  3.70234  3.63149  1.28118  3.24824  4.16102  3.08654  3.90981  2.87081  2.43884  2.84731  3.06866  3.31808  5.42867  4.18251    252 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02048  3.89830        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W08R7.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W08R7.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,1048 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W08R7\n+LENG  342\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:10:44 2016\n+NSEQ  42\n+EFFN  1.653442\n+CKSUM 4217172673\n+STATS LOCAL MSV      -11.2894  0.70029\n+STATS LOCAL VITERBI  -11.9277  0.70029\n+STATS LOCAL FORWARD   -5.5782  0.70029\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.52492  3.93388  3.08871  2.69483  3.37394  2.92621  3.80731  2.70456  2.60624  2.45509  3.58533  3.05410  3.44016  3.13165  2.97679  2.71989  2.79768  2.54632  4.49833  3.41916\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.32000  4.47246  1.33775  0.61958  0.77255  0.00000        *\n+      1   2.94737  4.59816  3.79259  3.35043  3.39494  3.82862  4.17955  2.73344  3.06267  2.10634  1.28051  3.69552  4.25919  3.06063  3.30313  3.21115  3.21519  2.69741  5.09529  3.84607      1 m - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02309  4.17555  4.89789  0.61958  0.77255  0.78841  0.60618\n+      2   1.95856  4.83771  3.00999  2.23743  4.09098  3.26112  3.65209  3.50761  2.42840  3.01936  3.61284  2.97907  3.84159  2.71026  2.53436  2.52399  2.86144  3.18000  5.34007  4.00674      2 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02248  4.20238  4.92473  0.61958  0.77255  0.72507  0.66221\n+      3   2.64685  4.62987  3.21260  2.64391  3.20319  3.52677  3.73231  3.19154  1.89304  2.73024  3.28907  3.12453  3.91047  2.93873  2.47788  2.74981  2.71814  2.76897  5.16338  3.88140      3 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02145  4.24837  4.97072  0.61958  0.77255  0.66538  0.72171\n+      4   2.59540  4.14349  4.09038  3.50634  3.25820  3.76877  4.07471  1.76511  3.16924  2.20692  2.89178  3.73286  4.13615  3.62029  3.38263  2.85035  2.89615  1.85980  4.77968  3.58563      4 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02036  4.30007  5.02242  0.61958  0.77255  0.57784  0.82350\n+      5   2.40171  4.14296  4.29818  3.70976  3.24321  3.84447  4.16765  1.87485  3.57250  1.86168  2.58783  3.87325  3.65966  3.77483  3.71668  2.99972  2.94107  1.99800  4.79023  3.60498      5 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01907  4.36485  5.08719  0.61958  0.77255  0.64255  0.74644\n+      6   2.68244  5.09684  2.86431  2.40714  4.41275  3.46210  3.64474  3.62009  1.79220  3.20869  4.14851  2.31368  3.85497  2.68109  2.58630  2.54795  2.70916  3.47238  5.54316  4.16315      6 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01907  4.36485  5.08719  0.61958  0.77255  0.58589  0.81331\n+      7   2.51351  4.09196  4.28340  3.68888  2.18693  3.78520  4.09958  2.36237  3.54158  1.94491  3.02368  3.52894  4.15208  3.73439  '..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01857  4.39113  5.11348  0.61958  0.77255  0.62444  0.76693\n+    335   2.54168  4.43326  3.70105  3.37276  4.24265  3.29361  4.38353  3.50559  3.34625  3.30877  4.22554  3.56791  1.03537  3.68229  3.64261  2.51985  2.99128  2.41738  5.66446  4.42056    341 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01857  4.39113  5.11348  0.61958  0.77255  0.62444  0.76693\n+    336   2.90806  5.30009  3.12274  2.44681  4.69330  3.60571  3.70129  4.11898  1.64699  3.56708  4.35386  1.97253  3.99565  2.56063  2.10091  2.87138  3.11507  3.72225  5.65220  4.34017    342 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01857  4.39113  5.11348  0.61958  0.77255  0.62444  0.76693\n+    337   2.02634  4.41061  3.07357  2.28466  4.09454  3.49812  3.70301  3.30049  2.36604  2.95220  3.92988  2.96758  3.88855  2.85519  2.65799  2.19494  2.89750  3.09478  5.36176  4.02984    343 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01857  4.39113  5.11348  0.61958  0.77255  0.62444  0.76693\n+    338   2.64769  4.36413  4.29826  2.91236  3.57743  4.09194  4.45494  1.50780  3.65512  2.36346  3.49273  4.02428  4.44479  3.92457  3.89671  3.39592  3.16022  1.38233  5.20426  3.99587    344 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01857  4.39113  5.11348  0.61958  0.77255  0.62444  0.76693\n+    339   2.75239  5.18760  2.97323  2.30107  4.53049  3.49801  3.66767  3.98771  1.59116  3.47522  4.23945  2.50058  3.89653  2.67585  2.58444  2.41672  2.76005  3.57938  5.60679  4.23546    345 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01857  4.39113  5.11348  0.61958  0.77255  0.62444  0.76693\n+    340   2.70660  4.12566  4.37982  3.78533  2.83089  3.85178  4.17324  2.14750  3.63287  1.97313  2.58658  3.91128  3.19599  3.81652  3.74557  2.96980  2.93908  1.70721  4.75725  3.57626    346 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01857  4.39113  5.11348  0.61958  0.77255  0.62444  0.76693\n+    341   3.32293  4.78756  4.34495  3.86901  0.91299  4.21403  3.82304  3.23246  3.61634  2.71670  3.83904  3.98140  4.56913  3.89721  2.72889  3.54226  3.55340  3.09892  4.15054  2.33505    347 f - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01857  4.39113  5.11348  0.61958  0.77255  0.62444  0.76693\n+    342   2.61106  1.60800  3.84637  3.30444  3.51845  3.56943  4.07660  2.85126  3.20483  2.60135  3.50967  3.57647  4.04954  3.28050  3.47821  2.50116  2.64374  2.41911  4.99322  3.56723    348 c - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01254  4.38510        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W09HB.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W09HB.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,1360 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W09HB\n+LENG  446\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:05:17 2016\n+NSEQ  41\n+EFFN  1.053528\n+CKSUM 3267506956\n+STATS LOCAL MSV      -11.6146  0.69862\n+STATS LOCAL VITERBI  -12.6740  0.69862\n+STATS LOCAL FORWARD   -5.9898  0.69862\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.56368  4.04930  3.03333  2.66716  3.18413  3.09109  3.74873  2.91459  2.61734  2.36754  3.61990  3.07269  3.26390  3.02405  2.88886  2.60366  2.78703  2.72775  4.37673  3.59396\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.10450  4.19352  2.47539  0.61958  0.77255  0.00000        *\n+      1   2.45739  4.70808  3.03798  2.49387  3.97066  3.26831  3.66445  3.23724  2.42950  3.00032  3.67881  2.92525  2.76408  2.72664  2.92731  2.18245  2.65608  3.06395  5.26268  3.94587      1 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02459  4.11361  4.83595  0.61958  0.77255  0.56130  0.84505\n+      2   2.48116  4.63798  3.09550  2.48994  3.63514  3.35405  3.67547  3.23624  2.45404  2.64950  3.56764  2.95745  3.00611  2.81078  2.96145  2.22041  2.73603  2.90997  5.17279  3.87244      2 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02437  4.12251  4.84485  0.61958  0.77255  0.56853  0.83553\n+      3   2.53236  4.44644  2.73806  2.12571  4.34185  3.38401  3.58324  3.80335  2.07854  3.32138  4.08378  2.75333  3.21591  2.45440  2.81723  2.46445  2.79525  3.40369  5.48525  4.09670      3 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02437  4.12251  4.84485  0.61958  0.77255  0.56853  0.83553\n+      4   3.56372  4.87554  4.60171  4.24427  1.92519  4.31595  3.67473  3.25223  4.03522  2.57067  3.85027  4.12940  4.67144  4.13520  4.11408  3.74416  3.80605  3.20187  1.07833  2.15042      4 w - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02437  4.12251  4.84485  0.61958  0.77255  0.56853  0.83553\n+      5   2.64955  4.75457  3.11163  2.54345  3.99005  3.47812  3.41902  3.21244  1.71999  3.00282  3.42181  3.03714  3.86694  2.82786  2.77577  2.65630  2.48681  3.08332  5.25679  3.95749      5 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02437  4.12251  4.84485  0.61958  0.77255  0.56853  0.83553\n+      6   2.67238  4.95114  2.94097  2.45189  4.24270  3.45909  3.06311  3.66505  2.04275  3.15247  3.70205  2.96566  3.84436  2.73996  2.00934  2.67805  2.63896  3.31531  5.39873  4.07013      6 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02437  4.12251  4.84485  0.61958  0.77255  0.56853  0.83553\n+      7   3.11874  4.82639  3.75407  3.63445  4.59623  3.50012  4.68503  4.21414  3.71480  3.81033  4.87559  3.91260  0.47107  4.09566  '..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.29826  4.17824  1.41648  0.61958  0.77255  0.51853  0.90485\n+    439   2.71317  5.17837  2.12661  1.72660  4.48078  3.12730  3.62240  3.95802  2.47507  3.47146  4.26714  2.59302  3.36837  2.75839  2.82515  2.65525  2.96686  3.55327  5.63991  4.21220    445 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03022  3.91020  4.63255  0.61958  0.77255  0.74538  0.64351\n+    440   2.43687  4.86368  2.56020  2.26004  4.12815  3.16127  3.45102  3.37099  2.28929  3.13372  3.92928  2.75206  3.75946  2.64524  2.82944  2.50947  2.73664  3.21082  5.34709  3.65771    446 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.14065  3.92430  2.19415  0.61958  0.77255  0.42615  1.05849\n+    441   2.73257  5.19884  2.15142  2.15076  4.51119  2.39160  3.65443  3.98821  2.12350  3.49709  4.28293  2.61776  3.81081  2.78401  2.99650  2.49130  2.98275  3.57877  5.66040  4.23773    447 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02588  4.06305  4.78540  0.61958  0.77255  0.44299  1.02754\n+    442   2.58771  4.44266  3.31964  2.76846  3.65070  2.48223  3.79492  2.91935  2.59757  2.24130  3.58545  3.20662  3.91059  3.05699  3.10977  2.54952  2.40790  2.65204  5.05296  3.79630    448 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02303  4.17824  4.90059  0.61958  0.77255  0.51853  0.90485\n+    443   3.55236  4.84250  4.67005  4.28681  1.70659  4.40531  3.63578  2.85488  4.13319  2.60292  3.83851  4.13391  4.71335  4.15102  4.19902  3.74896  3.77447  3.12220  3.80340  0.96103    449 y - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02303  4.17824  4.90059  0.61958  0.77255  0.51853  0.90485\n+    444   2.33172  4.35038  3.43320  2.87080  3.50811  3.55252  3.82390  2.61466  2.82280  2.50309  3.36514  3.15222  3.94400  3.13604  3.18607  2.59335  1.98780  2.62172  4.94447  3.40884    450 t - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02303  4.17824  4.90059  0.61958  0.77255  0.51853  0.90485\n+    445   2.68805  3.53973  4.10372  3.53213  2.79165  3.76713  3.92992  2.59544  3.40480  2.09680  3.25747  3.71853  3.67445  3.61835  3.58368  3.05718  2.92030  2.41268  2.00974  2.89681    451 w - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.05871  4.17824  3.17734  0.61958  0.77255  0.51853  0.90485\n+    446   2.59405  4.40351  3.35451  2.70444  3.18347  3.52987  3.79583  2.79753  2.75360  2.51202  3.39181  3.23151  3.92449  3.07835  3.13395  1.83245  2.67484  2.65821  4.98899  3.73249    452 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01612  4.13565        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W0CIU.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W0CIU.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,616 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W0CIU\n+LENG  198\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:07:10 2016\n+NSEQ  42\n+EFFN  0.730591\n+CKSUM 142938255\n+STATS LOCAL MSV      -10.2781  0.70546\n+STATS LOCAL VITERBI  -11.1685  0.70546\n+STATS LOCAL FORWARD   -5.0749  0.70546\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.51868  4.31129  2.87345  2.82349  3.26011  2.81771  3.86625  2.70631  2.74327  2.39929  3.56532  3.13425  3.49021  3.14788  2.96117  2.71678  2.84342  2.54373  4.57683  3.24577\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.05525  4.03111  3.32441  0.61958  0.77255  0.00000        *\n+      1   2.59649  4.55704  3.14375  2.66458  3.77503  3.40350  3.73846  3.21645  2.53784  2.87305  3.45517  3.00726  1.91835  2.96654  2.81461  2.70946  2.86693  2.93702  5.14022  3.68947      1 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02749  4.00336  4.72570  0.61958  0.77255  0.51463  0.91060\n+      2   2.01091  4.44307  3.13629  2.66223  3.71241  3.39093  3.73748  3.08093  2.63970  2.76757  3.50355  3.10925  3.66140  2.97104  3.04765  2.32517  2.49759  2.71625  5.08960  3.58857      2 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02749  4.00336  4.72570  0.61958  0.77255  0.51463  0.91060\n+      3   2.61552  4.64353  3.03862  2.57569  3.68732  3.40128  3.70728  3.30034  2.33344  2.93717  3.81276  3.04805  2.01807  2.79343  2.86272  2.70017  2.87510  2.92443  5.21747  3.91269      3 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02749  4.00336  4.72570  0.61958  0.77255  0.51463  0.91060\n+      4   2.60521  4.68297  2.88485  2.45376  3.87210  1.82198  3.73021  3.46730  2.43809  3.09605  3.94169  2.99439  3.82606  2.91880  2.81058  2.55253  2.88932  3.13762  5.34291  4.03687      4 g - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02749  4.00336  4.72570  0.61958  0.77255  0.48363  0.95853\n+      5   2.16537  4.43133  3.10013  2.49492  3.78133  3.14250  3.66442  3.09252  2.44721  2.69628  3.67382  3.03357  3.83053  2.69080  2.94712  2.41520  2.80036  2.85763  5.12375  3.65546      5 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02698  4.02180  4.74415  0.61958  0.77255  0.49563  0.93953\n+      6   2.53482  4.12300  3.83807  3.26464  2.18762  3.64942  3.92633  2.29819  3.04465  2.11344  3.15043  3.44677  4.02244  3.42228  3.40095  2.80052  2.81995  2.31604  4.69916  3.46484      6 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02698  4.02180  4.74415  0.61958  0.77255  0.49563  0.93953\n+      7   2.65505  4.49269  3.09179  2.74683  3.29007  3.52082  3.39201  3.04710  2.71579  2.64994  3.61415  3.18329  3.93169  3.06001  3.'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02697  4.02222  4.74456  0.61958  0.77255  0.49519  0.94021\n+    191   2.92056  5.07756  3.25412  2.67062  4.45664  3.58737  3.61992  3.82967  1.25477  3.32227  4.17823  3.11461  3.97419  2.58835  2.16239  2.92413  3.11266  3.30103  5.43051  4.20491    192 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02697  4.02222  4.74456  0.61958  0.77255  0.49519  0.94021\n+    192   3.06698  4.52713  4.14063  3.66583  1.94845  3.99127  3.61576  2.80455  3.55006  2.53083  3.61867  3.77333  4.34743  3.72427  3.74135  3.01456  3.30113  2.81075  3.92855  1.31645    193 y - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02697  4.02222  4.74456  0.61958  0.77255  0.49519  0.94021\n+    193   2.63860  4.91892  2.92055  2.32859  4.20337  3.40896  3.12510  3.63078  2.30023  3.12950  3.99053  2.91825  3.81006  2.16634  2.58614  2.38629  2.64225  3.28093  5.38255  4.04335    194 q - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02697  4.02222  4.74456  0.61958  0.77255  0.49519  0.94021\n+    194   2.82259  4.31452  4.08812  3.52178  3.26204  3.93631  4.23799  1.81001  3.39147  1.64640  3.15772  3.82782  4.27092  3.07808  3.63410  3.23041  3.05658  1.88543  4.97280  3.79173    195 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02697  4.02222  4.74456  0.61958  0.77255  0.49519  0.94021\n+    195   1.58287  4.23369  3.44857  3.02656  3.98521  1.99999  4.05401  2.99575  3.00919  3.04267  3.91498  3.28528  3.76589  3.32422  3.35106  2.46632  2.74283  2.81084  5.37632  4.14157    196 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02697  4.02222  4.74456  0.61958  0.77255  0.49519  0.94021\n+    196   2.68076  3.95473  4.08999  3.52487  3.18284  3.80551  4.18065  1.71848  3.42516  2.27459  3.29023  3.60454  4.18396  3.67723  3.65230  3.10769  2.47583  1.70924  4.91875  3.71367    197 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02697  4.02222  4.74456  0.61958  0.77255  0.49519  0.94021\n+    197   2.78271  2.90307  4.43002  3.87365  3.38841  3.97990  4.42976  1.51414  3.74808  2.15786  3.30870  4.04835  4.35206  3.98009  3.92014  3.19186  3.03944  1.58417  5.05278  3.85391    198 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02697  4.02222  4.74456  0.61958  0.77255  0.49519  0.94021\n+    198   2.55725  4.62987  2.71205  2.51565  3.95402  3.34864  3.70795  3.33905  2.55608  2.99389  3.47560  2.85775  3.81155  2.89435  2.99346  2.49903  1.87947  3.02456  5.27005  3.96094    199 t - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01824  4.01348        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W0DGR.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W0DGR.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,385 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W0DGR\n+LENG  121\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:12:24 2016\n+NSEQ  42\n+EFFN  0.725464\n+CKSUM 3354938972\n+STATS LOCAL MSV      -10.0588  0.71332\n+STATS LOCAL VITERBI  -10.7388  0.71332\n+STATS LOCAL FORWARD   -4.5657  0.71332\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.52207  3.51288  2.81360  2.60860  3.34142  3.02217  3.62540  3.04280  2.70386  2.56694  3.62701  2.94579  3.03764  2.98608  2.96621  2.63768  2.89749  2.84438  4.89704  3.41984\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.11954  4.02783  2.35540  0.61958  0.77255  0.00000        *\n+      1   2.65331  5.00898  2.89391  2.27962  4.33758  3.41587  3.57529  3.75739  1.72526  3.27773  4.08300  2.84891  3.56748  2.61259  2.40483  2.55683  2.92465  3.39697  5.43007  4.11005      1 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02939  3.93768  4.66003  0.61958  0.77255  0.57373  0.82879\n+      2   2.53258  5.08487  2.08533  1.92241  4.37375  3.30043  3.60275  3.83751  2.38455  3.36693  4.15620  2.67464  3.62249  2.73353  2.87132  2.62614  2.90854  3.44816  5.54556  3.75527      2 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02939  3.93768  4.66003  0.61958  0.77255  0.57373  0.82879\n+      3   2.47034  4.86035  2.63913  2.33716  3.97030  3.35806  3.06277  3.55863  2.36332  2.97145  3.93068  2.63258  3.66450  2.56928  2.83518  2.41873  2.80878  3.20939  5.34629  3.98836      3 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02939  3.93768  4.66003  0.61958  0.77255  0.55713  0.85063\n+      4   2.43548  4.08224  3.77751  3.19972  2.65453  3.45835  3.88215  2.32144  3.10698  2.09444  2.93860  3.39762  3.83479  3.36440  3.26132  2.87181  2.76896  2.32601  4.67964  3.31640      4 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02908  3.94819  4.67054  0.61958  0.77255  0.56425  0.84115\n+      5   2.82884  4.29235  4.18793  3.61335  2.59237  3.93445  4.15599  2.38262  3.49407  1.29632  2.79438  3.86557  3.95649  3.69873  3.68882  3.22851  3.05586  2.32316  4.39923  3.47777      5 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02908  3.94819  4.67054  0.61958  0.77255  0.56425  0.84115\n+      6   2.32639  4.47223  3.15557  2.60774  3.73334  3.06450  3.69701  3.11895  2.57331  2.74425  3.64089  3.00487  3.69817  2.91639  2.87906  2.29881  2.41427  2.77872  4.63994  3.81678      6 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02908  3.94819  4.67054  0.61958  0.77255  0.56425  0.84115\n+      7   2.57770  5.20400  1.64260  2.03987  4.51907  2.95830  3.67148  3.99452  2.57366  3.52151  4.33336  2.61377  3.79093  2.81945  3'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02894  3.95264  4.67499  0.61958  0.77255  0.53716  0.87805\n+    114   0.90415  4.23307  3.54480  3.34014  4.13296  3.05539  4.35261  3.27054  3.35848  3.14842  4.17173  3.46923  3.80222  3.69237  3.60328  2.58282  2.86574  2.91108  5.55212  4.36137    115 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02894  3.95264  4.67499  0.61958  0.77255  0.53716  0.87805\n+    115   1.08261  4.19026  3.39990  3.13922  4.15938  2.99391  4.20247  3.42325  3.17224  3.20871  4.12431  3.31923  3.10912  3.49438  3.46395  2.46913  2.75673  2.99602  5.54311  4.33231    116 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02894  3.95264  4.67499  0.61958  0.77255  0.53716  0.87805\n+    116   2.82230  4.92162  3.03147  2.63711  4.37380  3.42480  3.69502  3.77850  1.24216  3.34242  4.22303  3.07728  3.91920  2.85965  2.42397  2.62099  3.08554  3.43663  5.45261  4.19230    117 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02894  3.95264  4.67499  0.61958  0.77255  0.53716  0.87805\n+    117   2.89466  5.03468  2.96803  2.59328  4.43201  3.45847  3.67128  3.86994  1.22133  3.39743  4.27163  2.77155  3.93628  2.83066  2.38627  2.90015  3.13379  3.52910  5.46858  4.20505    118 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02894  3.95264  4.67499  0.61958  0.77255  0.53716  0.87805\n+    118   2.76666  4.53390  3.45683  3.36654  4.50690  0.61547  4.48170  4.12623  3.55870  3.77025  4.74682  3.62114  3.92761  3.87653  3.78573  2.94091  3.25414  3.63908  5.58066  4.61159    119 G - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.06439  3.95264  3.14296  0.61958  0.77255  0.53716  0.87805\n+    119   2.56577  4.17005  3.75002  3.18623  2.67213  3.64845  3.87861  2.07722  3.09725  2.12264  3.23374  3.00514  4.01786  3.36818  3.36791  2.92234  2.83802  2.32458  4.65562  3.18611    120 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02997  3.91822  4.64057  0.61958  0.77255  0.56846  0.83563\n+    120   2.60272  4.90870  2.55628  2.29833  4.16723  3.34910  3.09972  3.61810  2.35206  3.11146  3.72635  2.23372  3.76930  2.71577  2.74715  2.60111  2.83744  3.26317  5.37679  4.01107    121 n - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02997  3.91822  4.64057  0.61958  0.77255  0.56846  0.83563\n+    121   2.83428  4.29755  4.18215  3.65057  3.41210  3.98146  4.39800  1.86586  3.51278  1.95477  3.32813  3.73841  4.35439  3.82652  3.76267  3.31309  3.09497  1.30538  5.14502  3.90194    122 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02027  3.90853        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W0E07.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W0E07.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,697 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W0E07\n+LENG  225\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:09:23 2016\n+NSEQ  41\n+EFFN  1.113586\n+CKSUM 4294424761\n+STATS LOCAL MSV      -10.5468  0.70398\n+STATS LOCAL VITERBI  -11.2573  0.70398\n+STATS LOCAL FORWARD   -5.0856  0.70398\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.45272  4.46999  3.02627  2.57319  3.22427  3.03909  3.79627  2.72588  2.69524  2.27846  3.63709  3.05164  3.75549  3.07294  2.92976  2.69253  2.86896  2.63954  4.74934  3.47638\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.05069  4.24993  3.34771  0.61958  0.77255  0.00000        *\n+      1   2.67882  4.37879  3.84649  3.26983  3.34826  3.79752  4.04932  2.52597  3.06209  1.28206  3.17054  3.61475  4.15665  3.05737  3.16031  3.07810  3.00890  2.52314  4.94525  3.75069      1 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02205  4.22128  4.94363  0.61958  0.77255  0.52268  0.89876\n+      2   2.56536  4.53061  3.28372  2.71490  3.31223  3.54306  3.76108  2.76955  2.22708  2.73399  3.15028  3.17722  3.92508  2.99924  2.17317  2.77240  2.86390  2.67589  5.08227  3.81710      2 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02205  4.22128  4.94363  0.61958  0.77255  0.52268  0.89876\n+      3   2.41694  4.85632  2.94373  1.58521  4.13579  3.43723  3.70106  3.36476  2.49838  3.14341  3.96993  2.98986  3.86489  2.77939  2.95041  2.61507  2.90597  2.83798  5.39777  4.06108      3 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02205  4.22128  4.94363  0.61958  0.77255  0.49622  0.93860\n+      4   3.46563  4.74660  5.19748  4.62125  2.81262  4.76839  5.04801  1.80666  4.49433  0.83607  2.66085  4.83692  4.90066  4.50099  4.54354  4.12216  3.67824  2.38393  5.24347  4.19955      4 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02177  4.23395  4.95629  0.61958  0.77255  0.50666  0.92257\n+      5   2.52146  4.94408  2.98452  2.36843  3.87765  3.44665  3.63256  3.65211  1.87213  3.21446  4.00633  2.81898  3.83691  2.68686  2.52686  2.65043  2.46525  3.29742  5.41608  3.69015      5 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02177  4.23395  4.95629  0.61958  0.77255  0.50666  0.92257\n+      6   2.64041  5.15204  3.20146  2.59622  4.52222  3.58776  3.14982  3.92487  1.75322  3.40947  4.21726  3.08216  3.96316  2.69929  1.66544  2.64765  3.06400  3.56415  5.51973  4.23988      6 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02177  4.23395  4.95629  0.61958  0.77255  0.50666  0.92257\n+      7   3.21371  5.26061  3.73722  3.00198  4.69062  3.82782  3.72798  4.03120  1.78535  3.25344  4.37372  3.37128  4.18373  2.86866  0'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02204  4.22165  4.94400  0.61958  0.77255  0.52222  0.89944\n+    218   2.60154  3.59028  3.88388  3.30300  3.24333  3.67133  3.61941  2.35999  3.01892  1.80967  3.00010  3.57898  4.04331  3.45565  2.88406  2.84816  2.83334  2.29177  4.34271  3.53723    221 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02204  4.22165  4.94400  0.61958  0.77255  0.52222  0.89944\n+    219   3.02941  5.62951  1.16269  2.09214  4.92017  3.33175  3.85192  4.44449  2.74495  3.92471  4.75911  2.21109  3.94173  3.01048  3.44682  2.71790  3.31235  4.00539  6.08202  4.56986    222 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02204  4.22165  4.94400  0.61958  0.77255  0.52222  0.89944\n+    220   1.43850  3.65193  3.77347  3.25641  3.70208  3.16318  4.11039  2.86659  3.19199  2.77110  3.66581  3.48742  3.91984  3.47253  3.49368  2.28259  2.82127  2.23283  5.15488  3.94472    223 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02204  4.22165  4.94400  0.61958  0.77255  0.52222  0.89944\n+    221   3.50880  4.82215  5.04905  4.53478  3.18082  4.74118  5.06367  2.01958  4.32734  0.69850  2.99853  4.78952  4.92743  4.47822  4.43685  4.14088  3.74322  2.33516  5.31142  4.19288    224 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02204  4.22165  4.94400  0.61958  0.77255  0.52222  0.89944\n+    222   2.57806  4.14180  3.08141  2.51897  3.82305  3.47343  3.67530  3.37190  2.29730  2.99620  3.68177  2.85661  3.86092  2.32525  2.41459  2.58583  2.85689  3.07006  3.52885  3.94697    225 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02204  4.22165  4.94400  0.61958  0.77255  0.52222  0.89944\n+    223   2.71716  5.12674  2.87247  2.36580  4.46794  3.34885  3.62018  3.91609  1.96883  3.40816  4.17998  2.79783  3.85831  2.47160  1.92964  2.63798  2.74543  3.51782  5.54136  4.18326    226 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02204  4.22165  4.94400  0.61958  0.77255  0.52222  0.89944\n+    224   3.03020  4.40182  4.69920  4.10993  2.85299  4.22466  4.53026  1.84241  3.96710  1.29152  2.15251  4.27790  4.50135  4.09039  3.75721  3.54017  3.25434  2.28553  4.97162  3.85736    227 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02204  4.22165  4.94400  0.61958  0.77255  0.52222  0.89944\n+    225   2.88351  3.97797  4.31535  3.77723  1.42386  3.93232  3.82766  2.77140  3.38847  2.44565  3.42622  3.85905  4.28790  3.79490  3.76504  3.08182  3.11336  2.59084  2.90343  2.39864    228 f - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01489  4.21450        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W0EOF.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W0EOF.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,439 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W0EOF\n+LENG  139\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:16:47 2016\n+NSEQ  39\n+EFFN  0.680786\n+CKSUM 4228045402\n+STATS LOCAL MSV      -10.3175  0.71065\n+STATS LOCAL VITERBI  -11.0722  0.71065\n+STATS LOCAL FORWARD   -4.6314  0.71065\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.59984  4.10585  2.90344  2.71421  3.05446  2.27988  3.64451  3.05594  2.65284  2.67879  3.69718  3.15910  3.67161  3.08247  2.85073  2.76548  2.94379  2.80442  4.09757  3.28919\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.11069  3.99879  2.44826  0.61958  0.77255  0.00000        *\n+      1   2.57734  4.70516  2.75537  2.45555  4.15952  1.97320  3.70151  3.57787  2.40570  3.17994  4.01307  2.93949  3.56461  2.87541  2.57922  2.56192  2.87253  3.21693  5.40287  4.09013      1 g - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02998  3.91808  4.64042  0.61958  0.77255  0.55143  0.85832\n+      2   2.52064  4.25844  4.17091  3.65525  3.50301  3.88734  4.43086  1.70956  3.55346  2.22682  3.37780  3.91529  4.08498  3.84643  3.80660  3.23468  3.05246  1.34903  5.21567  4.00610      2 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02975  3.92556  4.64791  0.61958  0.77255  0.55637  0.85165\n+      3   1.87320  4.15449  3.73868  3.30656  3.73752  3.27219  4.19881  2.52838  3.23663  2.66156  3.65831  3.50062  3.89615  3.54624  3.51850  2.59577  2.62213  1.60929  5.26532  4.05186      3 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02975  3.92556  4.64791  0.61958  0.77255  0.55637  0.85165\n+      4   2.65012  4.94711  3.12542  2.64166  4.37320  3.48075  3.63949  3.72481  1.30889  3.27250  4.14850  3.08045  3.92466  2.79237  2.24235  2.86663  3.07063  3.40312  5.41249  4.17916      4 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02975  3.92556  4.64791  0.61958  0.77255  0.55637  0.85165\n+      5   2.53118  3.90951  3.27977  2.71855  3.53000  3.46224  3.72471  2.76192  2.50151  2.59273  3.47247  2.92895  3.85659  2.99956  3.05312  2.55867  2.42011  2.43876  4.94213  3.55212      5 t - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02975  3.92556  4.64791  0.61958  0.77255  0.55637  0.85165\n+      6   2.73136  4.50167  3.41602  3.32210  4.46367  0.65170  4.43924  4.07609  3.51060  3.72360  4.69969  3.58027  3.89451  3.83054  3.74093  2.90478  3.21672  3.59416  5.54491  4.56732      6 G - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02975  3.92556  4.64791  0.61958  0.77255  0.55637  0.85165\n+      7   1.80345  4.20092  3.32460  2.94553  4.06020  1.82946  4.01711  3.40289  2.95081  3.12755  3.69418  3.20533  3.69485  3.27147  3'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03015  3.91257  4.63492  0.61958  0.77255  0.52450  0.89612\n+    132   2.68734  3.35014  4.39526  3.84354  3.40281  4.01713  4.47184  1.53799  3.73474  2.15060  3.15869  4.05506  4.37674  3.97719  3.93366  3.34844  3.05856  1.48429  5.11563  3.92029    132 v - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03015  3.91257  4.63492  0.61958  0.77255  0.52450  0.89612\n+    133   1.43364  4.20464  3.40033  3.02157  3.88110  3.10037  4.03507  3.09524  2.97574  2.63406  3.85056  3.27431  3.75697  3.32301  3.29080  2.23137  2.73906  2.76187  5.31012  4.05812    133 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03015  3.91257  4.63492  0.61958  0.77255  0.52450  0.89612\n+    134   2.92515  4.34411  4.36030  3.78811  2.45917  4.06502  4.25932  2.15969  3.67115  1.31520  2.65065  4.01794  4.35074  3.83569  3.83669  3.36830  3.14883  2.31501  4.73661  3.16084    134 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03015  3.91257  4.63492  0.61958  0.77255  0.52450  0.89612\n+    135   3.07888  4.55092  4.30969  3.79349  3.09225  4.14360  4.47243  2.22906  3.56280  1.46793  1.60746  4.09344  4.46441  3.87543  3.76740  3.50804  3.33065  2.28093  5.03905  3.83691    135 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03015  3.91257  4.63492  0.61958  0.77255  0.52450  0.89612\n+    136   1.13672  4.11946  3.39934  3.15959  4.15062  2.92512  4.20952  3.40941  3.19604  3.23590  4.13344  3.29716  3.67780  3.51079  3.47488  2.17368  2.69687  2.95708  5.54945  4.32052    136 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03015  3.91257  4.63492  0.61958  0.77255  0.52450  0.89612\n+    137   2.75330  4.75981  3.27942  2.78415  4.21305  3.40876  3.70707  3.66874  2.14781  3.23509  4.13117  3.16590  3.90904  2.88928  1.35456  2.56202  3.03631  3.33307  5.34265  4.09577    137 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03015  3.91257  4.63492  0.61958  0.77255  0.52450  0.89612\n+    138   1.97234  4.35278  3.25515  2.73499  3.69645  3.32571  3.78078  2.88610  2.69228  2.58093  3.62273  2.85221  3.80927  3.03173  3.07532  2.39002  2.65275  2.64797  5.08949  3.83034    138 a - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03015  3.91257  4.63492  0.61958  0.77255  0.52450  0.89612\n+    139   2.70283  4.83781  3.02782  2.51085  4.01504  3.45287  3.59879  3.50588  2.21876  2.92577  3.92893  2.87954  3.85578  1.90058  2.41303  2.73551  2.92333  3.19969  5.23922  3.67711    139 q - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02039  3.90282        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W0IVU.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W0IVU.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,334 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W0IVU\n+LENG  104\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:12:29 2016\n+NSEQ  41\n+EFFN  0.818298\n+CKSUM 4143370715\n+STATS LOCAL MSV       -9.4496  0.71659\n+STATS LOCAL VITERBI  -10.4389  0.71659\n+STATS LOCAL FORWARD   -4.1748  0.71659\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.42818  4.27224  3.32694  2.85240  3.27847  2.72914  3.61667  2.88884  2.45813  2.55698  3.70949  3.11380  3.58361  3.13719  2.57718  2.76933  2.84041  2.65262  4.39396  3.33476\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.04558  4.08561  3.58468  0.61958  0.77255  0.00000        *\n+      1   2.82587  5.04330  2.98991  2.54305  4.43064  3.47874  3.66493  3.84133  1.40860  3.35850  4.19606  3.02743  2.71011  2.68274  2.49895  2.82658  3.05609  3.49095  5.49370  4.21088      1 k - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02581  4.06584  4.78818  0.61958  0.77255  0.50765  0.92107\n+      2   2.93561  5.00417  3.41048  2.78166  4.37759  3.62225  3.65819  3.74833  1.93150  3.06561  4.14519  3.19529  4.01182  2.80964  1.29901  2.78340  3.13433  3.44259  5.39418  4.18284      2 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02581  4.06584  4.78818  0.61958  0.77255  0.50765  0.92107\n+      3   2.66360  4.60933  3.17089  2.66139  3.16396  3.32178  1.99965  3.20011  2.62138  2.83692  3.72037  3.05481  3.63249  2.97657  3.02007  2.76506  2.89999  2.93657  4.84261  3.07413      3 h - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02581  4.06584  4.78818  0.61958  0.77255  0.50765  0.92107\n+      4   2.73919  4.70005  2.63926  2.83520  4.56665  0.84750  4.22939  4.10503  3.26257  3.74688  4.64065  3.25295  3.92660  3.49890  3.65349  2.84315  3.17709  3.62373  5.75674  4.56560      4 g - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02581  4.06584  4.78818  0.61958  0.77255  0.50765  0.92107\n+      5   2.96335  5.01804  2.93051  2.76145  4.39973  3.53589  3.79457  3.87690  2.27934  3.41422  4.30756  3.20534  4.01504  2.96989  1.06643  2.99456  3.21175  3.54989  5.47225  4.23918      5 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02581  4.06584  4.78818  0.61958  0.77255  0.50765  0.92107\n+      6   2.94232  4.53094  3.95370  3.59251  3.40642  3.31603  4.35340  2.62752  3.40978  0.90574  3.45884  3.86109  4.26937  3.79762  3.62167  3.25326  3.26223  2.55388  5.10744  3.84161      6 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02581  4.06584  4.78818  0.61958  0.77255  0.50765  0.92107\n+      7   3.35776  4.70885  4.42849  3.99849  1.85823  4.21615  3.52163  3.23966  3.84265  2.70844  3.83471  3.93558  4.53959  3.93127  3'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02740  4.00656  4.72891  0.61958  0.77255  0.52812  0.89090\n+     97   2.42280  4.33517  4.38080  3.89013  3.55799  4.03612  4.65369  1.22195  3.77697  2.18177  3.40478  4.12155  4.45816  4.07025  4.00984  3.40965  3.17728  1.67156  5.36692  4.16082     98 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02740  4.00656  4.72891  0.61958  0.77255  0.52812  0.89090\n+     98   2.39881  4.32402  4.05116  3.50657  3.32343  3.84429  4.26704  2.25622  3.38363  1.94142  1.88090  3.80128  4.23738  3.67028  3.63775  3.16428  3.04808  1.98936  5.04588  3.86474     99 m - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02740  4.00656  4.72891  0.61958  0.77255  0.52812  0.89090\n+     99   2.80211  4.33487  3.99413  3.43631  3.17731  3.86127  4.13533  2.29922  3.27579  1.29488  3.02871  3.74343  4.21531  3.58091  3.52085  2.90783  3.04130  2.29673  4.87219  3.50780    100 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02740  4.00656  4.72891  0.61958  0.77255  0.52812  0.89090\n+    100   2.57264  4.05708  3.52770  2.96137  3.27014  3.55876  3.81092  2.60242  2.76471  2.44755  3.36019  3.33640  3.94382  3.18728  3.11306  2.81946  2.51436  2.50421  4.79344  2.23439    101 y - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02740  4.00656  4.72891  0.61958  0.77255  0.52812  0.89090\n+    101   2.57295  4.52238  3.12293  2.65589  3.46749  3.38996  3.60008  3.11892  2.55758  2.85344  3.73148  3.10308  1.96273  2.98440  2.98816  2.59066  2.84630  2.90826  5.09744  3.77278    102 p - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02740  4.00656  4.72891  0.61958  0.77255  0.52812  0.89090\n+    102   2.48533  3.99761  3.14454  2.63508  3.91504  3.29971  3.75407  3.31199  2.59547  2.96693  3.65820  2.64697  3.79506  2.83407  3.00149  1.75571  2.72820  2.98338  5.24314  3.95635    103 s - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02740  4.00656  4.72891  0.61958  0.77255  0.52812  0.89090\n+    103   2.63545  4.76323  3.08568  2.52582  4.06230  3.43390  3.63388  3.28495  2.23180  3.05812  3.88873  2.96316  3.70159  2.79318  1.97560  2.47009  2.54611  3.14084  5.28534  3.99233    104 r - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03954  4.00656  3.88361  0.61958  0.77255  0.52812  0.89090\n+    104   2.86872  4.26972  4.38547  3.82394  2.98721  4.07194  4.40815  1.49102  3.71006  1.77706  3.18676  3.83574  4.39389  3.93325  3.90106  3.38632  3.10731  1.75112  5.00105  3.78840    105 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.01875  3.98577        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/hmms/EOG090W0MBV.hmm
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/hmms/EOG090W0MBV.hmm Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,307 @@\n+HMMER3/f [3.1b1 | May 2013]\n+NAME  EOG090W0MBV\n+LENG  95\n+ALPH  amino\n+RF    no\n+MM    no\n+CONS  yes\n+CS    no\n+MAP   yes\n+DATE  Tue Jul 19 12:14:30 2016\n+NSEQ  40\n+EFFN  0.522461\n+CKSUM 2466610219\n+STATS LOCAL MSV       -9.1620  0.71848\n+STATS LOCAL VITERBI  -10.2836  0.71848\n+STATS LOCAL FORWARD   -4.1820  0.71848\n+HMM          A        C        D        E        F        G        H        I        K        L        M        N        P        Q        R        S        T        V        W        Y   \n+            m->m     m->i     m->d     i->m     i->i     d->m     d->d\n+  COMPO   2.56450  4.28309  2.76772  2.56684  3.52985  2.98984  3.92958  2.60319  2.65378  2.43726  3.50008  3.20375  3.32766  3.12900  2.79306  2.83380  2.86717  2.62548  4.82581  3.47921\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.12078  3.88848  2.37195  0.61958  0.77255  0.00000        *\n+      1   2.73776  5.24526  1.51161  1.96938  4.54883  3.07989  3.66859  4.01576  2.53217  3.56646  4.41644  2.64410  3.75762  2.83675  3.18082  2.71671  3.08140  3.62383  5.75511  4.29766      1 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03375  3.80145  4.52379  0.61958  0.77255  0.56026  0.84644\n+      2   2.73482  5.13721  1.72435  1.96660  4.37896  3.21556  3.62614  3.85554  2.44602  3.40992  4.24267  2.69454  3.75706  2.78499  3.03922  2.67813  2.99576  3.48531  5.59602  3.77562      2 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03375  3.80145  4.52379  0.61958  0.77255  0.56026  0.84644\n+      3   2.88000  4.44985  3.38497  3.26359  1.59717  3.76325  3.58869  2.84234  3.22452  2.40749  3.50517  3.51646  4.15213  3.45819  3.49024  3.08880  3.12319  2.69164  4.03170  2.24342      3 f - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03375  3.80145  4.52379  0.61958  0.77255  0.56026  0.84644\n+      4   2.80226  5.12724  1.29463  2.12543  4.44534  3.12132  3.74491  4.01484  2.77908  3.61191  4.50817  2.54823  3.76387  2.94546  3.32572  2.74529  3.12775  3.61855  5.70534  4.25110      4 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03375  3.80145  4.52379  0.61958  0.77255  0.56026  0.84644\n+      5   2.71029  5.03800  1.64640  2.10574  4.30687  3.20638  3.65258  3.45863  2.56624  3.35621  4.20700  2.62319  3.75987  2.82200  3.07438  2.67558  2.98543  3.38537  5.56176  4.14234      5 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03375  3.80145  4.52379  0.61958  0.77255  0.49483  0.94078\n+      6   2.71323  4.88348  2.58228  1.54187  4.15656  3.11457  3.69279  3.52774  2.49648  2.88392  4.08288  2.86916  3.81467  2.87544  2.90741  2.72752  2.98618  3.21871  5.42887  4.07525      6 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03215  3.84920  4.57155  0.61958  0.77255  0.52088  0.90140\n+      7   2.79294  5.25376  1.85349  1.56821  4.50309  3.20417  3.66083  3.99534  2.59623  3.53617  4.37580  2.67759  3.77401  2.82123  3.'..b'.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03207  3.85159  4.57394  0.61958  0.77255  0.51882  0.90442\n+     88   3.01488  4.43972  4.30556  3.92076  3.36037  4.04362  4.65292  1.10414  3.74848  1.95094  3.29925  4.16904  4.47705  4.09906  3.94745  3.53710  3.31451  1.84597  5.24671  3.98305     88 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03207  3.85159  4.57394  0.61958  0.77255  0.51882  0.90442\n+     89   2.84663  5.16630  1.18530  2.15457  4.48708  3.14565  3.78488  4.06518  2.83317  3.66386  4.56946  2.61503  3.79435  2.98913  3.38472  2.78699  3.17578  3.66817  5.74192  4.29188     89 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03207  3.85159  4.57394  0.61958  0.77255  0.51882  0.90442\n+     90   2.93480  5.04093  2.47954  1.05544  4.38460  3.26094  3.84625  3.83437  2.72418  3.45496  4.43017  2.92178  3.86461  3.06251  3.13066  2.91949  3.23897  3.52046  5.56013  4.28265     90 e - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03207  3.85159  4.57394  0.61958  0.77255  0.51882  0.90442\n+     91   3.13208  4.60068  4.15587  3.79587  3.12816  3.95543  4.45816  2.33136  3.56381  0.90134  3.15808  4.07334  4.39454  3.93714  3.74320  3.52421  3.42737  2.36322  4.99963  3.71804     91 l - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03207  3.85159  4.57394  0.61958  0.77255  0.51882  0.90442\n+     92   2.78777  4.31274  4.07176  3.62654  3.47204  3.82941  4.44751  1.34812  3.47644  2.11913  3.35641  3.88916  4.29334  3.82939  3.72104  3.22215  2.65644  1.84493  5.25390  4.02404     92 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03207  3.85159  4.57394  0.61958  0.77255  0.51882  0.90442\n+     93   3.03418  4.42910  4.46153  3.96261  3.28247  4.22664  4.67031  1.23093  3.77603  1.78914  2.93305  4.23228  4.55455  4.08275  3.98412  3.60501  3.29746  1.80417  5.23328  4.01717     93 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03207  3.85159  4.57394  0.61958  0.77255  0.51882  0.90442\n+     94   2.54494  4.19420  3.65897  3.14205  3.45783  3.52080  4.00117  1.85097  3.04255  2.42025  3.40734  3.29510  3.98222  3.36966  3.34007  2.74772  2.50192  2.04405  4.98400  3.75521     94 i - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.03207  3.85159  4.57394  0.61958  0.77255  0.51882  0.90442\n+     95   2.96756  5.09199  0.94846  2.32268  4.46630  3.19520  3.91325  4.04980  2.99351  3.66196  4.63984  2.87790  3.84654  3.15253  3.50671  2.93244  3.30577  3.69129  5.63895  4.34295     95 d - - -\n+          2.68618  4.42225  2.77519  2.73123  3.46354  2.40513  3.72494  3.29354  2.67741  2.69355  4.24690  2.90347  2.73739  3.18146  2.89801  2.37887  2.77519  2.98518  4.58477  3.61503\n+          0.02170  3.84122        *  0.61958  0.77255  0.00000        *\n+//\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W00C1.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W00C1.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,1316 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t227\n+\n+[block]\n+# block no. 0 follows, 32 sequences, length 25\n+# corresponding to MSA columns:\n+# 250-274\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01279\t0.01289\t0.09935\t0.01354\t0.01674\t0.01120\t0.01246\t0.02092\t0.21099\t0.02247\t0.03036\t0.05394\t0.02985\t0.01440\t0.00823\t0.00274\t0.00639\t0.40689\t0.00595\t0.00788\n+1\t0.02197\t0.01487\t0.14850\t0.01256\t0.01779\t0.01034\t0.01190\t0.02614\t0.03798\t0.41734\t0.17879\t0.02738\t0.02565\t0.00918\t0.00694\t0.00210\t0.00592\t0.00764\t0.00703\t0.00997\n+2\t0.02202\t0.07806\t0.09380\t0.01961\t0.10645\t0.41654\t0.01487\t0.09763\t0.05172\t0.02087\t0.01216\t0.01381\t0.00972\t0.00689\t0.00614\t0.00184\t0.01021\t0.00488\t0.00385\t0.00892\n+3\t0.01554\t0.01697\t0.03473\t0.11423\t0.03462\t0.01669\t0.54504\t0.02241\t0.08665\t0.02164\t0.01478\t0.01878\t0.01109\t0.00614\t0.00766\t0.00226\t0.01041\t0.00765\t0.00370\t0.00902\n+4\t0.01875\t0.01639\t0.10359\t0.12721\t0.28295\t0.01449\t0.03556\t0.02479\t0.10023\t0.18223\t0.01742\t0.01899\t0.01269\t0.00703\t0.00670\t0.00210\t0.00759\t0.00628\t0.00478\t0.01024\n+5\t0.01203\t0.00630\t0.00718\t0.00718\t0.00846\t0.00645\t0.00531\t0.01416\t0.01287\t0.02187\t0.01988\t0.02449\t0.01632\t0.01530\t0.09696\t0.12291\t0.00533\t0.00630\t0.58498\t0.00572\n+6\t0.00836\t0.00621\t0.00776\t0.00892\t0.00980\t0.00569\t0.00623\t0.00974\t0.01348\t0.01743\t0.04331\t0.53293\t0.19451\t0.04395\t0.00930\t0.00277\t0.00403\t0.06394\t0.00616\t0.00550\n+7\t0.01435\t0.18134\t0.59064\t0.01760\t0.02668\t0.01778\t0.02213\t0.02102\t0.01406\t0.02016\t0.01150\t0.01349\t0.00852\t0.00625\t0.00596\t0.00199\t0.00937\t0.00468\t0.00284\t0.00966\n+8\t0.01060\t0.00710\t0.00925\t0.07213\t0.01255\t0.00702\t0.00690\t0.01154\t0.01250\t0.04772\t0.05087\t0.19403\t0.13470\t0.23455\t0.01784\t0.10114\t0.00545\t0.05380\t0.00504\t0.00528\n+9\t0.19480\t0.01393\t0.01400\t0.01259\t0.01642\t0.01601\t0.01000\t0.06782\t0.47377\t0.02883\t0.02316\t0.02444\t0.01812\t0.00897\t0.00637\t0.00227\t0.00545\t0.04721\t0.00618\t0.00964\n+10\t0.01116\t0.01003\t0.08305\t0.00973\t0.01247\t0.00749\t0.00847\t0.01464\t0.01809\t0.07160\t0.52471\t0.04662\t0.11107\t0.01303\t0.00772\t0.00215\t0.00413\t0.03002\t0.00685\t0.00697\n+11\t0.01610\t0.01624\t0.03011\t0.09026\t0.48275\t0.01615\t0.20697\t0.02058\t0.01529\t0.02145\t0.01283\t0.01711\t0.01038\t0.00594\t0.00700\t0.00209\t0.00896\t0.00651\t0.00332\t0.00996\n+12\t0.00859\t0.00669\t0.00730\t0.00739\t0.00893\t0.00595\t0.00520\t0.01005\t0.01428\t0.01789\t0.12435\t0.10917\t0.42988\t0.18427\t0.01387\t0.00325\t0.00416\t0.02752\t0.00587\t0.00537\n+13\t0.09223\t0.00841\t0.00952\t0.01010\t0.01166\t0.00881\t0.00722\t0.01596\t0.15960\t0.02080\t0.03325\t0.50301\t0.06024\t0.01685\t0.00772\t0.00255\t0.00431\t0.01490\t0.00614\t0.00673\n+14\t0.01661\t0.01594\t0.02724\t0.04119\t0.72233\t0.01594\t0.02059\t0.02059\t0.01528\t0.02192\t0.01262\t0.01661\t0.01063\t0.00598\t0.00664\t0.00199\t0.00797\t0.00598\t0.00332\t0.01063\n+15\t0.01109\t0.00799\t0.01074\t0.01180\t0.08636\t0.00743\t0.00762\t0.01370\t0.01690\t0.06007\t0.41412\t0.07057\t0.14954\t0.09019\t0.01043\t0.00259\t0.00422\t0.01149\t0.00645\t0.00670\n+16\t0.00977\t0.00742\t0.00914\t0.00889\t0.00963\t0.00772\t0.00618\t0.01109\t0.01323\t0.01800\t0.20056\t0.13684\t0.12810\t0.30258\t0.01957\t0.00398\t0.08487\t0.01171\t0.00533\t0.00537\n+17\t0.01878\t0.00955\t0.01219\t0.01044\t0.01369\t0.00918\t0.00827\t0.02352\t0.10158\t0.30165\t0.19853\t0.03156\t0.04664\t0.01443\t0.08525\t0.00300\t0.00602\t0.00838\t0.08856\t0.00880\n+18\t0.00940\t0.00707\t0.00993\t0.00993\t0.01113\t0.00785\t0.00752\t0.01146\t0.01122\t0.01561\t0.02439\t0.03289\t0.10298\t0.12284\t0.57350\t0.00929\t0.01497\t0.00831\t0.00397\t0.00574\n+19\t0.01110\t0.00929\t0.00915\t0.00945\t0.01103\t0.08430\t0.00675\t0.01268\t0.01495\t0.05160\t0.09758\t0.36660\t0.23750\t0.03537\t0.00860\t0.00250\t0.00472\t0.01468\t0.00607\t0.00608\n+20\t0.01018\t0.01042\t0.08591\t0.00988\t0.01216\t0.00825\t0.00810\t0.01433\t0.09830\t0.01938\t0.11200\t0.22540\t0.17753\t0.16239\t0.01294\t0.00318\t0.00504\t0.01253\t0.00564\t0.00643\n+21\t0.09481\t0.01076\t0.01187\t0.01110\t0.01387\t0.01174\t0.00872\t0.02322\t0.30936\t0.02699\t0.28122\t0.03827\t0.03686\t0.01152\t0.00722\t0.00228\t0.00460\t0.08067\t0.00669\t0.00822\n+22\t0.00974\t0.00658\t0.00769\t0.00769\t0.00782\t0.00671\t0.00453\t0.01000\t0.00987\t0.01329\t0.02080\t'..b'0.00621\t0.00463\t0.00965\t0.01074\t0.01422\t0.02702\t0.21639\t0.06003\t0.55294\t0.02686\t0.00541\t0.00574\t0.01219\t0.00468\t0.00447\n+45\t0.62393\t0.10844\t0.06240\t0.01015\t0.01494\t0.01677\t0.00923\t0.05005\t0.01277\t0.02827\t0.00982\t0.01134\t0.00770\t0.00626\t0.00444\t0.00200\t0.00586\t0.00382\t0.00402\t0.00780\n+46\t0.01054\t0.00767\t0.00930\t0.00834\t0.01081\t0.00663\t0.00636\t0.01327\t0.01739\t0.05500\t0.42696\t0.04827\t0.22947\t0.01326\t0.00750\t0.00201\t0.00356\t0.01142\t0.00670\t0.10552\n+47\t0.01567\t0.01498\t0.02554\t0.20972\t0.56114\t0.01570\t0.02013\t0.01977\t0.01483\t0.02078\t0.01246\t0.01691\t0.01023\t0.00615\t0.00666\t0.00205\t0.00820\t0.00597\t0.00324\t0.00987\n+48\t0.01618\t0.01278\t0.01396\t0.01256\t0.01605\t0.01424\t0.00980\t0.03093\t0.53021\t0.07483\t0.11506\t0.03095\t0.05698\t0.01019\t0.00706\t0.00226\t0.00501\t0.02418\t0.00696\t0.00982\n+49\t0.02506\t0.03198\t0.01901\t0.01729\t0.02074\t0.73725\t0.01296\t0.02679\t0.01901\t0.01642\t0.01037\t0.01210\t0.00864\t0.00691\t0.00605\t0.00173\t0.01210\t0.00432\t0.00346\t0.00778\n+50\t0.00839\t0.00675\t0.00704\t0.00701\t0.00879\t0.00587\t0.00498\t0.00986\t0.01448\t0.01774\t0.10302\t0.05963\t0.54164\t0.16032\t0.01297\t0.00307\t0.00398\t0.01318\t0.00589\t0.00540\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+6\t69\n+\n+[block]\n+# block no. 19 follows, 32 sequences, length 15\n+# corresponding to MSA columns:\n+# 1815-1829\n+name=unknown_T\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.03716\t0.01847\t0.02320\t0.01797\t0.02297\t0.10967\t0.18252\t0.31564\t0.02300\t0.08479\t0.01731\t0.07162\t0.01400\t0.00844\t0.00706\t0.00212\t0.00852\t0.02030\t0.00550\t0.00974\n+1\t0.01359\t0.03380\t0.69157\t0.01963\t0.02937\t0.01566\t0.06173\t0.02126\t0.01426\t0.02126\t0.01213\t0.01438\t0.00859\t0.00634\t0.00646\t0.00213\t0.00999\t0.00512\t0.00286\t0.00987\n+2\t0.00926\t0.00685\t0.00864\t0.00820\t0.00988\t0.00623\t0.00615\t0.01221\t0.01844\t0.02559\t0.62144\t0.05228\t0.16149\t0.01421\t0.00792\t0.00213\t0.00320\t0.01244\t0.00721\t0.00623\n+3\t0.07251\t0.01559\t0.01698\t0.05709\t0.01829\t0.12606\t0.04865\t0.11828\t0.01548\t0.02091\t0.01531\t0.08382\t0.01507\t0.14932\t0.01545\t0.00312\t0.18909\t0.00747\t0.00418\t0.00734\n+4\t0.01260\t0.00995\t0.01063\t0.00960\t0.01219\t0.01015\t0.00722\t0.11739\t0.14569\t0.02366\t0.11198\t0.04541\t0.31114\t0.12883\t0.01158\t0.00287\t0.00480\t0.01085\t0.00620\t0.00726\n+5\t0.16206\t0.01191\t0.01222\t0.01072\t0.01415\t0.01292\t0.00853\t0.17290\t0.12648\t0.02706\t0.03254\t0.03252\t0.22699\t0.01602\t0.10064\t0.00327\t0.00681\t0.00844\t0.00571\t0.00809\n+6\t0.01404\t0.01283\t0.02022\t0.02823\t0.43535\t0.01224\t0.01497\t0.01719\t0.01463\t0.02076\t0.02092\t0.15696\t0.06672\t0.00939\t0.00684\t0.00200\t0.00645\t0.00868\t0.00416\t0.12744\n+7\t0.13660\t0.06839\t0.39689\t0.15145\t0.02824\t0.01609\t0.01918\t0.02120\t0.06262\t0.02202\t0.01252\t0.01492\t0.00924\t0.00657\t0.00601\t0.00211\t0.00853\t0.00505\t0.00335\t0.00903\n+8\t0.01542\t0.01160\t0.01228\t0.01135\t0.01379\t0.11659\t0.00883\t0.01765\t0.01426\t0.14759\t0.02611\t0.02947\t0.12367\t0.03098\t0.38149\t0.00652\t0.01259\t0.00775\t0.00485\t0.00721\n+9\t0.13208\t0.14982\t0.01505\t0.01060\t0.01330\t0.01314\t0.00836\t0.11913\t0.01566\t0.02268\t0.02455\t0.39560\t0.02718\t0.01400\t0.00684\t0.00228\t0.00523\t0.01191\t0.00537\t0.00722\n+10\t0.01421\t0.01794\t0.13729\t0.02604\t0.17160\t0.01441\t0.32643\t0.01902\t0.01491\t0.02074\t0.01747\t0.15429\t0.01634\t0.00867\t0.00754\t0.00227\t0.00904\t0.00912\t0.00382\t0.00884\n+11\t0.01101\t0.00904\t0.01356\t0.01853\t0.22484\t0.00882\t0.01014\t0.01283\t0.01308\t0.01784\t0.02752\t0.38391\t0.04868\t0.15373\t0.01270\t0.00319\t0.00560\t0.01326\t0.00495\t0.00677\n+12\t0.01495\t0.02564\t0.38101\t0.12482\t0.02639\t0.12479\t0.01834\t0.02045\t0.01478\t0.02059\t0.01359\t0.01641\t0.01020\t0.00677\t0.00606\t0.00198\t0.00885\t0.00525\t0.15057\t0.00854\n+13\t0.16022\t0.01072\t0.01194\t0.00986\t0.01416\t0.00949\t0.00800\t0.01632\t0.01446\t0.02390\t0.12371\t0.02811\t0.02192\t0.00856\t0.00591\t0.00168\t0.00491\t0.10524\t0.00486\t0.41602\n+14\t0.01135\t0.00879\t0.00985\t0.00926\t0.01177\t0.00842\t0.00735\t0.11704\t0.01850\t0.02376\t0.17547\t0.05610\t0.38810\t0.01524\t0.00794\t0.00232\t0.00438\t0.11110\t0.00651\t0.00675\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t4981\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W00C1.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W01M6.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W01M6.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,938 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+2\t960\n+\n+[block]\n+# block no. 0 follows, 27 sequences, length 13\n+# corresponding to MSA columns:\n+# 1014-1026\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01262\t0.01087\t0.01456\t0.01804\t0.16280\t0.03739\t0.01076\t0.01544\t0.01737\t0.02369\t0.22838\t0.25888\t0.08833\t0.01527\t0.00842\t0.00245\t0.00546\t0.01367\t0.00630\t0.04933\n+1\t0.01079\t0.00774\t0.00962\t0.01010\t0.01099\t0.00778\t0.00687\t0.04609\t0.01419\t0.01896\t0.03396\t0.34556\t0.08237\t0.23100\t0.12397\t0.00548\t0.00767\t0.01500\t0.00579\t0.00605\n+2\t0.01021\t0.00785\t0.01037\t0.07592\t0.01458\t0.00755\t0.00802\t0.01307\t0.01821\t0.02466\t0.37453\t0.20534\t0.16831\t0.01688\t0.00879\t0.00253\t0.00432\t0.01488\t0.00721\t0.00678\n+3\t0.02351\t0.02383\t0.17162\t0.01763\t0.02437\t0.02092\t0.01664\t0.41236\t0.14635\t0.03880\t0.01905\t0.01912\t0.01371\t0.00871\t0.00737\t0.00231\t0.00838\t0.00673\t0.00650\t0.01210\n+4\t0.01632\t0.01408\t0.01473\t0.01343\t0.01725\t0.01576\t0.01040\t0.03307\t0.53258\t0.02862\t0.04018\t0.03739\t0.17049\t0.01201\t0.00782\t0.00252\t0.00541\t0.01001\t0.00741\t0.01054\n+5\t0.18242\t0.00831\t0.00902\t0.00995\t0.01149\t0.00841\t0.00703\t0.01291\t0.01411\t0.02223\t0.03732\t0.51271\t0.09946\t0.01922\t0.00833\t0.00281\t0.00457\t0.01681\t0.00638\t0.00650\n+6\t0.01806\t0.51489\t0.09322\t0.01221\t0.01796\t0.02327\t0.01240\t0.02126\t0.01525\t0.02029\t0.01368\t0.01575\t0.01162\t0.00693\t0.00507\t0.00169\t0.00723\t0.00476\t0.17539\t0.00908\n+7\t0.79154\t0.01436\t0.01091\t0.00976\t0.01436\t0.01665\t0.00804\t0.02182\t0.01263\t0.03331\t0.01034\t0.01206\t0.00804\t0.00689\t0.00459\t0.00230\t0.00574\t0.00402\t0.00459\t0.00804\n+8\t0.05711\t0.01551\t0.02179\t0.16978\t0.23525\t0.06675\t0.04143\t0.01938\t0.01472\t0.02040\t0.01517\t0.02452\t0.01418\t0.16977\t0.01555\t0.00346\t0.07551\t0.00734\t0.00380\t0.00859\n+9\t0.00947\t0.00696\t0.00891\t0.00991\t0.01099\t0.00641\t0.00702\t0.01142\t0.01617\t0.02153\t0.17973\t0.46148\t0.14583\t0.02079\t0.00927\t0.00282\t0.00420\t0.05361\t0.00715\t0.00631\n+10\t0.02042\t0.01485\t0.01677\t0.01442\t0.01826\t0.01620\t0.01132\t0.31095\t0.13266\t0.06408\t0.02634\t0.20007\t0.02421\t0.01704\t0.07313\t0.00338\t0.00783\t0.01073\t0.00707\t0.01028\n+11\t0.20133\t0.01302\t0.01583\t0.01244\t0.01793\t0.01218\t0.01027\t0.03300\t0.01934\t0.55065\t0.02509\t0.02234\t0.01609\t0.00868\t0.00683\t0.00230\t0.00619\t0.00670\t0.00817\t0.01162\n+12\t0.00954\t0.00685\t0.00888\t0.00981\t0.01063\t0.00638\t0.00670\t0.01134\t0.01584\t0.02148\t0.20988\t0.48307\t0.07693\t0.07257\t0.01130\t0.00312\t0.00429\t0.01816\t0.00705\t0.00618\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+4\t6\n+\n+[block]\n+# block no. 1 follows, 27 sequences, length 9\n+# corresponding to MSA columns:\n+# 1033-1041\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.12611\t0.02214\t0.15622\t0.06242\t0.14677\t0.06950\t0.12057\t0.06562\t0.04166\t0.06533\t0.01745\t0.01976\t0.03842\t0.00771\t0.00717\t0.00232\t0.00931\t0.00672\t0.00453\t0.01027\n+1\t0.01466\t0.01347\t0.08467\t0.02016\t0.18461\t0.01085\t0.01340\t0.01826\t0.01763\t0.08713\t0.18780\t0.18049\t0.08857\t0.01377\t0.00831\t0.00249\t0.00614\t0.03250\t0.00623\t0.00886\n+2\t0.01877\t0.01484\t0.04354\t0.13827\t0.12182\t0.03610\t0.10851\t0.02318\t0.03527\t0.16615\t0.07182\t0.08806\t0.05782\t0.01154\t0.02849\t0.00270\t0.00841\t0.00933\t0.00567\t0.00969\n+3\t0.01572\t0.00730\t0.01072\t0.01016\t0.01095\t0.00706\t0.00706\t0.01334\t0.01127\t0.10766\t0.01516\t0.02294\t0.01365\t0.02349\t0.02603\t0.67587\t0.00643\t0.00659\t0.00405\t0.00453\n+4\t0.02340\t0.10791\t0.05975\t0.01634\t0.02188\t0.07939\t0.01396\t0.30598\t0.23131\t0.03470\t0.02001\t0.01971\t0.01495\t0.00876\t0.00707\t0.00222\t0.00802\t0.00667\t0.00642\t0.01155\n+5\t0.00947\t0.00711\t0.00878\t0.00928\t0.01069\t0.00642\t0.00661\t0.01165\t0.01719\t0.02288\t0.26795\t0.33675\t0.21933\t0.01940\t0.00905\t0.00266\t0.00390\t0.01713\t0.00732\t0.00642\n+6\t0.01891\t0.14835\t0.24026\t0.11473\t0.02870\t0.07070\t0.04192\t0.05328\t0.04152\t0.07564\t0.01477\t0.01685\t0.01107\t0.00721\t0.00666\t0.00208\t0.00932\t0.00565\t0.00420\t0.08819\n+7\t0.01608\t0.01408\t0.01806\t0.01535\t0.01896\t0.01530\t0.10026\t0.02924\t0.40075\t0.02567\t0.02887\t0.03367\t0.05640\t0.17682\t0.01470\t0.00359\t0.00699\t0.00937\t0.00630'..b'1\t0.08430\t0.14408\t0.04693\t0.03572\t0.02265\t0.01339\t0.01647\t0.01074\t0.00726\t0.00806\t0.00221\t0.05576\t0.00614\t0.00371\t0.01031\n+8\t0.01352\t0.01207\t0.01530\t0.01402\t0.01462\t0.04600\t0.01080\t0.01505\t0.01184\t0.01675\t0.01670\t0.02885\t0.01715\t0.21971\t0.24646\t0.00702\t0.27556\t0.00803\t0.00384\t0.00670\n+9\t0.01796\t0.08543\t0.04565\t0.01963\t0.14123\t0.01476\t0.06125\t0.03980\t0.03922\t0.06228\t0.01481\t0.01699\t0.01182\t0.00634\t0.00629\t0.00164\t0.00716\t0.00548\t0.00452\t0.39775\n+10\t0.02660\t0.02288\t0.05477\t0.05963\t0.08978\t0.16634\t0.03695\t0.08593\t0.02157\t0.14900\t0.02143\t0.02562\t0.01722\t0.01587\t0.07760\t0.00401\t0.07231\t0.00788\t0.03253\t0.01208\n+11\t0.02055\t0.03609\t0.54247\t0.02413\t0.03409\t0.01910\t0.09894\t0.02672\t0.01877\t0.06322\t0.01878\t0.02283\t0.01442\t0.01006\t0.00912\t0.00317\t0.01203\t0.00740\t0.00512\t0.01301\n+12\t0.01678\t0.01288\t0.01582\t0.01608\t0.05237\t0.01327\t0.01090\t0.01891\t0.07753\t0.02247\t0.02780\t0.04078\t0.05993\t0.24534\t0.27700\t0.00817\t0.05834\t0.01034\t0.00609\t0.00921\n+13\t0.02248\t0.13167\t0.23480\t0.15981\t0.07092\t0.06550\t0.07086\t0.04790\t0.01953\t0.06228\t0.01833\t0.02301\t0.01472\t0.01014\t0.00881\t0.00304\t0.01126\t0.00734\t0.00535\t0.01225\n+14\t0.01641\t0.01597\t0.07950\t0.01520\t0.01754\t0.07963\t0.01161\t0.01733\t0.01837\t0.02441\t0.09848\t0.48363\t0.04475\t0.02119\t0.01058\t0.00353\t0.00739\t0.01756\t0.00766\t0.00927\n+15\t0.01469\t0.01100\t0.01348\t0.01417\t0.01512\t0.01057\t0.00980\t0.01490\t0.01732\t0.02400\t0.10443\t0.55148\t0.04881\t0.02326\t0.01250\t0.00372\t0.07479\t0.01923\t0.00798\t0.00875\n+16\t0.02213\t0.02277\t0.09375\t0.10330\t0.19299\t0.06997\t0.12504\t0.06113\t0.03797\t0.02753\t0.01967\t0.04927\t0.01692\t0.01127\t0.01104\t0.00322\t0.08184\t0.00863\t0.02942\t0.01214\n+17\t0.01269\t0.01003\t0.01436\t0.07007\t0.01835\t0.01026\t0.05384\t0.07635\t0.01731\t0.02277\t0.03618\t0.27359\t0.09943\t0.02073\t0.06097\t0.00358\t0.00743\t0.17847\t0.00622\t0.00738\n+18\t0.01373\t0.00874\t0.01223\t0.01321\t0.01519\t0.00866\t0.01123\t0.01686\t0.01680\t0.08836\t0.03658\t0.12083\t0.03848\t0.02295\t0.07678\t0.00409\t0.00784\t0.47330\t0.00680\t0.00733\n+19\t0.00983\t0.00759\t0.01111\t0.01151\t0.01254\t0.00710\t0.05531\t0.01139\t0.01427\t0.01892\t0.03911\t0.57796\t0.07857\t0.09260\t0.01219\t0.00336\t0.00517\t0.01888\t0.00642\t0.00619\n+20\t0.02553\t0.22426\t0.02698\t0.01830\t0.08763\t0.07340\t0.01416\t0.29037\t0.02468\t0.12128\t0.01639\t0.01688\t0.01221\t0.00791\t0.00662\t0.00203\t0.00831\t0.00588\t0.00583\t0.01137\n+21\t0.01740\t0.08900\t0.28763\t0.02164\t0.14121\t0.01681\t0.01925\t0.07422\t0.01824\t0.06948\t0.08363\t0.02456\t0.06679\t0.00902\t0.00773\t0.00228\t0.02865\t0.00731\t0.00474\t0.01042\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t7\n+\n+[block]\n+# block no. 23 follows, 27 sequences, length 7\n+# corresponding to MSA columns:\n+# 2719-2725\n+name=unknown_X\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01660\t0.04485\t0.08412\t0.05611\t0.12205\t0.03271\t0.20906\t0.06238\t0.01812\t0.02463\t0.05562\t0.02715\t0.08785\t0.00870\t0.00772\t0.00223\t0.00893\t0.02368\t0.00460\t0.10290\n+1\t0.01443\t0.01375\t0.02235\t0.59278\t0.04534\t0.01764\t0.01982\t0.01877\t0.01421\t0.01877\t0.01256\t0.01914\t0.00987\t0.00844\t0.01052\t0.00262\t0.14091\t0.00658\t0.00329\t0.00822\n+2\t0.01497\t0.01329\t0.01808\t0.01337\t0.01941\t0.01055\t0.08762\t0.01841\t0.01552\t0.02358\t0.01640\t0.09333\t0.01513\t0.00750\t0.00632\t0.00147\t0.00621\t0.00672\t0.00459\t0.60754\n+3\t0.01968\t0.01502\t0.01883\t0.01562\t0.01977\t0.01619\t0.08147\t0.10777\t0.33896\t0.09883\t0.02573\t0.02925\t0.02056\t0.14289\t0.01319\t0.00332\t0.00716\t0.00857\t0.00674\t0.01043\n+4\t0.02024\t0.01363\t0.01529\t0.01342\t0.01718\t0.01478\t0.01024\t0.03350\t0.41589\t0.17097\t0.02877\t0.03100\t0.02254\t0.14335\t0.01307\t0.00333\t0.00621\t0.00863\t0.00734\t0.01061\n+5\t0.01287\t0.01036\t0.01452\t0.04066\t0.09188\t0.01039\t0.03903\t0.04610\t0.05287\t0.02400\t0.22084\t0.12100\t0.08664\t0.15765\t0.03543\t0.00367\t0.00642\t0.01196\t0.00613\t0.00758\n+6\t0.30950\t0.01714\t0.09049\t0.02001\t0.14315\t0.01532\t0.08411\t0.02291\t0.01576\t0.10811\t0.02108\t0.02244\t0.08384\t0.00835\t0.00660\t0.00233\t0.00744\t0.00683\t0.00498\t0.00960\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t308\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W01M6.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W02B6.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W02B6.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,547 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+35\t2346\n+\n+[block]\n+# block no. 0 follows, 32 sequences, length 21\n+# corresponding to MSA columns:\n+# 2826-2846\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.04488\t0.13434\t0.18209\t0.01894\t0.12152\t0.08159\t0.04855\t0.08363\t0.03227\t0.03817\t0.01654\t0.02060\t0.04125\t0.01082\t0.06075\t0.00266\t0.00902\t0.03938\t0.00398\t0.00903\n+1\t0.03618\t0.00862\t0.01066\t0.00953\t0.01193\t0.00836\t0.00745\t0.01612\t0.01654\t0.16463\t0.25189\t0.07830\t0.25644\t0.01362\t0.00892\t0.00226\t0.07349\t0.01120\t0.00664\t0.00723\n+2\t0.01383\t0.01584\t0.09368\t0.02155\t0.14293\t0.04306\t0.19186\t0.01852\t0.04434\t0.02133\t0.10205\t0.07627\t0.08011\t0.01010\t0.00816\t0.00229\t0.03883\t0.06241\t0.00455\t0.00830\n+3\t0.06016\t0.11229\t0.16403\t0.12925\t0.12084\t0.04001\t0.08695\t0.02041\t0.01468\t0.07367\t0.03048\t0.04000\t0.01296\t0.00759\t0.00702\t0.00211\t0.03511\t0.02977\t0.00382\t0.00885\n+4\t0.01060\t0.00822\t0.01263\t0.09945\t0.01677\t0.00853\t0.05783\t0.01294\t0.01300\t0.04272\t0.02908\t0.25779\t0.09652\t0.06344\t0.20573\t0.00494\t0.00906\t0.03956\t0.00489\t0.00629\n+5\t0.01722\t0.00915\t0.01216\t0.01175\t0.05220\t0.00834\t0.00842\t0.04391\t0.01738\t0.27030\t0.16554\t0.20849\t0.12046\t0.01333\t0.00755\t0.00225\t0.00468\t0.01159\t0.00704\t0.00825\n+6\t0.08546\t0.05379\t0.07765\t0.09064\t0.15658\t0.11650\t0.09860\t0.10453\t0.03490\t0.06724\t0.01339\t0.01581\t0.01024\t0.00689\t0.00704\t0.00206\t0.03952\t0.00569\t0.00412\t0.00932\n+7\t0.01584\t0.01648\t0.14378\t0.05307\t0.11120\t0.03325\t0.04219\t0.09071\t0.06562\t0.08824\t0.04683\t0.12976\t0.04474\t0.03685\t0.04844\t0.00282\t0.00773\t0.00864\t0.00500\t0.00880\n+8\t0.30047\t0.01304\t0.01391\t0.01152\t0.01555\t0.01417\t0.00943\t0.12043\t0.05068\t0.22218\t0.04479\t0.02036\t0.05272\t0.00856\t0.00729\t0.00216\t0.07164\t0.00612\t0.00592\t0.00905\n+9\t0.00952\t0.00696\t0.00919\t0.04044\t0.01206\t0.00685\t0.00731\t0.04836\t0.01444\t0.01932\t0.08167\t0.61018\t0.04214\t0.01910\t0.00837\t0.00264\t0.00434\t0.04496\t0.00620\t0.00595\n+10\t0.01613\t0.09003\t0.06760\t0.08245\t0.12965\t0.08873\t0.06703\t0.01987\t0.03381\t0.06863\t0.09911\t0.06892\t0.01991\t0.00930\t0.00833\t0.00217\t0.08035\t0.03515\t0.00442\t0.00841\n+11\t0.01625\t0.01744\t0.11550\t0.09213\t0.31467\t0.01637\t0.04661\t0.04837\t0.01473\t0.05687\t0.01282\t0.01674\t0.01039\t0.00902\t0.03606\t0.00255\t0.15450\t0.00599\t0.00356\t0.00945\n+12\t0.00872\t0.00645\t0.00832\t0.00894\t0.00987\t0.00632\t0.00628\t0.01027\t0.01293\t0.01725\t0.08872\t0.34930\t0.14915\t0.10899\t0.17146\t0.00479\t0.00714\t0.01408\t0.00550\t0.00552\n+13\t0.02167\t0.15913\t0.09718\t0.01469\t0.01992\t0.16051\t0.01309\t0.16066\t0.14906\t0.11435\t0.01670\t0.01665\t0.01239\t0.00745\t0.00613\t0.00192\t0.00795\t0.00551\t0.00517\t0.00987\n+14\t0.04102\t0.01622\t0.09592\t0.04680\t0.04446\t0.01474\t0.07936\t0.12596\t0.15126\t0.20642\t0.02082\t0.06632\t0.01580\t0.00868\t0.00741\t0.00220\t0.03332\t0.00733\t0.00590\t0.01005\n+15\t0.21062\t0.02001\t0.15830\t0.13645\t0.08327\t0.08863\t0.14867\t0.02048\t0.01431\t0.02229\t0.01296\t0.01600\t0.02684\t0.00655\t0.00621\t0.00211\t0.00878\t0.00562\t0.00348\t0.00844\n+16\t0.01793\t0.03565\t0.08622\t0.04679\t0.08046\t0.01483\t0.01294\t0.27422\t0.02033\t0.06648\t0.01914\t0.11116\t0.01710\t0.04020\t0.10343\t0.00343\t0.00854\t0.02671\t0.00530\t0.00913\n+17\t0.11861\t0.05745\t0.08956\t0.01631\t0.04411\t0.20843\t0.05758\t0.17558\t0.03759\t0.02584\t0.01257\t0.01409\t0.00971\t0.00670\t0.00595\t0.00184\t0.00855\t0.00499\t0.00433\t0.10023\n+18\t0.16610\t0.03265\t0.04295\t0.04718\t0.11312\t0.03509\t0.01258\t0.12980\t0.01660\t0.08796\t0.01500\t0.01686\t0.03578\t0.00773\t0.00815\t0.00203\t0.11277\t0.00552\t0.00456\t0.10757\n+19\t0.05087\t0.03470\t0.01667\t0.03200\t0.01773\t0.03266\t0.04229\t0.15401\t0.03416\t0.11082\t0.01963\t0.09147\t0.04437\t0.03637\t0.00849\t0.00209\t0.05948\t0.00727\t0.00527\t0.19968\n+20\t0.01605\t0.01741\t0.01565\t0.07206\t0.01879\t0.28049\t0.03934\t0.01893\t0.03953\t0.01665\t0.01576\t0.05121\t0.01449\t0.05985\t0.28764\t0.00554\t0.01322\t0.00668\t0.00373\t0.00695\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+1\t4\n+\n+[block]\n+# block no. 1 follows, 32 sequences, length 25\n+# corresponding to MSA columns:\n+# 2851-2875\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\t'..b'016\t0.00584\t0.00768\t0.00223\t0.01074\t0.00755\t0.00346\t0.00912\n+25\t0.81159\t0.01298\t0.00986\t0.00882\t0.01298\t0.01505\t0.00727\t0.01972\t0.01142\t0.03010\t0.00934\t0.01090\t0.00727\t0.00623\t0.00415\t0.00208\t0.00519\t0.00363\t0.00415\t0.00727\n+26\t0.00959\t0.00719\t0.01078\t0.01078\t0.01198\t0.00839\t0.00839\t0.01198\t0.01078\t0.01558\t0.01797\t0.02636\t0.01677\t0.05032\t0.73760\t0.01078\t0.01797\t0.00719\t0.00359\t0.00599\n+27\t0.00959\t0.00719\t0.01078\t0.01078\t0.01198\t0.00839\t0.00839\t0.01198\t0.01078\t0.01558\t0.01797\t0.02636\t0.01677\t0.05032\t0.73760\t0.01078\t0.01797\t0.00719\t0.00359\t0.00599\n+28\t0.01239\t0.01144\t0.01909\t0.67485\t0.04285\t0.01411\t0.01769\t0.01665\t0.01352\t0.01733\t0.01432\t0.04882\t0.01210\t0.00798\t0.00694\t0.00231\t0.00859\t0.04842\t0.00330\t0.00730\n+29\t0.00920\t0.00677\t0.00861\t0.00831\t0.00988\t0.00618\t0.00617\t0.01204\t0.01807\t0.02509\t0.58722\t0.10627\t0.14184\t0.01468\t0.00797\t0.00218\t0.00325\t0.01291\t0.00716\t0.00618\n+30\t0.00960\t0.00715\t0.01058\t0.01058\t0.01171\t0.00828\t0.00813\t0.01185\t0.01072\t0.01543\t0.01816\t0.02739\t0.01722\t0.09223\t0.69630\t0.01053\t0.01730\t0.00734\t0.00362\t0.00588\n+31\t0.01267\t0.01193\t0.02013\t0.74806\t0.04621\t0.01491\t0.01863\t0.01714\t0.01342\t0.01714\t0.01193\t0.01789\t0.00894\t0.00671\t0.00671\t0.00224\t0.00894\t0.00596\t0.00298\t0.00745\n+32\t0.81159\t0.01298\t0.00986\t0.00882\t0.01298\t0.01505\t0.00727\t0.01972\t0.01142\t0.03010\t0.00934\t0.01090\t0.00727\t0.00623\t0.00415\t0.00208\t0.00519\t0.00363\t0.00415\t0.00727\n+33\t0.01846\t0.67758\t0.03366\t0.01310\t0.04862\t0.02564\t0.01198\t0.07222\t0.01508\t0.01809\t0.00999\t0.01143\t0.00891\t0.00593\t0.00459\t0.00150\t0.00723\t0.00388\t0.00318\t0.00891\n+34\t0.60982\t0.01785\t0.01221\t0.01099\t0.01497\t0.20032\t0.00873\t0.02154\t0.01337\t0.02659\t0.00961\t0.01121\t0.00762\t0.00640\t0.00464\t0.00199\t0.00696\t0.00381\t0.00397\t0.00740\n+35\t0.01709\t0.01413\t0.01514\t0.01328\t0.01703\t0.01603\t0.01041\t0.12845\t0.52909\t0.02997\t0.10922\t0.02678\t0.02435\t0.00951\t0.00694\t0.00222\t0.00535\t0.00791\t0.00688\t0.01022\n+36\t0.01251\t0.00625\t0.00625\t0.00625\t0.00782\t0.00625\t0.00469\t0.01563\t0.01407\t0.02502\t0.02189\t0.02502\t0.01720\t0.00782\t0.00469\t0.00156\t0.00313\t0.00625\t0.80144\t0.00625\n+37\t0.81159\t0.01298\t0.00986\t0.00882\t0.01298\t0.01505\t0.00727\t0.01972\t0.01142\t0.03010\t0.00934\t0.01090\t0.00727\t0.00623\t0.00415\t0.00208\t0.00519\t0.00363\t0.00415\t0.00727\n+38\t0.00912\t0.00666\t0.00858\t0.00849\t0.00989\t0.00611\t0.00622\t0.01179\t0.01753\t0.02436\t0.53808\t0.18741\t0.10998\t0.01537\t0.00804\t0.00224\t0.00332\t0.01362\t0.00708\t0.00611\n+39\t0.02542\t0.02821\t0.01906\t0.01663\t0.02056\t0.55288\t0.01276\t0.16403\t0.02157\t0.05944\t0.01239\t0.01349\t0.00963\t0.00722\t0.00622\t0.00181\t0.01080\t0.00480\t0.00438\t0.00871\n+40\t0.01564\t0.02116\t0.21118\t0.04592\t0.07397\t0.01595\t0.35222\t0.02282\t0.08294\t0.04740\t0.01547\t0.01939\t0.01174\t0.00667\t0.00729\t0.00223\t0.00975\t0.02496\t0.00382\t0.00948\n+41\t0.01281\t0.03680\t0.01288\t0.01270\t0.01495\t0.01047\t0.01093\t0.06006\t0.11342\t0.02243\t0.03222\t0.06254\t0.03330\t0.01610\t0.00859\t0.00285\t0.00617\t0.51737\t0.00618\t0.00721\n+42\t0.02331\t0.01074\t0.01411\t0.01094\t0.01567\t0.00907\t0.00887\t0.02608\t0.01810\t0.46475\t0.14187\t0.02570\t0.02324\t0.00856\t0.00659\t0.00186\t0.00513\t0.00711\t0.00727\t0.17105\n+43\t0.02338\t0.01774\t0.01894\t0.01501\t0.02000\t0.01982\t0.01224\t0.54003\t0.19493\t0.03886\t0.01881\t0.01826\t0.01359\t0.00831\t0.00674\t0.00208\t0.00688\t0.00641\t0.00674\t0.01122\n+44\t0.02496\t0.01852\t0.01983\t0.01533\t0.02060\t0.02055\t0.01262\t0.65842\t0.07399\t0.04140\t0.01681\t0.01667\t0.01198\t0.00812\t0.00672\t0.00203\t0.00725\t0.00614\t0.00672\t0.01136\n+45\t0.02995\t0.01167\t0.01573\t0.01206\t0.01725\t0.01023\t0.00996\t0.05541\t0.01962\t0.70368\t0.02612\t0.02261\t0.01643\t0.00830\t0.00675\t0.00207\t0.00577\t0.00672\t0.00825\t0.01142\n+46\t0.00875\t0.00673\t0.00800\t0.00790\t0.00962\t0.00598\t0.00584\t0.01114\t0.01692\t0.02249\t0.39559\t0.12889\t0.31642\t0.01574\t0.00799\t0.00223\t0.00333\t0.01364\t0.00682\t0.00598\n+47\t0.00887\t0.00653\t0.00831\t0.00852\t0.00981\t0.00596\t0.00614\t0.01121\t0.01655\t0.02265\t0.41661\t0.27844\t0.14262\t0.01647\t0.00812\t0.00233\t0.00343\t0.01461\t0.00687\t0.00596\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t3\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W02B6.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W02CW.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W02CW.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,544 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t160\n+\n+[block]\n+# block no. 0 follows, 29 sequences, length 16\n+# corresponding to MSA columns:\n+# 207-222\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.02504\t0.01956\t0.02001\t0.01612\t0.02114\t0.07615\t0.01329\t0.54430\t0.03024\t0.03968\t0.01924\t0.02483\t0.01556\t0.00987\t0.00741\t0.00226\t0.00807\t0.08936\t0.00678\t0.01109\n+1\t0.01449\t0.08837\t0.62806\t0.01934\t0.02909\t0.01698\t0.02453\t0.02207\t0.01506\t0.02206\t0.01381\t0.01802\t0.01062\t0.00736\t0.00676\t0.00225\t0.01011\t0.03761\t0.00319\t0.01022\n+2\t0.01904\t0.75404\t0.03731\t0.01218\t0.01828\t0.02818\t0.01218\t0.02132\t0.01447\t0.01675\t0.00990\t0.01142\t0.00914\t0.00609\t0.00457\t0.00152\t0.00761\t0.00381\t0.00305\t0.00914\n+3\t0.00868\t0.00620\t0.00826\t0.00991\t0.01033\t0.00578\t0.00661\t0.00991\t0.01363\t0.01818\t0.03925\t0.74510\t0.04710\t0.02231\t0.00909\t0.00289\t0.00413\t0.02024\t0.00661\t0.00578\n+4\t0.00868\t0.00620\t0.00826\t0.00991\t0.01033\t0.00578\t0.00661\t0.00991\t0.01363\t0.01818\t0.03925\t0.74510\t0.04710\t0.02231\t0.00909\t0.00289\t0.00413\t0.02024\t0.00661\t0.00578\n+5\t0.01681\t0.01921\t0.04202\t0.03001\t0.03721\t0.01801\t0.67947\t0.02281\t0.01681\t0.02281\t0.01441\t0.01921\t0.01080\t0.00600\t0.00840\t0.00240\t0.01200\t0.00840\t0.00360\t0.00960\n+6\t0.01696\t0.01259\t0.01499\t0.01082\t0.01704\t0.00962\t0.00870\t0.02007\t0.01548\t0.11090\t0.01463\t0.01597\t0.01145\t0.00573\t0.00551\t0.00120\t0.00537\t0.00459\t0.00481\t0.69357\n+7\t0.80005\t0.01377\t0.01047\t0.00936\t0.01377\t0.01597\t0.00771\t0.02093\t0.01212\t0.03195\t0.00991\t0.01157\t0.00771\t0.00661\t0.00441\t0.00220\t0.00551\t0.00386\t0.00441\t0.00771\n+8\t0.01558\t0.01558\t0.02181\t0.01869\t0.01869\t0.02181\t0.01558\t0.01714\t0.01091\t0.01714\t0.00935\t0.01558\t0.00935\t0.01246\t0.02337\t0.00312\t0.73672\t0.00623\t0.00312\t0.00779\n+9\t0.01008\t0.00728\t0.00952\t0.00896\t0.01064\t0.00672\t0.00672\t0.01344\t0.02016\t0.02855\t0.70158\t0.05319\t0.06719\t0.01456\t0.00840\t0.00224\t0.00336\t0.01288\t0.00784\t0.00672\n+10\t0.01008\t0.00728\t0.00952\t0.00896\t0.01064\t0.00672\t0.00672\t0.01344\t0.02016\t0.02855\t0.70158\t0.05319\t0.06719\t0.01456\t0.00840\t0.00224\t0.00336\t0.01288\t0.00784\t0.00672\n+11\t0.01762\t0.01692\t0.02890\t0.04371\t0.70533\t0.01692\t0.02185\t0.02185\t0.01621\t0.02326\t0.01339\t0.01762\t0.01128\t0.00634\t0.00705\t0.00211\t0.00846\t0.00634\t0.00352\t0.01128\n+12\t0.01428\t0.03683\t0.71286\t0.02030\t0.03082\t0.01654\t0.02631\t0.02255\t0.01503\t0.02255\t0.01278\t0.01503\t0.00902\t0.00677\t0.00677\t0.00226\t0.01052\t0.00526\t0.00301\t0.01052\n+13\t0.01345\t0.01266\t0.02136\t0.73264\t0.04904\t0.01582\t0.01978\t0.01819\t0.01424\t0.01819\t0.01266\t0.01898\t0.00949\t0.00712\t0.00712\t0.00237\t0.00949\t0.00633\t0.00316\t0.00791\n+14\t0.01237\t0.00618\t0.00928\t0.00928\t0.00928\t0.00618\t0.00618\t0.00928\t0.00928\t0.01237\t0.01237\t0.02165\t0.01237\t0.02474\t0.02783\t0.79283\t0.00618\t0.00618\t0.00309\t0.00309\n+15\t0.01729\t0.01658\t0.02830\t0.09873\t0.65291\t0.01683\t0.02169\t0.02156\t0.01606\t0.02286\t0.01334\t0.01773\t0.01114\t0.00641\t0.00706\t0.00214\t0.00854\t0.00634\t0.00350\t0.01101\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t9\n+\n+[block]\n+# block no. 1 follows, 29 sequences, length 54\n+# corresponding to MSA columns:\n+# 232-285\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01008\t0.00728\t0.00952\t0.00896\t0.01064\t0.00672\t0.00672\t0.01344\t0.02016\t0.02855\t0.70158\t0.05319\t0.06719\t0.01456\t0.00840\t0.00224\t0.00336\t0.01288\t0.00784\t0.00672\n+1\t0.00987\t0.00723\t0.00929\t0.00915\t0.01078\t0.00666\t0.00690\t0.01286\t0.01887\t0.02611\t0.52869\t0.12395\t0.12780\t0.01601\t0.00856\t0.00239\t0.00367\t0.05715\t0.00751\t0.00655\n+2\t0.01524\t0.01448\t0.02459\t0.43724\t0.33045\t0.01629\t0.02067\t0.01976\t0.01509\t0.02037\t0.01297\t0.01840\t0.01026\t0.00679\t0.00709\t0.00226\t0.00905\t0.00634\t0.00332\t0.00935\n+3\t0.01742\t0.01671\t0.02854\t0.07709\t0.67353\t0.01687\t0.02175\t0.02168\t0.01612\t0.02302\t0.01336\t0.01769\t0.01119\t0.00638\t0.00705\t0.00213\t0.00851\t0.00634\t0.00351\t0.01112\n+4\t0.00842\t0.00721\t0.00721\t0.00721\t0.00962\t0.00601\t0.00541\t0.01022\t0.01623\t0.01924\t0.07213\t0.06853\t0.70244\t0.01803\t0.00842\t0.00240\t0.00361\t0.01503\t0.00661'..b'01646\t0.00961\t0.00961\t0.02987\t0.02033\t0.55522\t0.18126\t0.03082\t0.02890\t0.01012\t0.00744\t0.00221\t0.00545\t0.00846\t0.00859\t0.01089\n+6\t0.02707\t0.01995\t0.02137\t0.01638\t0.02208\t0.02208\t0.01353\t0.68159\t0.03348\t0.04488\t0.01710\t0.01710\t0.01211\t0.00855\t0.00712\t0.00214\t0.00784\t0.00641\t0.00712\t0.01211\n+7\t0.01551\t0.01713\t0.03662\t0.02680\t0.03291\t0.01605\t0.57186\t0.02075\t0.01630\t0.02207\t0.01838\t0.13530\t0.01661\t0.00861\t0.00851\t0.00248\t0.01075\t0.01030\t0.00408\t0.00899\n+8\t0.01237\t0.00618\t0.00928\t0.00928\t0.00928\t0.00618\t0.00618\t0.00928\t0.00928\t0.01237\t0.01237\t0.02165\t0.01237\t0.02474\t0.02783\t0.79283\t0.00618\t0.00618\t0.00309\t0.00309\n+9\t0.01762\t0.01692\t0.02890\t0.04371\t0.70533\t0.01692\t0.02185\t0.02185\t0.01621\t0.02326\t0.01339\t0.01762\t0.01128\t0.00634\t0.00705\t0.00211\t0.00846\t0.00634\t0.00352\t0.01128\n+10\t0.02707\t0.01995\t0.02137\t0.01638\t0.02208\t0.02208\t0.01353\t0.68159\t0.03348\t0.04488\t0.01710\t0.01710\t0.01211\t0.00855\t0.00712\t0.00214\t0.00784\t0.00641\t0.00712\t0.01211\n+11\t0.01681\t0.01921\t0.04202\t0.03001\t0.03721\t0.01801\t0.67947\t0.02281\t0.01681\t0.02281\t0.01441\t0.01921\t0.01080\t0.00600\t0.00840\t0.00240\t0.01200\t0.00840\t0.00360\t0.00960\n+12\t0.01036\t0.00690\t0.00777\t0.00777\t0.00777\t0.00690\t0.00431\t0.01036\t0.01036\t0.01381\t0.02244\t0.04660\t0.02589\t0.74975\t0.03624\t0.00690\t0.00690\t0.01036\t0.00431\t0.00431\n+13\t0.01904\t0.75404\t0.03731\t0.01218\t0.01828\t0.02818\t0.01218\t0.02132\t0.01447\t0.01675\t0.00990\t0.01142\t0.00914\t0.00609\t0.00457\t0.00152\t0.00761\t0.00381\t0.00305\t0.00914\n+14\t0.01904\t0.75404\t0.03731\t0.01218\t0.01828\t0.02818\t0.01218\t0.02132\t0.01447\t0.01675\t0.00990\t0.01142\t0.00914\t0.00609\t0.00457\t0.00152\t0.00761\t0.00381\t0.00305\t0.00914\n+15\t0.02707\t0.01995\t0.02137\t0.01638\t0.02208\t0.02208\t0.01353\t0.68159\t0.03348\t0.04488\t0.01710\t0.01710\t0.01211\t0.00855\t0.00712\t0.00214\t0.00784\t0.00641\t0.00712\t0.01211\n+16\t0.01472\t0.10324\t0.65031\t0.01954\t0.02966\t0.01761\t0.02500\t0.02244\t0.01498\t0.02201\t0.01251\t0.01470\t0.00903\t0.00670\t0.00656\t0.00219\t0.01025\t0.00513\t0.00301\t0.01040\n+17\t0.01552\t0.22313\t0.53738\t0.01819\t0.02756\t0.01956\t0.02264\t0.02223\t0.01489\t0.02104\t0.01203\t0.01410\t0.00905\t0.00659\t0.00619\t0.00206\t0.00977\t0.00488\t0.00302\t0.01016\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t1\n+\n+[block]\n+# block no. 10 follows, 29 sequences, length 9\n+# corresponding to MSA columns:\n+# 1173-1181\n+name=unknown_K\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01771\t0.01530\t0.01610\t0.01449\t0.01852\t0.01771\t0.01127\t0.03784\t0.69247\t0.02979\t0.02898\t0.02657\t0.02174\t0.00966\t0.00725\t0.00242\t0.00564\t0.00805\t0.00725\t0.01127\n+1\t0.01904\t0.75404\t0.03731\t0.01218\t0.01828\t0.02818\t0.01218\t0.02132\t0.01447\t0.01675\t0.00990\t0.01142\t0.00914\t0.00609\t0.00457\t0.00152\t0.00761\t0.00381\t0.00305\t0.00914\n+2\t0.14537\t0.03084\t0.01869\t0.01697\t0.02075\t0.61287\t0.01283\t0.02728\t0.01894\t0.01966\t0.01084\t0.01265\t0.00895\t0.00723\t0.00611\t0.00189\t0.01172\t0.00447\t0.00378\t0.00817\n+3\t0.01342\t0.03213\t0.60466\t0.01870\t0.02767\t0.01489\t0.02328\t0.02061\t0.01482\t0.02188\t0.01684\t0.12714\t0.01487\t0.00915\t0.00712\t0.00235\t0.00954\t0.00756\t0.00356\t0.00980\n+4\t0.01237\t0.00618\t0.00928\t0.00928\t0.00928\t0.00618\t0.00618\t0.00928\t0.00928\t0.01237\t0.01237\t0.02165\t0.01237\t0.02474\t0.02783\t0.79283\t0.00618\t0.00618\t0.00309\t0.00309\n+5\t0.01838\t0.01857\t0.02748\t0.08164\t0.58994\t0.09575\t0.02082\t0.02237\t0.01654\t0.02231\t0.01308\t0.01717\t0.01094\t0.00650\t0.00698\t0.00210\t0.00901\t0.00615\t0.00352\t0.01074\n+6\t0.42985\t0.01475\t0.01969\t0.09547\t0.02366\t0.01565\t0.16637\t0.02143\t0.01404\t0.05767\t0.01231\t0.01501\t0.00931\t0.00651\t0.00584\t0.00217\t0.00748\t0.00537\t0.00426\t0.07316\n+7\t0.01428\t0.03683\t0.71286\t0.02030\t0.03082\t0.01654\t0.02631\t0.02255\t0.01503\t0.02255\t0.01278\t0.01503\t0.00902\t0.00677\t0.00677\t0.00226\t0.01052\t0.00526\t0.00301\t0.01052\n+8\t0.05407\t0.02350\t0.02495\t0.01979\t0.02462\t0.28921\t0.18632\t0.07805\t0.01847\t0.02248\t0.01243\t0.01531\t0.00998\t0.00723\t0.00827\t0.00203\t0.07589\t0.00580\t0.00399\t0.11760\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+7\t701\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W02CW.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W04UC.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W04UC.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,491 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t186\n+\n+[block]\n+# block no. 0 follows, 39 sequences, length 75\n+# corresponding to MSA columns:\n+# 186-260\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.00837\t0.00604\t0.00790\t0.00744\t0.00883\t0.00558\t0.00558\t0.01116\t0.01674\t0.02371\t0.75216\t0.04417\t0.05580\t0.01209\t0.00697\t0.00186\t0.00279\t0.01069\t0.00651\t0.00558\n+1\t0.02139\t0.01412\t0.01577\t0.01231\t0.01646\t0.01518\t0.01000\t0.52412\t0.02357\t0.15588\t0.01618\t0.01765\t0.01199\t0.07475\t0.04069\t0.00245\t0.00659\t0.00575\t0.00584\t0.00931\n+2\t0.00845\t0.00634\t0.00950\t0.00950\t0.01056\t0.00739\t0.00739\t0.01056\t0.00950\t0.01373\t0.01584\t0.02323\t0.01478\t0.04435\t0.76873\t0.00950\t0.01584\t0.00634\t0.00317\t0.00528\n+3\t0.01052\t0.00620\t0.00723\t0.00689\t0.00737\t0.00605\t0.00413\t0.01076\t0.00949\t0.09143\t0.01914\t0.03671\t0.02077\t0.70825\t0.02752\t0.00532\t0.00566\t0.00832\t0.00398\t0.00428\n+4\t0.00848\t0.00621\t0.00885\t0.00885\t0.00967\t0.00703\t0.00657\t0.01014\t0.00931\t0.01324\t0.01644\t0.02657\t0.01623\t0.20554\t0.60952\t0.00869\t0.01366\t0.00682\t0.00326\t0.00491\n+5\t0.01999\t0.10518\t0.01781\t0.01383\t0.01719\t0.50346\t0.03636\t0.09555\t0.01684\t0.01775\t0.01075\t0.01231\t0.00872\t0.00613\t0.00516\t0.00152\t0.00890\t0.00419\t0.09117\t0.00716\n+6\t0.10193\t0.01066\t0.01231\t0.00916\t0.01394\t0.00900\t0.00741\t0.01687\t0.01247\t0.11221\t0.01175\t0.01299\t0.00920\t0.00512\t0.00514\t0.00117\t0.03782\t0.00385\t0.00396\t0.60304\n+7\t0.01550\t0.66974\t0.12633\t0.01117\t0.01665\t0.04702\t0.01170\t0.01804\t0.01224\t0.01456\t0.00857\t0.00992\t0.00758\t0.00517\t0.00409\t0.00135\t0.00679\t0.00334\t0.00254\t0.00772\n+8\t0.00837\t0.00604\t0.00790\t0.00744\t0.00883\t0.00558\t0.00558\t0.01116\t0.01674\t0.02371\t0.75216\t0.04417\t0.05580\t0.01209\t0.00697\t0.00186\t0.00279\t0.01069\t0.00651\t0.00558\n+9\t0.83394\t0.01144\t0.00869\t0.00778\t0.01144\t0.01327\t0.00640\t0.01738\t0.01006\t0.02653\t0.00823\t0.00961\t0.00640\t0.00549\t0.00366\t0.00183\t0.00457\t0.00320\t0.00366\t0.00640\n+10\t0.02209\t0.02819\t0.01676\t0.01524\t0.01828\t0.76843\t0.01143\t0.02361\t0.01676\t0.01447\t0.00914\t0.01066\t0.00762\t0.00609\t0.00533\t0.00152\t0.01066\t0.00381\t0.00305\t0.00686\n+11\t0.00860\t0.00573\t0.00645\t0.00645\t0.00645\t0.00573\t0.00358\t0.00860\t0.00860\t0.01147\t0.01863\t0.03870\t0.02150\t0.79217\t0.03010\t0.00573\t0.00573\t0.00860\t0.00358\t0.00358\n+12\t0.01294\t0.01294\t0.01811\t0.01553\t0.01553\t0.01811\t0.01294\t0.01423\t0.00906\t0.01423\t0.00776\t0.01294\t0.00776\t0.01035\t0.01941\t0.00259\t0.78134\t0.00518\t0.00259\t0.00647\n+13\t0.00845\t0.00634\t0.00950\t0.00950\t0.01056\t0.00739\t0.00739\t0.01056\t0.00950\t0.01373\t0.01584\t0.02323\t0.01478\t0.04435\t0.76873\t0.00950\t0.01584\t0.00634\t0.00317\t0.00528\n+14\t0.83394\t0.01144\t0.00869\t0.00778\t0.01144\t0.01327\t0.00640\t0.01738\t0.01006\t0.02653\t0.00823\t0.00961\t0.00640\t0.00549\t0.00366\t0.00183\t0.00457\t0.00320\t0.00366\t0.00640\n+15\t0.01367\t0.01055\t0.01238\t0.00919\t0.01409\t0.00853\t0.00734\t0.01759\t0.08146\t0.08653\t0.03373\t0.01478\t0.01148\t0.00520\t0.00475\t0.00110\t0.00442\t0.00422\t0.00417\t0.65481\n+16\t0.81340\t0.01129\t0.00861\t0.00772\t0.01132\t0.01307\t0.00635\t0.01729\t0.01012\t0.02642\t0.00851\t0.00992\t0.00662\t0.00552\t0.00367\t0.00182\t0.00453\t0.00326\t0.02416\t0.00638\n+17\t0.01294\t0.01294\t0.01811\t0.01553\t0.01553\t0.01811\t0.01294\t0.01423\t0.00906\t0.01423\t0.00776\t0.01294\t0.00776\t0.01035\t0.01941\t0.00259\t0.78134\t0.00518\t0.00259\t0.00647\n+18\t0.01226\t0.01051\t0.01226\t0.00876\t0.01401\t0.00788\t0.00701\t0.01489\t0.01226\t0.01927\t0.01051\t0.01226\t0.00876\t0.00438\t0.00438\t0.00088\t0.00438\t0.00350\t0.00350\t0.82832\n+19\t0.00953\t0.00681\t0.00953\t0.01089\t0.01225\t0.00681\t0.00953\t0.01225\t0.01361\t0.01770\t0.03131\t0.06671\t0.03403\t0.01634\t0.00817\t0.00272\t0.00545\t0.71547\t0.00545\t0.00545\n+20\t0.01464\t0.01405\t0.02400\t0.03630\t0.75528\t0.01405\t0.01815\t0.01815\t0.01347\t0.01932\t0.01112\t0.01464\t0.00937\t0.00527\t0.00585\t0.00176\t0.00703\t0.00527\t0.00293\t0.00937\n+21\t0.01226\t0.01051\t0.01226\t0.00876\t0.01401\t0.00788\t0.00701\t0.01489\t0.01226\t0.01927\t0.01051\t0.01226\t0.00876\t0.00438\t0.00438\t0.00088\t0.00438\t0.00350\t0.00350\t0.82832\n+22\t0.01307\t0.01334\t0.02034\t0.01678\t0.01757\t0.01769\t0.10876\t0.01486\t0.00971\t0.01486\t0.00832\t0'..b'01346\t0.00801\t0.08378\t0.01541\t0.04654\t0.13383\t0.09821\t0.04324\t0.23075\t0.01184\t0.00722\t0.00209\t0.02290\t0.18362\t0.00544\t0.04993\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t1\n+\n+[block]\n+# block no. 4 follows, 39 sequences, length 21\n+# corresponding to MSA columns:\n+# 594-614\n+name=unknown_E\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01386\t0.04719\t0.04956\t0.02101\t0.04969\t0.01413\t0.49127\t0.01898\t0.05735\t0.03678\t0.05888\t0.01747\t0.01245\t0.00579\t0.00683\t0.00189\t0.02742\t0.00662\t0.00348\t0.05935\n+1\t0.01594\t0.08285\t0.15448\t0.08086\t0.02287\t0.01293\t0.21191\t0.03551\t0.02797\t0.18848\t0.01684\t0.04818\t0.03750\t0.02889\t0.00677\t0.00199\t0.00733\t0.00638\t0.00415\t0.00816\n+2\t0.01350\t0.43535\t0.29835\t0.01242\t0.01837\t0.01800\t0.01399\t0.01715\t0.01212\t0.01581\t0.01150\t0.08730\t0.01066\t0.00659\t0.00484\t0.00160\t0.00693\t0.00495\t0.00281\t0.00774\n+3\t0.01232\t0.04691\t0.46276\t0.01405\t0.02036\t0.01243\t0.01621\t0.01927\t0.11757\t0.05457\t0.01860\t0.08858\t0.05901\t0.00802\t0.00595\t0.00195\t0.00699\t0.02250\t0.00376\t0.00819\n+4\t0.01581\t0.79572\t0.03099\t0.01012\t0.01518\t0.02340\t0.01012\t0.01771\t0.01202\t0.01391\t0.00822\t0.00949\t0.00759\t0.00506\t0.00379\t0.00126\t0.00632\t0.00316\t0.00253\t0.00759\n+5\t0.01449\t0.01334\t0.02057\t0.15591\t0.48183\t0.04885\t0.01593\t0.04471\t0.01386\t0.04296\t0.01332\t0.06776\t0.01176\t0.00668\t0.00601\t0.00185\t0.00698\t0.02139\t0.00337\t0.00844\n+6\t0.00961\t0.00801\t0.01154\t0.15249\t0.03484\t0.00842\t0.04172\t0.01293\t0.05812\t0.01710\t0.04600\t0.20057\t0.16220\t0.01270\t0.00721\t0.00220\t0.02250\t0.14725\t0.03867\t0.00591\n+7\t0.00810\t0.00603\t0.00753\t0.00716\t0.00867\t0.00547\t0.00537\t0.01064\t0.01611\t0.02221\t0.61793\t0.04664\t0.19096\t0.01265\t0.00698\t0.00189\t0.00283\t0.01104\t0.00631\t0.00547\n+8\t0.01226\t0.10705\t0.68852\t0.01618\t0.02455\t0.01470\t0.02068\t0.01863\t0.01244\t0.01825\t0.01037\t0.01219\t0.00750\t0.00556\t0.00544\t0.00181\t0.00850\t0.00425\t0.00250\t0.00862\n+9\t0.01574\t0.01091\t0.01374\t0.01163\t0.07766\t0.00891\t0.00844\t0.04089\t0.01382\t0.17310\t0.01333\t0.01416\t0.01007\t0.00515\t0.00488\t0.00118\t0.00481\t0.00422\t0.00432\t0.56303\n+10\t0.05239\t0.01350\t0.01726\t0.02017\t0.28855\t0.09039\t0.01210\t0.02170\t0.03813\t0.24141\t0.03905\t0.01658\t0.01237\t0.00618\t0.00560\t0.00166\t0.00618\t0.00525\t0.00457\t0.10696\n+11\t0.02167\t0.02698\t0.01655\t0.01502\t0.01807\t0.71240\t0.01135\t0.05116\t0.01708\t0.01548\t0.01011\t0.01276\t0.00864\t0.00649\t0.00545\t0.00158\t0.01032\t0.02871\t0.00324\t0.00693\n+12\t0.01186\t0.03059\t0.76153\t0.01686\t0.02560\t0.01373\t0.02185\t0.01873\t0.01249\t0.01873\t0.01061\t0.01249\t0.00749\t0.00562\t0.00562\t0.00187\t0.00874\t0.00437\t0.00250\t0.00874\n+13\t0.00857\t0.00586\t0.00709\t0.00709\t0.00731\t0.00608\t0.00438\t0.00901\t0.00879\t0.01194\t0.01805\t0.03546\t0.02009\t0.63556\t0.18478\t0.00652\t0.00785\t0.00813\t0.00350\t0.00394\n+14\t0.00848\t0.00623\t0.00895\t0.00895\t0.00982\t0.00709\t0.00670\t0.01021\t0.00934\t0.01332\t0.01635\t0.02604\t0.01600\t0.17986\t0.63489\t0.00882\t0.01401\t0.00675\t0.00324\t0.00497\n+15\t0.03991\t0.43951\t0.06160\t0.01247\t0.01744\t0.10014\t0.05930\t0.12803\t0.01530\t0.06143\t0.01047\t0.01152\t0.00843\t0.00564\t0.00470\t0.00150\t0.00706\t0.00404\t0.00344\t0.00808\n+16\t0.70509\t0.13495\t0.01220\t0.00815\t0.01203\t0.01486\t0.00699\t0.01743\t0.01037\t0.02455\t0.00823\t0.00959\t0.00659\t0.00542\t0.00368\t0.00174\t0.00485\t0.00320\t0.00348\t0.00659\n+17\t0.01538\t0.52007\t0.24277\t0.01211\t0.01821\t0.01960\t0.01344\t0.01875\t0.01248\t0.06526\t0.00993\t0.01107\t0.00803\t0.00537\t0.00447\t0.00148\t0.00694\t0.00370\t0.00284\t0.00809\n+18\t0.01569\t0.01697\t0.06292\t0.06089\t0.47851\t0.12492\t0.09596\t0.01923\t0.01398\t0.03836\t0.01120\t0.01428\t0.00905\t0.00546\t0.00589\t0.00177\t0.00796\t0.00521\t0.00304\t0.00871\n+19\t0.01523\t0.74276\t0.02937\t0.00999\t0.01474\t0.02215\t0.00981\t0.01707\t0.01197\t0.01399\t0.00985\t0.06166\t0.00970\t0.00596\t0.00405\t0.00134\t0.00613\t0.00408\t0.00273\t0.00740\n+20\t0.01689\t0.02031\t0.02771\t0.02107\t0.02578\t0.28989\t0.44583\t0.02049\t0.01481\t0.01715\t0.01079\t0.01392\t0.00844\t0.00557\t0.00680\t0.00184\t0.03642\t0.00576\t0.00300\t0.00752\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t57\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W04UC.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W06CL.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W06CL.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,521 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t7\n+\n+[block]\n+# block no. 0 follows, 35 sequences, length 11\n+# corresponding to MSA columns:\n+# 7-17\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01022\t0.00730\t0.01022\t0.01168\t0.01314\t0.00730\t0.01022\t0.01314\t0.01460\t0.01899\t0.03359\t0.07156\t0.03651\t0.01752\t0.00876\t0.00292\t0.00584\t0.69478\t0.00584\t0.00584\n+1\t0.00761\t0.00630\t0.00656\t0.00674\t0.00857\t0.00537\t0.00490\t0.00908\t0.01393\t0.01680\t0.05862\t0.14688\t0.61711\t0.05219\t0.00873\t0.00238\t0.00341\t0.01376\t0.00579\t0.00526\n+2\t0.01372\t0.10227\t0.63944\t0.01722\t0.02600\t0.01597\t0.02166\t0.05646\t0.01421\t0.02065\t0.01135\t0.01319\t0.00819\t0.00605\t0.00586\t0.00194\t0.00901\t0.00462\t0.00287\t0.00933\n+3\t0.00910\t0.00666\t0.00727\t0.00711\t0.00923\t0.00567\t0.00533\t0.01086\t0.01488\t0.06758\t0.12618\t0.11345\t0.56318\t0.01550\t0.00747\t0.00215\t0.00338\t0.01309\t0.00613\t0.00578\n+4\t0.01699\t0.03773\t0.01751\t0.06292\t0.10823\t0.06115\t0.02803\t0.13098\t0.31901\t0.04597\t0.06928\t0.02217\t0.03564\t0.00811\t0.00641\t0.00201\t0.00625\t0.00680\t0.00548\t0.00934\n+5\t0.02680\t0.01043\t0.01419\t0.01101\t0.01562\t0.00904\t0.00904\t0.02930\t0.01814\t0.68087\t0.08540\t0.02379\t0.01946\t0.00829\t0.00647\t0.00197\t0.00519\t0.00681\t0.00778\t0.01039\n+6\t0.01627\t0.01568\t0.02389\t0.13421\t0.54922\t0.06107\t0.01826\t0.06717\t0.01548\t0.02111\t0.01194\t0.01557\t0.00977\t0.00594\t0.00626\t0.00190\t0.00787\t0.00556\t0.00332\t0.00952\n+7\t0.00782\t0.00556\t0.00733\t0.00872\t0.00906\t0.00521\t0.00577\t0.00886\t0.01197\t0.01596\t0.03407\t0.72903\t0.04082\t0.06530\t0.00955\t0.00279\t0.00383\t0.01751\t0.00577\t0.00507\n+8\t0.00904\t0.00704\t0.00835\t0.00857\t0.01017\t0.00673\t0.00638\t0.01273\t0.09134\t0.02017\t0.22208\t0.24355\t0.24670\t0.01559\t0.00764\t0.00228\t0.00368\t0.06572\t0.00623\t0.00601\n+9\t0.13445\t0.01459\t0.01735\t0.31364\t0.08409\t0.10218\t0.01401\t0.02039\t0.11834\t0.01973\t0.01262\t0.01586\t0.00991\t0.00709\t0.00749\t0.00209\t0.08948\t0.00535\t0.00359\t0.00773\n+10\t0.56839\t0.07491\t0.01285\t0.03475\t0.01464\t0.05539\t0.00821\t0.02078\t0.01251\t0.13149\t0.01136\t0.01225\t0.00840\t0.00619\t0.00448\t0.00190\t0.00561\t0.00398\t0.00433\t0.00758\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t2\n+\n+[block]\n+# block no. 1 follows, 35 sequences, length 19\n+# corresponding to MSA columns:\n+# 20-38\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.02163\t0.01373\t0.01596\t0.01229\t0.01718\t0.01365\t0.01004\t0.26978\t0.08565\t0.23192\t0.01782\t0.01726\t0.01256\t0.00716\t0.00636\t0.00173\t0.02663\t0.00555\t0.00605\t0.20705\n+1\t0.00953\t0.00732\t0.00883\t0.00837\t0.01018\t0.00706\t0.00629\t0.01407\t0.10400\t0.02392\t0.51584\t0.07219\t0.16194\t0.01317\t0.00738\t0.00206\t0.00330\t0.01148\t0.00671\t0.00635\n+2\t0.00993\t0.00762\t0.00935\t0.00927\t0.01019\t0.04114\t0.00673\t0.01154\t0.01044\t0.01456\t0.01775\t0.02911\t0.01765\t0.25757\t0.46436\t0.00812\t0.01276\t0.00734\t0.04935\t0.00522\n+3\t0.01150\t0.00670\t0.00849\t0.00861\t0.00989\t0.00618\t0.00602\t0.01275\t0.01297\t0.13158\t0.05834\t0.35873\t0.10466\t0.19176\t0.01334\t0.00325\t0.00453\t0.03909\t0.00577\t0.00583\n+4\t0.01892\t0.01270\t0.01420\t0.01132\t0.01565\t0.01282\t0.00911\t0.22309\t0.15479\t0.13654\t0.01871\t0.01864\t0.01370\t0.00717\t0.00572\t0.00169\t0.00526\t0.00570\t0.12950\t0.18478\n+5\t0.74376\t0.01347\t0.01022\t0.00905\t0.01299\t0.05354\t0.00739\t0.05033\t0.01203\t0.02829\t0.00917\t0.01059\t0.00712\t0.00600\t0.00413\t0.00194\t0.00535\t0.00357\t0.00400\t0.00707\n+6\t0.01306\t0.09164\t0.68828\t0.01751\t0.02658\t0.01555\t0.02245\t0.02000\t0.01335\t0.01968\t0.01118\t0.01314\t0.00804\t0.00598\t0.00587\t0.00196\t0.00917\t0.00459\t0.00268\t0.00928\n+7\t0.01546\t0.01337\t0.01416\t0.15006\t0.01988\t0.12549\t0.01069\t0.04401\t0.15272\t0.08214\t0.18192\t0.02828\t0.04695\t0.00940\t0.00705\t0.00204\t0.02888\t0.03514\t0.02462\t0.00773\n+8\t0.00836\t0.00641\t0.00766\t0.00746\t0.00913\t0.00571\t0.00555\t0.01073\t0.01633\t0.02185\t0.44706\t0.09416\t0.30759\t0.01451\t0.00752\t0.00208\t0.00311\t0.01256\t0.00652\t0.00571\n+9\t0.01186\t0.02659\t0.56151\t0.01604\t0.02366\t0.01282\t0.04173\t0.01810\t0.01415\t0.02058\t0.11354\t0.02202\t0.07466\t0.00777\t0.00639\t0.00202\t0.00805\t0.00641\t0.00354\t0.00856\n+10'..b'692\t0.11307\t0.01355\t0.15521\t0.16627\t0.04339\t0.01850\t0.01957\t0.05355\t0.03809\t0.00713\t0.00208\t0.00739\t0.00600\t0.00464\t0.00904\n+12\t0.00790\t0.00603\t0.00727\t0.00795\t0.00913\t0.00541\t0.00565\t0.00950\t0.01386\t0.01791\t0.14400\t0.39862\t0.28882\t0.01749\t0.00782\t0.00235\t0.00348\t0.03541\t0.00604\t0.00536\n+13\t0.01740\t0.26794\t0.07201\t0.01232\t0.01748\t0.13266\t0.01112\t0.07272\t0.01515\t0.04301\t0.01089\t0.01239\t0.00897\t0.00590\t0.00557\t0.00144\t0.03716\t0.00406\t0.00356\t0.24826\n+14\t0.00811\t0.00645\t0.00728\t0.00707\t0.00895\t0.00562\t0.00531\t0.01030\t0.01592\t0.02059\t0.34300\t0.05537\t0.45402\t0.01478\t0.00749\t0.00208\t0.00312\t0.01259\t0.00635\t0.00562\n+15\t0.01272\t0.03281\t0.74418\t0.01808\t0.02746\t0.01473\t0.02344\t0.02009\t0.01339\t0.02009\t0.01138\t0.01339\t0.00804\t0.00603\t0.00603\t0.00201\t0.00938\t0.00469\t0.00268\t0.00938\n+16\t0.01578\t0.01363\t0.01434\t0.01291\t0.01650\t0.01578\t0.01004\t0.03371\t0.72602\t0.02654\t0.02582\t0.02367\t0.01937\t0.00861\t0.00646\t0.00215\t0.00502\t0.00717\t0.00646\t0.01004\n+17\t0.01044\t0.00761\t0.01083\t0.01275\t0.04160\t0.00761\t0.01059\t0.01339\t0.01460\t0.01905\t0.03274\t0.06936\t0.03547\t0.01706\t0.00866\t0.00288\t0.00591\t0.66771\t0.00574\t0.00601\n+18\t0.00882\t0.00674\t0.00815\t0.00787\t0.00962\t0.00618\t0.00599\t0.01187\t0.03901\t0.02269\t0.47764\t0.05194\t0.25622\t0.01398\t0.00752\t0.00209\t0.00327\t0.04787\t0.00658\t0.00592\n+19\t0.01102\t0.00551\t0.00826\t0.00826\t0.00826\t0.00551\t0.00551\t0.00826\t0.00826\t0.01102\t0.01102\t0.01928\t0.01102\t0.02204\t0.02479\t0.81543\t0.00551\t0.00551\t0.00275\t0.00275\n+20\t0.02093\t0.34170\t0.02443\t0.01390\t0.01823\t0.38335\t0.01166\t0.08473\t0.01692\t0.01747\t0.00988\t0.01125\t0.00839\t0.00617\t0.00509\t0.00154\t0.00910\t0.00394\t0.00331\t0.00799\n+21\t0.00886\t0.00637\t0.00817\t0.00923\t0.00993\t0.00616\t0.00632\t0.05773\t0.01337\t0.01784\t0.03360\t0.72054\t0.03980\t0.01903\t0.00798\t0.00253\t0.00391\t0.01718\t0.00592\t0.00554\n+22\t0.01287\t0.01097\t0.01295\t0.00945\t0.01478\t0.00842\t0.00755\t0.01565\t0.01295\t0.02026\t0.01167\t0.01397\t0.00984\t0.00766\t0.05635\t0.00158\t0.00555\t0.00397\t0.00373\t0.75983\n+23\t0.00807\t0.00631\t0.00732\t0.00735\t0.00900\t0.00556\t0.00540\t0.01011\t0.01540\t0.02004\t0.30532\t0.16115\t0.38532\t0.01549\t0.00758\t0.00215\t0.00320\t0.01337\t0.00629\t0.00556\n+24\t0.01703\t0.01695\t0.02148\t0.07718\t0.14139\t0.13261\t0.10363\t0.05887\t0.13956\t0.04149\t0.01388\t0.01645\t0.01105\t0.00766\t0.00951\t0.00214\t0.17067\t0.00591\t0.00395\t0.00860\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t1\n+\n+[block]\n+# block no. 13 follows, 35 sequences, length 8\n+# corresponding to MSA columns:\n+# 480-487\n+name=unknown_N\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.00763\t0.00627\t0.00672\t0.00694\t0.00874\t0.00536\t0.00508\t0.00924\t0.01428\t0.01749\t0.10103\t0.18393\t0.57228\t0.01653\t0.00760\t0.00221\t0.00328\t0.01408\t0.00596\t0.00536\n+1\t0.00986\t0.00795\t0.01140\t0.01099\t0.01177\t0.00968\t0.00852\t0.01169\t0.01016\t0.01472\t0.01694\t0.07717\t0.01695\t0.10254\t0.50300\t0.00795\t0.15194\t0.00757\t0.00350\t0.00570\n+2\t0.01747\t0.01263\t0.01460\t0.01085\t0.01619\t0.01117\t0.00879\t0.16011\t0.05042\t0.11817\t0.01453\t0.01516\t0.01096\t0.00588\t0.00533\t0.00132\t0.00526\t0.00465\t0.00494\t0.51155\n+3\t0.01891\t0.01343\t0.01481\t0.01274\t0.01670\t0.01486\t0.01007\t0.09012\t0.53204\t0.16499\t0.02478\t0.02257\t0.01795\t0.00838\t0.00643\t0.00209\t0.00526\t0.00690\t0.00671\t0.01025\n+4\t0.01661\t0.01436\t0.01288\t0.01185\t0.01478\t0.17084\t0.00909\t0.02351\t0.23976\t0.11662\t0.05064\t0.12504\t0.11552\t0.01102\t0.00677\t0.00210\t0.00602\t0.03880\t0.00579\t0.00801\n+5\t0.01413\t0.01093\t0.01276\t0.00963\t0.01461\t0.00890\t0.00766\t0.01826\t0.08023\t0.08139\t0.05137\t0.01941\t0.05791\t0.00642\t0.00531\t0.00126\t0.00461\t0.00525\t0.00464\t0.58532\n+6\t0.01456\t0.01089\t0.01500\t0.01404\t0.08808\t0.00994\t0.05875\t0.04858\t0.07411\t0.10909\t0.05713\t0.17066\t0.05353\t0.00963\t0.00642\t0.00182\t0.00527\t0.00856\t0.00517\t0.23877\n+7\t0.01612\t0.01490\t0.04899\t0.04713\t0.02409\t0.04490\t0.30085\t0.01991\t0.01458\t0.12169\t0.01534\t0.06975\t0.01250\t0.00697\t0.00723\t0.00189\t0.04287\t0.00688\t0.00412\t0.17928\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+8\t16\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W06CL.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W06HU.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W06HU.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,464 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+13\t36\n+\n+[block]\n+# block no. 0 follows, 32 sequences, length 73\n+# corresponding to MSA columns:\n+# 75-147\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01405\t0.09379\t0.60732\t0.01935\t0.02863\t0.01662\t0.08683\t0.02118\t0.01428\t0.02082\t0.01196\t0.01425\t0.00867\t0.00625\t0.00635\t0.00208\t0.00982\t0.00512\t0.00289\t0.00973\n+1\t0.01468\t0.01398\t0.02376\t0.38709\t0.39148\t0.01544\t0.01963\t0.01890\t0.01437\t0.01958\t0.01228\t0.01723\t0.00980\t0.00634\t0.00667\t0.00211\t0.00845\t0.00597\t0.00316\t0.00907\n+2\t0.01423\t0.01352\t0.02295\t0.46762\t0.31445\t0.01532\t0.01941\t0.01851\t0.01416\t0.01904\t0.01220\t0.01738\t0.00961\t0.00642\t0.00668\t0.00214\t0.00856\t0.00597\t0.00312\t0.00871\n+3\t0.02322\t0.01671\t0.01825\t0.01434\t0.01911\t0.01826\t0.01171\t0.55320\t0.05927\t0.06922\t0.08368\t0.04555\t0.01804\t0.00909\t0.00690\t0.00206\t0.00670\t0.00716\t0.00683\t0.01069\n+4\t0.01402\t0.13590\t0.56510\t0.08642\t0.02899\t0.01706\t0.02234\t0.02070\t0.01402\t0.02009\t0.01165\t0.01404\t0.00856\t0.00632\t0.00611\t0.00204\t0.00944\t0.00486\t0.00285\t0.00950\n+5\t0.00818\t0.00603\t0.00759\t0.00882\t0.00954\t0.00552\t0.00596\t0.00941\t0.01320\t0.01719\t0.04219\t0.61169\t0.16730\t0.04204\t0.00920\t0.00275\t0.00388\t0.01790\t0.00617\t0.00545\n+6\t0.00928\t0.07820\t0.01005\t0.00774\t0.01010\t0.00779\t0.00605\t0.01138\t0.01600\t0.02012\t0.22818\t0.07889\t0.46238\t0.01523\t0.00761\t0.00216\t0.00371\t0.01281\t0.00621\t0.00610\n+7\t0.01363\t0.00827\t0.00874\t0.00842\t0.01051\t0.00872\t0.00658\t0.05219\t0.12238\t0.02587\t0.02372\t0.02933\t0.01943\t0.00903\t0.00555\t0.00184\t0.00396\t0.06938\t0.56529\t0.00717\n+8\t0.01354\t0.01308\t0.02298\t0.57865\t0.14264\t0.01525\t0.08263\t0.01805\t0.01391\t0.01824\t0.01218\t0.01772\t0.00930\t0.00650\t0.00681\t0.00220\t0.00903\t0.00615\t0.00307\t0.00806\n+9\t0.08580\t0.00769\t0.00927\t0.00855\t0.01064\t0.00730\t0.00653\t0.01425\t0.01801\t0.06689\t0.56220\t0.04598\t0.10592\t0.01296\t0.00750\t0.00212\t0.00352\t0.01118\t0.00705\t0.00666\n+10\t0.01631\t0.01770\t0.09310\t0.03912\t0.65731\t0.01591\t0.02099\t0.02065\t0.01517\t0.02186\t0.01257\t0.01638\t0.01043\t0.00602\t0.00662\t0.00201\t0.00815\t0.00588\t0.00328\t0.01056\n+11\t0.00943\t0.00715\t0.01041\t0.01041\t0.01171\t0.00813\t0.00808\t0.01176\t0.01121\t0.01582\t0.02266\t0.02994\t0.08270\t0.04720\t0.66916\t0.00998\t0.01661\t0.00784\t0.00384\t0.00596\n+12\t0.15848\t0.00816\t0.00786\t0.00754\t0.00969\t0.00862\t0.00577\t0.05524\t0.01448\t0.02620\t0.02068\t0.09085\t0.01760\t0.00878\t0.00507\t0.00179\t0.00382\t0.00697\t0.53573\t0.00666\n+13\t0.02420\t0.03068\t0.02094\t0.01832\t0.02209\t0.66969\t0.07721\t0.02630\t0.01872\t0.01690\t0.01067\t0.01266\t0.00879\t0.00680\t0.00623\t0.00178\t0.01203\t0.00466\t0.00345\t0.00790\n+14\t0.01854\t0.01787\t0.01667\t0.01479\t0.01826\t0.14742\t0.01155\t0.07162\t0.47949\t0.02569\t0.02185\t0.02120\t0.01671\t0.00889\t0.00811\t0.00222\t0.07669\t0.00674\t0.00585\t0.00985\n+15\t0.01023\t0.00636\t0.00852\t0.00959\t0.01043\t0.00586\t0.00657\t0.01153\t0.01344\t0.08371\t0.03600\t0.69069\t0.04177\t0.01983\t0.00839\t0.00266\t0.00406\t0.01792\t0.00642\t0.00601\n+16\t0.01543\t0.01188\t0.01407\t0.01013\t0.01602\t0.00903\t0.00813\t0.01838\t0.01441\t0.08800\t0.01329\t0.01475\t0.01056\t0.00528\t0.00514\t0.00110\t0.00504\t0.00424\t0.00438\t0.73076\n+17\t0.01794\t0.76823\t0.03516\t0.01148\t0.01722\t0.02655\t0.01148\t0.02009\t0.01363\t0.01579\t0.00933\t0.01076\t0.00861\t0.00574\t0.00431\t0.00144\t0.00718\t0.00359\t0.00287\t0.00861\n+18\t0.00793\t0.00680\t0.00680\t0.00680\t0.00906\t0.00566\t0.00510\t0.00963\t0.01529\t0.01813\t0.06797\t0.06457\t0.71961\t0.01699\t0.00793\t0.00227\t0.00340\t0.01416\t0.00623\t0.00566\n+19\t0.01447\t0.01191\t0.01397\t0.01001\t0.01594\t0.00898\t0.00802\t0.01744\t0.01410\t0.04610\t0.01243\t0.01422\t0.01017\t0.00508\t0.00503\t0.00103\t0.00499\t0.00407\t0.00412\t0.77792\n+20\t0.01027\t0.00691\t0.00774\t0.00758\t0.00776\t0.00697\t0.00435\t0.03233\t0.01047\t0.01397\t0.02098\t0.04300\t0.02397\t0.73946\t0.03325\t0.00636\t0.00653\t0.00964\t0.00415\t0.00431\n+21\t0.01794\t0.76823\t0.03516\t0.01148\t0.01722\t0.02655\t0.01148\t0.02009\t0.01363\t0.01579\t0.00933\t0.01076\t0.00861\t0.00574\t0.00431\t0.00144\t0.00718\t0.00359\t0.00287\t0.00861\n+22\t0.01050\t0.00830\t0.01027\t0.00958\t0.01223\t0.00686\t0.00693\t0.01240\t0.01328\t0.01904\t0.02685\t0.'..b'\t0.00637\t0.00637\t0.00212\t0.00992\t0.00496\t0.00283\t0.00992\n+30\t0.01349\t0.01155\t0.01378\t0.01023\t0.01538\t0.00934\t0.00817\t0.01641\t0.01424\t0.02206\t0.08613\t0.01777\t0.01549\t0.00628\t0.00627\t0.00122\t0.04805\t0.00494\t0.00427\t0.67492\n+31\t0.01563\t0.01190\t0.01449\t0.01079\t0.01594\t0.00998\t0.00870\t0.01844\t0.01441\t0.10170\t0.04345\t0.01654\t0.01287\t0.00633\t0.00683\t0.00134\t0.07198\t0.00481\t0.00452\t0.60935\n+32\t0.57911\t0.01425\t0.01365\t0.01147\t0.01565\t0.06535\t0.08852\t0.01969\t0.01281\t0.02724\t0.01363\t0.01537\t0.04553\t0.00686\t0.00495\t0.00206\t0.00620\t0.00487\t0.04541\t0.00738\n+33\t0.01473\t0.24216\t0.53307\t0.01696\t0.02570\t0.01868\t0.02103\t0.02092\t0.01402\t0.01970\t0.01127\t0.01320\t0.00853\t0.00620\t0.00579\t0.00193\t0.00914\t0.00457\t0.00284\t0.00955\n+34\t0.01406\t0.13303\t0.63636\t0.01810\t0.02746\t0.01705\t0.02301\t0.02109\t0.01409\t0.02052\t0.01168\t0.01371\t0.00851\t0.00629\t0.00610\t0.00203\t0.00955\t0.00477\t0.00284\t0.00974\n+35\t0.01568\t0.39770\t0.38585\t0.01534\t0.02319\t0.02101\t0.01820\t0.02068\t0.01390\t0.01855\t0.01070\t0.01248\t0.00855\t0.00606\t0.00535\t0.00178\t0.00856\t0.00428\t0.00285\t0.00927\n+36\t0.01454\t0.21255\t0.56110\t0.01727\t0.02618\t0.01824\t0.02156\t0.02097\t0.01404\t0.01992\t0.01138\t0.01334\t0.00853\t0.00622\t0.00587\t0.00196\t0.00925\t0.00463\t0.00284\t0.00960\n+37\t0.01382\t0.13225\t0.60466\t0.01756\t0.02658\t0.01663\t0.02215\t0.02059\t0.01414\t0.02038\t0.01410\t0.01589\t0.03931\t0.00675\t0.00616\t0.00204\t0.00927\t0.00517\t0.00299\t0.00956\n+38\t0.01356\t0.12769\t0.49865\t0.01650\t0.02439\t0.01555\t0.01995\t0.01967\t0.01428\t0.02050\t0.04436\t0.02058\t0.01362\t0.00900\t0.03082\t0.00236\t0.00905\t0.05881\t0.00337\t0.03728\n+39\t0.01313\t0.08301\t0.58942\t0.01708\t0.02572\t0.01513\t0.02141\t0.01980\t0.01439\t0.02075\t0.03951\t0.01982\t0.07730\t0.00756\t0.00642\t0.00209\t0.00889\t0.00596\t0.00330\t0.00931\n+40\t0.01338\t0.10943\t0.42770\t0.01622\t0.02349\t0.01463\t0.04140\t0.01915\t0.01472\t0.02098\t0.07258\t0.02542\t0.01732\t0.00849\t0.00664\t0.00212\t0.00830\t0.09929\t0.00376\t0.05499\n+41\t0.01387\t0.14305\t0.56900\t0.01728\t0.02592\t0.01656\t0.02151\t0.02045\t0.01434\t0.02063\t0.04305\t0.01732\t0.01192\t0.00701\t0.00623\t0.00205\t0.00908\t0.02813\t0.00315\t0.00944\n+42\t0.01414\t0.07595\t0.51914\t0.04965\t0.02743\t0.01532\t0.06433\t0.02056\t0.01429\t0.04474\t0.01390\t0.05784\t0.01104\t0.00717\t0.00645\t0.00209\t0.00912\t0.00595\t0.00330\t0.03759\n+43\t0.01460\t0.14395\t0.47049\t0.01710\t0.02494\t0.05615\t0.04387\t0.02094\t0.03211\t0.02067\t0.06059\t0.01824\t0.01351\t0.00721\t0.00630\t0.00203\t0.00898\t0.02570\t0.00340\t0.00923\n+44\t0.01378\t0.10101\t0.49102\t0.01743\t0.02568\t0.01545\t0.07141\t0.02008\t0.01462\t0.02125\t0.07071\t0.01710\t0.01332\t0.00675\t0.00630\t0.00197\t0.00879\t0.00556\t0.00335\t0.07439\n+45\t0.04189\t0.09187\t0.53880\t0.01908\t0.05577\t0.01614\t0.05576\t0.02120\t0.01435\t0.04245\t0.01300\t0.01628\t0.00984\t0.00671\t0.00632\t0.00210\t0.00927\t0.02634\t0.00320\t0.00963\n+46\t0.04654\t0.07846\t0.41595\t0.01785\t0.02560\t0.01635\t0.09795\t0.05063\t0.09666\t0.02311\t0.03525\t0.01669\t0.01188\t0.00681\t0.00639\t0.00207\t0.00870\t0.00569\t0.00375\t0.03364\n+47\t0.10232\t0.05312\t0.26087\t0.01897\t0.10804\t0.03268\t0.07738\t0.03711\t0.05728\t0.04561\t0.07796\t0.02230\t0.03327\t0.00793\t0.00655\t0.00213\t0.00784\t0.03534\t0.00424\t0.00907\n+48\t0.07175\t0.09756\t0.23328\t0.04833\t0.05557\t0.01674\t0.17539\t0.02276\t0.10860\t0.04224\t0.03861\t0.01772\t0.01266\t0.00691\t0.00683\t0.00212\t0.02352\t0.00617\t0.00394\t0.00929\n+49\t0.03434\t0.04274\t0.26010\t0.01806\t0.02447\t0.12294\t0.16487\t0.02106\t0.01565\t0.06205\t0.01962\t0.02308\t0.08282\t0.00799\t0.00682\t0.00209\t0.00909\t0.03838\t0.00395\t0.03988\n+50\t0.11087\t0.05688\t0.26057\t0.06930\t0.02504\t0.01521\t0.11556\t0.02290\t0.09561\t0.08845\t0.01735\t0.01871\t0.04162\t0.00717\t0.00638\t0.00211\t0.00803\t0.00609\t0.00424\t0.02793\n+51\t0.08908\t0.06673\t0.25069\t0.06192\t0.07339\t0.01623\t0.15104\t0.06054\t0.06051\t0.04701\t0.03086\t0.01679\t0.01148\t0.00665\t0.00645\t0.00208\t0.00853\t0.00590\t0.00391\t0.03022\n+52\t0.08923\t0.06676\t0.20309\t0.01870\t0.06932\t0.05357\t0.13792\t0.02404\t0.12885\t0.06920\t0.03385\t0.01770\t0.01283\t0.00691\t0.00641\t0.00205\t0.00815\t0.00602\t0.00430\t0.04111\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+38\t328\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W06HU.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W06OE.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W06OE.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,477 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t31\n+\n+[block]\n+# block no. 0 follows, 38 sequences, length 63\n+# corresponding to MSA columns:\n+# 32-58,69-104\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.00969\t0.00692\t0.00969\t0.01108\t0.01246\t0.00692\t0.00969\t0.01246\t0.01385\t0.01800\t0.03185\t0.06786\t0.03462\t0.01662\t0.00831\t0.00277\t0.00554\t0.71057\t0.00554\t0.00554\n+1\t0.02610\t0.01167\t0.01485\t0.01138\t0.01607\t0.01097\t0.00940\t0.18161\t0.01962\t0.59953\t0.02172\t0.01917\t0.01388\t0.00740\t0.00604\t0.00185\t0.00544\t0.00591\t0.00714\t0.01024\n+2\t0.00738\t0.00548\t0.00689\t0.00786\t0.00863\t0.00499\t0.00539\t0.00867\t0.01240\t0.01625\t0.09662\t0.57966\t0.18264\t0.01760\t0.00752\t0.00232\t0.00335\t0.01572\t0.00567\t0.00499\n+3\t0.01240\t0.01220\t0.02203\t0.53063\t0.15033\t0.01383\t0.13934\t0.01652\t0.01266\t0.01671\t0.01104\t0.01589\t0.00844\t0.00575\t0.00619\t0.00197\t0.00825\t0.00565\t0.00278\t0.00737\n+4\t0.01496\t0.01292\t0.01360\t0.01224\t0.01564\t0.01496\t0.00952\t0.03197\t0.74019\t0.02516\t0.02448\t0.02244\t0.01836\t0.00816\t0.00612\t0.00204\t0.00476\t0.00680\t0.00612\t0.00952\n+5\t0.00860\t0.00641\t0.00947\t0.00947\t0.01047\t0.00741\t0.00727\t0.01061\t0.00961\t0.01382\t0.01630\t0.02464\t0.01548\t0.09277\t0.71769\t0.00942\t0.01545\t0.00659\t0.00325\t0.00526\n+6\t0.83108\t0.01163\t0.00884\t0.00791\t0.01163\t0.01350\t0.00651\t0.01768\t0.01024\t0.02699\t0.00838\t0.00977\t0.00651\t0.00558\t0.00372\t0.00186\t0.00465\t0.00326\t0.00372\t0.00651\n+7\t0.01594\t0.76439\t0.05805\t0.01054\t0.01583\t0.02344\t0.01073\t0.01805\t0.01224\t0.01433\t0.00845\t0.00976\t0.00772\t0.00517\t0.00393\t0.00131\t0.00652\t0.00326\t0.00257\t0.00776\n+8\t0.01471\t0.01412\t0.02410\t0.07340\t0.71594\t0.01425\t0.01838\t0.01831\t0.01362\t0.01944\t0.01128\t0.01495\t0.00945\t0.00539\t0.00596\t0.00180\t0.00719\t0.00536\t0.00296\t0.00939\n+9\t0.01247\t0.01069\t0.01247\t0.00891\t0.01426\t0.00802\t0.00713\t0.01515\t0.01247\t0.01960\t0.01069\t0.01247\t0.00891\t0.00446\t0.00446\t0.00089\t0.00446\t0.00356\t0.00356\t0.82536\n+10\t0.00750\t0.00608\t0.00665\t0.00656\t0.00838\t0.00524\t0.00490\t0.00937\t0.01455\t0.01838\t0.24778\t0.07517\t0.53934\t0.01454\t0.00712\t0.00201\t0.00300\t0.01233\t0.00587\t0.00524\n+11\t0.02329\t0.01557\t0.01719\t0.01324\t0.01798\t0.01684\t0.01092\t0.58495\t0.05240\t0.16064\t0.01641\t0.01577\t0.01133\t0.00729\t0.00603\t0.00182\t0.00629\t0.00558\t0.00627\t0.01021\n+12\t0.00875\t0.00583\t0.00656\t0.00656\t0.00656\t0.00583\t0.00365\t0.00875\t0.00875\t0.01166\t0.01895\t0.03937\t0.02187\t0.78858\t0.03062\t0.00583\t0.00583\t0.00875\t0.00365\t0.00365\n+13\t0.01420\t0.01623\t0.03550\t0.02535\t0.03144\t0.01521\t0.72921\t0.01927\t0.01420\t0.01927\t0.01217\t0.01623\t0.00913\t0.00507\t0.00710\t0.00203\t0.01014\t0.00710\t0.00304\t0.00811\n+14\t0.00774\t0.00583\t0.00717\t0.00745\t0.00867\t0.00525\t0.00535\t0.00963\t0.01430\t0.01909\t0.32595\t0.29774\t0.23331\t0.01528\t0.00730\t0.00211\t0.00311\t0.01346\t0.00600\t0.00525\n+15\t0.03469\t0.03058\t0.73673\t0.01689\t0.02564\t0.01396\t0.02179\t0.01901\t0.01263\t0.01927\t0.01073\t0.01262\t0.00759\t0.00571\t0.00566\t0.00190\t0.00877\t0.00441\t0.00257\t0.00882\n+16\t0.01231\t0.07764\t0.71305\t0.01673\t0.02539\t0.01457\t0.02150\t0.01899\t0.01267\t0.01875\t0.01065\t0.01251\t0.00763\t0.00568\t0.00560\t0.00187\t0.00874\t0.00437\t0.00254\t0.00882\n+17\t0.35601\t0.02164\t0.01366\t0.01237\t0.01573\t0.45468\t0.00952\t0.02141\t0.01424\t0.01978\t0.00892\t0.01040\t0.00724\t0.00595\t0.00472\t0.00168\t0.00829\t0.00362\t0.00336\t0.00678\n+18\t0.83108\t0.01163\t0.00884\t0.00791\t0.01163\t0.01350\t0.00651\t0.01768\t0.01024\t0.02699\t0.00838\t0.00977\t0.00651\t0.00558\t0.00372\t0.00186\t0.00465\t0.00326\t0.00372\t0.00651\n+19\t0.01219\t0.05545\t0.73421\t0.01693\t0.02570\t0.01429\t0.02184\t0.01902\t0.01269\t0.01889\t0.01072\t0.01260\t0.00762\t0.00570\t0.00566\t0.00189\t0.00881\t0.00441\t0.00254\t0.00885\n+20\t0.00861\t0.00637\t0.00929\t0.00929\t0.01023\t0.00731\t0.00704\t0.01050\t0.00955\t0.01368\t0.01646\t0.02557\t0.01588\t0.13669\t0.67432\t0.00920\t0.01485\t0.00673\t0.00327\t0.00516\n+21\t0.00861\t0.00638\t0.00933\t0.00933\t0.01029\t0.00734\t0.00710\t0.01053\t0.00957\t0.01372\t0.01642\t0.02534\t0.01578\t0.12561\t0.68526\t0.00925\t0.01500\t0.00669\t0.00327\t0.00518\n+22\t0.01076\t0.00575\t0.00630\t0.00630\t0.00765\t0.00594\t0.00477\t0.01345\t0.01211\t0.02097\t0.019'..b'89\t0.00745\t0.00605\t0.00186\t0.00512\t0.00605\t0.00745\t0.01024\n+16\t0.01207\t0.03112\t0.75741\t0.01715\t0.02604\t0.01397\t0.02223\t0.01905\t0.01270\t0.01905\t0.01080\t0.01270\t0.00762\t0.00572\t0.00572\t0.00191\t0.00889\t0.00445\t0.00254\t0.00889\n+17\t0.00969\t0.00692\t0.00969\t0.01108\t0.01246\t0.00692\t0.00969\t0.01246\t0.01385\t0.01800\t0.03185\t0.06786\t0.03462\t0.01662\t0.00831\t0.00277\t0.00554\t0.71057\t0.00554\t0.00554\n+18\t0.01207\t0.03112\t0.75741\t0.01715\t0.02604\t0.01397\t0.02223\t0.01905\t0.01270\t0.01905\t0.01080\t0.01270\t0.00762\t0.00572\t0.00572\t0.00191\t0.00889\t0.00445\t0.00254\t0.00889\n+19\t0.01489\t0.01429\t0.02442\t0.03692\t0.75106\t0.01429\t0.01846\t0.01846\t0.01370\t0.01965\t0.01132\t0.01489\t0.00953\t0.00536\t0.00596\t0.00179\t0.00715\t0.00536\t0.00298\t0.00953\n+20\t0.01489\t0.01429\t0.02442\t0.03692\t0.75106\t0.01429\t0.01846\t0.01846\t0.01370\t0.01965\t0.01132\t0.01489\t0.00953\t0.00536\t0.00596\t0.00179\t0.00715\t0.00536\t0.00298\t0.00953\n+21\t0.00711\t0.00609\t0.00609\t0.00609\t0.00813\t0.00508\t0.00457\t0.00863\t0.01371\t0.01625\t0.06094\t0.05789\t0.74862\t0.01524\t0.00711\t0.00203\t0.00305\t0.01270\t0.00559\t0.00508\n+22\t0.01136\t0.01069\t0.01804\t0.77412\t0.04143\t0.01337\t0.01671\t0.01537\t0.01203\t0.01537\t0.01069\t0.01604\t0.00802\t0.00601\t0.00601\t0.00200\t0.00802\t0.00535\t0.00267\t0.00668\n+23\t0.01608\t0.79220\t0.03152\t0.01029\t0.01544\t0.02380\t0.01029\t0.01801\t0.01222\t0.01415\t0.00836\t0.00965\t0.00772\t0.00515\t0.00386\t0.00129\t0.00643\t0.00322\t0.00257\t0.00772\n+24\t0.01420\t0.01623\t0.03550\t0.02535\t0.03144\t0.01521\t0.72921\t0.01927\t0.01420\t0.01927\t0.01217\t0.01623\t0.00913\t0.00507\t0.00710\t0.00203\t0.01014\t0.00710\t0.00304\t0.00811\n+25\t0.01608\t0.79220\t0.03152\t0.01029\t0.01544\t0.02380\t0.01029\t0.01801\t0.01222\t0.01415\t0.00836\t0.00965\t0.00772\t0.00515\t0.00386\t0.00129\t0.00643\t0.00322\t0.00257\t0.00772\n+26\t0.01136\t0.01069\t0.01804\t0.77412\t0.04143\t0.01337\t0.01671\t0.01537\t0.01203\t0.01537\t0.01069\t0.01604\t0.00802\t0.00601\t0.00601\t0.00200\t0.00802\t0.00535\t0.00267\t0.00668\n+27\t0.02247\t0.02867\t0.01705\t0.01550\t0.01860\t0.76443\t0.01162\t0.02402\t0.01705\t0.01472\t0.00930\t0.01085\t0.00775\t0.00620\t0.00542\t0.00155\t0.01085\t0.00387\t0.00310\t0.00697\n+28\t0.01496\t0.01292\t0.01360\t0.01224\t0.01564\t0.01496\t0.00952\t0.03197\t0.74019\t0.02516\t0.02448\t0.02244\t0.01836\t0.00816\t0.00612\t0.00204\t0.00476\t0.00680\t0.00612\t0.00952\n+29\t0.01136\t0.01069\t0.01804\t0.77412\t0.04143\t0.01337\t0.01671\t0.01537\t0.01203\t0.01537\t0.01069\t0.01604\t0.00802\t0.00601\t0.00601\t0.00200\t0.00802\t0.00535\t0.00267\t0.00668\n+30\t0.01136\t0.01069\t0.01804\t0.77412\t0.04143\t0.01337\t0.01671\t0.01537\t0.01203\t0.01537\t0.01069\t0.01604\t0.00802\t0.00601\t0.00601\t0.00200\t0.00802\t0.00535\t0.00267\t0.00668\n+31\t0.00970\t0.00951\t0.09182\t0.01126\t0.01354\t0.00752\t0.01058\t0.01282\t0.01371\t0.01795\t0.03236\t0.06081\t0.10106\t0.01528\t0.00791\t0.00260\t0.00567\t0.56483\t0.00521\t0.00586\n+32\t0.01156\t0.01096\t0.01809\t0.69048\t0.03860\t0.01392\t0.01632\t0.01527\t0.01172\t0.01527\t0.01038\t0.01572\t0.00801\t0.00651\t0.00753\t0.00207\t0.09290\t0.00534\t0.00267\t0.00667\n+33\t0.01144\t0.01295\t0.09960\t0.69063\t0.03973\t0.01343\t0.01732\t0.01578\t0.01210\t0.01578\t0.01070\t0.01567\t0.00798\t0.00598\t0.00598\t0.00199\t0.00812\t0.00525\t0.00266\t0.00693\n+34\t0.00731\t0.00533\t0.00688\t0.00812\t0.00866\t0.00491\t0.00547\t0.00840\t0.01176\t0.01546\t0.03622\t0.70449\t0.11797\t0.01845\t0.00762\t0.00240\t0.00344\t0.01662\t0.00558\t0.00491\n+35\t0.02498\t0.00975\t0.01314\t0.01025\t0.01439\t0.00851\t0.00827\t0.02705\t0.01628\t0.67321\t0.02321\t0.02256\t0.01566\t0.09361\t0.00876\t0.00230\t0.00520\t0.00635\t0.00703\t0.00951\n+36\t0.02252\t0.02737\t0.01716\t0.01532\t0.01860\t0.68217\t0.01160\t0.10200\t0.01829\t0.01728\t0.00987\t0.01124\t0.00802\t0.00631\t0.00549\t0.00158\t0.01038\t0.00404\t0.00342\t0.00733\n+37\t0.01457\t0.01268\t0.01409\t0.09628\t0.01849\t0.01479\t0.01031\t0.03014\t0.65987\t0.02408\t0.02296\t0.02174\t0.01722\t0.00792\t0.00611\t0.00204\t0.00512\t0.00664\t0.00574\t0.00921\n+38\t0.01421\t0.01159\t0.01263\t0.01140\t0.01443\t0.01313\t0.00883\t0.02799\t0.58108\t0.05003\t0.10371\t0.02535\t0.02241\t0.03046\t0.04309\t0.00248\t0.00513\t0.00726\t0.00602\t0.00877\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t31\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W06OE.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W07NX.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W07NX.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,407 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t69\n+\n+[block]\n+# block no. 0 follows, 33 sequences, length 11\n+# corresponding to MSA columns:\n+# 88-98\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.00800\t0.00580\t0.00757\t0.00899\t0.00950\t0.00536\t0.00603\t0.00919\t0.01278\t0.01688\t0.03846\t0.71417\t0.09230\t0.02034\t0.00836\t0.00264\t0.00378\t0.01837\t0.00611\t0.00536\n+1\t0.02807\t0.01088\t0.01481\t0.01146\t0.01630\t0.00942\t0.00942\t0.03066\t0.01883\t0.68089\t0.07666\t0.02435\t0.01962\t0.00853\t0.00670\t0.00204\t0.00542\t0.00700\t0.00808\t0.01084\n+2\t0.01320\t0.03405\t0.73453\t0.01876\t0.02849\t0.01529\t0.02432\t0.02085\t0.01390\t0.02085\t0.01181\t0.01390\t0.00834\t0.00625\t0.00625\t0.00208\t0.00973\t0.00486\t0.00278\t0.00973\n+3\t0.00932\t0.00673\t0.00880\t0.00828\t0.00984\t0.00621\t0.00621\t0.01242\t0.01863\t0.02640\t0.72410\t0.04918\t0.06212\t0.01346\t0.00776\t0.00207\t0.00311\t0.01191\t0.00725\t0.00621\n+4\t0.81514\t0.01273\t0.00968\t0.00866\t0.01273\t0.01477\t0.00713\t0.01935\t0.01120\t0.02954\t0.00917\t0.01069\t0.00713\t0.00611\t0.00407\t0.00204\t0.00509\t0.00356\t0.00407\t0.00713\n+5\t0.01431\t0.01362\t0.02314\t0.40568\t0.37777\t0.01512\t0.01922\t0.01847\t0.01405\t0.01910\t0.01203\t0.01694\t0.00958\t0.00623\t0.00655\t0.00208\t0.00831\t0.00586\t0.00309\t0.00883\n+6\t0.00802\t0.00573\t0.00764\t0.00917\t0.00955\t0.00535\t0.00611\t0.00917\t0.01260\t0.01681\t0.03628\t0.76434\t0.04354\t0.02062\t0.00840\t0.00267\t0.00382\t0.01872\t0.00611\t0.00535\n+7\t0.01256\t0.09012\t0.49756\t0.01561\t0.02293\t0.01394\t0.01878\t0.01851\t0.01468\t0.02122\t0.14755\t0.06189\t0.02046\t0.00836\t0.00649\t0.00206\t0.00792\t0.00685\t0.00381\t0.00871\n+8\t0.01893\t0.10311\t0.05847\t0.01509\t0.06858\t0.03503\t0.03064\t0.08666\t0.20816\t0.16007\t0.03995\t0.06990\t0.01746\t0.00848\t0.00640\t0.00199\t0.00629\t0.00705\t0.00569\t0.05201\n+9\t0.01640\t0.01116\t0.01346\t0.00995\t0.01529\t0.00870\t0.00799\t0.01920\t0.01498\t0.16457\t0.04909\t0.01916\t0.04423\t0.00643\t0.00548\t0.00129\t0.00488\t0.00524\t0.00500\t0.57750\n+10\t0.01598\t0.01533\t0.02616\t0.09754\t0.67286\t0.01556\t0.02005\t0.01993\t0.01484\t0.02113\t0.01233\t0.01639\t0.01030\t0.00592\t0.00652\t0.00197\t0.00790\t0.00586\t0.00323\t0.01018\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t1\n+\n+[block]\n+# block no. 1 follows, 33 sequences, length 41\n+# corresponding to MSA columns:\n+# 100-140\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.08639\t0.10657\t0.06567\t0.01864\t0.04246\t0.01708\t0.24850\t0.07235\t0.16441\t0.08759\t0.01652\t0.01776\t0.01227\t0.00677\t0.00650\t0.00206\t0.00793\t0.00639\t0.00467\t0.00946\n+1\t0.57803\t0.07938\t0.11796\t0.01055\t0.01553\t0.01567\t0.01013\t0.04144\t0.01267\t0.02737\t0.03443\t0.01264\t0.00944\t0.00640\t0.00461\t0.00199\t0.00593\t0.00411\t0.00397\t0.00772\n+2\t0.01717\t0.05763\t0.10713\t0.05499\t0.46228\t0.05908\t0.01874\t0.08395\t0.03582\t0.02266\t0.01271\t0.01569\t0.01026\t0.00625\t0.00635\t0.00194\t0.00814\t0.00558\t0.00358\t0.01005\n+3\t0.00940\t0.00705\t0.01058\t0.01058\t0.01176\t0.00823\t0.00823\t0.01176\t0.01058\t0.01528\t0.01763\t0.02586\t0.01646\t0.04937\t0.74255\t0.01058\t0.01763\t0.00705\t0.00353\t0.00588\n+4\t0.01412\t0.20897\t0.42268\t0.01797\t0.08580\t0.01697\t0.01903\t0.01947\t0.01386\t0.01931\t0.01381\t0.05953\t0.01209\t0.00751\t0.00605\t0.00199\t0.00838\t0.04024\t0.00319\t0.00904\n+5\t0.01714\t0.01397\t0.01491\t0.01330\t0.01710\t0.01598\t0.01038\t0.03481\t0.67490\t0.06877\t0.02675\t0.02444\t0.01987\t0.00889\t0.00669\t0.00222\t0.00523\t0.00739\t0.00678\t0.01047\n+6\t0.81514\t0.01273\t0.00968\t0.00866\t0.01273\t0.01477\t0.00713\t0.01935\t0.01120\t0.02954\t0.00917\t0.01069\t0.00713\t0.00611\t0.00407\t0.00204\t0.00509\t0.00356\t0.00407\t0.00713\n+7\t0.01554\t0.01776\t0.03885\t0.02775\t0.03441\t0.01665\t0.70366\t0.02109\t0.01554\t0.02109\t0.01332\t0.01776\t0.00999\t0.00555\t0.00777\t0.00222\t0.01110\t0.00777\t0.00333\t0.00888\n+8\t0.00832\t0.00594\t0.00796\t0.00938\t0.00993\t0.00559\t0.00651\t0.00973\t0.01314\t0.01755\t0.07146\t0.66646\t0.04399\t0.02004\t0.00843\t0.00267\t0.00398\t0.07728\t0.00617\t0.00545\n+9\t0.00879\t0.00651\t0.00696\t0.00696\t0.00793\t0.00602\t0.00443\t0.00952\t0.01195\t0.01496\t0.04084\t0.05195\t0.33059\t0.43967\t0.02225\t0.00456\t0.00505\t0.01146\t0.00492\t0.00468'..b'845\t0.00579\t0.00446\t0.00145\t0.00771\t0.00362\t0.00290\t0.00834\n+9\t0.81514\t0.01273\t0.00968\t0.00866\t0.01273\t0.01477\t0.00713\t0.01935\t0.01120\t0.02954\t0.00917\t0.01069\t0.00713\t0.00611\t0.00407\t0.00204\t0.00509\t0.00356\t0.00407\t0.00713\n+10\t0.01004\t0.00808\t0.01176\t0.01149\t0.01236\t0.00980\t0.00896\t0.01207\t0.01078\t0.01559\t0.01872\t0.12593\t0.01891\t0.03915\t0.52207\t0.00822\t0.13782\t0.00845\t0.00378\t0.00602\n+11\t0.01926\t0.01249\t0.01453\t0.01285\t0.01663\t0.01335\t0.01039\t0.07215\t0.37041\t0.20734\t0.02733\t0.03229\t0.02173\t0.01031\t0.00710\t0.00231\t0.00559\t0.12711\t0.00695\t0.00990\n+12\t0.00957\t0.00638\t0.00718\t0.00718\t0.00718\t0.00638\t0.00399\t0.00957\t0.00957\t0.01276\t0.02074\t0.04308\t0.02393\t0.76864\t0.03351\t0.00638\t0.00638\t0.00957\t0.00399\t0.00399\n+13\t0.01760\t0.77260\t0.03450\t0.01126\t0.01690\t0.02605\t0.01126\t0.01971\t0.01338\t0.01549\t0.00915\t0.01056\t0.00845\t0.00563\t0.00422\t0.00141\t0.00704\t0.00352\t0.00282\t0.00845\n+14\t0.01227\t0.00614\t0.00614\t0.00614\t0.00767\t0.00614\t0.00460\t0.01534\t0.01381\t0.02454\t0.02148\t0.02454\t0.01687\t0.00767\t0.00460\t0.00153\t0.00307\t0.00614\t0.80518\t0.00614\n+15\t0.01311\t0.01239\t0.02097\t0.62759\t0.16526\t0.01480\t0.01862\t0.01742\t0.01348\t0.01764\t0.01182\t0.01733\t0.00907\t0.00646\t0.00657\t0.00215\t0.00861\t0.00585\t0.00298\t0.00786\n+16\t0.00799\t0.00668\t0.00696\t0.00689\t0.00902\t0.00565\t0.00517\t0.00986\t0.01551\t0.01897\t0.15746\t0.06140\t0.63339\t0.01623\t0.00778\t0.00220\t0.00330\t0.01362\t0.00627\t0.00565\n+17\t0.01365\t0.01170\t0.01365\t0.00975\t0.01560\t0.00878\t0.00780\t0.01658\t0.01365\t0.02145\t0.01170\t0.01365\t0.00975\t0.00488\t0.00488\t0.00098\t0.00488\t0.00390\t0.00390\t0.80888\n+18\t0.01365\t0.01170\t0.01365\t0.00975\t0.01560\t0.00878\t0.00780\t0.01658\t0.01365\t0.02145\t0.01170\t0.01365\t0.00975\t0.00488\t0.00488\t0.00098\t0.00488\t0.00390\t0.00390\t0.80888\n+19\t0.00957\t0.00638\t0.00718\t0.00718\t0.00718\t0.00638\t0.00399\t0.00957\t0.00957\t0.01276\t0.02074\t0.04308\t0.02393\t0.76864\t0.03351\t0.00638\t0.00638\t0.00957\t0.00399\t0.00399\n+20\t0.02565\t0.01744\t0.01914\t0.01467\t0.01992\t0.01893\t0.01212\t0.61263\t0.02928\t0.13684\t0.01721\t0.01672\t0.01190\t0.00794\t0.00659\t0.00198\t0.00702\t0.00602\t0.00680\t0.01120\n+21\t0.00802\t0.00573\t0.00764\t0.00917\t0.00955\t0.00535\t0.00611\t0.00917\t0.01260\t0.01681\t0.03628\t0.76434\t0.04354\t0.02062\t0.00840\t0.00267\t0.00382\t0.01872\t0.00611\t0.00535\n+22\t0.01320\t0.03405\t0.73453\t0.01876\t0.02849\t0.01529\t0.02432\t0.02085\t0.01390\t0.02085\t0.01181\t0.01390\t0.00834\t0.00625\t0.00625\t0.00208\t0.00973\t0.00486\t0.00278\t0.00973\n+23\t0.02503\t0.01844\t0.01976\t0.01515\t0.02042\t0.02042\t0.01251\t0.70562\t0.03095\t0.04149\t0.01581\t0.01581\t0.01120\t0.00790\t0.00659\t0.00198\t0.00724\t0.00593\t0.00659\t0.01120\n+24\t0.01812\t0.01503\t0.02514\t0.03645\t0.62944\t0.01482\t0.01875\t0.02184\t0.01552\t0.11962\t0.01426\t0.01714\t0.01124\t0.00618\t0.00653\t0.00197\t0.00751\t0.00597\t0.00393\t0.01053\n+25\t0.01658\t0.01323\t0.01511\t0.01164\t0.01674\t0.05157\t0.03606\t0.03899\t0.11991\t0.10520\t0.03509\t0.01890\t0.03647\t0.00667\t0.00573\t0.00147\t0.00561\t0.00549\t0.00498\t0.45457\n+26\t0.01496\t0.38596\t0.29756\t0.01424\t0.02086\t0.01940\t0.01614\t0.01931\t0.01382\t0.01811\t0.01371\t0.02063\t0.01247\t0.00760\t0.00567\t0.00189\t0.00793\t0.09788\t0.00325\t0.00861\n+27\t0.10060\t0.22628\t0.30685\t0.01455\t0.04365\t0.01682\t0.01558\t0.01935\t0.01349\t0.02037\t0.01233\t0.01406\t0.02841\t0.00612\t0.00530\t0.00172\t0.00747\t0.00449\t0.00322\t0.13935\n+28\t0.14568\t0.12128\t0.10204\t0.01270\t0.01804\t0.05265\t0.03299\t0.08866\t0.06852\t0.04368\t0.01436\t0.03938\t0.01196\t0.00706\t0.00556\t0.00175\t0.00662\t0.02611\t0.00434\t0.19660\n+29\t0.13785\t0.01382\t0.01374\t0.01197\t0.03766\t0.06930\t0.00914\t0.12212\t0.10513\t0.09091\t0.02545\t0.02506\t0.14684\t0.00874\t0.00608\t0.00186\t0.00571\t0.00683\t0.00543\t0.15638\n+30\t0.07072\t0.01424\t0.01617\t0.01579\t0.11463\t0.05532\t0.01089\t0.05826\t0.20681\t0.12656\t0.01933\t0.01935\t0.03198\t0.00723\t0.00602\t0.00180\t0.00597\t0.00588\t0.00536\t0.20768\n+31\t0.11235\t0.03854\t0.01450\t0.01148\t0.01541\t0.10438\t0.03035\t0.03945\t0.09773\t0.06291\t0.04780\t0.02205\t0.01587\t0.11222\t0.00953\t0.00233\t0.00636\t0.02184\t0.00467\t0.23023\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t52\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W07NX.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W08R7.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W08R7.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,503 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+4\t78\n+\n+[block]\n+# block no. 0 follows, 28 sequences, length 7\n+# corresponding to MSA columns:\n+# 108-114\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01782\t0.00959\t0.01067\t0.00908\t0.01234\t0.00910\t0.00713\t0.07647\t0.01768\t0.12970\t0.02250\t0.02434\t0.01697\t0.00817\t0.00564\t0.00174\t0.00446\t0.00651\t0.49950\t0.11060\n+1\t0.01911\t0.02194\t0.19850\t0.02212\t0.08531\t0.01691\t0.15576\t0.12299\t0.10621\t0.08825\t0.01974\t0.04869\t0.01557\t0.00870\t0.00766\t0.00239\t0.00900\t0.03515\t0.00526\t0.01075\n+2\t0.12135\t0.12449\t0.24483\t0.01899\t0.07759\t0.12287\t0.03452\t0.06015\t0.03417\t0.05585\t0.01421\t0.03469\t0.01126\t0.00753\t0.00642\t0.00213\t0.00923\t0.00569\t0.00414\t0.00992\n+3\t0.02257\t0.01059\t0.01324\t0.01101\t0.01504\t0.00970\t0.00880\t0.02697\t0.07894\t0.37264\t0.11385\t0.03554\t0.12605\t0.01111\t0.00737\t0.00223\t0.00508\t0.00922\t0.11008\t0.00997\n+4\t0.01986\t0.01675\t0.11072\t0.03720\t0.06496\t0.01365\t0.11232\t0.10744\t0.02022\t0.18867\t0.13480\t0.07406\t0.04591\t0.01022\t0.00781\t0.00233\t0.00751\t0.00916\t0.00633\t0.01007\n+5\t0.01953\t0.01680\t0.10746\t0.11825\t0.17329\t0.01442\t0.03820\t0.02612\t0.10525\t0.18698\t0.07957\t0.02535\t0.03877\t0.00874\t0.00743\t0.00230\t0.00761\t0.00766\t0.00574\t0.01054\n+6\t0.01247\t0.01149\t0.01140\t0.01127\t0.01287\t0.11377\t0.00829\t0.01432\t0.01392\t0.01724\t0.03022\t0.10008\t0.14123\t0.14123\t0.31932\t0.00710\t0.01249\t0.01023\t0.00471\t0.00635\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+3\t10\n+\n+[block]\n+# block no. 1 follows, 28 sequences, length 7\n+# corresponding to MSA columns:\n+# 125-131\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01394\t0.08127\t0.01520\t0.01079\t0.01510\t0.03609\t0.00842\t0.01649\t0.01535\t0.02187\t0.08610\t0.17401\t0.02490\t0.04263\t0.00789\t0.00193\t0.00552\t0.00890\t0.00506\t0.40852\n+1\t0.01607\t0.08459\t0.02626\t0.31839\t0.17793\t0.01756\t0.08906\t0.02214\t0.08164\t0.02157\t0.01465\t0.01884\t0.01150\t0.00700\t0.00703\t0.00220\t0.00887\t0.00647\t0.00383\t0.06439\n+2\t0.01671\t0.01846\t0.08813\t0.09657\t0.25079\t0.05706\t0.01843\t0.04373\t0.01570\t0.02196\t0.05177\t0.04983\t0.01524\t0.00965\t0.01197\t0.00251\t0.21089\t0.00722\t0.00392\t0.00946\n+3\t0.01363\t0.00815\t0.00967\t0.00883\t0.01148\t0.00720\t0.00678\t0.01633\t0.01849\t0.13666\t0.27141\t0.05286\t0.30338\t0.01465\t0.00802\t0.00229\t0.00398\t0.01241\t0.08633\t0.00747\n+4\t0.01415\t0.01162\t0.01303\t0.01263\t0.01524\t0.01279\t0.00941\t0.02638\t0.38949\t0.02624\t0.10057\t0.27289\t0.03571\t0.01477\t0.00816\t0.00261\t0.00499\t0.01296\t0.00724\t0.00913\n+5\t0.00987\t0.00731\t0.00920\t0.00895\t0.01066\t0.00664\t0.00663\t0.01282\t0.01926\t0.02653\t0.52778\t0.12449\t0.17050\t0.01623\t0.00865\t0.00238\t0.00355\t0.01425\t0.00767\t0.00664\n+6\t0.00888\t0.00721\t0.00788\t0.00806\t0.01009\t0.00621\t0.00591\t0.01086\t0.01673\t0.02085\t0.15907\t0.17391\t0.50181\t0.01858\t0.00870\t0.00251\t0.00373\t0.01587\t0.00693\t0.00621\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t14\n+\n+[block]\n+# block no. 2 follows, 28 sequences, length 38\n+# corresponding to MSA columns:\n+# 146-183\n+name=unknown_C\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.07024\t0.01341\t0.02160\t0.52801\t0.14958\t0.01585\t0.01894\t0.01911\t0.01502\t0.02097\t0.04911\t0.02047\t0.01298\t0.00751\t0.00713\t0.00236\t0.00890\t0.00664\t0.00363\t0.00855\n+1\t0.02038\t0.01916\t0.02559\t0.11570\t0.41160\t0.11583\t0.01920\t0.07938\t0.04088\t0.06056\t0.01489\t0.01808\t0.01177\t0.00715\t0.00713\t0.00217\t0.00911\t0.00633\t0.00430\t0.01079\n+2\t0.03042\t0.01477\t0.01753\t0.01372\t0.01910\t0.05017\t0.01122\t0.13645\t0.04651\t0.51788\t0.02584\t0.02312\t0.01681\t0.00889\t0.00720\t0.00221\t0.00674\t0.00706\t0.03241\t0.01196\n+3\t0.01650\t0.06161\t0.23715\t0.03047\t0.34473\t0.01728\t0.02133\t0.04008\t0.01648\t0.02367\t0.05425\t0.03627\t0.01487\t0.00787\t0.00796\t0.00225\t0.04607\t0.00673\t0.00383\t0.01059\n+4\t0.01728\t0.17465\t0.10616\t0.05256\t0.34147\t0.01884\t0.04494\t0.04450\t0.01665\t0.02280\t0.04255\t0.05630\t0.01504\t0.00778\t0.00685\t0.00211\t0.00840\t0.00691\t0.00391\t0.01032\n+5\t0.01329\t0.18912\t0.15799\t0.05065\t0.01990\t0.01470\t0.'..b'9624\t0.01841\t0.00859\t0.00245\t0.00368\t0.01534\t0.00675\t0.00614\n+8\t0.01943\t0.74891\t0.03809\t0.01244\t0.01866\t0.02876\t0.01244\t0.02177\t0.01477\t0.01710\t0.01011\t0.01166\t0.00933\t0.00622\t0.00466\t0.00155\t0.00777\t0.00389\t0.00311\t0.00933\n+9\t0.14244\t0.05974\t0.02208\t0.02123\t0.11926\t0.39823\t0.03776\t0.02547\t0.01764\t0.02107\t0.01136\t0.01399\t0.00952\t0.00752\t0.00762\t0.00208\t0.06534\t0.00506\t0.00377\t0.00884\n+10\t0.01561\t0.03736\t0.65087\t0.02056\t0.03073\t0.07388\t0.02581\t0.02351\t0.01578\t0.02259\t0.01290\t0.01516\t0.00922\t0.00695\t0.00688\t0.00227\t0.01094\t0.00532\t0.00312\t0.01055\n+11\t0.01905\t0.18317\t0.37558\t0.01753\t0.02564\t0.07263\t0.01981\t0.07717\t0.01752\t0.08153\t0.01419\t0.01580\t0.01054\t0.00865\t0.02908\t0.00240\t0.00996\t0.00534\t0.00401\t0.01040\n+12\t0.01046\t0.00749\t0.01018\t0.01018\t0.01096\t0.00827\t0.00722\t0.01202\t0.01124\t0.01576\t0.02084\t0.03615\t0.02147\t0.33011\t0.44465\t0.00983\t0.01451\t0.00890\t0.00410\t0.00566\n+13\t0.01607\t0.25661\t0.50096\t0.01817\t0.02752\t0.02054\t0.02242\t0.02263\t0.01517\t0.02120\t0.01214\t0.01421\t0.00925\t0.00669\t0.00622\t0.00207\t0.00983\t0.00491\t0.00308\t0.01031\n+14\t0.01264\t0.00806\t0.01069\t0.01040\t0.01244\t0.00739\t0.00801\t0.01557\t0.01853\t0.09307\t0.37883\t0.18588\t0.05337\t0.01620\t0.00868\t0.00252\t0.00442\t0.10792\t0.00752\t0.03788\n+15\t0.01646\t0.01571\t0.02674\t0.28969\t0.46609\t0.01687\t0.02155\t0.02097\t0.01583\t0.02189\t0.01340\t0.01849\t0.01086\t0.00676\t0.00722\t0.00225\t0.00901\t0.00647\t0.00347\t0.01028\n+16\t0.01777\t0.01348\t0.01580\t0.01146\t0.01779\t0.01084\t0.00924\t0.07374\t0.01718\t0.09029\t0.01479\t0.01619\t0.01159\t0.00600\t0.00572\t0.00128\t0.00567\t0.00478\t0.00500\t0.65140\n+17\t0.01027\t0.00758\t0.00879\t0.00858\t0.01078\t0.00665\t0.00651\t0.01274\t0.01801\t0.05007\t0.28483\t0.09455\t0.39358\t0.01708\t0.00863\t0.00245\t0.00384\t0.04113\t0.00727\t0.00665\n+18\t0.01690\t0.01787\t0.06368\t0.15547\t0.42681\t0.01741\t0.12634\t0.02170\t0.01606\t0.02255\t0.01354\t0.01828\t0.01095\t0.00679\t0.00799\t0.00229\t0.03461\t0.00675\t0.00351\t0.01050\n+19\t0.01042\t0.00765\t0.00873\t0.00847\t0.01071\t0.00670\t0.00642\t0.01278\t0.01772\t0.05358\t0.25221\t0.06296\t0.42021\t0.04574\t0.00972\t0.00262\t0.00400\t0.04561\t0.00713\t0.00659\n+20\t0.01843\t0.01696\t0.05235\t0.09843\t0.15892\t0.01776\t0.01545\t0.12591\t0.32033\t0.02920\t0.02250\t0.05499\t0.01781\t0.00919\t0.00739\t0.00237\t0.00725\t0.00787\t0.00593\t0.01097\n+21\t0.00921\t0.00672\t0.00866\t0.00958\t0.01055\t0.00618\t0.00665\t0.01110\t0.01594\t0.02146\t0.21615\t0.49038\t0.12008\t0.02024\t0.00902\t0.00273\t0.00395\t0.01814\t0.00708\t0.00618\n+22\t0.00942\t0.00687\t0.00880\t0.00974\t0.01075\t0.00638\t0.00690\t0.01130\t0.01563\t0.02085\t0.17467\t0.43439\t0.12910\t0.05622\t0.01049\t0.00299\t0.00433\t0.06816\t0.00688\t0.00611\n+23\t0.01607\t0.01351\t0.01561\t0.01124\t0.01765\t0.01071\t0.00903\t0.07062\t0.01660\t0.02545\t0.01328\t0.01526\t0.01089\t0.00565\t0.00553\t0.00116\t0.00559\t0.00448\t0.00454\t0.72710\n+24\t0.02012\t0.02303\t0.04896\t0.11419\t0.31923\t0.23266\t0.09232\t0.02408\t0.01759\t0.02123\t0.01293\t0.01674\t0.01051\t0.00686\t0.00715\t0.00214\t0.01061\t0.00612\t0.00359\t0.00994\n+25\t0.02536\t0.01503\t0.01847\t0.07411\t0.06906\t0.04201\t0.01265\t0.19811\t0.02297\t0.30790\t0.05079\t0.05751\t0.05303\t0.00988\t0.00746\t0.00227\t0.00707\t0.00812\t0.00723\t0.01098\n+26\t0.01149\t0.00777\t0.00947\t0.00890\t0.01113\t0.00689\t0.00672\t0.01425\t0.01899\t0.08065\t0.40766\t0.08568\t0.27151\t0.01589\t0.00851\t0.00237\t0.00377\t0.01371\t0.00762\t0.00703\n+27\t0.01911\t0.02182\t0.08495\t0.06250\t0.38854\t0.14038\t0.05036\t0.02527\t0.09191\t0.02314\t0.01498\t0.01806\t0.01203\t0.00709\t0.00715\t0.00218\t0.00950\t0.00636\t0.00399\t0.01068\n+28\t0.01023\t0.00746\t0.00945\t0.00971\t0.01120\t0.00700\t0.00737\t0.01280\t0.01739\t0.02346\t0.32739\t0.12733\t0.14757\t0.10269\t0.01228\t0.00315\t0.00464\t0.14553\t0.00701\t0.00634\n+29\t0.01057\t0.00705\t0.00793\t0.00793\t0.00793\t0.00705\t0.00440\t0.01057\t0.01057\t0.01409\t0.02290\t0.04757\t0.02643\t0.74454\t0.03700\t0.00705\t0.00705\t0.01057\t0.00440\t0.00440\n+30\t0.01521\t0.00963\t0.01118\t0.00993\t0.01250\t0.01003\t0.03488\t0.08933\t0.07525\t0.02898\t0.07781\t0.02803\t0.02200\t0.01094\t0.03525\t0.00230\t0.00512\t0.00751\t0.50622\t0.00790\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t10\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W08R7.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W09HB.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W09HB.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,581 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+9\t86\n+\n+[block]\n+# block no. 0 follows, 36 sequences, length 16\n+# corresponding to MSA columns:\n+# 86-101\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01502\t0.01593\t0.06705\t0.06213\t0.57360\t0.01489\t0.12091\t0.01916\t0.01414\t0.02010\t0.01179\t0.01554\t0.00964\t0.00555\t0.00633\t0.00190\t0.00799\t0.00576\t0.00306\t0.00951\n+1\t0.01474\t0.01503\t0.02135\t0.23706\t0.34625\t0.11345\t0.05078\t0.01818\t0.01417\t0.01828\t0.03568\t0.06151\t0.01257\t0.00690\t0.00631\t0.00194\t0.00796\t0.00633\t0.00330\t0.00820\n+2\t0.02353\t0.01219\t0.02013\t0.06043\t0.04979\t0.01114\t0.16913\t0.02673\t0.01667\t0.51180\t0.02059\t0.01972\t0.01344\t0.00699\t0.00650\t0.00197\t0.00673\t0.00644\t0.00621\t0.00986\n+3\t0.00759\t0.00542\t0.00723\t0.00868\t0.00904\t0.00506\t0.00578\t0.00868\t0.01193\t0.01591\t0.03434\t0.77697\t0.04121\t0.01952\t0.00795\t0.00253\t0.00361\t0.01771\t0.00578\t0.00506\n+4\t0.01888\t0.01498\t0.02903\t0.02212\t0.06684\t0.01400\t0.44856\t0.05422\t0.01621\t0.22567\t0.01604\t0.01789\t0.01121\t0.00606\t0.00693\t0.00203\t0.00870\t0.00687\t0.00457\t0.00920\n+5\t0.02441\t0.04436\t0.07466\t0.01538\t0.11424\t0.01141\t0.01177\t0.05846\t0.01728\t0.53085\t0.02073\t0.01907\t0.01357\t0.00717\t0.00613\t0.00189\t0.00602\t0.00589\t0.00642\t0.01029\n+6\t0.01177\t0.01107\t0.01869\t0.76606\t0.04291\t0.01384\t0.01730\t0.01592\t0.01246\t0.01592\t0.01107\t0.01661\t0.00831\t0.00623\t0.00623\t0.00208\t0.00831\t0.00554\t0.00277\t0.00692\n+7\t0.00854\t0.00647\t0.00794\t0.00861\t0.01006\t0.00599\t0.00678\t0.01054\t0.01396\t0.01781\t0.10674\t0.16608\t0.29478\t0.05691\t0.00916\t0.00263\t0.00425\t0.25162\t0.00576\t0.00537\n+8\t0.01963\t0.03954\t0.01964\t0.07492\t0.14275\t0.34760\t0.04518\t0.10876\t0.03873\t0.03931\t0.05506\t0.01574\t0.01227\t0.00678\t0.00601\t0.00177\t0.00885\t0.00530\t0.00394\t0.00822\n+9\t0.17296\t0.01568\t0.01783\t0.05924\t0.09628\t0.14437\t0.10619\t0.08152\t0.03398\t0.04283\t0.01359\t0.05222\t0.01128\t0.00716\t0.00641\t0.00192\t0.04397\t0.00578\t0.07904\t0.00776\n+10\t0.03923\t0.04745\t0.01903\t0.05244\t0.05085\t0.22632\t0.08178\t0.11341\t0.12866\t0.02196\t0.01342\t0.01481\t0.01049\t0.00634\t0.00576\t0.00168\t0.00781\t0.00507\t0.00414\t0.14934\n+11\t0.01807\t0.06921\t0.03994\t0.08807\t0.08140\t0.09959\t0.03906\t0.24727\t0.09443\t0.04188\t0.01667\t0.07629\t0.01417\t0.00826\t0.00628\t0.00195\t0.00719\t0.03667\t0.00482\t0.00879\n+12\t0.05799\t0.01554\t0.01543\t0.03240\t0.04588\t0.15382\t0.03031\t0.18373\t0.05360\t0.04192\t0.04298\t0.09860\t0.08449\t0.00933\t0.00717\t0.00194\t0.05564\t0.00735\t0.00483\t0.05704\n+13\t0.10275\t0.01597\t0.01507\t0.06098\t0.03731\t0.20261\t0.04219\t0.06951\t0.07487\t0.07831\t0.03826\t0.04913\t0.09876\t0.00850\t0.00655\t0.00191\t0.03564\t0.00664\t0.02792\t0.02711\n+14\t0.05521\t0.04733\t0.06278\t0.07749\t0.09544\t0.06529\t0.02964\t0.21311\t0.14823\t0.07810\t0.03556\t0.01718\t0.01286\t0.00706\t0.00601\t0.00189\t0.00683\t0.00569\t0.00496\t0.02937\n+15\t0.13615\t0.05539\t0.08902\t0.01478\t0.07220\t0.13596\t0.03191\t0.12796\t0.04897\t0.06630\t0.02880\t0.05698\t0.01235\t0.00713\t0.00563\t0.00178\t0.00698\t0.00555\t0.00435\t0.09181\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+2\t23\n+\n+[block]\n+# block no. 1 follows, 36 sequences, length 20\n+# corresponding to MSA columns:\n+# 125-144\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01667\t0.15017\t0.10484\t0.12085\t0.02108\t0.06769\t0.01250\t0.15002\t0.01652\t0.07867\t0.04554\t0.01665\t0.01229\t0.01098\t0.08736\t0.00262\t0.00823\t0.00525\t0.00412\t0.06795\n+1\t0.01585\t0.03482\t0.04096\t0.01263\t0.01639\t0.07187\t0.07904\t0.12627\t0.08030\t0.08227\t0.03429\t0.04675\t0.08916\t0.10049\t0.00963\t0.00236\t0.02301\t0.02598\t0.00487\t0.10306\n+2\t0.01491\t0.05695\t0.03536\t0.03078\t0.16138\t0.01271\t0.05064\t0.15088\t0.02812\t0.03877\t0.04405\t0.07326\t0.07605\t0.05334\t0.00761\t0.00202\t0.00605\t0.00715\t0.02215\t0.12781\n+3\t0.04596\t0.09045\t0.01497\t0.05477\t0.03079\t0.15442\t0.00935\t0.06325\t0.04180\t0.06921\t0.13345\t0.06071\t0.05942\t0.00980\t0.02633\t0.00200\t0.00645\t0.01758\t0.03770\t0.07161\n+4\t0.10454\t0.04666\t0.01748\t0.01383\t0.04517\t0.08750\t0.05089\t0.24133\t0.03661\t0.15564\t0.02778\t0.01590\t0.01166\t0.00677\t0.00571\t0.00175\t0.00657\t0.00529\t0.02724\t'..b'0974\t0.00589\t0.03987\t0.00947\t0.01172\t0.01543\t0.03276\t0.48235\t0.10337\t0.18885\t0.01321\t0.00326\t0.00452\t0.03728\t0.00521\t0.00498\n+14\t0.05357\t0.01724\t0.01650\t0.01481\t0.05646\t0.18923\t0.02851\t0.23033\t0.04989\t0.02449\t0.01553\t0.11870\t0.01405\t0.00859\t0.00688\t0.00187\t0.04979\t0.00669\t0.00465\t0.09223\n+15\t0.01640\t0.07497\t0.14570\t0.04338\t0.14108\t0.03336\t0.01348\t0.09299\t0.03511\t0.09719\t0.01383\t0.03590\t0.01089\t0.00630\t0.00562\t0.00163\t0.00663\t0.00516\t0.00410\t0.21625\n+16\t0.01656\t0.13141\t0.14543\t0.07434\t0.12214\t0.04721\t0.01408\t0.10803\t0.01556\t0.09223\t0.01470\t0.04376\t0.02551\t0.00820\t0.02540\t0.00206\t0.05037\t0.00564\t0.02617\t0.03120\n+17\t0.00888\t0.00727\t0.00805\t0.00821\t0.00988\t0.02667\t0.00617\t0.01171\t0.05475\t0.01925\t0.21367\t0.19158\t0.31969\t0.01523\t0.00748\t0.00221\t0.00374\t0.07386\t0.00600\t0.00572\n+18\t0.00787\t0.00564\t0.00748\t0.00848\t0.00910\t0.00525\t0.00581\t0.00938\t0.01323\t0.01798\t0.19542\t0.60997\t0.04523\t0.01797\t0.00781\t0.00240\t0.00346\t0.01624\t0.00603\t0.00525\n+19\t0.09848\t0.02038\t0.24361\t0.05780\t0.19296\t0.03959\t0.07940\t0.09597\t0.01505\t0.02240\t0.02664\t0.01473\t0.00978\t0.00638\t0.00677\t0.00197\t0.05058\t0.00527\t0.00342\t0.00881\n+20\t0.01550\t0.02798\t0.01754\t0.11235\t0.02016\t0.05005\t0.05712\t0.14023\t0.09078\t0.04725\t0.04801\t0.07601\t0.03869\t0.00945\t0.01000\t0.00218\t0.19895\t0.00713\t0.02275\t0.00784\n+21\t0.00904\t0.00629\t0.00751\t0.00792\t0.00848\t0.00617\t0.00542\t0.00991\t0.01094\t0.01427\t0.02780\t0.09056\t0.09741\t0.48824\t0.02270\t0.00473\t0.00555\t0.16810\t0.00453\t0.00444\n+22\t0.01161\t0.00581\t0.00581\t0.00581\t0.00726\t0.00581\t0.00436\t0.01452\t0.01307\t0.02323\t0.02033\t0.02323\t0.01597\t0.00726\t0.00436\t0.00145\t0.00290\t0.00581\t0.81562\t0.00581\n+23\t0.01855\t0.04932\t0.02039\t0.24141\t0.05237\t0.10244\t0.07231\t0.26867\t0.01953\t0.05310\t0.01311\t0.01545\t0.00971\t0.00664\t0.00610\t0.00189\t0.00795\t0.00548\t0.02694\t0.00865\n+24\t0.01867\t0.03903\t0.05529\t0.01183\t0.01676\t0.01312\t0.01010\t0.20793\t0.12075\t0.15552\t0.05999\t0.01834\t0.01494\t0.00705\t0.00580\t0.00165\t0.00559\t0.00563\t0.00556\t0.22645\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+2\t5\n+\n+[block]\n+# block no. 11 follows, 36 sequences, length 10\n+# corresponding to MSA columns:\n+# 741-750\n+name=unknown_L\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.07397\t0.04444\t0.09690\t0.02031\t0.14408\t0.01512\t0.17770\t0.07126\t0.08490\t0.07037\t0.01446\t0.03247\t0.01163\t0.03931\t0.00854\t0.00220\t0.07345\t0.00622\t0.00400\t0.00865\n+1\t0.01493\t0.16415\t0.01681\t0.01150\t0.01462\t0.15396\t0.03049\t0.08569\t0.07623\t0.02024\t0.13019\t0.13623\t0.09979\t0.01033\t0.00627\t0.00188\t0.00614\t0.00848\t0.00486\t0.00723\n+2\t0.00923\t0.00704\t0.00911\t0.07512\t0.01253\t0.00724\t0.00708\t0.01217\t0.06920\t0.01748\t0.12885\t0.27805\t0.08585\t0.15507\t0.04705\t0.00336\t0.00520\t0.05960\t0.00523\t0.00557\n+3\t0.01404\t0.31101\t0.48347\t0.01513\t0.02290\t0.01824\t0.01844\t0.01933\t0.01297\t0.01785\t0.01025\t0.01198\t0.00793\t0.00570\t0.00521\t0.00174\t0.00827\t0.00413\t0.00264\t0.00876\n+4\t0.01782\t0.01410\t0.01627\t0.23392\t0.02411\t0.06968\t0.01214\t0.30712\t0.02001\t0.05636\t0.01601\t0.08309\t0.01311\t0.00808\t0.00617\t0.00193\t0.00690\t0.00658\t0.07825\t0.00835\n+5\t0.00979\t0.00628\t0.00807\t0.00847\t0.00966\t0.00575\t0.00605\t0.01142\t0.01377\t0.08184\t0.17401\t0.41206\t0.12082\t0.06058\t0.00902\t0.00253\t0.00381\t0.04434\t0.00605\t0.00569\n+6\t0.01410\t0.08018\t0.02112\t0.05677\t0.37669\t0.01361\t0.05626\t0.01861\t0.07096\t0.02058\t0.06186\t0.05059\t0.01561\t0.00704\t0.00599\t0.00184\t0.00635\t0.00650\t0.10686\t0.00851\n+7\t0.00918\t0.00636\t0.00843\t0.00843\t0.00913\t0.00695\t0.00595\t0.01059\t0.00988\t0.01423\t0.01812\t0.03073\t0.01836\t0.32975\t0.41419\t0.00778\t0.01144\t0.00754\t0.06807\t0.00489\n+8\t0.01868\t0.05896\t0.01866\t0.08029\t0.02038\t0.12572\t0.06212\t0.24944\t0.12002\t0.04622\t0.03331\t0.03922\t0.01334\t0.00769\t0.00671\t0.00191\t0.03953\t0.00608\t0.04300\t0.00871\n+9\t0.03697\t0.09360\t0.02018\t0.05103\t0.14927\t0.20996\t0.06192\t0.06246\t0.05633\t0.05498\t0.07714\t0.04965\t0.01544\t0.00752\t0.00640\t0.00184\t0.02692\t0.00614\t0.00412\t0.00813\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+6\t28\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W09HB.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W0CIU.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W0CIU.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,319 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+5\t46\n+\n+[block]\n+# block no. 0 follows, 38 sequences, length 6\n+# corresponding to MSA columns:\n+# 47-52\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.07580\t0.01070\t0.03658\t0.01195\t0.01525\t0.01011\t0.10380\t0.11111\t0.01515\t0.16596\t0.02345\t0.18464\t0.07686\t0.01433\t0.09445\t0.00291\t0.00677\t0.00878\t0.02399\t0.00741\n+1\t0.01301\t0.00881\t0.01065\t0.01106\t0.06488\t0.02754\t0.00739\t0.09632\t0.01390\t0.10522\t0.02490\t0.19870\t0.06857\t0.25243\t0.01421\t0.00328\t0.00535\t0.06258\t0.00500\t0.00621\n+2\t0.01143\t0.09962\t0.01390\t0.01086\t0.01265\t0.01186\t0.00876\t0.06624\t0.07008\t0.01687\t0.01677\t0.11029\t0.01616\t0.02734\t0.37804\t0.00578\t0.10600\t0.00714\t0.00379\t0.00642\n+3\t0.01766\t0.02192\t0.09265\t0.02203\t0.17201\t0.30705\t0.16177\t0.05029\t0.01534\t0.01803\t0.01057\t0.01326\t0.00850\t0.00607\t0.00684\t0.00181\t0.05805\t0.00505\t0.00310\t0.00803\n+4\t0.01110\t0.08303\t0.01184\t0.01081\t0.06559\t0.06934\t0.00720\t0.01226\t0.01083\t0.01377\t0.01780\t0.03398\t0.01919\t0.41469\t0.10677\t0.00484\t0.00755\t0.09063\t0.00363\t0.00517\n+5\t0.01223\t0.01450\t0.15480\t0.01526\t0.14099\t0.01024\t0.01189\t0.01676\t0.05894\t0.02023\t0.10149\t0.02064\t0.03964\t0.00675\t0.00558\t0.00152\t0.00557\t0.02812\t0.00392\t0.33092\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+4\t20\n+\n+[block]\n+# block no. 1 follows, 38 sequences, length 26\n+# corresponding to MSA columns:\n+# 73-98\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.25149\t0.14113\t0.01520\t0.00997\t0.01415\t0.08546\t0.00832\t0.05911\t0.03392\t0.11335\t0.06561\t0.01483\t0.01249\t0.00626\t0.00476\t0.00157\t0.00554\t0.00448\t0.00432\t0.14804\n+1\t0.07348\t0.03934\t0.09680\t0.01255\t0.01712\t0.07805\t0.08044\t0.07005\t0.06659\t0.09585\t0.07928\t0.04540\t0.01554\t0.02752\t0.00630\t0.00177\t0.00624\t0.00589\t0.00444\t0.17736\n+2\t0.08510\t0.23408\t0.01867\t0.04879\t0.01552\t0.08762\t0.04348\t0.03912\t0.02883\t0.01637\t0.01269\t0.04703\t0.01215\t0.11685\t0.10930\t0.00332\t0.06561\t0.00559\t0.00330\t0.00658\n+3\t0.35836\t0.00885\t0.00838\t0.00776\t0.01002\t0.00953\t0.00573\t0.01427\t0.02999\t0.04830\t0.01823\t0.05324\t0.07276\t0.24103\t0.06152\t0.00355\t0.00559\t0.00657\t0.00409\t0.03222\n+4\t0.01246\t0.01056\t0.03903\t0.06333\t0.03420\t0.01068\t0.00844\t0.12065\t0.17397\t0.02060\t0.06523\t0.04484\t0.09549\t0.24432\t0.01370\t0.00315\t0.00550\t0.02223\t0.00485\t0.00679\n+5\t0.01619\t0.01600\t0.07018\t0.02326\t0.15347\t0.03000\t0.36561\t0.04394\t0.09232\t0.10516\t0.01459\t0.01677\t0.01076\t0.00585\t0.00652\t0.00194\t0.00829\t0.00637\t0.00393\t0.00885\n+6\t0.01180\t0.01118\t0.01773\t0.49506\t0.05675\t0.01425\t0.01521\t0.01500\t0.01157\t0.01566\t0.03468\t0.01810\t0.01061\t0.00778\t0.00977\t0.00219\t0.21140\t0.03167\t0.00291\t0.00668\n+7\t0.02122\t0.01675\t0.01688\t0.01353\t0.01790\t0.07746\t0.01096\t0.50091\t0.18339\t0.05351\t0.01650\t0.01608\t0.01195\t0.00735\t0.00599\t0.00184\t0.00651\t0.00561\t0.00585\t0.00981\n+8\t0.06401\t0.01299\t0.02198\t0.01963\t0.12843\t0.01318\t0.25928\t0.06407\t0.08114\t0.07788\t0.01608\t0.08407\t0.01372\t0.03165\t0.05228\t0.00257\t0.03770\t0.00720\t0.00412\t0.00803\n+9\t0.06281\t0.01403\t0.03314\t0.04081\t0.01793\t0.04917\t0.03358\t0.22506\t0.11750\t0.29667\t0.01842\t0.01763\t0.01268\t0.00801\t0.02309\t0.00204\t0.00635\t0.00571\t0.00594\t0.00945\n+10\t0.01355\t0.01107\t0.01287\t0.00927\t0.01456\t0.00871\t0.00745\t0.06050\t0.01361\t0.04244\t0.01131\t0.01283\t0.00917\t0.00472\t0.00460\t0.00098\t0.00461\t0.00375\t0.00383\t0.75017\n+11\t0.01027\t0.00728\t0.00835\t0.00782\t0.01004\t0.00668\t0.00614\t0.06519\t0.01585\t0.07182\t0.21508\t0.04989\t0.40942\t0.01352\t0.00706\t0.00204\t0.00365\t0.07790\t0.00599\t0.00601\n+12\t0.01444\t0.01238\t0.01315\t0.01186\t0.01511\t0.01421\t0.00921\t0.03030\t0.68177\t0.02508\t0.08292\t0.02426\t0.02147\t0.00850\t0.00620\t0.00203\t0.00461\t0.00713\t0.00616\t0.00921\n+13\t0.01471\t0.01264\t0.01342\t0.01219\t0.01549\t0.01458\t0.00953\t0.03104\t0.70555\t0.02482\t0.02484\t0.02461\t0.01914\t0.00856\t0.00623\t0.00208\t0.00480\t0.04036\t0.00609\t0.00933\n+14\t0.53004\t0.01166\t0.01067\t0.00926\t0.01307\t0.01300\t0.00752\t0.02254\t0.15877\t0.15005\t0.01423\t0.01414\t0.01033\t0.00642\t0.00460\t0.00190\t0.00475\t0.00445\t0.00484\t0.007'..b'143\t0.01337\t0.01671\t0.01537\t0.01203\t0.01537\t0.01069\t0.01604\t0.00802\t0.00601\t0.00601\t0.00200\t0.00802\t0.00535\t0.00267\t0.00668\n+19\t0.01608\t0.79220\t0.03152\t0.01029\t0.01544\t0.02380\t0.01029\t0.01801\t0.01222\t0.01415\t0.00836\t0.00965\t0.00772\t0.00515\t0.00386\t0.00129\t0.00643\t0.00322\t0.00257\t0.00772\n+20\t0.07376\t0.00967\t0.01138\t0.00951\t0.01300\t0.00955\t0.00762\t0.02511\t0.16193\t0.36885\t0.02180\t0.02067\t0.01518\t0.00735\t0.00543\t0.00178\t0.00441\t0.00590\t0.21845\t0.00864\n+21\t0.01164\t0.01085\t0.01856\t0.66480\t0.06503\t0.01308\t0.05513\t0.01562\t0.01224\t0.01612\t0.01128\t0.01635\t0.00853\t0.00599\t0.00597\t0.00197\t0.00782\t0.00546\t0.04673\t0.00681\n+22\t0.07526\t0.01642\t0.01689\t0.01317\t0.01779\t0.06320\t0.01081\t0.55360\t0.02504\t0.12562\t0.01490\t0.01468\t0.01042\t0.00708\t0.00584\t0.00180\t0.00657\t0.00526\t0.00587\t0.00979\n+23\t0.00992\t0.07644\t0.00992\t0.00815\t0.00925\t0.04905\t0.00580\t0.01076\t0.01068\t0.01348\t0.02367\t0.10083\t0.10697\t0.35575\t0.11551\t0.03480\t0.00692\t0.04345\t0.00392\t0.00474\n+24\t0.01398\t0.01249\t0.01461\t0.01078\t0.01581\t0.04649\t0.04576\t0.07815\t0.01404\t0.02075\t0.01092\t0.01279\t0.00894\t0.00504\t0.00536\t0.00113\t0.03464\t0.00399\t0.00369\t0.64063\n+25\t0.01436\t0.01389\t0.02416\t0.09048\t0.62339\t0.01400\t0.06701\t0.01805\t0.01372\t0.01945\t0.03582\t0.01607\t0.01096\t0.00562\t0.00608\t0.00182\t0.00728\t0.00566\t0.00308\t0.00909\n+26\t0.00854\t0.00631\t0.00889\t0.00889\t0.00982\t0.00707\t0.00663\t0.01025\t0.00972\t0.01366\t0.01910\t0.02845\t0.05650\t0.18228\t0.58618\t0.00853\t0.01348\t0.00722\t0.00343\t0.00503\n+27\t0.01548\t0.01479\t0.02488\t0.08571\t0.02524\t0.01588\t0.32385\t0.16342\t0.10193\t0.02266\t0.01392\t0.03561\t0.01096\t0.00702\t0.00835\t0.00207\t0.10936\t0.00658\t0.00399\t0.00830\n+28\t0.00854\t0.00740\t0.01122\t0.00999\t0.01203\t0.00669\t0.11545\t0.01073\t0.01381\t0.01803\t0.18368\t0.26156\t0.28933\t0.01415\t0.00727\t0.00212\t0.00422\t0.01277\t0.00541\t0.00560\n+29\t0.35512\t0.01090\t0.01184\t0.00958\t0.01377\t0.01095\t0.00789\t0.04454\t0.01468\t0.41869\t0.03498\t0.01653\t0.01236\t0.00680\t0.00512\t0.00186\t0.00492\t0.00501\t0.00586\t0.00860\n+30\t0.01010\t0.00847\t0.00884\t0.00832\t0.01041\t0.03290\t0.00625\t0.01566\t0.18843\t0.02053\t0.24690\t0.04218\t0.29003\t0.05455\t0.00803\t0.00217\t0.00380\t0.01007\t0.02605\t0.00631\n+31\t0.00895\t0.00620\t0.00686\t0.00671\t0.00838\t0.00571\t0.00501\t0.02902\t0.01457\t0.02047\t0.23442\t0.08868\t0.31088\t0.01235\t0.00637\t0.00185\t0.00305\t0.01048\t0.21455\t0.00549\n+32\t0.01619\t0.10104\t0.01615\t0.01236\t0.01602\t0.06426\t0.00992\t0.09365\t0.53279\t0.02429\t0.02094\t0.02045\t0.01607\t0.00778\t0.00586\t0.00192\t0.00552\t0.02013\t0.00551\t0.00914\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+1\t2\n+\n+[block]\n+# block no. 6 follows, 38 sequences, length 7\n+# corresponding to MSA columns:\n+# 294-300\n+name=unknown_G\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.05286\t0.23850\t0.15343\t0.01594\t0.08273\t0.08953\t0.06896\t0.12641\t0.01581\t0.08512\t0.01169\t0.01294\t0.00892\t0.00589\t0.00528\t0.00167\t0.00748\t0.00456\t0.00368\t0.00859\n+1\t0.68141\t0.08182\t0.01163\t0.00885\t0.01264\t0.08693\t0.00734\t0.01832\t0.01107\t0.02468\t0.00846\t0.00987\t0.00674\t0.00561\t0.00390\t0.00178\t0.00541\t0.00331\t0.00356\t0.00667\n+2\t0.01084\t0.00712\t0.00841\t0.00771\t0.00966\t0.00683\t0.00589\t0.04921\t0.04952\t0.06484\t0.40564\t0.03893\t0.14590\t0.01108\t0.00643\t0.00183\t0.00327\t0.00948\t0.15119\t0.00624\n+3\t0.04218\t0.01748\t0.19430\t0.01534\t0.07807\t0.05936\t0.04927\t0.12165\t0.11178\t0.02264\t0.09217\t0.06371\t0.07146\t0.00843\t0.00649\t0.00194\t0.02417\t0.00701\t0.00446\t0.00810\n+4\t0.00788\t0.00612\t0.00717\t0.00691\t0.00860\t0.00541\t0.00518\t0.01013\t0.01554\t0.02059\t0.43955\t0.05075\t0.36730\t0.01362\t0.00710\t0.00195\t0.00293\t0.01169\t0.00616\t0.00541\n+5\t0.01522\t0.09663\t0.25634\t0.01961\t0.12625\t0.01617\t0.13252\t0.13288\t0.07957\t0.02207\t0.01254\t0.01444\t0.00952\t0.00612\t0.00636\t0.00187\t0.03415\t0.00528\t0.00356\t0.00893\n+6\t0.51302\t0.14545\t0.05695\t0.01029\t0.04448\t0.01469\t0.00874\t0.01837\t0.01141\t0.06614\t0.00968\t0.01093\t0.00755\t0.00555\t0.00414\t0.00170\t0.00532\t0.00359\t0.00364\t0.05837\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+8\t18\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W0CIU.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W0DGR.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W0DGR.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,248 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+17\t81\n+\n+[block]\n+# block no. 0 follows, 31 sequences, length 13\n+# corresponding to MSA columns:\n+# 102-114\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01605\t0.01785\t0.12492\t0.15234\t0.32647\t0.01507\t0.08790\t0.02075\t0.01518\t0.05380\t0.01334\t0.01695\t0.01039\t0.00624\t0.00670\t0.00201\t0.00849\t0.00596\t0.00357\t0.09601\n+1\t0.01562\t0.31021\t0.22505\t0.06927\t0.05495\t0.05811\t0.01612\t0.01972\t0.01397\t0.01807\t0.01207\t0.01530\t0.01016\t0.01321\t0.11792\t0.00324\t0.01026\t0.00495\t0.00309\t0.00871\n+2\t0.01934\t0.20946\t0.02568\t0.01626\t0.02034\t0.13531\t0.10537\t0.10636\t0.01676\t0.05001\t0.01282\t0.01688\t0.01105\t0.06723\t0.01115\t0.00239\t0.13647\t0.00575\t0.00396\t0.02741\n+3\t0.03705\t0.00960\t0.01030\t0.06894\t0.01377\t0.06514\t0.00766\t0.01287\t0.01307\t0.01694\t0.03030\t0.15493\t0.13911\t0.23696\t0.08735\t0.00447\t0.00738\t0.04984\t0.00480\t0.02951\n+4\t0.00953\t0.00684\t0.00893\t0.00973\t0.01077\t0.00634\t0.00695\t0.01106\t0.01364\t0.01849\t0.08683\t0.45784\t0.04038\t0.08734\t0.01147\t0.02774\t0.00463\t0.11006\t0.00596\t0.06546\n+5\t0.04486\t0.01396\t0.01530\t0.08372\t0.01929\t0.07013\t0.01074\t0.12343\t0.16524\t0.13619\t0.07294\t0.07628\t0.02026\t0.01073\t0.00851\t0.06692\t0.00646\t0.00772\t0.00600\t0.04133\n+6\t0.05064\t0.51091\t0.08725\t0.04034\t0.01988\t0.10115\t0.01301\t0.02236\t0.06518\t0.01819\t0.01130\t0.01275\t0.00962\t0.00635\t0.00503\t0.00167\t0.00794\t0.00425\t0.00334\t0.00885\n+7\t0.01568\t0.09483\t0.01468\t0.01148\t0.01425\t0.08739\t0.00912\t0.01981\t0.08575\t0.11248\t0.21363\t0.16228\t0.03589\t0.01299\t0.00746\t0.00226\t0.00566\t0.08023\t0.00632\t0.00780\n+8\t0.01032\t0.00738\t0.00904\t0.00967\t0.01060\t0.00726\t0.00671\t0.06551\t0.01430\t0.01892\t0.03409\t0.44689\t0.07508\t0.18197\t0.01433\t0.00357\t0.00500\t0.06764\t0.00590\t0.00581\n+9\t0.00880\t0.00638\t0.00829\t0.00964\t0.01038\t0.00598\t0.00684\t0.01028\t0.01359\t0.01781\t0.03976\t0.54961\t0.10844\t0.05709\t0.01007\t0.00298\t0.00441\t0.11779\t0.00623\t0.00562\n+10\t0.01478\t0.08642\t0.02312\t0.50386\t0.03906\t0.01701\t0.07174\t0.05462\t0.08398\t0.02013\t0.01383\t0.01819\t0.01049\t0.00697\t0.00671\t0.00220\t0.00869\t0.00618\t0.00365\t0.00838\n+11\t0.01621\t0.17578\t0.40638\t0.01803\t0.07619\t0.01683\t0.01922\t0.02180\t0.01532\t0.08918\t0.07004\t0.01777\t0.01419\t0.00714\t0.00626\t0.00201\t0.00842\t0.00562\t0.00385\t0.00975\n+12\t0.00901\t0.00653\t0.00840\t0.00922\t0.01016\t0.00610\t0.00656\t0.01084\t0.01483\t0.01989\t0.19882\t0.40698\t0.10818\t0.07465\t0.01055\t0.00291\t0.00418\t0.08001\t0.00646\t0.00575\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+6\t18\n+\n+[block]\n+# block no. 1 follows, 31 sequences, length 6\n+# corresponding to MSA columns:\n+# 137-142\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.09577\t0.09388\t0.07624\t0.01438\t0.01963\t0.15583\t0.01244\t0.19606\t0.10820\t0.05326\t0.01500\t0.01560\t0.01138\t0.00723\t0.00601\t0.00187\t0.00782\t0.00524\t0.00501\t0.09913\n+1\t0.00977\t0.00733\t0.01100\t0.01100\t0.01222\t0.00855\t0.00855\t0.01222\t0.01100\t0.01588\t0.01833\t0.02688\t0.01710\t0.05131\t0.73245\t0.01100\t0.01833\t0.00733\t0.00367\t0.00611\n+2\t0.01066\t0.06915\t0.01392\t0.01143\t0.01335\t0.00925\t0.07431\t0.01273\t0.01373\t0.01805\t0.07289\t0.24696\t0.10645\t0.13477\t0.08076\t0.00395\t0.00692\t0.08928\t0.00526\t0.00618\n+3\t0.01659\t0.48640\t0.13434\t0.01430\t0.05399\t0.02164\t0.01380\t0.01989\t0.01423\t0.01818\t0.01238\t0.01712\t0.01132\t0.00687\t0.00527\t0.00168\t0.00748\t0.05460\t0.00331\t0.08661\n+4\t0.01283\t0.04006\t0.08467\t0.01103\t0.01416\t0.01000\t0.00949\t0.06469\t0.01569\t0.05256\t0.15607\t0.09245\t0.06434\t0.11242\t0.13964\t0.00424\t0.00794\t0.02741\t0.00527\t0.07501\n+5\t0.04474\t0.09592\t0.08936\t0.06065\t0.02147\t0.01372\t0.10824\t0.04062\t0.03607\t0.02170\t0.04114\t0.06875\t0.01638\t0.01140\t0.06147\t0.00258\t0.00801\t0.04143\t0.00422\t0.21212\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+2\t17\n+\n+[block]\n+# block no. 2 follows, 31 sequences, length 6\n+# corresponding to MSA columns:\n+# 161-166\n+name=unknown_C\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.10874\t0.04947\t0.01714\t0.01352\t0.01744\t0.1046'..b'4266\t0.10685\t0.01478\t0.10322\t0.01682\t0.02070\t0.01146\t0.01328\t0.00951\t0.00823\t0.03449\t0.00210\t0.00893\t0.00454\t0.00351\t0.00924\n+31\t0.01275\t0.00638\t0.00638\t0.00638\t0.00797\t0.00638\t0.00478\t0.01594\t0.01435\t0.02551\t0.02232\t0.02551\t0.01754\t0.00797\t0.00478\t0.00159\t0.00319\t0.00638\t0.79755\t0.00638\n+32\t0.01916\t0.01386\t0.01593\t0.01193\t0.01762\t0.01255\t0.00966\t0.17363\t0.06900\t0.11631\t0.01615\t0.01667\t0.01212\t0.00652\t0.00584\t0.00148\t0.00574\t0.00516\t0.00546\t0.46523\n+33\t0.10667\t0.07948\t0.06995\t0.01483\t0.04954\t0.07931\t0.03998\t0.15084\t0.03756\t0.12096\t0.05665\t0.02106\t0.05977\t0.00809\t0.00632\t0.00195\t0.00708\t0.00635\t0.00534\t0.07828\n+34\t0.07343\t0.20322\t0.08721\t0.03912\t0.02332\t0.10514\t0.14088\t0.10852\t0.01749\t0.04356\t0.01341\t0.01699\t0.01090\t0.00696\t0.00618\t0.00192\t0.00868\t0.03190\t0.00406\t0.05712\n+35\t0.05328\t0.13095\t0.07725\t0.01543\t0.02071\t0.11914\t0.06991\t0.20752\t0.02036\t0.06460\t0.04347\t0.01809\t0.03663\t0.00774\t0.00681\t0.00193\t0.03131\t0.00593\t0.00487\t0.06406\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+27\t59\n+\n+[block]\n+# block no. 7 follows, 31 sequences, length 16\n+# corresponding to MSA columns:\n+# 448-463\n+name=unknown_H\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01520\t0.04600\t0.12089\t0.15838\t0.03083\t0.04111\t0.25183\t0.04412\t0.03836\t0.02120\t0.01601\t0.04710\t0.01368\t0.00807\t0.00776\t0.00227\t0.03053\t0.06091\t0.00386\t0.04188\n+1\t0.80789\t0.01323\t0.01006\t0.00900\t0.01323\t0.01535\t0.00741\t0.02011\t0.01164\t0.03070\t0.00953\t0.01111\t0.00741\t0.00635\t0.00423\t0.00212\t0.00529\t0.00370\t0.00423\t0.00741\n+2\t0.01466\t0.17766\t0.53107\t0.01721\t0.02615\t0.01756\t0.02122\t0.02108\t0.01432\t0.02061\t0.01172\t0.01374\t0.00881\t0.00626\t0.00597\t0.00194\t0.00915\t0.00470\t0.00299\t0.07319\n+3\t0.01577\t0.01507\t0.02567\t0.24457\t0.52337\t0.01595\t0.02042\t0.01998\t0.01503\t0.02094\t0.01266\t0.01731\t0.01034\t0.00631\t0.00679\t0.00210\t0.00841\t0.00609\t0.00329\t0.00990\n+4\t0.00834\t0.00595\t0.00794\t0.00953\t0.00992\t0.00556\t0.00635\t0.00953\t0.01310\t0.01746\t0.03771\t0.75510\t0.04525\t0.02143\t0.00873\t0.00278\t0.00397\t0.01945\t0.00635\t0.00556\n+5\t0.01419\t0.01216\t0.01419\t0.01013\t0.01621\t0.00912\t0.00811\t0.01723\t0.01419\t0.02229\t0.01216\t0.01419\t0.01013\t0.00507\t0.00507\t0.00101\t0.00507\t0.00405\t0.00405\t0.80139\n+6\t0.00846\t0.00695\t0.00745\t0.00733\t0.00947\t0.00594\t0.00549\t0.01055\t0.01648\t0.02060\t0.22144\t0.06236\t0.56066\t0.01654\t0.00808\t0.00227\t0.00341\t0.01395\t0.00663\t0.00594\n+7\t0.03070\t0.01164\t0.01588\t0.01217\t0.01746\t0.01006\t0.01006\t0.03334\t0.01958\t0.72163\t0.02699\t0.02329\t0.01694\t0.00847\t0.00688\t0.00212\t0.00582\t0.00688\t0.00847\t0.01164\n+8\t0.03070\t0.01164\t0.01588\t0.01217\t0.01746\t0.01006\t0.01006\t0.03334\t0.01958\t0.72163\t0.02699\t0.02329\t0.01694\t0.00847\t0.00688\t0.00212\t0.00582\t0.00688\t0.00847\t0.01164\n+9\t0.01693\t0.01626\t0.02777\t0.04199\t0.71689\t0.01626\t0.02100\t0.02100\t0.01558\t0.02235\t0.01287\t0.01693\t0.01084\t0.00610\t0.00677\t0.00203\t0.00813\t0.00610\t0.00339\t0.01084\n+10\t0.01693\t0.01626\t0.02777\t0.04199\t0.71689\t0.01626\t0.02100\t0.02100\t0.01558\t0.02235\t0.01287\t0.01693\t0.01084\t0.00610\t0.00677\t0.00203\t0.00813\t0.00610\t0.00339\t0.01084\n+11\t0.80789\t0.01323\t0.01006\t0.00900\t0.01323\t0.01535\t0.00741\t0.02011\t0.01164\t0.03070\t0.00953\t0.01111\t0.00741\t0.00635\t0.00423\t0.00212\t0.00529\t0.00370\t0.00423\t0.00741\n+12\t0.01375\t0.01303\t0.01075\t0.01030\t0.01223\t0.17639\t0.00737\t0.01512\t0.01472\t0.04641\t0.03571\t0.09202\t0.24690\t0.19990\t0.07218\t0.00396\t0.00765\t0.01045\t0.00502\t0.00614\n+13\t0.01942\t0.11552\t0.04806\t0.04707\t0.02040\t0.33926\t0.01368\t0.02162\t0.01572\t0.01715\t0.01338\t0.04884\t0.01278\t0.00951\t0.01001\t0.00219\t0.17562\t0.05837\t0.00362\t0.00778\n+14\t0.00995\t0.00789\t0.00914\t0.00910\t0.01056\t0.03878\t0.00663\t0.01251\t0.01759\t0.02389\t0.47086\t0.21679\t0.10927\t0.01570\t0.00814\t0.00229\t0.00383\t0.01385\t0.00698\t0.00626\n+15\t0.11919\t0.01393\t0.03595\t0.10356\t0.08135\t0.06191\t0.03267\t0.06942\t0.01557\t0.02251\t0.10075\t0.02829\t0.09275\t0.10014\t0.01183\t0.00277\t0.08750\t0.00777\t0.00457\t0.00756\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t3\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W0DGR.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W0E07.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W0E07.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,389 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t75\n+\n+[block]\n+# block no. 0 follows, 31 sequences, length 8\n+# corresponding to MSA columns:\n+# 111-118\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01137\t0.00833\t0.01309\t0.05863\t0.01594\t0.00796\t0.08460\t0.01351\t0.01422\t0.07339\t0.03401\t0.50463\t0.06871\t0.01742\t0.00839\t0.00264\t0.00537\t0.04519\t0.00598\t0.00662\n+1\t0.01337\t0.01043\t0.01586\t0.27280\t0.11241\t0.01117\t0.01327\t0.01669\t0.01523\t0.07459\t0.09780\t0.03802\t0.11282\t0.06585\t0.00953\t0.00266\t0.00682\t0.09820\t0.00493\t0.00754\n+2\t0.01760\t0.02598\t0.44202\t0.01644\t0.02421\t0.01402\t0.01903\t0.07571\t0.01745\t0.16411\t0.09905\t0.02074\t0.01721\t0.00792\t0.00679\t0.00215\t0.00823\t0.00638\t0.00487\t0.01010\n+3\t0.00856\t0.00642\t0.00779\t0.00878\t0.00979\t0.00586\t0.00613\t0.00994\t0.01377\t0.01763\t0.04581\t0.44892\t0.24392\t0.07847\t0.01065\t0.00297\t0.00418\t0.05867\t0.00617\t0.00556\n+4\t0.01811\t0.01749\t0.05121\t0.12262\t0.26326\t0.10838\t0.01600\t0.02519\t0.16841\t0.07567\t0.01727\t0.02014\t0.01362\t0.04346\t0.00809\t0.00233\t0.00804\t0.00644\t0.00456\t0.00973\n+5\t0.01699\t0.01458\t0.02376\t0.27335\t0.29973\t0.01612\t0.04475\t0.05502\t0.01566\t0.08102\t0.01368\t0.01776\t0.01062\t0.00721\t0.00837\t0.00223\t0.07961\t0.00623\t0.00385\t0.00946\n+6\t0.01269\t0.01177\t0.01966\t0.62371\t0.08437\t0.01426\t0.01781\t0.01687\t0.01374\t0.01778\t0.01486\t0.09487\t0.01299\t0.00831\t0.00703\t0.00232\t0.00852\t0.00747\t0.00341\t0.00759\n+7\t0.01799\t0.01845\t0.06660\t0.07026\t0.42788\t0.09006\t0.08926\t0.02212\t0.01627\t0.06718\t0.03849\t0.01817\t0.01267\t0.00666\t0.00689\t0.00206\t0.00876\t0.00634\t0.00384\t0.01005\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+3\t10\n+\n+[block]\n+# block no. 1 follows, 31 sequences, length 14\n+# corresponding to MSA columns:\n+# 133-146\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.59575\t0.01560\t0.08782\t0.01054\t0.01557\t0.01489\t0.00961\t0.02098\t0.05427\t0.02876\t0.01120\t0.01265\t0.00863\t0.00642\t0.00473\t0.00203\t0.00580\t0.00413\t0.00424\t0.08638\n+1\t0.06812\t0.01431\t0.04534\t0.01399\t0.07506\t0.04805\t0.03342\t0.01824\t0.01458\t0.02261\t0.03986\t0.01643\t0.01244\t0.00736\t0.02928\t0.00169\t0.00646\t0.00489\t0.02511\t0.50277\n+2\t0.01565\t0.02124\t0.18125\t0.02370\t0.09759\t0.05513\t0.30546\t0.02096\t0.01573\t0.02191\t0.04216\t0.01778\t0.01219\t0.00626\t0.00702\t0.00201\t0.00956\t0.00656\t0.00360\t0.13427\n+3\t0.04090\t0.01447\t0.08598\t0.01789\t0.15960\t0.01121\t0.02937\t0.01930\t0.01537\t0.09749\t0.06018\t0.06165\t0.05255\t0.00792\t0.00634\t0.00175\t0.00618\t0.00685\t0.00472\t0.30028\n+4\t0.01411\t0.01439\t0.11937\t0.01331\t0.05846\t0.01029\t0.01117\t0.01894\t0.06702\t0.07400\t0.13250\t0.06782\t0.08467\t0.00933\t0.00661\t0.00182\t0.00559\t0.00792\t0.00527\t0.27742\n+5\t0.01828\t0.04616\t0.11064\t0.01546\t0.02042\t0.18810\t0.07613\t0.04866\t0.06106\t0.07698\t0.05744\t0.09734\t0.01780\t0.00876\t0.00668\t0.00195\t0.00813\t0.00731\t0.00477\t0.12792\n+6\t0.01555\t0.01335\t0.01806\t0.15259\t0.14288\t0.03359\t0.01292\t0.01886\t0.01476\t0.06339\t0.03217\t0.01818\t0.02931\t0.00679\t0.00703\t0.00169\t0.05096\t0.00555\t0.00408\t0.35827\n+7\t0.01292\t0.01216\t0.02052\t0.74312\t0.04712\t0.01520\t0.01900\t0.01748\t0.01368\t0.01748\t0.01216\t0.01824\t0.00912\t0.00684\t0.00684\t0.00228\t0.00912\t0.00608\t0.00304\t0.00760\n+8\t0.07198\t0.02001\t0.01976\t0.05973\t0.02230\t0.10668\t0.01306\t0.53180\t0.02827\t0.03762\t0.01504\t0.01572\t0.01089\t0.00788\t0.00661\t0.00204\t0.00807\t0.00580\t0.00605\t0.01069\n+9\t0.15653\t0.05027\t0.01840\t0.01622\t0.07365\t0.13489\t0.03073\t0.10746\t0.20101\t0.11687\t0.01802\t0.01800\t0.01336\t0.00768\t0.00624\t0.00208\t0.00731\t0.00590\t0.00555\t0.00983\n+10\t0.01045\t0.00767\t0.00962\t0.00930\t0.00954\t0.00855\t0.00619\t0.01110\t0.01021\t0.01413\t0.01956\t0.03800\t0.02161\t0.53785\t0.17276\t0.00711\t0.08853\t0.00900\t0.00393\t0.00490\n+11\t0.01042\t0.00767\t0.00945\t0.00985\t0.01119\t0.00750\t0.00704\t0.08363\t0.01607\t0.02142\t0.11638\t0.48262\t0.12038\t0.01997\t0.03978\t0.00293\t0.00483\t0.01609\t0.00642\t0.00636\n+12\t0.01537\t0.29809\t0.47586\t0.01669\t0.02526\t0.01992\t0.02038\t0.02124\t0.01425\t0.01966\t0.01128\t0.01319\t0.00871\t0.00627\t0.00574\t0.00191\t0.00910\t0.00455\t0.00290\t0.0'..b'02\t0.00630\t0.00515\t0.00163\t0.00865\t0.00414\t0.00330\t0.00891\n+50\t0.02577\t0.01203\t0.01515\t0.01192\t0.01654\t0.01132\t0.00973\t0.14805\t0.02140\t0.46099\t0.10190\t0.02675\t0.04616\t0.00932\t0.00694\t0.00209\t0.00562\t0.00760\t0.05016\t0.01058\n+51\t0.00834\t0.00595\t0.00794\t0.00953\t0.00992\t0.00556\t0.00635\t0.00953\t0.01310\t0.01746\t0.03771\t0.75510\t0.04525\t0.02143\t0.00873\t0.00278\t0.00397\t0.01945\t0.00635\t0.00556\n+52\t0.01558\t0.01367\t0.02207\t0.22222\t0.08978\t0.04680\t0.16552\t0.05424\t0.01523\t0.04517\t0.01521\t0.02204\t0.01263\t0.04003\t0.01069\t0.10324\t0.00850\t0.03089\t0.05871\t0.00777\n+53\t0.04480\t0.05102\t0.04593\t0.29908\t0.17901\t0.05632\t0.11047\t0.03560\t0.07170\t0.02108\t0.01361\t0.01751\t0.01056\t0.00670\t0.00675\t0.00215\t0.00889\t0.00617\t0.00363\t0.00900\n+54\t0.00947\t0.00706\t0.00914\t0.03221\t0.01216\t0.00677\t0.00789\t0.01150\t0.01446\t0.01865\t0.06090\t0.29380\t0.17906\t0.07288\t0.01066\t0.00305\t0.00497\t0.23342\t0.00611\t0.00583\n+55\t0.01028\t0.00658\t0.00785\t0.00785\t0.00799\t0.00667\t0.00470\t0.01019\t0.01005\t0.01372\t0.02014\t0.03982\t0.02243\t0.59077\t0.08049\t0.10705\t0.00722\t0.00913\t0.03286\t0.00421\n+56\t0.50023\t0.08150\t0.05555\t0.01404\t0.08271\t0.01698\t0.01097\t0.01977\t0.01230\t0.02621\t0.01025\t0.01267\t0.00837\t0.00702\t0.00687\t0.00215\t0.09691\t0.00435\t0.02314\t0.00800\n+57\t0.01188\t0.00966\t0.01091\t0.01083\t0.01302\t0.01020\t0.00805\t0.02046\t0.28311\t0.02300\t0.10350\t0.27631\t0.14264\t0.01528\t0.00790\t0.00248\t0.00445\t0.03187\t0.00670\t0.00775\n+58\t0.01704\t0.01713\t0.09951\t0.04785\t0.02030\t0.08291\t0.04572\t0.08837\t0.09168\t0.08002\t0.05286\t0.11523\t0.01902\t0.01151\t0.03449\t0.00252\t0.08402\t0.00806\t0.00509\t0.07663\n+59\t0.01509\t0.34252\t0.12729\t0.04327\t0.01964\t0.01889\t0.04450\t0.01832\t0.01387\t0.01853\t0.03360\t0.10552\t0.01541\t0.00872\t0.00717\t0.00194\t0.06963\t0.00670\t0.05027\t0.03912\n+60\t0.05488\t0.02132\t0.01858\t0.01562\t0.01943\t0.26138\t0.03268\t0.21955\t0.06958\t0.06614\t0.01531\t0.01750\t0.01205\t0.04469\t0.00915\t0.00227\t0.07086\t0.00585\t0.03399\t0.00916\n+61\t0.01620\t0.04338\t0.01835\t0.12204\t0.07055\t0.01424\t0.04354\t0.19920\t0.02002\t0.02656\t0.06214\t0.04123\t0.02440\t0.01198\t0.00784\t0.00249\t0.00727\t0.25452\t0.00558\t0.00848\n+62\t0.01688\t0.01586\t0.02436\t0.15413\t0.31093\t0.05378\t0.09322\t0.05378\t0.04660\t0.04166\t0.01431\t0.01904\t0.01175\t0.04952\t0.00899\t0.00237\t0.03416\t0.00647\t0.00387\t0.03834\n+63\t0.01430\t0.01252\t0.01567\t0.01120\t0.01732\t0.00958\t0.04696\t0.01749\t0.01430\t0.02227\t0.01226\t0.01443\t0.01015\t0.00511\t0.00524\t0.00109\t0.00543\t0.00428\t0.00402\t0.75639\n+64\t0.00880\t0.00663\t0.00760\t0.00810\t0.00925\t0.00604\t0.00557\t0.01006\t0.01361\t0.01726\t0.06599\t0.25377\t0.30509\t0.20285\t0.01497\t0.00355\t0.00452\t0.04515\t0.00584\t0.00535\n+65\t0.01726\t0.17030\t0.02358\t0.13830\t0.06880\t0.11662\t0.06489\t0.05013\t0.01581\t0.02034\t0.01176\t0.01455\t0.00963\t0.00606\t0.00580\t0.00163\t0.00803\t0.00489\t0.00361\t0.24800\n+66\t0.01032\t0.00698\t0.00810\t0.00812\t0.00852\t0.00718\t0.00501\t0.01161\t0.03882\t0.01513\t0.02232\t0.07561\t0.02445\t0.57379\t0.10125\t0.00639\t0.00742\t0.00983\t0.05431\t0.00483\n+67\t0.03866\t0.12932\t0.05854\t0.08157\t0.13766\t0.21504\t0.06987\t0.07276\t0.05501\t0.03618\t0.01466\t0.01675\t0.03058\t0.00709\t0.00635\t0.00195\t0.00918\t0.00568\t0.00397\t0.00915\n+68\t0.01142\t0.01006\t0.03924\t0.01606\t0.11997\t0.00881\t0.05123\t0.01403\t0.01473\t0.03699\t0.07565\t0.36491\t0.08499\t0.01552\t0.00806\t0.00247\t0.00548\t0.06891\t0.00561\t0.04585\n+69\t0.03612\t0.11341\t0.10550\t0.06891\t0.09656\t0.07655\t0.13185\t0.02316\t0.10862\t0.04129\t0.03744\t0.01790\t0.01306\t0.00700\t0.00686\t0.00200\t0.02635\t0.00608\t0.00410\t0.07723\n+70\t0.06129\t0.00808\t0.01008\t0.01048\t0.04246\t0.00753\t0.00735\t0.01374\t0.01614\t0.05693\t0.28460\t0.20809\t0.13361\t0.03284\t0.00841\t0.00239\t0.00420\t0.03670\t0.00644\t0.04864\n+71\t0.10133\t0.11876\t0.14669\t0.03538\t0.07914\t0.10683\t0.05225\t0.10737\t0.01761\t0.04077\t0.04916\t0.02094\t0.07966\t0.00804\t0.00634\t0.00201\t0.00802\t0.00634\t0.00438\t0.00898\n+72\t0.01523\t0.08087\t0.05360\t0.01412\t0.05601\t0.01291\t0.04920\t0.09089\t0.05841\t0.04356\t0.06392\t0.09386\t0.08159\t0.00965\t0.00665\t0.00189\t0.00606\t0.03162\t0.00513\t0.22483\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t32\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W0E07.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W0EOF.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W0EOF.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,184 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t54\n+\n+[block]\n+# block no. 0 follows, 27 sequences, length 98\n+# corresponding to MSA columns:\n+# 56-115,125-162\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01451\t0.00867\t0.01109\t0.00984\t0.01257\t0.00770\t0.00758\t0.01768\t0.02032\t0.14786\t0.46576\t0.05090\t0.14257\t0.01428\t0.00842\t0.00231\t0.00411\t0.01237\t0.00806\t0.03343\n+1\t0.01757\t0.00984\t0.01264\t0.01100\t0.01410\t0.00927\t0.00857\t0.02273\t0.09003\t0.21257\t0.43958\t0.04429\t0.05096\t0.01300\t0.00828\t0.00234\t0.00452\t0.01127\t0.00839\t0.00904\n+2\t0.01912\t0.01739\t0.02949\t0.04395\t0.65914\t0.01730\t0.02219\t0.02345\t0.01712\t0.05790\t0.01473\t0.01872\t0.01209\t0.00674\t0.00736\t0.00221\t0.00869\t0.00666\t0.00395\t0.01180\n+3\t0.01686\t0.01532\t0.01432\t0.01310\t0.01626\t0.11623\t0.01005\t0.04711\t0.27356\t0.02739\t0.16852\t0.03432\t0.07698\t0.01429\t0.05441\t0.00294\t0.00714\t0.00923\t0.07283\t0.00917\n+4\t0.79154\t0.01436\t0.01091\t0.00976\t0.01436\t0.01665\t0.00804\t0.02182\t0.01263\t0.03331\t0.01034\t0.01206\t0.00804\t0.00689\t0.00459\t0.00230\t0.00574\t0.00402\t0.00459\t0.00804\n+5\t0.53971\t0.01378\t0.01301\t0.01091\t0.01588\t0.01475\t0.00899\t0.02659\t0.01549\t0.25405\t0.01663\t0.01645\t0.01147\t0.00765\t0.00555\t0.00230\t0.00593\t0.00516\t0.00612\t0.00957\n+6\t0.01165\t0.00835\t0.01210\t0.01179\t0.01257\t0.00976\t0.00886\t0.01269\t0.01128\t0.01609\t0.01779\t0.02849\t0.01737\t0.11452\t0.43156\t0.17414\t0.08355\t0.00778\t0.00380\t0.00583\n+7\t0.01499\t0.01404\t0.02361\t0.48572\t0.22613\t0.01617\t0.02029\t0.01969\t0.01583\t0.02117\t0.05934\t0.02182\t0.01450\t0.00773\t0.00749\t0.00239\t0.00916\t0.00707\t0.00373\t0.00914\n+8\t0.01069\t0.00786\t0.01160\t0.01160\t0.01280\t0.00905\t0.00887\t0.01298\t0.01178\t0.01691\t0.01991\t0.03028\t0.01896\t0.10121\t0.64306\t0.03537\t0.01861\t0.00810\t0.00399\t0.00638\n+9\t0.06757\t0.15910\t0.53985\t0.01893\t0.02868\t0.01931\t0.02358\t0.02318\t0.01537\t0.02312\t0.01260\t0.01478\t0.00933\t0.00692\t0.00649\t0.00222\t0.01010\t0.00512\t0.00324\t0.01053\n+10\t0.02045\t0.60616\t0.03555\t0.06078\t0.02168\t0.11365\t0.01344\t0.02294\t0.01581\t0.01765\t0.01066\t0.01262\t0.00956\t0.00659\t0.00518\t0.00169\t0.00875\t0.00425\t0.00327\t0.00933\n+11\t0.63040\t0.01487\t0.01279\t0.01091\t0.01577\t0.01674\t0.00899\t0.09274\t0.01593\t0.10412\t0.01312\t0.01406\t0.00961\t0.00735\t0.00520\t0.00229\t0.00606\t0.00467\t0.00538\t0.00901\n+12\t0.02102\t0.01646\t0.01767\t0.01528\t0.01985\t0.01863\t0.01206\t0.13622\t0.53343\t0.08060\t0.02824\t0.02600\t0.02081\t0.00983\t0.00753\t0.00246\t0.00626\t0.00806\t0.00765\t0.01195\n+13\t0.01400\t0.01268\t0.02078\t0.42038\t0.16364\t0.01442\t0.01774\t0.01849\t0.01673\t0.02259\t0.17678\t0.02815\t0.02480\t0.00914\t0.00773\t0.00239\t0.00814\t0.00825\t0.00455\t0.00862\n+14\t0.01061\t0.00795\t0.01193\t0.01193\t0.01326\t0.00928\t0.00928\t0.01326\t0.01193\t0.01723\t0.01988\t0.02916\t0.01856\t0.05568\t0.70968\t0.01193\t0.01988\t0.00795\t0.00398\t0.00663\n+15\t0.00955\t0.00755\t0.00860\t0.00834\t0.01051\t0.00660\t0.00625\t0.01216\t0.01876\t0.02442\t0.35110\t0.06426\t0.41117\t0.01717\t0.00877\t0.00243\t0.00364\t0.01466\t0.00747\t0.00660\n+16\t0.79154\t0.01436\t0.01091\t0.00976\t0.01436\t0.01665\t0.00804\t0.02182\t0.01263\t0.03331\t0.01034\t0.01206\t0.00804\t0.00689\t0.00459\t0.00230\t0.00574\t0.00402\t0.00459\t0.00804\n+17\t0.02034\t0.37538\t0.21566\t0.01584\t0.02314\t0.06092\t0.01676\t0.07040\t0.05056\t0.06731\t0.01400\t0.01512\t0.01096\t0.00717\t0.00600\t0.00195\t0.00887\t0.00508\t0.00412\t0.01041\n+18\t0.01289\t0.00645\t0.00967\t0.00967\t0.00967\t0.00645\t0.00645\t0.00967\t0.00967\t0.01289\t0.01289\t0.02257\t0.01289\t0.02579\t0.02901\t0.78401\t0.00645\t0.00645\t0.00322\t0.00322\n+19\t0.02748\t0.05979\t0.02174\t0.01878\t0.02282\t0.64766\t0.01427\t0.06422\t0.02158\t0.01971\t0.01178\t0.01358\t0.00973\t0.00767\t0.00667\t0.00192\t0.01291\t0.00486\t0.00400\t0.00886\n+20\t0.11480\t0.02016\t0.02969\t0.04761\t0.07636\t0.09093\t0.28324\t0.12725\t0.06419\t0.04983\t0.01586\t0.01857\t0.01189\t0.00731\t0.00756\t0.00235\t0.01011\t0.00715\t0.00485\t0.01030\n+21\t0.05932\t0.05313\t0.02434\t0.33606\t0.24648\t0.08693\t0.01908\t0.02125\t0.01599\t0.02127\t0.01399\t0.04419\t0.01178\t0.00769\t0.00711\t0.00230\t0.00938\t0.00668\t0.00367\t0.00937\n+22\t0.79154\t0.01436\t0.01091\t0.00976\t0.01436\t0.01665\t0.00804\t0.02182\t0.01263\t0.03331\t0.0'..b'19\t0.00730\t0.00741\t0.00243\t0.00973\t0.00660\t0.00336\t0.00880\n+25\t0.01598\t0.01509\t0.02551\t0.32239\t0.38422\t0.01642\t0.02087\t0.02041\t0.01588\t0.02173\t0.01537\t0.06468\t0.01337\t0.00801\t0.00752\t0.00237\t0.00898\t0.00753\t0.00372\t0.00994\n+26\t0.01543\t0.01465\t0.02456\t0.26330\t0.35117\t0.01554\t0.04258\t0.01967\t0.01616\t0.02180\t0.02207\t0.04897\t0.09464\t0.00890\t0.00767\t0.00237\t0.00855\t0.00826\t0.00405\t0.00968\n+27\t0.01523\t0.04134\t0.02327\t0.45572\t0.14363\t0.01671\t0.01889\t0.01958\t0.01503\t0.02033\t0.01299\t0.01850\t0.01030\t0.00736\t0.00813\t0.00227\t0.05404\t0.00622\t0.00349\t0.10696\n+28\t0.01384\t0.00692\t0.00692\t0.00692\t0.00865\t0.00692\t0.00519\t0.01730\t0.01557\t0.02768\t0.02422\t0.02768\t0.01903\t0.00865\t0.00519\t0.00173\t0.00346\t0.00692\t0.78031\t0.00692\n+29\t0.01561\t0.01366\t0.01702\t0.01226\t0.01883\t0.01067\t0.04532\t0.01966\t0.03748\t0.02439\t0.01386\t0.01606\t0.01140\t0.00569\t0.00575\t0.00122\t0.00590\t0.00477\t0.00447\t0.71598\n+30\t0.01702\t0.34114\t0.41655\t0.01753\t0.02652\t0.02245\t0.02111\t0.02296\t0.01542\t0.02092\t0.01203\t0.01406\t0.00946\t0.00675\t0.00607\t0.00202\t0.00967\t0.00483\t0.00315\t0.01035\n+31\t0.01280\t0.00820\t0.01003\t0.00921\t0.01172\t0.00725\t0.00703\t0.01567\t0.01964\t0.11109\t0.39550\t0.05710\t0.27540\t0.01566\t0.00860\t0.00239\t0.00395\t0.01344\t0.00786\t0.00747\n+32\t0.00987\t0.00756\t0.00905\t0.00868\t0.01070\t0.00674\t0.00651\t0.01278\t0.01952\t0.02622\t0.46471\t0.06129\t0.29642\t0.01650\t0.00876\t0.00240\t0.00360\t0.01424\t0.00771\t0.00674\n+33\t0.01790\t0.02059\t0.04297\t0.03084\t0.03822\t0.04405\t0.64198\t0.02399\t0.01765\t0.02357\t0.01489\t0.01978\t0.01120\t0.00631\t0.00869\t0.00248\t0.01255\t0.00862\t0.00376\t0.00996\n+34\t0.01583\t0.01504\t0.02554\t0.44009\t0.31813\t0.01697\t0.02152\t0.02056\t0.01570\t0.02117\t0.01351\t0.01920\t0.01067\t0.00709\t0.00739\t0.00236\t0.00945\t0.00660\t0.00346\t0.00971\n+35\t0.03310\t0.01297\t0.01743\t0.01337\t0.01912\t0.01141\t0.01104\t0.06207\t0.02181\t0.67126\t0.02882\t0.02496\t0.01814\t0.00918\t0.00746\t0.00229\t0.00639\t0.00743\t0.00912\t0.01263\n+36\t0.01752\t0.02003\t0.04380\t0.03129\t0.03880\t0.01877\t0.66583\t0.02378\t0.01752\t0.02378\t0.01502\t0.02003\t0.01126\t0.00626\t0.00876\t0.00250\t0.01252\t0.00876\t0.00375\t0.01001\n+37\t0.01837\t0.01764\t0.03013\t0.04557\t0.69279\t0.01764\t0.02278\t0.02278\t0.01690\t0.02425\t0.01396\t0.01837\t0.01176\t0.00661\t0.00735\t0.00220\t0.00882\t0.00661\t0.00367\t0.01176\n+38\t0.01042\t0.00748\t0.00828\t0.00825\t0.01036\t0.00673\t0.00629\t0.01312\t0.01768\t0.02414\t0.21555\t0.05948\t0.35971\t0.01597\t0.00815\t0.00237\t0.00383\t0.05341\t0.16217\t0.00662\n+39\t0.03220\t0.01441\t0.01833\t0.01405\t0.01984\t0.01354\t0.01161\t0.17351\t0.02422\t0.55641\t0.02680\t0.02365\t0.01713\t0.00913\t0.00746\t0.00228\t0.00672\t0.00730\t0.00881\t0.01263\n+40\t0.01007\t0.00711\t0.00937\t0.01052\t0.01115\t0.00702\t0.00740\t0.01155\t0.01368\t0.01827\t0.03459\t0.40321\t0.04002\t0.18909\t0.08509\t0.00491\t0.00691\t0.11812\t0.00605\t0.00587\n+41\t0.01180\t0.00843\t0.01178\t0.01349\t0.01512\t0.00841\t0.01168\t0.01510\t0.01693\t0.02204\t0.03940\t0.11981\t0.04308\t0.02066\t0.01021\t0.00340\t0.00670\t0.60836\t0.00684\t0.00679\n+42\t0.03331\t0.01263\t0.01723\t0.01321\t0.01895\t0.01091\t0.01091\t0.03618\t0.02125\t0.69794\t0.02929\t0.02527\t0.01838\t0.00919\t0.00747\t0.00230\t0.00632\t0.00747\t0.00919\t0.01263\n+43\t0.01402\t0.01319\t0.02227\t0.72126\t0.05113\t0.01649\t0.02062\t0.01897\t0.01484\t0.01897\t0.01319\t0.01979\t0.00990\t0.00742\t0.00742\t0.00247\t0.00990\t0.00660\t0.00330\t0.00825\n+44\t0.02830\t0.01877\t0.01856\t0.01510\t0.02012\t0.14830\t0.01209\t0.17846\t0.07464\t0.31900\t0.07060\t0.02363\t0.01940\t0.00933\t0.00741\t0.00223\t0.00787\t0.00727\t0.00755\t0.01139\n+45\t0.01622\t0.01788\t0.03821\t0.02794\t0.03433\t0.01686\t0.55762\t0.02174\t0.01685\t0.02289\t0.01807\t0.09693\t0.01573\t0.01092\t0.04913\t0.00310\t0.01206\t0.01003\t0.00410\t0.00939\n+46\t0.01390\t0.00842\t0.00943\t0.01006\t0.04901\t0.00846\t0.00679\t0.03918\t0.03860\t0.02650\t0.06400\t0.03353\t0.06974\t0.08224\t0.00916\t0.00243\t0.00440\t0.00831\t0.50857\t0.00727\n+47\t0.01909\t0.23971\t0.22756\t0.01861\t0.02597\t0.08305\t0.11735\t0.06856\t0.01789\t0.04542\t0.01733\t0.01906\t0.05372\t0.00773\t0.00676\t0.00211\t0.00972\t0.00628\t0.00405\t0.01005\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t11\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W0EOF.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W0IVU.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W0IVU.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,147 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+14\t117\n+\n+[block]\n+# block no. 0 follows, 27 sequences, length 123\n+# corresponding to MSA columns:\n+# 136-183,206-233,285-305,307-332\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.07166\t0.01473\t0.01922\t0.02045\t0.17246\t0.01471\t0.01327\t0.08495\t0.13432\t0.19177\t0.08909\t0.02467\t0.02093\t0.00882\t0.00720\t0.00219\t0.00657\t0.00744\t0.00661\t0.08894\n+1\t0.06030\t0.02377\t0.27665\t0.05467\t0.17380\t0.01606\t0.01976\t0.04444\t0.07825\t0.07425\t0.02071\t0.02223\t0.06195\t0.00827\t0.00716\t0.00230\t0.00855\t0.00687\t0.00464\t0.03537\n+2\t0.01668\t0.07868\t0.10209\t0.03779\t0.02096\t0.04513\t0.03935\t0.04066\t0.09281\t0.04814\t0.08574\t0.07411\t0.02098\t0.00898\t0.00686\t0.00193\t0.00702\t0.00753\t0.00523\t0.25930\n+3\t0.01943\t0.04174\t0.02122\t0.02410\t0.26169\t0.01400\t0.01439\t0.04427\t0.05798\t0.14328\t0.14443\t0.02640\t0.02435\t0.00878\t0.00728\t0.00208\t0.00667\t0.00773\t0.00592\t0.12427\n+4\t0.01759\t0.01428\t0.02032\t0.02367\t0.26016\t0.01292\t0.01397\t0.02225\t0.05384\t0.08148\t0.09107\t0.02244\t0.01911\t0.00754\t0.00681\t0.00181\t0.00656\t0.00668\t0.00513\t0.31237\n+5\t0.01230\t0.00969\t0.01292\t0.01429\t0.09221\t0.00895\t0.00912\t0.03841\t0.01713\t0.02396\t0.20509\t0.26209\t0.06490\t0.06848\t0.01043\t0.00272\t0.00514\t0.01340\t0.00633\t0.12244\n+6\t0.02163\t0.01665\t0.02456\t0.09309\t0.29432\t0.01729\t0.04275\t0.15289\t0.07641\t0.12346\t0.04840\t0.02186\t0.01619\t0.00816\t0.00752\t0.00229\t0.00810\t0.00728\t0.00568\t0.01145\n+7\t0.01856\t0.01424\t0.02237\t0.23613\t0.25939\t0.01474\t0.01746\t0.02318\t0.04178\t0.13159\t0.01875\t0.07268\t0.01537\t0.00854\t0.00740\t0.00228\t0.00802\t0.00770\t0.00490\t0.07495\n+8\t0.01539\t0.01333\t0.01948\t0.30427\t0.12506\t0.03860\t0.01628\t0.01948\t0.01654\t0.04745\t0.06839\t0.03350\t0.02110\t0.01014\t0.00777\t0.00241\t0.00816\t0.12463\t0.00474\t0.10329\n+9\t0.01447\t0.01282\t0.01699\t0.01780\t0.15060\t0.01163\t0.01138\t0.01746\t0.01567\t0.02275\t0.05457\t0.02925\t0.13451\t0.04196\t0.00962\t0.00208\t0.06623\t0.00770\t0.00477\t0.35777\n+10\t0.01212\t0.00963\t0.01410\t0.13971\t0.09856\t0.01043\t0.01073\t0.01428\t0.01311\t0.01789\t0.05051\t0.07431\t0.02362\t0.31380\t0.16016\t0.00626\t0.01008\t0.00968\t0.00438\t0.00665\n+11\t0.01831\t0.01781\t0.03114\t0.04452\t0.64469\t0.01772\t0.07008\t0.02286\t0.01695\t0.02422\t0.01404\t0.01850\t0.01172\t0.00659\t0.00745\t0.00223\t0.00909\t0.00677\t0.00368\t0.01163\n+12\t0.01421\t0.01329\t0.02232\t0.59546\t0.12444\t0.01595\t0.01999\t0.01886\t0.01505\t0.01959\t0.01507\t0.06571\t0.01265\t0.00835\t0.00755\t0.00248\t0.00941\t0.00754\t0.00357\t0.00852\n+13\t0.07275\t0.01527\t0.01921\t0.01667\t0.01777\t0.04971\t0.01359\t0.01779\t0.01219\t0.01916\t0.01206\t0.01909\t0.01170\t0.05716\t0.10373\t0.00424\t0.46994\t0.00652\t0.00360\t0.05784\n+14\t0.73478\t0.06800\t0.01297\t0.00998\t0.01470\t0.01759\t0.00838\t0.02185\t0.01281\t0.03214\t0.01034\t0.01205\t0.00815\t0.00685\t0.00461\t0.00224\t0.00590\t0.00402\t0.00449\t0.00815\n+15\t0.01445\t0.06692\t0.02349\t0.66914\t0.04877\t0.01744\t0.02003\t0.01921\t0.01486\t0.01886\t0.01298\t0.01921\t0.00987\t0.00734\t0.00723\t0.00241\t0.00975\t0.00640\t0.00329\t0.00834\n+16\t0.06660\t0.00704\t0.00878\t0.01029\t0.01103\t0.00681\t0.00698\t0.01118\t0.01410\t0.02001\t0.03867\t0.68114\t0.04608\t0.02205\t0.00912\t0.00296\t0.00441\t0.01985\t0.00672\t0.00618\n+17\t0.01109\t0.00806\t0.01174\t0.06315\t0.01471\t0.00916\t0.00892\t0.01289\t0.01173\t0.01643\t0.01951\t0.03180\t0.01913\t0.18617\t0.46695\t0.07476\t0.01549\t0.00830\t0.00397\t0.00604\n+18\t0.03331\t0.01263\t0.01723\t0.01321\t0.01895\t0.01091\t0.01091\t0.03618\t0.02125\t0.69794\t0.02929\t0.02527\t0.01838\t0.00919\t0.00747\t0.00230\t0.00632\t0.00747\t0.00919\t0.01263\n+19\t0.01838\t0.01751\t0.02915\t0.04333\t0.64325\t0.01770\t0.02197\t0.02401\t0.06563\t0.02475\t0.01516\t0.01906\t0.01256\t0.00687\t0.00736\t0.00223\t0.00860\t0.00675\t0.00396\t0.01176\n+20\t0.06299\t0.01270\t0.01698\t0.01307\t0.01877\t0.01114\t0.01080\t0.03562\t0.02091\t0.67192\t0.02855\t0.02475\t0.01797\t0.00910\t0.00735\t0.00230\t0.00629\t0.00733\t0.00901\t0.01245\n+21\t0.01038\t0.00803\t0.00952\t0.00906\t0.01120\t0.00740\t0.00682\t0.01432\t0.05615\t0.02665\t0.45112\t0.05916\t0.27068\t0.01608\t0.00870\t0.00240\t0.00372\t0.01388\t0.00772\t0.00703\n+22\t0.01080\t0.00720\t0.00810\t0.00810\t0.00810\t0.00720\t0.00450\t0.01080'..b'230\t0.00632\t0.00747\t0.00919\t0.01263\n+100\t0.01682\t0.01605\t0.02733\t0.28669\t0.46382\t0.01723\t0.02201\t0.02142\t0.01617\t0.02237\t0.01369\t0.01888\t0.01109\t0.00690\t0.00738\t0.00230\t0.00920\t0.00661\t0.00354\t0.01051\n+101\t0.01080\t0.00720\t0.00810\t0.00810\t0.00810\t0.00720\t0.00450\t0.01080\t0.01080\t0.01439\t0.02339\t0.04858\t0.02699\t0.73910\t0.03779\t0.00720\t0.00720\t0.01080\t0.00450\t0.00450\n+102\t0.01941\t0.01992\t0.02704\t0.11491\t0.47552\t0.12953\t0.02056\t0.02439\t0.05405\t0.02306\t0.01438\t0.01824\t0.01180\t0.00706\t0.00726\t0.00220\t0.00952\t0.00641\t0.00387\t0.01086\n+103\t0.01869\t0.01584\t0.02122\t0.36437\t0.05431\t0.01860\t0.01701\t0.18499\t0.17381\t0.02882\t0.01831\t0.02110\t0.01358\t0.00838\t0.00745\t0.00242\t0.00851\t0.00704\t0.00532\t0.01024\n+104\t0.02773\t0.03538\t0.02104\t0.01913\t0.02295\t0.70930\t0.01434\t0.02964\t0.02104\t0.01817\t0.01148\t0.01339\t0.00956\t0.00765\t0.00669\t0.00191\t0.01339\t0.00478\t0.00383\t0.00861\n+105\t0.00904\t0.00646\t0.00861\t0.01034\t0.01077\t0.00603\t0.00689\t0.01034\t0.01421\t0.01895\t0.04092\t0.73426\t0.04910\t0.02326\t0.00948\t0.00301\t0.00431\t0.02110\t0.00689\t0.00603\n+106\t0.01539\t0.01319\t0.01539\t0.01100\t0.01759\t0.00990\t0.00880\t0.01869\t0.01539\t0.02419\t0.01319\t0.01539\t0.01100\t0.00550\t0.00550\t0.00110\t0.00550\t0.00440\t0.00440\t0.78449\n+107\t0.30239\t0.01330\t0.01482\t0.01179\t0.01720\t0.01288\t0.00971\t0.02959\t0.01768\t0.40440\t0.02118\t0.01973\t0.01407\t0.00806\t0.00628\t0.00220\t0.00604\t0.00598\t0.00715\t0.07557\n+108\t0.01799\t0.07782\t0.02506\t0.02720\t0.26585\t0.04541\t0.01702\t0.02472\t0.15040\t0.02330\t0.04021\t0.02031\t0.01527\t0.00939\t0.01185\t0.00250\t0.20403\t0.00690\t0.00447\t0.01029\n+109\t0.03331\t0.01263\t0.01723\t0.01321\t0.01895\t0.01091\t0.01091\t0.03618\t0.02125\t0.69794\t0.02929\t0.02527\t0.01838\t0.00919\t0.00747\t0.00230\t0.00632\t0.00747\t0.00919\t0.01263\n+110\t0.01165\t0.00844\t0.01153\t0.01307\t0.01486\t0.00832\t0.01134\t0.01492\t0.01707\t0.02200\t0.04282\t0.08254\t0.10608\t0.02034\t0.01011\t0.00333\t0.00653\t0.58142\t0.00684\t0.00678\n+111\t0.79154\t0.01436\t0.01091\t0.00976\t0.01436\t0.01665\t0.00804\t0.02182\t0.01263\t0.03331\t0.01034\t0.01206\t0.00804\t0.00689\t0.00459\t0.00230\t0.00574\t0.00402\t0.00459\t0.00804\n+112\t0.01606\t0.01601\t0.02489\t0.17159\t0.08937\t0.02065\t0.06621\t0.01899\t0.01307\t0.01913\t0.01126\t0.01747\t0.01007\t0.01072\t0.01805\t0.00293\t0.45487\t0.00670\t0.00334\t0.00862\n+113\t0.05710\t0.01326\t0.02164\t0.68184\t0.04909\t0.01650\t0.01992\t0.01913\t0.01472\t0.01976\t0.01304\t0.01936\t0.00979\t0.00739\t0.00727\t0.00246\t0.00967\t0.00645\t0.00337\t0.00824\n+114\t0.00904\t0.00753\t0.00789\t0.00780\t0.01019\t0.00638\t0.00585\t0.01117\t0.01755\t0.02154\t0.16915\t0.06900\t0.59490\t0.01825\t0.00877\t0.00248\t0.00372\t0.01532\t0.00709\t0.00638\n+115\t0.01402\t0.01319\t0.02227\t0.72126\t0.05113\t0.01649\t0.02062\t0.01897\t0.01484\t0.01897\t0.01319\t0.01979\t0.00990\t0.00742\t0.00742\t0.00247\t0.00990\t0.00660\t0.00330\t0.00825\n+116\t0.00877\t0.00752\t0.00752\t0.00752\t0.01003\t0.00627\t0.00564\t0.01065\t0.01692\t0.02005\t0.07520\t0.07144\t0.68978\t0.01880\t0.00877\t0.00251\t0.00376\t0.01567\t0.00689\t0.00627\n+117\t0.01168\t0.00835\t0.01160\t0.01307\t0.01472\t0.00827\t0.01121\t0.01501\t0.01738\t0.02287\t0.10804\t0.10971\t0.04590\t0.02007\t0.01006\t0.00329\t0.00637\t0.54862\t0.00698\t0.00682\n+118\t0.01117\t0.00805\t0.01017\t0.01116\t0.01222\t0.00791\t0.00782\t0.08003\t0.01650\t0.02200\t0.03842\t0.63682\t0.04503\t0.02165\t0.00928\t0.00295\t0.00480\t0.04033\t0.00695\t0.00675\n+119\t0.01140\t0.00875\t0.01326\t0.04537\t0.05845\t0.00999\t0.01036\t0.01423\t0.01250\t0.01812\t0.01948\t0.02850\t0.01798\t0.06649\t0.58633\t0.01034\t0.01771\t0.00784\t0.03592\t0.00699\n+120\t0.01639\t0.01401\t0.01680\t0.01328\t0.04808\t0.01162\t0.01007\t0.06073\t0.01655\t0.02539\t0.01339\t0.01572\t0.01108\t0.00608\t0.00648\t0.00131\t0.03548\t0.00473\t0.00451\t0.66831\n+121\t0.02619\t0.01918\t0.02062\t0.01620\t0.02161\t0.02118\t0.01334\t0.57119\t0.06161\t0.04384\t0.01967\t0.02161\t0.01472\t0.00942\t0.00740\t0.00226\t0.00771\t0.03298\t0.05726\t0.01198\n+122\t0.01630\t0.01502\t0.02225\t0.56278\t0.07076\t0.04263\t0.01927\t0.09026\t0.01736\t0.02239\t0.01367\t0.01910\t0.01030\t0.00748\t0.00731\t0.00236\t0.00961\t0.00645\t0.00383\t0.04085\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t21\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W0IVU.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/funannotate_db/insecta/prfl/EOG090W0MBV.prfl
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/funannotate_db/insecta/prfl/EOG090W0MBV.prfl Thu Apr 13 17:16:35 2023 +0000
[
b'@@ -0,0 +1,181 @@\n+[name]\n+unknown\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t7\n+\n+[block]\n+# block no. 0 follows, 35 sequences, length 10\n+# corresponding to MSA columns:\n+# 7-16\n+name=unknown_A\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.02359\t0.19577\t0.01918\t0.01164\t0.01632\t0.03856\t0.01007\t0.07779\t0.01745\t0.42598\t0.02068\t0.02254\t0.01514\t0.00808\t0.00602\t0.00189\t0.00609\t0.06745\t0.00618\t0.00960\n+1\t0.01775\t0.66813\t0.07291\t0.01131\t0.01692\t0.02308\t0.01145\t0.02013\t0.01339\t0.08060\t0.01043\t0.01139\t0.00882\t0.00568\t0.00439\t0.00145\t0.00681\t0.00374\t0.00317\t0.00845\n+2\t0.14091\t0.35037\t0.26236\t0.01289\t0.01934\t0.01867\t0.01426\t0.02031\t0.01318\t0.08020\t0.01104\t0.01222\t0.00855\t0.00590\t0.00489\t0.00172\t0.00723\t0.00408\t0.00332\t0.00858\n+3\t0.01482\t0.36147\t0.37657\t0.01646\t0.07589\t0.01933\t0.01759\t0.01956\t0.01325\t0.01786\t0.01029\t0.01215\t0.00823\t0.00573\t0.00518\t0.00171\t0.00809\t0.00419\t0.00273\t0.00888\n+4\t0.07353\t0.00686\t0.00825\t0.00817\t0.00888\t0.00741\t0.00551\t0.01070\t0.00969\t0.01443\t0.01806\t0.03327\t0.01927\t0.46201\t0.28058\t0.00723\t0.00983\t0.00792\t0.00370\t0.00472\n+5\t0.01615\t0.63838\t0.16866\t0.01223\t0.01841\t0.02313\t0.01325\t0.01920\t0.01299\t0.01591\t0.00931\t0.01079\t0.00812\t0.00554\t0.00444\t0.00148\t0.00728\t0.00364\t0.00271\t0.00838\n+6\t0.28659\t0.04777\t0.04361\t0.01184\t0.01587\t0.18001\t0.00983\t0.02236\t0.06765\t0.11491\t0.03453\t0.01465\t0.01120\t0.00685\t0.00592\t0.00184\t0.04358\t0.00466\t0.00440\t0.07192\n+7\t0.01686\t0.60647\t0.14042\t0.01240\t0.01825\t0.08191\t0.01289\t0.01967\t0.01338\t0.01576\t0.00929\t0.01077\t0.00813\t0.00561\t0.00450\t0.00148\t0.00755\t0.00365\t0.00275\t0.00827\n+8\t0.01596\t0.60458\t0.20079\t0.01256\t0.01892\t0.02266\t0.01382\t0.01925\t0.01301\t0.01614\t0.00942\t0.01093\t0.00812\t0.00557\t0.00453\t0.00151\t0.00739\t0.00370\t0.00271\t0.00843\n+9\t0.08097\t0.00754\t0.00928\t0.00848\t0.01061\t0.00706\t0.00645\t0.01429\t0.01660\t0.09376\t0.50524\t0.10529\t0.04697\t0.01208\t0.00699\t0.00199\t0.00353\t0.01050\t0.00655\t0.04580\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t3\n+\n+[block]\n+# block no. 1 follows, 35 sequences, length 6\n+# corresponding to MSA columns:\n+# 20-25\n+name=unknown_B\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.08074\t0.57984\t0.10591\t0.01146\t0.01715\t0.02190\t0.01177\t0.02002\t0.01319\t0.07374\t0.01037\t0.01143\t0.00862\t0.00572\t0.00445\t0.00152\t0.00680\t0.00377\t0.00321\t0.00838\n+1\t0.01490\t0.53226\t0.12754\t0.01173\t0.01691\t0.02045\t0.01205\t0.01771\t0.01246\t0.01560\t0.01070\t0.01338\t0.00957\t0.01340\t0.14428\t0.00310\t0.00905\t0.00421\t0.00284\t0.00785\n+2\t0.01062\t0.15131\t0.01283\t0.00864\t0.01000\t0.01023\t0.00639\t0.01169\t0.01020\t0.01352\t0.01700\t0.03065\t0.01810\t0.41286\t0.24385\t0.00647\t0.00954\t0.00740\t0.00350\t0.00520\n+3\t0.01793\t0.67280\t0.03105\t0.01164\t0.01676\t0.12969\t0.01106\t0.01991\t0.01362\t0.01501\t0.00896\t0.01036\t0.00815\t0.00559\t0.00431\t0.00140\t0.00745\t0.00349\t0.00279\t0.00803\n+4\t0.01482\t0.57086\t0.09009\t0.01066\t0.01581\t0.02050\t0.01082\t0.01724\t0.01323\t0.01579\t0.01942\t0.01998\t0.14412\t0.00747\t0.00488\t0.00156\t0.00634\t0.00538\t0.00331\t0.00773\n+5\t0.01332\t0.12525\t0.09355\t0.00978\t0.01335\t0.01020\t0.00895\t0.01635\t0.01618\t0.13131\t0.33326\t0.03633\t0.14596\t0.01079\t0.00665\t0.00192\t0.00466\t0.00905\t0.00584\t0.00731\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+9\t12\n+\n+[block]\n+# block no. 2 follows, 35 sequences, length 13\n+# corresponding to MSA columns:\n+# 42-54\n+name=unknown_C\n+#\n+# <colnr> <probs for GDERKNQSTAVLIFYWHMCP>\n+#\tG\tD\tE\tR\tK\tN\tQ\tS\tT\tA\tV\tL\tI\tF\tY\tW\tH\tM\tC\tP\n+0\t0.01426\t0.01482\t0.02773\t0.01992\t0.02579\t0.01338\t0.42471\t0.01851\t0.01409\t0.02024\t0.01207\t0.01552\t0.00949\t0.00534\t0.00700\t0.00172\t0.03930\t0.00603\t0.00339\t0.30669\n+1\t0.01272\t0.03281\t0.74418\t0.01808\t0.02746\t0.01473\t0.02344\t0.02009\t0.01339\t0.02009\t0.01138\t0.01339\t0.00804\t0.00603\t0.00603\t0.00201\t0.00938\t0.00469\t0.00268\t0.00938\n+2\t0.01380\t0.25406\t0.49537\t0.01553\t0.02331\t0.01747\t0.01891\t0.01932\t0.01308\t0.01828\t0.01091\t0.01302\t0.00846\t0.00796\t0.04333\t0.00223\t0.00899\t0.00441\t0.00273\t0.00882\n+3\t0.01471\t0.38281\t0.41155\t0.01470\t0.02223\t0.01958\t0.01755\t0.'..b'490\t0.01607\t0.00750\t0.00214\t0.00321\t0.01339\t0.00589\t0.00536\n+63\t0.00763\t0.00643\t0.00661\t0.00657\t0.00865\t0.00541\t0.00492\t0.00936\t0.01477\t0.01788\t0.12422\t0.05983\t0.67449\t0.01579\t0.00750\t0.00213\t0.00319\t0.01322\t0.00599\t0.00541\n+64\t0.00750\t0.00643\t0.00643\t0.00643\t0.00857\t0.00536\t0.00482\t0.00910\t0.01446\t0.01714\t0.06427\t0.06105\t0.73490\t0.01607\t0.00750\t0.00214\t0.00321\t0.01339\t0.00589\t0.00536\n+65\t0.01198\t0.01128\t0.01903\t0.76180\t0.04369\t0.01409\t0.01762\t0.01621\t0.01268\t0.01621\t0.01128\t0.01691\t0.00846\t0.00634\t0.00634\t0.00211\t0.00846\t0.00564\t0.00282\t0.00705\n+66\t0.01198\t0.01128\t0.01903\t0.76180\t0.04369\t0.01409\t0.01762\t0.01621\t0.01268\t0.01621\t0.01128\t0.01691\t0.00846\t0.00634\t0.00634\t0.00211\t0.00846\t0.00564\t0.00282\t0.00705\n+67\t0.00910\t0.00667\t0.00954\t0.00954\t0.01044\t0.00757\t0.00711\t0.01091\t0.01000\t0.01424\t0.01759\t0.02825\t0.01731\t0.19410\t0.60736\t0.00938\t0.01481\t0.00728\t0.00349\t0.00530\n+68\t0.00773\t0.00552\t0.00736\t0.00883\t0.00920\t0.00515\t0.00589\t0.00883\t0.01215\t0.01619\t0.03497\t0.77291\t0.04196\t0.01987\t0.00810\t0.00258\t0.00368\t0.01803\t0.00589\t0.00515\n+69\t0.01315\t0.01128\t0.01315\t0.00940\t0.01503\t0.00846\t0.00752\t0.01597\t0.01315\t0.02067\t0.01128\t0.01315\t0.00940\t0.00470\t0.00470\t0.00094\t0.00470\t0.00376\t0.00376\t0.81583\n+70\t0.01696\t0.78087\t0.03324\t0.01085\t0.01628\t0.02510\t0.01085\t0.01900\t0.01289\t0.01493\t0.00882\t0.01018\t0.00814\t0.00543\t0.00407\t0.00136\t0.00678\t0.00339\t0.00271\t0.00814\n+71\t0.08422\t0.01896\t0.01854\t0.01592\t0.01783\t0.24248\t0.03317\t0.05512\t0.01374\t0.03718\t0.00975\t0.01321\t0.00852\t0.00884\t0.01330\t0.00228\t0.39117\t0.00502\t0.00335\t0.00741\n+72\t0.02412\t0.01777\t0.01904\t0.01460\t0.01967\t0.01967\t0.01206\t0.71633\t0.02983\t0.03998\t0.01523\t0.01523\t0.01079\t0.00762\t0.00635\t0.00190\t0.00698\t0.00571\t0.00635\t0.01079\n+73\t0.00908\t0.00671\t0.00975\t0.00975\t0.01073\t0.00769\t0.00738\t0.01104\t0.01006\t0.01440\t0.01740\t0.02717\t0.01683\t0.14621\t0.65462\t0.00965\t0.01553\t0.00713\t0.00346\t0.00542\n+74\t0.01272\t0.03281\t0.74418\t0.01808\t0.02746\t0.01473\t0.02344\t0.02009\t0.01339\t0.02009\t0.01138\t0.01339\t0.00804\t0.00603\t0.00603\t0.00201\t0.00938\t0.00469\t0.00268\t0.00938\n+75\t0.01696\t0.78087\t0.03324\t0.01085\t0.01628\t0.02510\t0.01085\t0.01900\t0.01289\t0.01493\t0.00882\t0.01018\t0.00814\t0.00543\t0.00407\t0.00136\t0.00678\t0.00339\t0.00271\t0.00814\n+76\t0.01102\t0.00551\t0.00826\t0.00826\t0.00826\t0.00551\t0.00551\t0.00826\t0.00826\t0.01102\t0.01102\t0.01928\t0.01102\t0.02204\t0.02479\t0.81543\t0.00551\t0.00551\t0.00275\t0.00275\n+77\t0.45751\t0.01405\t0.01304\t0.01071\t0.01499\t0.01580\t0.00882\t0.28592\t0.01840\t0.05279\t0.01227\t0.01311\t0.00904\t0.00667\t0.00494\t0.00192\t0.00563\t0.00450\t0.04144\t0.00844\n+78\t0.00750\t0.00643\t0.00643\t0.00643\t0.00857\t0.00536\t0.00482\t0.00910\t0.01446\t0.01714\t0.06427\t0.06105\t0.73490\t0.01607\t0.00750\t0.00214\t0.00321\t0.01339\t0.00589\t0.00536\n+79\t0.01726\t0.74700\t0.03255\t0.01110\t0.01643\t0.05788\t0.01092\t0.01928\t0.01312\t0.01495\t0.00886\t0.01023\t0.00814\t0.00548\t0.00414\t0.00137\t0.00699\t0.00342\t0.00274\t0.00811\n+80\t0.01272\t0.03281\t0.74418\t0.01808\t0.02746\t0.01473\t0.02344\t0.02009\t0.01339\t0.02009\t0.01138\t0.01339\t0.00804\t0.00603\t0.00603\t0.00201\t0.00938\t0.00469\t0.00268\t0.00938\n+81\t0.00773\t0.00552\t0.00736\t0.00883\t0.00920\t0.00515\t0.00589\t0.00883\t0.01215\t0.01619\t0.03497\t0.77291\t0.04196\t0.01987\t0.00810\t0.00258\t0.00368\t0.01803\t0.00589\t0.00515\n+82\t0.00789\t0.00677\t0.00681\t0.00674\t0.00895\t0.00586\t0.00507\t0.01028\t0.04858\t0.01759\t0.06242\t0.05926\t0.70059\t0.01571\t0.00745\t0.00214\t0.00330\t0.01309\t0.00592\t0.00558\n+83\t0.00773\t0.00650\t0.00675\t0.00688\t0.00896\t0.00552\t0.00528\t0.00945\t0.01447\t0.01730\t0.06164\t0.06195\t0.67504\t0.01619\t0.00761\t0.00221\t0.00344\t0.07179\t0.00589\t0.00540\n+84\t0.01003\t0.00825\t0.00877\t0.00820\t0.01064\t0.00797\t0.00627\t0.05412\t0.13111\t0.02133\t0.16491\t0.05013\t0.46700\t0.01387\t0.00726\t0.00211\t0.00369\t0.01163\t0.00619\t0.00653\n+85\t0.01696\t0.78087\t0.03324\t0.01085\t0.01628\t0.02510\t0.01085\t0.01900\t0.01289\t0.01493\t0.00882\t0.01018\t0.00814\t0.00543\t0.00407\t0.00136\t0.00678\t0.00339\t0.00271\t0.00814\n+\n+[dist]\n+# distance from previous block\n+# <min> <max>\n+0\t1\n+\n+# created by:\n+# /home/cegg/simao/soft/augustus-3.2.1/scripts/msa2prfl.pl ./align_prep/EOG090W0MBV.fa\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/genome_masked.fa
--- a/test-data/genome_masked.fa Sun Jan 22 17:30:57 2023 +0000
+++ b/test-data/genome_masked.fa Thu Apr 13 17:16:35 2023 +0000
b
b'@@ -4313,7 +4313,10104 @@\n CATGTCAAGTATTATTATCGAGCAACTACAAACGAAATACAAACATACAT\n TTAATTGCCAAGAATGTTCCTAGCCAAACAAATGTCGAAATAATGTCGGG\n CCACGGCCAAAGATTTATCATATTCACTCGACTGTCATAAAAAGCAATTA\n-GGCCCGGGCGAAAGATACACGACCGGCAGTCCCGAAATGT\n+GGCCCGGGCGAAAGATACACGACCGGCAGTCCCGAAATGTAATAAAAAaa\n+taacaaaatACACCGAAGGGGCGCAGCGAAAGAAGAAAGAAACGATGTGT\n+GATTTGAAGTTGTTTCTGGTTTTCGGTTTCGCTTAATGAGTTTGCCGCAC\n+AAAAAGTCGCTTCGAGGGAAGCGATTAAAGATTCCACATCCAGTGCGGCA\n+CGTCGGGGTTGTTGCTTCTGTAGCGGATGGTCCTGCACCCGAAAAAATAA\n+TTTCACTCGAGGCTATCAGAAAATGGTGTAGCGGTGTGGTCCAGATATGC\n+CTCCAGATATTGAGTACGCCGTGTCAGTGAATTTGAATTCAAAAAATGTT\n+TGAAAACTTTAATTGTTTTCCTCTCTCCTGATGATAACTACTTTGAACGA\n+CGGAAAAACGTACTATAAACAAAGTATAATTAAATCTTTTCCATTTGTTA\n+TAGAGTACTCTTTACTTAAATAGTTTGAATTTGGCCTAAAAGTTATCAGT\n+GATAACTGAGCGTTATTCATCACGTTATTCTTTGGTCGACTTCTTAGATT\n+TTTTGGATGGAGTCTAAGTCTGCCTAATTTCAGATTTCAGATAATTTAAT\n+TTAAATGAGTGGGACAATTTCTTTAAGTGCAGCGTGTCTCTTGTAATTAG\n+TATGCCTGCACACTCGCCGTGCCctgtgccctgtgccctTCGAAATAAAA\n+GCGGAAGCGGAGGTCCCCGCGAACAGTTGGCCCTTTGGGACAGAGAAAGG\n+CAGGTTCGGTTTGAAGGGCACTCGTCAGCAGAAACGAAAGGTGGGGAGGG\n+GCGGCGATACTATCCACGTTCCGATCCGAAAACAAGCGACCTGCCGATTC\n+GGATTGGTGTGAAAAGTCCGCCCCATGGCAACTGGCCTTGTTTTTTCCGT\n+CTGTTGCATATTTTCACAAGTAATTAACATGTGCCCGACGTTGTCCTTGT\n+CCGTAGCCAGGGATCCGGGAAGCCAGCCTGTTCCCGCGCAACTGTCCAAA\n+CAGGCTGCCCCGTTGTTGTTCGTCAGCGGGGTAACAAAGCGCTGCCTCCG\n+CATTAATTTGCATTATTTTCACATTTAACTTTCAAGCGAGTGCGCCTGCC\n+GAAGTTGCACTCTGCCGGCGAGCGGACAGGTGGAGCAGGTGGAACTGAAG\n+TGCCACTTCTAATTGTGCGGTGATTGGGGCACGGCTTTGAAAGATTCCGT\n+TCGAATGGCTTCCATCGGCAAACACCAACTATCGTCCCTGCCTTGATTGA\n+GTTAATAAGGGTTTAGGAATAATTTGATTGGCGTTAATAAAATATTGgta\n+aaacatcggtaaaacgTTATGTTGTATGCAAGTTTCACAATGAAGCTACA\n+ATAATATGATAATTTGCTTTAGCGAAGATTAGTACCAATAATTTGATTta\n+ATTTGAGTCGAAACTTTAAATATCAATTAATTCATTAACCGGGAGGGTAT\n+GATTAAAATATGCACCCTGTTGCTAAAATTAAATTTATGGTTTCTGTTGC\n+AAAGAATTTTACAGTGATGACAGAATGACGAGAGACACATTTCTGATCAA\n+CCTCTCCACCTCAGAAAAGATCTCAAATTTTAAGCAGCAGTTGCATCCAC\n+TTACTTTAAAACGACAACTTATAATTTGATCAGTGCTCTCAACATATATC\n+CAATTTATTAGATTTCCATGGCACCAATTCGATTTTTACTTTTAAATGGA\n+AAATCAAAAAGGGGAGAGAATCCCGGAAAGAGGAGCACTGATTTCTAGAA\n+TATTTATTTAGGAACATTTTAATATTGAATTCTTCAAGCCGGAGGAACAT\n+GCCACTTACAGTTCAATAGTTTTTACTTAGAAATTACATATCATTGCTAT\n+CATTACTTTTCGATCGCTATTCAGTGTTTATTTTATGGCTTTCGATCCCC\n+AAACTGTGTTAGGCTTAAGTTTAAATAATATTCCTTCGATTCTAGAACGC\n+TGTGCCCTGTTTCATAAACTTACATAGTTCATGGGCGGAAAACTTactta\n+ctgactgGCGATGATGCTGCCCCATTGCCCCATTTGGGCCATTTAGTTCG\n+CCGTTGATGATAAATTCTGCACTATGGCCCCGGGCGAATGTGCAATAAAA\n+TGCTCCCCGCGCTCCGCACAGCAACAAACCTTGCAACATAAATTAAGGCG\n+CAAAATGTTTATTTACGCTGCGGGAGGGAGTCGGAGGGAAGTCGGGAGAA\n+AGGGGCAAACACGCCGGCTGTTTCCTGCGCAACATTTGCATTTTGACGCC\n+GCATTACGCGTGATGTGAGGAGCCCCGGCCACTCGGCTTATCAGCCCAGA\n+GAAATCAAACGGCGCAGAAGTCGGCGGAGATTGTGGAGTTGCACGTCCAC\n+TGCCCGCAGCATCTTGCAACATTTTGTTTTAATTTCGCACTCTTGAAAAG\n+TGGCAGCCGCCACTCGGACGGTTTTTGAATTGGCCAAGTGAATTGCCACG\n+GACCACAGCGGCAGGGAATGTAGTAGAGTCCAAGACAGGGAATGGAGCCA\n+GCTGCTGGTCGATCTCACCTAGGGAATGGAGTCCATCGCTTTCCTTTCCC\n+CTTTGCAATGCTGCAATACCTTAAGATATTTCCTATACTTCGGCTTTAAT\n+ttggaaaaaaaaGTAACACTTACTAAGGTAAAATGAAATCTCGTATCTCT\n+GCTTAAGTAAAATTAGAATCAGTAGGGAACATTCCAAGTGCTTTGGAATA\n+TTAAACTTCATATCATACCAAGAATGATATTTCTCTGCCCTGAATTTATC\n+ACTCATTGTCGGTTCATTCAAGTGATTCCTTTTTTAAATATGATTATTGA\n+TTATCAATTTCTTTCATGTTGAGTCCCATTCCCCTTGCAACAGAAAACTT\n+CACACTCGGCTGTTTTTTCAGGCATTTTTAAAATCAAGGGGCCCACATCA\n+AAGGGCATTGCCTAAGAAACGAAGCCAATTGTATCTGCGTCCCAGTGCGT\n+GTATACACGTATCTGcatctgtatctgtaGTATATCAGtataTCAATGGC\n+CGTATCTGAAGGTGCGAGTTTTGATTGCGTTCGCTCTGTCAGGCAGAGGG\n+ACAGAAGGGCGCTTTATTTGATTTCAAGTTATGTTGTTTTTAGTGAGTTC\n+CTCTGGCACTCCCCTCCAGGTTTTTTGGCTTTTGTTTGTTGAACTTTGGC\n+TGACTAATAGCTGGTGAAGGGGGACCTCCAGGGGAGTGGGGCAGTTATGA\n+CGATGCCATAGTTTTTCGAACACATCCGAACATGTGTATTTATTACCGCC\n+TGATGCGGGCTGTTTGTTCCCAGCGCCCTGCACCGTGATTTGATTTATTT\n+GTACACAGTTTTATGATATTTACATGTCTGCAACTGAGGGTCCATGGTGT\n+GGCAAGGAGGGGTTGGTGGCCAGCGGTGCGGCAGGAGCAGCAAATGCAAT\n+CTACACCAGTGATTCAATTCTAGGTTCATCGAGTTCGCCTTGCACTTCTT\n+CGTTTTGTTCAAGGGTTATACAATAGTAGGTTAAGTTATTATATAAAAAT\n+ATGTTATGCGGCTCATAGTACGCCAGTACATAGAAAGCGCTGAGTTTAAA\n+ATTTGATTGCCGCTCCGGATTAATTTGTATTTTATTCGATCATAGTAAAT\n+GACGTTTTCAAATTAAAGTATAAATTGTGT'..b'CGCT\n+CAAATGGAACCCAAACCCTTTGACCTtcgacctTTGTATACTTTGGATTC\n+GGAAACGCATTCTTGTGCCTGTTACGTGTTGTTCTAAAGACTTACCTCTT\n+CTCTTCCTGCTCCTCGTCTTTTCCGTGGCACATTGCGAACACCCTTAGCT\n+TGGAGTTCTGCCAGTGGGAGCGCATGGAGATTATGTAGGGCAGGAGAATT\n+GTGAGACCTACATGTATTCCCAATGACTTGTGGATTAGTTGCAAAGTGGC\n+TGATTACGACCAAGTACCCACCTCCGTCGTCGTACAGCCAGAAGACATCG\n+ATTGTGCCCTTGGGCTGTTTGCGCGTGAATATGGTCATGGCGTCCAGCAA\n+GTTTTGGGGTATGTCCGATCCGCCCTTGGTGTGGTAGGTGACGGCGGGCT\n+CATCCGAGCTGGTCACCTTGTAGCTGCGGGAGTTGCGCTGCATGTTGGGC\n+ATCGGTGCTGGCTGGGGCATTGTGAAAGAGGAGTTGGGGCTGTCCATGCT\n+GGCTAGGTTCAGGTTGGAGTCAATGTGCAGCAGCTCCGAGGCTGCATTGG\n+CCGCCGGCATCAGTTCGTTGGTGAATCCATGCGCATTGGCGGTATGCATG\n+TGACCCATTCCGTTGGCCGGCAGAGTGACCTCGGAACTCAGCTCAGAGAA\n+ATCCAATCCGTTGGGCAGTCGGAGCAGGGCCACGCCCATACGCTGAGAAA\n+AAGCATTGCTATGGAAGAGGTGGACTTGGTAAGGCATCCAATAACATAGT\n+TTGGGGAAATAACTTACTACAAAATGGAAAAGTAACTCTCCACCTCCTCC\n+TTGCGACAGCGATTCCAGTCCGGCTTGTAGCCCACCAGCACAATGTTCGG\n+AGACATTTTGCCGAAGCCCGTTGACTTTGTCAACGCATTTATTCCGTCCT\n+CCAGGCTGAACCCATCAATCACATTGTAGAAGGCCTTGATCTTGCGGGCA\n+TCCAGGTACTTTTGTCCATCCTTCACCAGGTGCTGCCGGTTCTTGTAGCC\n+CACCCGCACCTGAAAGGATATAACAAGTATTTTAGTAAGAATCACCATTC\n+CGCTTTTCTTGATGTCCAACAAAATGGGTGAGTTTTCCCTTATCAAGAAA\n+TCCATTCACGTACCGGTATTATATTTGCCACGAACATGAGGGAGTTGTTC\n+TTGGTCAGCAGGTAGCCAAAGTCCACGAGTGGCGGTCTGGTCTTGGGATC\n+GCCGGAGAGCACCAGCACCTGGGGATGGTAGTTCTTGACGTGATCCGAGA\n+CGTTCTGCAGTCGGTGGACGGCCATTAGAGCAGCCTTGTACTGCTGAGCC\n+TGCGTGGTGGATCCCCAGTTGGCCTCCGGCTTGCGGTACATGACCACCAG\n+ATAGAGGGCGAAGATGATGCCAAAGGTGATGATGGCGGCCACGTAGTTGA\n+TCAGGAACATGATGGCCACGCACATGGCGAACCCGAAGAGGCTGAGCCAG\n+GCGTTGTAGTACTTAAAGGTGGGTCGCCATCCCAATGGCTTCACGAAGGC\n+CGCGTGGAATGTGCAAAAGTTGATGAGGGCGTAGGAGGCCAGGTAGAAGG\n+TGGAGATCAGAGGAGCGATCAGGTTAAGCTCTCCGATCAGCAGGAAGCCG\n+GTggtgatgaagaagGTGAGCACGTAGCCGCGATACGGTTCGCCGTGCTT\n+GCCGTACGGCTTCGAGAAGAAGATTAGACCCGGGTAGATCTGGTCAATGC\n+CCAGGGCCTGCACCAGCCTGGGAACGGAAAGCAAGTTGGTCAGGGCCGTG\n+CTTAACGTGGCTGCAAAGCAGCCGGCGTAGATGAGTGGTCCCCACAGCGA\n+CATCTCCTGCATCATTTCGTACGAGTTGAAGAGACCCCAGGTGCAGTTGC\n+CCGTGGCCATGCACGGCAGCTCCGAGGAAACAATGGTGCCATTGACGAGG\n+TCAGCTGGTATACCGGAGGCATCTCTTACAGCAGCGCCACCGGCGAAGAG\n+GACAAAGAGAGCGTATGAGGACATCGAGATGAGCAGGGACCAGAAGGTGC\n+CCTTCGGTATAGCAGCTCCGGCATCCTTGAGGTCTCCGCAGATATTTGCT\n+CCTGCCTGGATGCCCGTCACGCTGGGAAAGAAGATAGCGAACACGCTGAA\n+AAAGTCGTGGTTTACGCCCTCCGCATAGCGATAGTCCGATCCGAAGTTCT\n+CCTTCAAAGTAGCCCCTAATTTAGGTAACCAGTTATGAGGTTATTACTTT\n+CTTAAGTTCTCTTATGAACTCACATGAAAAGCCGACGAAACCCCTAGAGA\n+TTTGCTCCTCATTACCCTGGGGTCCAATGGCAGCTCCGATCAGGAAATTG\n+AAGATGGCCAGGACAATCGTGACGATCAGGAAGTTCTGCGCCTTCGTCTC\n+CCACTCCATACCCACGCAGCAGATTAGGATGAGCACCAGCACGGTTATCG\n+ATCCCACGATCCGGATGTCATTGATCCCGTTGTCGACAATCTTCAGGTCG\n+TTGTTCTCTGGAAATGAGATTAATGATTACTCCGGAACTAAGTTAAGGAT\n+ATCCTCAAACTTAATTAAACCAGACTGGATCCATGAAATATAGTGAAAGT\n+CGTTTCTATTTCAACCTTTATTTTTTATCCTATTTATTTAGGACATTTAA\n+AGCTGCCCCATTTGTGGCCACCCTATTCAAGTTAATCGAATGGCCTCTGT\n+GTGCACAAGTCAATTGATACTCACTGAGTAAAACATTTAGCGATTCGCAG\n+AAGCCGATGGTGTTCATCGAGGCTGAgacggcgttggcgaaggcgaagac\n+cacgcccacCGACGCCCCAAACTCGGGGCCCAGCGAACGGGATATGAtga\n+agtagacgccgccgccCTTGACCTCGCCGTTGGTGCTAATGGCCGACAGC\n+GAGAGCGTCGTGATGACGCAGACCACCGCGGAGATCGTAATTATAATCAG\n+GGACTGCAGGATGCCCGACTCGGCCACCACCCAGCTGAGGCGCAGGAAGA\n+GCATTACGCCCCAGATGTTGAGAAGGCAAGGTATCAGCACGCCCACGATC\n+CATCCTAGCTTGATGTGTCCGCCAGTTGCCTCCGGTTCGGgttcgGGAAT\n+AGTGATGCTCTGCAATGGAGAAACGATCTTATGGATAATAAaaatatata\n+tgtatgtaGtatgtaGGTCGTCCTTATAAGTAATACCTTTCTTAAGTAAG\n+ACACATTAGTATTAACTTTTCACATAGGTTATGTTCAATCTAGCCGGCTA\n+ATGATTTGGGCAAACGGGAAAAGGCCGTCATCGGATTGTTATTTGCCTGA\n+TAATGGGATCTTGACATAAGTGGCATTCAATCGAATGTGTGCTAACTGTG\n+TGAGATTGAATTGAGTTCGGCTtttttttttAACTGTATACGACTCGAAC\n+AGCTGCTTGGGTGAGTTTTTATCCGGAATTACTCATACGACATGTGTGCA\n+ATTTAGTACTCGGATTCAATTAACGACCCGttaacgacccCCAAAATACG\n+AAAGCAGCAGCAAGCGAAGGCACAGCCACAACCAGATTATGAGCAGCAGC\n+TCACATTGCTTTCCATTCTAATTAAAGTTCACTTTTATTAGCCGCACTTA\n+AACTGGAAACATTATGAAAATGTTCACATAAAAGCTGAAACCCACCCAAT\n+GAGATGCCACCAAGTCAACTATTTAACGTATGCCCCAAAGTATTTCCTTT\n+GTTCGGTTCGGATATAGTTCGTCCAATAGGGCGGCAAGTGCAAAAACAAA\n+GACGAAATCCACTTTAACTGCGGCGAGGAA\n >sample2\n GAAAATCATTCATTTGGAATTGTAATCACCTATGCACTTTGGTATAAGCT\n TTTCTGTGCACATTTTCCTGGAAAATGAATGAGACTCCTCGGCAGCCATT\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/predict_scratch/Genus_species.discrepency.report.txt
--- a/test-data/predict_scratch/Genus_species.discrepency.report.txt Sun Jan 22 17:30:57 2023 +0000
+++ b/test-data/predict_scratch/Genus_species.discrepency.report.txt Thu Apr 13 17:16:35 2023 +0000
b
b'@@ -3,11 +3,12 @@\n Summary\n DISC_PROTEIN_NAMES:All proteins have same name "hypothetical protein"\n DISC_SOURCE_QUALS_ASNDISC:taxname (all present, all same)\n-DISC_FEATURE_COUNT:gene: 16 present\n-DISC_FEATURE_COUNT:CDS: 16 present\n-DISC_FEATURE_COUNT:mRNA: 16 present\n+DISC_FEATURE_COUNT:gene: 70 present\n+DISC_FEATURE_COUNT:CDS: 69 present\n+DISC_FEATURE_COUNT:mRNA: 69 present\n+DISC_FEATURE_COUNT:tRNA: 1 present\n DISC_COUNT_NUCLEOTIDES:4 nucleotide Bioseqs are present\n-JOINED_FEATURES:26 features have joined locations.\n+JOINED_FEATURES:116 features have joined locations.\n NO_ANNOTATION:2 bioseqs have no features\n DISC_QUALITY_SCORES:Quality scores are missing on all sequences.\n FATAL: DISC_BACTERIAL_PARTIAL_NONEXTENDABLE_PROBLEMS:1 features have partial ends that do not abut the end of the sequence or a gap, and cannot be extended by 3 or fewer nucleotides to do so\n@@ -16,7 +17,7 @@\n MOLTYPE_NOT_MRNA:4 molecule types are not set as mRNA.\n TECHNIQUE_NOT_TSA:4 technique are not set as TSA\n MISSING_STRUCTURED_COMMENT:4 sequences do not include structured comments.\n-MISSING_PROJECT:20 sequences do not include project.\n+MISSING_PROJECT:73 sequences do not include project.\n DISC_INCONSISTENT_MOLINFO_TECH:Molinfo Technique Report (some missing, all same)\n \n \n@@ -26,43 +27,134 @@\n \n DiscRep_ALL:DISC_SOURCE_QUALS_ASNDISC::taxname (all present, all same)\n DiscRep_SUB:DISC_SOURCE_QUALS_ASNDISC::4 sources have \'Genus species\' for taxname\n-DiscRep_ALL:DISC_FEATURE_COUNT::gene: 16 present\n-DiscRep_ALL:DISC_FEATURE_COUNT::CDS: 16 present\n-DiscRep_ALL:DISC_FEATURE_COUNT::mRNA: 16 present\n+DiscRep_ALL:DISC_FEATURE_COUNT::gene: 70 present\n+DiscRep_ALL:DISC_FEATURE_COUNT::CDS: 69 present\n+DiscRep_ALL:DISC_FEATURE_COUNT::mRNA: 69 present\n+DiscRep_ALL:DISC_FEATURE_COUNT::tRNA: 1 present\n DiscRep_ALL:DISC_COUNT_NUCLEOTIDES::4 nucleotide Bioseqs are present\n-genome:sample (length 215740)\n+genome:sample (length 720580)\n genome:sample2 (length 2030)\n genome:sample3 (length 2100)\n genome:sample4 (length 7560)\n \n-DiscRep_ALL:JOINED_FEATURES::26 features have joined locations.\n-DiscRep_SUB:JOINED_FEATURES::26 features have joined location but no exception\n-genome:CDS\thypothetical protein\t(sample4:2126-2199, 2258-3224, 3284->3537)\tFUN_000016\n-genome:mRNA\thypothetical protein\t(sample4:2126-2199, 2258-3224, 3284->3537)\tFUN_000016\n-genome:mRNA\thypothetical protein\t(sample:c3142-3138, c3004-2883, c2686-2565)\tFUN_000002\n-genome:CDS\thypothetical protein\t(sample:c3142-3138, c3004-2883, c2686-2565)\tFUN_000002\n-genome:mRNA\thypothetical protein\t(sample:c5802-5797, c5539-4937, c4742-4248)\tFUN_000003\n-genome:CDS\thypothetical protein\t(sample:c5802-5797, c5539-4937, c4742-4248)\tFUN_000003\n-genome:CDS\thypothetical protein\t(sample:c10664-10657, c10499-8707, c8385-7691)\tFUN_000004\n-genome:mRNA\thypothetical protein\t(sample:c10664-10657, c10499-8707, c8385-7691)\tFUN_000004\n-genome:mRNA\thypothetical protein\t(sample:c15214-15209, c14648-14247)\tFUN_000005\n-genome:CDS\thypothetical protein\t(sample:c15214-15209, c14648-14247)\tFUN_000005\n-genome:CDS\thypothetical protein\t(sample:15539-15543, 15646-15919, 16485-16619)\tFUN_000006\n-genome:mRNA\thypothetical protein\t(sample:15539-15543, 15646-15919, 16485-16619)\tFUN_000006\n-genome:CDS\thypothetical protein\t(sample:c21705-21700, c21515-19638, c19482-18358)\tFUN_000007\n-genome:mRNA\thypothetical protein\t(sample:c21705-21700, c21515-19638, c19482-18358)\tFUN_000007\n-genome:CDS\thypothetical protein\t(sample:40223-40396, 40659-41193, 41707-42080, 43409-43609, 43678-44130)\tFUN_000009\n-genome:mRNA\thypothetical protein\t(sample:40223-40396, 40659-41193, 41707-42080, 43409-43609, 43678-44130)\tFUN_000009\n-genome:mRNA\thypothetical protein\t(sample:87202-87207, 88054-88320)\tFUN_000010\n-genome:CDS\thypothetical protein\t(sample:87202-87207, 88054-88320)\tFUN_000010\n-genome:CDS\thypothetical protein\t(sample:c106221-106216, c104632-104258, c103947-103696, c103618-103229, c103151-102510)\tFUN_000011\n-genome:mRNA\thypothetical protein\t(sample:c106221-106216, c104632-1'..b'h 215740)\n-genome:ncbi:FUN_000001-T1 (length 124)\n-genome:ncbi:FUN_000002-T1 (length 82)\n-genome:ncbi:FUN_000003-T1 (length 367)\n-genome:ncbi:FUN_000004-T1 (length 831)\n-genome:ncbi:FUN_000005-T1 (length 135)\n-genome:ncbi:FUN_000006-T1 (length 137)\n-genome:ncbi:FUN_000007-T1 (length 1002)\n-genome:ncbi:FUN_000008-T1 (length 278)\n-genome:ncbi:FUN_000009-T1 (length 578)\n-genome:ncbi:FUN_000010-T1 (length 90)\n-genome:ncbi:FUN_000011-T1 (length 554)\n-genome:ncbi:FUN_000012-T1 (length 479)\n-genome:ncbi:FUN_000013-T1 (length 61)\n-genome:ncbi:FUN_000014-T1 (length 484)\n+DiscRep_ALL:MISSING_PROJECT::73 sequences do not include project.\n+genome:sample (length 720580)\n+genome:ncbi:FUN_000001-T1 (length 458)\n+genome:ncbi:FUN_000002-T1 (length 375)\n+genome:ncbi:FUN_000003-T1 (length 957)\n+genome:ncbi:FUN_000004-T1 (length 2136)\n+genome:ncbi:FUN_000005-T1 (length 315)\n+genome:ncbi:FUN_000006-T1 (length 278)\n+genome:ncbi:FUN_000007-T1 (length 365)\n+genome:ncbi:FUN_000008-T1 (length 171)\n+genome:ncbi:FUN_000009-T1 (length 132)\n+genome:ncbi:FUN_000010-T1 (length 338)\n+genome:ncbi:FUN_000011-T1 (length 294)\n+genome:ncbi:FUN_000012-T1 (length 341)\n+genome:ncbi:FUN_000013-T1 (length 589)\n+genome:ncbi:FUN_000014-T1 (length 146)\n+genome:ncbi:FUN_000015-T1 (length 576)\n+genome:ncbi:FUN_000016-T1 (length 139)\n+genome:ncbi:FUN_000017-T1 (length 224)\n+genome:ncbi:FUN_000018-T1 (length 151)\n+genome:ncbi:FUN_000019-T1 (length 68)\n+genome:ncbi:FUN_000020-T1 (length 182)\n+genome:ncbi:FUN_000021-T1 (length 193)\n+genome:ncbi:FUN_000022-T1 (length 550)\n+genome:ncbi:FUN_000023-T1 (length 515)\n+genome:ncbi:FUN_000024-T1 (length 96)\n+genome:ncbi:FUN_000025-T1 (length 277)\n+genome:ncbi:FUN_000026-T1 (length 406)\n+genome:ncbi:FUN_000027-T1 (length 635)\n+genome:ncbi:FUN_000028-T1 (length 1138)\n+genome:ncbi:FUN_000029-T1 (length 307)\n+genome:ncbi:FUN_000030-T1 (length 229)\n+genome:ncbi:FUN_000031-T1 (length 397)\n+genome:ncbi:FUN_000032-T1 (length 430)\n+genome:ncbi:FUN_000033-T1 (length 214)\n+genome:ncbi:FUN_000034-T1 (length 67)\n+genome:ncbi:FUN_000035-T1 (length 506)\n+genome:ncbi:FUN_000036-T1 (length 143)\n+genome:ncbi:FUN_000037-T1 (length 785)\n+genome:ncbi:FUN_000038-T1 (length 198)\n+genome:ncbi:FUN_000039-T1 (length 501)\n+genome:ncbi:FUN_000040-T1 (length 282)\n+genome:ncbi:FUN_000041-T1 (length 562)\n+genome:ncbi:FUN_000042-T1 (length 186)\n+genome:ncbi:FUN_000043-T1 (length 215)\n+genome:ncbi:FUN_000044-T1 (length 170)\n+genome:ncbi:FUN_000045-T1 (length 550)\n+genome:ncbi:FUN_000046-T1 (length 392)\n+genome:ncbi:FUN_000047-T1 (length 231)\n+genome:ncbi:FUN_000048-T1 (length 179)\n+genome:ncbi:FUN_000049-T1 (length 280)\n+genome:ncbi:FUN_000050-T1 (length 117)\n+genome:ncbi:FUN_000051-T1 (length 120)\n+genome:ncbi:FUN_000052-T1 (length 209)\n+genome:ncbi:FUN_000053-T1 (length 132)\n+genome:ncbi:FUN_000054-T1 (length 268)\n+genome:ncbi:FUN_000055-T1 (length 687)\n+genome:ncbi:FUN_000056-T1 (length 207)\n+genome:ncbi:FUN_000057-T1 (length 131)\n+genome:ncbi:FUN_000058-T1 (length 527)\n+genome:ncbi:FUN_000059-T1 (length 271)\n+genome:ncbi:FUN_000060-T1 (length 1569)\n+genome:ncbi:FUN_000062-T1 (length 477)\n+genome:ncbi:FUN_000063-T1 (length 1091)\n+genome:ncbi:FUN_000064-T1 (length 157)\n+genome:ncbi:FUN_000065-T1 (length 394)\n+genome:ncbi:FUN_000066-T1 (length 293)\n+genome:ncbi:FUN_000067-T1 (length 370)\n+genome:ncbi:FUN_000068-T1 (length 438)\n genome:sample2 (length 2030)\n genome:sample3 (length 2100)\n genome:sample4 (length 7560)\n-genome:ncbi:FUN_000015-T1 (length 124)\n-genome:ncbi:FUN_000016-T1 (length 432)\n+genome:ncbi:FUN_000069-T1 (length 458)\n+genome:ncbi:FUN_000070-T1 (length 375)\n \n DiscRep_ALL:DISC_INCONSISTENT_MOLINFO_TECH::Molinfo Technique Report (some missing, all same)\n DiscRep_SUB:DISC_INCONSISTENT_MOLINFO_TECH::technique (all missing)\n DiscRep_SUB:DISC_INCONSISTENT_MOLINFO_TECH::4 Molinfos are missing field technique\n-genome:sample (length 215740)\n+genome:sample (length 720580)\n genome:sample2 (length 2030)\n genome:sample3 (length 2100)\n genome:sample4 (length 7560)\n'
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/predict_scratch/Genus_species.error.summary.txt
--- a/test-data/predict_scratch/Genus_species.error.summary.txt Sun Jan 22 17:30:57 2023 +0000
+++ b/test-data/predict_scratch/Genus_species.error.summary.txt Thu Apr 13 17:16:35 2023 +0000
b
@@ -0,0 +1,1 @@
+     1 WARNING: SEQ_FEAT.ShortExon
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/predict_scratch/Genus_species.stats.json
--- a/test-data/predict_scratch/Genus_species.stats.json Sun Jan 22 17:30:57 2023 +0000
+++ b/test-data/predict_scratch/Genus_species.stats.json Thu Apr 13 17:16:35 2023 +0000
b
@@ -1,11 +1,11 @@
 {
     "format": "annotation",
-    "command": "/home/abretaud/miniconda3/envs/__funannotate@1.8.7/bin/funannotate predict --input /tmp/tmpm833xrq1/files/e/1/c/dataset_e1c34c74-e579-4cab-b0ed-5ce938ce4e4b.dat --out output --database /home/abretaud/.planemo/planemo_tmp_yntx6ieu/test-data/funannotate_db --species Genus species --isolate  --strain  --organism other --ploidy 1 --SeqCenter CFMR --SeqAccession 12345 --name FUN_ --numbering 1 --p2g_pident 80 --p2g_prefilter diamond --min_training_models 3 --busco_seed_species fly --busco_db insecta --evm-partition-interval 1500 --min_intronlen 10 --max_intronlen 3000 --min_protlen 50 --repeat_filter overlap blast --cpus 1",
+    "command": "/home/abretaud/miniconda3/envs/__funannotate@1.8.15/bin/funannotate predict --input input/input.fasta --out output --database /home/abretaud/git/iuc_tools/tools/funannotate/test-data/funannotate_db --species Genus species --isolate  --strain  --organism other --ploidy 1 --SeqCenter CFMR --SeqAccession 12345 --name FUN_ --numbering 1 --p2g_pident 80 --p2g_prefilter diamond --busco_seed_species fly --busco_db insecta --min_training_models 3 --evm-partition-interval 1500 --min_intronlen 10 --max_intronlen 3000 --min_protlen 50 --repeat_filter overlap blast --cpus 1",
     "organism": "Genus_species",
     "software": {
         "name": "funannotate",
-        "version": "1.8.7",
-        "date": "2021-07-21",
+        "version": "1.8.15",
+        "date": "2023-04-13",
         "resources": {
             "merops": {
                 "type": "diamond",
@@ -71,38 +71,38 @@
     },
     "assembly": {
         "num_contigs": 4,
-        "length": 227430,
-        "mean_length": 56857.5,
-        "N50": 215740,
+        "length": 732270,
+        "mean_length": 183067.5,
+        "N50": 720580,
         "L50": 1,
-        "N90": 215740,
+        "N90": 720580,
         "L90": 1,
-        "GC_content": 42.86
+        "GC_content": 43.15
     },
     "annotation": {
-        "genes": 16,
+        "genes": 70,
         "common_name": 0,
-        "mRNA": 16,
-        "tRNA": 0,
+        "mRNA": 69,
+        "tRNA": 1,
         "ncRNA": 0,
         "rRNA": 0,
-        "avg_gene_length": 1660.69,
+        "avg_gene_length": 1544.77,
         "transcript-level": {
-            "CDS_transcripts": 16,
+            "CDS_transcripts": 69,
             "CDS_five_utr": 0,
             "CDS_three_utr": 0,
-            "CDS_no_utr": 16,
+            "CDS_no_utr": 69,
             "CDS_five_three_utr": 0,
-            "CDS_complete": 15,
+            "CDS_complete": 68,
             "CDS_no-start": 0,
             "CDS_no-stop": 1,
             "CDS_no-start_no-stop": 0,
-            "total_exons": 42,
-            "total_cds_exons": 42,
-            "multiple_exon_transcript": 13,
-            "single_exon_transcript": 3,
-            "avg_exon_length": 402.36,
-            "avg_protein_length": 359.81,
+            "total_exons": 209,
+            "total_cds_exons": 209,
+            "multiple_exon_transcript": 58,
+            "single_exon_transcript": 11,
+            "avg_exon_length": 362.67,
+            "avg_protein_length": 393.62,
             "functional": {
                 "go_terms": 0,
                 "interproscan": 0,
@@ -113,7 +113,7 @@
                 "busco": 0,
                 "secretion": 0
             },
-            "pct_exon_overlap_protein_evidence": 11.9
+            "pct_exon_overlap_protein_evidence": 3.81
         }
     }
 }
\ No newline at end of file
b
diff -r 7abc5f6dd595 -r 51b6ee65ef7f test-data/predict_scratch/Genus_species.validation.txt
--- a/test-data/predict_scratch/Genus_species.validation.txt Sun Jan 22 17:30:57 2023 +0000
+++ b/test-data/predict_scratch/Genus_species.validation.txt Thu Apr 13 17:16:35 2023 +0000
[
@@ -0,0 +1,1 @@
+WARNING: valid [SEQ_FEAT.ShortExon] Internal coding region exon is too short FEATURE: CDS: hypothetical protein [(lcl|sample:391297-391301, 391479-391489, 391758-392254, 392500-392851, 393283-393638)] [lcl|sample: raw, dna len= 720580] -> [gnl|ncbi|FUN_000026-T1]