# HG changeset patch
# User rnateam
# Date 1586979217 14400
# Node ID aaefa93c2dd2ec0d58bee467a354dbb391dcfaa9
# Parent c5908940967d92b8ce62be1a4e3d36275712f1f1
"planemo upload for repository https://github.com/bgruening/galaxytools/tree/master/tools/mafft commit eff9db2cd18c82a7de37851571b8989b48014c71"
diff -r c5908940967d -r aaefa93c2dd2 macros.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/macros.xml Wed Apr 15 15:33:37 2020 -0400
@@ -0,0 +1,16 @@
+
+
+ 1
+ 7.455
+
+
+ mafft
+ fasta3
+
+
+
+
+ 10.1093/molbev/mst010
+
+
+
diff -r c5908940967d -r aaefa93c2dd2 mafft-add.xml
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/mafft-add.xml Wed Apr 15 15:33:37 2020 -0400
@@ -0,0 +1,88 @@
+
+
+ Align a sequence, alignment or fragments to an existing alignment.
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+ '$outputAlignment'
+ #if $map == '--mapout'
+ && mv '${inputSequences}.map' '$outputmap'
+ #end if
+ ]]>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ map == True
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
diff -r c5908940967d -r aaefa93c2dd2 mafft.xml
--- a/mafft.xml Sat Nov 11 15:06:34 2017 -0500
+++ b/mafft.xml Wed Apr 15 15:33:37 2020 -0400
@@ -1,229 +1,294 @@
-
- Multiple alignment program for amino acid or nucleotide sequences
-
- mafft
-
-
-
-
-
-
-
-
-
- $outputAlignment;
-
- #if $getTree == "--treeout"
- mv ${inputSequences}.tree $outputTree;
- #end if
- ]]>
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- getTree == True
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
-
- output]
-
-- G-INS-i (suitable for sequences of similar lengths; recommended for <200 sequences; iterative refinement method incorporating global pairwise alignment information):
-
- - mafft --globalpair --maxiterate 1000 input [> output]
-
-- E-INS-i (suitable for sequences containing large unalignable regions; recommended for <200 sequences):
-
- - mafft --ep 0 --genafpair --maxiterate 1000 input [> output]. For E-INS-i, the --ep 0 option is recommended to allow large gaps.
-
-
-**Speed-oriented methods:**
-
-- FFT-NS-i (iterative refinement method; two cycles only):
-
- - mafft --retree 2 --maxiterate 2 input [> output]
-
-- FFT-NS-i (iterative refinement method; max. 1000 iterations):
-
- - mafft --retree 2 --maxiterate 1000 input [> output]
-
-- FFT-NS-2 (fast; progressive method):
-
- - mafft --retree 2 --maxiterate 0 input [> output]
-
-- FFT-NS-1 (very fast; recommended for >2000 sequences; progressive method with a rough guide tree):
-
- - mafft --retree 1 --maxiterate 0 input [> output]
-
-- NW-NS-i (iterative refinement method without FFT approximation; two cycles only):
-
- - mafft --retree 2 --maxiterate 2 --nofft input [> output]
-
-- NW-NS-2 (fast; progressive method without the FFT approximation):
-
- - mafft --retree 2 --maxiterate 0 --nofft input [> output]
-
-- NW-NS-PartTree-1 (recommended for ~10,000 to ~50,000 sequences; progressive method with the PartTree algorithm):
-
- - mafft --retree 1 --maxiterate 0 --nofft --parttree input [> output]
-
-**Options:**
-
---auto
- Automatically selects an appropriate strategy from L-INS-i, FFT-NS-i and FFT-NS-2, according to data size. Default: off (always FFT-NS-2)
---adjustdirection
- Generate reverse complement sequences, as necessary, and align them together with the remaining sequences. In the case of protein alignment, these options are just ignored.
---op
- Gap opening penalty, default: 1.53
---ep
- Offset (works like gap extension penalty), default: 0.0
---maxiterate
- Maximum number of iterative refinement, default: 0
---clustalout
- Output: clustal format, default: fasta
---thread
- Number of threads (if unsure, --thread -1)
---retree number
- Guide tree is built number times in the progressive stage. Valid with 6mer distance. Default: 2
- ]]>
-
-
- 10.1093/molbev/mst010
-
-
+
+
+ Multiple alignment program for amino acid or nucleotide sequences
+
+ macros.xml
+
+
+
+
+
+
+
+
+
+ '$outputAlignment';
+
+ #if $getTree == "--treeout"
+ mv '${inputSequences}.tree' '$outputTree';
+ #end if
+ ]]>
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ getTree == True
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+
+ output]
+ - G-INS-i (suitable for sequences of similar lengths; recommended for <200 sequences; iterative refinement method incorporating global pairwise alignment information):
+ - mafft --globalpair --maxiterate 1000 input [> output]
+ - E-INS-i (suitable for sequences containing large unalignable regions; recommended for <200 sequences):
+ - mafft --ep 0 --genafpair --maxiterate 1000 input [> output]. For E-INS-i, the --ep 0 option is recommended to allow large gaps.
+ **Speed-oriented methods:**
+ - FFT-NS-i (iterative refinement method; two cycles only):
+ - mafft --retree 2 --maxiterate 2 input [> output]
+ - FFT-NS-i (iterative refinement method; max. 1000 iterations):
+ - mafft --retree 2 --maxiterate 1000 input [> output]
+ - FFT-NS-2 (fast; progressive method):
+ - mafft --retree 2 --maxiterate 0 input [> output]
+ - FFT-NS-1 (very fast; recommended for >2000 sequences; progressive method with a rough guide tree):
+ - mafft --retree 1 --maxiterate 0 input [> output]
+ - NW-NS-i (iterative refinement method without FFT approximation; two cycles only):
+ - mafft --retree 2 --maxiterate 2 --nofft input [> output]
+ - NW-NS-2 (fast; progressive method without the FFT approximation):
+ - mafft --retree 2 --maxiterate 0 --nofft input [> output]
+ - NW-NS-PartTree-1 (recommended for ~10,000 to ~50,000 sequences; progressive method with the PartTree algorithm):
+ - mafft --retree 1 --maxiterate 0 --nofft --parttree input [> output]
+
+ **Options:**
+ --auto
+ Automatically selects an appropriate strategy from L-INS-i, FFT-NS-i and FFT-NS-2, according to data size. Default: off (always FFT-NS-2)
+ --adjustdirection
+ Generate reverse complement sequences, as necessary, and align them together with the remaining sequences. In the case of protein alignment, this option is ignored.
+ --op
+ Gap opening penalty, default: 1.53
+ --ep
+ Offset (works like gap extension penalty), default: 0.0
+ --maxiterate
+ Maximum number of iterative refinement cycles, default: 0
+ --clustalout
+ Output: clustal format, default: fasta
+ --thread
+ Number of threads (if unsure, --thread -1)
+ --retree number
+ Guide tree is built *number* times in the progressive stage.
+ Valid with 6mer distance. Default: 2
+ ]]>
+
+
+
diff -r c5908940967d -r aaefa93c2dd2 test-data/add_seq.fa
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/add_seq.fa Wed Apr 15 15:33:37 2020 -0400
@@ -0,0 +1,2 @@
+> 1== M63632 1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91]
+MNGTEGDNFYVPFSNKTGLARSPYEYPQYYLAEPWKYSALAAYMFFLILVGFPVNFLTLF
diff -r c5908940967d -r aaefa93c2dd2 test-data/mafft_add_result.aln
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/mafft_add_result.aln Wed Apr 15 15:33:37 2020 -0400
@@ -0,0 +1,481 @@
+> 1== M63632 1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91]
+----------------------------------------MNG----------------T
+E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL
+AAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMANLFMVLFG-FTVTMYTSM
+N-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIVICKPMGN-FRFGNTHAIM
+GVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPDYYTLNPNFNNESYVVYMF
+VVHFLVPFVIIFFCYGRLLCTV----KEAAAAQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT-H
+QGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC--------GKNPL
+GDDE--SGASTSKTEVSSVS-TSPVSPA--------------------------------
+---------------------------------------------------------
+> 2== U22180 1 rat opsin [J.Mol.Neurosci.5(3),207-209'94]
+----------------------------------------MNG----------------T
+E--G--PNFYVP----FSNITGVVRSPFEQPQY-------YLAEPWQ---------FSML
+AAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVADLFMVFGG-FTTTLYTSL
+H-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVVVCKPMSN-FRFGENHAIM
+GVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGIDYYTLKPEVNNESFVIYMF
+VVHFTIPMIVIFFCYGQLVFTV----KEAAAQQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVAMYIFT-H
+QGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC--------GKNPL
+GDDE--ASATASKTE------TSQVAPA--------------------------------
+---------------------------------------------------------
+> 3== M92038 1 chicken green sensitive cone opsin [PNAS89,5932-5936'9
+----------------------------------------MNG----------------T
+E--G--INFYVP----MSNKTGVVRSPFEYPQY-------YLAEPWK---------YRLV
+CCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVADLFMACFG-FTVTFYTAW
+N-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIVVCKPMGN-FRFSATHAMM
+GIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPDYYTHNPDYHNESYVLYMF
+VIHFIIPVVVIFFSYGRLICKV----REAAAQQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT-N
+KGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC--------GKNPF
+GDEDVSSTVSQSKTEVSSVS-SSQVSPA--------------------------------
+---------------------------------------------------------
+> 4=p A45229 opsin, green-sensitive (clone GFgr-1) - goldfish
+----------------------------------------MNG----------------T
+E--G--KNFYVP----MSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKIL
+ALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVAGTIMVCFG-FTVTFYTAI
+N-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSSHAFA
+GIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPDYYTLNPDYNNESYVIYMF
+VCHFILPVAVIFFTYGRLVCTV----KAAAAQQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVAAWIFF-N
+KGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC--------GKNPL
+GDDE-SSTVSTSKTEVSS------VSPA--------------------------------
+---------------------------------------------------------
+> 5=p B45229 opsin, green-sensitive (clone GFgr-2) - goldfish
+----------------------------------------MNG----------------T
+E--G--NNFYVP----LSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKLL
+AVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVAGAIMVCFG-FTVTFYTAI
+N-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSTHASA
+GIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPDYYTLNPEYNNESYVLYMF
+ICHFILPVTIIFFTYGRLVCTV----KAAAAQQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVAAWIFF-N
+KGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC--------GKNPL
+GDEE-SSTVSTSKTEVSS------VSPA--------------------------------
+---------------------------------------------------------
+> 6== L11864 1 Carassius auratus blue cone opsin [Biochemistry32,208-
+----------------------------------------MKQ----------------V
+PEFH--EDFYIPIPLDINNLS--AYSPFLVPQD-------HLGNQGI---------FMAM
+SVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIANLFVAIFG-SPLSFYSFF
+N-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLVICKPLGN-FTFKTPHAIA
+GCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPDWYTTNNKYNNESYVMFLF
+CFCFAVPFGTIVFCYGQLLITL----KLAAKAQA--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFSLWIVS-H
+RGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC--------GKN-I
+EEDE--ASTSSQVTQVSS------VAPEK-------------------------------
+---------------------------------------------------------
+> 7== M13299 1 human BCP <>[Science232(4747),193-202'86]
+----------------------------------------MRK----------------M
+S--E--EEFYL-----FKNIS--SVGPWDGPQY-------HIAPVWA---------FYLQ
+AAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFGGFLLCIFS-VFPVFVASC
+N-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIVICKPFGN-FRFSSKHALT
+VVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPDWYTVGTKYRSESYTWFLF
+IFCFIVPLSLICFSYTQLLRAL----KAVAAQQQ--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN-N
+RNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC--------GKA-M
+TDES--DTCSSQKTEVSTVS-STQVGPN--------------------------------
+---------------------------------------------------------
+> 8=opsin, greensensitive human (fragment) S07060
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------DLAETVIA-STISIVNQV
+S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVTRMVVVMVLAFC-----------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------------------------------------------------------
+> 9== K03494 1 human GCP <>[Science232(4747),193-202'86]
+----------------------------------------MAQQWSLQRLAGRHPQDSYE
+DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+SVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISVVNQV
+Y-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMVVCKPFGN-VRFDAKLAIV
+GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA-N
+PGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+---------------------------------------------------------
+> 10== Z68193 1 human Red Opsin <>[]
+----------------------------------------MAQQWSLQRLAGRHPQDSYE
+DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+SVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISIVNQV
+S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+GIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCIIPLAIIMLCYLQVWLAI----RAVAKQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA-N
+PGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+---------------------------------------------------------
+> 11== M92036 1 Gecko gecko P521 [PNAS89,6841-6845'92]
+----------------------------------------MTEAWNVAVFAARRSRDD-D
+DTTR--GSVFT-----YTNTNN-TRGPFEGPNY-------HIAPRWV---------YNLV
+SFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFVDLVETLVA-STISVFNQI
+F-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFVVCKPFGN-IKFDSKLAII
+GIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSVELGCQSFMLTLM
+ITCCFLPLFIIIVCYLQVWMAI----RAVAAQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFVSFAAA-N
+PGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF---------GKK-V
+DDGS--EASTTSRTEVSSVS-NSSVAPA--------------------------------
+---------------------------------------------------------
+> 12== M62903 1 chicken visual pigment <>[BBRC173,1212-1217'90]
+----------------------------------------MAA-WEAAFAARRRHEE--E
+DTTR--DSVFT-----YTNSNN-TRGPFEGPNY-------HIAPRWV---------YNLT
+SVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVADLGETVIA-STISVINQI
+S-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFVVCKPFGN-IKFDGKLAVA
+GILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSDPGVQSYMVVLM
+VTCCFFPLAIIILCYLQVWLAI----RAVAAQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA-N
+PGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--EVST-SRTEVSSVS-NSSVSPA--------------------------------
+---------------------------------------------------------
+> 13== S75720 1 chicken P-opsin <>[Science267(5203),1502-1506'95]
+----------------------------------------MS-----------------S
+NSSQ--AP-----------PNG-TPGPFDGPQW------PYQAPQST---------YVGV
+AVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVADLLVTLCG-SSVSLSNNI
+N-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVVVCKPLGD-FQFQRRHAVS
+GCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPNWYTGGSNN--NSYILSLF
+VTCFVLPLSLILFSYTNLLLTL----RAAAAQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFALVVAT-H
+KGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY----QPQR-T
+GKAS--PGTPGPHADVTAAGLRNKVMPAHPV-----------------------------
+---------------------------------------------------------
+> 14== M17718 1 D.melanogaster Rh3 <>[J.Neurosci.7,1550-1557'87]
+----------MESGNVSS------------SLFGNVST-ALRP----------------E
+ARLS--A----------ETRLLGWNVPPEELR--------HIPEHWLTYPEPPESMNYLL
+GTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFCDFMMMVK--TPIFIYNSF
+H-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNVITRPMEG--KMTHGKAIA
+MIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMSLIGAF-G
+DKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---------N
+EKAP--ESSAVASTSTTQEP--QQTTAA--------------------------------
+---------------------------------------------------------
+> 15== X65879 1 Drosophila pseudoobscura Dpse\Rh3 <>[Genetics132(1),193-204'92
+----------MEYHNVSS------------VL-GNVSS-VLRP----------------D
+ARLS--A----------ESRLLGWNVPPDELR--------HIPEHWLIYPEPPESMNYLL
+GTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFCDFMMMIK--TPIFIYNSF
+H-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNVITRPMEG--KMTHGKAIA
+MIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VDSL------------------------------------------------------
+----------RSNVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMSLIGAF-G
+DKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---------S
+EKAP--ESRAAISTSTTQEQ--QQTTAA--------------------------------
+---------------------------------------------------------
+> 16== M17730 1 D.melanogaster Rh4 opsin <>[J.Neurosci.7,1558-1566'87]
+----------ME------------------PL-CNASEPPLRP----------------E
+AR-S--SG---N----GDLQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+GVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIF--NSF
+H-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+FFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+DKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---------N
+EKSG--EISSAQST-TTQEQ--QQTTAA--------------------------------
+---------------------------------------------------------
+> 17== X65880 1 Drosophila pseudoobscura Dpse\Rh4 <>[Genetics132(1),193-204'92
+----------MD------------------AL-CNASEPPLRP----------------E
+ARMS--SG---S----DELQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+GVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIFIYNSF
+H-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+LFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+DKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---------N
+EKSG--EASSAQST-TTQEQ-TQQTSAA--------------------------------
+---------------------------------------------------------
+> 18== D50584 1 Hemigrapsus sanguineus opsin BcRh2 [J.Exp.Biol.1
+--------------------------------MTNATGPQMAY----------------Y
+GAAS--MD-FGY----PEGVSIVDFVRPEIKP--------YVHQHWYNYPPVNPMWHYLL
+GVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALSDLIMLTTN-VPFFTYNCF
+SGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNIICNGFNG-PKLTTGKAVV
+FALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYDYLT--QDFNTFSYNIFIF
+VFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+--------------------------------------------------MN--------
+--VSTL------------------------------------------------------
+----------RS-NEADAQR------AEIRIAKTALVNVSLWFICWTPYALISLKGVM-G
+DTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV------HE-T
+ETKS--NDDSQSNSTVAQDK-A--------------------------------------
+---------------------------------------------------------
+> 19== D50583 1 Hemigrapsus sanguineus opsin BcRh1 [J.Exp.Biol.1
+--------------------------------MANVTGPQMAF----------------Y
+GSGA--AT-FGY----PEGMTVADFVPDRVKH--------MVLDHWYNYPPVNPMWHYLL
+GVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALSDLIMLTTN-FPPFCYNCF
+SGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNIICNGFNG-PKLTQGKATF
+MCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYDYFT--RDMNTITYNICIF
+IFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+--------------------------------------------------MN--------
+--VTNL------------------------------------------------------
+----------RS-NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAITIQGLL-G
+NAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV------HE-K
+DPND--VEENQSSNTQTQEK-S--------------------------------------
+---------------------------------------------------------
+> 20== K02320 1 D.melanogaster opsin <>[Cell40,851-858'85]
+----------ME----SF------------AVAAAQLGPHFAP----------------L
+S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KM---------------------------YVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+---------------------------------------------------------
+> 21== K02315 1 D.melanogaster ninaE <>[Cell40,839-850'85]
+----------ME----SF------------AVAAAQLGPHFAP----------------L
+S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+---------------------------------------------------------
+> 22== X65877 1 Drosophila pseudoobscura Dpse\ninaE <>[Genetics132(1),193-204'
+----------MD----SF------------AAVATQLGPQFAA----------------P
+S-----------------NGSVVDKVTPDMAH--------LISPYWDQFPAMDPIWAKIL
+TAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSEAQSQA-TTSEA-ESKA-----------------------------------
+---------------------------------------------------------
+> 23== M12896 1 D.melanogaster Rh2 <>[Cell44,705-710'86]
+-----MERSHLP----ET------------PFDLAHSGPRFQA----------------Q
+SSG---------------NGSVLDNVLPDMAH--------LVNPYWSRFAPMDPMMSKIL
+GLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+Y-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+KILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSIDYMT--RMWNPRSYLITYS
+LFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVICYFGLF-K
+I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF------GN-T
+DEPK--PDAPASDTETTSEA-DSKA-----------------------------------
+---------------------------------------------------------
+> 24== X65878 1 Drosophila pseudoobscura Dpse\Rh2 <>[Genetics132(1),193-204'92
+-----MERSLLP----EP------------PLAMALLGPRFEA----------------Q
+TGG---------------NRSVLDNVLPDMAP--------LVNPHWSRFAPMDPTMSKIL
+GLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+Y-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+KIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSIDYMT--RQWNPRSYLITYS
+LFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIICYFGLF-K
+I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC------GT-T
+DEPK--PDAPPSDTETTSEA-ESKD-----------------------------------
+---------------------------------------------------------
+> 25== U26026 1 Apis mellifera long-wavelength rhodopsin <>[]
+--------------------------------MIAVSGPSYEA----------------F
+SYGG--QARF-------NNQTVVDKVPPDMLH--------LIDANWYQYPPLNPMWHGIL
+GFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAISNFLMMFCM-SPPMVINCY
+Y-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNVIVKGLSG-KPLSINGALI
+RIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTDYFN--RGLLSASYLVCYG
+IWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VASL------------------------------------------------------
+----------RS-SENQNTS------AECKLAKVALMTISLWFMAWTPYLVINFSGIF-N
+L-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC-------A-A
+EPSS--DAVSTTSGTTTVTD-NEKSNA---------------------------------
+---------------------------------------------------------
+> 26== L03781 1 Limulus polyphemus opsin <>[PNAS90,6150-6154'93]
+----------------------------------MANQLSYSS----------------L
+GWPY--QP----------NASVVDTMPKEMLY--------MIHEHWYAFPPMNPLWYSIL
+GVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFSDFCMMAFM-MPTMTSNCF
+A-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNVIVRGMAA-APLTHKKATL
+LLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVDYLT--KDWSSASYVVIYG
+LAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKK-------------------------
+--------------------------------------------------MN--------
+--VASL------------------------------------------------------
+----------RANADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIISWAGVF-S
+SGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC------GS-G
+ESGS--DVKSEASATTTMEE-KPKIPEA--------------------------------
+---------------------------------------------------------
+> 27== X07797 1 Octopus dofleini rhodopsin <>[FEBS232(1),69-72'88]
+---------------------------------------MVES----------------T
+TLVN--QT-WWY------NPTVD------------------IHPHWAKFDPIPDAVYYSV
+GIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAF
+M-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFL
+MIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFDYLS--TDPSTRSFILCMY
+FCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+--------------------------------------------------LN--------
+--AKEL------------------------------------------------------
+----------R--KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIALLAQF-G
+PAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQFDEKE-C
+EDAN--DAEEEVVASER--G-GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PP
+QGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA
+> 28== X70498 1 Todarodes pacificus rhodopsin [FEBS317(1-2),5-11'93]
+----------------------------------------MGR----------------D
+LRDN--ET-WWY------NPSIV------------------VHPHWREFDQVPDAVYYSL
+GIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFSDFTFSLVNGFPLMTISCF
+L-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNVIGRPMAASKKMSHRRAFI
+MIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFDYIS--RDSTTRSNILCMF
+ILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+--------------------------------------------------LN--------
+--AKEL------------------------------------------------------
+----------R--KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVALLAQF-G
+PLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQFDDKE-T
+EDDK--DAETEIPAGESSDA-APSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPP
+QGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQA
+> 29== L21195 1 human serotonin 5-HT7 receptor protein 30== L15228 1 rat 5HT-7 serotonin receptor <>[JBC268,18200-18204'93]
+------------------------------------------------------------
+------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+---------------------------------PGFPRV----QPESVISLNG-------
+--VVKL----------------------QK---------EVEECAN--------------
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQCQYR----NINR--
+------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
+--------------------------------------------CGKKGHDT-----
+> 31=p A47425 serotonin receptor 5HT-7 - rat
+------------------------------------------------------------
+------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+---------------------------------PGFPRV----QPESVISLNG-------
+--VVKL----------------------QK---------EVEECAN--------------
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR--
+------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
+--------------------------------------------CGKKGHDT-----
+> 32== M83181 1 human serotonin receptor <>[JBC267(11),7553-7562'92]
+----------MDVLSP--------------------------------------------
+---------------GQGNNTTSPPAPFET-GGNTTGISDVT---------VSYQ--VIT
+SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+--------------TVKKVEKTGADTRHGASPAPQPKKS-----------VNGESGSR--
+-------NWRLGVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPLPSEAG--
+PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+ESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RQ----
+------------------------------------------------------------
+---------------------------------------------------------
+> 33=p A35181 serotonin receptor class 1A - rat
+----------MDVFSF--------------------------------------------
+---------------GQGNNTTASQEPFGT-GGNVTSISDVT---------FSYQ--VIT
+SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+--------------TVRKVEKKGAGTSLGTSSAPPPKKS-----------LNGQPGSG--
+-------DWRRCAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPLPSESG--
+SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+ESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RR----
+------------------------------------------------------------
+---------------------------------------------------------
+> 34== L06803 1 Lymnaea stagnalis serotonin receptor <>[PNAS90,11-15'93]
+MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
+------------------------------------------------------------
+---------------------------------------------------------
+> 35=p A47174 serotonin receptor, 5HTlym receptor - great pond snail
+MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
+------------------------------------------------------------
+---------------------------------------------------------
+> 36== X95604 1 Bombyx mori serotonin receptor [InsectBiochem.Mol.Bi
+-MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGWEPNWNV------------T
+VVPN--TTWW------------QASAPFDTPAALVRAAAK--------------------
+AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVADLLVACLV-MPLGAVYEV
+V-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWAVTN-IDYIHASTAKRVGM
+MIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQDV----------GYQIFAT
+ASSFYVPVLIILILYWRIY-------QTARKRIR--------------------------
+-------------------RRRGATARGGVGPPP---------VPAGGALVAGGGSGGIA
+AAVVAVIGRPLPTISETTTTGFTNVSS----NNTSP---EKQSCANGLEADPPTTGYGAV
+AAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLAILVPT-C
+DCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCGRRV----RRRR--
+------A---------------PQ------------------------------------
+---------------------------------------------------------
+> 1== M63632 1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91]
+----------------------------------------MNG----------------T
+E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL
+AAYMFFLILVGFPVNFLTLF----------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------------------------------------------------------
diff -r c5908940967d -r aaefa93c2dd2 test-data/mafft_custom_result.aln
--- /dev/null Thu Jan 01 00:00:00 1970 +0000
+++ b/test-data/mafft_custom_result.aln Wed Apr 15 15:33:37 2020 -0400
@@ -0,0 +1,458 @@
+CLUSTAL format alignment by MAFFT F-INS-i (v7.455)
+
+
+1== MN------------------------GTE--GDNFYVPFS--------NKTGL-ARSPYE
+2== MN------------------------GTE--GPNFYVPFS--------NITGV-VRSPFE
+3== MN------------------------GTE--GINFYVPMS--------NKTGV-VRSPFE
+4=p MN------------------------GTE--GKNFYVPMS--------NRTGL-VRSPFE
+5=p MN------------------------GTE--GNNFYVPLS--------NRTGL-VRSPFE
+6== MK------------------------QVPEFHEDFYIPIP-------LDINNLSAYSPFL
+7== MR------------------------KMS--EEEFYL------------FKNISSVGPWD
+8=opsin, ------------------------------------------------------------
+9== MAQQWSLQ-RLAGRHPQDS----YEDSTQ--SSIFTYTNS--------NS----TRGPFE
+10== MAQQWSLQ-RLAGRHPQDS----YEDSTQ--SSIFTYTNS--------NS----TRGPFE
+11== MTEAWNVAVFAARRSRDD------DDTTR--GSVFTYTNT--------NN----TRGPFE
+12== MA-AWEAA-FAARRRHEE------EDTTR--DSVFTYTNS--------NN----TRGPFE
+13== MS----------------------SNSSQ--------------AP--PNG----TPGPFD
+14== MESG-NV-----------------------------------------SSSLFGNVSTAL
+15== MEYH-NV------------------------------------------SSVLGNVSSVL
+16== MEPLCNA------------------------------------------------SEPPL
+17== MDALCNA------------------------------------------------SEPPL
+18== MT-------------------------------------------------------NAT
+19== MA-------------------------------------------------------NVT
+20== ME-------------------------------------------------SFAVAAAQL
+21== ME-------------------------------------------------SFAVAAAQL
+22== MD-------------------------------------------------SFAAVATQL
+23== MERS--------------------------------------------HLPETPFDLAHS
+24== MERS--------------------------------------------LLPEPPLAMALL
+25== MI-------------------------------------------------------AVS
+26== M-----------------------------------------------------------
+27== MVESTT------------------------------------------------------
+28== MGRD--------------------------------------------------------
+29== MM-----DVNSSGRPDLYGH-----------LRSFLLPEVGRGLPDLSPDGGADPVAGSW
+30== M-----------------------------------------------------------
+31=p M-----------------------------------------------------------
+32== MD------VLSPGQ----------------------------------GNNTTSPPAPFE
+33=p MD------VFSFGQ----------------------------------GNNTTASQEPFG
+34== MA------NFTFGDLALDVARMGGLASTPS------------------GLRSTGLTTPGL
+35=p MA------NFTFGDLALDVARMGGLASTPS------------------GLRSTGLTTPGL
+36== ME-------GAEGQEELD-------------WEALYLRL---------PLQNCSWNSTGW
+
+
+1== YP----------------------------------------------------------
+2== QP----------------------------------------------------------
+3== YP----------------------------------------------------------
+4=p YP----------------------------------------------------------
+5=p YP----------------------------------------------------------
+6== VP----------------------------------------------------------
+7== GP----------------------------------------------------------
+8=opsin, ------------------------------------------------------------
+9== GP----------------------------------------------------------
+10== GP----------------------------------------------------------
+11== GP----------------------------------------------------------
+12== GP----------------------------------------------------------
+13== GP----------------------------------------------------------
+14== RPEARL----------------------SAETRLLGWNVPPEELRHIPEHWL--------
+15== RPDARL----------------------SAESRLLGWNVPPDELRHIPEHWL--------
+16== RPEAR-SSG-------------------NGDLQFLGWNVPPDQIQYIPEHWL--------
+17== RPEARMSSG-------------------SDELQFLGWNVPPDQIQYIPEHWL--------
+18== GPQMAYYGAASMDFG-------------YPEGVSIVDFVRPEIKPYVHQHWY--------
+19== GPQMAFYGSGAATFG-------------YPEGMTVADFVPDRVKHMVLDHWY--------
+20== GPHFAPLS-----------------------NGSVVDKVTPDMAHLISPYWN--------
+21== GPHFAPLS-----------------------NGSVVDKVTPDMAHLISPYWN--------
+22== GPQFAAPS-----------------------NGSVVDKVTPDMAHLISPYWD--------
+23== GPRFQAQSSG---------------------NGSVLDNVLPDMAHLVNPYWS--------
+24== GPRFEAQTGG---------------------NRSVLDNVLPDMAPLVNPHWS--------
+25== GPSYEAFSYG--GQA-------------RFNNQTVVDKVPPDMLHLIDANWY--------
+26== -ANQLSYSSL--GWP-------------YQPNASVVDTMPKEMLYMIHEHWY--------
+27== ----------LVNQT-------------WWYNPTV----------DIHPHWA--------
+28== ---------LRDNET-------------WWYNPSI----------VVHPHWR--------
+29== APHLLS-----------------------------------EVTASPAPTWDAPPDNASG
+30== -PHLLSGF--------------------------------LEVTASPAPTWDAPPDNVSG
+31=p -PHLLSGF--------------------------------LEVTASPAPTWDAPPDNVSG
+32== TG--------------------------------------GNTTGI--------------
+33=p TG--------------------------------------GNVTSI--------------
+34== SPTGLVTSDFNDSYGLTGQFINGSHSSRSRDNASANDTSATNMTD--DRYWSL-------
+35=p SPTGLVTSDFNDSYGLTGQFINGSHSSRSRDNASANDTSATNMTD--DRYWSL-------
+36== EPNW-------------------------------------NVTVVPNTTWWQ-------
+
+
+1== -----QY-YLAEPWKYSALAAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAM
+2== -----QY-YLAEPWQFSMLAAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAV
+3== -----QY-YLAEPWKYRLVCCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAV
+4=p -----QY-YLAEPWQFKILALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAV
+5=p -----QY-YLAEPWQFKLLAVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAV
+6== -----QD-HLGNQGIFMAMSVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSI
+7== -----QY-HIAPVWAFYLQAAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSF
+8=opsin, ------------------------------------------------------------
+9== -----NY-HIAPRWVYHLTSVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAV
+10== -----NY-HIAPRWVYHLTSVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAV
+11== -----NY-HIAPRWVYNLVSFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAF
+12== -----NY-HIAPRWVYNLTSVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAV
+13== -----QWPYQAPQSTYVGVAVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAV
+14== -----TY-PEPPESMNYLLGTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAF
+15== -----IY-PEPPESMNYLLGTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAF
+16== -----TQ-LEPPASMHYMLGVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAV
+17== -----TQ-LEPPASMHYMLGVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAV
+18== -----NY-PPVNPMWHYLLGVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLAL
+19== -----NY-PPVNPMWHYLLGVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLAL
+20== -----QF-PAMDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAI
+21== -----QF-PAMDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAI
+22== -----QF-PAMDPIWAKILTAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAI
+23== -----RF-APMDPMMSKILGLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAF
+24== -----RF-APMDPTMSKILGLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAF
+25== -----QY-PPLNPMWHGILGFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAI
+26== -----AF-PPMNPLWYSILGVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAF
+27== -----KF-DPIPDAVYYSVGIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAM
+28== -----EF-DQVPDAVYYSLGIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAF
+29== CGEQINY----GRVEKVVIGSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLAL
+30== CGEQINY----GRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLAL
+31=p CGEQINY----GRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLAL
+32== SDVTVSY--------QVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAV
+33=p SDVTFSY--------QVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAV
+34== TVYSHEH--------LVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAV
+35=p TVYSHEH--------LVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAV
+36== --ASAPFDTPAALVRAAAKAVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAV
+
+
+1== ANLFMVLFG-FTVTMYTSMNG-YFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYI
+2== ADLFMVFGG-FTTTLYTSLHG-YFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYV
+3== ADLFMACFG-FTVTFYTAWNG-YFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYI
+4=p AGTIMVCFG-FTVTFYTAING-YFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYI
+5=p AGAIMVCFG-FTVTFYTAING-YFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYI
+6== ANLFVAIFG-SPLSFYSFFNR-YFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWL
+7== GGFLLCIFS-VFPVFVASCNG-YFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYI
+8=opsin, -DLAETVIA-STISIVNQVSG-YFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWL
+9== ADLAETVIA-STISVVNQVYG-YFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWM
+10== ADLAETVIA-STISIVNQVSG-YFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWL
+11== VDLVETLVA-STISVFNQIFG-YFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWF
+12== ADLGETVIA-STISVINQISG-YFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWF
+13== ADLLVTLCG-SSVSLSNNING-FFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYV
+14== CDFMMMVK--TPIFIYNSFHQ-GYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFN
+15== CDFMMMIK--TPIFIYNSFHQ-GYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYN
+16== FDLIMCLK--APIF--NSFHR-GFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYN
+17== FDLIMCLK--APIFIYNSFHR-GFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYN
+18== SDLIMLTTN-VPFFTYNCFSGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYN
+19== SDLIMLTTN-FPPFCYNCFSGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYN
+20== SDFGIMITN-TPMMGINLYFE-TWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQ
+21== SDFGIMITN-TPMMGINLYFE-TWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQ
+22== SDFGIMITN-TPMMGINLYFE-TWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQ
+23== SDFCMMASQ-SPVMIINFYYE-TWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYN
+24== SDFCMMASQ-SPVMIINFYYE-TWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYN
+25== SNFLMMFCM-SPPMVINCYYE-TWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYN
+26== SDFCMMAFM-MPTMTSNCFAE-TWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYN
+27== SDLSFSAINGFPLKTISAFMK-KWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYN
+28== SDFTFSLVNGFPLMTISCFLK-KWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYN
+29== ADLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYL
+30== ADLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYL
+31=p ADLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYL
+32== TDLMVSVLV-LPMAALYQVLN-KWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYW
+33=p TDLMVSVLV-LPMAALYQVLN-KWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYW
+34== ADLMVAVLV-MPLSVVSEISK-VWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYW
+35=p ADLMVAVLV-MPLSVVSEISK-VWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYW
+36== ADLLVACLV-MPLGAVYEVVQ-RWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYW
+ . : : * : : :*:
+
+1== VICKPMGNFR-FGNTHAIMGVAFTWIMALACA-APPLV-GWSRYIPEGMQCSCGPDYYTL
+2== VVCKPMSNFR-FGENHAIMGVAFTWVMALACA-APPLV-GWSRYIPEGMQCSCGIDYYTL
+3== VVCKPMGNFR-FSATHAMMGIAFTWVMAFSCA-APPLF-GWSRYMPEGMQCSCGPDYYTH
+4=p VVCKPMGSFK-FSSSHAFAGIAFTWVMALACA-APPLF-GWSRYIPEGMQCSCGPDYYTL
+5=p VVCKPMGSFK-FSSTHASAGIAFTWVMAMACA-APPLV-GWSRYIPEGIQCSCGPDYYTL
+6== VICKPLGNFT-FKTPHAIAGCILPWISALAAS-LPPLF-GWSRYIPEGLQCSCGPDWYTT
+7== VICKPFGNFR-FSSKHALTVVLATWTIGIGVS-IPPFF-GWSRFIPEGLQCSCGPDWYTV
+8=opsin, VVCKPFGNVR-FDAKLAIVGIAFSWIWAAVWT-APPIF-GWSRYWPHGLKTSCGPDVFSG
+9== VVCKPFGNVR-FDAKLAIVGIAFSWIWAAVWT-APPIF-GWSRYWPHGLKTSCGPDVFSG
+10== VVCKPFGNVR-FDAKLAIVGIAFSWIWSAVWT-APPIF-GWSRYWPHGLKTSCGPDVFSG
+11== VVCKPFGNIK-FDSKLAIIGIVFSWVWAWGWS-APPIF-GWSRYWPHGLKTSCGPDVFSG
+12== VVCKPFGNIK-FDGKLAVAGILFSWLWSCAWT-APPIF-GWSRYWPHGLKTSCGPDVFSG
+13== VVCKPLGDFQ-FQRRHAVSGCAFTWGWALLWS-APPLL-GWSSYVPEGLRTSCGPNWYTG
+14== VITRPMEGK--MTHGKAIAMIIFIYMYATPWV-VACYTETWGRFVPEGYLTSCTFDYLTD
+15== VITRPMEGK--MTHGKAIAMIIFIYLYATPWV-VACYTESWGRFVPEGYLTSCTFDYLTD
+16== VITKPMNRN--MTFTKAVIMNIIIWLYCTPWV-VLPLTQFWDRFVPEGYLTSCSFDYLSD
+17== VITKPMNRN--MTFTKAVIMNIIIWLYCTPWV-VLPLTQFWDRFVPEGYLTSCSFDYLSD
+18== IICNGFNGPK-LTTGKAVVFALISWVIAIGCA-LPPFF-GWGNYILEGILDSCSYDYLTQ
+19== IICNGFNGPK-LTQGKATFMCGLAWVISVGWS-LPPFF-GWGSYTLEGILDSCSYDYFTR
+20== VIVKGMAGRP-MTIPLALGKM----------------------YVPEGNLTSCGIDYLER
+21== VIVKGMAGRP-MTIPLALGKIAYIWFMSSIWC-LAPAF-GWSRYVPEGNLTSCGIDYLER
+22== VIVKGMAGRP-MTIPLALGKIAYIWFMSTIWCCLAPVF-GWSRYVPEGNLTSCGIDYLER
+23== VIVKGINGTP-MTIKTSIMKILFIWMMAVFWT-VMPLI-GWSAYVPEGNLTACSIDYMTR
+24== VIVKGINGTP-MTIKTSIMKIAFIWMMAVFWT-IMPLI-GWSSYVPEGNLTACSIDYMTR
+25== VIVKGLSGKP-LSINGALIRIIAIWLFSLGWT-IAPMF-GWNRYVPEGNMTACGTDYFNR
+26== VIVRGMAAAP-LTHKKATLLLLFVWIWSGGWT-ILPFF-GWSRYVPEGNLTSCTVDYLTK
+27== VIGRPMAASKKMSHRRAFLMIIFVWMWSIVWS-VGPVF-NWGAYVPEGILTSCSFDYLST
+28== VIGRPMAASKKMSHRRAFIMIIFVWLWSVLWA-IGPIF-GWGAYTLEGVLCNCSFDYISR
+29== GITRPLTYPVRQNGKCMAKMILSVWLLSASIT-LPPLF-GWAQNVNDDKVC-----LISQ
+30== GITRPLTYPVRQNGKCMAKMILSVWLLSASIT-LPPLF-GWAQNVNDDKVC-----LISQ
+31=p GITRPLTYPVRQNGKCMAKMILSVWLLSASIT-LPPLF-GWAQNVNDDKVC-----LISQ
+32== AITDPIDYVNKRTPRRAAALISLTWLIGFLIS-IPPML-GWRTPEDRSDPDAC---TISK
+33=p AITDPIDYVNKRTPRRAAALISLTWLIGFLIS-IPPML-GWRTPEDRSDPDAC---TISK
+34== AVTS-IDYIRRRSARRILLMIMVVWIVALFIS-IPPLF-GWRD--PNNDPDKTGTCIISQ
+35=p AVTS-IDYIRRRSARRILLMIMVVWIVALFIS-IPPLF-GWRD--PNNDPDKTGTCIISQ
+36== AVTN-IDYIHASTAKRVGMMIACVWTVSFFVC-IAQLL-GWKDPDWNQRVSEDLRCVVSQ
+ : :
+
+1== NPNFNNESYVVYMFVVHFLVPFVIIFFCYGRLLCTVKEAAAAQQE---------------
+2== KPEVNNESFVIYMFVVHFTIPMIVIFFCYGQLVFTVKEAAAQQQE---------------
+3== NPDYHNESYVLYMFVIHFIIPVVVIFFSYGRLICKVREAAAQQQE---------------
+4=p NPDYNNESYVIYMFVCHFILPVAVIFFTYGRLVCTVKAAAAQQQD---------------
+5=p NPEYNNESYVLYMFICHFILPVTIIFFTYGRLVCTVKAAAAQQQD---------------
+6== NNKYNNESYVMFLFCFCFAVPFGTIVFCYGQLLITLKLAAKAQAD---------------
+7== GTKYRSESYTWFLFIFCFIVPLSLICFSYTQLLRALKAVAAQQQE---------------
+8=opsin, SSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAIRAVAKQQKE---------------
+9== SSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAIRAVAKQQKE---------------
+10== SSYPGVQSYMIVLMVTCCIIPLAIIMLCYLQVWLAIRAVAKQQKE---------------
+11== SVELGCQSFMLTLMITCCFLPLFIIIVCYLQVWMAIRAVAAQQKE---------------
+12== SSDPGVQSYMVVLMVTCCFFPLAIIILCYLQVWLAIRAVAAQQKE---------------
+13== GS--NNNSYILSLFVTCFVLPLSLILFSYTNLLLTLRAAAAQQKE---------------
+14== NF--DTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKKMNVESLRSNV-
+15== NF--DTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKKMNVDSLRSNV-
+16== NF--DTRLFVGTIFFFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKKMNVESLRSNV-
+17== NF--DTRLFVGTIFLFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKKMNVESLRSNV-
+18== DF--NTFSYNIFIFVFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKKMNVSTLRSN--
+19== DM--NTITYNICIFIFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKKMNVTNLRSN--
+20== DW--NPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKKMNVKSLRSS--
+21== DW--NPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKKMNVKSLRSS--
+22== DW--NPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKKMNVKSLRSS--
+23== MW--NPRSYLITYSLFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKKMNVKSLRSS--
+24== QW--NPRSYLITYSLFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKKMNVKSLRSS--
+25== GL--LSASYLVCYGIWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKKMNVASLRSS--
+26== DW--SSASYVVIYGLAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKKMNVASLRANA-
+27== DP--STRSFILCMYFCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKRLNAKELRKA--
+28== DS--TTRSNILCMFILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKRLNAKELRKA--
+29== D-----FGYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKFP--------------
+30== D-----FGYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKFP--------------
+31=p D-----FGYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKFP--------------
+32== D-----HGYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRKTVKKVEKTGADTRHGASP
+33=p D-----HGYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRKTVRKVEKKGAGTSLGTSS
+34== D-----KGYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEETTLV
+35=p D-----KGYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEETTLV
+36== D-----VGYQIFATASSFYVPVLIILILYWRIYQTARKRIRRRRGA-------TARGGVG
+ * : * :
+
+1== ------------------------------------------------------------
+2== ------------------------------------------------------------
+3== ------------------------------------------------------------
+4=p ------------------------------------------------------------
+5=p ------------------------------------------------------------
+6== ------------------------------------------------------------
+7== ------------------------------------------------------------
+8=opsin, ------------------------------------------------------------
+9== ------------------------------------------------------------
+10== ------------------------------------------------------------
+11== ------------------------------------------------------------
+12== ------------------------------------------------------------
+13== ------------------------------------------------------------
+14== ------------------------------------------------------------
+15== ------------------------------------------------------------
+16== ------------------------------------------------------------
+17== ------------------------------------------------------------
+18== ------------------------------------------------------------
+19== ------------------------------------------------------------
+20== ------------------------------------------------------------
+21== ------------------------------------------------------------
+22== ------------------------------------------------------------
+23== ------------------------------------------------------------
+24== ------------------------------------------------------------
+25== ------------------------------------------------------------
+26== ------------------------------------------------------------
+27== ------------------------------------------------------------
+28== ------------------------------------------------------------
+29== GFPRVE--------------------------------PDSVI----------ALNGIVK
+30== GFPRVQ--------------------------------PESVI----------SLNGVVK
+31=p GFPRVQ--------------------------------PESVI----------SLNGVVK
+32== A-PQPKKS-VNGESGSRNWRLGVESKAGGAL-----C-----------------ANGAVR
+33=p A-PPPKKS-LNGQPGSGDWRRCAENRAVGTP-----C-----------------TNGAVR
+34== ASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGV--
+35=p ASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGV--
+36== PPPVPAGGALVAGGGSGGIAAAVVAVIGR---------PLPTISET-------TTTGFTN
+
+
+1== ------------------------------------------------------------
+2== ------------------------------------------------------------
+3== ------------------------------------------------------------
+4=p ------------------------------------------------------------
+5=p ------------------------------------------------------------
+6== ------------------------------------------------------------
+7== ------------------------------------------------------------
+8=opsin, ------------------------------------------------------------
+9== ------------------------------------------------------------
+10== ------------------------------------------------------------
+11== ------------------------------------------------------------
+12== ------------------------------------------------------------
+13== ------------------------------------------------------------
+14== ------------------------------------------------------------
+15== ------------------------------------------------------------
+16== ------------------------------------------------------------
+17== ------------------------------------------------------------
+18== ------------------------------------------------------------
+19== ------------------------------------------------------------
+20== ------------------------------------------------------------
+21== ------------------------------------------------------------
+22== ------------------------------------------------------------
+23== ------------------------------------------------------------
+24== ------------------------------------------------------------
+25== ------------------------------------------------------------
+26== ------------------------------------------------------------
+27== ------------------------------------------------------------
+28== ------------------------------------------------------------
+29== -------------LQKEVEEC-AN------------------LSRLLKHER---------
+30== -------------LQKEVEEC-AN------------------LSRLLKHER---------
+31=p -------------LQKEVEEC-AN------------------LSRLLKHER---------
+32== QGDDGAALEV-----IEVHRV-GNSKEHLPLPSEAGP--TPCAPASFERKNERN------
+33=p QGDDEATLEV-----IEVHRV-GNSKEHLPLPSESGS--NSYAPACLERKNERN------
+34== -NSNSSSSERLKQIQIETAEAFANGC------------AEEASIAMLERQCNNGKKISSN
+35=p -NSNSSSSERLKQIQIETAEAFANGC------------AEEASIAMLERQCNNGKKISSN
+36== VSSNNTSP--------EKQSC-ANGLEADPPTTGYGAVAAAYYPSLVRRKP---------
+
+
+1== --------SASTQKAEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT--HQGSDFGAT-FM
+2== --------SATTQKAEKEVTRMVIIMVIFFLICWLPYASVAMYIFT--HQGSNFGPI-FM
+3== --------SATTQKAEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT--NKGADFTAT-LM
+4=p --------SASTQKAEREVTKMVILMVFGFLIAWTPYATVAAWIFF--NKGADFSAK-FM
+5=p --------SASTQKAEREVTKMVILMVLGFLVAWTPYATVAAWIFF--NKGAAFSAQ-FM
+6== --------SASTQKAEREVTKMVVVMVLGFLVCWAPYASFSLWIVS--HRGEEFDLR-MA
+7== --------SATTQKAEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN--NRNHGLDLR-LV
+8=opsin, --------SESTQKAEKEVTRMVVVMVLAFC-----------------------------
+9== --------SESTQKAEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA--NPGYPFHPL-MA
+10== --------SESTQKAEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA--NPGYAFHPL-MA
+11== --------SESTQKAEREVSRMVVVMIVAFCICWGPYASFVSFAAA--NPGYAFHPL-AA
+12== --------SESTQKAEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA--NPGYAFHPL-AA
+13== --------ADTTQRAEREVTRMVIVMVMAFLLCWLPYSTFALVVAT--HKGIIIQPV-LA
+14== --------DKNKETAEIRIAKAAITICFLFFCSWTPYGVMSLIGAF--GDKTLLTPG-AT
+15== --------DKSKEAAEIRIAKAAITICFLFFASWTPYGVMSLIGAF--GDKTLLTPG-AT
+16== --------DKSKETAEIRIAKAAITICFLFFVSWTPYGVMSLIGAF--GDKSLLTQG-AT
+17== --------DKSKETAEIRIAKAAITICFLFFVSWTPYGVMSLIGAF--GDKSLLTPG-AT
+18== --------EADAQRAEIRIAKTALVNVSLWFICWTPYALISLKGVM--GDTSGITPL-VS
+19== --------EAETQRAEIRIAKTALVNVSLWFICWTPYAAITIQGLL--GNAEGITPL-LT
+20== --------EDAEKSAEGKLAKVALVTITLWFMAWTPYLVINCMGLF--KF-EGLTPL-NT
+21== --------EDAEKSAEGKLAKVALVTITLWFMAWTPYLVINCMGLF--KF-EGLTPL-NT
+22== --------EDADKSAEGKLAKVALVTISLWFMAWTPYLVINCMGLF--KF-EGLTPL-NT
+23== --------EDCDKSAEGKLAKVALTTISLWFMAWTPYLVICYFGLF--KI-DGLTPL-TT
+24== --------EDCDKSAENKLAKVALTTISLWFMAWTPYLIICYFGLF--KI-DGLTPL-TT
+25== --------ENQNTSAECKLAKVALMTISLWFMAWTPYLVINFSGIF--NL-VKISPL-FT
+26== --------DQQKQSAECRLAKVAMMTVGLWFMAWTPYLIISWAGVF--SSGTRLTPL-AT
+27== --------Q-AGASAEMKLAKISMVIITQFMLSWSPYAIIALLAQF--GPAEWVTPY-AA
+28== --------Q-AGANAEMRLAKISIVIVSQFLLSWSPYAVVALLAQF--GPLEWVTPY-AA
+29== -------KNISIFKREQKAATTLGIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPLWVE
+30== -------KNISIFKREQKAATTLGIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPLWVE
+31=p -------KNISIFKREQKAATTLGIIVGAFTVCWLPFFLLSTARPFICGTSCSCIPLWVE
+32== ----AEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-CESSCHMPTL-LG
+33=p ----AEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-CESSCHMPAL-LG
+34== DTPYSRTREKLELKRERKAARTLAIITGAFLICWLPFFIIALIGPF--VDPEGIPPF-AR
+35=p DTPYSRTREKLELKRERKAARTLAIITGAFLICWLPFFIIALIGPF--VDPEGIPPF-AR
+36== -------KEAADSKRERKAAKTLAIITGAFVACWLPFFVLAILVPT-CD--CEVSPV-LT
+ * . :
+
+1== TLPAFFAKSSALYNPVIYILMNKQFRNCMITTL-----CC-----GKNPLGDDE-SGA-S
+2== TLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSL-----CC-----GKNPLGDDE-ASA-T
+3== AVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTI-----CC-----GKNPFGDEDVSSTVS
+4=p AIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTI-----FC-----GKNPLGDDE-SSTVS
+5=p AIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTL-----FC-----GKNPLGDEE-SSTVS
+6== TIPSCLSKASTVYNPVIYVLMNKQFRSCMMK-M-----VC-----GKN-IEEDE-AST-S
+7== TIPSFFSKSACIYNPIIYCFMNKQFQACIMK-M-----VC-----GKA-MTDES-DTC-S
+8=opsin, ------------------------------------------------------------
+9== ALPAFFAKSATIYNPVIYVFMNRQFRNCILQ-L-----F------GKK-VDDGS-ELS-S
+10== ALPAYFAKSATIYNPVIYVFMNRQFRNCILQ-L-----F------GKK-VDDGS-ELS-S
+11== ALPAYFAKSATIYNPVIYVFMNRQFRNCIMQ-L-----F------GKK-VDDGS-EAS-T
+12== ALPAYFAKSATIYNPIIYVFMNRQFRNCILQ-L-----F------GKK-VDDGS-EVS-T
+13== SLPSYFSKTATVYNPIIYVFMNKQFQSCLLEML-----CC-----GYQPQRTGKASPGTP
+14== MIPACACKMVACIDPFVYAISHPRYRMELQKRCPW---LALN---EK----APE-SSA-V
+15== MIPACTCKMVACIDPFVYAISHPRYRMELQKRCPW---LAIS---EK----APE-SRA-A
+16== MIPACTCKLVACIDPFVYAISHPRYRLELQKRCPW---LGVN---EK----SGE-ISS-A
+17== MIPACTCKLVACIEPFVYAISHPRYRMELQKRCPW---LGVN---EK----SGE-ASS-A
+18== TLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPW---FCVH---ET----ETK-SND-D
+19== TLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPW---FCVH---EK----DPN-DVE-E
+20== IWGACFAKSAACYNPIVYGISHPKYRLALKEKCP----CCVF---GKV--DDGK-SSD-A
+21== IWGACFAKSAACYNPIVYGISHPKYRLALKEKCP----CCVF---GKV--DDGK-SSD-A
+22== IWGACFAKSAACYNPIVYGISHPKYRLALKEKCP----CCVF---GKV--DDGK-SSE-A
+23== IWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCP----MCVF---GNT--DEPK-PDA-P
+24== IWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCP----MCVC---GTT--DEPK-PDA-P
+25== IWGSLFAKANAVYNPIVYGISHPKYRAALFAKFP----SLAC---AA----EPS-SDA-V
+26== IWGSVFAKANSCYNPIVYGISHPRYKAALYQRFP----SLAC---GS---GESG-SDV-K
+27== ELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQF---DEK--ECED-AND-A
+28== QLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQF---DDK--ETED-DKD-A
+29== RTFLWLGYANSLINPFIYAFFNRDLRTTYRSLL-----QCQYRNINRKL------SAAGM
+30== RTCLWLGYANSLINPFIYAFFNRDLRPTSRSLL-----QCQYRNINRKL------SAAGM
+31=p RTCLWLGYANSLINPFIYAFFNRDLRTTYRSLL-----QCQYRNINRKL------SAAGM
+32== AIINWLGYSNSLLNPVIYAYFNKDFQNAFKKII-----KCKF---CRQ------------
+33=p AIINWLGYSNSLLNPVIYAYFNKDFQNAFKKII-----KCKF---CRR------------
+34== SFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKIL-----FGKYR-RGHR------------
+35=p SFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKIL-----FGKYR-RGHR------------
+36== SLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLL------CGRRVRRRR------------
+
+
+1== TSKTEVSSVSTS------------------------------------------------
+2== ASKTETSQVA--------------------------------------------------
+3== QSKTEVSSVSSS------------------------------------------------
+4=p TSKTEVSSVS--------------------------------------------------
+5=p TSKTEVSSVS--------------------------------------------------
+6== SQVTQVSSVA--------------------------------------------------
+7== SQKTEVSTVSST------------------------------------------------
+8=opsin, ------------------------------------------------------------
+9== ASKTEVSSVS--------------------------------------------------
+10== ASKTEVSSVS--------------------------------------------------
+11== TSRTEVSSVSNS------------------------------------------------
+12== -SRTEVSSVSNS------------------------------------------------
+13== GPHADVTAAGLR------------------------------------------------
+14== ASTS-TTQEPQ-------------------------------------------------
+15== ISTS-TTQEQQ-------------------------------------------------
+16== QSTT-TQEQ-Q-------------------------------------------------
+17== QSTT-TQEQTQ-------------------------------------------------
+18== SQSNSTVAQDK-------------------------------------------------
+19== NQSSNTQTQEK-------------------------------------------------
+20== QSQA-TASEAE-------------------------------------------------
+21== QSQA-TASEAE-------------------------------------------------
+22== QSQA-TTSEAE-------------------------------------------------
+23== ASDTETTSEAD-------------------------------------------------
+24== PSDTETTSEAE-------------------------------------------------
+25== STTSGTTTVTDN------------------------------------------------
+26== SEASATTTMEEK------------------------------------------------
+27== EEEV-VASERG--GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PPQGYPPQGA
+28== ETEI-PAGESSDAAPSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPPQGYPPQG-
+29== HEALKLAERPERP-----------------EFVLQNA-----------------------
+30== HEALKLAERPERS-----------------EFVLQNS-----------------------
+31=p HEALKLAERPERS-----------------EFVLQNS-----------------------
+32== ------------------------------------------------------------
+33=p ------------------------------------------------------------
+34== ------------------------------------------------------------
+35=p ------------------------------------------------------------
+36== ------------------------------------------------------------
+
+
+1== --------------------------------------------PVSP-A---
+2== -----------------------------------------------P-A---
+3== --------------------------------------------QVSP-A---
+4=p -----------------------------------------------P-A---
+5=p -----------------------------------------------P-A---
+6== -----------------------------------------------PEK---
+7== --------------------------------------------QVGP-N---
+8=opsin, -----------------------------------------------------
+9== --------------------------------------------SVSP-A---
+10== --------------------------------------------SVSP-A---
+11== --------------------------------------------SVAP-A---
+12== --------------------------------------------SVSP-A---
+13== -------------------------------------------NKVMP-AHPV
+14== --------------------------------------------QTTA-A---
+15== --------------------------------------------QTTA-A---
+16== --------------------------------------------QTTA-A---
+17== --------------------------------------------QTSA-A---
+18== -------------------------------------------------A---
+19== -------------------------------------------------S---
+20== ----------------------------------------------SK-A---
+21== ----------------------------------------------SK-A---
+22== ----------------------------------------------SK-A---
+23== ----------------------------------------------SK-A---
+24== ----------------------------------------------SK-D---
+25== -------------------------------------------EK-SN-A---
+26== -------------------------------------------PKIPE-A---
+27== YPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQ-A---
+28== YPP-QGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQ-A---
+29== -------------------------------------------DYCRKKGHDS
+30== -------------------------------------------DHCGKKGHDT
+31=p -------------------------------------------DHCGKKGHDT
+32== -----------------------------------------------------
+33=p -----------------------------------------------------
+34== -----------------------------------------------------
+35=p -----------------------------------------------------
+36== -------------------------------------------------A-PQ
+
diff -r c5908940967d -r aaefa93c2dd2 test-data/mafft_fftns_result.aln
--- a/test-data/mafft_fftns_result.aln Sat Nov 11 15:06:34 2017 -0500
+++ b/test-data/mafft_fftns_result.aln Wed Apr 15 15:33:37 2020 -0400
@@ -1,504 +1,468 @@
> 1== M63632 1 Lampetra japonica rhodopsin <>[BBRC174,1125-1132'91]
---------------------------------MNGTE--------------GDNF-----
--------------YVP-----F-SNKTG----------LARSPYEYPQY-YLAEPWK---
---------------YSALAAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMA
-NLFMVLFG-FTVTMYTSMN-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIV
-ICKPMGN-FRFGNTHAIMGVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPD
-YYTLNPNFNNESYVVYMFVVHFLVPFVIIFFCYGRLLCTV----KE--------------
-------------------------------------------------------AAAAQQ
+----------------------------------------MNG----------------T
+E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL
+AAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMANLFMVLFG-FTVTMYTSM
+N-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIVICKPMGN-FRFGNTHAIM
+GVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPDYYTLNPNFNNESYVVYMF
+VVHFLVPFVIIFFCYGRLLCTV----KEAAAAQQ--------------------------
------------------------------------------------------------
---------------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVA
-FYIFT-HQGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC------
---GKNPLGDDE--SGASTSKTEVSSVS-TSPVS---------------------------
------------------------------------PA-----------------------
---
+------------------------------------------------------------
+-------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT-H
+QGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC--------GKNPL
+GDDE--SGASTSKTEVSSVS-TSPVSPA--------------------------------
+---------------------------------------------------------
> 2== U22180 1 rat opsin [J.Mol.Neurosci.5(3),207-209'94]
---------------------------------MNGTE--------------GPNF-----
--------------YVP-----F-SNITG----------VVRSPFEQPQY-YLAEPWQ---
---------------FSMLAAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVA
-DLFMVFGG-FTTTLYTSLH-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVV
-VCKPMSN-FRFGENHAIMGVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGID
-YYTLKPEVNNESFVIYMFVVHFTIPMIVIFFCYGQLVFTV----KE--------------
-------------------------------------------------------AAAQQQ
+----------------------------------------MNG----------------T
+E--G--PNFYVP----FSNITGVVRSPFEQPQY-------YLAEPWQ---------FSML
+AAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVADLFMVFGG-FTTTLYTSL
+H-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVVVCKPMSN-FRFGENHAIM
+GVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGIDYYTLKPEVNNESFVIYMF
+VVHFTIPMIVIFFCYGQLVFTV----KEAAAQQQ--------------------------
------------------------------------------------------------
---------------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVA
-MYIFT-HQGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC------
---GKNPLGDDE--ASATASKTE------TSQVA---------------------------
------------------------------------PA-----------------------
---
+------------------------------------------------------------
+-------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVAMYIFT-H
+QGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC--------GKNPL
+GDDE--ASATASKTE------TSQVAPA--------------------------------
+---------------------------------------------------------
> 3== M92038 1 chicken green sensitive cone opsin [PNAS89,5932-5936'9
---------------------------------MNGTE--------------GINF-----
--------------YVP-----M-SNKTG----------VVRSPFEYPQY-YLAEPWK---
---------------YRLVCCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVA
-DLFMACFG-FTVTFYTAWN-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIV
-VCKPMGN-FRFSATHAMMGIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPD
-YYTHNPDYHNESYVLYMFVIHFIIPVVVIFFSYGRLICKV----RE--------------
-------------------------------------------------------AAAQQQ
+----------------------------------------MNG----------------T
+E--G--INFYVP----MSNKTGVVRSPFEYPQY-------YLAEPWK---------YRLV
+CCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVADLFMACFG-FTVTFYTAW
+N-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIVVCKPMGN-FRFSATHAMM
+GIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPDYYTHNPDYHNESYVLYMF
+VIHFIIPVVVIFFSYGRLICKV----REAAAQQQ--------------------------
------------------------------------------------------------
---------------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVA
-FWIFT-NKGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC------
---GKNPFGDEDVSSTVSQSKTEVSSVS-SSQVS---------------------------
------------------------------------PA-----------------------
---
+------------------------------------------------------------
+-------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT-N
+KGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC--------GKNPF
+GDEDVSSTVSQSKTEVSSVS-SSQVSPA--------------------------------
+---------------------------------------------------------
> 4=p A45229 opsin, green-sensitive (clone GFgr-1) - goldfish
---------------------------------MNGTE--------------GKNF-----
--------------YVP-----M-SNRTG----------LVRSPFEYPQY-YLAEPWQ---
---------------FKILALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVA
-GTIMVCFG-FTVTFYTAIN-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV
-VCKPMGS-FKFSSSHAFAGIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPD
-YYTLNPDYNNESYVIYMFVCHFILPVAVIFFTYGRLVCTV----KA--------------
-------------------------------------------------------AAAQQQ
+----------------------------------------MNG----------------T
+E--G--KNFYVP----MSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKIL
+ALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVAGTIMVCFG-FTVTFYTAI
+N-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSSHAFA
+GIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPDYYTLNPDYNNESYVIYMF
+VCHFILPVAVIFFTYGRLVCTV----KAAAAQQQ--------------------------
------------------------------------------------------------
---------------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVA
-AWIFF-NKGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC------
---GKNPLGDDE-SSTVSTSKTEVSS------VS---------------------------
------------------------------------PA-----------------------
---
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVAAWIFF-N
+KGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC--------GKNPL
+GDDE-SSTVSTSKTEVSS------VSPA--------------------------------
+---------------------------------------------------------
> 5=p B45229 opsin, green-sensitive (clone GFgr-2) - goldfish
---------------------------------MNGTE--------------GNNF-----
--------------YVP-----L-SNRTG----------LVRSPFEYPQY-YLAEPWQ---
---------------FKLLAVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVA
-GAIMVCFG-FTVTFYTAIN-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV
-VCKPMGS-FKFSSTHASAGIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPD
-YYTLNPEYNNESYVLYMFICHFILPVTIIFFTYGRLVCTV----KA--------------
-------------------------------------------------------AAAQQQ
+----------------------------------------MNG----------------T
+E--G--NNFYVP----LSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKLL
+AVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVAGAIMVCFG-FTVTFYTAI
+N-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSTHASA
+GIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPDYYTLNPEYNNESYVLYMF
+ICHFILPVTIIFFTYGRLVCTV----KAAAAQQQ--------------------------
------------------------------------------------------------
---------------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVA
-AWIFF-NKGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC------
---GKNPLGDEE-SSTVSTSKTEVSS------VS---------------------------
------------------------------------PA-----------------------
---
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVAAWIFF-N
+KGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC--------GKNPL
+GDEE-SSTVSTSKTEVSS------VSPA--------------------------------
+---------------------------------------------------------
> 6== L11864 1 Carassius auratus blue cone opsin [Biochemistry32,208-
---------------------------------MKQVPEF------------HEDF-----
--------------YIPIP-LDI-NNLS------------AYSPFLVPQD-HLGNQGI---
---------------FMAMSVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIA
-NLFVAIFG-SPLSFYSFFN-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLV
-ICKPLGN-FTFKTPHAIAGCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPD
-WYTTNNKYNNESYVMFLFCFCFAVPFGTIVFCYGQLLITL----KL--------------
-------------------------------------------------------AAKAQA
+----------------------------------------MKQ----------------V
+PEFH--EDFYIPIPLDINNLS--AYSPFLVPQD-------HLGNQGI---------FMAM
+SVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIANLFVAIFG-SPLSFYSFF
+N-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLVICKPLGN-FTFKTPHAIA
+GCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPDWYTTNNKYNNESYVMFLF
+CFCFAVPFGTIVFCYGQLLITL----KLAAKAQA--------------------------
------------------------------------------------------------
---------------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFS
-LWIVS-HRGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC------
---GKN-IEEDE--ASTSSQVTQVSS------VA---------------------------
------------------------------------PEK----------------------
---
+------------------------------------------------------------
+-------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFSLWIVS-H
+RGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC--------GKN-I
+EEDE--ASTSSQVTQVSS------VAPEK-------------------------------
+---------------------------------------------------------
> 7== M13299 1 human BCP <>[Science232(4747),193-202'86]
---------------------------------MRKMS--------------EEEF-----
--------------YL------F-KNIS------------SVGPWDGPQY-HIAPVWA---
---------------FYLQAAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFG
-GFLLCIFS-VFPVFVASCN-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIV
-ICKPFGN-FRFSSKHALTVVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPD
-WYTVGTKYRSESYTWFLFIFCFIVPLSLICFSYTQLLRAL----KA--------------
-------------------------------------------------------VAAQQQ
+----------------------------------------MRK----------------M
+S--E--EEFYL-----FKNIS--SVGPWDGPQY-------HIAPVWA---------FYLQ
+AAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFGGFLLCIFS-VFPVFVASC
+N-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIVICKPFGN-FRFSSKHALT
+VVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPDWYTVGTKYRSESYTWFLF
+IFCFIVPLSLICFSYTQLLRAL----KAVAAQQQ--------------------------
------------------------------------------------------------
---------------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFA
-MYMVN-NRNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC------
---GKA-MTDES--DTCSSQKTEVSTVS-STQVG---------------------------
------------------------------------PN-----------------------
---
+------------------------------------------------------------
+-------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN-N
+RNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC--------GKA-M
+TDES--DTCSSQKTEVSTVS-STQVGPN--------------------------------
+---------------------------------------------------------
> 8=opsin, greensensitive human (fragment) S07060
------------------------------------------------------------
------------------------------------------------------------
+------------------------------------------DLAETVIA-STISIVNQV
+S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
------------------------------------------------------------
-DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV
-VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA--------------
-------------------------------------------------------VAKQQK
+------------------------------------------------------------
+-------------ESESTQK------AEKEVTRMVVVMVLAFC-----------------
+------------------------------------------------------------
+------------------------------------------------------------
+---------------------------------------------------------
+> 9== K03494 1 human GCP <>[Science232(4747),193-202'86]
+----------------------------------------MAQQWSLQRLAGRHPQDSYE
+DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+SVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISVVNQV
+Y-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMVVCKPFGN-VRFDAKLAIV
+GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA-N
+PGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+---------------------------------------------------------
+> 10== Z68193 1 human Red Opsin <>[]
+----------------------------------------MAQQWSLQRLAGRHPQDSYE
+DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+SVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISIVNQV
+S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+GIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+VTCCIIPLAIIMLCYLQVWLAI----RAVAKQQK--------------------------
+------------------------------------------------------------
------------------------------------------------------------
---------------------ESESTQK------AEKEVTRMVVVMVLAFC----------
+-------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA-N
+PGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+---------------------------------------------------------
+> 11== M92036 1 Gecko gecko P521 [PNAS89,6841-6845'92]
+----------------------------------------MTEAWNVAVFAARRSRDD-D
+DTTR--GSVFT-----YTNTNN-TRGPFEGPNY-------HIAPRWV---------YNLV
+SFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFVDLVETLVA-STISVFNQI
+F-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFVVCKPFGN-IKFDSKLAII
+GIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSVELGCQSFMLTLM
+ITCCFLPLFIIIVCYLQVWMAI----RAVAAQQK--------------------------
+------------------------------------------------------------
------------------------------------------------------------
+-------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFVSFAAA-N
+PGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF---------GKK-V
+DDGS--EASTTSRTEVSSVS-NSSVAPA--------------------------------
+---------------------------------------------------------
+> 12== M62903 1 chicken visual pigment <>[BBRC173,1212-1217'90]
+----------------------------------------MAA-WEAAFAARRRHEE--E
+DTTR--DSVFT-----YTNSNN-TRGPFEGPNY-------HIAPRWV---------YNLT
+SVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVADLGETVIA-STISVINQI
+S-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFVVCKPFGN-IKFDGKLAVA
+GILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSDPGVQSYMVVLM
+VTCCFFPLAIIILCYLQVWLAI----RAVAAQQK--------------------------
+------------------------------------------------------------
+------------------------------------------------------------
+-------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA-N
+PGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF---------GKK-V
+DDGS--EVST-SRTEVSSVS-NSSVSPA--------------------------------
+---------------------------------------------------------
+> 13== S75720 1 chicken P-opsin <>[Science267(5203),1502-1506'95]
+----------------------------------------MS-----------------S
+NSSQ--AP-----------PNG-TPGPFDGPQW------PYQAPQST---------YVGV
+AVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVADLLVTLCG-SSVSLSNNI
+N-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVVVCKPLGD-FQFQRRHAVS
+GCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPNWYTGGSNN--NSYILSLF
+VTCFVLPLSLILFSYTNLLLTL----RAAAAQQK--------------------------
------------------------------------------------------------
------------------------------------------------------------
---
-> 9== K03494 1 human GCP <>[Science232(4747),193-202'86]
---------------------------------MAQQWSLQRLAGRHPQDSYEDST-----
--------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV---
---------------YHLTSVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA
-DLAETVIA-STISVVNQVY-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMV
-VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA--------------
-------------------------------------------------------VAKQQK
-------------------------------------------------------------
---------------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFA
-CFAAA-NPGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF-------
---GKK-VDDGS--ELSSASKTEVSSV---SSVS---------------------------
------------------------------------PA-----------------------
---
-> 10== Z68193 1 human Red Opsin <>[]
---------------------------------MAQQWSLQRLAGRHPQDSYEDST-----
--------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV---
---------------YHLTSVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA
-DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV
-VCKPFGN-VRFDAKLAIVGIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-VFSGSSYPGVQSYMIVLMVTCCIIPLAIIMLCYLQVWLAI----RA--------------
-------------------------------------------------------VAKQQK
-------------------------------------------------------------
---------------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFA
-CFAAA-NPGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF-------
---GKK-VDDGS--ELSSASKTEVSSV---SSVS---------------------------
------------------------------------PA-----------------------
---
-> 11== M92036 1 Gecko gecko P521 [PNAS89,6841-6845'92]
---------------------------------MTEAWNVAVFAARRSRDD-DDTT-----
--------------RGSV--FTY-TNTNN-----------TRGPFEGPNY-HIAPRWV---
---------------YNLVSFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFV
-DLVETLVA-STISVFNQIF-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFV
-VCKPFGN-IKFDSKLAIIGIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPD
-VFSGSVELGCQSFMLTLMITCCFLPLFIIIVCYLQVWMAI----RA--------------
-------------------------------------------------------VAAQQK
-------------------------------------------------------------
---------------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFV
-SFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF-------
---GKK-VDDGS--EASTTSRTEVSSVS-NSSVA---------------------------
------------------------------------PA-----------------------
---
-> 12== M62903 1 chicken visual pigment <>[BBRC173,1212-1217'90]
---------------------------------MAA-WEAAFAARRRHEE--EDTT-----
--------------RDSV--FTY-TNSNN-----------TRGPFEGPNY-HIAPRWV---
---------------YNLTSVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVA
-DLGETVIA-STISVINQIS-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFV
-VCKPFGN-IKFDGKLAVAGILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-VFSGSSDPGVQSYMVVLMVTCCFFPLAIIILCYLQVWLAI----RA--------------
-------------------------------------------------------VAAQQK
-------------------------------------------------------------
---------------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFA
-CFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF-------
---GKK-VDDGS--EVST-SRTEVSSVS-NSSVS---------------------------
------------------------------------PA-----------------------
---
-> 13== S75720 1 chicken P-opsin <>[Science267(5203),1502-1506'95]
---------------------------------MS-----------------SNSS-----
--------------QAP---------PNG-----------TPGPFDGPQWPYQAPQST---
---------------YVGVAVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVA
-DLLVTLCG-SSVSLSNNIN-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVV
-VCKPLGD-FQFQRRHAVSGCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPN
-WYTGGSNN--NSYILSLFVTCFVLPLSLILFSYTNLLLTL----RA--------------
-------------------------------------------------------AAAQQK
-------------------------------------------------------------
---------------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFA
-LVVAT-HKGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY---
--QPQR-TGKAS--PGTPGPHADVTAAGLRNKVM---------------------------
------------------------------------PAHPV--------------------
---
+-------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFALVVAT-H
+KGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY----QPQR-T
+GKAS--PGTPGPHADVTAAGLRNKVMPAHPV-----------------------------
+---------------------------------------------------------
> 14== M17718 1 D.melanogaster Rh3 <>[J.Neurosci.7,1550-1557'87]
-----------MES--GNV-----------SSSLFGNVSTAL----------RPEA-----
--------------RLSA------ETRLL----------GWNVPPEELR--HIPEHWLTYP
-E--------PPESMNYLLGTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFC
-DFMMMVK--TPIFIYNSFH-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNV
-ITRPMEG--KMTHGKAIAMIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFD
-YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA--------------
-------------------------------------------------------LRDQAK
-KMN---------------VESLRS------------------------------------
--------------------NVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMS
-LIGAF-GDKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---
----NE-KAPES----SAVASTSTTQEPQQTTAA---------------------------
-------------------------------------------------------------
---
+----------MESGNVSS------------SLFGNVST-ALRP----------------E
+ARLS--A----------ETRLLGWNVPPEELR--------HIPEHWLTYPEPPESMNYLL
+GTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFCDFMMMVK--TPIFIYNSF
+H-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNVITRPMEG--KMTHGKAIA
+MIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMSLIGAF-G
+DKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---------N
+EKAP--ESSAVASTSTTQEP--QQTTAA--------------------------------
+---------------------------------------------------------
> 15== X65879 1 Drosophila pseudoobscura Dpse\Rh3 <>[Genetics132(1),193-204'92
-----------MEY--HNV-----------SSVL-GNVSSVL----------RPDA-----
--------------RLSA------ESRLL----------GWNVPPDELR--HIPEHWLIYP
-E--------PPESMNYLLGTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFC
-DFMMMIK--TPIFIYNSFH-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNV
-ITRPMEG--KMTHGKAIAMIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFD
-YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA--------------
-------------------------------------------------------LRDQAK
-KMN---------------VDSLRS------------------------------------
--------------------NVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMS
-LIGAF-GDKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---
----SE-KAPES----RAAISTSTTQEQQQTTAA---------------------------
-------------------------------------------------------------
---
+----------MEYHNVSS------------VL-GNVSS-VLRP----------------D
+ARLS--A----------ESRLLGWNVPPDELR--------HIPEHWLIYPEPPESMNYLL
+GTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFCDFMMMIK--TPIFIYNSF
+H-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNVITRPMEG--KMTHGKAIA
+MIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VDSL------------------------------------------------------
+----------RSNVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMSLIGAF-G
+DKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---------S
+EKAP--ESRAAISTSTTQEQ--QQTTAA--------------------------------
+---------------------------------------------------------
> 16== M17730 1 D.melanogaster Rh4 opsin <>[J.Neurosci.7,1558-1566'87]
-----------ME-------------------PLCNASEPPL----------RPEA-----
--------------R-SSG---NGDLQFL----------GWNVPPDQIQ--YIPEHWLTQL
-E--------PPASMHYMLGVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVF
-DLIMCLK--APIF--NSFH-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV
-ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD
-YLS--DNFDTRLFVGTIFFFSFVCPTLMILYYYSQIVGHVFSHEKA--------------
-------------------------------------------------------LREQAK
-KMN---------------VESLRS------------------------------------
--------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS
-LIGAF-GDKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---
----NE-KSGEI----SSAQSTTTQEQ-QQTTAA---------------------------
-------------------------------------------------------------
---
+----------ME------------------PL-CNASEPPLRP----------------E
+AR-S--SG---N----GDLQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+GVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIF--NSF
+H-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+FFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+DKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---------N
+EKSG--EISSAQST-TTQEQ--QQTTAA--------------------------------
+---------------------------------------------------------
> 17== X65880 1 Drosophila pseudoobscura Dpse\Rh4 <>[Genetics132(1),193-204'92
-----------MD-------------------ALCNASEPPL----------RPEA-----
--------------RMSSG---SDELQFL----------GWNVPPDQIQ--YIPEHWLTQL
-E--------PPASMHYMLGVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVF
-DLIMCLK--APIFIYNSFH-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV
-ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD
-YLS--DNFDTRLFVGTIFLFSFVVPTLMILYYYSQIVGHVFNHEKA--------------
-------------------------------------------------------LREQAK
-KMN---------------VESLRS------------------------------------
--------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS
-LIGAF-GDKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---
----NE-KSGEA----SSAQSTTTQEQTQQTSAA---------------------------
-------------------------------------------------------------
---
+----------MD------------------AL-CNASEPPLRP----------------E
+ARMS--SG---S----DELQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+GVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIFIYNSF
+H-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+LFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKK-------------------------
+--------------------------------------------------MN--------
+--VESL------------------------------------------------------
+----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+DKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---------N
+EKSG--EASSAQST-TTQEQ-TQQTSAA--------------------------------
+---------------------------------------------------------
> 18== D50584 1 Hemigrapsus sanguineus opsin BcRh2 [J.Exp.Biol.1
---------------------------------MTNATGPQM----------AYYG-----
--------------AASMD-FGYPEGVSI----------VDFVRPEIKP--YVHQHWYNYP
-P--------VNPMWHYLLGVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALS
-DLIMLTTN-VPFFTYNCFSGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNI
-ICNGFNG-PKLTTGKAVVFALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYD
-YLT--QDFNTFSYNIFIFVFDYFLPAAIIVFSYVFIVKAIFAHEAA--------------
-------------------------------------------------------MRAQAK
-KMN---------------VSTLRS------------------------------------
---------------------NEADAQR------AEIRIAKTALVNVSLWFICWTPYALIS
-LKGVM-GDTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV---
----HE-TETKS-NDDSQSNSTVAQDKA---------------------------------
-------------------------------------------------------------
---
+--------------------------------MTNATGPQMAY----------------Y
+GAAS--MD-FGY----PEGVSIVDFVRPEIKP--------YVHQHWYNYPPVNPMWHYLL
+GVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALSDLIMLTTN-VPFFTYNCF
+SGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNIICNGFNG-PKLTTGKAVV
+FALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYDYLT--QDFNTFSYNIFIF
+VFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+--------------------------------------------------MN--------
+--VSTL------------------------------------------------------
+----------RS-NEADAQR------AEIRIAKTALVNVSLWFICWTPYALISLKGVM-G
+DTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV------HE-T
+ETKS--NDDSQSNSTVAQDK-A--------------------------------------
+---------------------------------------------------------
> 19== D50583 1 Hemigrapsus sanguineus opsin BcRh1 [J.Exp.Biol.1
---------------------------------MANVTGPQM----------AFYG-----
--------------SGAAT-FGYPEGMTV----------ADFVPDRVKH--MVLDHWYNYP
-P--------VNPMWHYLLGVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALS
-DLIMLTTN-FPPFCYNCFSGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNI
-ICNGFNG-PKLTQGKATFMCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYD
-YFT--RDMNTITYNICIFIFDFFLPASVIVFSYVFIVKAIFAHEAA--------------
-------------------------------------------------------MRAQAK
-KMN---------------VTNLRS------------------------------------
---------------------NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAIT
-IQGLL-GNAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV---
----HE-KDPND-VEENQSSNTQTQEKS---------------------------------
-------------------------------------------------------------
---
+--------------------------------MANVTGPQMAF----------------Y
+GSGA--AT-FGY----PEGMTVADFVPDRVKH--------MVLDHWYNYPPVNPMWHYLL
+GVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALSDLIMLTTN-FPPFCYNCF
+SGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNIICNGFNG-PKLTQGKATF
+MCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYDYFT--RDMNTITYNICIF
+IFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+--------------------------------------------------MN--------
+--VTNL------------------------------------------------------
+----------RS-NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAITIQGLL-G
+NAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV------HE-K
+DPND--VEENQSSNTQTQEK-S--------------------------------------
+---------------------------------------------------------
> 20== K02320 1 D.melanogaster opsin <>[Cell40,851-858'85]
----------------MES-----------FAVAAAQLGPHF----------APLS-----
-------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP
-A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-IVKGMAG-RPMTIPLALGKM---------------------------YVPEGNLTSCGID
-YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-------------------------------------------------------MREQAK
-KMN---------------VKSLRS------------------------------------
---------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN
-CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
----GK-VDDGK-SSDAQSQATASEAESKA-------------------------------
-------------------------------------------------------------
---
+----------ME----SF------------AVAAAQLGPHFAP----------------L
+S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KM---------------------------YVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+---------------------------------------------------------
> 21== K02315 1 D.melanogaster ninaE <>[Cell40,839-850'85]
----------------MES-----------FAVAAAQLGPHF----------APLS-----
-------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP
-A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-IVKGMAG-RPMTIPLALGKIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGID
-YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-------------------------------------------------------MREQAK
-KMN---------------VKSLRS------------------------------------
---------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN
-CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
----GK-VDDGK-SSDAQSQATASEAESKA-------------------------------
-------------------------------------------------------------
---
+----------ME----SF------------AVAAAQLGPHFAP----------------L
+S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+---------------------------------------------------------
> 22== X65877 1 Drosophila pseudoobscura Dpse\ninaE <>[Genetics132(1),193-204'
----------------MDS-----------FAAVATQLGPQF----------AAPS-----
-------------------------NGSV----------VDKVTPDMAH--LISPYWDQFP
-A--------MDPIWAKILTAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-IVKGMAG-RPMTIPLALGKIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGID
-YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-------------------------------------------------------MREQAK
-KMN---------------VKSLRS------------------------------------
---------------------SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVIN
-CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
----GK-VDDGK-SSEAQSQATTSEAESKA-------------------------------
-------------------------------------------------------------
---
+----------MD----SF------------AAVATQLGPQFAA----------------P
+S-----------------NGSVVDKVTPDMAH--------LISPYWDQFPAMDPIWAKIL
+TAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+KIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVINCMGLF-K
+F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+DDGK--SSEAQSQA-TTSEA-ESKA-----------------------------------
+---------------------------------------------------------
> 23== M12896 1 D.melanogaster Rh2 <>[Cell44,705-710'86]
-----------MERSHLPE-----------TPFDLAHSGPRF----------QAQS-----
--------------SG---------NGSV----------LDNVLPDMAH--LVNPYWSRFA
-P--------MDPMMSKILGLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS
-DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNV
-IVKGING-TPMTIKTSIMKILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSID
-YMT--RMWNPRSYLITYSLFVYYTPLFLICYSYWFIIAAVAAHEKA--------------
-------------------------------------------------------MREQAK
-KMN---------------VKSLRS------------------------------------
---------------------SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVIC
-YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF---
----GN-TDEPKPDAPASDTETTSEADSKA-------------------------------
-------------------------------------------------------------
---
+-----MERSHLP----ET------------PFDLAHSGPRFQA----------------Q
+SSG---------------NGSVLDNVLPDMAH--------LVNPYWSRFAPMDPMMSKIL
+GLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+Y-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+KILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSIDYMT--RMWNPRSYLITYS
+LFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVICYFGLF-K
+I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF------GN-T
+DEPK--PDAPASDTETTSEA-DSKA-----------------------------------
+---------------------------------------------------------
> 24== X65878 1 Drosophila pseudoobscura Dpse\Rh2 <>[Genetics132(1),193-204'92
-----------MERSLLPE-----------PPLAMALLGPRF----------EAQT-----
--------------GG---------NRSV----------LDNVLPDMAP--LVNPHWSRFA
-P--------MDPTMSKILGLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS
-DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNV
-IVKGING-TPMTIKTSIMKIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSID
-YMT--RQWNPRSYLITYSLFVYYTPLFMICYSYWFIIATVAAHEKA--------------
-------------------------------------------------------MRDQAK
-KMN---------------VKSLRS------------------------------------
---------------------SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIIC
-YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC---
----GT-TDEPKPDAPPSDTETTSEAESKD-------------------------------
-------------------------------------------------------------
---
+-----MERSLLP----EP------------PLAMALLGPRFEA----------------Q
+TGG---------------NRSVLDNVLPDMAP--------LVNPHWSRFAPMDPTMSKIL
+GLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+Y-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+KIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSIDYMT--RQWNPRSYLITYS
+LFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKK-------------------------
+--------------------------------------------------MN--------
+--VKSL------------------------------------------------------
+----------RS-SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIICYFGLF-K
+I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC------GT-T
+DEPK--PDAPPSDTETTSEA-ESKD-----------------------------------
+---------------------------------------------------------
> 25== U26026 1 Apis mellifera long-wavelength rhodopsin <>[]
---------------------------------MIAVSGPSY----------EAFS-----
--------------YGGQARF---NNQTV----------VDKVPPDMLH--LIDANWYQYP
-P--------LNPMWHGILGFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAIS
-NFLMMFCM-SPPMVINCYY-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNV
-IVKGLSG-KPLSINGALIRIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTD
-YFN--RGLLSASYLVCYGIWVYFVPLFLIIYSYWFIIQAVAAHEKN--------------
-------------------------------------------------------MREQAK
-KMN---------------VASLRS------------------------------------
---------------------SENQNTS------AECKLAKVALMTISLWFMAWTPYLVIN
-FSGIF-NL-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC---
-----A-AEPSS-DAVSTTSGTTTVTDNEKSNA----------------------------
-------------------------------------------------------------
---
+--------------------------------MIAVSGPSYEA----------------F
+SYGG--QARF-------NNQTVVDKVPPDMLH--------LIDANWYQYPPLNPMWHGIL
+GFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAISNFLMMFCM-SPPMVINCY
+Y-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNVIVKGLSG-KPLSINGALI
+RIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTDYFN--RGLLSASYLVCYG
+IWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKK-------------------------
+--------------------------------------------------MN--------
+--VASL------------------------------------------------------
+----------RS-SENQNTS------AECKLAKVALMTISLWFMAWTPYLVINFSGIF-N
+L-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC-------A-A
+EPSS--DAVSTTSGTTTVTD-NEKSNA---------------------------------
+---------------------------------------------------------
> 26== L03781 1 Limulus polyphemus opsin <>[PNAS90,6150-6154'93]
-----------------------------------MANQLSY----------SSLG-----
--------------WPYQP------NASV----------VDTMPKEMLY--MIHEHWYAFP
-P--------MNPLWYSILGVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFS
-DFCMMAFM-MPTMTSNCFA-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNV
-IVRGMAA-APLTHKKATLLLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVD
-YLT--KDWSSASYVVIYGLAVYFLPLITMIYCYFFIVHAVAEHEKQ--------------
-------------------------------------------------------LREQAK
-KMN---------------VASLRA------------------------------------
--------------------NADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIIS
-WAGVF-SSGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC---
----GS-GESGS-DVKSEASATTTMEEKPKIPEA---------------------------
-------------------------------------------------------------
---
+----------------------------------MANQLSYSS----------------L
+GWPY--QP----------NASVVDTMPKEMLY--------MIHEHWYAFPPMNPLWYSIL
+GVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFSDFCMMAFM-MPTMTSNCF
+A-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNVIVRGMAA-APLTHKKATL
+LLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVDYLT--KDWSSASYVVIYG
+LAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKK-------------------------
+--------------------------------------------------MN--------
+--VASL------------------------------------------------------
+----------RANADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIISWAGVF-S
+SGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC------GS-G
+ESGS--DVKSEASATTTMEE-KPKIPEA--------------------------------
+---------------------------------------------------------
> 27== X07797 1 Octopus dofleini rhodopsin <>[FEBS232(1),69-72'88]
----------------------------------------MV----------ESTT-----
--------------LVNQT-WWY--NPTV----------D------------IHPHWAKFD
-P--------IPDAVYYSVGIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMS
-DLSFSAINGFPLKTISAFM-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNV
-IGRPMAASKKMSHRRAFLMIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFD
-YLS--TDPSTRSFILCMYFCGFMLPIIIIAFCYFNIVMSVSNHEKE--------------
-------------------------------------------------------MAAMAK
-RLN---------------AKELR-------------------------------------
---------------------KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIA
-LLAQF-GPAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQ
-FDEKE-CEDAN-DAEEEVVASER--GGESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQG
-Y--PPQGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAY
-QA
+---------------------------------------MVES----------------T
+TLVN--QT-WWY------NPTVD------------------IHPHWAKFDPIPDAVYYSV
+GIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAF
+M-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFL
+MIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFDYLS--TDPSTRSFILCMY
+FCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+--------------------------------------------------LN--------
+--AKEL------------------------------------------------------
+----------R--KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIALLAQF-G
+PAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQFDEKE-C
+EDAN--DAEEEVVASER--G-GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PP
+QGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA
> 28== X70498 1 Todarodes pacificus rhodopsin [FEBS317(1-2),5-11'93]
-----------------------------------------M----------GRDL-----
--------------RDNET-WWY--NPSI----------V------------VHPHWREFD
-Q--------VPDAVYYSLGIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFS
-DFTFSLVNGFPLMTISCFL-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNV
-IGRPMAASKKMSHRRAFIMIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFD
-YIS--RDSTTRSNILCMFILGFFGPILIIFFCYFNIVMSVSNHEKE--------------
-------------------------------------------------------MAAMAK
-RLN---------------AKELR-------------------------------------
---------------------KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVA
-LLAQF-GPLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQ
-FDDKE-TEDDK-DAETEIPAGESSDAAPSADAAQMKEMMAMMQKMQQQQAAY----PPQG
-YAPPPQGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAY
-QA
+----------------------------------------MGR----------------D
+LRDN--ET-WWY------NPSIV------------------VHPHWREFDQVPDAVYYSL
+GIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFSDFTFSLVNGFPLMTISCF
+L-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNVIGRPMAASKKMSHRRAFI
+MIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFDYIS--RDSTTRSNILCMF
+ILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+--------------------------------------------------LN--------
+--AKEL------------------------------------------------------
+----------R--KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVALLAQF-G
+PLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQFDDKE-T
+EDDK--DAETEIPAGESSDA-APSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPP
+QGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQA
> 29== L21195 1 human serotonin 5-HT7 receptor protein 30== L15228 1 rat 5HT-7 serotonin receptor <>[JBC268,18200-18204'93]
------------------------------------------------------------
-----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN---
----------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA
-DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
---------------------------------------------P----GFPRVQPESVI
-SLNG--------------VVKLQ----------------------KEVEECANLSR----
---------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQC------
----QY-RNINR--KLSAAGMHEALKLAER-------------------------------
------------------------------------PERSEFVL-QNSDHCGKKGHDT---
---
+------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+---------------------------------PGFPRV----QPESVISLNG-------
+--VVKL----------------------QK---------EVEECAN--------------
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQCQYR----NINR--
+------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
+--------------------------------------------CGKKGHDT-----
> 31=p A47425 serotonin receptor 5HT-7 - rat
------------------------------------------------------------
-----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN---
----------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA
-DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
---------------------------------------------P----GFPRVQPESVI
-SLNG--------------VVKLQ----------------------KEVEECANLSR----
---------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------
----QY-RNINR--KLSAAGMHEALKLAER-------------------------------
------------------------------------PERSEFVL-QNSDHCGKKGHDT---
---
+------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+---------------------------------PGFPRV----QPESVISLNG-------
+--VVKL----------------------QK---------EVEECAN--------------
+----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR--
+------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
+--------------------------------------------CGKKGHDT-----
> 32== M83181 1 human serotonin receptor <>[JBC267(11),7553-7562'92]
-----------MDVLSPG------------QGNNTTSPPAPF----------ETGG-----
--------------NTTGI-----SDVTV--------------------------------
-------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT
-DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA
-ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD
-H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK--------------
--------------------------TVKKVEKTGADTRHGASPAP---------QPKKS-
--VNGESGSRNWRL-----GVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPL
-PSEAG--PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA
-LVLPF-CESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------
----KF-CRQ---------------------------------------------------
+----------MDVLSP--------------------------------------------
+---------------GQGNNTTSPPAPFET-GGNTTGISDVT---------VSYQ--VIT
+SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+--------------TVKKVEKTGADTRHGASPAPQPKKS-----------VNGESGSR--
+-------NWRLGVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPLPSEAG--
+PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+ESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RQ----
------------------------------------------------------------
---
+---------------------------------------------------------
> 33=p A35181 serotonin receptor class 1A - rat
-----------MDVFSFG------------QGNNTTASQEPF----------GTGG-----
--------------NVTSI-----SDVTF--------------------------------
-------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT
-DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA
-ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD
-H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK--------------
--------------------------TVRKVEKKGAGTSLGTSSAP---------PPKKS-
--LNGQPGSGDWRR-----CAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPL
-PSESG--SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA
-LVLPF-CESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------
----KF-CRR---------------------------------------------------
+----------MDVFSF--------------------------------------------
+---------------GQGNNTTASQEPFGT-GGNVTSISDVT---------FSYQ--VIT
+SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+--------------TVRKVEKKGAGTSLGTSSAPPPKKS-----------LNGQPGSG--
+-------DWRRCAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPLPSESG--
+SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+ESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RR----
------------------------------------------------------------
---
+---------------------------------------------------------
> 34== L06803 1 Lymnaea stagnalis serotonin receptor <>[PNAS90,11-15'93]
-MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG-----
--------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT
-DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA
-DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA
-VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD
-K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE
-TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN
-GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN
-DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA
-LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------
----KY-RRGHR-------------------------------------------------
+MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
------------------------------------------------------------
---
+---------------------------------------------------------
> 35=p A47174 serotonin receptor, 5HTlym receptor - great pond snail
-MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG-----
--------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT
-DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA
-DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA
-VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD
-K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE
-TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN
-GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN
-DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA
-LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------
----KY-RRGHR-------------------------------------------------
+MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+-------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+-----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
------------------------------------------------------------
---
+---------------------------------------------------------
> 36== X95604 1 Bombyx mori serotonin receptor [InsectBiochem.Mol.Bi
--MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGW----------EPNW-----
--------------NVTVV-----PNTTW---------WQASAPFDTPA--ALVRAAAK--
-------------------AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVA
-DLLVACLV-MPLGAVYEVV-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWA
-VTN-IDYIHASTAKRVGMMIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQD
-V----------GYQIFATASSFYVPVLIILILYWRIYQTARKRIR---------------
-------------------------------RRRGATARGGVGPPP---------VPAGGA
-LVAGGGSGGIAAAVVAVIGRPLPTISETTTTGFTNVSSNNTS---PEKQSCANGLEADPP
-TTGYGAVAAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLA
-ILVPT-CDCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCG------
----RR-VRRRR--A----------------------------------------------
------------------------------------PQ-----------------------
---
+-MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGWEPNWNV------------T
+VVPN--TTWW------------QASAPFDTPAALVRAAAK--------------------
+AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVADLLVACLV-MPLGAVYEV
+V-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWAVTN-IDYIHASTAKRVGM
+MIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQDV----------GYQIFAT
+ASSFYVPVLIILILYWRIY-------QTARKRIR--------------------------
+-------------------RRRGATARGGVGPPP---------VPAGGALVAGGGSGGIA
+AAVVAVIGRPLPTISETTTTGFTNVSS----NNTSP---EKQSCANGLEADPPTTGYGAV
+AAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLAILVPT-C
+DCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCGRRV----RRRR--
+------A---------------PQ------------------------------------
+---------------------------------------------------------
diff -r c5908940967d -r aaefa93c2dd2 test-data/mafft_nwns_result.aln
--- a/test-data/mafft_nwns_result.aln Sat Nov 11 15:06:34 2017 -0500
+++ b/test-data/mafft_nwns_result.aln Wed Apr 15 15:33:37 2020 -0400
@@ -1,270 +1,270 @@
-CLUSTAL format alignment by MAFFT NW-NS-2 (v7.221)
+CLUSTAL format alignment by MAFFT NW-NS-2 (v7.455)
-1== --------------------------------MNGTE--------------GDNF-----
-2== --------------------------------MNGTE--------------GPNF-----
-3== --------------------------------MNGTE--------------GINF-----
-4=p --------------------------------MNGTE--------------GKNF-----
-5=p --------------------------------MNGTE--------------GNNF-----
-6== --------------------------------MKQVPEF------------HEDF-----
-7== --------------------------------MRKMS--------------EEEF-----
+1== ----------------------------------------MNG----------------T
+2== ----------------------------------------MNG----------------T
+3== ----------------------------------------MNG----------------T
+4=p ----------------------------------------MNG----------------T
+5=p ----------------------------------------MNG----------------T
+6== ----------------------------------------MKQ----------------V
+7== ----------------------------------------MRK----------------M
8=opsin, ------------------------------------------------------------
-9== --------------------------------MAQQWSLQRLAGRHPQDSYEDST-----
-10== --------------------------------MAQQWSLQRLAGRHPQDSYEDST-----
-11== --------------------------------MTEAWNVAVFAARRSRDD-DDTT-----
-12== --------------------------------MAA-WEAAFAARRRHEE--EDTT-----
-13== --------------------------------MS-----------------SNSS-----
-14== ----------MES--GNV-----------SSSLFGNVSTAL----------RPEA-----
-15== ----------MEY--HNV-----------SSVL-GNVSSVL----------RPDA-----
-16== ----------ME-------------------PLCNASEPPL----------RPEA-----
-17== ----------MD-------------------ALCNASEPPL----------RPEA-----
-18== --------------------------------MTNATGPQM----------AYYG-----
-19== --------------------------------MANVTGPQM----------AFYG-----
-20== ---------------MES-----------FAVAAAQLGPHF----------APLS-----
-21== ---------------MES-----------FAVAAAQLGPHF----------APLS-----
-22== ---------------MDS-----------FAAVATQLGPQF----------AAPS-----
-23== ----------MERSHLPE-----------TPFDLAHSGPRF----------QAQS-----
-24== ----------MERSLLPE-----------PPLAMALLGPRF----------EAQT-----
-25== --------------------------------MIAVSGPSY----------EAFS-----
-26== ----------------------------------MANQLSY----------SSLG-----
-27== ---------------------------------------MV----------ESTT-----
-28== ----------------------------------------M----------GRDL-----
-29== ---------MMDVNSSGRPDLYGHLRSF-LLPEVGRGLPDL----------SPDGGADPV
+9== ----------------------------------------MAQQWSLQRLAGRHPQDSYE
+10== ----------------------------------------MAQQWSLQRLAGRHPQDSYE
+11== ----------------------------------------MTEAWNVAVFAARRSRDD-D
+12== ----------------------------------------MAA-WEAAFAARRRHEE--E
+13== ----------------------------------------MS-----------------S
+14== ----------MESGNVSS------------SLFGNVST-ALRP----------------E
+15== ----------MEYHNVSS------------VL-GNVSS-VLRP----------------D
+16== ----------ME------------------PL-CNASEPPLRP----------------E
+17== ----------MD------------------AL-CNASEPPLRP----------------E
+18== --------------------------------MTNATGPQMAY----------------Y
+19== --------------------------------MANVTGPQMAF----------------Y
+20== ----------ME----SF------------AVAAAQLGPHFAP----------------L
+21== ----------ME----SF------------AVAAAQLGPHFAP----------------L
+22== ----------MD----SF------------AAVATQLGPQFAA----------------P
+23== -----MERSHLP----ET------------PFDLAHSGPRFQA----------------Q
+24== -----MERSLLP----EP------------PLAMALLGPRFEA----------------Q
+25== --------------------------------MIAVSGPSYEA----------------F
+26== ----------------------------------MANQLSYSS----------------L
+27== ---------------------------------------MVES----------------T
+28== ----------------------------------------MGR----------------D
+29== ---------MMDVNSSGRPDLYGHLRSFL-LPEVGRGLPDLSPDGGA------------D
30== ------------------------------------------------------------
31=p ------------------------------------------------------------
-32== ----------MDVLSPG------------QGNNTTSPPAPF----------ETGG-----
-33=p ----------MDVFSFG------------QGNNTTASQEPF----------GTGG-----
-34== MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG-----
-35=p MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGL----------SPTG-----
-36== -MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGW----------EPNW-----
+32== ----------MDVLSP--------------------------------------------
+33=p ----------MDVFSF--------------------------------------------
+34== MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+35=p MANFTFGDLALDVARMG-----GLASTPSGLRSTGLTTPGLSPTGLV------------T
+36== -MEGAEGQEELDWEAL-------YLRLP--LQNCSWNSTGWEPNWNV------------T
-1== -------------YVP-----F-SNKTG----------LARSPYEYPQY-YLAEPWK---
-2== -------------YVP-----F-SNITG----------VVRSPFEQPQY-YLAEPWQ---
-3== -------------YVP-----M-SNKTG----------VVRSPFEYPQY-YLAEPWK---
-4=p -------------YVP-----M-SNRTG----------LVRSPFEYPQY-YLAEPWQ---
-5=p -------------YVP-----L-SNRTG----------LVRSPFEYPQY-YLAEPWQ---
-6== -------------YIPIP-LDI-NNLS------------AYSPFLVPQD-HLGNQGI---
-7== -------------YL------F-KNIS------------SVGPWDGPQY-HIAPVWA---
+1== E--G--DNFYVP----FSNKTGLARSPYEYPQY-------YLAEPWK---------YSAL
+2== E--G--PNFYVP----FSNITGVVRSPFEQPQY-------YLAEPWQ---------FSML
+3== E--G--INFYVP----MSNKTGVVRSPFEYPQY-------YLAEPWK---------YRLV
+4=p E--G--KNFYVP----MSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKIL
+5=p E--G--NNFYVP----LSNRTGLVRSPFEYPQY-------YLAEPWQ---------FKLL
+6== PEFH--EDFYIPIPLDINNLS--AYSPFLVPQD-------HLGNQGI---------FMAM
+7== S--E--EEFYL-----FKNIS--SVGPWDGPQY-------HIAPVWA---------FYLQ
8=opsin, ------------------------------------------------------------
-9== -------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV---
-10== -------------QSSI--FTY-TNSNS-----------TRGPFEGPNY-HIAPRWV---
-11== -------------RGSV--FTY-TNTNN-----------TRGPFEGPNY-HIAPRWV---
-12== -------------RDSV--FTY-TNSNN-----------TRGPFEGPNY-HIAPRWV---
-13== -------------QAP---------PNG-----------TPGPFDGPQWPYQAPQST---
-14== -------------RLSA------ETRLL----------GWNVPPEELR--HIPEHWLTYP
-15== -------------RLSA------ESRLL----------GWNVPPDELR--HIPEHWLIYP
-16== -------------R-SSG---NGDLQFL----------GWNVPPDQIQ--YIPEHWLTQL
-17== -------------RMSSG---SDELQFL----------GWNVPPDQIQ--YIPEHWLTQL
-18== -------------AASMD-FGYPEGVSI----------VDFVRPEIKP--YVHQHWYNYP
-19== -------------SGAAT-FGYPEGMTV----------ADFVPDRVKH--MVLDHWYNYP
-20== ------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP
-21== ------------------------NGSV----------VDKVTPDMAH--LISPYWNQFP
-22== ------------------------NGSV----------VDKVTPDMAH--LISPYWDQFP
-23== -------------SG---------NGSV----------LDNVLPDMAH--LVNPYWSRFA
-24== -------------GG---------NRSV----------LDNVLPDMAP--LVNPHWSRFA
-25== -------------YGGQARF---NNQTV----------VDKVPPDMLH--LIDANWYQYP
-26== -------------WPYQP------NASV----------VDTMPKEMLY--MIHEHWYAFP
-27== -------------LVNQT-WWY--NPTV----------D------------IHPHWAKFD
-28== -------------RDNET-WWY--NPSI----------V------------VHPHWREFD
-29== AGSWAPHLLS---EVTAS-----PAPTW------------DAPPDNAS--GCGEQIN---
-30== ----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN---
-31=p ----MPHLLSGFLEVTAS-----PAPTW------------DAPPDNVS--GCGEQIN---
-32== -------------NTTGI-----SDVTV--------------------------------
-33=p -------------NVTSI-----SDVTF--------------------------------
-34== -------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT
-35=p -------------LVTSD-----FNDSYGLTGQFINGSHSSRSRDNAS--ANDTSATNMT
-36== -------------NVTVV-----PNTTW---------WQASAPFDTPA--ALVRAAAK--
-
-
-1== --------------YSALAAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMA
-2== --------------FSMLAAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVA
-3== --------------YRLVCCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVA
-4=p --------------FKILALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVA
-5=p --------------FKLLAVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVA
-6== --------------FMAMSVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIA
-7== --------------FYLQAAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFG
-8=opsin, ------------------------------------------------------------
-9== --------------YHLTSVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA
-10== --------------YHLTSVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVA
-11== --------------YNLVSFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFV
-12== --------------YNLTSVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVA
-13== --------------YVGVAVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVA
-14== E--------PPESMNYLLGTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFC
-15== E--------PPESMNYLLGTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFC
-16== E--------PPASMHYMLGVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVF
-17== E--------PPASMHYMLGVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVF
-18== P--------VNPMWHYLLGVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALS
-19== P--------VNPMWHYLLGVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALS
-20== A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-21== A--------MDPIWAKILTAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-22== A--------MDPIWAKILTAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAIS
-23== P--------MDPMMSKILGLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS
-24== P--------MDPTMSKILGLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFS
-25== P--------LNPMWHGILGFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAIS
-26== P--------MNPLWYSILGVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFS
-27== P--------IPDAVYYSVGIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMS
-28== Q--------VPDAVYYSLGIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFS
-29== ---------YGRVEKVVIGSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALA
-30== ---------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA
-31=p ---------YGRVEKVVIGSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALA
-32== ------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT
-33=p ------------SYQVITSLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVT
-34== DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA
-35=p DDRYWSLTVYSHEHLVLTSVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVA
-36== ------------------AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVA
+9== DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+10== DSTQ--SSIFT-----YTNSNS-TRGPFEGPNY-------HIAPRWV---------YHLT
+11== DTTR--GSVFT-----YTNTNN-TRGPFEGPNY-------HIAPRWV---------YNLV
+12== DTTR--DSVFT-----YTNSNN-TRGPFEGPNY-------HIAPRWV---------YNLT
+13== NSSQ--AP-----------PNG-TPGPFDGPQW------PYQAPQST---------YVGV
+14== ARLS--A----------ETRLLGWNVPPEELR--------HIPEHWLTYPEPPESMNYLL
+15== ARLS--A----------ESRLLGWNVPPDELR--------HIPEHWLIYPEPPESMNYLL
+16== AR-S--SG---N----GDLQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+17== ARMS--SG---S----DELQFLGWNVPPDQIQ--------YIPEHWLTQLEPPASMHYML
+18== GAAS--MD-FGY----PEGVSIVDFVRPEIKP--------YVHQHWYNYPPVNPMWHYLL
+19== GSGA--AT-FGY----PEGMTVADFVPDRVKH--------MVLDHWYNYPPVNPMWHYLL
+20== S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+21== S-----------------NGSVVDKVTPDMAH--------LISPYWNQFPAMDPIWAKIL
+22== S-----------------NGSVVDKVTPDMAH--------LISPYWDQFPAMDPIWAKIL
+23== SSG---------------NGSVLDNVLPDMAH--------LVNPYWSRFAPMDPMMSKIL
+24== TGG---------------NRSVLDNVLPDMAP--------LVNPHWSRFAPMDPTMSKIL
+25== SYGG--QARF-------NNQTVVDKVPPDMLH--------LIDANWYQYPPLNPMWHGIL
+26== GWPY--QP----------NASVVDTMPKEMLY--------MIHEHWYAFPPMNPLWYSIL
+27== TLVN--QT-WWY------NPTVD------------------IHPHWAKFDPIPDAVYYSV
+28== LRDN--ET-WWY------NPSIV------------------VHPHWREFDQVPDAVYYSL
+29== PVAGSWAPHLLS------EVTASPAPTWDAPPDNASGCGEQIN--------YGRVEKVVI
+30== ------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+31=p ------MPHLLS---GFLEVTASPAPTWDAPPDNVSGCGEQIN--------YGRVEKVVI
+32== ---------------GQGNNTTSPPAPFET-GGNTTGISDVT---------VSYQ--VIT
+33=p ---------------GQGNNTTASQEPFGT-GGNVTSISDVT---------FSYQ--VIT
+34== SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+35=p SDFN--DSYGLT---GQFINGSHSSRSRDNASANDTSATNMTDDRYWSLTVYSHEHLVLT
+36== VVPN--TTWW------------QASAPFDTPAALVRAAAK--------------------
-1== NLFMVLFG-FTVTMYTSMN-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIV
-2== DLFMVFGG-FTTTLYTSLH-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVV
-3== DLFMACFG-FTVTFYTAWN-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIV
-4=p GTIMVCFG-FTVTFYTAIN-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV
-5=p GAIMVCFG-FTVTFYTAIN-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIV
-6== NLFVAIFG-SPLSFYSFFN-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLV
-7== GFLLCIFS-VFPVFVASCN-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIV
-8=opsin, DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV
-9== DLAETVIA-STISVVNQVY-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMV
-10== DLAETVIA-STISIVNQVS-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLV
-11== DLVETLVA-STISVFNQIF-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFV
-12== DLGETVIA-STISVINQIS-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFV
-13== DLLVTLCG-SSVSLSNNIN-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVV
-14== DFMMMVK--TPIFIYNSFH-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNV
-15== DFMMMIK--TPIFIYNSFH-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNV
-16== DLIMCLK--APIF--NSFH-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV
-17== DLIMCLK--APIFIYNSFH-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNV
-18== DLIMLTTN-VPFFTYNCFSGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNI
-19== DLIMLTTN-FPPFCYNCFSGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNI
-20== DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-21== DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-22== DFGIMITN-TPMMGINLYF-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQV
-23== DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNV
-24== DFCMMASQ-SPVMIINFYY-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNV
-25== NFLMMFCM-SPPMVINCYY-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNV
-26== DFCMMAFM-MPTMTSNCFA-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNV
-27== DLSFSAINGFPLKTISAFM-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNV
-28== DFTFSLVNGFPLMTISCFL-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNV
-29== DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-30== DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-31=p DLSVAVAV-MPFVSVTDLIGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLG
-32== DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA
-33=p DLMVSVLV-LPMAALYQVL-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWA
-34== DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA
-35=p DLMVAVLV-MPLSVVSEIS-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWA
-36== DLLVACLV-MPLGAVYEVV-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWA
- . : : * : : :*:
+1== AAYMFFLILVGFPVNFLTLFVTVQHKKLRTPLNYILLNLAMANLFMVLFG-FTVTMYTSM
+2== AAYMFLLIVLGFPINFLTLYVTVQHKKLRTPLNYILLNLAVADLFMVFGG-FTTTLYTSL
+3== CCYIFFLISTGLPINLLTLLVTFKHKKLRQPLNYILVNLAVADLFMACFG-FTVTFYTAW
+4=p ALYLFFLMSMGLPINGLTLVVTAQHKKLRQPLNFILVNLAVAGTIMVCFG-FTVTFYTAI
+5=p AVYMFFLICLGLPINGLTLICTAQHKKLRQPLNFILVNLAVAGAIMVCFG-FTVTFYTAI
+6== SVFMFFIFIGGASINILTILCTIQFKKLRSHLNYILVNLSIANLFVAIFG-SPLSFYSFF
+7== AAFMGTVFLIGFPLNAMVLVATLRYKKLRQPLNYILVNVSFGGFLLCIFS-VFPVFVASC
+8=opsin, ------------------------------------------DLAETVIA-STISIVNQV
+9== SVWMIFVVIASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISVVNQV
+10== SVWMIFVVTASVFTNGLVLAATMKFKKLRHPLNWILVNLAVADLAETVIA-STISIVNQV
+11== SFFMIIVVIASCFTNGLVLVATAKFKKLRHPLNWILVNLAFVDLVETLVA-STISVFNQI
+12== SVWMIFVVAASVFTNGLVLVATWKFKKLRHPLNWILVNLAVADLGETVIA-STISVINQI
+13== AVLMGTVVACASVVNGLVIVVSICYKKLRSPLNYILVNLAVADLLVTLCG-SSVSLSNNI
+14== GTLYIFFTLMSMLGNGLVIWVFSAAKSLRTPSNILVINLAFCDFMMMVK--TPIFIYNSF
+15== GTLYIFFTVISMIGNGLVMWVFSAAKSLRTPSNILVINLAFCDFMMMIK--TPIFIYNSF
+16== GVFYIFLFCASTVGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIF--NSF
+17== GVFYIFLFFASTLGNGMVIWIFSTSKSLRTPSNMFVLNLAVFDLIMCLK--APIFIYNSF
+18== GVIYLFLGTVSIFGNGLVIYLFNKSAALRTPANILVVNLALSDLIMLTTN-VPFFTYNCF
+19== GVVYLFLGVISIAGNGLVIYLYMKSQALKTPANMLIVNLALSDLIMLTTN-FPPFCYNCF
+20== TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+21== TAYMIMIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+22== TAYMIIIGMISWCGNGVVIYIFATTKSLRTPANLLVINLAISDFGIMITN-TPMMGINLY
+23== GLFTLAIMIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+24== GLFTLVILIISCCGNGVVVYIFGGTKSLRTPANLLVLNLAFSDFCMMASQ-SPVMIINFY
+25== GFVIGMLGFVSAMGNGMVVYIFLSTKSLRTPSNLFVINLAISNFLMMFCM-SPPMVINCY
+26== GVAMIILGIICVLGNGMVIYLMMTTKSLRTPTNLLVVNLAFSDFCMMAFM-MPTMTSNCF
+27== GIFIGVVGIIGILGNGVVIYLFSKTKSLQTPANMFIINLAMSDLSFSAINGFPLKTISAF
+28== GIFIGICGIIGCGGNGIVIYLFTKTKSLQTPANMFIINLAFSDFTFSLVNGFPLMTISCF
+29== GSILTLITLLTIAGNCLVVISVCFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+30== GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+31=p GSILTLITLLTIAGNCLVVISVSFVKKLRQPSNYLIVSLALADLSVAVAV-MPFVSVTDL
+32== SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+33=p SLLLGTLIFCAVLGNACVVAAIALERSLQNVANYLIGSLAVTDLMVSVLV-LPMAALYQV
+34== SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+35=p SVILGLFVLCCIIGNCFVIAAVMLERSLHNVANYLILSLAVADLMVAVLV-MPLSVVSEI
+36== AVVLGLLILATVVGNVFVIAAILLERHLRSAANNLILSLAVADLLVACLV-MPLGAVYEV
+ .
+
+1== N-GYFV--FGPTMCSIEGFFATLGGEVALWSLVVLAIERYIVICKPMGN-FRFGNTHAIM
+2== H-GYFV--FGPTGCNLEGFFATLGGEIGLWSLVVLAIERYVVVCKPMSN-FRFGENHAIM
+3== N-GYFV--FGPVGCAVEGFFATLGGQVALWSLVVLAIERYIVVCKPMGN-FRFSATHAMM
+4=p N-GYFV--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSSHAFA
+5=p N-GYFA--LGPTGCAVEGFMATLGGEVALWSLVVLAIERYIVVCKPMGS-FKFSSTHASA
+6== N-RYFI--FGATACKIEGFLATLGGMVGLWSLAVVAFERWLVICKPLGN-FTFKTPHAIA
+7== N-GYFV--FGRHVCALEGFLGTVAGLVTGWSLAFLAFERYIVICKPFGN-FRFSSKHALT
+8=opsin, S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+9== Y-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWMVVCKPFGN-VRFDAKLAIV
+10== S-GYFV--LGHPMCVLEGYTVSLCGITGLWSLAIISWERWLVVCKPFGN-VRFDAKLAIV
+11== F-GYFI--LGHPLCVIEGYVVSSCGITGLWSLAIISWERWFVVCKPFGN-IKFDSKLAII
+12== S-GYFI--LGHPMCVVEGYTVSACGITALWSLAIISWERWFVVCKPFGN-IKFDGKLAVA
+13== N-GFFV--FGRRMCELEGFMVSLTGIVGLWSLAILALERYVVVCKPLGD-FQFQRRHAVS
+14== H-QGYA--LGHLGCQIFGIIGSYTGIAAGATNAFIAYDRFNVITRPMEG--KMTHGKAIA
+15== H-QGYA--LGHLGCQIFGVIGSYTGIAAGATNAFIAYDRYNVITRPMEG--KMTHGKAIA
+16== H-RGFAIYLGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+17== H-RGFA--LGNTWCQIFASIGSYSGIGAGMTNAAIGYDRYNVITKPMNR--NMTFTKAVI
+18== SGGVWM--FSPQYCEIYACLGAITGVCSIWLLCMISFDRYNIICNGFNG-PKLTTGKAVV
+19== SGGRWM--FSGTYCEIYAALGAITGVCSIWTLCMISFDRYNIICNGFNG-PKLTQGKATF
+20== F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+21== F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+22== F-ETWV--LGPMMCDIYAGLGSAFGCSSIWSMCMISLDRYQVIVKGMAG-RPMTIPLALG
+23== Y-ETWV--LGPLWCDIYAGCGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+24== Y-ETWV--LGPLWCDIYAACGSLFGCVSIWSMCMIAFDRYNVIVKGING-TPMTIKTSIM
+25== Y-ETWV--LGPLFCQIYAMLGSLFGCGSIWTMTMIAFDRYNVIVKGLSG-KPLSINGALI
+26== A-ETWI--LGPFMCEVYGMAGSLFGCASIWSMVMITLDRYNVIVRGMAA-APLTHKKATL
+27== M-KKWI--FGKVACQLYGLLGGIFGFMSINTMAMISIDRYNVIGRPMAASKKMSHRRAFL
+28== L-KKWI--FGFAACKVYGFIGGIFGFMSIMTMAMISIDRYNVIGRPMAASKKMSHRRAFI
+29== IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+30== IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+31=p IGGKWI--FGHFFCNVFIAMDVMCCTASIMTLCVISIDRYLGITRPLTYPVRQNGKCMAK
+32== L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+33=p L-NKWT--LGQVTCDLFIALDVLCCTSSILHLCAIALDRYWAITDPIDYVNKRTPRRAAA
+34== S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+35=p S-KVWF--LHSEVCDMWISVDVLCCTASILHLVAIAMDRYWAVTS-IDYIRRRSARRILL
+36== V-QRWT--LGPELCDMWTSGDVLCCTASILHLVAIALDRYWAVTN-IDYIHASTAKRVGM
+ : : * : : :*: : :
-1== ICKPMGN-FRFGNTHAIMGVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPD
-2== VCKPMSN-FRFGENHAIMGVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGID
-3== VCKPMGN-FRFSATHAMMGIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPD
-4=p VCKPMGS-FKFSSSHAFAGIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPD
-5=p VCKPMGS-FKFSSTHASAGIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPD
-6== ICKPLGN-FTFKTPHAIAGCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPD
-7== ICKPFGN-FRFSSKHALTVVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPD
-8=opsin, VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-9== VCKPFGN-VRFDAKLAIVGIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-10== VCKPFGN-VRFDAKLAIVGIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-11== VCKPFGN-IKFDSKLAIIGIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPD
-12== VCKPFGN-IKFDGKLAVAGILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPD
-13== VCKPLGD-FQFQRRHAVSGCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPN
-14== ITRPMEG--KMTHGKAIAMIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFD
-15== ITRPMEG--KMTHGKAIAMIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFD
-16== ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD
-17== ITKPMNR--NMTFTKAVIMNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFD
-18== ICNGFNG-PKLTTGKAVVFALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYD
-19== ICNGFNG-PKLTQGKATFMCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYD
-20== IVKGMAG-RPMTIPLALGKM---------------------------YVPEGNLTSCGID
-21== IVKGMAG-RPMTIPLALGKIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGID
-22== IVKGMAG-RPMTIPLALGKIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGID
-23== IVKGING-TPMTIKTSIMKILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSID
-24== IVKGING-TPMTIKTSIMKIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSID
-25== IVKGLSG-KPLSINGALIRIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTD
-26== IVRGMAA-APLTHKKATLLLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVD
-27== IGRPMAASKKMSHRRAFLMIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFD
-28== IGRPMAASKKMSHRRAFIMIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFD
-29== ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-30== ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-31=p ITRPLTYPVRQNGKCMAKMILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQD
-32== ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD
-33=p ITDPIDYVNKRTPRRAAALISLTWLIGFLI-SIPPMLG-WRTPEDRSDPDA---CTISKD
-34== VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD
-35=p VTS-IDYIRRRSARRILLMIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQD
-36== VTN-IDYIHASTAKRVGMMIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQD
- : : :
+1== GVAFTWIMALAC-AAPPLVG-W-----SRYIPEGMQCSCGPDYYTLNPNFNNESYVVYMF
+2== GVAFTWVMALAC-AAPPLVG-W-----SRYIPEGMQCSCGIDYYTLKPEVNNESFVIYMF
+3== GIAFTWVMAFSC-AAPPLFG-W-----SRYMPEGMQCSCGPDYYTHNPDYHNESYVLYMF
+4=p GIAFTWVMALAC-AAPPLFG-W-----SRYIPEGMQCSCGPDYYTLNPDYNNESYVIYMF
+5=p GIAFTWVMAMAC-AAPPLVG-W-----SRYIPEGIQCSCGPDYYTLNPEYNNESYVLYMF
+6== GCILPWISALAA-SLPPLFG-W-----SRYIPEGLQCSCGPDWYTTNNKYNNESYVMFLF
+7== VVLATWTIGIGV-SIPPFFG-W-----SRFIPEGLQCSCGPDWYTVGTKYRSESYTWFLF
+8=opsin, GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+9== GIAFSWIWAAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+10== GIAFSWIWSAVW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSYPGVQSYMIVLM
+11== GIVFSWVWAWGW-SAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSVELGCQSFMLTLM
+12== GILFSWLWSCAW-TAPPIFG-W-----SRYWPHGLKTSCGPDVFSGSSDPGVQSYMVVLM
+13== GCAFTWGWALLW-SAPPLLG-W-----SSYVPEGLRTSCGPNWYTGGSNN--NSYILSLF
+14== MIIFIYMYATPW-VVACYTETW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+15== MIIFIYLYATPW-VVACYTESW-----GRFVPEGYLTSCTFDYLT--DNFDTRLFVACIF
+16== MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+17== MNIIIWLYCTPW-VVLPLTQFW-----DRFVPEGYLTSCSFDYLS--DNFDTRLFVGTIF
+18== FALISWVIAIGC-ALPPFFG-W-----GNYILEGILDSCSYDYLT--QDFNTFSYNIFIF
+19== MCGLAWVISVGW-SLPPFFG-W-----GSYTLEGILDSCSYDYFT--RDMNTITYNICIF
+20== KM---------------------------YVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+21== KIAYIWFMSSIW-CLAPAFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+22== KIAYIWFMSTIWCCLAPVFG-W-----SRYVPEGNLTSCGIDYLE--RDWNPRSYLIFYS
+23== KILFIWMMAVFW-TVMPLIG-W-----SAYVPEGNLTACSIDYMT--RMWNPRSYLITYS
+24== KIAFIWMMAVFW-TIMPLIG-W-----SSYVPEGNLTACSIDYMT--RQWNPRSYLITYS
+25== RIIAIWLFSLGW-TIAPMFG-W-----NRYVPEGNMTACGTDYFN--RGLLSASYLVCYG
+26== LLLFVWIWSGGW-TILPFFG-W-----SRYVPEGNLTSCTVDYLT--KDWSSASYVVIYG
+27== MIIFVWMWSIVW-SVGPVFN-W-----GAYVPEGILTSCSFDYLS--TDPSTRSFILCMY
+28== MIIFVWLWSVLW-AIGPIFG-W-----GAYTLEGVLCNCSFDYIS--RDSTTRSNILCMF
+29== MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+30== MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+31=p MILSVWLLSASI-TLPPLFG-W-----AQNVNDDKVCLISQDF----------GYTIYST
+32== LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+33=p LISLTWLIGFLI-SIPPMLG-WRTPEDRSDPD---ACTISKDH----------GYTIYST
+34== MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+35=p MIMVVWIVALFI-SIPPLFG-WRDP--NNDPDKTGTCIISQDK----------GYTIFST
+36== MIACVWTVSFFV-CIAQLLG-WKDPDWNQRVSEDLRCVVSQDV----------GYQIFAT
+ :
-1== YYTLNPNFNNESYVVYMFVVHFLVPFVIIFFCYGRLLCTV----KE--------------
-2== YYTLKPEVNNESFVIYMFVVHFTIPMIVIFFCYGQLVFTV----KE--------------
-3== YYTHNPDYHNESYVLYMFVIHFIIPVVVIFFSYGRLICKV----RE--------------
-4=p YYTLNPDYNNESYVIYMFVCHFILPVAVIFFTYGRLVCTV----KA--------------
-5=p YYTLNPEYNNESYVLYMFICHFILPVTIIFFTYGRLVCTV----KA--------------
-6== WYTTNNKYNNESYVMFLFCFCFAVPFGTIVFCYGQLLITL----KL--------------
-7== WYTVGTKYRSESYTWFLFIFCFIVPLSLICFSYTQLLRAL----KA--------------
-8=opsin, VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA--------------
-9== VFSGSSYPGVQSYMIVLMVTCCITPLSIIVLCYLQVWLAI----RA--------------
-10== VFSGSSYPGVQSYMIVLMVTCCIIPLAIIMLCYLQVWLAI----RA--------------
-11== VFSGSVELGCQSFMLTLMITCCFLPLFIIIVCYLQVWMAI----RA--------------
-12== VFSGSSDPGVQSYMVVLMVTCCFFPLAIIILCYLQVWLAI----RA--------------
-13== WYTGGSNN--NSYILSLFVTCFVLPLSLILFSYTNLLLTL----RA--------------
-14== YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA--------------
-15== YLT--DNFDTRLFVACIFFFSFVCPTTMITYYYSQIVGHVFSHEKA--------------
-16== YLS--DNFDTRLFVGTIFFFSFVCPTLMILYYYSQIVGHVFSHEKA--------------
-17== YLS--DNFDTRLFVGTIFLFSFVVPTLMILYYYSQIVGHVFNHEKA--------------
-18== YLT--QDFNTFSYNIFIFVFDYFLPAAIIVFSYVFIVKAIFAHEAA--------------
-19== YFT--RDMNTITYNICIFIFDFFLPASVIVFSYVFIVKAIFAHEAA--------------
-20== YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-21== YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-22== YLE--RDWNPRSYLIFYSIFVYYIPLFLICYSYWFIIAAVSAHEKA--------------
-23== YMT--RMWNPRSYLITYSLFVYYTPLFLICYSYWFIIAAVAAHEKA--------------
-24== YMT--RQWNPRSYLITYSLFVYYTPLFMICYSYWFIIATVAAHEKA--------------
-25== YFN--RGLLSASYLVCYGIWVYFVPLFLIIYSYWFIIQAVAAHEKN--------------
-26== YLT--KDWSSASYVVIYGLAVYFLPLITMIYCYFFIVHAVAEHEKQ--------------
-27== YLS--TDPSTRSFILCMYFCGFMLPIIIIAFCYFNIVMSVSNHEKE--------------
-28== YIS--RDSTTRSNILCMFILGFFGPILIIFFCYFNIVMSVSNHEKE--------------
-29== F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
-30== F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
-31=p F----------GYTIYSTAVAFYIPMSVMLFMYYQIYKAARKSAAKHKF-----------
-32== H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK--------------
-33=p H----------GYTIYSTFGAFYIPLLLMLVLYGRIFRAARFRIRK--------------
-34== K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE
-35=p K----------GYTIFSTVGAFYLPMLVMMIIYIRIWLVARSRIRKDKFQMTKARLKTEE
-36== V----------GYQIFATASSFYVPVLIILILYWRIYQTARKRIR---------------
- * : * :
+1== VVHFLVPFVIIFFCYGRLLCTV----KEAAAAQQ--------------------------
+2== VVHFTIPMIVIFFCYGQLVFTV----KEAAAQQQ--------------------------
+3== VIHFIIPVVVIFFSYGRLICKV----REAAAQQQ--------------------------
+4=p VCHFILPVAVIFFTYGRLVCTV----KAAAAQQQ--------------------------
+5=p ICHFILPVTIIFFTYGRLVCTV----KAAAAQQQ--------------------------
+6== CFCFAVPFGTIVFCYGQLLITL----KLAAKAQA--------------------------
+7== IFCFIVPLSLICFSYTQLLRAL----KAVAAQQQ--------------------------
+8=opsin, VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
+9== VTCCITPLSIIVLCYLQVWLAI----RAVAKQQK--------------------------
+10== VTCCIIPLAIIMLCYLQVWLAI----RAVAKQQK--------------------------
+11== ITCCFLPLFIIIVCYLQVWMAI----RAVAAQQK--------------------------
+12== VTCCFFPLAIIILCYLQVWLAI----RAVAAQQK--------------------------
+13== VTCFVLPLSLILFSYTNLLLTL----RAAAAQQK--------------------------
+14== FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+15== FFSFVCPTTMITYYYSQIVGHVFSHEKALRDQAKK-------------------------
+16== FFSFVCPTLMILYYYSQIVGHVFSHEKALREQAKK-------------------------
+17== LFSFVVPTLMILYYYSQIVGHVFNHEKALREQAKK-------------------------
+18== VFDYFLPAAIIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+19== IFDFFLPASVIVFSYVFIVKAIFAHEAAMRAQAKK-------------------------
+20== IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+21== IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+22== IFVYYIPLFLICYSYWFIIAAVSAHEKAMREQAKK-------------------------
+23== LFVYYTPLFLICYSYWFIIAAVAAHEKAMREQAKK-------------------------
+24== LFVYYTPLFMICYSYWFIIATVAAHEKAMRDQAKK-------------------------
+25== IWVYFVPLFLIIYSYWFIIQAVAAHEKNMREQAKK-------------------------
+26== LAVYFLPLITMIYCYFFIVHAVAEHEKQLREQAKK-------------------------
+27== FCGFMLPIIIIAFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+28== ILGFFGPILIIFFCYFNIVMSVSNHEKEMAAMAKR-------------------------
+29== AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+30== AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+31=p AVAFYIPMSVMLFMYYQIY-------KAARKSAAKHKF----------------------
+32== FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+33=p FGAFYIPLLLMLVLYGRIF-------RAARFRIRK-------------------------
+34== VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+35=p VGAFYLPMLVMMIIYIRIW-------LVARSRIRKDKFQMTKARLKTEETTLVASPKTEY
+36== ASSFYVPVLIILILYWRIY-------QTARKRIR--------------------------
+ * : * :
-1== ------------------------------------------------------AAAAQQ
-2== ------------------------------------------------------AAAQQQ
-3== ------------------------------------------------------AAAQQQ
-4=p ------------------------------------------------------AAAQQQ
-5=p ------------------------------------------------------AAAQQQ
-6== ------------------------------------------------------AAKAQA
-7== ------------------------------------------------------VAAQQQ
-8=opsin, ------------------------------------------------------VAKQQK
-9== ------------------------------------------------------VAKQQK
-10== ------------------------------------------------------VAKQQK
-11== ------------------------------------------------------VAAQQK
-12== ------------------------------------------------------VAAQQK
-13== ------------------------------------------------------AAAQQK
-14== ------------------------------------------------------LRDQAK
-15== ------------------------------------------------------LRDQAK
-16== ------------------------------------------------------LREQAK
-17== ------------------------------------------------------LREQAK
-18== ------------------------------------------------------MRAQAK
-19== ------------------------------------------------------MRAQAK
-20== ------------------------------------------------------MREQAK
-21== ------------------------------------------------------MREQAK
-22== ------------------------------------------------------MREQAK
-23== ------------------------------------------------------MREQAK
-24== ------------------------------------------------------MRDQAK
-25== ------------------------------------------------------MREQAK
-26== ------------------------------------------------------LREQAK
-27== ------------------------------------------------------MAAMAK
-28== ------------------------------------------------------MAAMAK
-29== --------------------------------------------P----GFPRVEPDSVI
-30== --------------------------------------------P----GFPRVQPESVI
-31=p --------------------------------------------P----GFPRVQPESVI
-32== -------------------------TVKKVEKTGADTRHGASPAP---------QPKKS-
-33=p -------------------------TVRKVEKKGAGTSLGTSSAP---------PPKKS-
-34== TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN
-35=p TTLVASPKTEYSVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENAN
-36== ------------------------------RRRGATARGGVGPPP---------VPAGGA
+1== ------------------------------------------------------------
+2== ------------------------------------------------------------
+3== ------------------------------------------------------------
+4=p ------------------------------------------------------------
+5=p ------------------------------------------------------------
+6== ------------------------------------------------------------
+7== ------------------------------------------------------------
+8=opsin, ------------------------------------------------------------
+9== ------------------------------------------------------------
+10== ------------------------------------------------------------
+11== ------------------------------------------------------------
+12== ------------------------------------------------------------
+13== ------------------------------------------------------------
+14== --------------------------------------------------MN--------
+15== --------------------------------------------------MN--------
+16== --------------------------------------------------MN--------
+17== --------------------------------------------------MN--------
+18== --------------------------------------------------MN--------
+19== --------------------------------------------------MN--------
+20== --------------------------------------------------MN--------
+21== --------------------------------------------------MN--------
+22== --------------------------------------------------MN--------
+23== --------------------------------------------------MN--------
+24== --------------------------------------------------MN--------
+25== --------------------------------------------------MN--------
+26== --------------------------------------------------MN--------
+27== --------------------------------------------------LN--------
+28== --------------------------------------------------LN--------
+29== ---------------------------------PGFPRV----EPDSVIALNG-------
+30== ---------------------------------PGFPRV----QPESVISLNG-------
+31=p ---------------------------------PGFPRV----QPESVISLNG-------
+32== --------------TVKKVEKTGADTRHGASPAPQPKKS-----------VNGESGSR--
+33=p --------------TVRKVEKKGAGTSLGTSSAPPPKKS-----------LNGQPGSG--
+34== SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+35=p SVVSDCNGCNSPDSTTEKKKRRAPFKSYGCSPRPERKKNRAKKLPENANGVNSNSSS---
+36== -------------------RRRGATARGGVGPPP---------VPAGGALVAGGGSGGIA
1== ------------------------------------------------------------
@@ -280,217 +280,179 @@
11== ------------------------------------------------------------
12== ------------------------------------------------------------
13== ------------------------------------------------------------
-14== KMN---------------VESLRS------------------------------------
-15== KMN---------------VDSLRS------------------------------------
-16== KMN---------------VESLRS------------------------------------
-17== KMN---------------VESLRS------------------------------------
-18== KMN---------------VSTLRS------------------------------------
-19== KMN---------------VTNLRS------------------------------------
-20== KMN---------------VKSLRS------------------------------------
-21== KMN---------------VKSLRS------------------------------------
-22== KMN---------------VKSLRS------------------------------------
-23== KMN---------------VKSLRS------------------------------------
-24== KMN---------------VKSLRS------------------------------------
-25== KMN---------------VASLRS------------------------------------
-26== KMN---------------VASLRA------------------------------------
-27== RLN---------------AKELR-------------------------------------
-28== RLN---------------AKELR-------------------------------------
-29== ALNG--------------IVKLQ----------------------KEVEECANLSR----
-30== SLNG--------------VVKLQ----------------------KEVEECANLSR----
-31=p SLNG--------------VVKLQ----------------------KEVEECANLSR----
-32== -VNGESGSRNWRL-----GVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPL
-33=p -LNGQPGSGDWRR-----CAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPL
-34== GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN
-35=p GVNSNSSS----------SERLKQIQIETAEAFANGCAEEASIAMLERQ-CNNGKKISSN
-36== LVAGGGSGGIAAAVVAVIGRPLPTISETTTTGFTNVSSNNTS---PEKQSCANGLEADPP
+14== --VESL------------------------------------------------------
+15== --VDSL------------------------------------------------------
+16== --VESL------------------------------------------------------
+17== --VESL------------------------------------------------------
+18== --VSTL------------------------------------------------------
+19== --VTNL------------------------------------------------------
+20== --VKSL------------------------------------------------------
+21== --VKSL------------------------------------------------------
+22== --VKSL------------------------------------------------------
+23== --VKSL------------------------------------------------------
+24== --VKSL------------------------------------------------------
+25== --VASL------------------------------------------------------
+26== --VASL------------------------------------------------------
+27== --AKEL------------------------------------------------------
+28== --AKEL------------------------------------------------------
+29== --IVKL----------------------QK---------EVEECAN--------------
+30== --VVKL----------------------QK---------EVEECAN--------------
+31=p --VVKL----------------------QK---------EVEECAN--------------
+32== -------NWRLGVESKAGGALCANGAVRQGDDGAALEVIEVHRVGNSKEHLPLPSEAG--
+33=p -------DWRRCAENRAVGTPCTNGAVRQGDDEATLEVIEVHRVGNSKEHLPLPSESG--
+34== -------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+35=p -------SERLKQIQIETAEAFANGCA----EEASIAMLERQ-CNNGKKISSNDTPYS--
+36== AAVVAVIGRPLPTISETTTTGFTNVSS----NNTSP---EKQSCANGLEADPPTTGYGAV
-1== --------------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVA
-2== --------------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVA
-3== --------------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVA
-4=p --------------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVA
-5=p --------------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVA
-6== --------------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFS
-7== --------------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFA
-8=opsin, --------------------ESESTQK------AEKEVTRMVVVMVLAFC----------
-9== --------------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFA
-10== --------------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFA
-11== --------------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFV
-12== --------------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFA
-13== --------------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFA
-14== -------------------NVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMS
-15== -------------------NVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMS
-16== -------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS
-17== -------------------NVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMS
-18== --------------------NEADAQR------AEIRIAKTALVNVSLWFICWTPYALIS
-19== --------------------NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAIT
-20== --------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN
-21== --------------------SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVIN
-22== --------------------SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVIN
-23== --------------------SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVIC
-24== --------------------SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIIC
-25== --------------------SENQNTS------AECKLAKVALMTISLWFMAWTPYLVIN
-26== -------------------NADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIIS
-27== --------------------KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIA
-28== --------------------KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVA
-29== --------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-30== --------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-31=p --------------LLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLS
-32== PSEAG--PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA
-33=p PSESG--SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVA
-34== DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA
-35=p DTPYS-------------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIA
-36== TTGYGAVAAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLA
- * . :
+1== -------------ESASTQK------AEKEVTRMVVLMVIGFLVCWVPYASVAFYIFT-H
+2== -------------ESATTQK------AEKEVTRMVIIMVIFFLICWLPYASVAMYIFT-H
+3== -------------ESATTQK------AEKEVTRMVILMVLGFMLAWTPYAVVAFWIFT-N
+4=p -------------DSASTQK------AEREVTKMVILMVFGFLIAWTPYATVAAWIFF-N
+5=p -------------DSASTQK------AEREVTKMVILMVLGFLVAWTPYATVAAWIFF-N
+6== -------------DSASTQK------AEREVTKMVVVMVLGFLVCWAPYASFSLWIVS-H
+7== -------------ESATTQK------AEREVSRMVVVMVGSFCVCYVPYAAFAMYMVN-N
+8=opsin, -------------ESESTQK------AEKEVTRMVVVMVLAFC-----------------
+9== -------------ESESTQK------AEKEVTRMVVVMVLAFCFCWGPYAFFACFAAA-N
+10== -------------ESESTQK------AEKEVTRMVVVMIFAYCVCWGPYTFFACFAAA-N
+11== -------------ESESTQK------AEREVSRMVVVMIVAFCICWGPYASFVSFAAA-N
+12== -------------ESESTQK------AEKEVSRMVVVMIVAYCFCWGPYTFFACFAAA-N
+13== -------------EADTTQR------AEREVTRMVIVMVMAFLLCWLPYSTFALVVAT-H
+14== ----------RSNVDKNKET------AEIRIAKAAITICFLFFCSWTPYGVMSLIGAF-G
+15== ----------RSNVDKSKEA------AEIRIAKAAITICFLFFASWTPYGVMSLIGAF-G
+16== ----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+17== ----------RSNVDKSKET------AEIRIAKAAITICFLFFVSWTPYGVMSLIGAF-G
+18== ----------RS-NEADAQR------AEIRIAKTALVNVSLWFICWTPYALISLKGVM-G
+19== ----------RS-NEAETQR------AEIRIAKTALVNVSLWFICWTPYAAITIQGLL-G
+20== ----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+21== ----------RS-SEDAEKS------AEGKLAKVALVTITLWFMAWTPYLVINCMGLF-K
+22== ----------RS-SEDADKS------AEGKLAKVALVTISLWFMAWTPYLVINCMGLF-K
+23== ----------RS-SEDCDKS------AEGKLAKVALTTISLWFMAWTPYLVICYFGLF-K
+24== ----------RS-SEDCDKS------AENKLAKVALTTISLWFMAWTPYLIICYFGLF-K
+25== ----------RS-SENQNTS------AECKLAKVALMTISLWFMAWTPYLVINFSGIF-N
+26== ----------RANADQQKQS------AECRLAKVAMMTVGLWFMAWTPYLIISWAGVF-S
+27== ----------R--KAQAGAS------AEMKLAKISMVIITQFMLSWSPYAIIALLAQF-G
+28== ----------R--KAQAGAN------AEMRLAKISIVIVSQFLLSWSPYAVVALLAQF-G
+29== ----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+30== ----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+31=p ----LSRLLKHERKNISIFK------REQKAATTLGIIVGAFTVCWLPFFLLSTARPFIC
+32== PTPCAPASFERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+33=p SNSYAPACLERKNERNAEAKRKMALARERKTVKTLGIIMGTFILCWLPFFIVALVLPF-C
+34== -----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+35=p -----------RTREKLELK------RERKAARTLAIITGAFLICWLPFFIIALIGPF-V
+36== AAAYYPSLVRRKPKEAADSK------RERKAAKTLAIITGAFVACWLPFFVLAILVPT-C
+ * . :
-1== FYIFT-HQGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC------
-2== MYIFT-HQGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC------
-3== FWIFT-NKGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC------
-4=p AWIFF-NKGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC------
-5=p AWIFF-NKGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC------
-6== LWIVS-HRGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC------
-7== MYMVN-NRNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC------
+1== QGS--DFGATFMTLPAFFAKSSALYNPVIYILMNKQFRNCMITTLCC--------GKNPL
+2== QGS--NFGPIFMTLPAFFAKTASIYNPIIYIMMNKQFRNCMLTSLCC--------GKNPL
+3== KGA--DFTATLMAVPAFFSKSSSLYNPIIYVLMNKQFRNCMITTICC--------GKNPF
+4=p KGA--DFSAKFMAIPAFFSKSSALYNPVIYVLLNKQFRNCMLTTIFC--------GKNPL
+5=p KGA--AFSAQFMAIPAFFSKTSALYNPVIYVLLNKQFRSCMLTTLFC--------GKNPL
+6== RGE--EFDLRMATIPSCLSKASTVYNPVIYVLMNKQFRSCMM-KMVC--------GKN-I
+7== RNH--GLDLRLVTIPSFFSKSACIYNPIIYCFMNKQFQACIM-KMVC--------GKA-M
8=opsin, ------------------------------------------------------------
-9== CFAAA-NPGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF-------
-10== CFAAA-NPGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF-------
-11== SFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF-------
-12== CFAAA-NPGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF-------
-13== LVVAT-HKGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY---
-14== LIGAF-GDKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---
-15== LIGAF-GDKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---
-16== LIGAF-GDKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---
-17== LIGAF-GDKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---
-18== LKGVM-GDTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV---
-19== IQGLL-GNAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV---
-20== CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
-21== CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
-22== CMGLF-KF-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF---
-23== YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF---
-24== YFGLF-KI-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC---
-25== FSGIF-NL-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC---
-26== WAGVF-SSGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC---
-27== LLAQF-GPAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQ
-28== LLAQF-GPLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQ
-29== TARPFICGTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------
-30== TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQC------
-31=p TARPFICGTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQC------
-32== LVLPF-CESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------
-33=p LVLPF-CESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKC------
-34== LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------
-35=p LIGPF-VDPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFG------
-36== ILVPT-CDCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCG------
+9== PGY--PFHPLMAALPAFFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+10== PGY--AFHPLMAALPAYFAKSATIYNPVIYVFMNRQFRNCIL-QLF---------GKK-V
+11== PGY--AFHPLAAALPAYFAKSATIYNPVIYVFMNRQFRNCIM-QLF---------GKK-V
+12== PGY--AFHPLAAALPAYFAKSATIYNPIIYVFMNRQFRNCIL-QLF---------GKK-V
+13== KGI--IIQPVLASLPSYFSKTATVYNPIIYVFMNKQFQSCLL-EMLCCGY----QPQR-T
+14== DKT--LLTPGATMIPACACKMVACIDPFVYAISHPRYRMELQKRCPWLAL---------N
+15== DKT--LLTPGATMIPACTCKMVACIDPFVYAISHPRYRMELQKRCPWLAI---------S
+16== DKS--LLTQGATMIPACTCKLVACIDPFVYAISHPRYRLELQKRCPWLGV---------N
+17== DKS--LLTPGATMIPACTCKLVACIEPFVYAISHPRYRMELQKRCPWLGV---------N
+18== DTS--GITPLVSTLPALLAKSCSCYNPFVYAISHPKYRLAITQHLPWFCV------HE-T
+19== NAE--GITPLLTTLPALLAKSCSCYNPFVYAISHPKFRLAITQHLPWFCV------HE-K
+20== F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+21== F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+22== F-E--GLTPLNTIWGACFAKSAACYNPIVYGISHPKYRLALKEKCPCCVF------GK-V
+23== I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPKYRIVLKEKCPMCVF------GN-T
+24== I-D--GLTPLTTIWGATFAKTSAVYNPIVYGISHPNDRLVLKEKCPMCVC------GT-T
+25== L-V--KISPLFTIWGSLFAKANAVYNPIVYGISHPKYRAALFAKFPSLAC-------A-A
+26== SGT--RLTPLATIWGSVFAKANSCYNPIVYGISHPRYKAALYQRFPSLAC------GS-G
+27== PAE--WVTPYAAELPVLFAKASAIHNPIVYSVSHPKFREAIQTTFPWLLTCCQFDEKE-C
+28== PLE--WVTPYAAQLPVMFAKASAIHNPMIYSVSHPKFREAISQTFPWVLTCCQFDDKE-T
+29== GTSCSCIPLWVERTFLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR--
+30== GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRPTSRSLLQCQYR----NINR--
+31=p GTSCSCIPLWVERTCLWLGYANSLINPFIYAFFNRDLRTTYRSLLQCQYR----NINR--
+32== ESSC-HMPTLLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RQ----
+33=p ESSC-HMPALLGAIINWLGYSNSLLNPVIYAYFNKDFQNAFKKIIKCKFC----RR----
+34== DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
+35=p DPE--GIPPFARSFVLWLGYFNSLLNPIIYTIFSPEFRSAFQKILFGKYR----RGHR--
+36== DCE---VSPVLTSLSLWLGYFNSTLNPVIYTVFSPEFRHAFQRLLCGRRV----RRRR--
-1== --GKNPLGDDE--SGASTSKTEVSSVS-TSPVS---------------------------
-2== --GKNPLGDDE--ASATASKTE------TSQVA---------------------------
-3== --GKNPFGDEDVSSTVSQSKTEVSSVS-SSQVS---------------------------
-4=p --GKNPLGDDE-SSTVSTSKTEVSS------VS---------------------------
-5=p --GKNPLGDEE-SSTVSTSKTEVSS------VS---------------------------
-6== --GKN-IEEDE--ASTSSQVTQVSS------VA---------------------------
-7== --GKA-MTDES--DTCSSQKTEVSTVS-STQVG---------------------------
+1== GDDE--SGASTSKTEVSSVS-TSPVSPA--------------------------------
+2== GDDE--ASATASKTE------TSQVAPA--------------------------------
+3== GDEDVSSTVSQSKTEVSSVS-SSQVSPA--------------------------------
+4=p GDDE-SSTVSTSKTEVSS------VSPA--------------------------------
+5=p GDEE-SSTVSTSKTEVSS------VSPA--------------------------------
+6== EEDE--ASTSSQVTQVSS------VAPEK-------------------------------
+7== TDES--DTCSSQKTEVSTVS-STQVGPN--------------------------------
8=opsin, ------------------------------------------------------------
-9== --GKK-VDDGS--ELSSASKTEVSSV---SSVS---------------------------
-10== --GKK-VDDGS--ELSSASKTEVSSV---SSVS---------------------------
-11== --GKK-VDDGS--EASTTSRTEVSSVS-NSSVA---------------------------
-12== --GKK-VDDGS--EVST-SRTEVSSVS-NSSVS---------------------------
-13== -QPQR-TGKAS--PGTPGPHADVTAAGLRNKVM---------------------------
-14== ---NE-KAPES----SAVASTSTTQEPQQTTAA---------------------------
-15== ---SE-KAPES----RAAISTSTTQEQQQTTAA---------------------------
-16== ---NE-KSGEI----SSAQSTTTQEQ-QQTTAA---------------------------
-17== ---NE-KSGEA----SSAQSTTTQEQTQQTSAA---------------------------
-18== ---HE-TETKS-NDDSQSNSTVAQDKA---------------------------------
-19== ---HE-KDPND-VEENQSSNTQTQEKS---------------------------------
-20== ---GK-VDDGK-SSDAQSQATASEAESKA-------------------------------
-21== ---GK-VDDGK-SSDAQSQATASEAESKA-------------------------------
-22== ---GK-VDDGK-SSEAQSQATTSEAESKA-------------------------------
-23== ---GN-TDEPKPDAPASDTETTSEADSKA-------------------------------
-24== ---GT-TDEPKPDAPPSDTETTSEAESKD-------------------------------
-25== ----A-AEPSS-DAVSTTSGTTTVTDNEKSNA----------------------------
-26== ---GS-GESGS-DVKSEASATTTMEEKPKIPEA---------------------------
-27== FDEKE-CEDAN-DAEEEVVASER--GGESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQG
-28== FDDKE-TEDDK-DAETEIPAGESSDAAPSADAAQMKEMMAMMQKMQQQQAAY----PPQG
-29== ---QY-RNINR--KLSAAGMHEALKLAER-------------------------------
-30== ---QY-RNINR--KLSAAGMHEALKLAER-------------------------------
-31=p ---QY-RNINR--KLSAAGMHEALKLAER-------------------------------
-32== ---KF-CRQ---------------------------------------------------
-33=p ---KF-CRR---------------------------------------------------
-34== ---KY-RRGHR-------------------------------------------------
-35=p ---KY-RRGHR-------------------------------------------------
-36== ---RR-VRRRR--A----------------------------------------------
-
-
-1== -----------------------------------PA-----------------------
-2== -----------------------------------PA-----------------------
-3== -----------------------------------PA-----------------------
-4=p -----------------------------------PA-----------------------
-5=p -----------------------------------PA-----------------------
-6== -----------------------------------PEK----------------------
-7== -----------------------------------PN-----------------------
-8=opsin, ------------------------------------------------------------
-9== -----------------------------------PA-----------------------
-10== -----------------------------------PA-----------------------
-11== -----------------------------------PA-----------------------
-12== -----------------------------------PA-----------------------
-13== -----------------------------------PAHPV--------------------
-14== ------------------------------------------------------------
-15== ------------------------------------------------------------
-16== ------------------------------------------------------------
-17== ------------------------------------------------------------
-18== ------------------------------------------------------------
-19== ------------------------------------------------------------
-20== ------------------------------------------------------------
-21== ------------------------------------------------------------
-22== ------------------------------------------------------------
-23== ------------------------------------------------------------
-24== ------------------------------------------------------------
-25== ------------------------------------------------------------
-26== ------------------------------------------------------------
-27== Y--PPQGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAY
-28== YAPPPQGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAY
-29== -----------------------------------PERPEFVL-QNADYCRKKGHDS---
-30== -----------------------------------PERSEFVL-QNSDHCGKKGHDT---
-31=p -----------------------------------PERSEFVL-QNSDHCGKKGHDT---
+9== DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+10== DDGS--ELSSASKTEVSSV---SSVSPA--------------------------------
+11== DDGS--EASTTSRTEVSSVS-NSSVAPA--------------------------------
+12== DDGS--EVST-SRTEVSSVS-NSSVSPA--------------------------------
+13== GKAS--PGTPGPHADVTAAGLRNKVMPAHPV-----------------------------
+14== EKAP--ESSAVASTSTTQEP--QQTTAA--------------------------------
+15== EKAP--ESRAAISTSTTQEQ--QQTTAA--------------------------------
+16== EKSG--EISSAQST-TTQEQ--QQTTAA--------------------------------
+17== EKSG--EASSAQST-TTQEQ-TQQTSAA--------------------------------
+18== ETKS--NDDSQSNSTVAQDK-A--------------------------------------
+19== DPND--VEENQSSNTQTQEK-S--------------------------------------
+20== DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+21== DDGK--SSDAQSQA-TASEA-ESKA-----------------------------------
+22== DDGK--SSEAQSQA-TTSEA-ESKA-----------------------------------
+23== DEPK--PDAPASDTETTSEA-DSKA-----------------------------------
+24== DEPK--PDAPPSDTETTSEA-ESKD-----------------------------------
+25== EPSS--DAVSTTSGTTTVTD-NEKSNA---------------------------------
+26== ESGS--DVKSEASATTTMEE-KPKIPEA--------------------------------
+27== EDAN--DAEEEVVASER--G-GESRDAAQMKEMMAMMQKMQAQQAAYQPPPPPQGY--PP
+28== EDDK--DAETEIPAGESSDA-APSADAAQMKEMMAMMQKMQQQQAAY----PPQGYAPPP
+29== ------KLSAAGMHEALKLAERPERPEF------------VLQNADY-------------
+30== ------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
+31=p ------KLSAAGMHEALKLAERPERSEF------------VLQNSDH-------------
32== ------------------------------------------------------------
33=p ------------------------------------------------------------
34== ------------------------------------------------------------
35=p ------------------------------------------------------------
-36== -----------------------------------PQ-----------------------
+36== ------A---------------PQ------------------------------------
-1== --
-2== --
-3== --
-4=p --
-5=p --
-6== --
-7== --
-8=opsin, --
-9== --
-10== --
-11== --
-12== --
-13== --
-14== --
-15== --
-16== --
-17== --
-18== --
-19== --
-20== --
-21== --
-22== --
-23== --
-24== --
-25== --
-26== --
-27== QA
-28== QA
-29== --
-30== --
-31=p --
-32== --
-33=p --
-34== --
-35=p --
-36== --
-
+1== ---------------------------------------------------------
+2== ---------------------------------------------------------
+3== ---------------------------------------------------------
+4=p ---------------------------------------------------------
+5=p ---------------------------------------------------------
+6== ---------------------------------------------------------
+7== ---------------------------------------------------------
+8=opsin, ---------------------------------------------------------
+9== ---------------------------------------------------------
+10== ---------------------------------------------------------
+11== ---------------------------------------------------------
+12== ---------------------------------------------------------
+13== ---------------------------------------------------------
+14== ---------------------------------------------------------
+15== ---------------------------------------------------------
+16== ---------------------------------------------------------
+17== ---------------------------------------------------------
+18== ---------------------------------------------------------
+19== ---------------------------------------------------------
+20== ---------------------------------------------------------
+21== ---------------------------------------------------------
+22== ---------------------------------------------------------
+23== ---------------------------------------------------------
+24== ---------------------------------------------------------
+25== ---------------------------------------------------------
+26== ---------------------------------------------------------
+27== QGYPPQGAYPPPQGYPPQGYPPQGYPPQGYPPQGAPPQVEAPQGAPPQGVDNQAYQA
+28== QGYPPQGY--PPQGYPPQGYPPQGYPP---PPQGAPPQ-GAPPAAPPQGVDNQAYQA
+29== --------------------------------------------CRKKGHDS-----
+30== --------------------------------------------CGKKGHDT-----
+31=p --------------------------------------------CGKKGHDT-----
+32== ---------------------------------------------------------
+33=p ---------------------------------------------------------
+34== ---------------------------------------------------------
+35=p ---------------------------------------------------------
+36== ---------------------------------------------------------
+