view interproscan5/data-p/__base__.gff3 @ 7:1a4c5ab108fc draft

Uploaded
author mkh
date Fri, 05 Feb 2016 13:08:08 -0500
parents 74cf3f49f10c
children
line wrap: on
line source

##gff-version 3
##feature-ontology http://song.cvs.sourceforge.net/viewvc/song/ontology/sofa.obo?revision=1.269
##sequence-region P00363 1 602
P00363	.	polypeptide	1	602	.	+	.	md5=0d2c0f1acdd08ab0157f2308531a58e4;ID=P00363
P00363	SUPERFAMILY	protein_match	361	415	2.27E-71	+	.	Name=SSF51905;Target=P00363 361 415;status=T;ID=match$1_361_415;Ontology_term="GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR023753"
P00363	SUPERFAMILY	protein_match	2	250	2.27E-71	+	.	Name=SSF51905;Target=P00363 2 250;status=T;ID=match$1_2_250;Ontology_term="GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR023753"
P00363	TIGRFAM	protein_match	7	581	4.7E-250	+	.	Name=TIGR01812;signature_desc=sdhA_frdA_Gneg: succinate dehydrogenase or fumarate reductase, flavoprotein subunit;Target=P00363 7 581;status=T;ID=match$2_7_581;Ontology_term="GO:0016627","GO:0022900","GO:0050660","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR014006"
P00363	Gene3D	protein_match	234	352	3.6E-37	+	.	Name=G3DSA:3.90.700.10;Target=P00363 234 352;status=T;ID=match$3_234_352;date=24-01-2016;Dbxref="InterPro:IPR027477"
P00363	PRINTS	protein_match	375	382	2.5E-5	+	.	Name=PR00411;signature_desc=Pyridine nucleotide disulphide reductase class-I signature;Target=P00363 375 382;status=T;ID=match$4_375_382;date=24-01-2016
P00363	PRINTS	protein_match	7	29	2.5E-5	+	.	Name=PR00411;signature_desc=Pyridine nucleotide disulphide reductase class-I signature;Target=P00363 7 29;status=T;ID=match$4_7_29;date=24-01-2016
P00363	Gene3D	protein_match	426	537	1.5E-38	+	.	Name=G3DSA:1.20.58.100;Target=P00363 426 537;status=T;ID=match$5_426_537;Ontology_term="GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR015939"
P00363	Coils	protein_match	423	443	.	+	.	Name=Coil;Target=P00363 423 443;status=T;ID=match$6_423_443;date=24-01-2016
P00363	Gene3D	protein_match	353	416	5.9E-106	+	.	Name=G3DSA:3.50.50.60;Target=P00363 353 416;status=T;ID=match$7_353_416;Ontology_term="GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR023753"
P00363	Gene3D	protein_match	2	233	5.9E-106	+	.	Name=G3DSA:3.50.50.60;Target=P00363 2 233;status=T;ID=match$7_2_233;Ontology_term="GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR023753"
P00363	PANTHER	protein_match	1	584	0.0	+	.	Name=PTHR11632;Target=P00363 1 584;status=T;ID=match$8_1_584;date=24-01-2016
P00363	SUPERFAMILY	protein_match	444	590	3.01E-46	+	.	Name=SSF46977;Target=P00363 444 590;status=T;ID=match$9_444_590;Ontology_term="GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR015939"
P00363	PANTHER	protein_match	1	584	0.0	+	.	Name=PTHR11632:SF50;Target=P00363 1 584;status=T;ID=match$10_1_584;date=24-01-2016
P00363	PIRSF	protein_match	1	575	2.0E-42	+	.	Name=PIRSF000171;Target=P00363 1 575;status=T;ID=match$11_1_575;date=24-01-2016;Dbxref="InterPro:IPR030664"
P00363	TIGRFAM	protein_match	3	582	0.0	+	.	Name=TIGR01176;signature_desc=fum_red_Fp: fumarate reductase (quinol), flavoprotein subunit;Target=P00363 3 582;status=T;ID=match$12_3_582;Ontology_term="GO:0009061","GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR005884"
P00363	Pfam	protein_match	453	581	7.0E-39	+	.	Name=PF02910;signature_desc=Fumarate reductase flavoprotein C-term;Target=P00363 453 581;status=T;ID=match$13_453_581;Ontology_term="GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR015939"
P00363	Coils	protein_match	473	493	.	+	.	Name=Coil;Target=P00363 473 493;status=T;ID=match$14_473_493;date=24-01-2016
P00363	ProSitePatterns	protein_match	43	52	.	+	.	Name=PS00504;signature_desc=Fumarate reductase / succinate dehydrogenase FAD-binding site.;Target=P00363 43 52;status=T;ID=match$15_43_52;Ontology_term="GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR003952"
P00363	Gene3D	protein_match	543	577	5.5E-18	+	.	Name=G3DSA:4.10.80.40;Target=P00363 543 577;status=T;ID=match$16_543_577;date=24-01-2016
P00363	SUPERFAMILY	protein_match	227	358	6.88E-43	+	.	Name=SSF56425;Target=P00363 227 358;status=T;ID=match$17_227_358;date=24-01-2016;Dbxref="InterPro:IPR027477"
P00363	Pfam	protein_match	7	397	1.1E-115	+	.	Name=PF00890;signature_desc=FAD binding domain;Target=P00363 7 397;status=T;ID=match$18_7_397;date=24-01-2016;Dbxref="InterPro:IPR003953"
P00363	PRINTS	protein_match	8	27	3.0E-10	+	.	Name=PR00368;signature_desc=FAD-dependent pyridine nucleotide reductase signature;Target=P00363 8 27;status=T;ID=match$19_8_27;date=24-01-2016
P00363	PRINTS	protein_match	360	382	3.0E-10	+	.	Name=PR00368;signature_desc=FAD-dependent pyridine nucleotide reductase signature;Target=P00363 360 382;status=T;ID=match$19_360_382;date=24-01-2016
##sequence-region P00350 1 468
P00350	.	polypeptide	1	468	.	+	.	md5=1776f92beb74ff0ccd9ac47a65663644;ID=P00350
P00350	SUPERFAMILY	protein_match	4	173	4.86E-50	+	.	Name=SSF51735;Target=P00350 4 173;status=T;ID=match$20_4_173;date=24-01-2016;Dbxref="InterPro:IPR016040"
P00350	TIGRFAM	protein_match	5	467	1.1E-232	+	.	Name=TIGR00873;signature_desc=gnd: 6-phosphogluconate dehydrogenase (decarboxylating);Target=P00350 5 467;status=T;ID=match$21_5_467;Ontology_term="GO:0004616","GO:0006098","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006113"
P00350	Gene3D	protein_match	1	180	1.9E-61	+	.	Name=G3DSA:3.40.50.720;Target=P00350 1 180;status=T;ID=match$22_1_180;date=24-01-2016;Dbxref="InterPro:IPR016040"
P00350	Pfam	protein_match	3	174	1.8E-52	+	.	Name=PF03446;signature_desc=NAD binding domain of 6-phosphogluconate dehydrogenase;Target=P00350 3 174;status=T;ID=match$23_3_174;Ontology_term="GO:0004616","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006115"
P00350	PIRSF	protein_match	1	468	1.9E-243	+	.	Name=PIRSF000109;Target=P00350 1 468;status=T;ID=match$24_1_468;Ontology_term="GO:0004616","GO:0006098","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006113"
P00350	ProSitePatterns	protein_match	253	265	.	+	.	Name=PS00461;signature_desc=6-phosphogluconate dehydrogenase signature.;Target=P00350 253 265;status=T;ID=match$25_253_265;Ontology_term="GO:0004616","GO:0006098","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006184"
P00350	Gene3D	protein_match	181	433	1.0E-119	+	.	Name=G3DSA:1.10.1040.10;Target=P00350 181 433;status=T;ID=match$26_181_433;Ontology_term="GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR013328"
P00350	Gene3D	protein_match	436	467	1.4E-22	+	.	Name=G3DSA:1.20.5.320;Target=P00350 436 467;status=T;ID=match$27_436_467;date=24-01-2016;Dbxref="InterPro:IPR012284"
P00350	PRINTS	protein_match	249	276	1.521867E-89	+	.	Name=PR00076;signature_desc=6-phosphogluconate dehydrogenase signature;Target=P00350 249 276;status=T;ID=match$28_249_276;Ontology_term="GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006183"
P00350	PRINTS	protein_match	168	196	1.521867E-89	+	.	Name=PR00076;signature_desc=6-phosphogluconate dehydrogenase signature;Target=P00350 168 196;status=T;ID=match$28_168_196;Ontology_term="GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006183"
P00350	PRINTS	protein_match	66	95	1.521867E-89	+	.	Name=PR00076;signature_desc=6-phosphogluconate dehydrogenase signature;Target=P00350 66 95;status=T;ID=match$28_66_95;Ontology_term="GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006183"
P00350	PRINTS	protein_match	119	144	1.521867E-89	+	.	Name=PR00076;signature_desc=6-phosphogluconate dehydrogenase signature;Target=P00350 119 144;status=T;ID=match$28_119_144;Ontology_term="GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006183"
P00350	PRINTS	protein_match	4	27	1.521867E-89	+	.	Name=PR00076;signature_desc=6-phosphogluconate dehydrogenase signature;Target=P00350 4 27;status=T;ID=match$28_4_27;Ontology_term="GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006183"
P00350	PRINTS	protein_match	356	378	1.521867E-89	+	.	Name=PR00076;signature_desc=6-phosphogluconate dehydrogenase signature;Target=P00350 356 378;status=T;ID=match$28_356_378;Ontology_term="GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006183"
P00350	PANTHER	protein_match	1	466	7.6E-305	+	.	Name=PTHR11811:SF25;Target=P00350 1 466;status=T;ID=match$29_1_466;date=24-01-2016
P00350	PANTHER	protein_match	1	466	7.6E-305	+	.	Name=PTHR11811;Target=P00350 1 466;status=T;ID=match$30_1_466;date=24-01-2016
P00350	Pfam	protein_match	179	466	2.0E-132	+	.	Name=PF00393;signature_desc=6-phosphogluconate dehydrogenase, C-terminal domain;Target=P00350 179 466;status=T;ID=match$31_179_466;Ontology_term="GO:0004616","GO:0006098","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006114"
P00350	SUPERFAMILY	protein_match	177	467	6.8E-132	+	.	Name=SSF48179;Target=P00350 177 467;status=T;ID=match$32_177_467;Ontology_term="GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR008927"
##sequence-region P00370 1 447
P00370	.	polypeptide	1	447	.	+	.	md5=9ec8e26fcf5c160f533bf9a69dec0212;ID=P00370
P00370	PRINTS	protein_match	372	383	2.5E-33	+	.	Name=PR00082;signature_desc=Glutamate/leucine/phenylalanine/valine dehydrogenase signature;Target=P00370 372 383;status=T;ID=match$33_372_383;Ontology_term="GO:0006520","GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006095"
P00370	PRINTS	protein_match	114	128	2.5E-33	+	.	Name=PR00082;signature_desc=Glutamate/leucine/phenylalanine/valine dehydrogenase signature;Target=P00370 114 128;status=T;ID=match$33_114_128;Ontology_term="GO:0006520","GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006095"
P00370	PRINTS	protein_match	235	255	2.5E-33	+	.	Name=PR00082;signature_desc=Glutamate/leucine/phenylalanine/valine dehydrogenase signature;Target=P00370 235 255;status=T;ID=match$33_235_255;Ontology_term="GO:0006520","GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006095"
P00370	PRINTS	protein_match	193	215	2.5E-33	+	.	Name=PR00082;signature_desc=Glutamate/leucine/phenylalanine/valine dehydrogenase signature;Target=P00370 193 215;status=T;ID=match$33_193_215;Ontology_term="GO:0006520","GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006095"
P00370	SUPERFAMILY	protein_match	6	196	6.72E-74	+	.	Name=SSF53223;Target=P00370 6 196;status=T;ID=match$34_6_196;date=24-01-2016
P00370	Gene3D	protein_match	68	188	1.0E-60	+	.	Name=G3DSA:3.40.192.10;Target=P00370 68 188;status=T;ID=match$35_68_188;date=24-01-2016
P00370	Pfam	protein_match	202	445	1.3E-87	+	.	Name=PF00208;signature_desc=Glutamate/Leucine/Phenylalanine/Valine dehydrogenase;Target=P00370 202 445;status=T;ID=match$36_202_445;Ontology_term="GO:0006520","GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006096"
P00370	PIRSF	protein_match	22	447	1.8E-114	+	.	Name=PIRSF000185;Target=P00370 22 447;status=T;ID=match$37_22_447;Ontology_term="GO:0016639","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR014362"
P00370	SMART	protein_match	204	445	2.0E-93	+	.	Name=SM00839;signature_desc=Glutamate/Leucine/Phenylalanine/Valine dehydrogenase;Target=P00370 204 445;status=T;ID=match$38_204_445;Ontology_term="GO:0006520","GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006096"
P00370	Gene3D	protein_match	209	372	1.6E-63	+	.	Name=G3DSA:3.40.50.720;Target=P00370 209 372;status=T;ID=match$39_209_372;date=24-01-2016;Dbxref="InterPro:IPR016040"
P00370	SUPERFAMILY	protein_match	202	446	4.96E-77	+	.	Name=SSF51735;Target=P00370 202 446;status=T;ID=match$40_202_446;date=24-01-2016;Dbxref="InterPro:IPR016040"
P00370	Gene3D	protein_match	7	67	8.2E-28	+	.	Name=G3DSA:1.10.285.10;Target=P00370 7 67;status=T;ID=match$41_7_67;date=24-01-2016
P00370	Gene3D	protein_match	373	446	2.0E-26	+	.	Name=G3DSA:1.10.285.10;Target=P00370 373 446;status=T;ID=match$41_373_446;date=24-01-2016
P00370	ProSitePatterns	protein_match	122	135	.	+	.	Name=PS00074;signature_desc=Glu / Leu / Phe / Val dehydrogenases active site.;Target=P00370 122 135;status=T;ID=match$42_122_135;Ontology_term="GO:0006520","GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006095"
P00370	Pfam	protein_match	57	184	6.3E-49	+	.	Name=PF02812;signature_desc=Glu/Leu/Phe/Val dehydrogenase, dimerisation domain;Target=P00370 57 184;status=T;ID=match$43_57_184;Ontology_term="GO:0006520","GO:0016491","GO:0055114";date=24-01-2016;Dbxref="InterPro:IPR006097"
P00370	PANTHER	protein_match	1	447	3.2E-250	+	.	Name=PTHR11606;Target=P00370 1 447;status=T;ID=match$44_1_447;date=24-01-2016
P00370	PANTHER	protein_match	1	447	3.2E-250	+	.	Name=PTHR11606:SF4;Target=P00370 1 447;status=T;ID=match$45_1_447;date=24-01-2016
##sequence-region C1P5Z7 1 43
C1P5Z7	.	polypeptide	1	43	.	+	.	md5=abfa044baa298f169ea62ac6b48e1185;ID=C1P5Z7
C1P5Z7	Pfam	protein_match	2	37	1.0E-11	+	.	Name=PF15894;signature_desc=Inhibitor of glucose uptake transporter SgrT;Target=C1P5Z7 2 37;status=T;ID=match$46_2_37;Ontology_term="GO:0046325";date=24-01-2016;Dbxref="InterPro:IPR031767"
##FASTA
>C1P5Z7
MRQFYQHYFTATAKLCWLRWLSVPQRLTMLEGLMQWDDRNSES
>P00350
MSKQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIAENPGKKLVPYYTVKEF
VESLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGNTFFQDTIRRNRELSAEGF
NFIGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIAAVAEDGEPCVTYIGADGAGH
YVKMVHNGIEYGDMQLIAEAYSLLKGGLNLTNEELAQTFTEWNNGELSSYLIDITKDIFT
KKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEPLSLITESVFARYISSLKDQRVAAS
KVLSGPQAQPAGDKAEFIEKVRRALYLGKIVSYAQGFSQLRAASEEYNWDLNYGEIAKIF
RAGCIIRAQFLQKITDAYAENPQIANLLLAPYFKQIADDYQQALRDVVAYAVQNGIPVPT
FSAAVAYYDSYRAAVLPANLIQAQRDYFGAHTYKRIDKEGVFHTEWLD
>P00363
MQTFQADLAIVGAGGAGLRAAIAAAQANPNAKIALISKVYPMRSHTVAAEGGSAAVAQDH
DSFEYHFHDTVAGGDWLCEQDVVDYFVHHCPTEMTQLELWGCPWSRRPDGSVNVRRFGGM
KIERTWFAADKTGFHMLHTLFQTSLQFPQIQRFDEHFVLDILVDDGHVRGLVAMNMMEGT
LVQIRANAVVMATGGAGRVYRYNTNGGIVTGDGMGMALSHGVPLRDMEFVQYHPTGLPGS
GILMTEGCRGEGGILVNKNGYRYLQDYGMGPETPLGEPKNKYMELGPRDKVSQAFWHEWR
KGNTISTPRGDVVYLDLRHLGEKKLHERLPFICELAKAYVGVDPVKEPIPVRPTAHYTMG
GIETDQNCETRIKGLFAVGECSSVGLHGANRLGSNSLAELVVFGRLAGEQATERAATAGN
GNEAAIEAQAAGVEQRLKDLVNQDGGENWAKIRDEMGLAMEEGCGIYRTPELMQKTIDKL
AELQERFKRVRITDTSSVFNTDLLYTIELGHGLNVAECMAHSAMARKESRGAHQRLDEGC
TERDDVNFLKHTLAFRDADGTTRLEYSDVKITTLPPAKRVYGGEADAADKAEAANKKEKA
NG
>P00370
MDQTYSLESFLNHVQKRDPNQTEFAQAVREVMTTLWPFLEQNPKYRQMSLLERLVEPERV
IQFRVVWVDDRNQIQVNRAWRVQFSSAIGPYKGGMRFHPSVNLSILKFLGFEQTFKNALT
TLPMGGGKGGSDFDPKGKSEGEVMRFCQALMTELYRHLGADTDVPAGDIGVGGREVGFMA
GMMKKLSNNTACVFTGKGLSFGGSLIRPEATGYGLVYFTEAMLKRHGMGFEGMRVSVSGS
GNVAQYAIEKAMEFGARVITASDSSGTVVDESGFTKEKLARLIEIKASRDGRVADYAKEF
GLVYLEGQQPWSLPVDIALPCATQNELDVDAAHQLIANGVKAVAEGANMPTTIEATELFQ
QAGVLFAPGKAANAGGVATSGLEMAQNAARLGWKAEKVDARLHHIMLDIHHACVEHGGEG
EQTNYVQGANIAGFVKVADAMLAQGVI
>match$1_2_250
QTFQADLAIVGAGGAGLRAAIAAAQANPNAKIALISKVYPMRSHTVAAEGGSAAVAQDHD
SFEYHFHDTVAGGDWLCEQDVVDYFVHHCPTEMTQLELWGCPWSRRPDGSVNVRRFGGMK
IERTWFAADKTGFHMLHTLFQTSLQFPQIQRFDEHFVLDILVDDGHVRGLVAMNMMEGTL
VQIRANAVVMATGGAGRVYRYNTNGGIVTGDGMGMALSHGVPLRDMEFVQYHPTGLPGSG
ILMTEGCRG
>match$1_361_415
GIETDQNCETRIKGLFAVGECSSVGLHGANRLGSNSLAELVVFGRLAGEQATERA
>match$2_7_581
DLAIVGAGGAGLRAAIAAAQANPNAKIALISKVYPMRSHTVAAEGGSAAVAQDHDSFEYH
FHDTVAGGDWLCEQDVVDYFVHHCPTEMTQLELWGCPWSRRPDGSVNVRRFGGMKIERTW
FAADKTGFHMLHTLFQTSLQFPQIQRFDEHFVLDILVDDGHVRGLVAMNMMEGTLVQIRA
NAVVMATGGAGRVYRYNTNGGIVTGDGMGMALSHGVPLRDMEFVQYHPTGLPGSGILMTE
GCRGEGGILVNKNGYRYLQDYGMGPETPLGEPKNKYMELGPRDKVSQAFWHEWRKGNTIS
TPRGDVVYLDLRHLGEKKLHERLPFICELAKAYVGVDPVKEPIPVRPTAHYTMGGIETDQ
NCETRIKGLFAVGECSSVGLHGANRLGSNSLAELVVFGRLAGEQATERAATAGNGNEAAI
EAQAAGVEQRLKDLVNQDGGENWAKIRDEMGLAMEEGCGIYRTPELMQKTIDKLAELQER
FKRVRITDTSSVFNTDLLYTIELGHGLNVAECMAHSAMARKESRGAHQRLDEGCTERDDV
NFLKHTLAFRDADGTTRLEYSDVKITTLPPAKRVY
>match$3_234_352
PTGLPGSGILMTEGCRGEGGILVNKNGYRYLQDYGMGPETPLGEPKNKYMELGPRDKVSQ
AFWHEWRKGNTISTPRGDVVYLDLRHLGEKKLHERLPFICELAKAYVGVDPVKEPIPVR
>match$4_7_29
DLAIVGAGGAGLRAAIAAAQANP
>match$4_375_382
LFAVGECS
>match$5_426_537
IEAQAAGVEQRLKDLVNQDGGENWAKIRDEMGLAMEEGCGIYRTPELMQKTIDKLAELQE
RFKRVRITDTSSVFNTDLLYTIELGHGLNVAECMAHSAMARKESRGAHQRLD
>match$6_423_443
EAAIEAQAAGVEQRLKDLVNQ
>match$7_2_233
QTFQADLAIVGAGGAGLRAAIAAAQANPNAKIALISKVYPMRSHTVAAEGGSAAVAQDHD
SFEYHFHDTVAGGDWLCEQDVVDYFVHHCPTEMTQLELWGCPWSRRPDGSVNVRRFGGMK
IERTWFAADKTGFHMLHTLFQTSLQFPQIQRFDEHFVLDILVDDGHVRGLVAMNMMEGTL
VQIRANAVVMATGGAGRVYRYNTNGGIVTGDGMGMALSHGVPLRDMEFVQYH
>match$7_353_416
PTAHYTMGGIETDQNCETRIKGLFAVGECSSVGLHGANRLGSNSLAELVVFGRLAGEQAT
ERAA
>match$8_1_584
MQTFQADLAIVGAGGAGLRAAIAAAQANPNAKIALISKVYPMRSHTVAAEGGSAAVAQDH
DSFEYHFHDTVAGGDWLCEQDVVDYFVHHCPTEMTQLELWGCPWSRRPDGSVNVRRFGGM
KIERTWFAADKTGFHMLHTLFQTSLQFPQIQRFDEHFVLDILVDDGHVRGLVAMNMMEGT
LVQIRANAVVMATGGAGRVYRYNTNGGIVTGDGMGMALSHGVPLRDMEFVQYHPTGLPGS
GILMTEGCRGEGGILVNKNGYRYLQDYGMGPETPLGEPKNKYMELGPRDKVSQAFWHEWR
KGNTISTPRGDVVYLDLRHLGEKKLHERLPFICELAKAYVGVDPVKEPIPVRPTAHYTMG
GIETDQNCETRIKGLFAVGECSSVGLHGANRLGSNSLAELVVFGRLAGEQATERAATAGN
GNEAAIEAQAAGVEQRLKDLVNQDGGENWAKIRDEMGLAMEEGCGIYRTPELMQKTIDKL
AELQERFKRVRITDTSSVFNTDLLYTIELGHGLNVAECMAHSAMARKESRGAHQRLDEGC
TERDDVNFLKHTLAFRDADGTTRLEYSDVKITTLPPAKRVYGGE
>match$9_444_590
DGGENWAKIRDEMGLAMEEGCGIYRTPELMQKTIDKLAELQERFKRVRITDTSSVFNTDL
LYTIELGHGLNVAECMAHSAMARKESRGAHQRLDEGCTERDDVNFLKHTLAFRDADGTTR
LEYSDVKITTLPPAKRVYGGEADAADK
>match$10_1_584
MQTFQADLAIVGAGGAGLRAAIAAAQANPNAKIALISKVYPMRSHTVAAEGGSAAVAQDH
DSFEYHFHDTVAGGDWLCEQDVVDYFVHHCPTEMTQLELWGCPWSRRPDGSVNVRRFGGM
KIERTWFAADKTGFHMLHTLFQTSLQFPQIQRFDEHFVLDILVDDGHVRGLVAMNMMEGT
LVQIRANAVVMATGGAGRVYRYNTNGGIVTGDGMGMALSHGVPLRDMEFVQYHPTGLPGS
GILMTEGCRGEGGILVNKNGYRYLQDYGMGPETPLGEPKNKYMELGPRDKVSQAFWHEWR
KGNTISTPRGDVVYLDLRHLGEKKLHERLPFICELAKAYVGVDPVKEPIPVRPTAHYTMG
GIETDQNCETRIKGLFAVGECSSVGLHGANRLGSNSLAELVVFGRLAGEQATERAATAGN
GNEAAIEAQAAGVEQRLKDLVNQDGGENWAKIRDEMGLAMEEGCGIYRTPELMQKTIDKL
AELQERFKRVRITDTSSVFNTDLLYTIELGHGLNVAECMAHSAMARKESRGAHQRLDEGC
TERDDVNFLKHTLAFRDADGTTRLEYSDVKITTLPPAKRVYGGE
>match$11_1_575
MQTFQADLAIVGAGGAGLRAAIAAAQANPNAKIALISKVYPMRSHTVAAEGGSAAVAQDH
DSFEYHFHDTVAGGDWLCEQDVVDYFVHHCPTEMTQLELWGCPWSRRPDGSVNVRRFGGM
KIERTWFAADKTGFHMLHTLFQTSLQFPQIQRFDEHFVLDILVDDGHVRGLVAMNMMEGT
LVQIRANAVVMATGGAGRVYRYNTNGGIVTGDGMGMALSHGVPLRDMEFVQYHPTGLPGS
GILMTEGCRGEGGILVNKNGYRYLQDYGMGPETPLGEPKNKYMELGPRDKVSQAFWHEWR
KGNTISTPRGDVVYLDLRHLGEKKLHERLPFICELAKAYVGVDPVKEPIPVRPTAHYTMG
GIETDQNCETRIKGLFAVGECSSVGLHGANRLGSNSLAELVVFGRLAGEQATERAATAGN
GNEAAIEAQAAGVEQRLKDLVNQDGGENWAKIRDEMGLAMEEGCGIYRTPELMQKTIDKL
AELQERFKRVRITDTSSVFNTDLLYTIELGHGLNVAECMAHSAMARKESRGAHQRLDEGC
TERDDVNFLKHTLAFRDADGTTRLEYSDVKITTLP
>match$12_3_582
TFQADLAIVGAGGAGLRAAIAAAQANPNAKIALISKVYPMRSHTVAAEGGSAAVAQDHDS
FEYHFHDTVAGGDWLCEQDVVDYFVHHCPTEMTQLELWGCPWSRRPDGSVNVRRFGGMKI
ERTWFAADKTGFHMLHTLFQTSLQFPQIQRFDEHFVLDILVDDGHVRGLVAMNMMEGTLV
QIRANAVVMATGGAGRVYRYNTNGGIVTGDGMGMALSHGVPLRDMEFVQYHPTGLPGSGI
LMTEGCRGEGGILVNKNGYRYLQDYGMGPETPLGEPKNKYMELGPRDKVSQAFWHEWRKG
NTISTPRGDVVYLDLRHLGEKKLHERLPFICELAKAYVGVDPVKEPIPVRPTAHYTMGGI
ETDQNCETRIKGLFAVGECSSVGLHGANRLGSNSLAELVVFGRLAGEQATERAATAGNGN
EAAIEAQAAGVEQRLKDLVNQDGGENWAKIRDEMGLAMEEGCGIYRTPELMQKTIDKLAE
LQERFKRVRITDTSSVFNTDLLYTIELGHGLNVAECMAHSAMARKESRGAHQRLDEGCTE
RDDVNFLKHTLAFRDADGTTRLEYSDVKITTLPPAKRVYG
>match$13_453_581
RDEMGLAMEEGCGIYRTPELMQKTIDKLAELQERFKRVRITDTSSVFNTDLLYTIELGHG
LNVAECMAHSAMARKESRGAHQRLDEGCTERDDVNFLKHTLAFRDADGTTRLEYSDVKIT
TLPPAKRVY
>match$14_473_493
MQKTIDKLAELQERFKRVRIT
>match$15_43_52
RSHTVAAEGG
>match$16_543_577
RDDVNFLKHTLAFRDADGTTRLEYSDVKITTLPPA
>match$17_227_358
MEFVQYHPTGLPGSGILMTEGCRGEGGILVNKNGYRYLQDYGMGPETPLGEPKNKYMELG
PRDKVSQAFWHEWRKGNTISTPRGDVVYLDLRHLGEKKLHERLPFICELAKAYVGVDPVK
EPIPVRPTAHYT
>match$18_7_397
DLAIVGAGGAGLRAAIAAAQANPNAKIALISKVYPMRSHTVAAEGGSAAVAQDHDSFEYH
FHDTVAGGDWLCEQDVVDYFVHHCPTEMTQLELWGCPWSRRPDGSVNVRRFGGMKIERTW
FAADKTGFHMLHTLFQTSLQFPQIQRFDEHFVLDILVDDGHVRGLVAMNMMEGTLVQIRA
NAVVMATGGAGRVYRYNTNGGIVTGDGMGMALSHGVPLRDMEFVQYHPTGLPGSGILMTE
GCRGEGGILVNKNGYRYLQDYGMGPETPLGEPKNKYMELGPRDKVSQAFWHEWRKGNTIS
TPRGDVVYLDLRHLGEKKLHERLPFICELAKAYVGVDPVKEPIPVRPTAHYTMGGIETDQ
NCETRIKGLFAVGECSSVGLHGANRLGSNSL
>match$19_8_27
LAIVGAGGAGLRAAIAAAQA
>match$19_360_382
GGIETDQNCETRIKGLFAVGECS
>match$20_4_173
QQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIAENPGKKLVPYYTVKEFVES
LETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGNTFFQDTIRRNRELSAEGFNFI
GTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIAAVAEDGEPCVTYI
>match$21_5_467
QIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIAENPGKKLVPYYTVKEFVESL
ETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGNTFFQDTIRRNRELSAEGFNFIG
TGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIAAVAEDGEPCVTYIGADGAGHYVKM
VHNGIEYGDMQLIAEAYSLLKGGLNLTNEELAQTFTEWNNGELSSYLIDITKDIFTKKDE
DGNYLVDVILDEAANKGTGKWTSQSALDLGEPLSLITESVFARYISSLKDQRVAASKVLS
GPQAQPAGDKAEFIEKVRRALYLGKIVSYAQGFSQLRAASEEYNWDLNYGEIAKIFRAGC
IIRAQFLQKITDAYAENPQIANLLLAPYFKQIADDYQQALRDVVAYAVQNGIPVPTFSAA
VAYYDSYRAAVLPANLIQAQRDYFGAHTYKRIDKEGVFHTEWL
>match$22_1_180
MSKQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIAENPGKKLVPYYTVKEF
VESLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGNTFFQDTIRRNRELSAEGF
NFIGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIAAVAEDGEPCVTYIGADGAGH
>match$23_3_174
KQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIAENPGKKLVPYYTVKEFVE
SLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGNTFFQDTIRRNRELSAEGFNF
IGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIAAVAEDGEPCVTYIG
>match$24_1_468
MSKQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIAENPGKKLVPYYTVKEF
VESLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGNTFFQDTIRRNRELSAEGF
NFIGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIAAVAEDGEPCVTYIGADGAGH
YVKMVHNGIEYGDMQLIAEAYSLLKGGLNLTNEELAQTFTEWNNGELSSYLIDITKDIFT
KKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEPLSLITESVFARYISSLKDQRVAAS
KVLSGPQAQPAGDKAEFIEKVRRALYLGKIVSYAQGFSQLRAASEEYNWDLNYGEIAKIF
RAGCIIRAQFLQKITDAYAENPQIANLLLAPYFKQIADDYQQALRDVVAYAVQNGIPVPT
FSAAVAYYDSYRAAVLPANLIQAQRDYFGAHTYKRIDKEGVFHTEWLD
>match$25_253_265
ILDEAANKGTGKW
>match$26_181_433
YVKMVHNGIEYGDMQLIAEAYSLLKGGLNLTNEELAQTFTEWNNGELSSYLIDITKDIFT
KKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEPLSLITESVFARYISSLKDQRVAAS
KVLSGPQAQPAGDKAEFIEKVRRALYLGKIVSYAQGFSQLRAASEEYNWDLNYGEIAKIF
RAGCIIRAQFLQKITDAYAENPQIANLLLAPYFKQIADDYQQALRDVVAYAVQNGIPVPT
FSAAVAYYDSYRA
>match$27_436_467
LPANLIQAQRDYFGAHTYKRIDKEGVFHTEWL
>match$28_4_27
QQIGVVGMAVMGRNLALNIESRGY
>match$28_66_95
TPRRILLMVKAGAGTDAAIDSLKPYLDKGD
>match$28_119_144
GFNFIGTGVSGGEEGALKGPSIMPGG
>match$28_168_196
PCVTYIGADGAGHYVKMVHNGIEYGDMQL
>match$28_249_276
LVDVILDEAANKGTGKWTSQSALDLGEP
>match$28_356_378
IAKIFRAGCIIRAQFLQKITDAY
>match$29_1_466
MSKQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIAENPGKKLVPYYTVKEF
VESLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGNTFFQDTIRRNRELSAEGF
NFIGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIAAVAEDGEPCVTYIGADGAGH
YVKMVHNGIEYGDMQLIAEAYSLLKGGLNLTNEELAQTFTEWNNGELSSYLIDITKDIFT
KKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEPLSLITESVFARYISSLKDQRVAAS
KVLSGPQAQPAGDKAEFIEKVRRALYLGKIVSYAQGFSQLRAASEEYNWDLNYGEIAKIF
RAGCIIRAQFLQKITDAYAENPQIANLLLAPYFKQIADDYQQALRDVVAYAVQNGIPVPT
FSAAVAYYDSYRAAVLPANLIQAQRDYFGAHTYKRIDKEGVFHTEW
>match$30_1_466
MSKQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIAENPGKKLVPYYTVKEF
VESLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGNTFFQDTIRRNRELSAEGF
NFIGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIAAVAEDGEPCVTYIGADGAGH
YVKMVHNGIEYGDMQLIAEAYSLLKGGLNLTNEELAQTFTEWNNGELSSYLIDITKDIFT
KKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEPLSLITESVFARYISSLKDQRVAAS
KVLSGPQAQPAGDKAEFIEKVRRALYLGKIVSYAQGFSQLRAASEEYNWDLNYGEIAKIF
RAGCIIRAQFLQKITDAYAENPQIANLLLAPYFKQIADDYQQALRDVVAYAVQNGIPVPT
FSAAVAYYDSYRAAVLPANLIQAQRDYFGAHTYKRIDKEGVFHTEW
>match$31_179_466
GHYVKMVHNGIEYGDMQLIAEAYSLLKGGLNLTNEELAQTFTEWNNGELSSYLIDITKDI
FTKKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEPLSLITESVFARYISSLKDQRVA
ASKVLSGPQAQPAGDKAEFIEKVRRALYLGKIVSYAQGFSQLRAASEEYNWDLNYGEIAK
IFRAGCIIRAQFLQKITDAYAENPQIANLLLAPYFKQIADDYQQALRDVVAYAVQNGIPV
PTFSAAVAYYDSYRAAVLPANLIQAQRDYFGAHTYKRIDKEGVFHTEW
>match$32_177_467
GAGHYVKMVHNGIEYGDMQLIAEAYSLLKGGLNLTNEELAQTFTEWNNGELSSYLIDITK
DIFTKKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEPLSLITESVFARYISSLKDQR
VAASKVLSGPQAQPAGDKAEFIEKVRRALYLGKIVSYAQGFSQLRAASEEYNWDLNYGEI
AKIFRAGCIIRAQFLQKITDAYAENPQIANLLLAPYFKQIADDYQQALRDVVAYAVQNGI
PVPTFSAAVAYYDSYRAAVLPANLIQAQRDYFGAHTYKRIDKEGVFHTEWL
>match$33_114_128
TFKNALTTLPMGGGK
>match$33_193_215
VFTGKGLSFGGSLIRPEATGYGL
>match$33_235_255
VSVSGSGNVAQYAIEKAMEFG
>match$33_372_383
ANAGGVATSGLE
>match$34_6_196
SLESFLNHVQKRDPNQTEFAQAVREVMTTLWPFLEQNPKYRQMSLLERLVEPERVIQFRV
VWVDDRNQIQVNRAWRVQFSSAIGPYKGGMRFHPSVNLSILKFLGFEQTFKNALTTLPMG
GGKGGSDFDPKGKSEGEVMRFCQALMTELYRHLGADTDVPAGDIGVGGREVGFMAGMMKK
LSNNTACVFTG
>match$35_68_188
VDDRNQIQVNRAWRVQFSSAIGPYKGGMRFHPSVNLSILKFLGFEQTFKNALTTLPMGGG
KGGSDFDPKGKSEGEVMRFCQALMTELYRHLGADTDVPAGDIGVGGREVGFMAGMMKKLS
N
>match$36_202_445
GGSLIRPEATGYGLVYFTEAMLKRHGMGFEGMRVSVSGSGNVAQYAIEKAMEFGARVITA
SDSSGTVVDESGFTKEKLARLIEIKASRDGRVADYAKEFGLVYLEGQQPWSLPVDIALPC
ATQNELDVDAAHQLIANGVKAVAEGANMPTTIEATELFQQAGVLFAPGKAANAGGVATSG
LEMAQNAARLGWKAEKVDARLHHIMLDIHHACVEHGGEGEQTNYVQGANIAGFVKVADAM
LAQG
>match$37_22_447
TEFAQAVREVMTTLWPFLEQNPKYRQMSLLERLVEPERVIQFRVVWVDDRNQIQVNRAWR
VQFSSAIGPYKGGMRFHPSVNLSILKFLGFEQTFKNALTTLPMGGGKGGSDFDPKGKSEG
EVMRFCQALMTELYRHLGADTDVPAGDIGVGGREVGFMAGMMKKLSNNTACVFTGKGLSF
GGSLIRPEATGYGLVYFTEAMLKRHGMGFEGMRVSVSGSGNVAQYAIEKAMEFGARVITA
SDSSGTVVDESGFTKEKLARLIEIKASRDGRVADYAKEFGLVYLEGQQPWSLPVDIALPC
ATQNELDVDAAHQLIANGVKAVAEGANMPTTIEATELFQQAGVLFAPGKAANAGGVATSG
LEMAQNAARLGWKAEKVDARLHHIMLDIHHACVEHGGEGEQTNYVQGANIAGFVKVADAM
LAQGVI
>match$38_204_445
SLIRPEATGYGLVYFTEAMLKRHGMGFEGMRVSVSGSGNVAQYAIEKAMEFGARVITASD
SSGTVVDESGFTKEKLARLIEIKASRDGRVADYAKEFGLVYLEGQQPWSLPVDIALPCAT
QNELDVDAAHQLIANGVKAVAEGANMPTTIEATELFQQAGVLFAPGKAANAGGVATSGLE
MAQNAARLGWKAEKVDARLHHIMLDIHHACVEHGGEGEQTNYVQGANIAGFVKVADAMLA
QG
>match$39_209_372
EATGYGLVYFTEAMLKRHGMGFEGMRVSVSGSGNVAQYAIEKAMEFGARVITASDSSGTV
VDESGFTKEKLARLIEIKASRDGRVADYAKEFGLVYLEGQQPWSLPVDIALPCATQNELD
VDAAHQLIANGVKAVAEGANMPTTIEATELFQQAGVLFAPGKAA
>match$40_202_446
GGSLIRPEATGYGLVYFTEAMLKRHGMGFEGMRVSVSGSGNVAQYAIEKAMEFGARVITA
SDSSGTVVDESGFTKEKLARLIEIKASRDGRVADYAKEFGLVYLEGQQPWSLPVDIALPC
ATQNELDVDAAHQLIANGVKAVAEGANMPTTIEATELFQQAGVLFAPGKAANAGGVATSG
LEMAQNAARLGWKAEKVDARLHHIMLDIHHACVEHGGEGEQTNYVQGANIAGFVKVADAM
LAQGV
>match$41_7_67
LESFLNHVQKRDPNQTEFAQAVREVMTTLWPFLEQNPKYRQMSLLERLVEPERVIQFRVV
W
>match$41_373_446
NAGGVATSGLEMAQNAARLGWKAEKVDARLHHIMLDIHHACVEHGGEGEQTNYVQGANIA
GFVKVADAMLAQGV
>match$42_122_135
LPMGGGKGGSDFDP
>match$43_57_184
PERVIQFRVVWVDDRNQIQVNRAWRVQFSSAIGPYKGGMRFHPSVNLSILKFLGFEQTFK
NALTTLPMGGGKGGSDFDPKGKSEGEVMRFCQALMTELYRHLGADTDVPAGDIGVGGREV
GFMAGMMK
>match$44_1_447
MDQTYSLESFLNHVQKRDPNQTEFAQAVREVMTTLWPFLEQNPKYRQMSLLERLVEPERV
IQFRVVWVDDRNQIQVNRAWRVQFSSAIGPYKGGMRFHPSVNLSILKFLGFEQTFKNALT
TLPMGGGKGGSDFDPKGKSEGEVMRFCQALMTELYRHLGADTDVPAGDIGVGGREVGFMA
GMMKKLSNNTACVFTGKGLSFGGSLIRPEATGYGLVYFTEAMLKRHGMGFEGMRVSVSGS
GNVAQYAIEKAMEFGARVITASDSSGTVVDESGFTKEKLARLIEIKASRDGRVADYAKEF
GLVYLEGQQPWSLPVDIALPCATQNELDVDAAHQLIANGVKAVAEGANMPTTIEATELFQ
QAGVLFAPGKAANAGGVATSGLEMAQNAARLGWKAEKVDARLHHIMLDIHHACVEHGGEG
EQTNYVQGANIAGFVKVADAMLAQGVI
>match$45_1_447
MDQTYSLESFLNHVQKRDPNQTEFAQAVREVMTTLWPFLEQNPKYRQMSLLERLVEPERV
IQFRVVWVDDRNQIQVNRAWRVQFSSAIGPYKGGMRFHPSVNLSILKFLGFEQTFKNALT
TLPMGGGKGGSDFDPKGKSEGEVMRFCQALMTELYRHLGADTDVPAGDIGVGGREVGFMA
GMMKKLSNNTACVFTGKGLSFGGSLIRPEATGYGLVYFTEAMLKRHGMGFEGMRVSVSGS
GNVAQYAIEKAMEFGARVITASDSSGTVVDESGFTKEKLARLIEIKASRDGRVADYAKEF
GLVYLEGQQPWSLPVDIALPCATQNELDVDAAHQLIANGVKAVAEGANMPTTIEATELFQ
QAGVLFAPGKAANAGGVATSGLEMAQNAARLGWKAEKVDARLHHIMLDIHHACVEHGGEG
EQTNYVQGANIAGFVKVADAMLAQGVI
>match$46_2_37
RQFYQHYFTATAKLCWLRWLSVPQRLTMLEGLMQWD