comparison weblogolib/htdocs/examples.html @ 0:c55bdc2fb9fa

Uploaded
author davidmurphy
date Thu, 27 Oct 2011 12:09:09 -0400
parents
children
comparison
equal deleted inserted replaced
-1:000000000000 0:c55bdc2fb9fa
1 <!DOCTYPE HTML PUBLIC "-//W3C//DTD HTML 4.01//EN"
2 "http://www.w3.org/TR/html4/strict.dtd">
3
4 <html>
5 <head>
6 <link rel="stylesheet" type="text/css" href="logo.css" >
7 <title>CodonLogo - Examples</title>
8 <meta name="author" content="Gavin E. Crooks" >
9 <meta name="author" content="Steven E. Brenner" >
10 <meta name="ID" content="$ID:" >
11
12 <style type="text/css">
13 img {
14 display: block;
15 margin-left: auto;
16 margin-right: auto }
17
18 </style>
19 </head>
20
21 <body>
22
23 <table width="80%" border = '0' cellspacing='0' cellpadding='1' align="center">
24 <tr><td >
25 <h1> CodonLogo 1.0: Examples</h1>
26
27 </td><td align = "right">
28 &middot;
29 <a href="./">about</a>&nbsp;&middot;
30 <a href="create.cgi">create</a>&nbsp;&middot;
31 <a class="selected" href="examples.html">examples</a>&nbsp;&middot;
32 <a href="manual.html">manual</a>&nbsp;&middot;
33 <br>
34 &nbsp;
35 </td></tr>
36
37
38 <tr><td colspan="2" class="discourse" >
39
40 <ul>
41 <li> <a href="#CAP">CAP HTH motif</a> </li>
42 <li> <a href="#trans">Transcription Factors</a> </li>
43 <li> <a href="#promoters"><i>E. coli</i> Promoters</a> </li>
44 <li> <a href="#globins">Globins</a> </li>
45 <li> <a href="#HTH">HTH motif</a> </li>
46 <li> <a href="#splice">Splice Signals</a> </li>
47 </ul>
48 <p>
49 The <strong>Edit Logo</strong> buttons will transfer the relevant
50 sequence data to the <a class="in" href="create.cgi">Logo creation form</a>.
51 There you can examine the sequence data and recreate the logo for
52 yourself.
53 <!--Additional examples can be found at the
54 <a href="http://www.lecb.ncifcrf.gov/~toms/sequencelogo.html">Sequence Logo
55 Gallery</a>.-->
56 </p>
57
58
59 <!--<hr >
60 <a name="CAP"></a>
61 <a name="CAP_HTH"></a>
62 <h2>Catabolite Activator Protein (CAP)</h2>
63
64 <img alt="Catabolite Activator Protein (CAP) Logo" src="examples/cap_hth.png">
65 <p>
66 The helix-turn-helix motif from the CAP family of homodimeric DNA
67 binding proteins. CAP (Catabolite Activator Protein, also known as
68 CRP for cAMP Receptor Protein) is a transcription promoter that binds
69 at more than 100 sites within the <i>E.&nbsp;coli</i> genome. Residues 1-7
70 form the first helix, 8-11 the turn and 12-20 form the DNA recognition
71 helix. The glycine at position 9 appears to be
72 critical in forming the turn. Positions 4, 8, 10, 15 and 19 are
73 partially or completely buried, and therefore tend to be populated by
74 hydrophobic amino acids, which are colored black. Positions 11-14, 17
75 and 20 interact directly with bases in the major groove
76 and are critical to the sequence specific binding of the
77 protein. The data for this logo consists of 100 sequences from the
78 full Pfam alignment of this family (Accession number
79 PF00325). A few sequences with rare insertions were removed for
80 convenience.
81 </p>-->
82
83 <!--
84 # Pfam 7.1 crp
85 # Accession number: PF00325
86 # Bacterial regulatory proteins, crp family
87 #
88 # Description
89 # Numerous bacterial transcription regulatory
90 # proteins bind DNA via a helix-turn-helix (HTH)
91 # motif. These proteins are very diverse, but
92 # for convenience may be grouped into subfamilies on
93 # the basis of sequence similarity. One such
94 # family groups together a range of proteins, including
95 # anr, crp, clp, cysR, fixK, flp, fnr, fnrN, hlyX and
96 # ntcA [MEDLINE:91064083], [MEDLINE:93181282],
97 # [MEDLINE:91008963]. Within this family, the HTH motif is situated
98 # towards the C-terminus.
99 # This is the full Pfam alignment, less a couple of inserts
100 # 102 sequences.
101 #
102 # http://pfam.wustl.edu/cgi-bin/getdesc?name=crp
103 #
104 # Introduction to protein structure, 1st edition, contains
105 # some more information.
106 # First sequence number is -5
107 # First Helix: 1-7, Turn: 8-11, 2nd (DNA recognition) 12-20
108 #
109 -->
110
111 <!--
112 <form method="post" action="create.cgi">
113 <input type="submit" name="cmd_edit" value="Edit Logo" >
114 <input type="hidden" name="logo_title" value="The DNA-binding helix-turn-helix motif of the CAP family" >
115 <input type="hidden" name="first_index" value="-5" >
116 <input type="hidden" name="logo_start" value="1" >
117 <input type="hidden" name="logo_end" value="20" >
118 <input type="hidden" name="show_xaxis" value="true" >
119 <input type="hidden" name="show_yaxis" value="true" >
120 <input type="hidden" name="show_errorbars" value="true" >
121 <input type="hidden" name="show_fineprint" value="true" >
122 <input type="hidden" name="scale_width" value="true" >
123 <input type="hidden" name="sequences" value=">Q9EXQ1/196-227
124 LTMT.-RGDIGNYLGLTVETISRLLGRFQKLGVL
125 >Q46158/72-92
126 LTMT.-RGDIGNYLGLTVETISR-----------
127 >Q46157/72-92
128 LTMT.-RGDIGNYLGLTVETISR-----------
129 >Q46159/72-92
130 LTMT.-RGDIGNYLGLTVETISR-----------
131 >Q47948/72-92
132 LTMT.-RGDIGNYLGLTVETISR-----------
133 >FNR_HAEIN/196-227
134 LTMT.-RGDIGNYLGLTVETISRLLGRFQKLGVI
135 >ETRA_SHEPU/193-224
136 LTMT.-RGDIGNYLGLTVETISRLLGRFQKSGLI
137 >FNR_SALTY/193-224
138 LTMT.-RGDIGNYLGLTVETISRLLGRFQKSGML
139 >Q9LA24/207-238
140 LTMT.-RGDIGNYLGLTVETISRLLGRFQKSGML
141 >Q9AQ50/193-224
142 LTMT.-RGDIGNYLGLTVETISRLLGRFQKSGML
143 >FNR_ECOLI/193-224
144 LTMT.-RGDIGNYLGLTVETISRLLGRFQKSGML
145 >HLYX_ACTPL/192-223
146 LTMT.-RGDIGNYLGLTIETISRLLGRFQKSGMI
147 >O31204/192-223
148 LTMT.-RGDIGNYLGLTIETISRLLGRFQKSGMI
149 >Q9L801/192-223
150 LTMT.-RGDIGNYLGLTIETISRLLGRFQKSGMI
151 >Q9KS27/193-224
152 LTMT.-RGDIGNYLGLTVETISRLLGRFQKSEIL
153 >Q9CMY2/212-243
154 LTMT.-RGDIGNYLGLTVETISRLLGRLQKMGIL
155 >Q44500/188-219
156 LAMS.-RNEIGNYLGLAVETVSRVFSRFQQNELI
157 >ANR_PSEAE/188-219
158 LAMS.-RNEIGNYLGLAVETVSRVFTRFQQNGLI
159 >O85222/188-219
160 LSMS.-RNEIGNYLGLAVETVSRVFTRFQQNELI
161 >FNRA_PSEST/188-219
162 LPMS.-RNEIGNYLGLAVETVSRVFTRFQQNGLL
163 >BTR_BORPE/186-217
164 VRMS.-REEIGNYLGLTLETVSRLFSRFGREGLI
165 >Q9JQQ8/187-218
166 LRMS.-REEIGSYLGLKLETVSRTLSKFHQEGLI
167 >O69245/180-211
168 LPMC.-RRDIGDYLGLTLETVSRALSQLHTQGIL
169 >Q9AMR4/161-192
170 LPMS.-RRDIADYLGLTVETVSRAVSQLHTDGVL
171 >FIXK_BRAJA/185-216
172 LPMS.-RQDIADYLGLTIETVSRTFTKLERHGAI
173 >AADR_RHOPA/187-218
174 LPMG.-RQDIADFLGLTIETVSRTFTKLEREKLI
175 >FIXK_RHIME/159-190
176 LPMS.-RQDIADYLGLTIETVSRVVTKLKERSLI
177 >FIXK_AZOCA/196-227
178 LAMS.-RQDIADFLGLTIETVSRTLTYLEEQGTI
179 >Q9AA54/164-195
180 VPMS.-RQDMADYLGLTIETVSRTLTSLQDEGLI
181 >Q988V4/163-194
182 LPMS.-RMDIGDYLGLTIETVSRVFTRLKDKGVI
183 >Q53170/175-206
184 LPMT.-RLDVADYLGMTIETVSRTITKLAGSGVI
185 >Q989I4/189-220
186 LPLT.-RADISDFLGLTNETVSRQLTRLRADGVI
187 >Q988R0/189-220
188 LPLT.-RADIADFLGLTIETVSRQLTRLRTDGLI
189 >O06655/187-218
190 LPLS.-RAEIADFLGLTIETVSRKLTKLRKSGVI
191 >O86069/185-216
192 LPLS.-RAEIADFLGLTIETVSRQLTRLRKEGVI
193 >O86067/187-218
194 LPLS.-RAEIADFLGLTIETVSRQMTRLRKWGVI
195 >Q52775/187-218
196 LPLS.-RAEIADFLGLTIETVSRQMTRLRKSGVI
197 >FX24_RHILV/187-218
198 LPLS.-RAEIADFLGLTIETVSRQMTRLRKIGVI
199 >FNRL_RHOSH/187-218
200 LPLT.-REEMADYLGLTLETVSRQVSALKRDGVI
201 >Q51677/188-219
202 LPLT.-REAMADYLGLTLETVSRQMSALKREGVI
203 >O33961/187-218
204 LPLT.-REAMADYLGLTLETVSRQMSALKRDGVI
205 >O87372/155-185
206 -SIS.-RADMADFLGLTTETVSRLLSAFHREQLI
207 >P95599/188-221
208 LRVSmNRQDIADHLGLTIETLAHTVTKLASRNIV
209 >Q52823/185-216
210 VPMS.-RQDIADHLGLTIETVSRTLTKLASRNVV
211 >Q9FDG3/192-223
212 VPMN.-RQDIADHLGLTIETVSRTITKLAARNIV
213 >O84975/207-238
214 LRMS.-REDIASYLGLRLETVCRSVARLRAQDVV
215 >Q53240/186-217
216 FPIT.-RQNISEMTGTTLHTVSRLLSAWEREGIV
217 >O52578/162-191
218 --IS.-RQDIAEMTGTTLHTVSRILSAWEQLGFV
219 >Q9KWP8/153-184
220 FPIT.-KQDIAEMTGTTLHTVSRILTGWEAQGFV
221 >O66781/189-220
222 LPLT.-RQDIAEMTGTTVETTIRVMSKWKKQGII
223 >Q982N1/28-58
224 -PIA.-RGEIASRVGLTVQTVSTIVRELEEQGYI
225 >P96094/179-210
226 LPAK.-KAMIAARLGLTPETFSRVLKRLREEHLI
227 >FLP_LACCA/168-199
228 VPMA.-WTQLADYLGTTPETVSRTLKRLAEEKLI
229 >Q97IX9/173-206
230 INMElSITYLADMLGSKRETVSRQLKLLTEKNLV
231 >Q9CE44/171-202
232 IPMK.-LKELANYIGTSPETISRKIKVFEENKII
233 >Q9S392/178-209
234 IPMK.-MKDLATFIGTTPETISRKFKILEEKGFI
235 >Q9S393/178-209
236 IPMT.-LKDLSAFIGTTPETISRKLRLLEEKGLV
237 >Q98GX3/209-240
238 LPLS.-QAELADVLGLSVVHMNRVIGALRKVGVV
239 >Q9XDD3/182-213
240 CPLT.-QGELADALGLTPIHINRMLRELREDNLL
241 >NTCA_ANASP/172-203
242 LKLS.-HQAIAEAIGSTRVTVTRLLGDLREKKMI
243 >NTCA_SYNP7/171-202
244 LKLS.-HQAIAEAIGSTRVTVTRLLGDLRESKLI
245 >NTCA_SYNY3/174-205
246 LKLS.-HQAIAEAIGSTRVTVTRLLGDLREGNMI
247 >P94611/175-206
248 LKLS.-HQAIAEAIGSTRVTVTRLLGDLRQEEMI
249 >Q9L627/170-201
250 LKLS.-HQAIAEAIGSTRVTVTRLLGDLRQDEMI
251 >Q9AG80/172-203
252 LKLS.-HQAIAEAIGSTRVTVTRLLGDLRQDKMI
253 >O30778/173-204
254 LRLS.-HQAIAEAIGSTRVTITRLLGDLRNSGLV
255 >Q9KI45/189-220
256 FPLT.-HAQIGSAIGSTRVTVTRLMGKLRQRGLI
257 >CYSR_SYNP7/152-183
258 IPLT.-HQVIAELSGSTRVTTTRLLGEFRQAGRI
259 >CYSR_SYNY3/160-191
260 VRLT.-HQMLANAIGTTRVTVTRLLGEFQTQGKV
261 >Q55322/177-208
262 LRLT.-HQEMASALSTTRVTVTRVIGLLRDEGWL
263 >Q9RTV7/201-231
264 -RIS.-HQDLAHSVGSTRETITKLLGDFRTRGLL
265 >Q9TLZ6/157-188
266 IYIS.-QHDIASILSTTRSTITRLINQLRKDNII
267 >FNR_BACSU/174-205
268 IVLT.-NQDLAKFCAAARESVNRMLGDLRKKGVI
269 >O86128/173-204
270 IVLT.-NQDLAKFCAAARESINRMLSDLRKNGVI
271 >Q9KG81/173-204
272 IVLT.-NQELANFCAAARESVNRMLGELRKLGVI
273 >CRP_PASMU/165-196
274 IKIT.-RQEIGQMVGCSRETVGRILKMLEDQHLI
275 >Q48301/170-201
276 IKIT.-RQEIGQMVGCSRETVGRILKMLEDQHLI
277 >CRP_HAEIN/180-211
278 IKIT.-RQEIGQMVGCSRETVGRIIKMLEDQNLI
279 >Q51859/180-211
280 IKIT.-RQEIGQMVGCSRETVGRIIKMLEDEGLI
281 >Q9F435/166-197
282 IKIT.-RQEIGQIVGCSRETVGHILKMLEDQNLI
283 >CRP_ECOLI/166-197
284 IKIT.-RQEIGQIVGCSRETVGRILKMLEDQNLI
285 >CRP_SALTY/166-197
286 IKIT.-RQEIGQIVGCSRETVGRILKMLEDQNLI
287 >O07097/166-197
288 IKIT.-RQEIGQIVGCSRETVGRILKMLEDQNLI
289 >Q9ALY5/166-197
290 IKIT.-RQEIGQIVGCSRETVGRILKMLEEQNLI
291 >O34015/166-197
292 IKIT.-RQEIGQIVGCSRETVGRILKMLEEQNLI
293 >Q9KNW6/166-197
294 IKIT.-RQEIGQIVGCSRETVGRILKMLEEQNLI
295 >CLP_XANCP/186-217
296 LRVS.-RQELARLVGCCAQMAGRVLKKLQADGLL
297 >Q9PD39/185-216
298 LRVS.-RQELARLVGCSREMAGRVLKKLQADGLL
299 >Q9S6B5/186-217
300 LRVS.-RQELARLVGCSREMAGRVLKKLQADGLL
301 >P71977/33-62
302 --LS.-QAEIGERVGMARSTVSRILNALEDEGLV
303 >O28174/36-67
304 VKIS.-SKELAEHIGQSLQTAARKLKELEDEGLI
305 >Q9CB91/174-204
306 -DLT.-QEEIAQLVGASRETVNKALADFAHRGWI
307 >O69644/174-204
308 -DLT.-QEEIAQLVGASRETVNKALADFAHRGWI
309 >Q9XA42/174-204
310 -DLT.-QEELAQLVGASRETVNKALADFAQRGWL
311 >Q97TL8/136-167
312 INCT.-HEDIGKAVGVSRVTVSRTLNKFSQYQWI
313 >Q99YT6/175-206
314 FQLT.-TTDIAQISGTTRETVSHVLRDLKKQELI
315 >Q9RRX0/176-209
316 LNLKlNQEDIARMVGATRETVSHSLSRLKKGGAI
317 >Q9K5F3/178-209
318 CPIT.-AAEIAKISGTSRETVSAVLKKLRCEGVI
319 >P73234/185-215
320 -NLP.-HRETAMLSGVTRETVTRTLGKLEKKGLI
321 >P74171/182-212
322 -NLP.-HRELSSISGLARETVTRCLTKLEKRGLI
323 >Q981X4/78-109
324 AKVT.-HDQIAAMVGSTRQWVTMMMKRFQKEGLV
325 " >
326 </form>-->
327
328
329
330 <!--<img alt="CAP Binding Site Logo"
331 src="examples/cap_dna.png" >
332 <p>
333 The two DNA recognition helixes of the CAP homodimer insert
334 themselves into consecutive turns of the major groove. Several
335 consequences can be observed in this CAP binding site logo. The logo
336 is approximately palindromic, which provides two very similar
337 recognition sites, one for each subunit of the dimer.
338 However, the binding
339 site is not perfectly symmetric, possibly due to the
340 inherent asymmetry of the operon promoter region.
341 The displacement of the two parts is 11 base pairs, or approximately
342 one full turn of the DNA helix. Additional interactions between the
343 protein and the first and last two bases occur within the DNA minor
344 groove, where it is difficult for the protein to distinguish A from T,
345 or G from C.
346 The data for this logo consists of 59 binding sites determined by
347 <a href="#footprinting">DNA footprinting</a>.
348 <cite>
349 Robison, K., McGuire, A. M., Church, G. M. A comprehensive library of
350 DNA-binding site matrices for 55 proteins applied to the
351 complete <i>Escherichia coli</i> K12 genome. Journal of Molecular Biology
352 (1998) 284, 241-254.
353 </cite>
354 </p>
355
356 <form method="post" action="create.cgi">
357 <input type="submit" name="cmd_edit" value="Edit Logo" >
358 <input type="hidden" name="first_index" value="-10" >
359 <input type="hidden" name="show_xaxis" value="true" >
360 <input type="hidden" name="show_yaxis" value="true" >
361 <input type="hidden" name="show_errorbars" value="true" >
362 <input type="hidden" name="show_fineprint" value="true" >
363 <input type="hidden" name="scale_width" value="true" >
364 <input type="hidden" name="logo_title" value="58 CAP Binding Sites" >
365 <input type="hidden" name="sequences" value="
366 >aldB -18->4
367 attcgtgatagctgtcgtaaag
368 >ansB 103->125
369 ttttgttacctgcctctaactt
370 >araB1 109->131
371 aagtgtgacgccgtgcaaataa
372 >araB2 147->169
373 tgccgtgattatagacactttt
374 >cdd 1 107->129
375 atttgcgatgcgtcgcgcattt
376 >cdd 2 57->79
377 taatgagattcagatcacatat
378 >crp 1 115->137
379 taatgtgacgtcctttgcatac
380 >crp 2
381 gaaggcgacctgggtcatgctg
382 >cya 151->173
383 aggtgttaaattgatcacgttt
384 >cytR 1 125->147
385 cgatgcgaggcggatcgaaaaa
386 >cytR 2 106->128
387 aaattcaatattcatcacactt
388 >dadAX 1 95->117
389 agatgtgagccagctcaccata
390 >dadAX 2 32->54
391 agatgtgattagattattattc
392 >deoP2 1 75->97
393 aattgtgatgtgtatcgaagtg
394 >deoP2 2 128->150
395 ttatttgaaccagatcgcatta
396 >fur 136->158
397 aaatgtaagctgtgccacgttt
398 >gal 56->78
399 aagtgtgacatggaataaatta
400 >glpACB (glpTQ) 1 54->76
401 ttgtttgatttcgcgcatattc
402 >glpACB (glpTQ) 2 94->116
403 aaacgtgatttcatgcgtcatt
404 >glpACB (glpTQ) 144->166
405 atgtgtgcggcaattcacattt
406 >glpD (glpE) 95->117
407 taatgttatacatatcactcta
408 >glpFK 1 120->142
409 ttttatgacgaggcacacacat
410 >glpFK 2 95->117
411 aagttcgatatttctcgttttt
412 >gut (srlA) 72->94
413 ttttgcgatcaaaataacactt
414 >ilvB 87->109
415 aaacgtgatcaacccctcaatt
416 >lac 1 (lacZ) 88->110
417 taatgtgagttagctcactcat
418 >lac 2 (lacZ) 16->38
419 aattgtgagcggataacaattt
420 >malEpKp1 110->132
421 ttgtgtgatctctgttacagaa
422 >malEpKp2 139->161
423 TAAtgtggagatgcgcacaTAA
424 >malEpKp3 173->195
425 TTTtgcaagcaacatcacgAAA
426 >malEpKp4 205->227
427 GACctcggtttagttcacaGAA
428 >malT 121->143
429 aattgtgacacagtgcaaattc
430 >melR 52->74
431 aaccgtgctcccactcgcagtc
432 >mtl 302->324
433 TCTTGTGATTCAGATCACAAAG
434 >nag 156->178
435 ttttgtgagttttgtcaccaaa
436 >nupG2 97->119
437 aaatgttatccacatcacaatt
438 >nupG1 47->69
439 ttatttgccacaggtaacaaaa
440 >ompA 166->188
441 atgcctgacggagttcacactt
442 >ompR 161->183
443 taacgtgatcatatcaacagaa
444 >ptsH A 316->338
445 Ttttgtggcctgcttcaaactt
446 >ptsH B 188->210
447 ttttatgatttggttcaattct
448 >rhaS (rhaB) 161->183
449 aattgtgaacatcatcacgttc
450 >rot 1 (ppiA) 182->204
451 ttttgtgatctgtttaaatgtt
452 >rot 2 (ppiA) 129->151
453 agaggtgattttgatcacggaa
454 >tdcA 60->82
455 atttgtgagtggtcgcacatat
456 >tnaL 73->95
457 gattgtgattcgattcacattt
458 >tsx 2 146->168
459 gtgtgtaaacgtgaacgcaatc
460 >tsx 1 107->129
461 aactgtgaaacgaaacatattt
462 >uxuAB 165->187
463 TCTTGTGATGTGGTTAACCAAT
464 " >
465 </form>
466
467 <hr ><a name="trans"></a>
468 <h2><i>E. coli</i> Transcription Factor Binding Sites</h2>
469
470 <p>
471 The following logos (along with the <a href="#CAP">CAP logo</a> above) display
472 a selection of <i>E. coli</i> transcription factor binding sites determined
473 by DNA footprinting. This data has been collated in the
474 <a href="http://arep.med.harvard.edu/dpinteract/">DPInteract</a>
475 database and has been used to
476 <a href="http://arep.med.harvard.edu/ecoli_matrices/">search for
477 additional binding sites</a> within the <i>E. coli</i> genome.
478 </p>
479 <p>
480 <a name="footprinting"></a>
481 <cite>
482 Robison, K., McGuire, A. M., Church, G. M. A comprehensive library of
483 DNA-binding site matrices for 55 proteins applied to the
484 complete <i>Escherichia coli</i> K12 genome. Journal of Molecular Biology
485 (1998) 284, 241-254.
486 </cite>
487 </p>
488
489 <a name="LexA"></a>
490 <img alt ="" src="examples/lexA.png" ><br >
491 <form method="post" action="create.cgi">
492 <input type="submit" name="cmd_edit" value="Edit Logo" >
493 LexA repressor is closely related to CAP, and has similar DNA protein
494 interactions.
495 <input type="hidden" name="logo_title" value="19 LexA Binding Sites" >
496 <input type="hidden" name="first_index" value="-9" >
497 <input type="hidden" name="show_xaxis" value="true" >
498 <input type="hidden" name="show_yaxis" value="true" >
499 <input type="hidden" name="show_errorbars" value="true" >
500 <input type="hidden" name="show_fineprint" value="true" >
501 <input type="hidden" name="scale_width" value="true" >
502 <input type="hidden" name="sequences" value="
503 >dinD 32->52
504 aactgtatataaatacagtt
505 >dinG 15->35
506 tattggctgtttatacagta
507 >dinH 77->97
508 tcctgttaatccatacagca
509 >dinI 19->39
510 acctgtataaataaccagta
511 >lexA-1 28->48
512 tgctgtatatactcacagca
513 >lexA-2 7->27
514 aactgtatatacacccaggg
515 >polB(dinA) 53->73
516 gactgtataaaaccacagcc
517 >recA 59->79
518 tactgtatgagcatacagta
519 >recN-1 49->69
520 tactgtatataaaaccagtt
521 >recN-2 27->47
522 tactgtacacaataacagta
523 >recN-3 9->29
524 TCCTGTATGAAAAACCATTA
525 >ruvAB 49->69
526 cgctggatatctatccagca
527 >sosC 18->38
528 tactgatgatatatacaggt
529 >sosD 14->34
530 cactggatagataaccagca
531 >sulA 22->42
532 tactgtacatccatacagta
533 >umuDC 20->40
534 tactgtatataaaaacagta
535 >uvrA 83->103
536 tactgtatattcattcaggt
537 >uvrB 75->95
538 aactgtttttttatccagta
539 >uvrD 57->77
540 atctgtatatatacccagct" >
541 </form>
542
543 <a name="hns"></a>
544 <!--<img alt ="" src="examples/hns.png" >-->
545 <!--<form method="post" action="create.cgi">
546 <input type="submit" name="cmd_edit" value="Edit Logo" >
547 H-NS: Histone like, nucleoid-associated DNA-binding protein.
548 <input type="hidden" name="logo_title" value="15 hns Binding Sites" >
549 <input type="hidden" name="first_index" value="-1" >
550 <input type="hidden" name="logo_start" value="1" >
551 <input type="hidden" name="show_xaxis" value="true" >
552 <input type="hidden" name="show_yaxis" value="true" >
553 <input type="hidden" name="show_errorbars" value="true" >
554 <input type="hidden" name="show_fineprint" value="true" >
555 <input type="hidden" name="scale_width" value="true" >
556 <input type="hidden" name="sequences" value="
557 >hns1
558 tAGGCTGATTT
559 >hns2
560 gAAAATTATTT
561 >hns3
562 gGGAGTTATTC
563 >hns4
564 aCAAATTATTT
565 >hns5
566 gCAACAGAGTA
567 >hns6
568 aCGCCTGAATA
569 >hns7
570 tCGAGAAAGTT
571 >hns8
572 tCGCCGGAATT
573 >hns9
574 tGGCATGAATA
575 >hns10
576 aTAAAGGAATC
577 >hns11
578 cTAATTTAATT
579 >hns12
580 gCAATTAAATT
581 >hns13
582 tGACATGAATC
583 >hns14
584 cTGGCTAATTT
585 >hns15
586 aCAACTGAATT" >
587 </form>
588
589
590 <a name="dnaA"></a>-->
591 <!--<img alt="" src="examples/dnaA.png" >-->
592 <!--<form method="post" action="create.cgi">
593 <input type="submit" name="cmd_edit" value="Edit Logo" >
594 DNA biosynthesis initiation binding protein.
595 <input type="hidden" name="logo_title" value="8 dnaA Binding Sites" >
596 <input type="hidden" name="logo_end" value="14" >
597 <input type="hidden" name="show_xaxis" value="true" >
598 <input type="hidden" name="show_yaxis" value="true" >
599 <input type="hidden" name="show_errorbars" value="true" >
600 <input type="hidden" name="show_fineprint" value="true" >
601 <input type="hidden" name="scale_width" value="true" >
602 <input type="hidden" name="sequences" value="
603 >dnaA_1 rpoH-1
604 aatttattcacaagc
605 >dnaA_2 rpoH-2
606 attttatccacaagt
607 >dnaA_3 nrd
608 gagttatccacaaag
609 >dnaA_4 oriC-R1
610 ttgttatccacaggg
611 >dnaA_5 oriC-R2
612 ggggttatacacaac
613 >dnaA_6 oriC-R3
614 ttctttggataacta
615 >dnaA_7 oriC-R4
616 gagttatccacagta
617 >dnaA_10 dnaA
618 gatttatccacagga" >
619 </form>
620 -->
621
622 <!-- <a name="argR"></a> -->
623 <!--<img alt ="" src="examples/argR.png" >-->
624 <!--<form method="post" action="create.cgi">
625 <input type="submit" name="cmd_edit" value="Edit Logo" >
626 Arginine Repressor.
627 <input type="hidden" name="logo_title" value="17 ArgR Binding Sites" >
628 <input type="hidden" name="first_index" value="-8" >
629 <input type="hidden" name="show_xaxis" value="true" >
630 <input type="hidden" name="show_yaxis" value="true" >
631 <input type="hidden" name="show_errorbars" value="true" >
632 <input type="hidden" name="show_fineprint" value="true" >
633 <input type="hidden" name="scale_width" value="true" >
634 <input type="hidden" name="sequences" value="
635 >argA-1 32->50
636 acagaataaaaatacact
637 >argA-2 11->29
638 ttcgaataatcatgcaaa
639 >argD-1 51->69
640 agtgattttttatgcata
641 >argD-2 30->48
642 tgtggttataatttcaca
643 >argECBH-1 26->44, argC 110->128
644 tatcaatattcatgcagt
645 >argECBH-2 47->65, argC 89->107
646 tatgaataaaaatacact
647 >argF-1 48->66
648 aatgaataattacacata
649 >argF-2 27->45
650 agtgaattttaattcaat
651 >argG-1 73->91
652 attaaatgaaaactcatt
653 >argG-2 52->70
654 tttgcataaaaattcagt
655 >argG-3 192->210
656 tgtgaatgaatatccagt
657 >argI-1 46->64
658 aatgaataatcatccata
659 >argI-2 25->43
660 attgaattttaattcatt
661 >argR-1 45->63
662 tttgcataaaaattcatc
663 >argR-2 24->42
664 tatgcacaataatgttgt
665 >carAB-1 32->50
666 tgtgaattaatatgcaaa
667 >carAB-2 11->29
668 agtgagtgaatattctct" >
669 </form>
670
671
672
673 <hr >
674 <a name="promoters"></a>
675 <h2><i>E. coli</i> Promoters (Transcription Start Signals)</h2>
676
677 <p>
678 <img alt="" src="examples/ecoli10.png"><br >
679 In prokaryotes the DNA sequence just upstream of the transcription start point
680 contains two important conserved regions. The first such region is centered
681 at around 35bp upstream and is involved in the initial recognition of the
682 gene by RNA polymerase. -->
683 <!--The consensus sequence is TTGACAT, but the logo
684 indicates that a great deal of variation occurs. -->
685 <!--The second region, sometimes
686 referred to as the Pribnow box, is centered at about 10bp upstream. The typical
687 separation between the -35 and -10 sites is 15-18 bp.
688 See
689 <a class="out" href="http://www.lecb.ncifcrf.gov/~toms/papers/baseflip/">baseflip:
690 Strong Minor Groove Base Conservation in Sequence Logos
691 implies DNA Distortion or Base Flipping during Replication and
692 Transcription Initiation</a> for more information. This sequence data was kindly provided by Prof. Julia Brettschneider &lt;juliab@stat.berkeley.edu&gt;
693 </p>-->
694
695 <!--
696 <form method="post" action="create.cgi">
697 <input type="submit" name="cmd_edit" value="Edit Logo" >
698 The -10 region of 350 E. coli promoters
699 <input type="hidden" name="logo_title" value="-10 region of 350 E. coli promoters" >
700 <input type="hidden" name="first_index" value="-21" >
701 <input type="hidden" name="logo_start" value="0" >
702 <input type="hidden" name="logo_end" value="7" >
703 <input type="hidden" name="show_xaxis" value="true" >
704 <input type="hidden" name="show_yaxis" value="true" >
705 <input type="hidden" name="show_errorbars" value="true" >
706 <input type="hidden" name="show_fineprint" value="true" >
707 <input type="hidden" name="scale_width" value="true" >
708 <input type="hidden" name="sequences" value="> The -10 hexamers of 350 E.coli promoters
709 gatgacgtggtttacgaccccaTTTAGTagtcaaccgcagtgagtgagtc
710 >
711 ttgaaaccagacgtttcgccccTATTACagactcacaaccacatgatgac
712 >
713 ctggcggcgtagcgatgcgctgGTTACTctgaaaacggtctatgcaaatt
714 >
715 tgacttttagcgcccatatctcCAGAATgccgccgtttgccagaaattcg
716 >
717 gatttacgtcatcattgtgaatTAATATgcaaataaagtgagtgaatatt
718 >
719 agaatacagcttattgaataccCATTATgagttagccattaacgcgtcca
720 >
721 cgacgacggtttacgctttacgTATAGTggcgacaattttttttatcggg
722 >
723 ctgacgctttttatcgcaactcTCTACTgtttctccatacccgttttttt
724 >
725 atccgtttttgtatccagtaacTCTAAAagcatatcgcattcatctggag
726 >
727 ttttttattgaatgtagaatttTATTCTgaatgtgtgggctctctatttt
728 >
729 tattctgaatgtgtgggctctcTATTTTaggattaattaaaaaaatagag
730 >
731 tcttttcacctttcctcctgttTATTCTtattaccccgtgtttatgtctc
732 >
733 attgcttaagcaagatcggacgGTTAATgtgttttacacattttttccgt
734 >
735 gcgccacactaaggtaattcctTATGCTggcaatgtcgtgaccagtgata
736 >
737 tgcagcctgtgctcagcgcgtgTTTCATacgcaagtgcgtatcggcgcgc
738 >
739 tgcattcgctgccgcataccatTATTCTtgatctgacggaagtctttttg
740 >
741 ggacataaggtgaatactttgtTACTTTagcgtcacagacatgaaattgg
742 >
743 ttattgagctttccggcgagagTTCAATgggacaggttccagaaaactca
744 >
745 ttaaaaattgttaacaattttgTAAAATaccgacggatagaacgacccgg
746 >
747 taacacctcgtcaaaatcctgcTATTCTgcccgttgcggtactgggcatt
748 >
749 tctattttatattattccctgtTTTAATtaactctatcagggatggttta
750 >
751 gacagaggccctcaatccaaacGATAAAgggtgatgtgtttactgatatg
752 >
753 tgctatctcgctgacggacaggCAAATTgatgaccagcttttaaaccgac
754 >
755 tttgacatttcttttgcactggTAAACTaaatcacttttttttgtcccag
756 >
757 ttttctcgcgtccgcgatagcgTAAAATagcgccgtaacccccaggtcct
758 >
759 aatttctacctgtttaagcatcTCTGGTagacttcctgtaattgaatcga
760 >
761 tgcagtgctcatagcggtcattTATGTCagacttgtcgttttacagttcg
762 >
763 aacatatctcgcaagcctgtctTGTGTTgacaacattttctgctaaccct
764 >
765 ctctccctgacgcgggataaagTGGTATtctcaaacatatctcgcaagcc
766 >
767 tatatctttaacaatctcaggtTAAAAActttcctgttttcaacgggact
768 >
769 gttgcaaatgaataattacacaTATAAAgtgaattttaattcaataagtg
770 >
771 tgaacgtccaatcaataaccgcTTTAATagataaacaccgctgatgaatg
772 >
773 ttgctttttatcttcagatgaaTAGAATgcggcggattttttgggtttca
774 >
775 gtcataaggtaaaagtctcattTATGATgagttccattggatttacttat
776 >
777 ttaccttatgacaatcggcgagTAGTCTgcctctcattccagagacagac
778 >
779 tacactttatgcttccggctcgTATGTTgtgtggaattgtgagcggataa
780 >
781 cgcaaaacctttcgcggtatggCATGATagcgcccggaagagagtcaatt
782 >
783 taaagttgtcacggccgagactTATAGTcgctttgtttttattttttaat
784 >
785 ttcattcttgaatatttattggTATAGTaaggggtgtattgagattttca
786 >
787 atctcttggccttgctggtcgtTATCCTgcaagctatcactttattggct
788 >
789 taaatctgtcataaatctgacgCATAATgacgtcgcattaatgatcgcaa
790 >
791 tgcagggagagcgccccggcacTAGACTacccgcctcttattttagtctg
792 >
793 acatatttttgtgagcaatgatTTTTATaataggctcctctgtatacgaa
794 >
795 ttacagtaatgtaaccttcccgTAAAATgcccacacactttaaacgccac
796 >
797 tagcgtaacaacaaaagattgtTATGCTtgaaatatggtgatgccgtacc
798 >
799 tcccttgtccccatctctcccaCATCCTgtttttaaccttaaaatggcat
800 >
801 tgaggcaatcgcctgttggtggTATCGTttatcgctttttcaaaaaattc
802 >
803 gattgcagaaatatattgataaTATTATtgataactatttgcatttgcaa
804 >
805 aaatgcaaatagttatcaataaTATTATcaatatatttctgcaatcaatg
806 >
807 tgctggaaaattaatgtgctttTATAGTggcgcttattgttgtcaatatt
808 >
809 attatcactcccttttactggcTAAACCagaaaacttattttatcattca
810 >
811 tcacacactctgtagcagatgaTCTAACaatctgattacagaacatcggc
812 >
813 tgtcagcctgtcccgcttataaGATCATacgccgttatacgttgtttacg
814 >
815 tttcatttaggcgtggcaattcTATAATgatacgcattatctcaagagca
816 >
817 acagttattagtggtagacaagTTTAATaattcggattgctaagtacttg
818 >
819 acaaacattaccaggaaaagcaTATAATgcgtaaaagttatgaagtcggt
820 >
821 tgtaatgattttgtgaacagccTATACTgccgccaggtctccggaacacc
822 >
823 tgggcagcttcttcgtcaaattTATCATgtggggcatccttaccgctctg
824 >
825 ctttaaaaactgcccctgacacTAAGACagtttttaaaggttccttcgcg
826 >
827 ggaaatgggcatcaaaaagagaTAAATTgttctcgatcaaattggctgaa
828 >
829 ttacacattctgacggaagataTAGATTggaagtattgcattcactaaga
830 >
831 gtcacacttttcgcatctttgtTATGCTatggttatttcataccataagc
832 >
833 gtcacacttttcgcatctttgtTATGCTatggttatttcataccataagc
834 >
835 gttttttgttgttaattcggtgTAGACTtgtaaacctaaatcttttcaat
836 >
837 tgtaaaccaaattgaaaagattTAGGTTtacaagtctacaccgaattaac
838 >
839 caaaactggcacgattttttcaTATATGtgaatgtcacgcaggggatcgt
840 >
841 tttttcatcaggttttacgctaAATAATcactgtgttgagtgcacaattt
842 >
843 ttgacggctcgccctaattctcTAAATTgtatttctagagttggcgaggt
844 >
845 cgtgttacaaaaattcttttctTATGATgtagaacgtgcaacgcaattga
846 >
847 caaaaattcttttcttatgatgTAGAACgtgcaacgcaattgatgctcgc
848 >
849 gatggtgaacaagtacgcgaggGAGAATgagcatccattgctgtgtacgc
850 >
851 actcctcacttacacgtaatacTACTTTcgagtgaaaatctacctatctc
852 >
853 ggtggtggtttgttggttgggtTGACATactgggtcatttacctgcgtga
854 >
855 tatggtgctgccggtcgcgatgTTTGTTgccagcggttttgagcacagta
856 >
857 gcaaacctgatggtatgtctggCAGTATggatgagttattctggccgcag
858 >
859 tttctcatctataatgctttgtTAGTATctcgtcgccgacttaataaaga
860 >
861 tttctcatctataatgctttgtTAGTATctcgtcgccgacttaataaaga
862 >
863 tgataaaaccgatagccacaggAATAATgtattacctgtggtcgcaatcg
864 >
865 gagcaagtgattgaaaaagcgcTACAATacgcgcgccagaaattggctct
866 >
867 tggaattttgtaaatctcccgtTACCCTgatagcggacttcccttctgta
868 >
869 ttcaataaattgcgaaacaaggTATACTccagcagttcctgaagatgttt
870 >
871 acgcagcagtagcaaactaagcTATAAAttgcagcgcgaactggagcagc
872 >
873 tgttcagcgtacacgtgttagcTATCCTgcgtgcttcaataaaataaggc
874 >
875 ttgtaagttttcaactacgttgTAGACTttacatcgccaggggtgctcgg
876 >
877 ttcacacttgtaagttttcaacTACGTTgtagactttacatcgccagggg
878 >
879 gttgatctttgttgtcactggaTGTACTgtacatccatacagtaactcac
880 >
881 attagcatcgcatcaggcaatcAATAATgtcagatatgaaaagcggaaac
882 >
883 tggcatatgaaattttgaggatTACCCTacacttataggagttaccttac
884 >
885 acatggttgcacaaagttgcaaCATCATggatatttcacgataacgttaa
886 >
887 aaaatttaatgtaaatggtgtgTTAAATcgattgtgaataaccagcgctt
888 >
889 aaaatttaatgtaaatggtgtgTTAAATcgattgtgaataaccagcgctt
890 >
891 tgtgaataaccagcgcttccggCAGGATacggtcgccctggtaaaacata
892 >
893 aacggcaagtttcgacattgccGATAATaattttttggagactttagatg
894 >
895 catcactctgtcatctttccagTAGAAActaatgtcactgaaatggtgtt
896 >
897 gtcggaatggctggttatccatTAAAATagatcggatcgatataagcaca
898 >
899 tgcaaaggaaaacgtttccgctTATCCTttgtgtccggcaaaaacatccc
900 >
901 tgactctatgacgttacaaagtTAATATgcgcgccctatgcaaaaggtaa
902 >
903 tttcagagattatgaattgccgCATTATagcctaataacgcgcatctttc
904 >
905 ttcatgacggcaaacaatagggTAGTATtgacaagccaattacaaatcat
906 >
907 tgatctgctggcaagaacagacTACTGTatataaaaacagtataacttca
908 >
909 tgaataatattttcaactgagtTATCAAgatgtgattagattattattct
910 >
911 gatcatgcagctagtgcgatccTGAACTaaggttttctgatacttgaata
912 >
913 gatgcggtgctttcctggctgtTAGAATacgccccgtcgcgcctgactgg
914 >
915 agcgttaccgtccgctatcgtcTATGTTcaagttgtcttaattgccagaa
916 >
917 tttattgatcttacgcatcctgTATGATgcaagcagactaaccctatcaa
918 >
919 catcaaattgcctttagctacaGACACTaaggtggcagacatcgaaacga
920 >
921 gtttcagagcgttaccttgcccTTAAACattagcaatgtcgatttatcag
922 >
923 tgcacaactgaatttaaggctcTATTATtacctcaacaaaccaccccaat
924 >
925 taatgtagccaccaaatcatacTACAATttattaactgttagctataatg
926 >
927 tgctgaagaataattgaaatgaTATTATtaattccactgcctttggtaga
928 >
929 gaatatgattgctatttgcattTAAAATcgagacctggtttttctactga
930 >
931 cgtgacattttaacacgtttgtTACAAGgtaaaggcgacgccgcccatga
932 >
933 tgacaattaatcatcgaactagTTAACTagtacgcaagttcacgtaaaaa
934 >
935 ttgcgtatcggattttatcaggTACAGTgtgacgctttcgtcaatctggc
936 >
937 gacgctttcgtcaatctggcaaTAGATTtgcttgacattcgaccaaaatt
938 >
939 acattcgaccaaaattccgtcgTGCTATagcgcctgtaggccaagacctg
940 >
941 ggtgaaccccttctcgttatggCAAAATaagccaatacagaaccagcatt
942 >
943 gacagatttgtgccattccgtgAACGATcgacgcgtcgtgattaggtgaa
944 >
945 tttcaccagacttattcttagcTATTATagttatagagagcttacttccg
946 >
947 tcctgctatccaaatagtgtcaTATCATcatattaattgttcttttttca
948 >
949 gctgtgttattgacagttagcaTAAACTaggtgtgacgttaactatatgt
950 >
951 cgattccgtctctctgatgattGATGTTaattaacaatgtattcaccgaa
952 >
953 tgtccttgttcgataaacacaaTAAACTtgatcatgaaattgccagaaag
954 >
955 tatcctcgtgctgtttctcacgTAGTCTataatttcctttttaagcccac
956 >
957 tttgttaaaaaagtgtgtaggaTATTGTtactcgcttttaacagggcaac
958 >
959 ttacttcccgtaggattcttgcTTTAATagtgggattaatttccacatta
960 >
961 attacgcaacgataatagcgggTATAAGataaataaaaggtaaaacgttt
962 >
963 tttgtctcaccttttaatttgcTACCCTatccatacgcacaataaggcta
964 >
965 tccccttttcgtcaagatcggcCAAAATtccacgcttacactatttgcgt
966 >
967 attctcaacataaaaaactttgTGTAATacttgtaacgctacatggagat
968 >
969 ttcatccggttaaatatgcaaaGATAAAtgcgcagaaatgtgtttctcaa
970 >
971 gtgcattagcttatttttttgtTATCATgctaaccacccggcgaggtgtg
972 >
973 tgacttttatcgccgtagccttTTCAATaaaggtcttttgaagagtacca
974 >
975 ttaacgtttttaactttttaatTAGAATatagatacaggagagcacatat
976 >
977 taacggatgtatccgtttagtcTATGATatgtacagcacttttggcttcg
978 >
979 tcactttccgctgattcggtgcCAGACTgaaatcagcctataggaggaaa
980 >
981 gggcttgaaaaagcgcccaatgTATTCCaggcttatctaacacgctgata
982 >
983 cttaccgtcacattcttgatggTATAGTcgaaaactgcaaaagcacatga
984 >
985 accaactggcaaaattttgtccTAAACTtgatctcgacgaaatggctgca
986 >
987 catttttatcgtaattgcccttTAAAATtcggggcgccgaccccatgtgg
988 >
989 aaaattcggggcgccgaccccaTGTGGTctcaagcccaaaggaagagtga
990 >
991 ttgacgctgcgtaaggtttttgTAATTTtacaggcaaccttttattcact
992 >
993 ataaaataattttttcgatatcTAAAATaaatcgcgaaacgcaggggttt
994 >
995 ttgaaaatagtcgcgtaacccaTACGATgtgggtatcgcatattgcgttt
996 >
997 tttcgcaagctcgtaaaagcagTACAGTgcaccgtaagaaaattacaagt
998 >
999 tcttcatccttcgctggatatcTATCCAgcatttttttatcatacagcat
1000 >
1001 gacgagtacagttgcgtcgattTAGGAAaaatcttagataagtgtaaaga
1002 >
1003 cttcatgaccgtgaatagagtcCATCGTccctcctcaaaaaaagcctagc
1004 >
1005 tgacgaagcagccgttatgcctTAACCTgcgccgcagatatcactcataa
1006 >
1007 tgaaacattgatgtctctgtagCAACATaggggtaatcttactgacaaca
1008 >
1009 tgtctgaacgtgaattgcagatTATGCTgatgatcaccaagggccagaag
1010 >
1011 tcaaagttgcaataaaaaccgcTAATATacgaatgactaactatcagtag
1012 >
1013 gattaaaaaccctgcagaaacgGATAATcatgccgataactcatataacg
1014 >
1015 ctttgttgcgctcaagacgcagGATAATtagccgataagcagtagcgaca
1016 >
1017 tactttaagacaattccaggcaAATTATacaacactttacgggatagtaa
1018 >
1019 tttgtttcacatttctgtgacaTACTATcggatgtgcggtaattgtatgg
1020 >
1021 ttcacatttctgtgacatactaTCGGATgtgcggtaattgtatggaacag
1022 >
1023 ttcacatttctgtgacatactaTCGGATgtgcggtaattgtatggaacag
1024 >
1025 tgtgacatactatcggatgtgcGGTAATtgtatggaacaggagacacaca
1026 >
1027 tgtgacatactatcggatgtgcGGTAATtgtatggaacaggagacacaca
1028 >
1029 gctgattagcacggtgatatttGATACTctggcagacagcagaaataacg
1030 >
1031 taataaatagttaattaacgctCATCATtgtacaatgaactgtacaaaag
1032 >
1033 ttaaatctttgtgggatcagggCATTATcttacgtgatcagaataaacaa
1034 >
1035 ttatactttaataagtactttgTATACTtatttgcgaacattccaggccg
1036 >
1037 atataaagccacaacgggttcgTAAACTgttatcccattacatgattatg
1038 >
1039 gaagtcctgtattcagtgctgaCAAAATagccgccagcaagcagtcattt
1040 >
1041 tgataattgttatcgtttgcatTATCGTtacgccgcaatcaaaaaaggct
1042 >
1043 taacatttggattgataattgtTATCGTttgcattatcgttacgccgcaa
1044 >
1045 tggattattctgcatttttgggGAGAATggacttgccgactgattaatga
1046 >
1047 acctcaaactgcgcggctgtgtTATAATttgcgacctttgaatccgggat
1048 >
1049 tgcaagagggtcattttcacacTATCTTgcagtgaatcccaaacataccc
1050 >
1051 atttaatttatgaatgttttctTAACATcgcggcaactcaagaaacggca
1052 >
1053 aaatcacgtttcactttcgaatTATGAGcgaatatgcgcgaaatcaaaca
1054 >
1055 attagctgtataaaagaatttcTACAGTgattgtaaggttttttttattc
1056 >
1057 ccaaagtttcgggctgttatgtTTTAATgtgcaacattcatggtctgttg
1058 >
1059 acgagagttaaccggacaagtgTGCCATaatctcgcggccaggcatactt
1060 >
1061 tgttcggcgtacaagtgtacgcTATTGTgcattcgaaacttactctatgt
1062 >
1063 caacattccagctggtccgaccTATACTctcgccactggtctgatttcta
1064 >
1065 ggcgctacgctcaatgaaacatTTAAATactatacgacagcgacatttat
1066 >
1067 ttgaggaatcaggcgggagtgaTAGAATatcgcccacttaatttttccag
1068 >
1069 tgtcaacgaaaacaataatgcgTAAGGTagaaacccgaactacattgagg
1070 >
1071 tgcgcaatttgtcaacgaaaacAATAATgcgtaaggtagaaacccgaact
1072 >
1073 ttccgcatattctctgagcgggTATGCTacctgttgtatcccaatttcat
1074 >
1075 attcagcctgtcggaactggtaTTTAACcagactaattattttgatgcgc
1076 >
1077 attcagcctgtcggaactggtaTTTAACcagactaattattttgatgcgc
1078 >
1079 ggttcaattcttcctttagcggCATAATgtttaatgacgtacgaaacgtc
1080 >
1081 ttcttcctttagcggcataatgTTTAATgacgtacgaaacgtcagcggtc
1082 >
1083 tggcagttgaccgtggtaatgaTATGATttcacacctttaccagccaatg
1084 >
1085 gcttttaatgccataccaaacgTACCATtgagacacttgtttgcacagag
1086 >
1087 attgttgtatgcatgtttttttTATGCTttccttaagaacaactcacccc
1088 >
1089 cagaactcaatgcacaaggcagTATTAAcgtcgtcaattattcccaacat
1090 >
1091 ttgccgccttgaagaaaggaggTATAATccgtcgattttttttgtggctg
1092 >
1093 cgcaaacgtttgctttccctgtTAGAATtgcgccgaattttatttttcta
1094 >
1095 ccggaagctggttgcgtgaaatTAGAAAtttcgccgctgatccaaacctg
1096 >
1097 gggaagcgcctcgcttcccgtgTATGATtgaacccgcatggctcccgaaa
1098 >
1099 ttcccttcgccatttccttgagCAAACTttagctattcttatcaattatg
1100 >
1101 tgttatcgcacaatgattcggtTATACTgttcgccgttgtccaacaggac
1102 >
1103 ggaatgaattggcgttatgtgtTACGTTtagcagatcaaaagacaggcga
1104 >
1105 ggggcgcaaccggacagaatttTATAAActgctttcccgacacgagctgg
1106 >
1107 ttcgtcagcgcatcagattcttTATAATgacgcccgtttcccccccttgg
1108 >
1109 ttgtagtgtagaatgcggcgttTCTATTaatacagacgttaagctcagaa
1110 >
1111 gaataattgagggatgacctcaTTTAATctccagtagcaactttgatccg
1112 >
1113 gacagcgtgaaaacagtacgggTACTGTactaaagtcacttaaggaaaca
1114 >
1115 ttgaaaactttactttatgtgtTATCGTtacgtcatcctcgctgaggatc
1116 >
1117 ttgaaaccctgaaactgatcccCATAATaagcgaagttagcgagatgaat
1118 >
1119 ggaaatataataagtgatcgctTACACTacgcgacgaaatactttttttg
1120 >
1121 acgcaaataatttgtggtgatcTACACTgatactctgttgcattattcgc
1122 >
1123 tgcattattcgcctgaaaccacAATATTcaggcgttttttcgctatcttt
1124 >
1125 ttgcctcagattctcagtatgtTAGGGTagaaaaaagtgactatttccat
1126 >
1127 ttactttatttgtcactgtcgtTACTATatcggctgaaattaatgaggtc
1128 >
1129 taccttcccagtcaagaaaactTATCTTattcccacttttcagttaccag
1130 >
1131 ttgatactgtatgagcatacagTATAATtgcttcaacagaacatattgac
1132 >
1133 cttttaaatctttcaatctgatTAGATTaggttgccgtttggtaataaaa
1134 >
1135 gcggcagcgtggcggaaggttgTAAACTgcacctcgaagaacaagaggcc
1136 >
1137 tgcgtcgcaaccgacaattacgTATTCTgagtcttcgggtgaacagagtg
1138 >
1139 gttattttgccgcaggtcagcgTATCGTgaacatcttttccagtgttcag
1140 >
1141 tcattcgttctcttacgctcccTATAGTcgaaacatctgatggcaagaaa
1142 >
1143 taatccacaccgtttgccccgtTAACCTtaccttctcttctgttttatgg
1144 >
1145 tgtggcacaggtcatgttcgggTATACTgctttcccgtcttggttattcc
1146 >
1147 aaaacatttaccccaaaggggcTATTTTctcactcctgatttcaatagtg
1148 >
1149 tattacagagcgttttttatttGAAAATgaatccatgagttcatttcaga
1150 >
1151 ggtagaagctcaacggacaattTATAATggctcagattaaaaaaactaat
1152 >
1153 tgcgcaatctatccgcttacttTATGATgcgcaccagtcacggactgatg
1154 >
1155 acacctgcgtgagttgttcacgTATTTTttcactatgtcttactctctgc
1156 >
1157 tccttttattccacgtttcgctTATCCTagctgaagcgtttcagtcgatt
1158 >
1159 gttcgaggcaggtttgtacggtTATACTtatcttgaagatgagtaagtcc
1160 >
1161 aatttcccatacagagctaaggGATAATgcgtagcgttcacgtaactgga
1162 >
1163 tctccaaaatatattcacgttgTAAATTgtttaacgtcaaatttcccata
1164 >
1165 taacaaaaaaccagtccgcgaaGTTGATagaatcccatcatctcgcacgg
1166 >
1167 acaacagtaaaatcagagcgttTCTGCTtttactgatgtctggcggtcgg
1168 >
1169 ttacatcaacccgcattggtccTACACTgcgcggtaataaagcgaggtaa
1170 >
1171 cgcccctggagaaagcctcgtgTATACTcctcacccttataaaagtccct
1172 >
1173 tacaaagcagcagcaattgcagTAAAATtccgcaccattttgaaataagc
1174 >
1175 caccgggcaacttttagagcacTATCGTggtacaaataatgctgccaccc
1176 >
1177 aaaaactgtcgatgtgggacgaTATAGCagataagaatattgctgagcaa
1178 >
1179 gcacatatcctgttcatttcatTTTGATacacttcatgccgtcaatgagg
1180 >
1181 gtcttttgtactcgtgtactggTACAGTgcaatgcataacaacgcagtcg
1182 >
1183 tgcgataacaggtcgctacgagTAGAATactgccgcttaacgtcgcgtaa
1184 >
1185 tgcattttttacccaaaacgagTAGAATttgccacgtttcaggcgcgggg
1186 >
1187 tgacctgtatcagctttcccgaTAAGTTggaaatccgctggaagctttct
1188 >
1189 gtttctcaataacgaaatttgaTAAAATcccgctctttcataacattatt
1190 >
1191 ataaaaattcatctgtatgcacAATAATgttgtatcaaccaccatatcgg
1192 >
1193 tgattatcttccctgataagacCAGTATttagctgccaattgctacgaaa
1194 >
1195 acccatatccttgaagcggtgtTATAATgccgcgccctcgatatggggat
1196 >
1197 ttgcgttcggtggttaagtatgTATAATgcgcgggcttgtcgtagttgac
1198 >
1199 tgacaccttttcggcatcgcccTAAAATtcggcgtcctcatattgtgtga
1200 >
1201 agacacaaagcgaaagctatgcTAAAACagtcaggatgctacagtaatac
1202 >
1203 gccaaacccgctggagtattgaGATAATtttcagtctgactctcgcaata
1204 >
1205 tgacgcgcgcaggtatttagcaTACAAGgagtaccgatttgagagttggt
1206 >
1207 acacctaaaatgctatttctgcGATAATagcaaccgtttcgtgacaggaa
1208 >
1209 attgtatacttaagctgctgttTAATATgctttgtaacaatttaggctga
1210 >
1211 ggaaggtcaacatcgagcctggCAAACTagcgataacgttgtgttgaaaa
1212 >
1213 taacgccacgcttgaggtaacaGAGATTgttttacctgctggggagtggc
1214 >
1215 tttttctgtaattcgagcatgtCATGTTaccccgcgagcataaaacgcgt
1216 >
1217 tgtcatctttctgacaccttacTATCTTacaaatgtaacaaaaaagttat
1218 >
1219 ttttatgctgacaaaggcacttTTTTCTgtttatctatcaataaattcag
1220 >
1221 ttccaatatcataaaaatcgggTATGTTttagcagagtatgctgctaaag
1222 >
1223 ggtctgataaaacagtgaatgaTAACCTcgttgctcttaagctctggcac
1224 >
1225 gaacttgtggataaaatcacggTCTGATaaaacagtgaatgataacctcg
1226 >
1227 gaacttgtggataaaatcacggTCTGATaaaacagtgaatgataacctcg
1228 >
1229 cgcctgaataataaaagcgtgtTATACTctttccctgcaatgggttccgt
1230 >
1231 attgacggatcatccgggtcgcTATAAGgtaaggatggtcttaacactga
1232 >
1233 tgacttatccgcttcgaagagaGACACTacctgcaacaatcaggagcgca
1234 >
1235 tgacgttttcacattctgttgaCAGATTgtaggtcacgaggggcatttta
1236 >
1237 tgcatcacccgccaatgcgtggCTTAATgcacatcaacggtttgacgtac
1238 >
1239 gttttgtttggcttatcgctggCAAACTgtctgaaatcgcagcaataagg
1240 >
1241 ggacagttaaccgattcagtgcCAGATTtcgcagtatctacaaggtccgg
1242 >
1243 tgcggaaaaaacgcgcgcgaggCAGCATtgactttactaggtcgtgcacg
1244 >
1245 cgtcgcgacctataagtttgggTAATATgtgctggaatttgccctgtctg
1246 >
1247 atctcaggcctgatttgctgctGATTTTtacaatgcatgcctcacgcagg
1248 >
1249 ttgaaaagttcatttccagaccCATTTTtacatcgtagccgatgaggacg
1250 >
1251 agatgtttaccgtggaaaagggTAAAATaacggattaacccaagtataaa
1252 >
1253 gcatcaggacgttcgctattacTTAAATggtatgctgtttgaaaccgaag
1254 >
1255 tatgaaatttaccgtagaacgtGAGCATttattaaaaccgctacaacagg
1256 >
1257 tcagaagacggtggcggagtacTACAAGatcaaagtcgcggatctccttt
1258 >
1259 gcaggaaaaactggtcaccatcGACAATattcagaagacggtggcggagt
1260 >
1261 gcgttctttatcgccaagcgtcTACGATctaacgtacgtgagctggaagg
1262 >
1263 cccgcctcgcggcaggatcgttTACACTtagcgagttctggaaagtcctg
1264 >
1265 agacaaaaattggcttaatcgaTCTAATaaagatccaggacgatccttgc
1266 >
1267 ttgcgctttacccatcagcccgTATAATcctccacccggcgcgccatgct
1268 >
1269 tgactccggagtgtacaattatTACAATccggcctctttaatcacccatg
1270 >
1271 gttttttcaaggtgaagcggttTAAATTcgttctcaaattacagtcagga
1272 >
1273 gacaaaaggcgtgacgatggtcGAAAATggcgctttcgtcagcggggata
1274 >
1275 tggcagtctttctgcctaacgtTTTGTTtatgatatttgcctggcgtcac
1276 >
1277 ttgaaatcacgggggcgcaccgTATAATttgaccgctttttgatgcttga
1278 >
1279 gttttcccaactcagtcaggatTAAACTgtgggtcagcgaaacgtttcgc
1280 >
1281 ttatttttaaaaaacaacaattTATATTgaaattattaaacgcatcataa
1282 >
1283 ttgccagcccacggtcggtcgaCTTACTgtttagtcagttaaataaactg
1284 >
1285 ggaaatttattgcggaaattgaTATATTcacaacgtcacattgcaatttt
1286 >
1287 atatatcaatttccgcaataaaTTTCCTgtcatatagtgaattcaatctc
1288 >
1289 tcacattcaaatgcgattctgcTACAATcctccccccgttcgaagattga
1290 >
1291 ggacgcccggcgtgagtcatgcTAACTTagtgttgacttcgtattaaaca
1292 >
1293 ttacggtcaatcagcaaggtgtTAAATTgatcacgttttagaccattttt
1294 >
1295 ttggcatctctgacctcgctgaTATAATcagcaaatctgtatatataccc
1296 >
1297 gaaaaaatgttaaacccttcggTAAAGTgtctttttgcttcttctgacta
1298 >
1299 tgcatatttttaacacaaaataCACACTtcgactcatctggtacgaccag
1300 >
1301 gcgctttttatccgtaaaaagcTATAATgcactaaaatggtgcaacctgt
1302 >
1303 gcaccaacatggtgcttaatgtTTCCATtgaagcactatattggtgcaac
1304 >
1305 ggtaagaacctgacctcgtgatTACTATttcgccgtgttgacgacatcag
1306 >
1307 ttttcaatatcatttaattaacTATAATgaaccaactgcttacgcggcat
1308 >
1309 tctcgtttttgctcgttaacgaTAAGTTtacagcatgcctacaagcatcg
1310 >
1311 attgacgtccattaacacaatgTTTACTctggtgcctgacatttcaccga
1312 >
1313 tttcggttgacgcccttcggctTTTCCTtcatctttacatctggacgtct
1314 >
1315 gttgacacacctctggtcatgaTAGTATcaatattcatgcagtatttatg
1316 >
1317 tttattacgctcaacgttagtgTATTTTtattcataaatactgcatgaat
1318 >
1319 gcgctgaaacagtcaaagcggtTATGTTcatatgcggatggcgatttaca
1320 >
1321 gatagggataatcgttcattgcTATTCTacctatcgccatgaactatcgt
1322 >
1323 tggacatctgatgagcaatcccTACAATcgccgcgtactttaatttttca
1324 >
1325 gacagtaacttgttacaacctgTAGCATccacttgccggtcctgtgagtt
1326 >
1327 tgcatgaactcgcatgtctccaTAGAATgcgcgctacttgatgccgactt
1328 >
1329 gacgcaatgcgcactaaaagggCATCATttgatgccctttttgcacgctt
1330 >
1331 tgcacaaggcgtgagattggaaTACAATttcgcgccttttgtttttatgg
1332 >
1333 ttacgtgggcggtgattttgtcTACAATcttacccccacgtataatgctt
1334 >
1335 tttgactactgctgtgcctttcAATGCTtgtttctatcgacgacttaata
1336 >
1337 ttcgcgagcgttgcgcaaacgtTTTCGTtacaatgcgggcgaaaaataag
1338 >
1339 cgacattggcaaattttctggtTATCTTcagctatctggatgtctaaacg
1340 >
1341 ttgattttgcattttaaatgagTAGTCTtagttgtgctgaacgaaaagag
1342 >
1343 accacagatgcgtttatgccagTATGGTttgttgaatttttattaaatct
1344 >
1345 ttgacaaccgccccgctcacccTTTATTtataaatgtactacctgcgcta
1346 >
1347 tggaaagaggttgccgtataaaGAAACTagagtccgtttaggtgttttca
1348 >
1349 tttaagccatctcctgatgacgCATAGTcagcccatcatgaatgttgctg
1350 >
1351 tccaaaatcgccttttgctgtaTATACTcacagcataactgtatatacac
1352 >
1353 attcattcaggtcaatttgtgtCATAATtaaccgtttgtgatcgccggta
1354 >
1355 gaatgcattacccggagtgttgTGTAACaatgtctggccaggtttgtttc
1356 >
1357 ggtaatggtacaatcgcgcgttTACACTtattcagaacgatttttttcag
1358 >
1359 acctcaagttaacttgaggaatTATACTccccaacagatgaattaacgaa
1360 >
1361 ataaaatgtggcataaaagatgCATACTgtagtcgagagcgcgtatgcgt
1362 >
1363 tgatcacaaatttaaacactggTAGGGTaaaaaggtcattaactgcccaa
1364 >
1365 agtcatcctccctcactcctgcCATAATtctgatattccaggaaagagag
1366 >
1367 ctgtgatctattcagcaaaaatTTAAATaggattatcgcgagggttcaca
1368 >
1369 gtaagcgttagtttcgataagaTAAACTgagttactaatagtcgaggcag
1370 >
1371 ttgaggtaagcgttagtttcgaTAAGATaaactgagttactaatagtcga
1372 >
1373 ggattaatccttttttcgtgagTAATCTtatcgccagtttggtctggtca
1374 >
1375 cggtagaaatcctcaagcagcaTATGATctcgggtattcggtcgatgcag
1376 >
1377 ttgtcacgctgattggtgtcgtTACAATctaacgcatcgccaatgtaaat
1378 >
1379 gtcatgaatccatggcagtgacCATACTaatggtgactgccattgatgga
1380 >
1381 ttttcaaagcgtaaaattgtggCATTCTtcactgttctataagtaagacg
1382 >
1383 ggcattcacaaatgcgcaggggTAAAACgtttcctgtagcaccgtgagtt
1384 >
1385 tttcctgtagcaccgtgagttaTACTTTgtataacttaaggaggtgcaga
1386 >
1387 ttgcgccgcttctgacgatgagTATAATgccggacaatttgccgggagga
1388 >
1389 gccaccgctttcacagaagtggTAGACTtcgttccttatgaagattctct
1390 >
1391 taaggaaaataattcttatttcGATTGTcctttttacccttctcgttcga
1392 >
1393 tggaaacaattttatttccaatTGTAATgataaccattctcatattaata
1394 >
1395 ggcgtttgtatggcaacgttatTATAATtaacagttgctactccatttaa
1396 >
1397 gaacatcgatctcgtcttgtgtTAGAATtctaacatacggttgcaacaac
1398 >
1399 aagtgtgttgcggagtagatgtTAGAATactaacaaactcgcaaggtgaa
1400 >
1401 tcgccgtatcagcgaataacggTATACTgatctgatcatttaaatttgaa
1402 >
1403 ttgcttctggcaacattaagtcTCAAATtttcaaagggtggaagatggct
1404 >
1405 gccagaagcaatggatacaaggTAGCCTcatgcgttattttccctgcttc
1406 >
1407 ttactgatccgcacgtttatgaTATGCTatcgtactctttagcgagtaca
1408 " >
1409 </form>-->
1410
1411
1412 <!--
1413 <hr >
1414 <a name="globins"></a>
1415 <h2>Globins</h2>
1416 <img alt="" src="examples/globins.png" ><br >
1417 The end of the B helix through the beginning of the D helix of 34 globins. This
1418 sequence data was taken from
1419 <a href="http://www.lecb.ncifcrf.gov/~toms/paper/logopaper/">Sequence Logos: A New Way to Display Consensus Sequences</a>.<br ><br >
1420 <form method="post" action="create.cgi">
1421 <input type="submit" name="cmd_edit" value="Edit Logo" >
1422 <input type="hidden" name="logo_start" value="61" >
1423 <input type="hidden" name="logo_end" value="83" >
1424 <input type="hidden" name="show_xaxis" value="true" >
1425 <input type="hidden" name="show_yaxis" value="true" >
1426 <input type="hidden" name="show_errorbars" value="true" >
1427 <input type="hidden" name="show_fineprint" value="true" >
1428 <input type="hidden" name="scale_width" value="true" >
1429 <input type="hidden" name="sequences" value="
1430 >Lamprey GLOBIN V - SEA LAMPREY
1431 PIVDTGSVA-P------------------LSAAEKTKIRSAWAPVYSTY---ETSGVDILVKFFTSTPAAQEFFPKFKGL
1432 TT-----ADQLKKSA---DVRWHA-ERIINAVNDAVASMDDTEKMS--MKL-RDLSGKH----AKSFQV-----DPQYFK
1433 VLAAVI-AD-TVAAGD--AGFEKLMSM------I---CILLR----S-----A-----Y------------
1434 >Hagfish GLOBIN III - ATLANTIC HAGFISH
1435 PITDHGQPP-T------------------LSEGDKKAIRESWPQIYKNF---EQNSLAVLLEFLKKFPKAQDSFPKFSAK
1436 KS-------HLEQDP---AVKLQA-EVIINAVNHTIGLMDKEAAMK--KYL-KDLSTKH----STEFQV-----NPDMFK
1437 ELSAVF-VS-TMG-GK--AAYEKLFSI------I---ATLLR----S-----T-----YDA----------
1438 >Frog HEMOGLOBIN BETA CHAIN - EDIBLE FROG
1439 ----------GS-----------------------DLVSGFWGKV--DA---HKIGGEALARLLVVYPWTQRYFTTFGNL
1440 GSADAIC-----HNA---KVLAHG-EKVLAAIGEGLKHPENLKAHY--AKL-SEYHSNK----LHVDPANFRLLGNVFIT
1441 VLARHF-QH-EFTPELQ-HALEAHFCA------V---GDALA----K-----A-----YH-----------
1442 >African Elephant HEMOGLOBIN BETA CHAIN - AFRICAN ELEPHANT
1443 ----------VN-----------------LTAAEKTQVTNLWGKV--NV---KELGGEALSRLLVVYPWTRRFFEHFGDL
1444 STAEAVL-----HNA---KVLAHG-EKVLTSFGEGLKHLDNLKGTF--ADL-SELHCDK----LHVDPENFRLLGNVLVI
1445 VLARHF-GK-EFTPDVQ-AAYEKVVAG------V---ANALA----H-----K-----YH-----------
1446 >Goat HEMOGLOBIN BETA-A CHAIN - GOAT
1447 ----------M------------------LTAEEKAAVTGFWGKV--KV---DEVGAEALGRLLVVYPWTQRFFEHFGDL
1448 SSADAVM-----NNA---KVKAHG-KKVLDSFSNGMKHLDDLKGTF--AQL-SELHCDK----LHVDPENFKLLGNVLVV
1449 VLARHH-GS-EFTPLLQ-AEFQKVVAG------V---ANALA----H-----R-----YH-----------
1450 >Primate HEMOGLOBIN BETA CHAIN - HUMAN, CHIMPANZEES, AND GORILLA
1451 ----------VH-----------------LTPEEKSAVTALWGKV--NV---DEVGGEALGRLLVVYPWTQRFFESFGDL
1452 STPDAVM-----GNP---KVKAHG-KKVLGAFSDGLAHLDNLKGTF--ATL-SELHCDK----LHVDPENFRLLGNVLVC
1453 VLAHHF-GK-EFTPPVQ-AAYQKVVAG------V---ANALA----H-----K-----YH-----------
1454 >Gibbon HEMOGLOBIN BETA CHAIN - COMMON GIBBON (TENTATIVE SEQUENCE)
1455 ----------VH-----------------LTPEEKSAVTALWGKV--NV---DEVGGEALGRLLVVYPWTQRFFESFGDL
1456 STPDAVM-----GNP---KVKAHG-KKVLGAFSDGLAHLDNLKGTF--AQL-SELHCDK----LHVDPENFRLLGNVLVC
1457 VLAHHF-GK-EFTPQVQ-AAYQKVVAG------V---ANALA----H-----K-----YH-----------
1458 >Dog HEMOGLOBIN BETA CHAIN - DOG AND COYOTE
1459 ----------VH-----------------LTAEEKSLVSGLWGKV--NV---DEVGGEALGRLLIVYPWTQRFFDSFGDL
1460 STPDAVM-----SNA---KVKAHG-KKVLNSFSDGLKNLDNLKGTF--AKL-SELHCDK----LHVDPENFKLLGNVLVC
1461 VLAHHF-GK-EFTPQVQ-AAYQKVVAG------V---ANALA----H-----K-----YH-----------
1462 >Horse HEMOGLOBIN BETA CHAIN - HORSE
1463 ----------VQ-----------------LSGEEKAAVLALWDKV--NE---EEVGGEALGRLLVVYPWTQRFFDSFGDL
1464 SNPGAVM-----GNP---KVKAHG-KKVLHSFGEGVHHLDNLKGTF--AAL-SELHCDK----LHVDPENFRLLGNVLVV
1465 VLARHF-GK-DFTPELQ-ASYQKVVAG------V---ANALA----H-----K-----YH-----------
1466 >Human, Chimp HEMOGLOBIN GAMMA CHAINS - HUMAN AND CHIMPANZEE
1467 ----------GH-----------------FTEEDKATITSLWGKV--NV---EDAGGETLGRLLVVYPWTQRFFDSFGNL
1468 SSASAIM-----GNP---KVKAHG-KKVLTSLGDAIKHLDDLKGTF--AQL-SELHCDK----LHVDPENFKLLGNVLVT
1469 VLAIHF-GK-EFTPEVQ-ASWQKMVTA------V---ASALS----S-----R-----YH-----------
1470 >Nile Crocodile HEMOGLOBIN BETA CHAIN - NILE CROCODILE
1471 ----------AS-----------------FDPHEKQLIGDLWHKV--DV---AHCGGEALSRMLIVYPWKRRYFENFGDI
1472 SNAQAIM-----HNE---KVQAHG-KKVLASFGEAVCHLDGIRAHF--ANL-SKLHCEK----LHVDPENFKLLGDIIII
1473 VLAAHY-PK-DFGLECH-AAYQKLVRQ------V---AAALA----A-----E-----YH-----------
1474 >Chicken HEMOGLOBIN BETA CHAIN - CHICKEN
1475 ----------VH-----------------WTAEEKQLITGLWGKV--NV---AECGAEALARLLIVYPWTQRFFASFGNL
1476 SSPTAIL-----GNP---MVRAHG-KKVLTSFGDAVKNLDNIKNTF--SQL-SELHCDK----LHVDPENFRLLGDILII
1477 VLAAHF-SK-DFTPECQ-AAWQKLVRV------V---AHALA----R-----K-----YH-----------
1478 >NA Opossum HEMOGLOBIN BETA CHAIN - NORTH AMERICAN OPOSSUM
1479 ----------VH-----------------LTSEEKNCITTIWSKV--QV---DQTGGEALGRMLVVYPWTTRFFGSFGDL
1480 SSPGAVM-----SNS---KVQAHG-AKVLTSFGEAVKHLDDLKGTY--AKL-SELHCDK----LHVDPENFKMLG-IIVI
1481 CLAEHF-GK-DFTPECV-A--WKLVAG------V---AHALA----H-----K-----YH-----------
1482 >Carp HEMOGLOBIN BETA CHAINS - CARP
1483 ----------VE-----------------WTDAERSAIIALWGKL--NP---DELGPEALARCLIVYPWTQRFFASYGNL
1484 SSPAAIM-----GNP---KVAAHG-RTVEGGLMRAIKDMDNIKATY--APL-SVMHSEK----LHVDPDNFRLLADCITV
1485 CAAMKFGPS-GFSPNVQ-EAWQKFLSV------V---VNALK----R-----Q-----YH-----------
1486 >Shark HEMOGLOBIN BETA CHAIN - PORT JACKSON SHARK
1487 ----------VH-----------------WSEVELHEITTTWKSI--DK---HSLGAKALARMFIVYPWTTRYFGNLKEF
1488 TA----------CSY---GVKEHA-KKVTGALGVAVTHLGDVKSQF--TDL-SKKHAEE----LHVDVESFKLLAKCFVV
1489 ELGILL-KD-KFAPQTQ-AIWEKYFGV------V---VDAIS----K-----E-----YH-----------
1490 >Shark HEMOGLOBIN ALPHA CHAIN - PORT JACKSON SHARK
1491 ----------S-TSTSTSD----------YSAADRAELAALSKVLAQNA---EAFGAEALARMFTVYAATKSYFKDYKDF
1492 TA----------AAP---SIKAHG-AKVVTALAKACDHLDDLKTHL--HKL-ATFHGSE----LKVDPANFQYLSYCLEV
1493 ALAVHL--T-EFSPETH-CALDKFLTN------V---CHELS----S-----R-----YR-----------
1494 >Carp HEMOGLOBIN ALPHA CHAIN - CARP
1495 ----------S------------------LSDKDKAAVKIAWAKISPKA---DDIGAEALGRMLTVYPQTKTYFAHWADL
1496 SP----------GSG---PVKHGK-KVIMGAVGDAVSKIDDLVGGL--ASL-SELHASK----LRVDPANFKILANHIVV
1497 GIMFYL-PG-DFPPEVH-MSVDKFFQN------L---ALALS----E-----K-----YR-----------
1498 >Bullfrog HEMOGLOBIN ALPHA CHAIN - BULLFROG TADPOLE
1499 ----------S------------------LSASEKAAVLSIVGKIGSQG---SALGSEALTRLFLSFPQTKTYFPHF-DL
1500 TP----------GSA---DLNTHG-GKIINALAGAANHLDDLAGNL--SSL-SDLHAYN----LRVDPGNFPLLAHIIQV
1501 VLATHF-PG-DFTAEVQ-AAWDKFLAL------V---SAVLT----S-----K-----YR-----------
1502 >Nile Crocodile HEMOGLOBIN ALPHA CHAIN - NILE CROCODILE
1503 ----------V------------------LSSDDKCNVKAVWSKVAGHL---EEYGAEALERMFCAYPQTKIYFPHF-DL
1504 SH----------GSA---QIRAHG-KKVFAALHEAVNHIDDLPGAL--CRL-SELHAHS----LRVDPVNFKFLAQCVLV
1505 VVAIHH-PG-SLTPEVH-ASLDKFLCA------V---SSVLT----S-----K-----YR-----------
1506 >Ostrich HEMOGLOBIN ALPHA CHAIN - OSTRICH
1507 ----------V------------------LSGTDKTNVKGIFSKISSHA---EEYGAETLERMFITYPQTKTYFPHF-DL
1508 HH----------GSA---QIKAHG-KKVANALIEAVNHIDDISGAL--SKL-SDLHAQK----LRVDPVNFKLLGQCFLV
1509 VVAIHH-PS-ALTPEVH-ASLDKFLCA------V---GAVLT----A-----K-----YR-----------
1510 >Kangaroo HEMOGLOBIN ALPHA CHAIN - EASTERN GRAY KANGAROO
1511 ----------V------------------LSAADKGHVKAIWGKVGGHA---GEYAAEGLERTFHSFPTTKTYFPHF-DL
1512 SH----------GSA---QIQAHG-KKIADALGQAVEHIDDLPGTL--SKL-SDLHAHK----LRVDPVNFKLLSHCLLV
1513 TFAAHL-GD-AFTPEVH-ASLDKFLAA------V---STVLT----S-----K-----YR-----------
1514 >Armadillo HEMOGLOBIN ALPHA CHAIN - NINE-BANDED ARMADILLO
1515 ----------V------------------LSAADKTHVKAFWGKVGGHA---AEFGAEALERMFASFPPTKTYFSHM-DL
1516 SH----------GSA---QVKAHG-KKVADALTLAVGHLDDLPGAL--STL-SDLHAHK----LRVDPVNFKFLSHCLLV
1517 TLACHL-PD-DFTPAVH-ASMDKFMAG------V---STVLV----S-----K-----YR-----------
1518 >Horse HEMOGLOBIN ALPHA CHAINS - HORSE
1519 ----------V------------------LSAADKTNVKAAWSKVGGHA---GEYGAEALERMFLGFPTTKTYFPHF-DL
1520 SH----------GSA---QVKAHG-KKVGDALTLAVGHLDDLPGAL--SNL-SDLHAHK----LRVDPVNFKLLSHCLLS
1521 TLAVHL-PN-DFTPAVH-ASLDKFLSS------V---STVLT----S-----K-----YR-----------
1522 >Primate HEMOGLOBIN ALPHA CHAIN - HUMAN AND CHIMPANZEES
1523 ----------V------------------LSPADKTNVKAAWGKVGAHA---GEYGAEALERMFLSFPTTKTYFPHF-DL
1524 SH----------GSA---QVKGHG-KKVADALTNAVAHVDDMPNAL--SAL-SDLHAHK----LRVDPVNFKLLSHCLLV
1525 TLAAHL-PA-EFTPAVH-ASLDKFLAS------V---STVLT----S-----K-----YR-----------
1526 >Macaque HEMOGLOBIN ALPHA CHAIN - RHESUS MACAQUE AND JAPANESE MACAQUE
1527 ----------V------------------LSPADKSNVKAAWGKVGGHA---GEYGAEALERMFLSFPTTKTYFPHF-DL
1528 SH----------GSA---QVKGHG-KKVADALTLAVGHVDDMPNAL--SAL-SDLHAHK----LRVDPVNFKLLSHCLLV
1529 TLAAHL-PA-EFTPAVH-ASLDKFLAS------V---STVLT----S-----K-----YR-----------
1530 >Badger HEMOGLOBIN ALPHA CHAIN - EURASIAN BADGER
1531 ----------V------------------LSPADKANIKATWDKIGGHA---GEYGGEALERTFASFPTTKTYFPHF-DL
1532 SH----------GSA---QVKGHG-KKVADALTNAVAHLDDLPGAL--SAL-SDLHAYK----LRVDPVNFKLLSHCLLV
1533 TLACHH-PA-EFTPAVH-ASLDKFLSS------V---STVLT----S-----K-----YR-----------
1534 >Ind Elephant HEMOGLOBIN ALPHA CHAIN - INDIAN ELEPHANT
1535 ----------V------------------LSDKDKTNVKATWSKVGDHA---SDYVAEALERMFFSFPTTKTYFPHF-DL
1536 SH----------GSG---QVKGHG-KKVGEALTQAVGHLDDLPSAL--SAL-SDLHAHK----LRVDPVNFKLLSHCLLV
1537 TLSSHQ-PT-EFTPEVH-ASLDKFLSN------V---STVLT----S-----K-----YR-----------
1538 >Hyrax HEMOGLOBIN ALPHA CHAIN - ABYSSINIAN HYRAX
1539 ----------V------------------LSAADKNNVKGAWEKVGTHA---GEYGAEALERMFLSFPTTKTYFPHF-DL
1540 TH----------GSA---QVKAHG-QKVGAALTKAVGHLDDLPNAL--SDL-SDLHAHK----LRVDPVNFKLLSHCLLV
1541 TLSRHL-PEQEFTPAVH-ASLDKFFSN------V---STVLT----S-----K-----YR-----------
1542 >Tuna MYOGLOBIN - YELLOWFIN TUNA
1543 ----------A----------------------DFDAVLKCWGPVEADY---TTMGGLVLTRLFKEHPETQKLFPKFAGI
1544 -A-----QADIAGNA---AISAHG-ATVLKKLGELLKAKGSHAAIL--KPL-ANSHATK----HKIPINNFKLISEVLVK
1545 VMHEK---A-GLDAGGQ-TALRNVMGI------I---IADLE----ANYKELG-----FSG----------
1546 >Shark MYOGLOBIN - PORT JACKSON SHARK
1547 ----------T----------------------EWEHVNKVWAVVEPDI---PAVGLAILLRLFKEHKETKDLFPKFKEI
1548 -P-----VQQLGNNE---DLRKHG-VTVLRALGNILKQKGKHSTNV--KEL-ADTHINK----HKIPPKNFVLITNIAVK
1549 VLTEMY-PS-DMTGPMQ-ESFSKVFTV------I---CSDLE----TLYKEAN-----FQG----------
1550 >Turtle MYOGLOBIN - MAP TURTLE
1551 ----------G------------------LSDDEWHHVLGIWAKVEPDL---SAHGQEVIIRLFQVHPETQERFAKFKNL
1552 KT-----IDELRSSE---EVKKHG-TTVLTALGRILKLKNNHEPEL--KPL-AESHATK----HKIPVKYLEFICEIIVK
1553 VIAEKH-PS-DFGADSQ-AAMRKALEL------F---RNDMA----SKYKEFG-----FQG----------
1554 >Chicken MYOGLOBIN - CHICKEN
1555 ----------G------------------LSDQEWQQVLTIWGKVEADI---AGHGHEVLMRLFHDHPETLDRFDKFKGL
1556 KT-----EPDMKGSE---DLKKHG-QTVLTALGAQLKKKGHHEADL--KPL-AQTHATK----HKIPVKYLEFISEVIIK
1557 VIAEKH-AA-DFGADSQ-AAMKKALEL------F---RDDMA----SKYKEFG-----FQG----------
1558 >Dog MYOGLOBIN - DOG, BAT-EARED FOX, AFRICAN HUNTING DOG, AND CAPE FOX
1559 ----------G------------------LSDGEWQIVLNIWGKVETDL---AGHGQEVLIRLFKNHPETLDKFDKFKHL
1560 KT-----EDEMKGSE---DLKKHG-NTVLTALGGILKKKGHHEAEL--KPL-AQSHATK----HKIPVKYLEFISDAIIQ
1561 VLQSKH-SG-DFHADTE-AAMKKALEL------F---RNDIA----AKYKELG-----FQG----------
1562 >Badger MYOGLOBIN - EURASIAN BADGER
1563 ----------G------------------LSDGEWQLVLNVWGKVEADL---AGHGQEVLIRLFKGHPETLEKFDKFKHL
1564 KS-----EDEMKGSE---DLKKHG-NTVLTALGGILKKKGHQEAEL--KPL-AQSHATK----HKIPVKYLEFISDAIAQ
1565 VLQSKH-PG-NFAAEAQ-GAMKKALEL------F---RNDIA----AKYKELG-----FQG----------
1566 >Dolphin MYOGLOBIN - SADDLEBACK DOLPHIN
1567 ----------G------------------LSDGEWQLVLNVWGKVEADV---AGHGQDILIRLFKGHPETLEKFDKFKHL
1568 KT-----EADMKASE---DLKKHG-DTVLTALGAILKKKGHHDAEL--KPL-AQSHATK----HKIPIKYLEFISEAIIH
1569 VLHSRH-PA-QFGADAQ-GAMNKALEL------F---RKDIA----AKYKELG-----FHG----------
1570 >Horse, Zebra MYOGLOBIN - HORSE AND PLAINS ZEBRA
1571 ----------G------------------LSDGEWQQVLNVWGKVEADI---AGHGQEVLIRLFTGHPETLEKFDKFKHL
1572 KT-----EAEMKASE---DLKKHG-TVVLTALGGILKKKGHHEAEL--KPL-AQSHATK----HKIPIKYLEFISDAIIH
1573 VLHSKH-PG-NFGADAQ-GAMTKALEL------F---RNDIA----AKYKELG-----FQG----------
1574 >African Elephant MYOGLOBIN - AFRICAN ELEPHANT
1575 ----------G------------------LSDGEWELVLKTWGKVEADI---PGHGEFVLVRLFTGHPETLEKFDKFKHL
1576 KT-----EGEMKASE---DLKKQG-VTVLTALGGILKKKGHHEAEI--QPL-AQSHATK----HKIPIKYLEFISDAIIH
1577 VLQSKH-PA-EFGADAQ-AAMKKALEL------F---RNDIA----AKYKELG-----FQG----------
1578 >Aardvark MYOGLOBIN - AARDVARK
1579 ----------G------------------LSDAEWQLVLNVWGKVEADI---PGHGQDVLIRLFKGHPETLEKFDRFKHL
1580 KT-----EDEMKASE---DLKKHG-TTVLTALGGILKKKGQHEAEI--QPL-AQSHATK----HKIPVKYLEFISEAIIQ
1581 VIQSKH-SG-DFGADAQ-GAMSKALEL------F---RNDIA----AKYKELG-----FQG----------
1582 >Human MYOGLOBIN - HUMAN
1583 ----------G------------------LSDGEWQLVLNVWGKVEADI---PGHGQEVLIRLFKGHPETLEKFDKFKHL
1584 KS-----EDEMKASE---DLKKHG-ATVLTALGGILKKKGHHEAEI--KPL-AQSHATK----HKIPVKYLEFISECIIQ
1585 VLQSKH-PG-DFGADAQ-GAMNKALEL------F---RKDMA----SNYKELG-----FQG----------
1586 >Macaque MYOGLOBIN - CRAB-EATING MACAQUE (TENTATIVE SEQUENCE)
1587 ----------G------------------LSDGEWQLVLNVWGKVEADI---PSHGQEVLIRLFKGHPETLEKFDKFKHL
1588 KS-----EDEMKASE---DLKKHG-VTVLTALGGILKKKGHHEAEI--KPL-AQSHATK----HKIPVKYLELISESIIQ
1589 VLQSKH-PG-DFGADAQ-GAMNKALEL------F---RNDMA----AKYKELG-----FQG----------
1590 >NA Opossum MYOGLOBIN - NORTH AMERICAN OPOSSUM
1591 ----------G------------------LSDGEWQLVLNAWGKVEADI---PGHGQEVLIRLFKGHPETLEKFDKFKHL
1592 KS-----EDEMKASE---DLKKHG-ATVLTALGNILKKKGNHEAEL--KPL-AQSHATK----HKISVQFLEFISEAIIQ
1593 VIQSKH-PG-DFGGDAQ-AAMGKALEL------F---RNDMA----AKYKELG-----FQG----------
1594 >Earthworm GLOBIN AIII - COMMON EARTHWORM
1595 ---------KK------------------QCGVLEGLKVKSEWGRAYGS---GHDREAFSQAIWRATFAQVPESRSLFKR
1596 VH-----GDH-TSDP---AFIAHA-ERVLGGLDIAISTLDQPATLK--EEL-DHLQVQHEG--RKIPDNYFDAFKTAILH
1597 VVAAQL-GE-RCYSNN--EEIHDAIACDGFARVL---PQVLE----R-----G-----IKGHH--------
1598 > SMALL CHAIN - TYLORRHYNCHUS HETEROCHAETUS
1599 ----------T------------------DCGILQRIKVKQQWAQVYSV---GESRTDFAIDVFNNFFRTNPD-RSLFNR
1600 VN-----GDN-VYSP---EFKAHM-VRVFAGFDILISVLDDKPVLD--QAL-AHYAAFH----KQFGTIPFKAFGQTMFQ
1601 TIAEHI--------HG--ADIGAWRAC------Y---AEQIV----T-----G-----ITA----------
1602 >BloodwormGLOBIN, MAJOR MONOMERIC COMPONENT - BLOODWORM
1603 ----------G------------------LSAAQRQVIAATWKDIAGND---NGAGVGKDCLI--KHLSAHPQMAAVFGF
1604 SG-----ASD-PAVA---DLGAKV-LAIGVAVSHLGDGKMVAQMKA--VGV-RHKGYGN----KHIKGQYFEPLGASLLS
1605 AMEHRI-GG-KMNAAA-KDAWAAAYAD------I---SGALI----S-----G-----LQS----------
1606 >Whelk GLOBIN - WHELK
1607 ----------G------------------LDGAQKTALKESWKVLGADGPTMMKNGSLLFGLLFKTYPDTKKHFKHFDDA
1608 TF-----AAM-DTTG---VGKAHG-VAVFSGLGSMICSIDDDDCV---GLA-KKLSRNH--LARGVSAADF-KLLEAVFK
1609 FLDEAT-QR-KATDAQ-KDADGALLTM------L---IKA------------H-----V------------
1610 >Snail GLOBIN - WATER SNAIL
1611 ----------S------------------LQPASKSALASSWKTLAKDAATIQNNGATLFSLLFKQFPDTRNYFTHFGNM
1612 SD-----AEM-KTTG---VGKAHS-MAVFAGIGSMIDSMDDADCMN--GLA-LKLSRNH--IQRKIGASRFGEMRQVFPN
1613 FLDEAL-GG-GASGDV-KGAWDALLAY------LQDNKQA------------Q-----A----L-------
1614 >Clam GLOBIN I - BLOOD CLAM
1615 ----------P--------SVQGAAAQ--LTADVKKDLRDSWKVIGSDK---KGNGVALMTTLFADNQETIGYFKRLGNV
1616 SQ-----GM---AND---KLRGHS-ITLMYALQNFIDQLDNTDDLV--CVV-EKFAVNH--ITRKISAAEFGKINGP---
1617 -IKKVL-AS-KNFGDK-YANAWAKLVA------V---VQA------------A-----L------------
1618 >Midge larvaGLOBIN CTT-II BETA - MIDGE LARVA
1619 ----------A------------------PLSADEASLV---RGSWAQV---KHSEVDILYYIFKANPDIMAKFPQFAGK
1620 DL-----ETL-KGTGQFATHAGRI-VGFVSEIVALMGNSANMPAME--TLI-KDMAANH--KARGIPKAQFNEFRASLVS
1621 YLQSKV----SWNDSL-GAAWTQGLDN------V---FNMMF----S-----Y-----L------------
1622 >Midge larva GLOBINS CTT-I AND CTT-IA - MIDGE LARVA
1623 ----------G------------------P-SGDQIAAA---KASWNTV---KNNQVDILYAVFKANPDIQTAFSQFAGK
1624 DL-----DSI-KGTPDFSKHAGRV-VGLFSEVMDLLGNDANTPTIL--AKA-KDFGKSH--KSRASP-AQLDNFRKSLVV
1625 YLKGAT----KWDSAV-ESSWAPVLDF------V---FSTLK----N-----E-----L------------
1626 >Bacteria BACTERIAL HEMOGLOBIN - VITREOSCILLA SP
1627 -----------------------------MLDQQTINII---KATVPVL---KEHGVTITTTFYKNLFAKHPEVRPLFDM
1628 GR-----Q---ESLEQ-------P-KALAMTVLAAAQNIENLPAIL--PAV-KKIAVKH--CQAGVAAAHYPIVGQELLG
1629 AIKEVL-GD-AATDDI-LDAWGKAYGV------I---ADVFI----Q-----VEADLYA-----Q-AVE--
1630 >P andersonii ONLEGUME HEMOGLOBIN I - PARASPONIA ANDERSONII
1631 ----------V----------------NKVFTEEQEALV---VKAWAVM---KKNSAELGLQFLK-IFEIAPSAKNLFSY
1632 LK-----DSP-VPLEQNPKLKPHA-TTFVMTTESAVQLRKAGKVTVK-ESDLKRIGAIH--FKTGVVNEHFEVTRFALLE
1633 TIKEAV-PE-MWSPEM-KNAWGVAYDQ------L---VAAIK----F-----E-----M-----KPSST--
1634 >Yellow Lupin LEGHEMOGLOBIN I - YELLOW LUPIN
1635 ----------G------------------VLTDVQVALV---KSSFEEF---NANIPKNTHRFFTLVLEIAPGAKDLFSF
1636 LK-----GSS-EVPQNNPDLQAHAGKVFKLTYEAAIQLEVNGAVAS--DATLKSLGSVH--VSKGVVDAHFPVVKEAILK
1637 TIKEVV-GD-KWSEEL-NTAWTIAYDE------L---AIIIK----K-----E-----M-----K-DAA--
1638 >Garden Pea LEGHEMOGLOBIN I - GARDEN PEA
1639 ----------G-------------------FTDKQEALV---NSSSE-F---KQNLPGYSILFYTIVLEKAPAAKGLFSF
1640 LK-----DTA-GVE-DSPKLQAHAEQVFGLVRDSAAQLRTKGEVVL-GNATL---GAIH--VQKGVTNPHFVVVKEALLQ
1641 TIKKAS-GN-NWSEEL-NTAWEVAYDG------L---ATAIKKAMKT---------------------A--
1642 >Broad Bean LEGHEMOGLOBIN I - BROAD BEAN
1643 ----------G-------------------FTEKQEALV---NSSSQLF---KQNPSNYSVLFYTIILQKAPTAKAMFSF
1644 LK-----DSA-GVV-DSPKLGAHAEKVFGMVRDSAVQLRATGEVVL--DGKD---GSIH--IQKGVLDPHFVVVKEALLK
1645 TIKEAS-GD-KWSEEL-SAAWEVAYDG------L---ATAIK----A---------------------A--
1646 >Soybean LEGHEMOGLOBIN C1 - SOYBEAN
1647 ----------G------------------AFTEKQEALV---SSSFEAF---KANIPQYSVVFYNSILEKAPAAKDLFSF
1648 LA-----NGV-DPT--NPKLTGHAEKLFALVRDSAGQLKTNGTVVA--DAAL---VSIH--AQKAVTDPQFVVVKEALLK
1649 TIKEAV-GG-NWSDEL-SSAWEVAYDE------L---AAAIK----K---------------------A--
1650 >Kidney Bean LEGHEMOGLOBIN A - KIDNEY BEAN
1651 ----------G------------------AFTEKQEALV---NSSWEAF---KGNIPQYSVVFYTSILEKAPAAKNLFSF
1652 LA-----NGV-DPT--NPKLTAHAESLFGLVRDSAAQLRANGAVVA--DAAL---GSIH--SQKGVSNDQFLVVKEALLK
1653 TLKQAV-GD-KWTDQL-STALELAYDE------L---AAAIK----K---------------------AYA
1654 " >
1655 </form>
1656 <br >
1657 <br >-->
1658
1659 <!--
1660
1661
1662 <hr >
1663 <a name="HTH"></a>
1664 <h2>HTH Proteins</h2>
1665 <img alt="" src="examples/hth.png" > <br >
1666 Helix-Turn-Helix DNA binding motifs found by the
1667 Gibbs
1668 sampling system. Compared to the <a href="#CAP_HTH">CAP HTH logo</a>
1669 there is much less sequence conservation within the DNA binding helix (11-17),
1670 as might be expected for a diverse sample of proteins.
1671 <form method="post" action="create.cgi">
1672 <input type="submit" name="cmd_edit" value="Edit Logo" >
1673 <input type="hidden" name="logo_title" value ="Helix-Turn-Helix Motifs" >
1674 <input type="hidden" name="first_index" value ="-11" >
1675 <input type="hidden" name="logo_start" value ="1" >
1676 <input type="hidden" name="logo_end" value ="17" >
1677 <input type="hidden" name="yaxis_scale" value ="2.0" >
1678 <input type="hidden" name="show_xaxis" value="true" >
1679 <input type="hidden" name="show_yaxis" value="true" >
1680 <input type="hidden" name="show_errorbars" value="true" >
1681 <input type="hidden" name="show_fineprint" value="true" >
1682 <input type="hidden" name="scale_width" value="true" >
1683 <input type="hidden" name="sequences" value=">A25944 DNA-directed RNA polymerase sigma-37 chain - Bacillu 223-240
1684 iidltyiqnk SQKETGDILGISQMHVSR lqrkavkklr
1685 >A28627 spoIIIC protein - Bacillus subtilis 94-111
1686 rfgldlkkek TQREIAKELGISRSYVSR iekralmkmf
1687 >A32837 *Transcriptional activator nahR - Pseudomonas putida 22-39
1688 vvfnqllvdr RVSITAENLGLTQPAVSN alkrlrtslq
1689 >A23450 Antennapedia homeotic protein - Fruit fly (Drosophil 326-343
1690 fhfnryltrr RRIEIAHALCLTERQIKI wfqnrrmkwk
1691 >B26499 Regulatory protein ntrC - Bradyrhizobium sp. 449-466
1692 ltaalaatrg NQIRAADLLGLNRNTLRK kirdldiqvy
1693 >BVECDA dicA protein - Escherichia coli | 1551.0 1.0 1.0 1.0 22-39
1694 iryrrknlkh TQRSLAKALKISHVSVSQ wergdseptg
1695 >C29010 Mercuric resistance operon regulatory merD protein - 5-22
1696 ------mnay TVSRLALDAGVSVHIVRD yllrgllrpv
1697 >DNECFS DNA-binding protein fis - Escherichia coli | 928.0 1 73-90
1698 ldmvmqytrg NQTRAALMMGINRGTLRK klkkygmn--
1699 >JEBY1 Mating hormone a1 - Yeast (Saccharomyces cerevisiae) 99-116
1700 frrkqslnsk EKEEVAKKCGITPLQVRV wfinkrmrsk
1701 >QCBP2L Regulatory protein cII - Phage lambda | 1559.0 2.0 1 25-42
1702 sallnkiaml GTEKTAEAVGVDKSQISR wkrdwipkfs
1703 >QRECC cAMP receptor protein (CAP) - Escherichia coli | 1507 169-186
1704 thpdgmqiki TRQEIGQIVGCSRETVGR ilkmledqnl
1705 >RCBPL Regulatory protein cro - Phage lambda | 1555.0 1.0 1. 15-32
1706 itlkdyamrf GQTKTAKDLGVYQSAINK aihagrkifl
1707 >RGBP22 Regulatory protein cro - Phage P22 | 1556.0 1.0 1.0 12-29
1708 ykkdvidhfg TQRAVAKALGISDAAVSQ wkevipekda
1709 >RGECA Arabinose operon regulatory protein - Escherichia col 196-213
1710 isdhladsnf DIASVAQHVCLSPSRLSH lfrqqlgisv
1711 >RGECF Regulatory protein fnr - Escherichia coli | 1507.0 1. 196-213
1712 fsprefrltm TRGDIGNYLGLTVETISR llgrfqksgm
1713 >RGECH Heat shock regulatory protein - Escherichia coli | 30 252-269
1714 arwldednks TLQELADRYGVSAERVRQ leknamkklr
1715 >RGKBCP Nitrogen assimilation regulatory protein - Klebsiell 444-461
1716 lttalrhtqg HKQEAARLLGWGRNTLTR klkelgme--
1717 >RPECCT cyt repressor - Escherichia coli | 1291.0 3.0 1.0 1. 11-28
1718 mkakkqetaa TMKDVALKAKVSTATVSR almnpdkvsq
1719 >RPECDO Deo operon repressor - Escherichia coli | 1536.0 1.0 23-40
1720 lqelkrsdkl HLKDAAALLGVSEMTIRR dlnnhsapvv
1721 >RPECG gal repressor - Escherichia coli | 1291.0 4.0 1.0 1.0 3-20
1722 --------ma TIKDVARLAGVSVATVSR vinnspkase
1723 >RPECL lac repressor - Escherichia coli | 1291.0 2.0 1.0 1.0 5-22
1724 ------mkpv TLYDVAEYAGVSYQTVSR vvnqashvsa
1725 >RPECTN TetR repressor - Escherichia coli transposon Tn10 | 26-43
1726 llnevgiegl TTRKLAQKLGVEQPTLYW hvknkralld
1727 >RPECW trp repressor - Escherichia coli | 1534.0 1.0 1.0 1.0 67-84
1728 iveellrgem SQRELKNELGAGIATITR gsnslkaapv
1729 >S02513 Regulatory protein nifA - Klebsiella pneumoniae 495-512
1730 liaalekagw VQAKAARLLGMTPRQVAY riqimditmp
1731 >S07337 *spoIIG protein - Bacillus subtilis 205-222
1732 rfglvgeeek TQKDVADMMGISQSYISR lekriikrlr
1733 >S07958 *DNA-invertase - Escherichia coli 160-177
1734 qagrliaagt PRQKVAIIYDVGVSTLYK tfpagdk---
1735 >S08477 Regulatory protein purR - Escherichia coli 3-20
1736 --------ma TIKDVAKRANVSTTTVSH vinktrfvae
1737 >S09205 *ebgR protein - Escherichia coli 3-20
1738 --------ma TLKDIAIEAGVSLATVSR vlnddptlnv
1739 >S11945 *lexA repressor - Escherichia coli 27-44
1740 dhisqtgmpp TRAEIAQRLGFRSPNAAE ehlkalarkg
1741 >Z1BPC2 Regulatory protein cI - Phage P22 | 1559.0 1.0 1.0 1 25-42
1742 ssilnriair GQRKVADALGINESQISR wkgdfipkmg
1743 " >
1744 </form>
1745
1746 <br ><br >
1747 <hr >
1748 <a name="splice"></a>
1749 <h2>Human Splice Sites</h2>
1750
1751 <img alt="" src="examples/exon-intron.png" ><img alt="" src="examples/intron-exon.png" > <br >
1752 <br >
1753 These logos show a small sample of Human intron-exon
1754 splice boundaries. Sequences of experimentally
1755 confirmed genes were extracted from
1756 <a href="http://mcb.harvard.edu/gilbert/EID/">EID: the Exon-Intron
1757 database</a>.
1758 Additional discussion of the features in this logo can be found in
1759 the paper
1760 <a href="http://www.lecb.ncifcrf.gov/~toms/paper/splice/">
1761 Features of spliceosome evolution...</a>-->
1762 <!--
1763 <form method="post" action="create.cgi">
1764 <input type="submit" name="cmd_edit" value="Edit Logo" >
1765 Exon-Intron (Donor) Sites
1766 <input type="hidden" name="logo_title" value="exon | intron" >
1767 <input type="hidden" name="first_index" value="-11" >
1768 <input type="hidden" name="logo_start" value="-6" >
1769 <input type="hidden" name="logo_end" value="8" >
1770 <input type="hidden" name="show_xaxis" value="true" >
1771 <input type="hidden" name="show_yaxis" value="true" >
1772 <input type="hidden" name="show_errorbars" value="true" >
1773 <input type="hidden" name="show_fineprint" value="true" >
1774 <input type="hidden" name="scale_width" value="true" >
1775 <input type="hidden" name="sequences" value="
1776 > 19082_AF115399
1777 GGATCGACCCTgtaagtttt
1778 > 45328_AB000381
1779 GCGCGCTCAGTgtaagtatc
1780 > 45328_AB000381
1781 AATCTCCATTCgtaagtacc
1782 > 45330_AB001517
1783 ACTGGACGCTGgtaaggact
1784 > 45331_AB001517
1785 TCGCTTACCGGgtgagcgcg
1786 > 45331_AB001517
1787 GACCTTAAAAAgtaagtatg
1788 > 45331_AB001517
1789 CGTCGATGAAGgtacttgcc
1790 > 45331_AB001517
1791 CCTGATGGCAGgtaaggggg
1792 > 45331_AB001517
1793 GATGACTCCAGgtgcggcct
1794 > 45331_AB001517
1795 ACAGCCTGGACgtatgtccc
1796 > 45331_AB001517
1797 CGGCTGGCCAAgtaggtctc
1798 > 45331_AB001517
1799 CACTCCCTGAGgtaagcctt
1800 > 45331_AB001517
1801 TGGCTGTTCAGgtttgtccc
1802 > 45331_AB001517
1803 ACGACGGCAAGgtaggctcc
1804 > 45331_AB001517
1805 GACCTTCACAGgtgatgttt
1806 > 45331_AB001517
1807 GGCTCCTTGATgtaagcacc
1808 > 45331_AB001517
1809 GACCTCTGATGgtgagcacg
1810 > 45331_AB001517
1811 GCCAAGGGGAAgtgagtgtc
1812 > 45331_AB001517
1813 ACGCCATGGAGgtgagccgc
1814 > 45331_AB001517
1815 CGTCAGGAAAGgtgagcaga
1816 > 45331_AB001517
1817 CTCTCCCACTGgtgagcact
1818 > 45331_AB001517
1819 CAGGGGCGAGAgtgagttgg
1820 > 45331_AB001517
1821 CTGAAGTCCAGgtagagggt
1822 > 45331_AB001517
1823 CTGTCGAAACTgtacgtgtg
1824 > 45332_AB001517
1825 GGGTCGCGCTGgtgagtgga
1826 > 45332_AB001517
1827 GAGGCCTCGGCgtaagtcct
1828 > 45332_AB001517
1829 GGCGAGAGCAGgtgtggggg
1830 > 45332_AB001517
1831 GCTAAAAACCTgtgcgtatt
1832 > 45332_AB001517
1833 AAGCCCATCGGgtgtgtaca
1834 > 45333_AB001517
1835 GGGTCGCGCTGgtgagtgga
1836 > 45333_AB001517
1837 GAGGCCTCGGCgtaagtcct
1838 > 45333_AB001517
1839 GGCGAGAGCAGgtgtggggg
1840 > 45333_AB001517
1841 GCTAAAAACCTgtgcgtatt
1842 > 45334_AB001523
1843 CATCGTCACCTgtgagtgcc
1844 > 45334_AB001523
1845 GAATGGAGAAGgtatgagtt
1846 > 45334_AB001523
1847 CAGAGTGCTGTgtgagtacc
1848 > 45334_AB001523
1849 CAGAGTGACAGgtaagtgta
1850 > 45334_AB001523
1851 TCATGGTTCAGgtacttgac
1852 > 45334_AB001523
1853 CGGGGCCGGGGgtgagtagt
1854 > 45334_AB001523
1855 AGCTCTTAGAAgtgagtcgg
1856 > 45334_AB001523
1857 CCACAGAAAAGgtgcctacc
1858 > 45334_AB001523
1859 ACCAGAAACAGgtacttttt
1860 > 45334_AB001523
1861 AACACTACTTAgtaagtatt
1862 > 45334_AB001523
1863 GAGTTTTACATgtaattgat
1864 > 45334_AB001523
1865 CAAATTGAAAAgtatccttt
1866 > 45334_AB001523
1867 AGACAGCCCAGgtaagacca
1868 > 45334_AB001523
1869 TCAGGACTCAGgtatgcgtt
1870 > 45334_AB001523
1871 GCCGCTGGCTGgtgagtggg
1872 > 45334_AB001523
1873 CAACACGAGAGgtgaggtgc
1874 > 45334_AB001523
1875 CAGACCACAAAgtgagtagg
1876 > 45334_AB001523
1877 TCAGGAACACGgtaacggag
1878 > 45334_AB001523
1879 AGTCCCAGCAGgtaaacatt
1880 > 45334_AB001523
1881 AAAATTTTTTTgtaagtgat
1882 > 45334_AB001523
1883 TATGTATGAAGgtaggtggt
1884 > 45334_AB001523
1885 ACTGGACGCTGgtaaggact
1886 > 45335_AB001523
1887 TCGCTTACCGGgtgagcgcg
1888 > 45337_AB00189S
1889 TGTGGTACCTGgtgagtagg
1890 > 45337_AB00189S
1891 CCCCAAATTATgtaagtcaa
1892 > 45337_AB00189S
1893 AATGAAAATAAgtacgtcac
1894 > 45338_AB00189S
1895 TGTGGTACCTGgtgagtagg
1896 > 45338_AB00189S
1897 CCCCAAATTATgtaagtcaa
1898 > 45338_AB00189S
1899 AATGAAAATAAgtacgtcac
1900 > 45338_AB00189S
1901 GGAGAAGCAAGgtcagtggc
1902 > 45339_AB00189S
1903 TGTGGTACCTGgtgagtagg
1904 > 45339_AB00189S
1905 CCCCAAATTATgtaagtcaa
1906 > 45339_AB00189S
1907 AATGAAAATAAgtacgtcac
1908 > 45339_AB00189S
1909 GGAGAAGCAAGgtcagtggc
1910 > 45340_AB00189S
1911 TGTGGTACCTGgtgagtagg
1912 > 45340_AB00189S
1913 CCCCAAATTATgtaagtcaa
1914 > 45340_AB00189S
1915 AATGAAAATAAgtacgtcac
1916 > 45341_AB00189S
1917 TGTGGTACCTGgtgagtagg
1918 > 45341_AB00189S
1919 CCCCAAATTATgtaagtcaa
1920 > 45341_AB00189S
1921 AATGAAAATAAgtacgtcac
1922 > 45341_AB00189S
1923 AAGACCAGCAGgtaatgcat
1924 > 45342_AB00189S
1925 TGTGGTACCTGgtgagtagg
1926 > 45342_AB00189S
1927 CCCCAAATTATgtaagtcaa
1928 > 45342_AB00189S
1929 AATGAAAATAAgtacgtcac
1930 > 45342_AB00189S
1931 AGATTACACAGgtaatgagc
1932 > 45342_AB00189S
1933 AAGACCAGCAGgtaatgcat
1934 > 45342_AB00189S
1935 GTGTGTCGAAGgtacggtcc
1936 > 45342_AB00189S
1937 GTGCAGCAACGgtgagcagc
1938 > 45343_AB00189S
1939 TGTGGTACCTGgtgagtagg
1940 > 45343_AB00189S
1941 CCCCAAATTATgtaagtcaa
1942 > 45343_AB00189S
1943 AATGAAAATAAgtacgtcac
1944 > 45343_AB00189S
1945 AAGACCAGCAGgtaatgcat
1946 > 45343_AB00189S
1947 GTGTGTCGAAGgtacggtcc
1948 > 45343_AB00189S
1949 GTGCAGCAACGgtgagcagc
1950 > 45344_AB00189S
1951 TGTGGTACCTGgtgagtagg
1952 > 45344_AB00189S
1953 CCCCAAATTATgtaagtcaa
1954 > 45344_AB00189S
1955 AATGAAAATAAgtacgtcac
1956 > 45344_AB00189S
1957 AGATTACACAGgtaatgagc
1958 > 45344_AB00189S
1959 AAGACCAGCAGgtaatgcat
1960 > 45345_AB002059
1961 TATGTGGTAGGgtaagagag
1962 > 45345_AB002059
1963 AGCCACCTCAGgtgggggcc
1964 > 45345_AB002059
1965 GATGCCCAGAGgtgagttta
1966 > 45345_AB002059
1967 ACACAGCCACGgtaactgtg
1968 > 45345_AB002059
1969 GTTGTGCCCTCgtaagtgtc
1970 > 45345_AB002059
1971 AACTTCTCTAAgtaagcaga
1972 > 45345_AB002059
1973 TGGCGTTGCTGgtgggtccc" >
1974 </form>-->
1975
1976
1977 <!--
1978 <form method="post" action="create.cgi">
1979 <input type="submit" name="cmd_edit" value="Edit Logo" >
1980 Intron-Exon (Acceptor) Sites
1981 <input type="hidden" name="logo_title" value="intron | exon" >
1982 <input type="hidden" name="first_index" value="-21" >
1983 <input type="hidden" name="logo_start" value="-20" >
1984 <input type="hidden" name="logo_end" value="3" >
1985 <input type="hidden" name="show_xaxis" value="true" >
1986 <input type="hidden" name="show_yaxis" value="true" >
1987 <input type="hidden" name="show_errorbars" value="true" >
1988 <input type="hidden" name="show_fineprint" value="true" >
1989 <input type="hidden" name="scale_width" value="true" >
1990 <input type="hidden" name="sequences" value="
1991 > 19082_AF115399
1992 ttctctgaaatatgaatttagACTGGTACTTATCATGGAG
1993 > 45328_AB000381
1994 gcctgctttctcccctctcagGGACTTACAGTTTGAGATG
1995 > 45328_AB000381
1996 cattgctgcttctttttttagGCATAAATTCTCGTGAACT
1997 > 45330_AB001517
1998 aacttcctgtgtgttttgcagACAGCTGGATAGAAAACGA
1999 > 45331_AB001517
2000 acaattttgttttcttcacagTTTTCAAATTTGCTGGGTA
2001 > 45331_AB001517
2002 tgtggtttttgtctttatcagCAACAAATCTGACACGCTG
2003 > 45331_AB001517
2004 gtgacctctggcgtcctgcagGGGGCGATGCGCTGCTGGT
2005 > 45331_AB001517
2006 atgtccgcgttccttccatagGAAGTTTGTTGTCACAAAG
2007 > 45331_AB001517
2008 tgccatctccctcttttccagGTGCTTTGTGGTTGGGAGC
2009 > 45331_AB001517
2010 accctgtgcttccccttgcagCTGTACTCACTCAGCCAGG
2011 > 45331_AB001517
2012 tcttctctctcgtcaattcagGTACTTCTTCAATAAAGAA
2013 > 45331_AB001517
2014 ttacaggcccgttctctgcagCATTTCAGATCAGAGCATC
2015 > 45331_AB001517
2016 cagcttcccccgtgtgcacagGCCTGGGCCAGCTGCTGGT
2017 > 45331_AB001517
2018 gcccctcctgtcctgcctcagGTCAAGGTGTGGAACACCC
2019 > 45331_AB001517
2020 gaccttgcctcttctctgcagGTACCGAAACTTCCGCACC
2021 > 45331_AB001517
2022 cgcctccttgctctacggtagGTTTTGTCTGGACACGAAG
2023 > 45331_AB001517
2024 ttactttgcatctctgtttagCTCTGGCTGTGACTTTTCG
2025 > 45331_AB001517
2026 ccatgtctcctctccacccagGGCCTTCACCGCCCTGTGC
2027 > 45331_AB001517
2028 ccactgcttttgctgttctagGAATTTTTGAACCGAAGAA
2029 > 45331_AB001517
2030 taacggttcttttttccccagGTGACATGAGTTCTCGGCA
2031 > 45331_AB001517
2032 aagcactgcttaatttcccagGGCGCTGCTGGGCGGCCAC
2033 > 45331_AB001517
2034 tgattttttctccttttgcagTTGAAGTGGTCACCTCCTC
2035 > 45331_AB001517
2036 cttagggagtctccctttcagAGCCGGGACGCTGCTGCCT
2037 > 45331_AB001517
2038 catcccctgtgtgattgacagCTGTAGCTGGAACCACTAT
2039 > 45332_AB001517
2040 cagctcccgctcctctcgcagGTGCTGTCTGGATGCGGAG
2041 > 45332_AB001517
2042 ctctggttttcccccgtgcagGATCCTGGTGCACCTGAGC
2043 > 45332_AB001517
2044 ttgccctgtgctctttcccagGAATGTTTTGACCGAGTCT
2045 > 45332_AB001517
2046 aggccttttgtctcccggtagGAGCACGTTTGCCGTGGAC
2047 > 45332_AB001517
2048 cgtgttcttttcgcctttcagCTTGTGCTGCATTGCACCT
2049 > 45333_AB001517
2050 cagctcccgctcctctcgcagGTGCTGTCTGGATGCGGAG
2051 > 45333_AB001517
2052 ctctggttttcccccgtgcagGATCCTGGTGCACCTGAGC
2053 > 45333_AB001517
2054 ttgccctgtgctctttcccagGAATGTTTTGACCGAGTCT
2055 > 45333_AB001517
2056 cgtgttcttttcgcctttcagCTTGTGCTGCATTGCACCT
2057 > 45334_AB001523
2058 atttctttcttcccttcatagGTGCTGGAGATCAGAATTT
2059 > 45334_AB001523
2060 acttcaaacaattgtttacagGTCCTATGGCCGGGCTCCG
2061 > 45334_AB001523
2062 cagtgacttgtttgtttttagGATACCGAAGTGTATAAAG
2063 > 45334_AB001523
2064 agtctgttcatgtctttgcagGTGTGTTGTGCTCTCCGAC
2065 > 45334_AB001523
2066 aaacgtatcttgggcgaatagGAGGAGCTTGCCTTTGTTT
2067 > 45334_AB001523
2068 tcatgatgtgtgtttgtttagATGGTGCCAACTGGCTGAC
2069 > 45334_AB001523
2070 ttcgcatttgcacccccacagGTCTCTGTCCCACCTGGTG
2071 > 45334_AB001523
2072 attgtggatttatcttaacagTTAAAGTCCTTGGGCTATC
2073 > 45334_AB001523
2074 tctcgtttctttctgtttaagCCAACACAGCTCAGAGTCC
2075 > 45334_AB001523
2076 tgtgtttttacttccccacagGATTTGTCCCATGCCACCA
2077 > 45334_AB001523
2078 actgtttgttgactttgcaagGAGGAAAAAGGCTCCACAA
2079 > 45334_AB001523
2080 ctccttacctctccgctccagCTACCTGCAGACCAGCAGC
2081 > 45334_AB001523
2082 tacgataatgtctatttacagGTCATAAGATAGTGCTACC
2083 > 45334_AB001523
2084 tgcctgattctttgactctagGCCAAGGAACCTGGAACGT
2085 > 45334_AB001523
2086 ccacgatctcttttcctttagATAGCCTTCTGGCAGGCAT
2087 > 45334_AB001523
2088 gactttttctgtccttcgtagAACAGTCTTCTGAGGCCGC
2089 > 45334_AB001523
2090 gtctttgtgcttcctcctcagGTGTCGATTGACTGCCCGT
2091 > 45334_AB001523
2092 ctttttgtttttccactttagGAAATATGTTCAAGTTTGT
2093 > 45334_AB001523
2094 gacccccaactctctttccagCCCATCTACAGCAAGCAGT
2095 > 45334_AB001523
2096 ttctctccctttcctgcccagACATTATACAACGTGAAGG
2097 > 45334_AB001523
2098 catcgcttcctctcgtttcagTTGTCGACAACAGTAGCAA
2099 > 45334_AB001523
2100 aacttcctgtgtgttttgcagACAGCTGGATAGAAAACGA
2101 > 45335_AB001523
2102 acaattttgttttcttcacagTTTTCAAATTTGCTGGGTA
2103 > 45337_AB00189S
2104 ttgtgtctttcgtgcttacagCATTGTGGCGACAAGAACA
2105 > 45337_AB00189S
2106 caccacgattccatttcttagGATTCCTACGCCAGCTACG
2107 > 45337_AB00189S
2108 tggttttttcctttgtttcagACACGGCACTCGTTGTGCG
2109 > 45338_AB00189S
2110 ttgtgtctttcgtgcttacagCATTGTGGCGACAAGAACA
2111 > 45338_AB00189S
2112 caccacgattccatttcttagGATTCCTACGCCAGCTACG
2113 > 45338_AB00189S
2114 tggttttttcctttgtttcagACACGGCACTCGTTGTGCG
2115 > 45338_AB00189S
2116 aatgcattctttacccattagGTGATCTTGAGACTCCTGT
2117 > 45339_AB00189S
2118 ttgtgtctttcgtgcttacagCATTGTGGCGACAAGAACA
2119 > 45339_AB00189S
2120 caccacgattccatttcttagGATTCCTACGCCAGCTACG
2121 > 45339_AB00189S
2122 tggttttttcctttgtttcagACACGGCACTCGTTGTGCG
2123 > 45339_AB00189S
2124 aatgcattctttacccattagGTGATCTTGAGACTCCTGT
2125 > 45340_AB00189S
2126 ttgtgtctttcgtgcttacagCATTGTGGCGACAAGAACA
2127 > 45340_AB00189S
2128 caccacgattccatttcttagGATTCCTACGCCAGCTACG
2129 > 45340_AB00189S
2130 tggttttttcctttgtttcagACACGGCACTCGTTGTGCG
2131 > 45341_AB00189S
2132 ttgtgtctttcgtgcttacagCATTGTGGCGACAAGAACA
2133 > 45341_AB00189S
2134 caccacgattccatttcttagGATTCCTACGCCAGCTACG
2135 > 45341_AB00189S
2136 tggttttttcctttgtttcagACACGGCACTCGTTGTGCG
2137 > 45341_AB00189S
2138 ctcctgcctttgctcctacagGAAGTGCGTGAGTGTGTGC
2139 > 45342_AB00189S
2140 ttgtgtctttcgtgcttacagCATTGTGGCGACAAGAACA
2141 > 45342_AB00189S
2142 caccacgattccatttcttagGATTCCTACGCCAGCTACG
2143 > 45342_AB00189S
2144 tggttttttcctttgtttcagACACGGCACTCGTTGTGCG
2145 > 45342_AB00189S
2146 -ggcaatttgcactcacacagCTCAATCCACCCCAGGCTC
2147 > 45342_AB00189S
2148 ctcctgcctttgctcctacagGAAGTGCGTGAGTGTGTGC
2149 > 45342_AB00189S
2150 aggaacggtatcttcccacagGTGTGACGAGAACTGCTTG
2151 > 45342_AB00189S
2152 tttcctgatgcggggccccagCTGACGAGACATTCTGCGA
2153 > 45343_AB00189S
2154 ttgtgtctttcgtgcttacagCATTGTGGCGACAAGAACA
2155 > 45343_AB00189S
2156 caccacgattccatttcttagGATTCCTACGCCAGCTACG
2157 > 45343_AB00189S
2158 tggttttttcctttgtttcagACACGGCACTCGTTGTGCG
2159 > 45343_AB00189S
2160 ctcctgcctttgctcctacagGAAGTGCGTGAGTGTGTGC
2161 > 45343_AB00189S
2162 aggaacggtatcttcccacagGTGTGACGAGAACTGCTTG
2163 > 45343_AB00189S
2164 tttcctgatgcggggccccagCTGACGAGACATTCTGCGA
2165 > 45344_AB00189S
2166 ttgtgtctttcgtgcttacagCATTGTGGCGACAAGAACA
2167 > 45344_AB00189S
2168 caccacgattccatttcttagGATTCCTACGCCAGCTACG
2169 > 45344_AB00189S
2170 tggttttttcctttgtttcagACACGGCACTCGTTGTGCG
2171 > 45344_AB00189S
2172 -ggcaatttgcactcacacagCTCAATCCACCCCAGGCTC
2173 > 45344_AB00189S
2174 ctcctgcctttgctcctacagGAAGTGCGTGAGTGTGTGC
2175 > 45345_AB002059
2176 tgcccgacttctcctccccagGTGGGCGCTCCTCGCCAAA
2177 > 45345_AB002059
2178 accttgagacttgcctcctagGGAGAGAACGTGTTCTTCT
2179 > 45345_AB002059
2180 ctgctctctctcccacctcagCACCCGTCCGTCCCACTGG
2181 > 45345_AB002059
2182 agttcatcttttgttttctagGTGTAAAAACAGGCCAGTG
2183 > 45345_AB002059
2184 tcacctcccttccacctgcagGAGGCCCCTGCTGGCCCAG
2185 > 45345_AB002059
2186 gacctttcccactcctcccagGTCCAATGCCTTGGAGACC
2187 > 45345_AB002059
2188 aaagctatgtgctatgtgcagGGTGGCTCTGTAGGCATCA
2189 > 45345_AB002059
2190 agccttctttcctgcccacagGACAGCCACTCACTGGTGG
2191 " >
2192 </form>-->
2193
2194 </td></tr>
2195
2196
2197
2198
2199
2200 </table>
2201
2202 <script type="text/javascript">
2203 var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www."); // host prefix for the analytics script: "https://ssl." when this page was loaded over https, otherwise "http://www."
2204 document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E")); // %3C and %3E unescape to < and >, so this writes a <script> tag that loads ga.js from the host chosen above
2205 </script>
2206 <script type="text/javascript">
2207 if (typeof _gat !== "undefined") { var pageTracker = _gat._getTracker("UA-5951066-1"); // _gat is expected to be provided by ga.js; when that script did not load (blocked, offline), skip tracking instead of throwing a ReferenceError
2208 pageTracker._trackPageview(); } // report a page view through the tracker created on the previous line
2209 </script>
2210 </body></html>