This file is indexed.

/usr/share/EMBOSS/test/embl/pro.dat is in emboss-test 6.4.0-2.

This file is owned by root:root, with mode 0o644.

The actual contents of the file can be viewed below.

   1
   2
   3
   4
   5
   6
   7
   8
   9
  10
  11
  12
  13
  14
  15
  16
  17
  18
  19
  20
  21
  22
  23
  24
  25
  26
  27
  28
  29
  30
  31
  32
  33
  34
  35
  36
  37
  38
  39
  40
  41
  42
  43
  44
  45
  46
  47
  48
  49
  50
  51
  52
  53
  54
  55
  56
  57
  58
  59
  60
  61
  62
  63
  64
  65
  66
  67
  68
  69
  70
  71
  72
  73
  74
  75
  76
  77
  78
  79
  80
  81
  82
  83
  84
  85
  86
  87
  88
  89
  90
  91
  92
  93
  94
  95
  96
  97
  98
  99
 100
 101
 102
 103
 104
 105
 106
 107
 108
 109
 110
 111
 112
 113
 114
 115
 116
 117
 118
 119
 120
 121
 122
 123
 124
 125
 126
 127
 128
 129
 130
 131
 132
 133
 134
 135
 136
 137
 138
 139
 140
 141
 142
 143
 144
 145
 146
 147
 148
 149
 150
 151
 152
 153
 154
 155
 156
 157
 158
 159
 160
 161
 162
 163
 164
 165
 166
 167
 168
 169
 170
 171
 172
 173
 174
 175
 176
 177
 178
 179
 180
 181
 182
 183
 184
 185
 186
 187
 188
 189
 190
 191
 192
 193
 194
 195
 196
 197
 198
 199
 200
 201
 202
 203
 204
 205
 206
 207
 208
 209
 210
 211
 212
 213
 214
 215
 216
 217
 218
 219
 220
 221
 222
 223
 224
 225
 226
 227
 228
 229
 230
 231
 232
 233
 234
 235
 236
 237
 238
 239
 240
 241
 242
 243
 244
 245
 246
 247
 248
 249
 250
 251
 252
 253
 254
 255
 256
 257
 258
 259
 260
 261
 262
 263
 264
 265
 266
 267
 268
 269
 270
 271
 272
 273
 274
 275
 276
 277
 278
 279
 280
 281
 282
 283
 284
 285
 286
 287
 288
 289
 290
 291
 292
 293
 294
 295
 296
 297
 298
 299
 300
 301
 302
 303
 304
 305
 306
 307
 308
 309
 310
 311
 312
 313
 314
 315
 316
 317
 318
 319
 320
 321
 322
 323
 324
 325
 326
 327
 328
 329
 330
 331
 332
 333
 334
 335
 336
 337
 338
 339
 340
 341
 342
 343
 344
 345
 346
 347
 348
 349
 350
 351
 352
 353
 354
 355
 356
 357
 358
 359
 360
 361
 362
 363
 364
 365
 366
 367
 368
 369
 370
 371
 372
 373
 374
 375
 376
 377
 378
 379
 380
 381
 382
 383
 384
 385
 386
 387
 388
 389
 390
 391
 392
 393
 394
 395
 396
 397
 398
 399
 400
 401
 402
 403
 404
 405
 406
 407
 408
 409
 410
 411
 412
 413
 414
 415
 416
 417
 418
 419
 420
 421
 422
 423
 424
 425
 426
 427
 428
 429
 430
 431
 432
 433
 434
 435
 436
 437
 438
 439
 440
 441
 442
 443
 444
 445
 446
 447
 448
 449
 450
 451
 452
 453
 454
 455
 456
 457
 458
 459
 460
 461
 462
 463
 464
 465
 466
 467
 468
 469
 470
 471
 472
 473
 474
 475
 476
 477
 478
 479
 480
 481
 482
 483
 484
 485
 486
 487
 488
 489
 490
 491
 492
 493
 494
 495
 496
 497
 498
 499
 500
 501
 502
 503
 504
 505
 506
 507
 508
 509
 510
 511
 512
 513
 514
 515
 516
 517
 518
 519
 520
 521
 522
 523
 524
 525
 526
 527
 528
 529
 530
 531
 532
 533
 534
 535
 536
 537
 538
 539
 540
 541
 542
 543
 544
 545
 546
 547
 548
 549
 550
 551
 552
 553
 554
 555
 556
 557
 558
 559
 560
 561
 562
 563
 564
 565
 566
 567
 568
 569
 570
 571
 572
 573
 574
 575
 576
 577
 578
 579
 580
 581
 582
 583
 584
 585
 586
 587
 588
 589
 590
 591
 592
 593
 594
 595
 596
 597
 598
 599
 600
 601
 602
 603
 604
 605
 606
 607
 608
 609
 610
 611
 612
 613
 614
 615
 616
 617
 618
 619
 620
 621
 622
 623
 624
 625
 626
 627
 628
 629
 630
 631
 632
 633
 634
 635
 636
 637
 638
 639
 640
 641
 642
 643
 644
 645
 646
 647
 648
 649
 650
 651
 652
 653
 654
 655
 656
 657
 658
 659
 660
 661
 662
 663
 664
 665
 666
 667
 668
 669
 670
 671
 672
 673
 674
 675
 676
 677
 678
 679
 680
 681
 682
 683
 684
 685
 686
 687
 688
 689
 690
 691
 692
 693
 694
 695
 696
 697
 698
 699
 700
 701
 702
 703
 704
 705
 706
 707
 708
 709
 710
 711
 712
 713
 714
 715
 716
 717
 718
 719
 720
 721
 722
 723
 724
 725
 726
 727
 728
 729
 730
 731
 732
 733
 734
 735
 736
 737
 738
 739
 740
 741
 742
 743
 744
 745
 746
 747
 748
 749
 750
 751
 752
 753
 754
 755
 756
 757
 758
 759
 760
 761
 762
 763
 764
 765
 766
 767
 768
 769
 770
 771
 772
 773
 774
 775
 776
 777
 778
 779
 780
 781
 782
 783
 784
 785
 786
 787
 788
 789
 790
 791
 792
 793
 794
 795
 796
 797
 798
 799
 800
 801
 802
 803
 804
 805
 806
 807
 808
 809
 810
 811
 812
 813
 814
 815
 816
 817
 818
 819
 820
 821
 822
 823
 824
 825
 826
 827
 828
 829
 830
 831
 832
 833
 834
 835
 836
 837
 838
 839
 840
 841
 842
 843
 844
 845
 846
 847
 848
 849
 850
 851
 852
 853
 854
 855
 856
 857
 858
 859
 860
 861
 862
 863
 864
 865
 866
 867
 868
 869
 870
 871
 872
 873
 874
 875
 876
 877
 878
 879
 880
 881
 882
 883
 884
 885
 886
 887
 888
 889
 890
 891
 892
 893
 894
 895
 896
 897
 898
 899
 900
 901
 902
 903
 904
 905
 906
 907
 908
 909
 910
 911
 912
 913
 914
 915
 916
 917
 918
 919
 920
 921
 922
 923
 924
 925
 926
 927
 928
 929
 930
 931
 932
 933
 934
 935
 936
 937
 938
 939
 940
 941
 942
 943
 944
 945
 946
 947
 948
 949
 950
 951
 952
 953
 954
 955
 956
 957
 958
 959
 960
 961
 962
 963
 964
 965
 966
 967
 968
 969
 970
 971
 972
 973
 974
 975
 976
 977
 978
 979
 980
 981
 982
 983
 984
 985
 986
 987
 988
 989
 990
 991
 992
 993
 994
 995
 996
 997
 998
 999
1000
1001
1002
1003
1004
1005
1006
1007
1008
1009
1010
1011
1012
1013
1014
1015
1016
1017
1018
1019
1020
1021
1022
1023
1024
1025
1026
1027
1028
1029
1030
1031
1032
1033
1034
1035
1036
1037
1038
1039
1040
1041
1042
1043
1044
1045
1046
1047
1048
1049
1050
1051
1052
1053
1054
1055
1056
1057
1058
1059
1060
1061
1062
1063
1064
1065
1066
1067
1068
1069
1070
1071
1072
1073
1074
1075
1076
1077
1078
1079
1080
1081
1082
1083
1084
1085
1086
1087
1088
1089
1090
1091
1092
1093
1094
1095
1096
1097
1098
1099
1100
1101
1102
1103
1104
1105
1106
1107
1108
1109
1110
1111
1112
1113
1114
1115
1116
1117
1118
1119
1120
1121
1122
1123
1124
1125
1126
1127
1128
1129
1130
1131
1132
1133
1134
1135
1136
1137
1138
1139
1140
1141
1142
1143
1144
1145
1146
1147
1148
1149
1150
1151
1152
1153
1154
1155
1156
1157
1158
1159
1160
1161
1162
1163
1164
1165
1166
1167
1168
1169
1170
1171
1172
1173
1174
1175
1176
1177
1178
1179
1180
1181
1182
1183
1184
1185
1186
1187
1188
1189
1190
1191
1192
1193
1194
1195
1196
1197
1198
1199
1200
1201
1202
1203
1204
1205
1206
1207
1208
1209
1210
1211
1212
1213
1214
1215
1216
1217
1218
1219
1220
1221
1222
1223
1224
1225
1226
1227
1228
1229
1230
1231
1232
1233
1234
1235
1236
1237
1238
1239
1240
1241
1242
1243
1244
1245
1246
1247
1248
1249
1250
1251
1252
1253
1254
1255
1256
1257
1258
1259
1260
1261
1262
1263
1264
1265
1266
1267
1268
1269
1270
1271
1272
1273
1274
1275
1276
1277
1278
1279
1280
1281
1282
1283
1284
1285
1286
1287
1288
1289
1290
1291
1292
1293
1294
1295
1296
1297
1298
1299
1300
1301
1302
1303
1304
1305
1306
1307
1308
1309
1310
1311
1312
1313
1314
1315
1316
1317
1318
1319
1320
1321
1322
1323
1324
1325
1326
1327
1328
1329
1330
1331
1332
1333
1334
1335
1336
1337
1338
1339
1340
1341
1342
1343
1344
1345
1346
1347
1348
1349
1350
1351
1352
1353
1354
1355
1356
1357
1358
1359
1360
1361
1362
1363
1364
1365
1366
1367
1368
1369
1370
1371
1372
1373
1374
1375
1376
1377
1378
1379
1380
1381
1382
1383
1384
1385
1386
1387
1388
1389
1390
1391
1392
1393
1394
1395
1396
1397
1398
1399
1400
1401
1402
1403
1404
1405
1406
1407
1408
1409
1410
1411
1412
1413
1414
1415
1416
1417
1418
1419
1420
1421
1422
1423
1424
1425
1426
1427
1428
1429
1430
1431
1432
1433
1434
1435
1436
1437
1438
1439
1440
1441
1442
1443
1444
1445
1446
1447
1448
1449
1450
1451
1452
1453
1454
1455
1456
1457
1458
1459
1460
1461
1462
1463
1464
1465
1466
1467
1468
1469
1470
1471
1472
1473
1474
1475
1476
1477
1478
1479
1480
1481
1482
1483
1484
1485
1486
1487
1488
1489
1490
1491
1492
1493
1494
1495
1496
1497
1498
1499
1500
1501
1502
1503
1504
1505
1506
1507
1508
1509
1510
1511
1512
1513
1514
1515
1516
1517
1518
1519
1520
1521
1522
1523
1524
1525
1526
1527
1528
1529
1530
1531
1532
1533
1534
1535
1536
1537
1538
1539
1540
1541
1542
1543
1544
1545
1546
1547
1548
1549
1550
1551
1552
1553
1554
1555
1556
1557
1558
1559
1560
1561
1562
1563
1564
1565
1566
1567
1568
1569
1570
1571
1572
1573
1574
1575
1576
1577
1578
1579
1580
1581
1582
1583
1584
1585
1586
1587
1588
1589
1590
1591
1592
1593
1594
1595
1596
1597
1598
1599
1600
1601
1602
1603
1604
1605
1606
1607
1608
1609
1610
1611
1612
1613
1614
1615
1616
1617
1618
1619
1620
1621
1622
1623
1624
1625
1626
1627
1628
1629
1630
1631
1632
1633
1634
1635
1636
1637
1638
1639
1640
1641
1642
1643
1644
1645
1646
1647
1648
1649
1650
1651
1652
1653
1654
1655
1656
1657
1658
1659
1660
1661
1662
1663
1664
1665
1666
1667
1668
1669
1670
1671
1672
1673
1674
1675
1676
1677
1678
1679
1680
1681
1682
1683
1684
1685
1686
1687
1688
1689
1690
1691
1692
1693
1694
1695
1696
1697
1698
1699
ID   J01636; SV 1; linear; genomic DNA; STD; PRO; 7477 BP.
XX
AC   J01636; J01637; K01483; K01793;
XX
DT   30-NOV-1990 (Rel. 26, Created)
DT   09-SEP-2004 (Rel. 81, Last updated, Version 8)
XX
DE   E.coli lactose operon with lacI, lacZ, lacY and lacA genes.
XX
KW   acetyltransferase; beta-D-galactosidase; galactosidase; lac operon;
KW   lac repressor protein; lacA gene; lacI gene; lactose permease; lacY gene;
KW   lacZ gene; mutagenesis; palindrome; promoter region;
KW   thiogalactoside acetyltransferase.
XX
OS   Escherichia coli
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
OC   Enterobacteriaceae; Escherichia.
XX
RN   [1]
RP   1243-1266
RX   DOI; 10.1073/pnas.70.12.3581.
RX   PUBMED; 4587255.
RA   Gilbert W., Maxam A.;
RT   "The nucleotide sequence of the lac operator";
RL   Proc. Natl. Acad. Sci. U.S.A. 70(12):3581-3584(1973).
XX
RN   [2]
RP   1246-1308
RX   DOI; 10.1073/pnas.70.12.3585.
RX   PUBMED; 4587256.
RA   Maizels N.M.;
RT   "The nucleotide sequence of the lactose messenger ribonucleic acid
RT   transcribed from the UV5 promoter mutant of Escherichia coli";
RL   Proc. Natl. Acad. Sci. U.S.A. 70(12):3585-3589(1973).
XX
RN   [3]
RX   PUBMED; 4598642.
RA   Gilbert W., Maizels N., Maxam A.;
RT   "Sequences of controlling regions of the lactose operon";
RL   Cold Spring Harb. Symp. Quant. Biol. 38:845-855(1974).
XX
RN   [4]
RA   Gilbert W., Gralla J., Majors A.J., Maxam A.;
RT   "Lactose operator sequences and the action of lac repressor";
RL   (in) Sund H., Blauer G. (Eds.);
RL   PROTEIN-LIGAND INTERACTIONS:193-207;
RL   Walter de Gruyter, New York (1975)
XX
RN   [5]
RP   1146-1282
RX   DOI; 10.1126/science.1088926.
RX   PUBMED; 1088926.
RA   Dickson R.C., Abelson J.N., Barnes W.M., Reznikoff W.S.;
RT   "Genetic regulation: the Lac control region";
RL   Science 187(4171):27-35(1975).
XX
RN   [6]
RP   1227-1271
RA   Gilbert W., Maxam A., Mirzabekov A.;
RT   "Contacts between the lac repressor and DNA revealed by methylation";
RL   (in) Kjeldgaard N.C., Maaloe O. (Eds.);
RL   CONTROL OF RIBOSOME SYNTHESIS:138-143;
RL   Academic Press, New York (1976)
XX
RN   [7]
RX   DOI; 10.1038/260360a0.
RX   PUBMED; 768781.
RA   Marians K.J., Wu R.;
RT   "Structure of the lactose operator";
RL   Nature 260(5549):360-363(1976).
XX
RN   [8]
RP   1242-1268
RX   DOI; 10.1038/263748a0.
RX   PUBMED; 1069185.
RA   Heyneker H.L., Shine J., Goodman H.M., Boyer H.W., Rosenberg J.,
RA   Dickerson R.E., Narang S.A., Itakura K., Lin S., Riggs A.D.;
RT   "Synthetic lac operator DNA is functional in vivo";
RL   Nature 263(5580):748-752(1976).
XX
RN   [9]
RX   DOI; 10.1016/S0022-2836(77)80132-0.
RX   PUBMED; 323498.
RA   Dickson R.C., Abelson J.N., Johnson P., Reznikoff W.S., Barnes W.M.;
RT   "Nucleotide sequence changes produced by mutations in the lac promoter of
RT   Escherichia coli";
RL   J. Mol. Biol. 111(1):65-75(1977).
XX
RN   [10]
RP   51-264
RX   DOI; 10.1073/pnas.74.10.4163.
RX   PUBMED; 337294.
RA   Steege D.A.;
RT   "5'-Terminal nucleotide sequence of Escherichia coli lactose repressor
RT   mRNA: features of translational initiation and reinitiation sites";
RL   Proc. Natl. Acad. Sci. U.S.A. 74(10):4163-4167(1977).
XX
RN   [11]
RP   1-81
RX   DOI; 10.1038/274762a0.
RX   PUBMED; 355890.
RA   Calos M.P.;
RT   "DNA sequence for a low-level promoter of the lac repressor gene and an
RT   'up' promoter mutation";
RL   Nature 274(5673):762-765(1978).
XX
RN   [12]
RP   49-1161
RX   DOI; 10.1038/274765a0.
RX   PUBMED; 355891.
RA   Farabaugh P.J.;
RT   "Sequence of the lacI gene";
RL   Nature 274(5673):765-769(1978).
XX
RN   [13]
RX   DOI; 10.1038/274770a0.
RX   PUBMED; 355892.
RA   Miller J.H., Coulondre C., Farabaugh P.J.;
RT   "Correlation of nonsense sites in the lacI gene with specific codons in the
RT   nucleotide sequence";
RL   Nature 274(5673):770-775(1978).
XX
RN   [14]
RX   DOI; 10.1007/BF00267233.
RX   PUBMED; 6770231.
RA   Calos M.P., Miller J.H.;
RT   "DNA sequence alteration resulting from a mutation impairing promoter
RT   function in the lac repressor gene";
RL   Mol. Gen. Genet. 178(1):225-227(1980).
XX
RN   [15]
RP   4306-5804
RX   DOI; 10.1038/283541a0.
RX   PUBMED; 6444453.
RA   Buechel D.E., Gronenborn B., Mueller-Hill B.;
RT   "Sequence of the lactose permease gene";
RL   Nature 283(5747):541-545(1980).
XX
RN   [16]
RX   PUBMED; 6271472.
RA   Miller J.H., Calos M.P., Galas D.J.;
RT   "Genetic and sequencing studies of the specificity of transposition into
RT   the lac region of E. coli";
RL   Cold Spring Harb. Symp. Quant. Biol. 45:243-257(1981).
XX
RN   [17]
RX   DOI; 10.1016/0014-5793(81)81076-9.
RX   PUBMED; 7023981.
RA   Chenchick A., Beabealashvilli R.S., Mirzabekov A.;
RT   "Topography of interaction of Escherichia coli RNA polymerase subunits with
RT   lac UV5 promoter";
RL   FEBS Lett. 128(1):46-50(1981).
XX
RN   [18]
RX   DOI; 10.1016/0378-1119(81)90038-X.
RX   PUBMED; 7016667.
RA   Betz J.L., Sadler J.R.;
RT   "Variants of a cloned synthetic lactose operator. I. A palindromic dimer
RT   lactose operator derived from one stand of the cloned 40-base pair
RT   operator";
RL   Gene 13(1):1-12(1981).
XX
RN   [19]
RX   DOI; 10.1016/0378-1119(81)90039-1.
RX   PUBMED; 6263752.
RA   Sadler J.R., Tecklenburg M.;
RT   "Cloning and characterization of the natural lactose operator";
RL   Gene 13(1):13-23(1981).
XX
RN   [20]
RX   DOI; 10.1016/0378-1119(81)90128-1.
RX   PUBMED; 6271642.
RA   Betz J.L., Sadler J.R.;
RT   "Variants of a cloned synthetic lactose operator. II.
RT   Chloramphenicol-resistant revertants retaining a lactose operator in the
RT   CAT gene of plasmid pBR325";
RL   Gene 15(2-3):187-200(1981).
XX
RN   [21]
RX   DOI; 10.1007/BF00268783.
RX   PUBMED; 7038381.
RA   Calos M.P., Miller J.H.;
RT   "The DNA sequence change resulting from the IQ1 mutation, which greatly
RT   increases promoter strength";
RL   Mol. Gen. Genet. 183(3):559-560(1981).
XX
RN   [22]
RX   DOI; 10.1073/pnas.78.12.7652.
RX   PUBMED; 6278484.
RA   Mieschendahl M., Buechel D.E., Bocklage H., Mueller-Hill B.;
RT   "Mutations in the lacY gene of Escherichia coli define functional
RT   organization of lactose permease";
RL   Proc. Natl. Acad. Sci. U.S.A. 78(12):7652-7656(1981).
XX
RN   [23]
RX   DOI; 10.1016/0378-1119(82)90042-7.
RX   PUBMED; 6299890.
RA   Russell D.R., Bennett G.N.;
RT   "Construction and analysis of in vivo activity of E. coli promoter hybrids
RT   and promoter mutants that alter the -35 to -10 spacing";
RL   Gene 20(2):231-243(1982).
XX
RN   [24]
RX   PUBMED; 6288696.
RA   Horowitz H., Platt T.;
RT   "A termination site for LacI transcription is between the CAP site and the
RT   lac promoter";
RL   J. Biol. Chem. 257(19):11740-11746(1982).
XX
RN   [25]
RX   PUBMED; 6290487.
RA   Klein R.D., Wells R.D.;
RT   "Effects of neighboring DNA homopolymers on the biochemical and physical
RT   properties of the Escherichia coli lactose promoter. I. Cloning and
RT   characterization studies";
RL   J. Biol. Chem. 257(21):12954-12961(1982).
XX
RN   [26]
RP   1183-1291
RX   DOI; 10.1073/pnas.79.5.1408.
RX   PUBMED; 7041119.
RA   Weiher H., Schaller H.;
RT   "Segment-specific mutagenesis: extensive mutagenesis of a lac
RT   promoter/operator element";
RL   Proc. Natl. Acad. Sci. U.S.A. 79(5):1408-1412(1982).
XX
RN   [27]
RX   PUBMED; 6305557.
RA   Van Dyke M.W., Dervan P.B.;
RT   "Footprinting with MPE-Fe(II). Complementary-strand analyses of distamycin-
RT   and actinomycin-binding sites on heterogeneous DNA";
RL   Cold Spring Harb. Symp. Quant. Biol. 47:347-353(1983).
XX
RN   [28]
RP   1287-4364
RX   PUBMED; 6313347.
RA   Kalnins A., Otto K., Ruether U., Mueller-Hill B.;
RT   "Sequence of the lacZ gene of Escherichia coli";
RL   EMBO J. 2(4):593-597(1983).
XX
RN   [29]
RX   PUBMED; 6309841.
RA   Cone K.C., Sellitti M.A., Steege D.A.;
RT   "Lac repressor mRNA transcription terminates in vivo in the lac control
RT   region";
RL   J. Biol. Chem. 258(18):11296-11304(1983).
XX
RN   [30]
RX   DOI; 10.1073/pnas.80.22.6785.
RX   PUBMED; 6316325.
RA   Sadler J.R., Sasmor H., Betz J.L.;
RT   "A perfectly symmetric lac operator binds the lac repressor very tightly";
RL   Proc. Natl. Acad. Sci. U.S.A. 80(22):6785-6789(1983).
XX
RN   [31]
RX   DOI; 10.1073/pnas.81.2.512.
RX   PUBMED; 6582506.
RA   Glickman B.W., Ripley L.S.;
RT   "Structural intermediates of deletion mutagenesis: a role for palindromic
RT   DNA";
RL   Proc. Natl. Acad. Sci. U.S.A. 81(2):512-516(1984).
XX
RN   [32]
RX   DOI; 10.1021/bi00332a019.
RX   PUBMED; 3896305.
RA   Spassky A., Kirkegaard K., Buc H.;
RT   "Changes in the DNA structure of the lac UV5 promoter during formation of
RT   an open complex with Escherichia coli RNA polymerase";
RL   Biochemistry 24(11):2723-2731(1985).
XX
RN   [33]
RX   DOI; 10.1016/0092-8674(85)90175-8.
RX   PUBMED; 2416465.
RA   Straney D.C., Crothers D.M.;
RT   "Intermediates in transcription initiation from the E. coli lac UV5
RT   promoter";
RL   Cell 43(2 Pt 1):449-459(1985).
XX
RN   [34]
RX   DOI; 10.1016/0378-1119(85)90267-7.
RX   PUBMED; 3932130.
RA   Looman A.C., de Gruyter M., Vogelaar A., van Knippenberg P.H.;
RT   "Effects of heterologous ribosomal binding sites on the transcription and
RT   translation of the lacZ gene of Escherichia coli";
RL   Gene 37(1-3):145-154(1985).
XX
RN   [35]
RX   PUBMED; 2999082.
RA   Mandecki W., Goldman R.A., Powell B.S., Caruthers M.H.;
RT   "lac Up-promoter mutants with increased homology to the consensus promoter
RT   sequence";
RL   J. Bacteriol. 164(3):1353-1355(1985).
XX
RN   [36]
RX   DOI; 10.1016/0022-2836(85)90427-9.
RX   PUBMED; 2987506.
RA   Malamy M.H., Rahaim P.T., Hoffman C.S., Baghdoyan D., O'Connor M.B.,
RA   Miller J.F.;
RT   "A frameshift mutation at the junction of an IS1 insertion within lacZ
RT   restores beta-galactosidase activity via formation of an active lacZ-IS1
RT   fusion protein";
RL   J. Mol. Biol. 181(4):551-555(1985).
XX
RN   [37]
RP   5646-7477
RX   DOI; 10.1073/pnas.82.19.6414.
RX   PUBMED; 3901000.
RA   Hediger M.A., Johnson D.F., Nierlich D.P., Zabin I.;
RT   "DNA sequence of the lactose operon: the lacA gene and the transcriptional
RT   termination region";
RL   Proc. Natl. Acad. Sci. U.S.A. 82(19):6414-6418(1985).
XX
CC   [3]  sites; UV5 mRNA transcripts and operator mutants. [(in)
CC   Sund,H. and Blauer,G. (eds.);Protein-Ligand Interactions:
CC   193-207;Walter de]  sites; operator mutational analysis. [7]
CC   sites; S1 and mung bean nuclease action on operator DNA. [9]
CC   sites; class I, II and III promoter mutant analysis. [13]  sites;
CC   lacI mutant analysis.
CC   [16]  sites; Tn5, Tn9 and Tn10 insertion sites in lac region. [14]
CC   sites; lacI promoter mutation UJ177.
CC   [18]  sites; palindromic dimer operator;.
CC   [19]  sites; natural operator sequence.
CC   [20]  sites; operator mutational analysis.
CC   [21]  sites; lacI-Q deletion.
CC   [17]  sites; RNA polymerase UV5 promoter interaction. [22]  sites;
CC   lacY mutational analysis.
CC   [24]  sites; lacI-promoted transcription termination. [25]  sites;
CC   wt and UV5 promoter sequence studies. [23]  sites; UV5 promoter
CC   mutational analysis.
CC   [30]  sites; perfectly symmetric operator sequence. [29]  sites;
CC   lacI mRNA termination site.
CC   [27]  sites; distamycin and actinomycin binding to promoter. [31]
CC   sites; lacI deletion studies.
CC   [35]  sites; promoter mutational studies.
CC   [33]  sites; DNAase I studies with promoter sequence. [34]  sites;
CC   ribosomal binding and translation initiation for lacZ. [36]  sites;
CC   insertion sequence IS1 integration in lacZ;. [32]  sites; DNAase I
CC   studies with promoter.
CC   [1] first reports a 27 bp operator(sites 1240-1266) with two-fold
CC   symmetries; the operator has also been defined to be bases
CC   1246-1266 or bases 1239-1273 [8]. [(in) Kjeldgaard,N.C. and Maaloe,
CC   O.(eds);Control of ribosome synthesis: 138-143;A] explores the
CC   ability of lac
CC   repressor protein to affect methylation of operator DNA.  [8]
CC   argues that DNA on both sides of the 21 bp operator (bases
CC   1246-1266) affects repressor binding but that the sequences of this
CC   DNA are probably not critical. [5] gives a larger sequence known as
CC   the promoter-operator region for the wild-type, whereas [2] and
CC   [26] give portions of this region for the mutant strain UV5. Within
CC   the promoter region, bases 1162-1199 are identified as the
CC   catabolite gene activator protein binding site (cap) and bases
CC   1200-1245 are the RNA polymerase interaction site. [10] reports a
CC   sequence for the 5'end of the lacI (repressor) gene and discusses
CC   restart in mutant strains. [11] presents a sequence for the lacI
CC   promoter region and identifies an I-Q mutation which enhances lacI
CC   transcription approximately ten-fold. [12] gives a complete
CC   sequence
CC   for lacI which agrees with the known lac repressor sequence. [26]
CC   examines the promoter-operator region in the UV5 strain (lac109)
CC   and studies 23 mutant derivatives of this sequence. This sequence
CC   agrees with known protein sequences for the lacZ, lacY and lacA
CC   enzymes. [15] notes that the fMet codon is not present
CC   for lacA and suggests that the 'ttg' codon (5727-5729), which
CC   immediately precedes the mature N-terminal asparagine codon, is the
CC   start codon. The cds for lacZ, lacY and lacA are included on a
CC   single mRNA transcript.
CC   Complete source information:
CC   Escherichia coli DNA [1],[(in) Kjeldgaard,N.C. and Maaloe,O.(eds);
CC   Control of ribosome synthesis: 138-143;A],[8],[12],[26]; mRNA [2],
CC   [5],[10]; clone
CC   lambda-h80dlac DNA [11],[15]; clone puk217 [28]; pgm8 [37].
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..7477
FT                   /organism="Escherichia coli"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:562"
FT   variation       16
FT                   /note="c in wild-type; t in 'up' promoter mutant I-Q [11]"
FT   mRNA            51..1230
FT                   /note="lacI (repressor) mRNA; preferred in vivo 3' end
FT                   [12],[29]"
FT   CDS             79..1161
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="lacI"
FT                   /note="lac repressor protein (gtg start codon)"
FT                   /db_xref="GOA:P03023"
FT                   /db_xref="InterPro:IPR000843"
FT                   /db_xref="InterPro:IPR001761"
FT                   /db_xref="InterPro:IPR010982"
FT                   /db_xref="PDB:1CJG"
FT                   /db_xref="PDB:1EFA"
FT                   /db_xref="PDB:1JWL"
FT                   /db_xref="PDB:1JYE"
FT                   /db_xref="PDB:1JYF"
FT                   /db_xref="PDB:1L1M"
FT                   /db_xref="PDB:1LBG"
FT                   /db_xref="PDB:1LBH"
FT                   /db_xref="PDB:1LBI"
FT                   /db_xref="PDB:1LCC"
FT                   /db_xref="PDB:1LCD"
FT                   /db_xref="PDB:1LQC"
FT                   /db_xref="PDB:1LTP"
FT                   /db_xref="PDB:1OSL"
FT                   /db_xref="PDB:1TLF"
FT                   /db_xref="PDB:1Z04"
FT                   /db_xref="PDB:2BJC"
FT                   /db_xref="PDB:2KEI"
FT                   /db_xref="PDB:2KEJ"
FT                   /db_xref="PDB:2KEK"
FT                   /db_xref="PDB:2P9H"
FT                   /db_xref="PDB:2PAF"
FT                   /db_xref="PDB:2PE5"
FT                   /db_xref="PDB:3EDC"
FT                   /db_xref="UniProtKB/Swiss-Prot:P03023"
FT                   /protein_id="AAA24052.1"
FT                   /translation="MKPVTLYDVAEYAGVSYQTVSRVVNQASHVSAKTREKVEAAMAEL
FT                   NYIPNRVAQQLAGKQSLLIGVATSSLALHAPSQIVAAIKSRADQLGASVVVSMVERSGV
FT                   EACKAAVHNLLAQRVSGLIINYPLDDQDAIAVEAACTNVPALFLDVSDQTPINSIIFSH
FT                   EDGTRLGVEHLVALGHQQIALLAGPLSSVSARLRLAGWHKYLTRNQIQPIAEREGDWSA
FT                   MSGFQQTMQMLNEGIVPTAMLVANDQMALGAMRAITESGLRVGADISVVGYDDTEDSSC
FT                   YIPPSTTIKQDFRLLGQTSVDRLLQLSQGQAVKGNQLLPVSLVKRKTTLAPNTQTASPR
FT                   ALADSLMQLARQVSRLESGQ"
FT   misc_signal     1162..1199
FT                   /note="cap protein binding site"
FT   variation       1183..1186
FT                   /note="ttag in wild-type; aatt in strain UV5 [26]"
FT   variation       1209..1211
FT                   /note="gct in wild-type; gt in mutant l305 [5]"
FT   variation       1212
FT                   /note="t in wild-type; a in mutant l241 [5]"
FT   variation       1230
FT                   /note="c in wild-type; a in mutant p-r-1a [5]"
FT   variation       1237..1238
FT                   /note="gt in wild-type; aa in strain UV5 [26]"
FT   variation       1242..1245
FT                   /note="gtgg in wild-type; ttca in synthetic operator [8]"
FT   misc_signal     1246..1266
FT                   /note="lac repressor protein binding site"
FT   mRNA            1246..>4358
FT                   /note="lacZ mRNA [2],[5]"
FT   variation       1267..1268
FT                   /note="tc in wild-type; tg in synthetic operator [8]"
FT   variation       1282..1291
FT                   /note="ctatgaccat in wild-type; gatccggcca in strain UV5
FT                   [26]"
FT   CDS             1284..4358
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="lacZ"
FT                   /note="beta-d-galactosidase"
FT                   /db_xref="GOA:P00722"
FT                   /db_xref="InterPro:IPR004199"
FT                   /db_xref="InterPro:IPR006101"
FT                   /db_xref="InterPro:IPR006102"
FT                   /db_xref="InterPro:IPR006103"
FT                   /db_xref="InterPro:IPR006104"
FT                   /db_xref="InterPro:IPR008979"
FT                   /db_xref="InterPro:IPR011013"
FT                   /db_xref="InterPro:IPR013781"
FT                   /db_xref="InterPro:IPR013812"
FT                   /db_xref="InterPro:IPR014718"
FT                   /db_xref="InterPro:IPR017853"
FT                   /db_xref="PDB:1BGL"
FT                   /db_xref="PDB:1BGM"
FT                   /db_xref="PDB:1DP0"
FT                   /db_xref="PDB:1F49"
FT                   /db_xref="PDB:1F4A"
FT                   /db_xref="PDB:1F4H"
FT                   /db_xref="PDB:1GHO"
FT                   /db_xref="PDB:1HN1"
FT                   /db_xref="PDB:1JYN"
FT                   /db_xref="PDB:1JYV"
FT                   /db_xref="PDB:1JYW"
FT                   /db_xref="PDB:1JYX"
FT                   /db_xref="PDB:1JYY"
FT                   /db_xref="PDB:1JYZ"
FT                   /db_xref="PDB:1JZ0"
FT                   /db_xref="PDB:1JZ1"
FT                   /db_xref="PDB:1JZ2"
FT                   /db_xref="PDB:1JZ3"
FT                   /db_xref="PDB:1JZ4"
FT                   /db_xref="PDB:1JZ5"
FT                   /db_xref="PDB:1JZ6"
FT                   /db_xref="PDB:1JZ7"
FT                   /db_xref="PDB:1JZ8"
FT                   /db_xref="PDB:1PX3"
FT                   /db_xref="PDB:1PX4"
FT                   /db_xref="PDB:3CZJ"
FT                   /db_xref="PDB:3DYM"
FT                   /db_xref="PDB:3DYO"
FT                   /db_xref="PDB:3DYP"
FT                   /db_xref="PDB:3E1F"
FT                   /db_xref="PDB:3IAP"
FT                   /db_xref="PDB:3IAQ"
FT                   /db_xref="UniProtKB/Swiss-Prot:P00722"
FT                   /protein_id="AAA24053.1"
FT                   /translation="MTMITDSLAVVLQRRDWENPGVTQLNRLAAHPPFASWRNSEEART
FT                   DRPSQQLRSLNGEWRFAWFPAPEAVPESWLECDLPEADTVVVPSNWQMHGYDAPIYTNV
FT                   TYPITVNPPFVPTENPTGCYSLTFNVDESWLQEGQTRIIFDGVNSAFHLWCNGRWVGYG
FT                   QDSRLPSEFDLSAFLRAGENRLAVMVLRWSDGSYLEDQDMWRMSGIFRDVSLLHKPTTQ
FT                   ISDFHVATRFNDDFSRAVLEAEVQMCGELRDYLRVTVSLWQGETQVASGTAPFGGEIID
FT                   ERGGYADRVTLRLNVENPKLWSAEIPNLYRAVVELHTADGTLIEAEACDVGFREVRIEN
FT                   GLLLLNGKPLLIRGVNRHEHHPLHGQVMDEQTMVQDILLMKQNNFNAVRCSHYPNHPLW
FT                   YTLCDRYGLYVVDEANIETHGMVPMNRLTDDPRWLPAMSERVTRMVQRDRNHPSVIIWS
FT                   LGNESGHGANHDALYRWIKSVDPSRPVQYEGGGADTTATDIICPMYARVDEDQPFPAVP
FT                   KWSIKKWLSLPGETRPLILCEYAHAMGNSLGGFAKYWQAFRQYPRLQGGFVWDWVDQSL
FT                   IKYDENGNPWSAYGGDFGDTPNDRQFCMNGLVFADRTPHPALTEAKHQQQFFQFRLSGQ
FT                   TIEVTSEYLFRHSDNELLHWMVALDGKPLASGEVPLDVAPQGKQLIELPELPQPESAGQ
FT                   LWLTVRVVQPNATAWSEAGHISAWQQWRLAENLSVTLPAASHAIPHLTTSEMDFCIELG
FT                   NKRWQFNRQSGFLSQMWIGDKKQLLTPLRDQFTRAPLDNDIGVSEATRIDPNAWVERWK
FT                   AAGHYQAEAALLQCTADTLADAVLITTAHAWQHQGKTLFISRKTYRIDGSGQMAITVDV
FT                   EVASDTPHPARIGLNCQLAQVAERVNWLGLGPQENYPDRLTAACFDRWDLPLSDMYTPY
FT                   VFPSENGLRCGTRELNYGPHQWRGDFQFNISRYSQQQLMETSHRHLLHAEEGTWLNIDG
FT                   FHMGIGGDDSWSPSVSAEFQLSAGRYHYQLVWCQK"
FT   CDS             4410..5663
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="lacY"
FT                   /note="lactose permease"
FT                   /db_xref="GOA:P02920"
FT                   /db_xref="InterPro:IPR000576"
FT                   /db_xref="InterPro:IPR016196"
FT                   /db_xref="InterPro:IPR018457"
FT                   /db_xref="InterPro:IPR020480"
FT                   /db_xref="PDB:1M2U"
FT                   /db_xref="PDB:1PV6"
FT                   /db_xref="PDB:1PV7"
FT                   /db_xref="PDB:2CFP"
FT                   /db_xref="PDB:2CFQ"
FT                   /db_xref="PDB:2V8N"
FT                   /db_xref="UniProtKB/Swiss-Prot:P02920"
FT                   /protein_id="AAA24054.1"
FT                   /translation="MYYLKNTNFWMFGLFFFFYFFIMGAYFPFFPIWLHDINHISKSDT
FT                   GIIFAAISLFSLLFQPLFGLLSDKLGLRKYLLWIITGMLVMFAPFFIFIFGPLLQYNIL
FT                   VGSIVGGIYLGFCFNAGAPAVEAFIEKVSRRSNFEFGRARMFGCVGWALCASIVGIMFT
FT                   INNQFVFWLGSGCALILAVLLFFAKTDAPSSATVANAVGANHSAFSLKLALELFRQPKL
FT                   WFLSLYVIGVSCTYDVFDQQFANFFTSFFATGEQGTRVFGYVTTMGELLNASIMFFAPL
FT                   IINRIGGKNALLLAGTIMSVRIIGSSFATSALEVVILKTLHMFEVPFLLVGCFKYITSQ
FT                   FEVRFSATIYLVCFCFFKQLAMIFMSVLAGNMYESIGFQGAYLVLGLVALGFTLISVFT
FT                   LSGPGPLSLLRRQVNEVA"
FT   CDS             5727..6338
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="lacA"
FT                   /note="thiogalactoside acetyltransferase (ttg start codon)"
FT                   /db_xref="GOA:P07464"
FT                   /db_xref="InterPro:IPR001451"
FT                   /db_xref="InterPro:IPR011004"
FT                   /db_xref="InterPro:IPR018357"
FT                   /db_xref="PDB:1KQA"
FT                   /db_xref="PDB:1KRR"
FT                   /db_xref="PDB:1KRU"
FT                   /db_xref="PDB:1KRV"
FT                   /db_xref="UniProtKB/Swiss-Prot:P07464"
FT                   /protein_id="AAA24055.1"
FT                   /translation="MNMPMTERIRAGKLFTDMCEGLPEKRLRGKTLMYEFNHSHPSEVE
FT                   KRESLIKEMFATVGENAWVEPPVYFSYGSNIHIGRNFYANFNLTIVDDYTVTIGDNVLI
FT                   APNVTLSVTGHPVHHELRKNGEMYSFPITIGNNVWIGSHVVINPGVTIGDNSVIGAGSI
FT                   VTKDIPPNVVAAGVPCRVIREINDRDKHYYFKDYKVESSV"
XX
SQ   Sequence 7477 BP; 1739 A; 1991 C; 2004 G; 1743 T; 0 other;
     gacaccatcg aatggcgcaa aacctttcgc ggtatggcat gatagcgccc ggaagagagt        60
     caattcaggg tggtgaatgt gaaaccagta acgttatacg atgtcgcaga gtatgccggt       120
     gtctcttatc agaccgtttc ccgcgtggtg aaccaggcca gccacgtttc tgcgaaaacg       180
     cgggaaaaag tggaagcggc gatggcggag ctgaattaca ttcccaaccg cgtggcacaa       240
     caactggcgg gcaaacagtc gttgctgatt ggcgttgcca cctccagtct ggccctgcac       300
     gcgccgtcgc aaattgtcgc ggcgattaaa tctcgcgccg atcaactggg tgccagcgtg       360
     gtggtgtcga tggtagaacg aagcggcgtc gaagcctgta aagcggcggt gcacaatctt       420
     ctcgcgcaac gcgtcagtgg gctgatcatt aactatccgc tggatgacca ggatgccatt       480
     gctgtggaag ctgcctgcac taatgttccg gcgttatttc ttgatgtctc tgaccagaca       540
     cccatcaaca gtattatttt ctcccatgaa gacggtacgc gactgggcgt ggagcatctg       600
     gtcgcattgg gtcaccagca aatcgcgctg ttagcgggcc cattaagttc tgtctcggcg       660
     cgtctgcgtc tggctggctg gcataaatat ctcactcgca atcaaattca gccgatagcg       720
     gaacgggaag gcgactggag tgccatgtcc ggttttcaac aaaccatgca aatgctgaat       780
     gagggcatcg ttcccactgc gatgctggtt gccaacgatc agatggcgct gggcgcaatg       840
     cgcgccatta ccgagtccgg gctgcgcgtt ggtgcggata tctcggtagt gggatacgac       900
     gataccgaag acagctcatg ttatatcccg ccgtcaacca ccatcaaaca ggattttcgc       960
     ctgctggggc aaaccagcgt ggaccgcttg ctgcaactct ctcagggcca ggcggtgaag      1020
     ggcaatcagc tgttgcccgt ctcactggtg aaaagaaaaa ccaccctggc gcccaatacg      1080
     caaaccgcct ctccccgcgc gttggccgat tcattaatgc agctggcacg acaggtttcc      1140
     cgactggaaa gcgggcagtg agcgcaacgc aattaatgtg agttagctca ctcattaggc      1200
     accccaggct ttacacttta tgcttccggc tcgtatgttg tgtggaattg tgagcggata      1260
     acaatttcac acaggaaaca gctatgacca tgattacgga ttcactggcc gtcgttttac      1320
     aacgtcgtga ctgggaaaac cctggcgtta cccaacttaa tcgccttgca gcacatcccc      1380
     ctttcgccag ctggcgtaat agcgaagagg cccgcaccga tcgcccttcc caacagttgc      1440
     gcagcctgaa tggcgaatgg cgctttgcct ggtttccggc accagaagcg gtgccggaaa      1500
     gctggctgga gtgcgatctt cctgaggccg atactgtcgt cgtcccctca aactggcaga      1560
     tgcacggtta cgatgcgccc atctacacca acgtaaccta tcccattacg gtcaatccgc      1620
     cgtttgttcc cacggagaat ccgacgggtt gttactcgct cacatttaat gttgatgaaa      1680
     gctggctaca ggaaggccag acgcgaatta tttttgatgg cgttaactcg gcgtttcatc      1740
     tgtggtgcaa cgggcgctgg gtcggttacg gccaggacag tcgtttgccg tctgaatttg      1800
     acctgagcgc atttttacgc gccggagaaa accgcctcgc ggtgatggtg ctgcgttgga      1860
     gtgacggcag ttatctggaa gatcaggata tgtggcggat gagcggcatt ttccgtgacg      1920
     tctcgttgct gcataaaccg actacacaaa tcagcgattt ccatgttgcc actcgcttta      1980
     atgatgattt cagccgcgct gtactggagg ctgaagttca gatgtgcggc gagttgcgtg      2040
     actacctacg ggtaacagtt tctttatggc agggtgaaac gcaggtcgcc agcggcaccg      2100
     cgcctttcgg cggtgaaatt atcgatgagc gtggtggtta tgccgatcgc gtcacactac      2160
     gtctgaacgt cgaaaacccg aaactgtgga gcgccgaaat cccgaatctc tatcgtgcgg      2220
     tggttgaact gcacaccgcc gacggcacgc tgattgaagc agaagcctgc gatgtcggtt      2280
     tccgcgaggt gcggattgaa aatggtctgc tgctgctgaa cggcaagccg ttgctgattc      2340
     gaggcgttaa ccgtcacgag catcatcctc tgcatggtca ggtcatggat gagcagacga      2400
     tggtgcagga tatcctgctg atgaagcaga acaactttaa cgccgtgcgc tgttcgcatt      2460
     atccgaacca tccgctgtgg tacacgctgt gcgaccgcta cggcctgtat gtggtggatg      2520
     aagccaatat tgaaacccac ggcatggtgc caatgaatcg tctgaccgat gatccgcgct      2580
     ggctaccggc gatgagcgaa cgcgtaacgc gaatggtgca gcgcgatcgt aatcacccga      2640
     gtgtgatcat ctggtcgctg gggaatgaat caggccacgg cgctaatcac gacgcgctgt      2700
     atcgctggat caaatctgtc gatccttccc gcccggtgca gtatgaaggc ggcggagccg      2760
     acaccacggc caccgatatt atttgcccga tgtacgcgcg cgtggatgaa gaccagccct      2820
     tcccggctgt gccgaaatgg tccatcaaaa aatggctttc gctacctgga gagacgcgcc      2880
     cgctgatcct ttgcgaatac gcccacgcga tgggtaacag tcttggcggt ttcgctaaat      2940
     actggcaggc gtttcgtcag tatccccgtt tacagggcgg cttcgtctgg gactgggtgg      3000
     atcagtcgct gattaaatat gatgaaaacg gcaacccgtg gtcggcttac ggcggtgatt      3060
     ttggcgatac gccgaacgat cgccagttct gtatgaacgg tctggtcttt gccgaccgca      3120
     cgccgcatcc agcgctgacg gaagcaaaac accagcagca gtttttccag ttccgtttat      3180
     ccgggcaaac catcgaagtg accagcgaat acctgttccg tcatagcgat aacgagctcc      3240
     tgcactggat ggtggcgctg gatggtaagc cgctggcaag cggtgaagtg cctctggatg      3300
     tcgctccaca aggtaaacag ttgattgaac tgcctgaact accgcagccg gagagcgccg      3360
     ggcaactctg gctcacagta cgcgtagtgc aaccgaacgc gaccgcatgg tcagaagccg      3420
     ggcacatcag cgcctggcag cagtggcgtc tggcggaaaa cctcagtgtg acgctccccg      3480
     ccgcgtccca cgccatcccg catctgacca ccagcgaaat ggatttttgc atcgagctgg      3540
     gtaataagcg ttggcaattt aaccgccagt caggctttct ttcacagatg tggattggcg      3600
     ataaaaaaca actgctgacg ccgctgcgcg atcagttcac ccgtgcaccg ctggataacg      3660
     acattggcgt aagtgaagcg acccgcattg accctaacgc ctgggtcgaa cgctggaagg      3720
     cggcgggcca ttaccaggcc gaagcagcgt tgttgcagtg cacggcagat acacttgctg      3780
     atgcggtgct gattacgacc gctcacgcgt ggcagcatca ggggaaaacc ttatttatca      3840
     gccggaaaac ctaccggatt gatggtagtg gtcaaatggc gattaccgtt gatgttgaag      3900
     tggcgagcga tacaccgcat ccggcgcgga ttggcctgaa ctgccagctg gcgcaggtag      3960
     cagagcgggt aaactggctc ggattagggc cgcaagaaaa ctatcccgac cgccttactg      4020
     ccgcctgttt tgaccgctgg gatctgccat tgtcagacat gtataccccg tacgtcttcc      4080
     cgagcgaaaa cggtctgcgc tgcgggacgc gcgaattgaa ttatggccca caccagtggc      4140
     gcggcgactt ccagttcaac atcagccgct acagtcaaca gcaactgatg gaaaccagcc      4200
     atcgccatct gctgcacgcg gaagaaggca catggctgaa tatcgacggt ttccatatgg      4260
     ggattggtgg cgacgactcc tggagcccgt cagtatcggc ggaattccag ctgagcgccg      4320
     gtcgctacca ttaccagttg gtctggtgtc aaaaataata ataaccgggc aggccatgtc      4380
     tgcccgtatt tcgcgtaagg aaatccatta tgtactattt aaaaaacaca aacttttgga      4440
     tgttcggttt attctttttc ttttactttt ttatcatggg agcctacttc ccgtttttcc      4500
     cgatttggct acatgacatc aaccatatca gcaaaagtga tacgggtatt atttttgccg      4560
     ctatttctct gttctcgcta ttattccaac cgctgtttgg tctgctttct gacaaactcg      4620
     ggctgcgcaa atacctgctg tggattatta ccggcatgtt agtgatgttt gcgccgttct      4680
     ttatttttat cttcgggcca ctgttacaat acaacatttt agtaggatcg attgttggtg      4740
     gtatttatct aggcttttgt tttaacgccg gtgcgccagc agtagaggca tttattgaga      4800
     aagtcagccg tcgcagtaat ttcgaatttg gtcgcgcgcg gatgtttggc tgtgttggct      4860
     gggcgctgtg tgcctcgatt gtcggcatca tgttcaccat caataatcag tttgttttct      4920
     ggctgggctc tggctgtgca ctcatcctcg ccgttttact ctttttcgcc aaaacggatg      4980
     cgccctcttc tgccacggtt gccaatgcgg taggtgccaa ccattcggca tttagcctta      5040
     agctggcact ggaactgttc agacagccaa aactgtggtt tttgtcactg tatgttattg      5100
     gcgtttcctg cacctacgat gtttttgacc aacagtttgc taatttcttt acttcgttct      5160
     ttgctaccgg tgaacagggt acgcgggtat ttggctacgt aacgacaatg ggcgaattac      5220
     ttaacgcctc gattatgttc tttgcgccac tgatcattaa tcgcatcggt gggaaaaacg      5280
     ccctgctgct ggctggcact attatgtctg tacgtattat tggctcatcg ttcgccacct      5340
     cagcgctgga agtggttatt ctgaaaacgc tgcatatgtt tgaagtaccg ttcctgctgg      5400
     tgggctgctt taaatatatt accagccagt ttgaagtgcg tttttcagcg acgatttatc      5460
     tggtctgttt ctgcttcttt aagcaactgg cgatgatttt tatgtctgta ctggcgggca      5520
     atatgtatga aagcatcggt ttccagggcg cttatctggt gctgggtctg gtggcgctgg      5580
     gcttcacctt aatttccgtg ttcacgctta gcggccccgg cccgctttcc ctgctgcgtc      5640
     gtcaggtgaa tgaagtcgct taagcaatca atgtcggatg cggcgcgacg cttatccgac      5700
     caacatatca taacggagtg atcgcattga acatgccaat gaccgaaaga ataagagcag      5760
     gcaagctatt taccgatatg tgcgaaggct taccggaaaa aagacttcgt gggaaaacgt      5820
     taatgtatga gtttaatcac tcgcatccat cagaagttga aaaaagagaa agcctgatta      5880
     aagaaatgtt tgccacggta ggggaaaacg cctgggtaga accgcctgtc tatttctctt      5940
     acggttccaa catccatata ggccgcaatt tttatgcaaa tttcaattta accattgtcg      6000
     atgactacac ggtaacaatc ggtgataacg tactgattgc acccaacgtt actctttccg      6060
     ttacgggaca ccctgtacac catgaattga gaaaaaacgg cgagatgtac tcttttccga      6120
     taacgattgg caataacgtc tggatcggaa gtcatgtggt tattaatcca ggcgtcacca      6180
     tcggggataa ttctgttatt ggcgcgggta gtatcgtcac aaaagacatt ccaccaaacg      6240
     tcgtggcggc tggcgttcct tgtcgggtta ttcgcgaaat aaacgaccgg gataagcact      6300
     attatttcaa agattataaa gttgaatcgt cagtttaaat tataaaaatt gcctgatacg      6360
     ctgcgcttat caggcctaca agttcagcga tctacattag ccgcatccgg catgaacaaa      6420
     gcgcaggaac aagcgtcgca tcatgcctct ttgacccaca gctgcggaaa acgtactggt      6480
     gcaaaacgca gggttatgat catcagccca acgacgcaca gcgcatgaaa tgcccagtcc      6540
     atcaggtaat tgccgctgat actacgcagc acgccagaaa accacggggc aagcccggcg      6600
     atgataaaac cgattccctg cataaacgcc accagcttgc cagcaatagc cggttgcaca      6660
     gagtgatcga gcgccagcag caaacagagc ggaaacgcgc cgcccagacc taacccacac      6720
     accatcgccc acaataccgg caattgcatc ggcagccaga taaagccgca gaaccccacc      6780
     agttgtaaca ccagcgccag cattaacagt ttgcgccgat cctgatggcg agccatagca      6840
     ggcatcagca aagctcctgc ggcttgccca agcgtcatca atgccagtaa ggaaccgctg      6900
     tactgcgcgc tggcaccaat ctcaatatag aaagcgggta accaggcaat caggctggcg      6960
     taaccgccgt taatcagacc gaagtaaaca cccagcgtcc acgcgcgggg agtgaatacc      7020
     acgcgaaccg gagtggttgt tgtcttgtgg gaagaggcga cctcgcgggc gctttgccac      7080
     caccaggcaa agagcgcaac aacggcaggc agcgccacca ggcgagtgtt tgataccagg      7140
     tttcgctatg ttgaactaac cagggcgtta tggcggcacc aagcccaccg ccgcccatca      7200
     gagccgcgga ccacagcccc atcaccagtg gcgtgcgctg ctgaaaccgc cgtttaatca      7260
     ccgaagcatc accgcctgaa tgatgccgat ccccacccca ccaagcagtg cgctgctaag      7320
     cagcagcgca ctttgcgggt aaagctcacg catcaatgca ccgacggcaa tcagcaacag      7380
     actgatggcg acactgcgac gttcgctgac atgctgatga agccagcttc cggccagcgc      7440
     cagcccgccc atggtaacca ccggcagagc ggtcgac                               7477
//
ID   X51872; SV 1; linear; genomic DNA; STD; PRO; 1832 BP.
XX
AC   X51872;
XX
DT   17-APR-1990 (Rel. 23, Created)
DT   05-JUL-1999 (Rel. 60, Last updated, Version 5)
XX
DE   Escherichia coli lacA gene for thiogalactoside transacetylase
XX
KW   lac operon; lacA gene; lacY gene; thiogalactoside transacetylase.
XX
OS   Escherichia coli
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
OC   Enterobacteriaceae; Escherichia.
XX
RN   [1]
RC   (1-1832)
RP   1-1832
RX   DOI; 10.1073/pnas.82.19.6414.
RX   PUBMED; 3901000.
RA   Hediger M.A., Johnson D.F., Nierlich D.P., Zabin I.;
RT   "DNA sequence of the lactose operon: the lacA gene and the transcriptional
RT   termination region";
RL   Proc. Natl. Acad. Sci. U.S.A. 82(19):6414-6418(1985).
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1832
FT                   /organism="Escherichia coli"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:562"
FT   CDS             <1..18
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /product="lacY gene product"
FT                   /protein_id="CAA36161.1"
FT                   /translation="VNEVA"
FT   CDS             82..693
FT                   /transl_table=11
FT                   /gene="lacA"
FT                   /product="thiogalactoside transacetylase"
FT                   /db_xref="GOA:P07464"
FT                   /db_xref="InterPro:IPR001451"
FT                   /db_xref="InterPro:IPR011004"
FT                   /db_xref="InterPro:IPR018357"
FT                   /db_xref="PDB:1KQA"
FT                   /db_xref="PDB:1KRR"
FT                   /db_xref="PDB:1KRU"
FT                   /db_xref="PDB:1KRV"
FT                   /db_xref="UniProtKB/Swiss-Prot:P07464"
FT                   /protein_id="CAA36162.1"
FT                   /translation="MNMPMTERIRAGKLFTDMCEGLPEKRLRGKTLMYEFNHSHPSEVE
FT                   KRESLIKEMFATVGENAWVEPPVYFSYGSNIHIGRNFYANFNLTIVDDYTVTIGDNVLI
FT                   APNVTLSVTGHPVHHELRKNGEMYSFPITIGNNVWIGSHVVINPGVTIGDNSVIGAGSI
FT                   VTKDIPPNVVAAGVPCRVIREINDRDKHYYFKDYKVESSV"
XX
SQ   Sequence 1832 BP; 519 A; 510 C; 450 G; 353 T; 0 other;
     gtgaatgaag tcgcttaagc aatcaatgtc ggatgcggcg cgacgcttat ccgaccaaca        60
     tatcataacg gagtgatcgc attgaacatg ccaatgaccg aaagaataag agcaggcaag       120
     ctatttaccg atatgtgcga aggcttaccg gaaaaaagac ttcgtgggaa aacgttaatg       180
     tatgagttta atcactcgca tccatcagaa gttgaaaaaa gagaaagcct gattaaagaa       240
     atgtttgcca cggtagggga aaacgcctgg gtagaaccgc ctgtctattt ctcttacggt       300
     tccaacatcc atataggccg caatttttat gcaaatttca atttaaccat tgtcgatgac       360
     tacacggtaa caatcggtga taacgtactg attgcaccca acgttactct ttccgttacg       420
     ggacaccctg tacaccatga attgagaaaa aacggcgaga tgtactcttt tccgataacg       480
     attggcaata acgtctggat cggaagtcat gtggttatta atccaggcgt caccatcggg       540
     gataattctg ttattggcgc gggtagtatc gtcacaaaag acattccacc aaacgtcgtg       600
     gcggctggcg ttccttgtcg ggttattcgc gaaataaacg accgggataa gcactattat       660
     ttcaaagatt ataaagttga atcgtcagtt taaattataa aaattgcctg atacgctgcg       720
     cttatcaggc ctacaagttc agcgatctac attagccgca tccggcatga acaaagcgca       780
     ggaacaagcg tcgcatcatg cctctttgac ccacagctgc ggaaaacgta ctggtgcaaa       840
     acgcagggtt atgatcatca gcccaacgac gcacagcgca tgaaatgccc agtccatcag       900
     gtaattgccg ctgatactac gcagcacgcc agaaaaccac ggggcaagcc cggcgatgat       960
     aaaaccgatt ccctgcataa acgccaccag cttgccagca atagccggtt gcacagagtg      1020
     atcgagcgcc agcagcaaac agagcggaaa cgcgccgccc agacctaacc cacacaccat      1080
     cgcccacaat accggcaatt gcatcggcag ccagataaag ccgcagaacc ccaccagttg      1140
     taacaccagc gccagcatta acagtttgcg ccgatcctga tggcgagcca tagcaggcat      1200
     cagcaaagct cctgcggctt gcccaagcgt catcaatgcc agtaaggaac cgctgtactg      1260
     cgcgctggca ccaatctcaa tatagaaagc gggtaaccag gcaatcaggc tggcgtaacc      1320
     gccgttaatc agaccgaagt aaacacccag cgtccacgcg cggggagtga ataccacgcg      1380
     aaccggagtg gttgttgtct tgtgggaaga ggcgacctcg cgggcgcttt gccaccacca      1440
     ggcaaagagc gcaacaacgg caggcagcgc caccaggcga gtgtttgata ccaggtttcg      1500
     ctatgttgaa ctaaccaggg cgttatggcg gcaccaagcc caccgccgcc catcagagcc      1560
     gcggaccaca gccccatcac cagtggcgtg cgctgctgaa accgccgttt aatcaccgaa      1620
     gcatcaccgc ctgaatgatg ccgatcccca ccccaccaag cagtgcgctg ctaagcagca      1680
     gcgcactttg cgggtaaagc tcacgcatca atgcaccgac ggcaatcagc aacagactga      1740
     tggcgacact gcgacgttcg ctgacatgct gatgaagcca gcttccggcc agcgccagcc      1800
     cgcccatggt aaccaccggc agagcggtcg ac                                    1832
//
ID   V00294; SV 1; linear; genomic DNA; STD; PRO; 1113 BP.
XX
AC   V00294;
XX
DT   09-JUN-1982 (Rel. 01, Created)
DT   10-FEB-1999 (Rel. 58, Last updated, Version 2)
XX
DE   E. coli laci gene (codes for the lac repressor).
XX
KW   DNA binding protein; repressor.
XX
OS   Escherichia coli
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
OC   Enterobacteriaceae; Escherichia.
XX
RN   [1]
RP   1-1113
RX   DOI; 10.1038/274765a0.
RX   PUBMED; 355891.
RA   Farabaugh P.J.;
RT   "Sequence of the lacI gene";
RL   Nature 274(5673):765-769(1978).
XX
CC   KST ECO.LACI
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1113
FT                   /organism="Escherichia coli"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:562"
FT   CDS             31..1113
FT                   /transl_table=11
FT                   /note="reading frame"
FT                   /db_xref="GOA:P03023"
FT                   /db_xref="InterPro:IPR000843"
FT                   /db_xref="InterPro:IPR001761"
FT                   /db_xref="InterPro:IPR010982"
FT                   /db_xref="PDB:1CJG"
FT                   /db_xref="PDB:1EFA"
FT                   /db_xref="PDB:1JWL"
FT                   /db_xref="PDB:1JYE"
FT                   /db_xref="PDB:1JYF"
FT                   /db_xref="PDB:1L1M"
FT                   /db_xref="PDB:1LBG"
FT                   /db_xref="PDB:1LBH"
FT                   /db_xref="PDB:1LBI"
FT                   /db_xref="PDB:1LCC"
FT                   /db_xref="PDB:1LCD"
FT                   /db_xref="PDB:1LQC"
FT                   /db_xref="PDB:1LTP"
FT                   /db_xref="PDB:1OSL"
FT                   /db_xref="PDB:1TLF"
FT                   /db_xref="PDB:1Z04"
FT                   /db_xref="PDB:2BJC"
FT                   /db_xref="PDB:2KEI"
FT                   /db_xref="PDB:2KEJ"
FT                   /db_xref="PDB:2KEK"
FT                   /db_xref="PDB:2P9H"
FT                   /db_xref="PDB:2PAF"
FT                   /db_xref="PDB:2PE5"
FT                   /db_xref="PDB:3EDC"
FT                   /db_xref="UniProtKB/Swiss-Prot:P03023"
FT                   /protein_id="CAA23569.1"
FT                   /translation="MKPVTLYDVAEYAGVSYQTVSRVVNQASHVSAKTREKVEAAMAEL
FT                   NYIPNRVAQQLAGKQSLLIGVATSSLALHAPSQIVAAIKSRADQLGASVVVSMVERSGV
FT                   EACKAAVHNLLAQRVSGLIINYPLDDQDAIAVEAACTNVPALFLDVSDQTPINSIIFSH
FT                   EDGTRLGVEHLVALGHQQIALLAGPLSSVSARLRLAGWHKYLTRNQIQPIAEREGDWSA
FT                   MSGFQQTMQMLNEGIVPTAMLVANDQMALGAMRAITESGLRVGADISVVGYDDTEDSSC
FT                   YIPPSTTIKQDFRLLGQTSVDRLLQLSQGQAVKGNQLLPVSLVKRKTTLAPNTQTASPR
FT                   ALADSLMQLARQVSRLESGQ"
XX
SQ   Sequence 1113 BP; 249 A; 304 C; 322 G; 238 T; 0 other;
     ccggaagaga gtcaattcag ggtggtgaat gtgaaaccag taacgttata cgatgtcgca        60
     gagtatgccg gtgtctctta tcagaccgtt tcccgcgtgg tgaaccaggc cagccacgtt       120
     tctgcgaaaa cgcgggaaaa agtggaagcg gcgatggcgg agctgaatta cattcccaac       180
     cgcgtggcac aacaactggc gggcaaacag tcgttgctga ttggcgttgc cacctccagt       240
     ctggccctgc acgcgccgtc gcaaattgtc gcggcgatta aatctcgcgc cgatcaactg       300
     ggtgccagcg tggtggtgtc gatggtagaa cgaagcggcg tcgaagcctg taaagcggcg       360
     gtgcacaatc ttctcgcgca acgcgtcagt gggctgatca ttaactatcc gctggatgac       420
     caggatgcca ttgctgtgga agctgcctgc actaatgttc cggcgttatt tcttgatgtc       480
     tctgaccaga cacccatcaa cagtattatt ttctcccatg aagacggtac gcgactgggc       540
     gtggagcatc tggtcgcatt gggtcaccag caaatcgcgc tgttagcggg cccattaagt       600
     tctgtctcgg cgcgtctgcg tctggctggc tggcataaat atctcactcg caatcaaatt       660
     cagccgatag cggaacggga aggcgactgg agtgccatgt ccggttttca acaaaccatg       720
     caaatgctga atgagggcat cgttcccact gcgatgctgg ttgccaacga tcagatggcg       780
     ctgggcgcaa tgcgcgccat taccgagtcc gggctgcgcg ttggtgcgga tatctcggta       840
     gtgggatacg acgataccga agacagctca tgttatatcc cgccgtcaac caccatcaaa       900
     caggattttc gcctgctggg gcaaaccagc gtggaccgct tgctgcaact ctctcagggc       960
     caggcggtga agggcaatca gctgttgccc gtctcactgg tgaaaagaaa aaccaccctg      1020
     gcgcccaata cgcaaaccgc ctctccccgc gcgttggccg attcattaat gcagctggca      1080
     cgacaggttt cccgactgga aagcgggcag tga                                   1113
//
ID   V00295; SV 1; linear; genomic DNA; STD; PRO; 1500 BP.
XX
AC   V00295;
XX
DT   09-JUN-1982 (Rel. 01, Created)
DT   07-JUL-1995 (Rel. 44, Last updated, Version 4)
XX
DE   E. coli lacY gene (codes for lactose permease).
XX
KW   membrane protein.
XX
OS   Escherichia coli
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
OC   Enterobacteriaceae; Escherichia.
XX
RN   [1]
RP   1-1500
RX   DOI; 10.1038/283541a0.
RX   PUBMED; 6444453.
RA   Buechel D.E., Gronenborn B., Mueller-Hill B.;
RT   "Sequence of the lactose permease gene";
RL   Nature 283(5747):541-545(1980).
XX
CC   lacZ is a beta-galactosidase and lacA is transacetylase.
CC   KST ECO.LACY
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1500
FT                   /organism="Escherichia coli"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:562"
FT   CDS             <1..54
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /note="reading frame (lacZ)"
FT                   /db_xref="GOA:P00722"
FT                   /db_xref="InterPro:IPR004199"
FT                   /db_xref="InterPro:IPR006101"
FT                   /db_xref="InterPro:IPR006102"
FT                   /db_xref="InterPro:IPR006103"
FT                   /db_xref="InterPro:IPR006104"
FT                   /db_xref="InterPro:IPR008979"
FT                   /db_xref="InterPro:IPR011013"
FT                   /db_xref="InterPro:IPR013781"
FT                   /db_xref="InterPro:IPR013812"
FT                   /db_xref="InterPro:IPR014718"
FT                   /db_xref="InterPro:IPR017853"
FT                   /db_xref="PDB:1BGL"
FT                   /db_xref="PDB:1BGM"
FT                   /db_xref="PDB:1DP0"
FT                   /db_xref="PDB:1F49"
FT                   /db_xref="PDB:1F4A"
FT                   /db_xref="PDB:1F4H"
FT                   /db_xref="PDB:1GHO"
FT                   /db_xref="PDB:1HN1"
FT                   /db_xref="PDB:1JYN"
FT                   /db_xref="PDB:1JYV"
FT                   /db_xref="PDB:1JYW"
FT                   /db_xref="PDB:1JYX"
FT                   /db_xref="PDB:1JYY"
FT                   /db_xref="PDB:1JYZ"
FT                   /db_xref="PDB:1JZ0"
FT                   /db_xref="PDB:1JZ1"
FT                   /db_xref="PDB:1JZ2"
FT                   /db_xref="PDB:1JZ3"
FT                   /db_xref="PDB:1JZ4"
FT                   /db_xref="PDB:1JZ5"
FT                   /db_xref="PDB:1JZ6"
FT                   /db_xref="PDB:1JZ7"
FT                   /db_xref="PDB:1JZ8"
FT                   /db_xref="PDB:1PX3"
FT                   /db_xref="PDB:1PX4"
FT                   /db_xref="PDB:3CZJ"
FT                   /db_xref="PDB:3DYM"
FT                   /db_xref="PDB:3DYO"
FT                   /db_xref="PDB:3DYP"
FT                   /db_xref="PDB:3E1F"
FT                   /db_xref="PDB:3IAP"
FT                   /db_xref="PDB:3IAQ"
FT                   /db_xref="UniProtKB/Swiss-Prot:P00722"
FT                   /protein_id="CAA23570.1"
FT                   /translation="FQLSAGRYHYQLVWCQK"
FT   CDS             106..1359
FT                   /transl_table=11
FT                   /note="reading frame (lacY)"
FT                   /db_xref="GOA:P02920"
FT                   /db_xref="InterPro:IPR000576"
FT                   /db_xref="InterPro:IPR016196"
FT                   /db_xref="InterPro:IPR018457"
FT                   /db_xref="InterPro:IPR020480"
FT                   /db_xref="PDB:1M2U"
FT                   /db_xref="PDB:1PV6"
FT                   /db_xref="PDB:1PV7"
FT                   /db_xref="PDB:2CFP"
FT                   /db_xref="PDB:2CFQ"
FT                   /db_xref="PDB:2V8N"
FT                   /db_xref="UniProtKB/Swiss-Prot:P02920"
FT                   /protein_id="CAA23571.1"
FT                   /translation="MYYLKNTNFWMFGLFFFFYFFIMGAYFPFFPIWLHDINHISKSDT
FT                   GIIFAAISLFSLLFQPLFGLLSDKLGLRKYLLWIITGMLVMFAPFFIFIFGPLLQYNIL
FT                   VGSIVGGIYLGFCFNAGAPAVEAFIEKVSRRSNFEFGRARMFGCVGWALCASIVGIMFT
FT                   INNQFVFWLGSGCALILAVLLFFAKTDAPSSATVANAVGANHSAFSLKLALELFRQPKL
FT                   WFLSLYVIGVSCTYDVFDQQFANFFTSFFATGEQGTRVFGYVTTMGELLNASIMFFAPL
FT                   IINRIGGKNALLLAGTIMSVRIIGSSFATSALEVVILKTLHMFEVPFLLVGCFKYITSQ
FT                   FEVRFSATIYLVCFCFFKQLAMIFMSVLAGNMYESIGFQGAYLVLGLVALGFTLISVFT
FT                   LSGPGPLSLLRRQVNEVA"
FT   CDS             1423..>1500
FT                   /transl_table=11
FT                   /note="reading frame (lacA)"
FT                   /db_xref="GOA:P07464"
FT                   /db_xref="InterPro:IPR001451"
FT                   /db_xref="InterPro:IPR011004"
FT                   /db_xref="InterPro:IPR018357"
FT                   /db_xref="PDB:1KQA"
FT                   /db_xref="PDB:1KRR"
FT                   /db_xref="PDB:1KRU"
FT                   /db_xref="PDB:1KRV"
FT                   /db_xref="UniProtKB/Swiss-Prot:P07464"
FT                   /protein_id="CAA23572.1"
FT                   /translation="MNMPMTERIRAGKLFTDMCEGLPEKR"
XX
SQ   Sequence 1500 BP; 315 A; 342 C; 357 G; 486 T; 0 other;
     ttccagctga gcgccggtcg ctaccattac cagttggtct ggtgtcaaaa ataataataa        60
     ccgggcaggc catgtctgcc cgtatttcgc gtaaggaaat ccattatgta ctatttaaaa       120
     aacacaaact tttggatgtt cggtttattc tttttctttt acttttttat catgggagcc       180
     tacttcccgt ttttcccgat ttggctacat gacatcaacc atatcagcaa aagtgatacg       240
     ggtattattt ttgccgctat ttctctgttc tcgctattat tccaaccgct gtttggtctg       300
     ctttctgaca aactcgggct gcgcaaatac ctgctgtgga ttattaccgg catgttagtg       360
     atgtttgcgc cgttctttat ttttatcttc gggccactgt tacaatacaa cattttagta       420
     ggatcgattg ttggtggtat ttatctaggc ttttgtttta acgccggtgc gccagcagta       480
     gaggcattta ttgagaaagt cagccgtcgc agtaatttcg aatttggtcg cgcgcggatg       540
     tttggctgtg ttggctgggc gctgtgtgcc tcgattgtcg gcatcatgtt caccatcaat       600
     aatcagtttg ttttctggct gggctctggc tgtgcactca tcctcgccgt tttactcttt       660
     ttcgccaaaa cggatgcgcc ctcttctgcc acggttgcca atgcggtagg tgccaaccat       720
     tcggcattta gccttaagct ggcactggaa ctgttcagac agccaaaact gtggtttttg       780
     tcactgtatg ttattggcgt ttcctgcacc tacgatgttt ttgaccaaca gtttgctaat       840
     ttctttactt cgttctttgc taccggtgaa cagggtacgc gggtatttgg ctacgtaacg       900
     acaatgggcg aattacttaa cgcctcgatt atgttctttg cgccactgat cattaatcgc       960
     atcggtggga aaaacgccct gctgctggct ggcactatta tgtctgtacg tattattggc      1020
     tcatcgttcg ccacctcagc gctggaagtg gttattctga aaacgctgca tatgtttgaa      1080
     gtaccgttcc tgctggtggg ctgctttaaa tatattacca gccagtttga agtgcgtttt      1140
     tcagcgacga tttatctggt ctgtttctgc ttctttaagc aactggcgat gatttttatg      1200
     tctgtactgg cgggcaatat gtatgaaagc atcggtttcc agggcgctta tctggtgctg      1260
     ggtctggtgg cgctgggctt caccttaatt tccgtgttca cgcttagcgg ccccggcccg      1320
     ctttccctgc tgcgtcgtca ggtgaatgaa gtcgcttaag caatcaatgt cggatgcggc      1380
     gcgacgctta tccgaccaac atatcataac ggagtgatcg cattgaacat gccaatgacc      1440
     gaaagaataa gagcaggcaa gctatttacc gatatgtgcg aaggcttacc ggaaaaaaga      1500
//
ID   V00296; SV 1; linear; genomic DNA; STD; PRO; 3078 BP.
XX
AC   V00296;
XX
DT   13-JUL-1983 (Rel. 03, Created)
DT   18-APR-2005 (Rel. 83, Last updated, Version 5)
XX
DE   E. coli gene lacZ coding for beta-galactosidase (EC 3.2.1.23).
XX
KW   galactosidase.
XX
OS   Escherichia coli
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
OC   Enterobacteriaceae; Escherichia.
XX
RN   [1]
RP   1-3078
RX   PUBMED; 6313347.
RA   Kalnins A., Otto K., Ruether U., Mueller-Hill B.;
RT   "Sequence of the lacZ gene of Escherichia coli";
RL   EMBO J. 2(4):593-597(1983).
XX
RN   [2]
RX   PUBMED; 3038536.
RA   Zell R., Fritz H.J.;
RT   "DNA mismatch-repair in Escherichia coli counteracting the hydrolytic
RT   deamination of 5-methyl-cytosine residues";
RL   EMBO J. 6(6):1809-1815(1987).
XX
CC   Data kindly reviewed (18-MAY-1983) by U. Ruether
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..3078
FT                   /organism="Escherichia coli"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:562"
FT   CDS             <1..3072
FT                   /transl_table=11
FT                   /note="galactosidase"
FT                   /db_xref="GOA:P00722"
FT                   /db_xref="InterPro:IPR004199"
FT                   /db_xref="InterPro:IPR006101"
FT                   /db_xref="InterPro:IPR006102"
FT                   /db_xref="InterPro:IPR006103"
FT                   /db_xref="InterPro:IPR006104"
FT                   /db_xref="InterPro:IPR008979"
FT                   /db_xref="InterPro:IPR011013"
FT                   /db_xref="InterPro:IPR013781"
FT                   /db_xref="InterPro:IPR013812"
FT                   /db_xref="InterPro:IPR014718"
FT                   /db_xref="InterPro:IPR017853"
FT                   /db_xref="PDB:1BGL"
FT                   /db_xref="PDB:1BGM"
FT                   /db_xref="PDB:1DP0"
FT                   /db_xref="PDB:1F49"
FT                   /db_xref="PDB:1F4A"
FT                   /db_xref="PDB:1F4H"
FT                   /db_xref="PDB:1GHO"
FT                   /db_xref="PDB:1HN1"
FT                   /db_xref="PDB:1JYN"
FT                   /db_xref="PDB:1JYV"
FT                   /db_xref="PDB:1JYW"
FT                   /db_xref="PDB:1JYX"
FT                   /db_xref="PDB:1JYY"
FT                   /db_xref="PDB:1JYZ"
FT                   /db_xref="PDB:1JZ0"
FT                   /db_xref="PDB:1JZ1"
FT                   /db_xref="PDB:1JZ2"
FT                   /db_xref="PDB:1JZ3"
FT                   /db_xref="PDB:1JZ4"
FT                   /db_xref="PDB:1JZ5"
FT                   /db_xref="PDB:1JZ6"
FT                   /db_xref="PDB:1JZ7"
FT                   /db_xref="PDB:1JZ8"
FT                   /db_xref="PDB:1PX3"
FT                   /db_xref="PDB:1PX4"
FT                   /db_xref="PDB:3CZJ"
FT                   /db_xref="PDB:3DYM"
FT                   /db_xref="PDB:3DYO"
FT                   /db_xref="PDB:3DYP"
FT                   /db_xref="PDB:3E1F"
FT                   /db_xref="PDB:3IAP"
FT                   /db_xref="PDB:3IAQ"
FT                   /db_xref="UniProtKB/Swiss-Prot:P00722"
FT                   /protein_id="CAA23573.1"
FT                   /translation="TMITDSLAVVLQRRDWENPGVTQLNRLAAHPPFASWRNSEEARTD
FT                   RPSQQLRSLNGEWRFAWFPAPEAVPESWLECDLPEADTVVVPSNWQMHGYDAPIYTNVT
FT                   YPITVNPPFVPTENPTGCYSLTFNVDESWLQEGQTRIIFDGVNSAFHLWCNGRWVGYGQ
FT                   DSRLPSEFDLSAFLRAGENRLAVMVLRWSDGSYLEDQDMWRMSGIFRDVSLLHKPTTQI
FT                   SDFHVATRFNDDFSRAVLEAEVQMCGELRDYLRVTVSLWQGETQVASGTAPFGGEIIDE
FT                   RGGYADRVTLRLNVENPKLWSAEIPNLYRAVVELHTADGTLIEAEACDVGFREVRIENG
FT                   LLLLNGKPLLIRGVNRHEHHPLHGQVMDEQTMVQDILLMKQNNFNAVRCSHYPNHPLWY
FT                   TLCDRYGLYVVDEANIETHGMVPMNRLTDDPRWLPAMSERVTRMVQRDRNHPSVIIWSL
FT                   GNESGHGANHDALYRWIKSVDPSRPVQYEGGGADTTATDIICPMYARVDEDQPFPAVPK
FT                   WSIKKWLSLPGETRPLILCEYAHAMGNSLGGFAKYWQAFRQYPRLQGGFVWDWVDQSLI
FT                   KYDENGNPWSAYGGDFGDTPNDRQFCMNGLVFADRTPHPALTEAKHQQQFFQFRLSGQT
FT                   IEVTSEYLFRHSDNELLHWMVALDGKPLASGEVPLDVAPQGKQLIELPELPQPESAGQL
FT                   WLTVRVVQPNATAWSEAGHISAWQQWRLAENLSVTLPAASHAIPHLTTSEMDFCIELGN
FT                   KRWQFNRQSGFLSQMWIGDKKQLLTPLRDQFTRAPLDNDIGVSEATRIDPNAWVERWKA
FT                   AGHYQAEAALLQCTADTLADAVLITTAHAWQHQGKTLFISRKTYRIDGSGQMAITVDVE
FT                   VASDTPHPARIGLNCQLAQVAERVNWLGLGPQENYPDRLTAACFDRWDLPLSDMYTPYV
FT                   FPSENGLRCGTRELNYGPHQWRGDFQFNISRYSQQQLMETSHRHLLHAEEGTWLNIDGF
FT                   HMGIGGDDSWSPSVSAEFQLSAGRYHYQLVWCQK"
FT   mat_peptide     1..3069
XX
SQ   Sequence 3078 BP; 682 A; 841 C; 886 G; 669 T; 0 other;
     accatgatta cggattcact ggccgtcgtt ttacaacgtc gtgactggga aaaccctggc        60
     gttacccaac ttaatcgcct tgcagcacat ccccctttcg ccagctggcg taatagcgaa       120
     gaggcccgca ccgatcgccc ttcccaacag ttgcgcagcc tgaatggcga atggcgcttt       180
     gcctggtttc cggcaccaga agcggtgccg gaaagctggc tggagtgcga tcttcctgag       240
     gccgatactg tcgtcgtccc ctcaaactgg cagatgcacg gttacgatgc gcccatctac       300
     accaacgtaa cctatcccat tacggtcaat ccgccgtttg ttcccacgga gaatccgacg       360
     ggttgttact cgctcacatt taatgttgat gaaagctggc tacaggaagg ccagacgcga       420
     attatttttg atggcgttaa ctcggcgttt catctgtggt gcaacgggcg ctgggtcggt       480
     tacggccagg acagtcgttt gccgtctgaa tttgacctga gcgcattttt acgcgccgga       540
     gaaaaccgcc tcgcggtgat ggtgctgcgt tggagtgacg gcagttatct ggaagatcag       600
     gatatgtggc ggatgagcgg cattttccgt gacgtctcgt tgctgcataa accgactaca       660
     caaatcagcg atttccatgt tgccactcgc tttaatgatg atttcagccg cgctgtactg       720
     gaggctgaag ttcagatgtg cggcgagttg cgtgactacc tacgggtaac agtttcttta       780
     tggcagggtg aaacgcaggt cgccagcggc accgcgcctt tcggcggtga aattatcgat       840
     gagcgtggtg gttatgccga tcgcgtcaca ctacgtctga acgtcgaaaa cccgaaactg       900
     tggagcgccg aaatcccgaa tctctatcgt gcggtggttg aactgcacac cgccgacggc       960
     acgctgattg aagcagaagc ctgcgatgtc ggtttccgcg aggtgcggat tgaaaatggt      1020
     ctgctgctgc tgaacggcaa gccgttgctg attcgaggcg ttaaccgtca cgagcatcat      1080
     cctctgcatg gtcaggtcat ggatgagcag acgatggtgc aggatatcct gctgatgaag      1140
     cagaacaact ttaacgccgt gcgctgttcg cattatccga accatccgct gtggtacacg      1200
     ctgtgcgacc gctacggcct gtatgtggtg gatgaagcca atattgaaac ccacggcatg      1260
     gtgccaatga atcgtctgac cgatgatccg cgctggctac cggcgatgag cgaacgcgta      1320
     acgcgaatgg tgcagcgcga tcgtaatcac ccgagtgtga tcatctggtc gctggggaat      1380
     gaatcaggcc acggcgctaa tcacgacgcg ctgtatcgct ggatcaaatc tgtcgatcct      1440
     tcccgcccgg tgcagtatga aggcggcgga gccgacacca cggccaccga tattatttgc      1500
     ccgatgtacg cgcgcgtgga tgaagaccag cccttcccgg ctgtgccgaa atggtccatc      1560
     aaaaaatggc tttcgctacc tggagagacg cgcccgctga tcctttgcga atacgcccac      1620
     gcgatgggta acagtcttgg cggtttcgct aaatactggc aggcgtttcg tcagtatccc      1680
     cgtttacagg gcggcttcgt ctgggactgg gtggatcagt cgctgattaa atatgatgaa      1740
     aacggcaacc cgtggtcggc ttacggcggt gattttggcg atacgccgaa cgatcgccag      1800
     ttctgtatga acggtctggt ctttgccgac cgcacgccgc atccagcgct gacggaagca      1860
     aaacaccagc agcagttttt ccagttccgt ttatccgggc aaaccatcga agtgaccagc      1920
     gaatacctgt tccgtcatag cgataacgag ctcctgcact ggatggtggc gctggatggt      1980
     aagccgctgg caagcggtga agtgcctctg gatgtcgctc cacaaggtaa acagttgatt      2040
     gaactgcctg aactaccgca gccggagagc gccgggcaac tctggctcac agtacgcgta      2100
     gtgcaaccga acgcgaccgc atggtcagaa gccgggcaca tcagcgcctg gcagcagtgg      2160
     cgtctggcgg aaaacctcag tgtgacgctc cccgccgcgt cccacgccat cccgcatctg      2220
     accaccagcg aaatggattt ttgcatcgag ctgggtaata agcgttggca atttaaccgc      2280
     cagtcaggct ttctttcaca gatgtggatt ggcgataaaa aacaactgct gacgccgctg      2340
     cgcgatcagt tcacccgtgc accgctggat aacgacattg gcgtaagtga agcgacccgc      2400
     attgacccta acgcctgggt cgaacgctgg aaggcggcgg gccattacca ggccgaagca      2460
     gcgttgttgc agtgcacggc agatacactt gctgatgcgg tgctgattac gaccgctcac      2520
     gcgtggcagc atcaggggaa aaccttattt atcagccgga aaacctaccg gattgatggt      2580
     agtggtcaaa tggcgattac cgttgatgtt gaagtggcga gcgatacacc gcatccggcg      2640
     cggattggcc tgaactgcca gctggcgcag gtagcagagc gggtaaactg gctcggatta      2700
     gggccgcaag aaaactatcc cgaccgcctt actgccgcct gttttgaccg ctgggatctg      2760
     ccattgtcag acatgtatac cccgtacgtc ttcccgagcg aaaacggtct gcgctgcggg      2820
     acgcgcgaat tgaattatgg cccacaccag tggcgcggcg acttccagtt caacatcagc      2880
     cgctacagtc aacagcaact gatggaaacc agccatcgcc atctgctgca cgcggaagaa      2940
     ggcacatggc tgaatatcga cggtttccat atggggattg gtggcgacga ctcctggagc      3000
     ccgtcagtat cggcggaatt ccagctgagc gccggtcgct accattacca gttggtctgg      3060
     tgtcaaaaat aataataa                                                    3078
//
ID   V00307; SV 1; linear; genomic DNA; STD; PRO; 2271 BP.
XX
AC   V00307; J01654;
XX
DT   09-JUN-1982 (Rel. 01, Created)
DT   01-OCT-1996 (Rel. 49, Last updated, Version 8)
XX
DE   E. coli ompA gene (codes for the outer membrane protein II*).
XX
KW   membrane protein; unidentified reading frame.
XX
OS   Escherichia coli
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
OC   Enterobacteriaceae; Escherichia.
XX
RN   [1]
RP   1-2271
RX   DOI; 10.1093/nar/8.13.3011.
RX   PUBMED; 6253901.
RA   Beck E., Bremer E.;
RT   "Nucleotide sequence of the gene ompA coding the outer membrane protein II
RT   of Escherichia coli K-12";
RL   Nucleic Acids Res. 8(13):3011-3027(1980).
XX
RN   [2]
RP   783-1317
RX   DOI; 10.1073/pnas.77.7.3845.
RX   PUBMED; 7001445.
RA   Movva N.R., Nakamura K., Inouye M.;
RT   "Regulatory region of the gene for the ompA protein, a major outer membrane
RT   protein of Escherichia coli";
RL   Proc. Natl. Acad. Sci. U.S.A. 77(7):3845-3849(1980).
XX
DR   GOA; P0A8N0.
DR   InterPro; IPR009390; DUF1047.
DR   UniProtKB/Swiss-Prot; P0A8N0; YCBG_ECOLI.
XX
CC   KST ECO.OMPA
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..2271
FT                   /organism="Escherichia coli"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:562"
FT   CDS             172..669
FT                   /transl_table=11
FT                   /note="reading frame (unknown protein)"
FT                   /db_xref="GOA:P0AFZ5"
FT                   /db_xref="InterPro:IPR004596"
FT                   /db_xref="UniProtKB/Swiss-Prot:P0AFZ5"
FT                   /protein_id="CAA23587.1"
FT                   /translation="MYTSGYAHRSSSFSSAASKIARVSTENTTAGLISEVVYREDQPMM
FT                   TQLLLLPLLQQLGQQSRWQLWLTPQQKLSREWVQASGLPLTKVMQISQLSPCHTVESMV
FT                   RALRTGNYSVVIGWLADDLTEEEHAEVVDAANEGNAMGFIIHSGKRILSRHETTFRAKN
FT                   SL"
FT   conflict        906..906
FT                   /note="may be missing [2]"
FT                   /citation=[2]
FT   CDS             1037..2077
FT                   /transl_table=11
FT                   /gene="ompA"
FT                   /product="ompA protein"
FT                   /db_xref="GOA:P0A910"
FT                   /db_xref="InterPro:IPR002368"
FT                   /db_xref="InterPro:IPR006664"
FT                   /db_xref="InterPro:IPR006665"
FT                   /db_xref="InterPro:IPR006690"
FT                   /db_xref="InterPro:IPR011250"
FT                   /db_xref="PDB:1BXW"
FT                   /db_xref="PDB:1G90"
FT                   /db_xref="PDB:1QJP"
FT                   /db_xref="PDB:2GE4"
FT                   /db_xref="PDB:2JMM"
FT                   /db_xref="UniProtKB/Swiss-Prot:P0A910"
FT                   /protein_id="CAA23588.1"
FT                   /translation="MKKTAIAIAVALAGFATVAQAAPKDNTWYTGAKLGWSQYHDTGFI
FT                   NNNGPTHENQLGAGAFGGYQVNPYVGFEMGYDWLGRMPYKGSVENGAYKAQGVQLTAKL
FT                   GYPITDDLDIYTRLGGMVWRADTKSNVYGKNHDTGVSPVFAGGVEYAITPEIATRLEYQ
FT                   WTNNIGDAHTIGTRPDNGMLSLGVSYRFGQGEAAPVVAPAPAPAPEVQTKHFTLKSDVL
FT                   FNFNKATLKPEGQAALDQLYSQLSNLDPKDGSVVVLGYTDRIGSDAYNQGLSERRAQSV
FT                   VDYLISKGIPADKISARGMGESNPVTGNTCDNVKQRAALIDCLAPDRRVEIEVKGIKDV
FT                   VTQPQA"
XX
SQ   Sequence 2271 BP; 567 A; 552 C; 548 G; 604 T; 0 other;
     gatccgttaa ctacgaaaat aggcaactta ttcttaaggg gcaagattaa tttatgtttt        60
     cccgtcacca acgacaaaat ttgcgaggct ctttccgaaa atagggttga tctttgttgt       120
     cactggatgt actgtacatc catacagtaa ctcacagggg ctggattgat tatgtacact       180
     tcaggctatg cacatcgttc ttcgtcgttc tcatccgcag caagtaaaat tgcgcgtgtc       240
     tctacggaaa acactacagc cgggcttatc agtgaagttg tctatcgcga agatcagccc       300
     atgatgacgc aacttctact gttgccattg ttacagcaac tcggtcagca atcgcgctgg       360
     caactctggt taacaccgca acaaaaactg agtcgggaat gggttcaggc atctgggcta       420
     cccttaacga aagtaatgca gattagccag ctctcccctt gccacactgt ggagtcaatg       480
     gttcgcgctt tacgcacggg caattacagt gtggtgatcg gttggttggc agatgatttg       540
     actgaagaag agcatgctga agttgttgat gcggcaaatg aaggtaacgc tatggggttt       600
     attatacatt ccggtaagcg catcctctca cgccacgaga caactttccg ggctaaaaat       660
     tcactctaat ttgtatcatt aagtaaattt aggattaatc ctggaacttt ttttgtcgcc       720
     cagccaatgc tttcagtcgt gactaatttc cttgcggagg cttgtctgag cggtttccgc       780
     gattctcttc tgtaaattgt cgctgacaaa aaagattaaa cataccttat acaagacttt       840
     tttttcatat gcctgacgga gttcacactt gtaagttttc aactacgttg tagactttac       900
     atcgccaagg gtgctcggca taagccgaag atatcggtag agttaatatt gagcagatcc       960
     cccggtgaag gatttaaccg tgttatctcg ttggagatat tcatggcgta ttttggatga      1020
     taacgaggcg caaaaaatga aaaagacagc tatcgcgatt gcagtggcac tggctggttt      1080
     cgctaccgta gcgcaggccg ctccgaaaga taacacctgg tacactggtg ctaaactggg      1140
     ctggtcccag taccatgata ctggtttcat caacaacaat ggcccgaccc atgaaaacca      1200
     actgggcgct ggtgcttttg gtggttacca ggttaacccg tatgttggct ttgaaatggg      1260
     ttacgactgg ttaggtcgta tgccgtacaa aggcagcgtt gaaaacggtg catacaaagc      1320
     tcagggcgtt caactgaccg ctaaactggg ttacccaatc actgacgacc tggacatcta      1380
     cactcgtctg ggtggcatgg tatggcgtgc agacactaaa tccaacgttt atggtaaaaa      1440
     ccacgacacc ggcgtttctc cggtcttcgc tggcggtgtt gagtacgcga tcactcctga      1500
     aatcgctacc cgtctggaat accagtggac gaacaacatc ggtgacgcac acaccatcgg      1560
     cactcgtccg gacaacggca tgctgagcct gggtgtttcc taccgtttcg gtcagggcga      1620
     ggcagctcca gtagttgctc cggctccagc tccggcaccg gaagtacaga ccaagcactt      1680
     cactctgaag tctgacgttc tgttcaactt caacaaagca accctgaaac cggaaggtca      1740
     ggctgctctg gatcagctgt acagccagct gagcaacttg gatccgaaag acggttccgt      1800
     agttgttctg ggttacaccg accgcatcgg ttctgacgct tacaaccagg gtctgtccga      1860
     gcgccgtgct cagtctgttg ttgattacct gatctccaaa ggtatcccgg cagacaagat      1920
     ctccgcacgt ggtatgggcg aatccaaccc ggttactggc aacacctgtg acaacgtgaa      1980
     acagcgtgct gcactgatcg actgcctggc tccggatcgt cgcgtagaga tcgaagttaa      2040
     aggtatcaaa gacgttgtaa ctcagccgca ggcttaagtt ctcgtctggt agaaaaacgc      2100
     tgctgcgggt ttttttttgc ctttagtaaa ttgaactgac tttcgtcagt tattccttac      2160
     ccagcaatgc ctgcagatcc tgcttcagag aagacatttt attcgcgtat ttctctttgt      2220
     tttccgcatc ttcaatcagc tgaacaatcg tttcagaaag cgttttaccg c               2271
//
ID   X77160; SV 1; linear; genomic DNA; STD; PRO; 1212 BP.
XX
AC   X77160;
XX
DT   13-APR-1994 (Rel. 39, Created)
DT   18-APR-2005 (Rel. 83, Last updated, Version 8)
XX
DE   Pseudomonas aeruginosa (PAC1) amiB gene.
XX
KW   amiB gene.
XX
OS   Pseudomonas aeruginosa
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Pseudomonadales;
OC   Pseudomonadaceae; Pseudomonas.
XX
RN   [1]
RA   Wilson S.A., Wachira S.M., Drew R.E., Jones D., Pearl L.H.;
RT   "Identification of a putative ABC transporter in the Pseudomonas aeruginosa
RT   amidase operon";
RL   Unpublished.
XX
RN   [2]
RP   1-1212
RA   Wilson S.A.;
RT   ;
RL   Submitted (17-JAN-1994) to the EMBL/GenBank/DDBJ databases.
RL   S.A. Wilson, University College London, Dept of Biochemistry, Gower Street,
RL   London WC1E 6BT, UK
XX
RN   [3]
RP   1-1212
RX   DOI; 10.1074/jbc.270.32.18818.
RX   PUBMED; 7642533.
RA   Wilson S.A., Williams R.J., Pearl L.H., Drew R.E.;
RT   "Identification of two new genes in the Pseudomonas aeruginosa amidase
RT   operon, encoding an ATPase (AmiB) and a putative integral membrane protein
RT   (AmiS)";
RL   J. Biol. Chem. 270(32):18818-18824(1995).
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1212
FT                   /organism="Pseudomonas aeruginosa"
FT                   /strain="PAC1"
FT                   /mol_type="genomic DNA"
FT                   /clone="plasmid pAS20"
FT                   /db_xref="taxon:287"
FT   CDS             97..1212
FT                   /transl_table=11
FT                   /gene="amiB"
FT                   /db_xref="GOA:Q51416"
FT                   /db_xref="InterPro:IPR001270"
FT                   /db_xref="InterPro:IPR003593"
FT                   /db_xref="InterPro:IPR013093"
FT                   /db_xref="InterPro:IPR019489"
FT                   /db_xref="UniProtKB/Swiss-Prot:Q51416"
FT                   /protein_id="CAA54405.1"
FT                   /translation="MPFLSDMLDQSRRQQDEEQALARENLAEASLLQAHLSHRSALHSR
FT                   FRFDPAAVMDCLRAEVLGQEPALQAVEDMLKVVRADIADPRRPLFSALFLGPTGVGKTE
FT                   IVRALARALHGDAEGFCRVDMNTLSQEHYAAALTGAPPGYVGAKEGTTLLEQDKLDGSP
FT                   GRPGIVLFDELEKASPEVVHALLNVLDNGLLRVASGERTYHFRNTLVFMTSNLCAHEIQ
FT                   RYDERRQRLPWRLLPVGGERRRRDIDGMVRARLLKTFSPEFVNRLDSVVTFNWIERDVV
FT                   ARLVELEVQRLNRRLEKHRCRLEATPEVLAKIARAGFDRQFGARALRRSVRHHLEVPLA
FT                   EHLLDHHQPGDGNCTIYLASLEHERVRFVRR"
XX
SQ   Sequence 1212 BP; 193 A; 426 C; 403 G; 190 T; 0 other;
     gaaggaagcc tgacggcaga cgccgccagc ccggcgtgcc gtcgtgcggc acgccgtctc        60
     cgccatttcc cccctgtggc agaaggagtt tcatccatgc cttttctgag cgacatgctc       120
     gaccagtccc gccggcagca ggacgaggaa caggccctgg cgcgggagaa tcttgccgag       180
     gcaagtctgc tccaggccca cctgagtcac cgcagcgccc tgcacagccg tttccgtttc       240
     gacccggcgg cggtgatgga ctgcctgcgc gccgaggtgc tcggccagga accggcgcta       300
     caggccgtcg aggacatgct caaggtggtt cgcgcggaca tcgccgaccc gcgccgtccg       360
     ctgttcagcg cgctgttcct cggccccacc ggagtcggca agaccgagat cgtgcgcgcc       420
     ctggccaggg ccctgcacgg cgacgccgag gggttctgcc gggtggacat gaacaccctg       480
     tcccaggagc actatgccgc cgccctcacc ggtgcgccgc cgggctacgt cggggcgaag       540
     gagggcacca ccctgttgga gcaggacaag ctggacggca gtcccgggcg ccccggcatc       600
     gttctcttcg acgaactgga aaaggccagc ccggaagtgg tccatgcgtt gctcaacgta       660
     ctcgacaacg gcctgctacg ggtcgcttcc ggcgaacgca cctaccattt ccgcaacacc       720
     ctggtgttca tgaccagcaa tctctgcgcc catgagatcc agcgctacga cgagcgtcgc       780
     cagcgcctgc cctggcgcct gctgccggtc ggcggcgagc gccggcggcg ggacatcgac       840
     gggatggtcc gggcccggct gctgaagacc ttctcgccgg agttcgtcaa tcgtctcgat       900
     agcgtggtca ccttcaactg gatcgaacgc gacgtcgtcg cgcgcctggt cgagctggag       960
     gtgcagcggc tcaaccggcg cctggagaag catcgctgcc gcctggaggc gaccccggag      1020
     gtgctggcga agatcgcccg cgccggcttc gaccggcagt tcggcgcccg tgcgttgcgc      1080
     cgcagcgtcc gtcatcatct cgaggtaccg ctggccgagc atctgctcga tcaccaccag      1140
     ccgggcgacg ggaactgcac gatctacctg gcgagcctgg agcacgagcg ggttcgcttc      1200
     gtacggcgct ga                                                          1212
//
ID   M27612; SV 1; linear; genomic DNA; STD; PRO; 1065 BP.
XX
AC   M27612;
XX
DT   02-FEB-1990 (Rel. 22, Created)
DT   22-APR-2002 (Rel. 71, Last updated, Version 4)
XX
DE   Pseudomonas aeruginosa aliphatic amidase (amiE) gene, complete cds.
XX
KW   .
XX
OS   Pseudomonas aeruginosa
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Pseudomonadales;
OC   Pseudomonadaceae; Pseudomonas.
XX
RN   [1]
RP   1-1065
RX   DOI; 10.1016/0014-5793(87)80164-3.
RX   PUBMED; 3108030.
RA   Brammar W.J., Charles I.G., Matfield M., Liu C.P., Drew R.E., Clarke P.H.;
RT   "The nucleotide sequence of the amiE gene of Pseudomonas aeruginosa";
RL   FEBS Lett. 215(2):291-294(1987).
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1065
FT                   /organism="Pseudomonas aeruginosa"
FT                   /strain="PAC433"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:287"
FT   CDS             25..1065
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="amiE"
FT                   /product="aliphatic amidase"
FT                   /EC_number="3.5.1.4"
FT                   /db_xref="GOA:P11436"
FT                   /db_xref="InterPro:IPR003010"
FT                   /db_xref="PDB:1K17"
FT                   /db_xref="PDB:2UXY"
FT                   /db_xref="UniProtKB/Swiss-Prot:P11436"
FT                   /protein_id="AAA25697.1"
FT                   /translation="MRHGDISSSNDTVGVAVVNYKMPRLHTAAEVLDNARKIADMIVGM
FT                   KQGLPGMDLVVFPEYSLQGIMYDPAEMMETAVAIPGEETEIFSRACRKANVWGVFSLTG
FT                   ERHEEHPRKAPYNTLVLIDNNGEIVQKYRKIIPWCPIEGWYPGGQTYVSEGPKGMKISL
FT                   IICDDPNYPEIWRDCAMKGAELIVRCQGYMYPAKDQQVMMAKAMAWANNCYVAVANAAG
FT                   FDGVYSYFGHSAIIGFDGRTLGECGEEEMGIQYAQLSLSQIRDARANDQSQNHLFKILH
FT                   RGYSGLQASGDGDRGLAECPFEFYRTWVTDAEKARDNVERLTRSTTGVAQCPVGRLPYE
FT                   GLEKEA"
XX
SQ   Sequence 1065 BP; 220 A; 337 C; 343 G; 165 T; 0 other;
     aaataacaac aggaggtgat acccatgcgt cacggcgata tttccagcag caacgacacc        60
     gtcggagtgg ccgtggtcaa ctacaagatg ccgcgcctgc acaccgcggc ggaggtcctg       120
     gacaacgccc ggaagatcgc cgacatgatc gtcggcatga agcagggcct gcccggcatg       180
     gacctggtgg tgttcccgga gtacagcctg cagggcatca tgtacgatcc ggcggagatg       240
     atggaaaccg cggtggcgat ccccggcgag gaaaccgaga tattctcccg cgcctgccgc       300
     aaggccaacg tctggggcgt attctccctc accggcgaac ggcacgagga gcatccgcgc       360
     aaggcgccgt acaacaccct ggtgctgatc gacaacaacg gcgagatcgt ccagaagtac       420
     cgcaagatca ttccctggtg ccccatcgag ggctggtatc ccggtggcca gacctacgtc       480
     agcgaagggc cgaagggcat gaagatcagc ctgatcatct gcgacgaccc caattacccg       540
     gagatctggc gcgactgcgc gatgaagggc gccgagctga tcgtgcgctg ccagggctac       600
     atgtacccgg ccaaggacca gcaggtgatg atggccaagg ccatggcctg ggccaacaac       660
     tgctatgtgg cggtggccaa cgcggccggc ttcgacggtg tctattccta cttcggccac       720
     tcggcgatca tcggcttcga cggccgtacc ctcggtgagt gcggcgagga ggaaatgggt       780
     atccagtacg cccagctgtc cctttcgcag atccgcgatg cgcgcgccaa cgatcagtcg       840
     cagaaccacc tgttcaagat cctccaccgc ggctacagcg gcttgcaggc gtccggcgac       900
     ggcgaccggg gcctggcgga gtgtccgttc gagttctacc gcacctgggt caccgacgcc       960
     gagaaggcgc gcgacaatgt cgagcgactg acccgctcga ccaccggcgt ggcgcaatgc      1020
     ccggtcggcc ggctgcccta tgagggactg gagaaggaag cctga                      1065
//
ID   X13776; SV 1; linear; genomic DNA; STD; PRO; 2167 BP.
XX
AC   X13776; M43175;
XX
DT   19-APR-1989 (Rel. 19, Created)
DT   14-NOV-2006 (Rel. 89, Last updated, Version 24)
XX
DE   Pseudomonas aeruginosa amiC and amiR gene for aliphatic amidase regulation
XX
KW   aliphatic amidase regulator; amiC gene; amiR gene.
XX
OS   Pseudomonas aeruginosa
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Pseudomonadales;
OC   Pseudomonadaceae; Pseudomonas.
XX
RN   [1]
RP   1167-2167
RA   Rice P.M.;
RT   ;
RL   Submitted (16-DEC-1988) to the EMBL/GenBank/DDBJ databases.
RL   Rice P.M., EMBL, Postfach 10-2209, Meyerhofstrasse 1, 6900 Heidelberg, FRG.
XX
RN   [2]
RP   1167-2167
RX   DOI; 10.1016/0014-5793(89)80249-2.
RX   PUBMED; 2495988.
RA   Lowe N., Rice P.M., Drew R.E.;
RT   "Nucleotide sequence of the aliphatic amidase regulator gene (amiR) of
RT   Pseudomonas aeruginosa";
RL   FEBS Lett. 246(1-2):39-43(1989).
XX
RN   [3]
RP   1-1292
RX   PUBMED; 1907262.
RA   Wilson S., Drew R.;
RT   "Cloning and DNA sequence of amiC, a new gene regulating expression of the
RT   Pseudomonas aeruginosa aliphatic amidase, and purification of the amiC
RT   product";
RL   J. Bacteriol. 173(16):4914-4921(1991).
XX
RN   [4]
RP   1-2167
RA   Rice P.M.;
RT   ;
RL   Submitted (04-SEP-1991) to the EMBL/GenBank/DDBJ databases.
RL   Rice P.M., EMBL, Postfach 10-2209, Meyerhofstrasse 1, 6900 Heidelberg, FRG.
XX
DR   GOA; Q51417.
DR   InterPro; IPR003211; AmiSUreI_transpt.
DR   UniProtKB/Swiss-Prot; Q51417; AMIS_PSEAE.
XX
CC   Data kindly reviewed (04-SEP-1991) by Rice P. M.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..2167
FT                   /organism="Pseudomonas aeruginosa"
FT                   /map="38 min"
FT                   /strain="PAC"
FT                   /isolate="PAC 1"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:287"
FT   CDS             1289..1879
FT                   /transl_table=11
FT                   /gene="amiR"
FT                   /note="aliphatic amidase regulator, positive  regulator of
FT                   amiE"
FT                   /db_xref="GOA:P10932"
FT                   /db_xref="InterPro:IPR005561"
FT                   /db_xref="InterPro:IPR008327"
FT                   /db_xref="InterPro:IPR011006"
FT                   /db_xref="InterPro:IPR011991"
FT                   /db_xref="PDB:1QO0"
FT                   /db_xref="UniProtKB/Swiss-Prot:P10932"
FT                   /protein_id="CAA32023.1"
FT                   /translation="MSANSLLGSLRELQVLVLNPPGEVSDALVLQLIRIGCSVRQCWPP
FT                   PEAFDVPVDVVFTSIFQNGHHDEIAALLAAGTPRTTLVALVEYESPAVLSQIIELECHG
FT                   VITQPLDAHRVLPVLVSARRISEEMAKLKQKTEQLQDRIAGQARINQAKVLLMQRHGWD
FT                   EREAHQHLSREAMKRREPILKIAQELLGNEPSA"
FT   CDS             135..1292
FT                   /transl_table=11
FT                   /gene="amiC"
FT                   /note="negative regulator of amiR"
FT                   /db_xref="GOA:P27017"
FT                   /db_xref="InterPro:IPR000709"
FT                   /db_xref="PDB:1PEA"
FT                   /db_xref="PDB:1QNL"
FT                   /db_xref="PDB:1QO0"
FT                   /db_xref="UniProtKB/Swiss-Prot:P27017"
FT                   /protein_id="CAA32024.1"
FT                   /translation="MGSHQERPLIGLLFSETGVTADIERSHAYGALLAVEQLNREGGVG
FT                   GRPIETLSQDPGGDPDRYRLCAEDFIRNRGVRFLVGCYMSHTRKAVMPVVERADALLCY
FT                   PTPYEGFEYSPNIVYGGPAPNQNSAPLAAYLIRHYGERVVFIGSDYIYPRESNHVMRHL
FT                   YRQHGGTVLEEIYIPLYPSDDDLQRAVERIYQARADVVFSTVVGTGTAELYRAIARRYG
FT                   DGRRPPIASLTTSEAEVAKMESDVAEGQVVVAPYFSSIDTPASRAFVQACHGFFPENAT
FT                   ITAWAEAAYWQTLLLGRAAQAAGNWRVEDVQRHLYDIDIDAPQGPVRVERQNNHSRLSS
FT                   RIAEIDARGVFQVRWQSPEPIRPDPYVVVHNLDDWSASMGGGPLP"
FT   promoter        8..24
FT                   /note="proposed rpoN-dependent promoter"
FT   promoter        65..81
FT                   /note="proposed rpoN-dependent promoter"
FT   RBS             121..126
FT                   /note="proposed Shine-Dalgarno sequence"
FT   variation       912..1167
FT                   /gene="amiC"
FT                   /replace=""
FT                   /note="ClaI fragment deleted in pSW36,  constitutive
FT                   phenotype"
FT   misc_feature    1
FT                   /note="last base of an XhoI site"
FT   misc_feature    648..653
FT                   /note="end of 658bp XhoI fragment, deletion in  pSW3 causes
FT                   constitutive expression of amiE"
FT   conflict        1281
FT                   /replace="g"
FT                   /citation=[3]
XX
SQ   Sequence 2167 BP; 363 A; 712 C; 730 G; 362 T; 0 other;
     ggtaccgctg gccgagcatc tgctcgatca ccaccagccg ggcgacggga actgcacgat        60
     ctacctggcg agcctggagc acgagcgggt tcgcttcgta cggcgctgag cgacagtcac       120
     aggagaggaa acggatggga tcgcaccagg agcggccgct gatcggcctg ctgttctccg       180
     aaaccggcgt caccgccgat atcgagcgct cgcacgcgta tggcgcattg ctcgcggtcg       240
     agcaactgaa ccgcgagggc ggcgtcggcg gtcgcccgat cgaaacgctg tcccaggacc       300
     ccggcggcga cccggaccgc tatcggctgt gcgccgagga cttcattcgc aaccgggggg       360
     tacggttcct cgtgggctgc tacatgtcgc acacgcgcaa ggcggtgatg ccggtggtcg       420
     agcgcgccga cgcgctgctc tgctacccga ccccctacga gggcttcgag tattcgccga       480
     acatcgtcta cggcggtccg gcgccgaacc agaacagtgc gccgctggcg gcgtacctga       540
     ttcgccacta cggcgagcgg gtggtgttca tcggctcgga ctacatctat ccgcgggaaa       600
     gcaaccatgt gatgcgccac ctgtatcgcc agcacggcgg cacggtgctc gaggaaatct       660
     acattccgct gtatccctcc gacgacgact tgcagcgcgc cgtcgagcgc atctaccagg       720
     cgcgcgccga cgtggtcttc tccaccgtgg tgggcaccgg caccgccgag ctgtatcgcg       780
     ccatcgcccg tcgctacggc gacggcaggc ggccgccgat cgccagcctg accaccagcg       840
     aggcggaggt ggcgaagatg gagagtgacg tggcagaggg gcaggtggtg gtcgcgcctt       900
     acttctccag catcgatacg cccgccagcc gggccttcgt ccaggcctgc catggtttct       960
     tcccggagaa cgcgaccatc accgcctggg ccgaggcggc ctactggcag accttgttgc      1020
     tcggccgcgc cgcgcaggcc gcaggcaact ggcgggtgga agacgtgcag cggcacctgt      1080
     acgacatcga catcgacgcg ccacaggggc cggtccgggt ggagcgccag aacaaccaca      1140
     gccgcctgtc ttcgcgcatc gcggaaatcg atgcgcgcgg cgtgttccag gtccgctggc      1200
     agtcgcccga accgattcgc cccgaccctt atgtcgtcgt gcataacctc gacgactggt      1260
     ccgccagcat gggcggggga ccgctcccat gagcgccaac tcgctgctcg gcagcctgcg      1320
     cgagttgcag gtgctggtcc tcaacccgcc gggggaggtc agcgacgccc tggtcttgca      1380
     gctgatccgc atcggttgtt cggtgcgcca gtgctggccg ccgccggaag ccttcgacgt      1440
     gccggtggac gtggtcttca ccagcatttt ccagaatggc caccacgacg agatcgctgc      1500
     gctgctcgcc gccgggactc cgcgcactac cctggtggcg ctggtggagt acgaaagccc      1560
     cgcggtgctc tcgcagatca tcgagctgga gtgccacggc gtgatcaccc agccgctcga      1620
     tgcccaccgg gtgctgcctg tgctggtatc ggcgcggcgc atcagcgagg aaatggcgaa      1680
     gctgaagcag aagaccgagc agctccagga ccgcatcgcc ggccaggccc ggatcaacca      1740
     ggccaaggtg ttgctgatgc agcgccatgg ctgggacgag cgcgaggcgc accagcacct      1800
     gtcgcgggaa gcgatgaagc ggcgcgagcc gatcctgaag atcgctcagg agttgctggg      1860
     aaacgagccg tccgcctgag cgatccgggc cgaccagaac aataacaaga ggggtatcgt      1920
     catcatgctg ggactggttc tgctgtacgt tggcgcggtg ctgtttctca atgccgtctg      1980
     gttgctgggc aagatcagcg gtcgggaggt ggcggtgatc aacttcctgg tcggcgtgct      2040
     gagcgcctgc gtcgcgttct acctgatctt ttccgcagca gccgggcagg gctcgctgaa      2100
     ggccggagcg ctgaccctgc tattcgcttt tacctatctg tgggtggccg ccaaccagtt      2160
     cctcgag                                                                2167
//
ID   X77161; SV 1; linear; genomic DNA; STD; PRO; 1130 BP.
XX
AC   X77161;
XX
DT   13-APR-1994 (Rel. 39, Created)
DT   31-JUL-2003 (Rel. 76, Last updated, Version 7)
XX
DE   Pseudomonas aeruginosa (PAC1) amiS gene.
XX
KW   amiS gene.
XX
OS   Pseudomonas aeruginosa
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Pseudomonadales;
OC   Pseudomonadaceae; Pseudomonas.
XX
RN   [1]
RA   Wilson S.A., Wachira S.M., Drew R.E., Jones D., Pearl L.H.;
RT   "Identification of a putative ABC transporter in the Pseudomonas aeruginosa
RT   amidase operon";
RL   Unpublished.
XX
RN   [2]
RP   1-1130
RA   Wilson S.A.;
RT   ;
RL   Submitted (17-JAN-1994) to the EMBL/GenBank/DDBJ databases.
RL   S.A. Wilson, University College London, Dept of Biochemistry, Gower Street,
RL   London WC1E 6BT, UK
XX
RN   [3]
RP   1-1130
RX   DOI; 10.1074/jbc.270.32.18818.
RX   PUBMED; 7642533.
RA   Wilson S.A., Williams R.J., Pearl L.H., Drew R.E.;
RT   "Identification of two new genes in the Pseudomonas aeruginosa amidase
RT   operon, encoding an ATPase (AmiB) and a putative integral membrane protein
RT   (AmiS)";
RL   J. Biol. Chem. 270(32):18818-18824(1995).
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1130
FT                   /organism="Pseudomonas aeruginosa"
FT                   /strain="PAC1"
FT                   /mol_type="genomic DNA"
FT                   /clone="plasmid pAS20"
FT                   /db_xref="taxon:287"
FT   CDS             61..576
FT                   /transl_table=11
FT                   /gene="amiS"
FT                   /db_xref="GOA:Q51417"
FT                   /db_xref="InterPro:IPR003211"
FT                   /db_xref="UniProtKB/Swiss-Prot:Q51417"
FT                   /protein_id="CAA54406.1"
FT                   /translation="MLGLVLLYVGAVLFLNAVWLLGKISGREVAVINFLVGVLSACVAF
FT                   YLIFSAAAGQGSLKAGALTLLFAFTYLWVAANQFLEVDGKGLGWFCLFVSLTACTVAIE
FT                   SFAGASGPFGLWNAVNWTVWALLWFCFFLLLGLSRGIQKPVAYLTLASAIFTAWLPGLL
FT                   LLGQVLKA"
XX
SQ   Sequence 1130 BP; 167 A; 335 C; 377 G; 251 T; 0 other;
     gagccgtccg cctgagcgat ccgggccgac cagaacaata acaagagggg tatcgtcatc        60
     atgctgggac tggttctgct gtacgttggc gcggtgctgt ttctcaatgc cgtctggttg       120
     ctgggcaaga tcagcggtcg ggaggtggcg gtgatcaact tcctggtcgg cgtgctgagc       180
     gcctgcgtcg cgttctacct gatcttttcc gcagcagccg ggcagggctc gctgaaggcc       240
     ggagcgctga ccctgctatt cgcttttacc tatctgtggg tggccgccaa ccagttcctc       300
     gaggtggacg gcaagggcct cggctggttc tgcctgttcg tcagcctcac cgcctgcacc       360
     gtggcgatcg agtcgttcgc cggcgccagt ggtccgttcg gcctgtggaa cgcggtcaac       420
     tggacagtct gggcgttgct ctggttctgt ttcttcctgc tgctggggct gtcccgcggc       480
     atccagaagc cggtggccta cctgaccctg gccagcgcca tattcaccgc ctggttgccc       540
     ggcctgctgc tgctcggaca ggtgctcaag gcatagcagg aagtcggaaa gggatgacgg       600
     cttgccgcca tcccgtccct tccgaacgcc tagccgagcg gccagttgat caccacgacg       660
     gcgtcgttgt agtcgttgtc ggtgccgtct tcagagccga ccagggcgaa gttcagctcg       720
     ttggtcagga ttacctgtgc cgagaccaga tccgaggggc ggccgttgac gctgacctgg       780
     acctgtacct tgccactgct gccggagttg agcacctggg tgccgatgac ggcgttattg       840
     gtgctttgcc cgctgaaggt cgcggccgtg ctcgttgttg accagcacgt tcaccgtctg       900
     ggttccggac gagttggcga aggcggtgac gccggaacct ggttgttggc gggaagggtg       960
     aacactcctt gtggttgcca tggtggtatc tccactgaat acctggcccc ttccttttca      1020
     ggcagccgtc tggcgcgcgg tatggcgtgt cgggagaaat ccgcagtcct tggcggcagg      1080
     cgatgcgcag gcaggaagga cgcatcgttc agccaatcta cgccgtcgac                 1130
//