1ID   J01636; SV 1; linear; genomic DNA; STD; PRO; 7477 BP.
2XX
3AC   J01636; J01637; K01483; K01793;
4XX
5DT   30-NOV-1990 (Rel. 26, Created)
6DT   09-SEP-2004 (Rel. 81, Last updated, Version 8)
7XX
8DE   E.coli lactose operon with lacI, lacZ, lacY and lacA genes.
9XX
10KW   acetyltransferase; beta-D-galactosidase; galactosidase; lac operon;
11KW   lac repressor protein; lacA gene; lacI gene; lactose permease; lacY gene;
12KW   lacZ gene; mutagenesis; palindrome; promoter region;
13KW   thiogalactoside acetyltransferase.
14XX
15OS   Escherichia coli
16OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
17OC   Enterobacteriaceae; Escherichia.
18XX
19RN   [1]
20RP   1243-1266
21RX   DOI; 10.1073/pnas.70.12.3581.
22RX   PUBMED; 4587255.
23RA   Gilbert W., Maxam A.;
24RT   "The nucleotide sequence of the lac operator";
25RL   Proc. Natl. Acad. Sci. U.S.A. 70(12):3581-3584(1973).
26XX
27RN   [2]
28RP   1246-1308
29RX   DOI; 10.1073/pnas.70.12.3585.
30RX   PUBMED; 4587256.
31RA   Maizels N.M.;
32RT   "The nucleotide sequence of the lactose messenger ribonucleic acid
33RT   transcribed from the UV5 promoter mutant of Escherichia coli";
34RL   Proc. Natl. Acad. Sci. U.S.A. 70(12):3585-3589(1973).
35XX
36RN   [3]
37RX   PUBMED; 4598642.
38RA   Gilbert W., Maizels N., Maxam A.;
39RT   "Sequences of controlling regions of the lactose operon";
40RL   Cold Spring Harb. Symp. Quant. Biol. 38:845-855(1974).
41XX
42RN   [4]
43RA   Gilbert W., Gralla J., Majors A.J., Maxam A.;
44RT   "Lactose operator sequences and the action of lac repressor";
45RL   (in) Sund H., Blauer G. (Eds.);
46RL   PROTEIN-LIGAND INTERACTIONS:193-207;
47RL   Walter de Gruyter, New York (1975)
48XX
49RN   [5]
50RP   1146-1282
51RX   DOI; 10.1126/science.1088926.
52RX   PUBMED; 1088926.
53RA   Dickson R.C., Abelson J.N., Barnes W.M., Reznikoff W.S.;
54RT   "Genetic regulation: the Lac control region";
55RL   Science 187(4171):27-35(1975).
56XX
57RN   [6]
58RP   1227-1271
59RA   Gilbert W., Maxam A., Mirzabekov A.;
60RT   "Contacts between the lac repressor and DNA revealed by methylation";
61RL   (in) Kjeldgaard N.C., Maaloe O. (Eds.);
62RL   CONTROL OF RIBOSOME SYNTHESIS:138-143;
63RL   Academic Press, New York (1976)
64XX
65RN   [7]
66RX   DOI; 10.1038/260360a0.
67RX   PUBMED; 768781.
68RA   Marians K.J., Wu R.;
69RT   "Structure of the lactose operator";
70RL   Nature 260(5549):360-363(1976).
71XX
72RN   [8]
73RP   1242-1268
74RX   DOI; 10.1038/263748a0.
75RX   PUBMED; 1069185.
76RA   Heyneker H.L., Shine J., Goodman H.M., Boyer H.W., Rosenberg J.,
77RA   Dickerson R.E., Narang S.A., Itakura K., Lin S., Riggs A.D.;
78RT   "Synthetic lac operator DNA is functional in vivo";
79RL   Nature 263(5580):748-752(1976).
80XX
81RN   [9]
82RX   DOI; 10.1016/S0022-2836(77)80132-0.
83RX   PUBMED; 323498.
84RA   Dickson R.C., Abelson J.N., Johnson P., Reznikoff W.S., Barnes W.M.;
85RT   "Nucleotide sequence changes produced by mutations in the lac promoter of
86RT   Escherichia coli";
87RL   J. Mol. Biol. 111(1):65-75(1977).
88XX
89RN   [10]
90RP   51-264
91RX   DOI; 10.1073/pnas.74.10.4163.
92RX   PUBMED; 337294.
93RA   Steege D.A.;
94RT   "5'-Terminal nucleotide sequence of Escherichia coli lactose repressor
95RT   mRNA: features of translational initiation and reinitiation sites";
96RL   Proc. Natl. Acad. Sci. U.S.A. 74(10):4163-4167(1977).
97XX
98RN   [11]
99RP   1-81
100RX   DOI; 10.1038/274762a0.
101RX   PUBMED; 355890.
102RA   Calos M.P.;
103RT   "DNA sequence for a low-level promoter of the lac repressor gene and an
104RT   'up' promoter mutation";
105RL   Nature 274(5673):762-765(1978).
106XX
107RN   [12]
108RP   49-1161
109RX   DOI; 10.1038/274765a0.
110RX   PUBMED; 355891.
111RA   Farabaugh P.J.;
112RT   "Sequence of the lacI gene";
113RL   Nature 274(5673):765-769(1978).
114XX
115RN   [13]
116RX   DOI; 10.1038/274770a0.
117RX   PUBMED; 355892.
118RA   Miller J.H., Coulondre C., Farabaugh P.J.;
119RT   "Correlation of nonsense sites in the lacI gene with specific codons in the
120RT   nucleotide sequence";
121RL   Nature 274(5673):770-775(1978).
122XX
123RN   [14]
124RX   DOI; 10.1007/BF00267233.
125RX   PUBMED; 6770231.
126RA   Calos M.P., Miller J.H.;
127RT   "DNA sequence alteration resulting from a mutation impairing promoter
128RT   function in the lac repressor gene";
129RL   Mol. Gen. Genet. 178(1):225-227(1980).
130XX
131RN   [15]
132RP   4306-5804
133RX   DOI; 10.1038/283541a0.
134RX   PUBMED; 6444453.
135RA   Buechel D.E., Gronenborn B., Mueller-Hill B.;
136RT   "Sequence of the lactose permease gene";
137RL   Nature 283(5747):541-545(1980).
138XX
139RN   [16]
140RX   PUBMED; 6271472.
141RA   Miller J.H., Calos M.P., Galas D.J.;
142RT   "Genetic and sequencing studies of the specificity of transposition into
143RT   the lac region of E. coli";
144RL   Cold Spring Harb. Symp. Quant. Biol. 45:243-257(1981).
145XX
146RN   [17]
147RX   DOI; 10.1016/0014-5793(81)81076-9.
148RX   PUBMED; 7023981.
149RA   Chenchick A., Beabealashvilli R.S., Mirzabekov A.;
150RT   "Topography of interaction of Escherichia coli RNA polymerase subunits with
151RT   lac UV5 promoter";
152RL   FEBS Lett. 128(1):46-50(1981).
153XX
154RN   [18]
155RX   DOI; 10.1016/0378-1119(81)90038-X.
156RX   PUBMED; 7016667.
157RA   Betz J.L., Sadler J.R.;
158RT   "Variants of a cloned synthetic lactose operator. I. A palindromic dimer
159RT   lactose operator derived from one strand of the cloned 40-base pair
160RT   operator";
161RL   Gene 13(1):1-12(1981).
162XX
163RN   [19]
164RX   DOI; 10.1016/0378-1119(81)90039-1.
165RX   PUBMED; 6263752.
166RA   Sadler J.R., Tecklenburg M.;
167RT   "Cloning and characterization of the natural lactose operator";
168RL   Gene 13(1):13-23(1981).
169XX
170RN   [20]
171RX   DOI; 10.1016/0378-1119(81)90128-1.
172RX   PUBMED; 6271642.
173RA   Betz J.L., Sadler J.R.;
174RT   "Variants of a cloned synthetic lactose operator. II.
175RT   Chloramphenicol-resistant revertants retaining a lactose operator in the
176RT   CAT gene of plasmid pBR325";
177RL   Gene 15(2-3):187-200(1981).
178XX
179RN   [21]
180RX   DOI; 10.1007/BF00268783.
181RX   PUBMED; 7038381.
182RA   Calos M.P., Miller J.H.;
183RT   "The DNA sequence change resulting from the IQ1 mutation, which greatly
184RT   increases promoter strength";
185RL   Mol. Gen. Genet. 183(3):559-560(1981).
186XX
187RN   [22]
188RX   DOI; 10.1073/pnas.78.12.7652.
189RX   PUBMED; 6278484.
190RA   Mieschendahl M., Buechel D.E., Bocklage H., Mueller-Hill B.;
191RT   "Mutations in the lacY gene of Escherichia coli define functional
192RT   organization of lactose permease";
193RL   Proc. Natl. Acad. Sci. U.S.A. 78(12):7652-7656(1981).
194XX
195RN   [23]
196RX   DOI; 10.1016/0378-1119(82)90042-7.
197RX   PUBMED; 6299890.
198RA   Russell D.R., Bennett G.N.;
199RT   "Construction and analysis of in vivo activity of E. coli promoter hybrids
200RT   and promoter mutants that alter the -35 to -10 spacing";
201RL   Gene 20(2):231-243(1982).
202XX
203RN   [24]
204RX   PUBMED; 6288696.
205RA   Horowitz H., Platt T.;
206RT   "A termination site for LacI transcription is between the CAP site and the
207RT   lac promoter";
208RL   J Biol Chem 257(19):11740-11746(1982).
209XX
210RN   [25]
211RX   PUBMED; 6290487.
212RA   Klein R.D., Wells R.D.;
213RT   "Effects of neighboring DNA homopolymers on the biochemical and physical
214RT   properties of the Escherichia coli lactose promoter. I. Cloning and
215RT   characterization studies";
216RL   J Biol Chem 257(21):12954-12961(1982).
217XX
218RN   [26]
219RP   1183-1291
220RX   DOI; 10.1073/pnas.79.5.1408.
221RX   PUBMED; 7041119.
222RA   Weiher H., Schaller H.;
223RT   "Segment-specific mutagenesis: extensive mutagenesis of a lac
224RT   promoter/operator element";
225RL   Proc. Natl. Acad. Sci. U.S.A. 79(5):1408-1412(1982).
226XX
227RN   [27]
228RX   PUBMED; 6305557.
229RA   Van Dyke M.W., Dervan P.B.;
230RT   "Footprinting with MPE-Fe(II). Complementary-strand analyses of distamycin-
231RT   and actinomycin-binding sites on heterogeneous DNA";
232RL   Cold Spring Harb. Symp. Quant. Biol. 47:347-353(1983).
233XX
234RN   [28]
235RP   1287-4364
236RX   PUBMED; 6313347.
237RA   Kalnins A., Otto K., Ruether U., Mueller-Hill B.;
238RT   "Sequence of the lacZ gene of Escherichia coli";
239RL   EMBO J. 2(4):593-597(1983).
240XX
241RN   [29]
242RX   PUBMED; 6309841.
243RA   Cone K.C., Sellitti M.A., Steege D.A.;
244RT   "Lac repressor mRNA transcription terminates in vivo in the lac control
245RT   region";
246RL   J Biol Chem 258(18):11296-11304(1983).
247XX
248RN   [30]
249RX   DOI; 10.1073/pnas.80.22.6785.
250RX   PUBMED; 6316325.
251RA   Sadler J.R., Sasmor H., Betz J.L.;
252RT   "A perfectly symmetric lac operator binds the lac repressor very tightly";
253RL   Proc. Natl. Acad. Sci. U.S.A. 80(22):6785-6789(1983).
254XX
255RN   [31]
256RX   DOI; 10.1073/pnas.81.2.512.
257RX   PUBMED; 6582506.
258RA   Glickman B.W., Ripley L.S.;
259RT   "Structural intermediates of deletion mutagenesis: a role for palindromic
260RT   DNA";
261RL   Proc. Natl. Acad. Sci. U.S.A. 81(2):512-516(1984).
262XX
263RN   [32]
264RX   DOI; 10.1021/bi00332a019.
265RX   PUBMED; 3896305.
266RA   Spassky A., Kirkegaard K., Buc H.;
267RT   "Changes in the DNA structure of the lac UV5 promoter during formation of
268RT   an open complex with Escherichia coli RNA polymerase";
269RL   Biochemistry 24(11):2723-2731(1985).
270XX
271RN   [33]
272RX   DOI; 10.1016/0092-8674(85)90175-8.
273RX   PUBMED; 2416465.
274RA   Straney D.C., Crothers D.M.;
275RT   "Intermediates in transcription initiation from the E. coli lac UV5
276RT   promoter";
277RL   Cell 43(2 Pt 1):449-459(1985).
278XX
279RN   [34]
280RX   DOI; 10.1016/0378-1119(85)90267-7.
281RX   PUBMED; 3932130.
282RA   Looman A.C., de Gruyter M., Vogelaar A., van Knippenberg P.H.;
283RT   "Effects of heterologous ribosomal binding sites on the transcription and
284RT   translation of the lacZ gene of Escherichia coli";
285RL   Gene 37(1-3):145-154(1985).
286XX
287RN   [35]
288RX   PUBMED; 2999082.
289RA   Mandecki W., Goldman R.A., Powell B.S., Caruthers M.H.;
290RT   "lac Up-promoter mutants with increased homology to the consensus promoter
291RT   sequence";
292RL   J. Bacteriol. 164(3):1353-1355(1985).
293XX
294RN   [36]
295RX   DOI; 10.1016/0022-2836(85)90427-9.
296RX   PUBMED; 2987506.
297RA   Malamy M.H., Rahaim P.T., Hoffman C.S., Baghdoyan D., O'Connor M.B.,
298RA   Miller J.F.;
299RT   "A frameshift mutation at the junction of an IS1 insertion within lacZ
300RT   restores beta-galactosidase activity via formation of an active lacZ-IS1
301RT   fusion protein";
302RL   J. Mol. Biol. 181(4):551-555(1985).
303XX
304RN   [37]
305RP   5646-7477
306RX   DOI; 10.1073/pnas.82.19.6414.
307RX   PUBMED; 3901000.
308RA   Hediger M.A., Johnson D.F., Nierlich D.P., Zabin I.;
309RT   "DNA sequence of the lactose operon: the lacA gene and the transcriptional
310RT   termination region";
311RL   Proc. Natl. Acad. Sci. U.S.A. 82(19):6414-6418(1985).
312XX
313CC   [3]  sites; UV5 mRNA transcripts and operator mutants.
314CC   [4]  (Sund H., Blauer G. (Eds.), Protein-Ligand Interactions:193-207)
315CC   sites; operator mutational analysis. [7]
316CC   sites; S1 and mung bean nuclease action on operator DNA. [9]
317CC   sites; class I, II and III promoter mutant analysis. [13]  sites;
318CC   lacI mutant analysis.
319CC   [16]  sites; Tn5, Tn9 and Tn10 insertion sites in lac region. [14]
320CC   sites; lacI promoter mutation UJ177.
321CC   [18]  sites; palindromic dimer operator.
322CC   [19]  sites; natural operator sequence.
323CC   [20]  sites; operator mutational analysis.
324CC   [21]  sites; lacI-Q deletion.
325CC   [17]  sites; RNA polymerase UV5 promoter interaction. [22]  sites;
326CC   lacY mutational analysis.
327CC   [24]  sites; lacI-promoted transcription termination. [25]  sites;
328CC   wt and UV5 promoter sequence studies. [23]  sites; UV5 promoter
329CC   mutational analysis.
330CC   [30]  sites; perfectly symmetric operator sequence. [29]  sites;
331CC   lacI mRNA termination site.
332CC   [27]  sites; distamycin and actinomycin binding to promoter. [31]
333CC   sites; lacI deletion studies.
334CC   [35]  sites; promoter mutational studies.
335CC   [33]  sites; DNAase I studies with promoter sequence. [34]  sites;
336CC   ribosomal binding and translation initiation for lacZ. [36]  sites;
337CC   insertion sequence IS1 integration in lacZ. [32]  sites; DNAase I
338CC   studies with promoter.
339CC   [1] first reports a 27 bp operator(sites 1240-1266) with two-fold
340CC   symmetries; the operator has also been defined to be bases
341CC   1246-1266 or bases 1239-1273 [8]. [6] (Kjeldgaard N.C., Maaloe O.
342CC   (Eds.), Control of Ribosome Synthesis:138-143) explores the
343CC   ability of lac
344CC   repressor protein to affect methylation of operator DNA.  [8]
345CC   argues that DNA on both sides of the 21 bp operator (bases
346CC   1246-1266) affects repressor binding but that the sequences of this
347CC   DNA are probably not critical. [5] gives a larger sequence known as
348CC   the promoter-operator region for the wild-type, whereas [2] and
349CC   [26] give portions of this region for the mutant strain UV5. Within
350CC   the promoter region, bases 1162-1199 are identified as the
351CC   catabolite gene activator protein binding site (cap) and bases
352CC   1200-1245 are the RNA polymerase interaction site. [10] reports a
353CC   sequence for the 5'end of the lacI (repressor) gene and discusses
354CC   restart in mutant strains. [11] presents a sequence for the lacI
355CC   promoter region and identifies an I-Q mutation which enhances lacI
356CC   transcription approximately ten-fold. [12] gives a complete
357CC   sequence
358CC   for lacI which agrees with the known lac repressor sequence. [26]
359CC   examines the promoter-operator region in the UV5 strain (lac109)
360CC   and studies 23 mutant derivatives of this sequence. This sequence
361CC   agrees with known protein sequences for the lacZ, lacY and lacA
362CC   enzymes. [15] notes that the fMet codon is not present
363CC   for lacA and suggests that the 'ttg' codon (5727-5729), which
364CC   immediately precedes the mature N-terminal asparagine codon, is the
365CC   start codon. The cds for lacZ, lacY and lacA are included on a
366CC   single mRNA transcript.
367CC   Complete source information:
368CC   Escherichia coli DNA [1],[6] (Kjeldgaard N.C., Maaloe O. (Eds.),
369CC   Control of Ribosome Synthesis:138-143),[8],[12],[26]; mRNA [2],
370CC   [5],[10]; clone
371CC   lambda-h80dlac DNA [11],[15]; clone puk217 [28]; pgm8 [37].
372XX
373FH   Key             Location/Qualifiers
374FH
375FT   source          1..7477
376FT                   /organism="Escherichia coli"
377FT                   /mol_type="genomic DNA"
378FT                   /db_xref="taxon:562"
379FT   variation       16
380FT                   /note="c in wild-type; t in 'up' promoter mutant I-Q [11]"
381FT   mRNA            51..1230
382FT                   /note="lacI (repressor) mRNA; preferred in vivo 3' end
383FT                   [12],[29]"
384FT   CDS             79..1161
385FT                   /codon_start=1
386FT                   /transl_table=11
387FT                   /gene="lacI"
388FT                   /note="lac repressor protein (gtg start codon)"
389FT                   /db_xref="GOA:P03023"
390FT                   /db_xref="InterPro:IPR000843"
391FT                   /db_xref="InterPro:IPR010982"
392FT                   /db_xref="PDB:1CJG"
393FT                   /db_xref="PDB:1EFA"
394FT                   /db_xref="PDB:1JWL"
395FT                   /db_xref="PDB:1JYE"
396FT                   /db_xref="PDB:1JYF"
397FT                   /db_xref="PDB:1L1M"
398FT                   /db_xref="PDB:1LBG"
399FT                   /db_xref="PDB:1LBH"
400FT                   /db_xref="PDB:1LBI"
401FT                   /db_xref="PDB:1LCC"
402FT                   /db_xref="PDB:1LCD"
403FT                   /db_xref="PDB:1LQC"
404FT                   /db_xref="PDB:1LTP"
405FT                   /db_xref="PDB:1OSL"
406FT                   /db_xref="PDB:1TLF"
407FT                   /db_xref="PDB:1Z04"
408FT                   /db_xref="PDB:2BJC"
409FT                   /db_xref="PDB:2KEI"
410FT                   /db_xref="PDB:2KEJ"
411FT                   /db_xref="PDB:2KEK"
412FT                   /db_xref="PDB:2P9H"
413FT                   /db_xref="PDB:2PAF"
414FT                   /db_xref="PDB:2PE5"
415FT                   /db_xref="PDB:3EDC"
416FT                   /db_xref="UniProtKB/Swiss-Prot:P03023"
417FT                   /protein_id="AAA24052.1"
418FT                   /translation="MKPVTLYDVAEYAGVSYQTVSRVVNQASHVSAKTREKVEAAMAEL
419FT                   NYIPNRVAQQLAGKQSLLIGVATSSLALHAPSQIVAAIKSRADQLGASVVVSMVERSGV
420FT                   EACKAAVHNLLAQRVSGLIINYPLDDQDAIAVEAACTNVPALFLDVSDQTPINSIIFSH
421FT                   EDGTRLGVEHLVALGHQQIALLAGPLSSVSARLRLAGWHKYLTRNQIQPIAEREGDWSA
422FT                   MSGFQQTMQMLNEGIVPTAMLVANDQMALGAMRAITESGLRVGADISVVGYDDTEDSSC
423FT                   YIPPSTTIKQDFRLLGQTSVDRLLQLSQGQAVKGNQLLPVSLVKRKTTLAPNTQTASPR
424FT                   ALADSLMQLARQVSRLESGQ"
425FT   misc_signal     1162..1199
426FT                   /note="cap protein binding site"
427FT   variation       1183..1186
428FT                   /note="ttag in wild-type; aatt in strain UV5 [26]"
429FT   variation       1209..1211
430FT                   /note="gct in wild-type; gt in mutant l305 [5]"
431FT   variation       1212
432FT                   /note="t in wild-type; a in mutant l241 [5]"
433FT   variation       1230
434FT                   /note="c in wild-type; a in mutant p-r-1a [5]"
435FT   variation       1237..1238
436FT                   /note="gt in wild-type; aa in strain UV5 [26]"
437FT   variation       1242..1245
438FT                   /note="gtgg in wild-type; ttca in synthetic operator [8]"
439FT   misc_signal     1246..1266
440FT                   /note="lac repressor protein binding site"
441FT   mRNA            1246..>4358
442FT                   /note="lacZ mRNA [2],[5]"
443FT   variation       1267..1268
444FT                   /note="tc in wild-type; tg in synthetic operator [8]"
445FT   variation       1282..1291
446FT                   /note="ctatgaccat in wild-type; gatccggcca in strain UV5
447FT                   [26]"
448FT   CDS             1284..4358
449FT                   /codon_start=1
450FT                   /transl_table=11
451FT                   /gene="lacZ"
452FT                   /note="beta-d-galactosidase"
453FT                   /db_xref="GOA:P00722"
454FT                   /db_xref="InterPro:IPR004199"
455FT                   /db_xref="InterPro:IPR006101"
456FT                   /db_xref="InterPro:IPR006102"
457FT                   /db_xref="InterPro:IPR006103"
458FT                   /db_xref="InterPro:IPR006104"
459FT                   /db_xref="InterPro:IPR008979"
460FT                   /db_xref="InterPro:IPR011013"
461FT                   /db_xref="InterPro:IPR013781"
462FT                   /db_xref="InterPro:IPR013812"
463FT                   /db_xref="InterPro:IPR014718"
464FT                   /db_xref="InterPro:IPR017853"
465FT                   /db_xref="InterPro:IPR023230"
466FT                   /db_xref="InterPro:IPR023232"
467FT                   /db_xref="InterPro:IPR023933"
468FT                   /db_xref="PDB:1BGL"
469FT                   /db_xref="PDB:1BGM"
470FT                   /db_xref="PDB:1DP0"
471FT                   /db_xref="PDB:1F49"
472FT                   /db_xref="PDB:1F4A"
473FT                   /db_xref="PDB:1F4H"
474FT                   /db_xref="PDB:1GHO"
475FT                   /db_xref="PDB:1HN1"
476FT                   /db_xref="PDB:1JYN"
477FT                   /db_xref="PDB:1JYV"
478FT                   /db_xref="PDB:1JYW"
479FT                   /db_xref="PDB:1JYX"
480FT                   /db_xref="PDB:1JYY"
481FT                   /db_xref="PDB:1JYZ"
482FT                   /db_xref="PDB:1JZ0"
483FT                   /db_xref="PDB:1JZ1"
484FT                   /db_xref="PDB:1JZ2"
485FT                   /db_xref="PDB:1JZ3"
486FT                   /db_xref="PDB:1JZ4"
487FT                   /db_xref="PDB:1JZ5"
488FT                   /db_xref="PDB:1JZ6"
489FT                   /db_xref="PDB:1JZ7"
490FT                   /db_xref="PDB:1JZ8"
491FT                   /db_xref="PDB:1PX3"
492FT                   /db_xref="PDB:1PX4"
493FT                   /db_xref="PDB:3CZJ"
494FT                   /db_xref="PDB:3DYM"
495FT                   /db_xref="PDB:3DYO"
496FT                   /db_xref="PDB:3DYP"
497FT                   /db_xref="PDB:3E1F"
498FT                   /db_xref="PDB:3I3B"
499FT                   /db_xref="PDB:3I3D"
500FT                   /db_xref="PDB:3I3E"
501FT                   /db_xref="PDB:3IAP"
502FT                   /db_xref="PDB:3IAQ"
503FT                   /db_xref="PDB:3MUY"
504FT                   /db_xref="PDB:3MUZ"
505FT                   /db_xref="PDB:3MV0"
506FT                   /db_xref="PDB:3MV1"
507FT                   /db_xref="PDB:3SEP"
508FT                   /db_xref="PDB:3T08"
509FT                   /db_xref="PDB:3T09"
510FT                   /db_xref="PDB:3T0A"
511FT                   /db_xref="PDB:3T0B"
512FT                   /db_xref="PDB:3T0D"
513FT                   /db_xref="PDB:3T2O"
514FT                   /db_xref="PDB:3T2P"
515FT                   /db_xref="PDB:3T2Q"
516FT                   /db_xref="PDB:3VD3"
517FT                   /db_xref="PDB:3VD4"
518FT                   /db_xref="PDB:3VD5"
519FT                   /db_xref="PDB:3VD7"
520FT                   /db_xref="PDB:3VD9"
521FT                   /db_xref="PDB:3VDA"
522FT                   /db_xref="PDB:3VDB"
523FT                   /db_xref="PDB:3VDC"
524FT                   /db_xref="UniProtKB/Swiss-Prot:P00722"
525FT                   /protein_id="AAA24053.1"
526FT                   /translation="MTMITDSLAVVLQRRDWENPGVTQLNRLAAHPPFASWRNSEEART
527FT                   DRPSQQLRSLNGEWRFAWFPAPEAVPESWLECDLPEADTVVVPSNWQMHGYDAPIYTNV
528FT                   TYPITVNPPFVPTENPTGCYSLTFNVDESWLQEGQTRIIFDGVNSAFHLWCNGRWVGYG
529FT                   QDSRLPSEFDLSAFLRAGENRLAVMVLRWSDGSYLEDQDMWRMSGIFRDVSLLHKPTTQ
530FT                   ISDFHVATRFNDDFSRAVLEAEVQMCGELRDYLRVTVSLWQGETQVASGTAPFGGEIID
531FT                   ERGGYADRVTLRLNVENPKLWSAEIPNLYRAVVELHTADGTLIEAEACDVGFREVRIEN
532FT                   GLLLLNGKPLLIRGVNRHEHHPLHGQVMDEQTMVQDILLMKQNNFNAVRCSHYPNHPLW
533FT                   YTLCDRYGLYVVDEANIETHGMVPMNRLTDDPRWLPAMSERVTRMVQRDRNHPSVIIWS
534FT                   LGNESGHGANHDALYRWIKSVDPSRPVQYEGGGADTTATDIICPMYARVDEDQPFPAVP
535FT                   KWSIKKWLSLPGETRPLILCEYAHAMGNSLGGFAKYWQAFRQYPRLQGGFVWDWVDQSL
536FT                   IKYDENGNPWSAYGGDFGDTPNDRQFCMNGLVFADRTPHPALTEAKHQQQFFQFRLSGQ
537FT                   TIEVTSEYLFRHSDNELLHWMVALDGKPLASGEVPLDVAPQGKQLIELPELPQPESAGQ
538FT                   LWLTVRVVQPNATAWSEAGHISAWQQWRLAENLSVTLPAASHAIPHLTTSEMDFCIELG
539FT                   NKRWQFNRQSGFLSQMWIGDKKQLLTPLRDQFTRAPLDNDIGVSEATRIDPNAWVERWK
540FT                   AAGHYQAEAALLQCTADTLADAVLITTAHAWQHQGKTLFISRKTYRIDGSGQMAITVDV
541FT                   EVASDTPHPARIGLNCQLAQVAERVNWLGLGPQENYPDRLTAACFDRWDLPLSDMYTPY
542FT                   VFPSENGLRCGTRELNYGPHQWRGDFQFNISRYSQQQLMETSHRHLLHAEEGTWLNIDG
543FT                   FHMGIGGDDSWSPSVSAEFQLSAGRYHYQLVWCQK"
544FT   CDS             4410..5663
545FT                   /codon_start=1
546FT                   /transl_table=11
547FT                   /gene="lacY"
548FT                   /note="lactose permease"
549FT                   /db_xref="GOA:P02920"
550FT                   /db_xref="InterPro:IPR000576"
551FT                   /db_xref="InterPro:IPR016196"
552FT                   /db_xref="InterPro:IPR018457"
553FT                   /db_xref="InterPro:IPR020846"
554FT                   /db_xref="InterPro:IPR022814"
555FT                   /db_xref="PDB:1M2U"
556FT                   /db_xref="PDB:1PV6"
557FT                   /db_xref="PDB:1PV7"
558FT                   /db_xref="PDB:2CFP"
559FT                   /db_xref="PDB:2CFQ"
560FT                   /db_xref="PDB:2V8N"
561FT                   /db_xref="PDB:2Y5Y"
562FT                   /db_xref="UniProtKB/Swiss-Prot:P02920"
563FT                   /protein_id="AAA24054.1"
564FT                   /translation="MYYLKNTNFWMFGLFFFFYFFIMGAYFPFFPIWLHDINHISKSDT
565FT                   GIIFAAISLFSLLFQPLFGLLSDKLGLRKYLLWIITGMLVMFAPFFIFIFGPLLQYNIL
566FT                   VGSIVGGIYLGFCFNAGAPAVEAFIEKVSRRSNFEFGRARMFGCVGWALCASIVGIMFT
567FT                   INNQFVFWLGSGCALILAVLLFFAKTDAPSSATVANAVGANHSAFSLKLALELFRQPKL
568FT                   WFLSLYVIGVSCTYDVFDQQFANFFTSFFATGEQGTRVFGYVTTMGELLNASIMFFAPL
569FT                   IINRIGGKNALLLAGTIMSVRIIGSSFATSALEVVILKTLHMFEVPFLLVGCFKYITSQ
570FT                   FEVRFSATIYLVCFCFFKQLAMIFMSVLAGNMYESIGFQGAYLVLGLVALGFTLISVFT
571FT                   LSGPGPLSLLRRQVNEVA"
572FT   CDS             5727..6338
573FT                   /codon_start=1
574FT                   /transl_table=11
575FT                   /gene="lacA"
576FT                   /note="thiogalactoside acetyltransferase (ttg start codon)"
577FT                   /db_xref="GOA:P07464"
578FT                   /db_xref="InterPro:IPR001451"
579FT                   /db_xref="InterPro:IPR011004"
580FT                   /db_xref="InterPro:IPR018357"
581FT                   /db_xref="InterPro:IPR024688"
582FT                   /db_xref="PDB:1KQA"
583FT                   /db_xref="PDB:1KRR"
584FT                   /db_xref="PDB:1KRU"
585FT                   /db_xref="PDB:1KRV"
586FT                   /db_xref="UniProtKB/Swiss-Prot:P07464"
587FT                   /protein_id="AAA24055.1"
588FT                   /translation="MNMPMTERIRAGKLFTDMCEGLPEKRLRGKTLMYEFNHSHPSEVE
589FT                   KRESLIKEMFATVGENAWVEPPVYFSYGSNIHIGRNFYANFNLTIVDDYTVTIGDNVLI
590FT                   APNVTLSVTGHPVHHELRKNGEMYSFPITIGNNVWIGSHVVINPGVTIGDNSVIGAGSI
591FT                   VTKDIPPNVVAAGVPCRVIREINDRDKHYYFKDYKVESSV"
592XX
593SQ   Sequence 7477 BP; 1739 A; 1991 C; 2004 G; 1743 T; 0 other;
594     gacaccatcg aatggcgcaa aacctttcgc ggtatggcat gatagcgccc ggaagagagt        60
595     caattcaggg tggtgaatgt gaaaccagta acgttatacg atgtcgcaga gtatgccggt       120
596     gtctcttatc agaccgtttc ccgcgtggtg aaccaggcca gccacgtttc tgcgaaaacg       180
597     cgggaaaaag tggaagcggc gatggcggag ctgaattaca ttcccaaccg cgtggcacaa       240
598     caactggcgg gcaaacagtc gttgctgatt ggcgttgcca cctccagtct ggccctgcac       300
599     gcgccgtcgc aaattgtcgc ggcgattaaa tctcgcgccg atcaactggg tgccagcgtg       360
600     gtggtgtcga tggtagaacg aagcggcgtc gaagcctgta aagcggcggt gcacaatctt       420
601     ctcgcgcaac gcgtcagtgg gctgatcatt aactatccgc tggatgacca ggatgccatt       480
602     gctgtggaag ctgcctgcac taatgttccg gcgttatttc ttgatgtctc tgaccagaca       540
603     cccatcaaca gtattatttt ctcccatgaa gacggtacgc gactgggcgt ggagcatctg       600
604     gtcgcattgg gtcaccagca aatcgcgctg ttagcgggcc cattaagttc tgtctcggcg       660
605     cgtctgcgtc tggctggctg gcataaatat ctcactcgca atcaaattca gccgatagcg       720
606     gaacgggaag gcgactggag tgccatgtcc ggttttcaac aaaccatgca aatgctgaat       780
607     gagggcatcg ttcccactgc gatgctggtt gccaacgatc agatggcgct gggcgcaatg       840
608     cgcgccatta ccgagtccgg gctgcgcgtt ggtgcggata tctcggtagt gggatacgac       900
609     gataccgaag acagctcatg ttatatcccg ccgtcaacca ccatcaaaca ggattttcgc       960
610     ctgctggggc aaaccagcgt ggaccgcttg ctgcaactct ctcagggcca ggcggtgaag      1020
611     ggcaatcagc tgttgcccgt ctcactggtg aaaagaaaaa ccaccctggc gcccaatacg      1080
612     caaaccgcct ctccccgcgc gttggccgat tcattaatgc agctggcacg acaggtttcc      1140
613     cgactggaaa gcgggcagtg agcgcaacgc aattaatgtg agttagctca ctcattaggc      1200
614     accccaggct ttacacttta tgcttccggc tcgtatgttg tgtggaattg tgagcggata      1260
615     acaatttcac acaggaaaca gctatgacca tgattacgga ttcactggcc gtcgttttac      1320
616     aacgtcgtga ctgggaaaac cctggcgtta cccaacttaa tcgccttgca gcacatcccc      1380
617     ctttcgccag ctggcgtaat agcgaagagg cccgcaccga tcgcccttcc caacagttgc      1440
618     gcagcctgaa tggcgaatgg cgctttgcct ggtttccggc accagaagcg gtgccggaaa      1500
619     gctggctgga gtgcgatctt cctgaggccg atactgtcgt cgtcccctca aactggcaga      1560
620     tgcacggtta cgatgcgccc atctacacca acgtaaccta tcccattacg gtcaatccgc      1620
621     cgtttgttcc cacggagaat ccgacgggtt gttactcgct cacatttaat gttgatgaaa      1680
622     gctggctaca ggaaggccag acgcgaatta tttttgatgg cgttaactcg gcgtttcatc      1740
623     tgtggtgcaa cgggcgctgg gtcggttacg gccaggacag tcgtttgccg tctgaatttg      1800
624     acctgagcgc atttttacgc gccggagaaa accgcctcgc ggtgatggtg ctgcgttgga      1860
625     gtgacggcag ttatctggaa gatcaggata tgtggcggat gagcggcatt ttccgtgacg      1920
626     tctcgttgct gcataaaccg actacacaaa tcagcgattt ccatgttgcc actcgcttta      1980
627     atgatgattt cagccgcgct gtactggagg ctgaagttca gatgtgcggc gagttgcgtg      2040
628     actacctacg ggtaacagtt tctttatggc agggtgaaac gcaggtcgcc agcggcaccg      2100
629     cgcctttcgg cggtgaaatt atcgatgagc gtggtggtta tgccgatcgc gtcacactac      2160
630     gtctgaacgt cgaaaacccg aaactgtgga gcgccgaaat cccgaatctc tatcgtgcgg      2220
631     tggttgaact gcacaccgcc gacggcacgc tgattgaagc agaagcctgc gatgtcggtt      2280
632     tccgcgaggt gcggattgaa aatggtctgc tgctgctgaa cggcaagccg ttgctgattc      2340
633     gaggcgttaa ccgtcacgag catcatcctc tgcatggtca ggtcatggat gagcagacga      2400
634     tggtgcagga tatcctgctg atgaagcaga acaactttaa cgccgtgcgc tgttcgcatt      2460
635     atccgaacca tccgctgtgg tacacgctgt gcgaccgcta cggcctgtat gtggtggatg      2520
636     aagccaatat tgaaacccac ggcatggtgc caatgaatcg tctgaccgat gatccgcgct      2580
637     ggctaccggc gatgagcgaa cgcgtaacgc gaatggtgca gcgcgatcgt aatcacccga      2640
638     gtgtgatcat ctggtcgctg gggaatgaat caggccacgg cgctaatcac gacgcgctgt      2700
639     atcgctggat caaatctgtc gatccttccc gcccggtgca gtatgaaggc ggcggagccg      2760
640     acaccacggc caccgatatt atttgcccga tgtacgcgcg cgtggatgaa gaccagccct      2820
641     tcccggctgt gccgaaatgg tccatcaaaa aatggctttc gctacctgga gagacgcgcc      2880
642     cgctgatcct ttgcgaatac gcccacgcga tgggtaacag tcttggcggt ttcgctaaat      2940
643     actggcaggc gtttcgtcag tatccccgtt tacagggcgg cttcgtctgg gactgggtgg      3000
644     atcagtcgct gattaaatat gatgaaaacg gcaacccgtg gtcggcttac ggcggtgatt      3060
645     ttggcgatac gccgaacgat cgccagttct gtatgaacgg tctggtcttt gccgaccgca      3120
646     cgccgcatcc agcgctgacg gaagcaaaac accagcagca gtttttccag ttccgtttat      3180
647     ccgggcaaac catcgaagtg accagcgaat acctgttccg tcatagcgat aacgagctcc      3240
648     tgcactggat ggtggcgctg gatggtaagc cgctggcaag cggtgaagtg cctctggatg      3300
649     tcgctccaca aggtaaacag ttgattgaac tgcctgaact accgcagccg gagagcgccg      3360
650     ggcaactctg gctcacagta cgcgtagtgc aaccgaacgc gaccgcatgg tcagaagccg      3420
651     ggcacatcag cgcctggcag cagtggcgtc tggcggaaaa cctcagtgtg acgctccccg      3480
652     ccgcgtccca cgccatcccg catctgacca ccagcgaaat ggatttttgc atcgagctgg      3540
653     gtaataagcg ttggcaattt aaccgccagt caggctttct ttcacagatg tggattggcg      3600
654     ataaaaaaca actgctgacg ccgctgcgcg atcagttcac ccgtgcaccg ctggataacg      3660
655     acattggcgt aagtgaagcg acccgcattg accctaacgc ctgggtcgaa cgctggaagg      3720
656     cggcgggcca ttaccaggcc gaagcagcgt tgttgcagtg cacggcagat acacttgctg      3780
657     atgcggtgct gattacgacc gctcacgcgt ggcagcatca ggggaaaacc ttatttatca      3840
658     gccggaaaac ctaccggatt gatggtagtg gtcaaatggc gattaccgtt gatgttgaag      3900
659     tggcgagcga tacaccgcat ccggcgcgga ttggcctgaa ctgccagctg gcgcaggtag      3960
660     cagagcgggt aaactggctc ggattagggc cgcaagaaaa ctatcccgac cgccttactg      4020
661     ccgcctgttt tgaccgctgg gatctgccat tgtcagacat gtataccccg tacgtcttcc      4080
662     cgagcgaaaa cggtctgcgc tgcgggacgc gcgaattgaa ttatggccca caccagtggc      4140
663     gcggcgactt ccagttcaac atcagccgct acagtcaaca gcaactgatg gaaaccagcc      4200
664     atcgccatct gctgcacgcg gaagaaggca catggctgaa tatcgacggt ttccatatgg      4260
665     ggattggtgg cgacgactcc tggagcccgt cagtatcggc ggaattccag ctgagcgccg      4320
666     gtcgctacca ttaccagttg gtctggtgtc aaaaataata ataaccgggc aggccatgtc      4380
667     tgcccgtatt tcgcgtaagg aaatccatta tgtactattt aaaaaacaca aacttttgga      4440
668     tgttcggttt attctttttc ttttactttt ttatcatggg agcctacttc ccgtttttcc      4500
669     cgatttggct acatgacatc aaccatatca gcaaaagtga tacgggtatt atttttgccg      4560
670     ctatttctct gttctcgcta ttattccaac cgctgtttgg tctgctttct gacaaactcg      4620
671     ggctgcgcaa atacctgctg tggattatta ccggcatgtt agtgatgttt gcgccgttct      4680
672     ttatttttat cttcgggcca ctgttacaat acaacatttt agtaggatcg attgttggtg      4740
673     gtatttatct aggcttttgt tttaacgccg gtgcgccagc agtagaggca tttattgaga      4800
674     aagtcagccg tcgcagtaat ttcgaatttg gtcgcgcgcg gatgtttggc tgtgttggct      4860
675     gggcgctgtg tgcctcgatt gtcggcatca tgttcaccat caataatcag tttgttttct      4920
676     ggctgggctc tggctgtgca ctcatcctcg ccgttttact ctttttcgcc aaaacggatg      4980
677     cgccctcttc tgccacggtt gccaatgcgg taggtgccaa ccattcggca tttagcctta      5040
678     agctggcact ggaactgttc agacagccaa aactgtggtt tttgtcactg tatgttattg      5100
679     gcgtttcctg cacctacgat gtttttgacc aacagtttgc taatttcttt acttcgttct      5160
680     ttgctaccgg tgaacagggt acgcgggtat ttggctacgt aacgacaatg ggcgaattac      5220
681     ttaacgcctc gattatgttc tttgcgccac tgatcattaa tcgcatcggt gggaaaaacg      5280
682     ccctgctgct ggctggcact attatgtctg tacgtattat tggctcatcg ttcgccacct      5340
683     cagcgctgga agtggttatt ctgaaaacgc tgcatatgtt tgaagtaccg ttcctgctgg      5400
684     tgggctgctt taaatatatt accagccagt ttgaagtgcg tttttcagcg acgatttatc      5460
685     tggtctgttt ctgcttcttt aagcaactgg cgatgatttt tatgtctgta ctggcgggca      5520
686     atatgtatga aagcatcggt ttccagggcg cttatctggt gctgggtctg gtggcgctgg      5580
687     gcttcacctt aatttccgtg ttcacgctta gcggccccgg cccgctttcc ctgctgcgtc      5640
688     gtcaggtgaa tgaagtcgct taagcaatca atgtcggatg cggcgcgacg cttatccgac      5700
689     caacatatca taacggagtg atcgcattga acatgccaat gaccgaaaga ataagagcag      5760
690     gcaagctatt taccgatatg tgcgaaggct taccggaaaa aagacttcgt gggaaaacgt      5820
691     taatgtatga gtttaatcac tcgcatccat cagaagttga aaaaagagaa agcctgatta      5880
692     aagaaatgtt tgccacggta ggggaaaacg cctgggtaga accgcctgtc tatttctctt      5940
693     acggttccaa catccatata ggccgcaatt tttatgcaaa tttcaattta accattgtcg      6000
694     atgactacac ggtaacaatc ggtgataacg tactgattgc acccaacgtt actctttccg      6060
695     ttacgggaca ccctgtacac catgaattga gaaaaaacgg cgagatgtac tcttttccga      6120
696     taacgattgg caataacgtc tggatcggaa gtcatgtggt tattaatcca ggcgtcacca      6180
697     tcggggataa ttctgttatt ggcgcgggta gtatcgtcac aaaagacatt ccaccaaacg      6240
698     tcgtggcggc tggcgttcct tgtcgggtta ttcgcgaaat aaacgaccgg gataagcact      6300
699     attatttcaa agattataaa gttgaatcgt cagtttaaat tataaaaatt gcctgatacg      6360
700     ctgcgcttat caggcctaca agttcagcga tctacattag ccgcatccgg catgaacaaa      6420
701     gcgcaggaac aagcgtcgca tcatgcctct ttgacccaca gctgcggaaa acgtactggt      6480
702     gcaaaacgca gggttatgat catcagccca acgacgcaca gcgcatgaaa tgcccagtcc      6540
703     atcaggtaat tgccgctgat actacgcagc acgccagaaa accacggggc aagcccggcg      6600
704     atgataaaac cgattccctg cataaacgcc accagcttgc cagcaatagc cggttgcaca      6660
705     gagtgatcga gcgccagcag caaacagagc ggaaacgcgc cgcccagacc taacccacac      6720
706     accatcgccc acaataccgg caattgcatc ggcagccaga taaagccgca gaaccccacc      6780
707     agttgtaaca ccagcgccag cattaacagt ttgcgccgat cctgatggcg agccatagca      6840
708     ggcatcagca aagctcctgc ggcttgccca agcgtcatca atgccagtaa ggaaccgctg      6900
709     tactgcgcgc tggcaccaat ctcaatatag aaagcgggta accaggcaat caggctggcg      6960
710     taaccgccgt taatcagacc gaagtaaaca cccagcgtcc acgcgcgggg agtgaatacc      7020
711     acgcgaaccg gagtggttgt tgtcttgtgg gaagaggcga cctcgcgggc gctttgccac      7080
712     caccaggcaa agagcgcaac aacggcaggc agcgccacca ggcgagtgtt tgataccagg      7140
713     tttcgctatg ttgaactaac cagggcgtta tggcggcacc aagcccaccg ccgcccatca      7200
714     gagccgcgga ccacagcccc atcaccagtg gcgtgcgctg ctgaaaccgc cgtttaatca      7260
715     ccgaagcatc accgcctgaa tgatgccgat ccccacccca ccaagcagtg cgctgctaag      7320
716     cagcagcgca ctttgcgggt aaagctcacg catcaatgca ccgacggcaa tcagcaacag      7380
717     actgatggcg acactgcgac gttcgctgac atgctgatga agccagcttc cggccagcgc      7440
718     cagcccgccc atggtaacca ccggcagagc ggtcgac                               7477
719//
720ID   X51872; SV 1; linear; genomic DNA; STD; PRO; 1832 BP.
721XX
722AC   X51872;
723XX
724DT   17-APR-1990 (Rel. 23, Created)
725DT   05-JUL-1999 (Rel. 60, Last updated, Version 5)
726XX
727DE   Escherichia coli lacA gene for thiogalactoside transacetylase
728XX
729KW   lac operon; lacA gene; lacY gene; thiogalactoside transacetylase.
730XX
731OS   Escherichia coli
732OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
733OC   Enterobacteriaceae; Escherichia.
734XX
735RN   [1]
736RC   (1-1832)
737RP   1-1832
738RX   DOI; 10.1073/pnas.82.19.6414.
739RX   PUBMED; 3901000.
740RA   Hediger M.A., Johnson D.F., Nierlich D.P., Zabin I.;
741RT   "DNA sequence of the lactose operon: the lacA gene and the transcriptional
742RT   termination region";
743RL   Proc. Natl. Acad. Sci. U.S.A. 82(19):6414-6418(1985).
744XX
745FH   Key             Location/Qualifiers
746FH
747FT   source          1..1832
748FT                   /organism="Escherichia coli"
749FT                   /mol_type="genomic DNA"
750FT                   /db_xref="taxon:562"
751FT   CDS             <1..18
752FT                   /codon_start=1
753FT                   /transl_table=11
754FT                   /product="lacY gene product"
755FT                   /protein_id="CAA36161.1"
756FT                   /translation="VNEVA"
757FT   CDS             82..693
758FT                   /transl_table=11
759FT                   /gene="lacA"
760FT                   /product="thiogalactoside transacetylase"
761FT                   /db_xref="GOA:P07464"
762FT                   /db_xref="InterPro:IPR001451"
763FT                   /db_xref="InterPro:IPR011004"
764FT                   /db_xref="InterPro:IPR018357"
765FT                   /db_xref="InterPro:IPR024688"
766FT                   /db_xref="PDB:1KQA"
767FT                   /db_xref="PDB:1KRR"
768FT                   /db_xref="PDB:1KRU"
769FT                   /db_xref="PDB:1KRV"
770FT                   /db_xref="UniProtKB/Swiss-Prot:P07464"
771FT                   /protein_id="CAA36162.1"
772FT                   /translation="MNMPMTERIRAGKLFTDMCEGLPEKRLRGKTLMYEFNHSHPSEVE
773FT                   KRESLIKEMFATVGENAWVEPPVYFSYGSNIHIGRNFYANFNLTIVDDYTVTIGDNVLI
774FT                   APNVTLSVTGHPVHHELRKNGEMYSFPITIGNNVWIGSHVVINPGVTIGDNSVIGAGSI
775FT                   VTKDIPPNVVAAGVPCRVIREINDRDKHYYFKDYKVESSV"
776XX
777SQ   Sequence 1832 BP; 519 A; 510 C; 450 G; 353 T; 0 other;
778     gtgaatgaag tcgcttaagc aatcaatgtc ggatgcggcg cgacgcttat ccgaccaaca        60
779     tatcataacg gagtgatcgc attgaacatg ccaatgaccg aaagaataag agcaggcaag       120
780     ctatttaccg atatgtgcga aggcttaccg gaaaaaagac ttcgtgggaa aacgttaatg       180
781     tatgagttta atcactcgca tccatcagaa gttgaaaaaa gagaaagcct gattaaagaa       240
782     atgtttgcca cggtagggga aaacgcctgg gtagaaccgc ctgtctattt ctcttacggt       300
783     tccaacatcc atataggccg caatttttat gcaaatttca atttaaccat tgtcgatgac       360
784     tacacggtaa caatcggtga taacgtactg attgcaccca acgttactct ttccgttacg       420
785     ggacaccctg tacaccatga attgagaaaa aacggcgaga tgtactcttt tccgataacg       480
786     attggcaata acgtctggat cggaagtcat gtggttatta atccaggcgt caccatcggg       540
787     gataattctg ttattggcgc gggtagtatc gtcacaaaag acattccacc aaacgtcgtg       600
788     gcggctggcg ttccttgtcg ggttattcgc gaaataaacg accgggataa gcactattat       660
789     ttcaaagatt ataaagttga atcgtcagtt taaattataa aaattgcctg atacgctgcg       720
790     cttatcaggc ctacaagttc agcgatctac attagccgca tccggcatga acaaagcgca       780
791     ggaacaagcg tcgcatcatg cctctttgac ccacagctgc ggaaaacgta ctggtgcaaa       840
792     acgcagggtt atgatcatca gcccaacgac gcacagcgca tgaaatgccc agtccatcag       900
793     gtaattgccg ctgatactac gcagcacgcc agaaaaccac ggggcaagcc cggcgatgat       960
794     aaaaccgatt ccctgcataa acgccaccag cttgccagca atagccggtt gcacagagtg      1020
795     atcgagcgcc agcagcaaac agagcggaaa cgcgccgccc agacctaacc cacacaccat      1080
796     cgcccacaat accggcaatt gcatcggcag ccagataaag ccgcagaacc ccaccagttg      1140
797     taacaccagc gccagcatta acagtttgcg ccgatcctga tggcgagcca tagcaggcat      1200
798     cagcaaagct cctgcggctt gcccaagcgt catcaatgcc agtaaggaac cgctgtactg      1260
799     cgcgctggca ccaatctcaa tatagaaagc gggtaaccag gcaatcaggc tggcgtaacc      1320
800     gccgttaatc agaccgaagt aaacacccag cgtccacgcg cggggagtga ataccacgcg      1380
801     aaccggagtg gttgttgtct tgtgggaaga ggcgacctcg cgggcgcttt gccaccacca      1440
802     ggcaaagagc gcaacaacgg caggcagcgc caccaggcga gtgtttgata ccaggtttcg      1500
803     ctatgttgaa ctaaccaggg cgttatggcg gcaccaagcc caccgccgcc catcagagcc      1560
804     gcggaccaca gccccatcac cagtggcgtg cgctgctgaa accgccgttt aatcaccgaa      1620
805     gcatcaccgc ctgaatgatg ccgatcccca ccccaccaag cagtgcgctg ctaagcagca      1680
806     gcgcactttg cgggtaaagc tcacgcatca atgcaccgac ggcaatcagc aacagactga      1740
807     tggcgacact gcgacgttcg ctgacatgct gatgaagcca gcttccggcc agcgccagcc      1800
808     cgcccatggt aaccaccggc agagcggtcg ac                                    1832
809//
810ID   V00294; SV 1; linear; genomic DNA; STD; PRO; 1113 BP.
811XX
812AC   V00294;
813XX
814DT   09-JUN-1982 (Rel. 01, Created)
815DT   10-FEB-1999 (Rel. 58, Last updated, Version 2)
816XX
817DE   E. coli laci gene (codes for the lac repressor).
818XX
819KW   DNA binding protein; repressor.
820XX
821OS   Escherichia coli
822OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
823OC   Enterobacteriaceae; Escherichia.
824XX
825RN   [1]
826RP   1-1113
827RX   DOI; 10.1038/274765a0.
828RX   PUBMED; 355891.
829RA   Farabaugh P.J.;
830RT   "Sequence of the lacI gene";
831RL   Nature 274(5673):765-769(1978).
832XX
833CC   KST ECO.LACI
834XX
835FH   Key             Location/Qualifiers
836FH
837FT   source          1..1113
838FT                   /organism="Escherichia coli"
839FT                   /mol_type="genomic DNA"
840FT                   /db_xref="taxon:562"
841FT   CDS             31..1113
842FT                   /transl_table=11
843FT                   /note="reading frame"
844FT                   /db_xref="GOA:P03023"
845FT                   /db_xref="InterPro:IPR000843"
846FT                   /db_xref="InterPro:IPR010982"
847FT                   /db_xref="PDB:1CJG"
848FT                   /db_xref="PDB:1EFA"
849FT                   /db_xref="PDB:1JWL"
850FT                   /db_xref="PDB:1JYE"
851FT                   /db_xref="PDB:1JYF"
852FT                   /db_xref="PDB:1L1M"
853FT                   /db_xref="PDB:1LBG"
854FT                   /db_xref="PDB:1LBH"
855FT                   /db_xref="PDB:1LBI"
856FT                   /db_xref="PDB:1LCC"
857FT                   /db_xref="PDB:1LCD"
858FT                   /db_xref="PDB:1LQC"
859FT                   /db_xref="PDB:1LTP"
860FT                   /db_xref="PDB:1OSL"
861FT                   /db_xref="PDB:1TLF"
862FT                   /db_xref="PDB:1Z04"
863FT                   /db_xref="PDB:2BJC"
864FT                   /db_xref="PDB:2KEI"
865FT                   /db_xref="PDB:2KEJ"
866FT                   /db_xref="PDB:2KEK"
867FT                   /db_xref="PDB:2P9H"
868FT                   /db_xref="PDB:2PAF"
869FT                   /db_xref="PDB:2PE5"
870FT                   /db_xref="PDB:3EDC"
871FT                   /db_xref="UniProtKB/Swiss-Prot:P03023"
872FT                   /protein_id="CAA23569.1"
873FT                   /translation="MKPVTLYDVAEYAGVSYQTVSRVVNQASHVSAKTREKVEAAMAEL
874FT                   NYIPNRVAQQLAGKQSLLIGVATSSLALHAPSQIVAAIKSRADQLGASVVVSMVERSGV
875FT                   EACKAAVHNLLAQRVSGLIINYPLDDQDAIAVEAACTNVPALFLDVSDQTPINSIIFSH
876FT                   EDGTRLGVEHLVALGHQQIALLAGPLSSVSARLRLAGWHKYLTRNQIQPIAEREGDWSA
877FT                   MSGFQQTMQMLNEGIVPTAMLVANDQMALGAMRAITESGLRVGADISVVGYDDTEDSSC
878FT                   YIPPSTTIKQDFRLLGQTSVDRLLQLSQGQAVKGNQLLPVSLVKRKTTLAPNTQTASPR
879FT                   ALADSLMQLARQVSRLESGQ"
880XX
881SQ   Sequence 1113 BP; 249 A; 304 C; 322 G; 238 T; 0 other;
882     ccggaagaga gtcaattcag ggtggtgaat gtgaaaccag taacgttata cgatgtcgca        60
883     gagtatgccg gtgtctctta tcagaccgtt tcccgcgtgg tgaaccaggc cagccacgtt       120
884     tctgcgaaaa cgcgggaaaa agtggaagcg gcgatggcgg agctgaatta cattcccaac       180
885     cgcgtggcac aacaactggc gggcaaacag tcgttgctga ttggcgttgc cacctccagt       240
886     ctggccctgc acgcgccgtc gcaaattgtc gcggcgatta aatctcgcgc cgatcaactg       300
887     ggtgccagcg tggtggtgtc gatggtagaa cgaagcggcg tcgaagcctg taaagcggcg       360
888     gtgcacaatc ttctcgcgca acgcgtcagt gggctgatca ttaactatcc gctggatgac       420
889     caggatgcca ttgctgtgga agctgcctgc actaatgttc cggcgttatt tcttgatgtc       480
890     tctgaccaga cacccatcaa cagtattatt ttctcccatg aagacggtac gcgactgggc       540
891     gtggagcatc tggtcgcatt gggtcaccag caaatcgcgc tgttagcggg cccattaagt       600
892     tctgtctcgg cgcgtctgcg tctggctggc tggcataaat atctcactcg caatcaaatt       660
893     cagccgatag cggaacggga aggcgactgg agtgccatgt ccggttttca acaaaccatg       720
894     caaatgctga atgagggcat cgttcccact gcgatgctgg ttgccaacga tcagatggcg       780
895     ctgggcgcaa tgcgcgccat taccgagtcc gggctgcgcg ttggtgcgga tatctcggta       840
896     gtgggatacg acgataccga agacagctca tgttatatcc cgccgtcaac caccatcaaa       900
897     caggattttc gcctgctggg gcaaaccagc gtggaccgct tgctgcaact ctctcagggc       960
898     caggcggtga agggcaatca gctgttgccc gtctcactgg tgaaaagaaa aaccaccctg      1020
899     gcgcccaata cgcaaaccgc ctctccccgc gcgttggccg attcattaat gcagctggca      1080
900     cgacaggttt cccgactgga aagcgggcag tga                                   1113
901//
902ID   V00295; SV 1; linear; genomic DNA; STD; PRO; 1500 BP.
903XX
904AC   V00295;
905XX
906DT   09-JUN-1982 (Rel. 01, Created)
907DT   07-JUL-1995 (Rel. 44, Last updated, Version 4)
908XX
909DE   E. coli lacY gene (codes for lactose permease).
910XX
911KW   membrane protein.
912XX
913OS   Escherichia coli
914OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
915OC   Enterobacteriaceae; Escherichia.
916XX
917RN   [1]
918RP   1-1500
919RX   DOI; 10.1038/283541a0.
920RX   PUBMED; 6444453.
921RA   Buechel D.E., Gronenborn B., Mueller-Hill B.;
922RT   "Sequence of the lactose permease gene";
923RL   Nature 283(5747):541-545(1980).
924XX
925CC   lacZ is a beta-galactosidase and lacA is transacetylase.
926CC   KST ECO.LACY
927XX
928FH   Key             Location/Qualifiers
929FH
930FT   source          1..1500
931FT                   /organism="Escherichia coli"
932FT                   /mol_type="genomic DNA"
933FT                   /db_xref="taxon:562"
934FT   CDS             <1..54
935FT                   /codon_start=1
936FT                   /transl_table=11
937FT                   /note="reading frame (lacZ)"
938FT                   /db_xref="GOA:P00722"
939FT                   /db_xref="InterPro:IPR004199"
940FT                   /db_xref="InterPro:IPR006101"
941FT                   /db_xref="InterPro:IPR006102"
942FT                   /db_xref="InterPro:IPR006103"
943FT                   /db_xref="InterPro:IPR006104"
944FT                   /db_xref="InterPro:IPR008979"
945FT                   /db_xref="InterPro:IPR011013"
946FT                   /db_xref="InterPro:IPR013781"
947FT                   /db_xref="InterPro:IPR013812"
948FT                   /db_xref="InterPro:IPR014718"
949FT                   /db_xref="InterPro:IPR017853"
950FT                   /db_xref="InterPro:IPR023230"
951FT                   /db_xref="InterPro:IPR023232"
952FT                   /db_xref="InterPro:IPR023933"
953FT                   /db_xref="PDB:1BGL"
954FT                   /db_xref="PDB:1BGM"
955FT                   /db_xref="PDB:1DP0"
956FT                   /db_xref="PDB:1F49"
957FT                   /db_xref="PDB:1F4A"
958FT                   /db_xref="PDB:1F4H"
959FT                   /db_xref="PDB:1GHO"
960FT                   /db_xref="PDB:1HN1"
961FT                   /db_xref="PDB:1JYN"
962FT                   /db_xref="PDB:1JYV"
963FT                   /db_xref="PDB:1JYW"
964FT                   /db_xref="PDB:1JYX"
965FT                   /db_xref="PDB:1JYY"
966FT                   /db_xref="PDB:1JYZ"
967FT                   /db_xref="PDB:1JZ0"
968FT                   /db_xref="PDB:1JZ1"
969FT                   /db_xref="PDB:1JZ2"
970FT                   /db_xref="PDB:1JZ3"
971FT                   /db_xref="PDB:1JZ4"
972FT                   /db_xref="PDB:1JZ5"
973FT                   /db_xref="PDB:1JZ6"
974FT                   /db_xref="PDB:1JZ7"
975FT                   /db_xref="PDB:1JZ8"
976FT                   /db_xref="PDB:1PX3"
977FT                   /db_xref="PDB:1PX4"
978FT                   /db_xref="PDB:3CZJ"
979FT                   /db_xref="PDB:3DYM"
980FT                   /db_xref="PDB:3DYO"
981FT                   /db_xref="PDB:3DYP"
982FT                   /db_xref="PDB:3E1F"
983FT                   /db_xref="PDB:3I3B"
984FT                   /db_xref="PDB:3I3D"
985FT                   /db_xref="PDB:3I3E"
986FT                   /db_xref="PDB:3IAP"
987FT                   /db_xref="PDB:3IAQ"
988FT                   /db_xref="PDB:3MUY"
989FT                   /db_xref="PDB:3MUZ"
990FT                   /db_xref="PDB:3MV0"
991FT                   /db_xref="PDB:3MV1"
992FT                   /db_xref="PDB:3SEP"
993FT                   /db_xref="PDB:3T08"
994FT                   /db_xref="PDB:3T09"
995FT                   /db_xref="PDB:3T0A"
996FT                   /db_xref="PDB:3T0B"
997FT                   /db_xref="PDB:3T0D"
998FT                   /db_xref="PDB:3T2O"
999FT                   /db_xref="PDB:3T2P"
1000FT                   /db_xref="PDB:3T2Q"
1001FT                   /db_xref="PDB:3VD3"
1002FT                   /db_xref="PDB:3VD4"
1003FT                   /db_xref="PDB:3VD5"
1004FT                   /db_xref="PDB:3VD7"
1005FT                   /db_xref="PDB:3VD9"
1006FT                   /db_xref="PDB:3VDA"
1007FT                   /db_xref="PDB:3VDB"
1008FT                   /db_xref="PDB:3VDC"
1009FT                   /db_xref="UniProtKB/Swiss-Prot:P00722"
1010FT                   /protein_id="CAA23570.1"
1011FT                   /translation="FQLSAGRYHYQLVWCQK"
1012FT   CDS             106..1359
1013FT                   /transl_table=11
1014FT                   /note="reading frame (lacY)"
1015FT                   /db_xref="GOA:P02920"
1016FT                   /db_xref="InterPro:IPR000576"
1017FT                   /db_xref="InterPro:IPR016196"
1018FT                   /db_xref="InterPro:IPR018457"
1019FT                   /db_xref="InterPro:IPR020846"
1020FT                   /db_xref="InterPro:IPR022814"
1021FT                   /db_xref="PDB:1M2U"
1022FT                   /db_xref="PDB:1PV6"
1023FT                   /db_xref="PDB:1PV7"
1024FT                   /db_xref="PDB:2CFP"
1025FT                   /db_xref="PDB:2CFQ"
1026FT                   /db_xref="PDB:2V8N"
1027FT                   /db_xref="PDB:2Y5Y"
1028FT                   /db_xref="UniProtKB/Swiss-Prot:P02920"
1029FT                   /protein_id="CAA23571.1"
1030FT                   /translation="MYYLKNTNFWMFGLFFFFYFFIMGAYFPFFPIWLHDINHISKSDT
1031FT                   GIIFAAISLFSLLFQPLFGLLSDKLGLRKYLLWIITGMLVMFAPFFIFIFGPLLQYNIL
1032FT                   VGSIVGGIYLGFCFNAGAPAVEAFIEKVSRRSNFEFGRARMFGCVGWALCASIVGIMFT
1033FT                   INNQFVFWLGSGCALILAVLLFFAKTDAPSSATVANAVGANHSAFSLKLALELFRQPKL
1034FT                   WFLSLYVIGVSCTYDVFDQQFANFFTSFFATGEQGTRVFGYVTTMGELLNASIMFFAPL
1035FT                   IINRIGGKNALLLAGTIMSVRIIGSSFATSALEVVILKTLHMFEVPFLLVGCFKYITSQ
1036FT                   FEVRFSATIYLVCFCFFKQLAMIFMSVLAGNMYESIGFQGAYLVLGLVALGFTLISVFT
1037FT                   LSGPGPLSLLRRQVNEVA"
1038FT   CDS             1423..>1500
1039FT                   /transl_table=11
1040FT                   /note="reading frame (lacA)"
1041FT                   /db_xref="GOA:P07464"
1042FT                   /db_xref="InterPro:IPR001451"
1043FT                   /db_xref="InterPro:IPR011004"
1044FT                   /db_xref="InterPro:IPR018357"
1045FT                   /db_xref="InterPro:IPR024688"
1046FT                   /db_xref="PDB:1KQA"
1047FT                   /db_xref="PDB:1KRR"
1048FT                   /db_xref="PDB:1KRU"
1049FT                   /db_xref="PDB:1KRV"
1050FT                   /db_xref="UniProtKB/Swiss-Prot:P07464"
1051FT                   /protein_id="CAA23572.1"
1052FT                   /translation="MNMPMTERIRAGKLFTDMCEGLPEKR"
1053XX
1054SQ   Sequence 1500 BP; 315 A; 342 C; 357 G; 486 T; 0 other;
1055     ttccagctga gcgccggtcg ctaccattac cagttggtct ggtgtcaaaa ataataataa        60
1056     ccgggcaggc catgtctgcc cgtatttcgc gtaaggaaat ccattatgta ctatttaaaa       120
1057     aacacaaact tttggatgtt cggtttattc tttttctttt acttttttat catgggagcc       180
1058     tacttcccgt ttttcccgat ttggctacat gacatcaacc atatcagcaa aagtgatacg       240
1059     ggtattattt ttgccgctat ttctctgttc tcgctattat tccaaccgct gtttggtctg       300
1060     ctttctgaca aactcgggct gcgcaaatac ctgctgtgga ttattaccgg catgttagtg       360
1061     atgtttgcgc cgttctttat ttttatcttc gggccactgt tacaatacaa cattttagta       420
1062     ggatcgattg ttggtggtat ttatctaggc ttttgtttta acgccggtgc gccagcagta       480
1063     gaggcattta ttgagaaagt cagccgtcgc agtaatttcg aatttggtcg cgcgcggatg       540
1064     tttggctgtg ttggctgggc gctgtgtgcc tcgattgtcg gcatcatgtt caccatcaat       600
1065     aatcagtttg ttttctggct gggctctggc tgtgcactca tcctcgccgt tttactcttt       660
1066     ttcgccaaaa cggatgcgcc ctcttctgcc acggttgcca atgcggtagg tgccaaccat       720
1067     tcggcattta gccttaagct ggcactggaa ctgttcagac agccaaaact gtggtttttg       780
1068     tcactgtatg ttattggcgt ttcctgcacc tacgatgttt ttgaccaaca gtttgctaat       840
1069     ttctttactt cgttctttgc taccggtgaa cagggtacgc gggtatttgg ctacgtaacg       900
1070     acaatgggcg aattacttaa cgcctcgatt atgttctttg cgccactgat cattaatcgc       960
1071     atcggtggga aaaacgccct gctgctggct ggcactatta tgtctgtacg tattattggc      1020
1072     tcatcgttcg ccacctcagc gctggaagtg gttattctga aaacgctgca tatgtttgaa      1080
1073     gtaccgttcc tgctggtggg ctgctttaaa tatattacca gccagtttga agtgcgtttt      1140
1074     tcagcgacga tttatctggt ctgtttctgc ttctttaagc aactggcgat gatttttatg      1200
1075     tctgtactgg cgggcaatat gtatgaaagc atcggtttcc agggcgctta tctggtgctg      1260
1076     ggtctggtgg cgctgggctt caccttaatt tccgtgttca cgcttagcgg ccccggcccg      1320
1077     ctttccctgc tgcgtcgtca ggtgaatgaa gtcgcttaag caatcaatgt cggatgcggc      1380
1078     gcgacgctta tccgaccaac atatcataac ggagtgatcg cattgaacat gccaatgacc      1440
1079     gaaagaataa gagcaggcaa gctatttacc gatatgtgcg aaggcttacc ggaaaaaaga      1500
1080//
1081ID   V00296; SV 1; linear; genomic DNA; STD; PRO; 3078 BP.
1082XX
1083AC   V00296;
1084XX
1085DT   13-JUL-1983 (Rel. 03, Created)
1086DT   18-APR-2005 (Rel. 83, Last updated, Version 5)
1087XX
1088DE   E. coli gene lacZ coding for beta-galactosidase (EC 3.2.1.23).
1089XX
1090KW   galactosidase.
1091XX
1092OS   Escherichia coli
1093OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
1094OC   Enterobacteriaceae; Escherichia.
1095XX
1096RN   [1]
1097RP   1-3078
1098RX   PUBMED; 6313347.
1099RA   Kalnins A., Otto K., Ruether U., Mueller-Hill B.;
1100RT   "Sequence of the lacZ gene of Escherichia coli";
1101RL   EMBO J. 2(4):593-597(1983).
1102XX
1103RN   [2]
1104RX   PUBMED; 3038536.
1105RA   Zell R., Fritz H.J.;
1106RT   "DNA mismatch-repair in Escherichia coli counteracting the hydrolytic
1107RT   deamination of 5-methyl-cytosine residues";
1108RL   EMBO J. 6(6):1809-1815(1987).
1109XX
1110CC   Data kindly reviewed (18-MAY-1983) by U. Ruether
1111XX
1112FH   Key             Location/Qualifiers
1113FH
1114FT   source          1..3078
1115FT                   /organism="Escherichia coli"
1116FT                   /mol_type="genomic DNA"
1117FT                   /db_xref="taxon:562"
1118FT   CDS             <1..3072
1119FT                   /transl_table=11
1120FT                   /note="galactosidase"
1121FT                   /db_xref="GOA:P00722"
1122FT                   /db_xref="InterPro:IPR004199"
1123FT                   /db_xref="InterPro:IPR006101"
1124FT                   /db_xref="InterPro:IPR006102"
1125FT                   /db_xref="InterPro:IPR006103"
1126FT                   /db_xref="InterPro:IPR006104"
1127FT                   /db_xref="InterPro:IPR008979"
1128FT                   /db_xref="InterPro:IPR011013"
1129FT                   /db_xref="InterPro:IPR013781"
1130FT                   /db_xref="InterPro:IPR013812"
1131FT                   /db_xref="InterPro:IPR014718"
1132FT                   /db_xref="InterPro:IPR017853"
1133FT                   /db_xref="InterPro:IPR023230"
1134FT                   /db_xref="InterPro:IPR023232"
1135FT                   /db_xref="InterPro:IPR023933"
1136FT                   /db_xref="PDB:1BGL"
1137FT                   /db_xref="PDB:1BGM"
1138FT                   /db_xref="PDB:1DP0"
1139FT                   /db_xref="PDB:1F49"
1140FT                   /db_xref="PDB:1F4A"
1141FT                   /db_xref="PDB:1F4H"
1142FT                   /db_xref="PDB:1GHO"
1143FT                   /db_xref="PDB:1HN1"
1144FT                   /db_xref="PDB:1JYN"
1145FT                   /db_xref="PDB:1JYV"
1146FT                   /db_xref="PDB:1JYW"
1147FT                   /db_xref="PDB:1JYX"
1148FT                   /db_xref="PDB:1JYY"
1149FT                   /db_xref="PDB:1JYZ"
1150FT                   /db_xref="PDB:1JZ0"
1151FT                   /db_xref="PDB:1JZ1"
1152FT                   /db_xref="PDB:1JZ2"
1153FT                   /db_xref="PDB:1JZ3"
1154FT                   /db_xref="PDB:1JZ4"
1155FT                   /db_xref="PDB:1JZ5"
1156FT                   /db_xref="PDB:1JZ6"
1157FT                   /db_xref="PDB:1JZ7"
1158FT                   /db_xref="PDB:1JZ8"
1159FT                   /db_xref="PDB:1PX3"
1160FT                   /db_xref="PDB:1PX4"
1161FT                   /db_xref="PDB:3CZJ"
1162FT                   /db_xref="PDB:3DYM"
1163FT                   /db_xref="PDB:3DYO"
1164FT                   /db_xref="PDB:3DYP"
1165FT                   /db_xref="PDB:3E1F"
1166FT                   /db_xref="PDB:3I3B"
1167FT                   /db_xref="PDB:3I3D"
1168FT                   /db_xref="PDB:3I3E"
1169FT                   /db_xref="PDB:3IAP"
1170FT                   /db_xref="PDB:3IAQ"
1171FT                   /db_xref="PDB:3MUY"
1172FT                   /db_xref="PDB:3MUZ"
1173FT                   /db_xref="PDB:3MV0"
1174FT                   /db_xref="PDB:3MV1"
1175FT                   /db_xref="PDB:3SEP"
1176FT                   /db_xref="PDB:3T08"
1177FT                   /db_xref="PDB:3T09"
1178FT                   /db_xref="PDB:3T0A"
1179FT                   /db_xref="PDB:3T0B"
1180FT                   /db_xref="PDB:3T0D"
1181FT                   /db_xref="PDB:3T2O"
1182FT                   /db_xref="PDB:3T2P"
1183FT                   /db_xref="PDB:3T2Q"
1184FT                   /db_xref="PDB:3VD3"
1185FT                   /db_xref="PDB:3VD4"
1186FT                   /db_xref="PDB:3VD5"
1187FT                   /db_xref="PDB:3VD7"
1188FT                   /db_xref="PDB:3VD9"
1189FT                   /db_xref="PDB:3VDA"
1190FT                   /db_xref="PDB:3VDB"
1191FT                   /db_xref="PDB:3VDC"
1192FT                   /db_xref="UniProtKB/Swiss-Prot:P00722"
1193FT                   /protein_id="CAA23573.1"
1194FT                   /translation="TMITDSLAVVLQRRDWENPGVTQLNRLAAHPPFASWRNSEEARTD
1195FT                   RPSQQLRSLNGEWRFAWFPAPEAVPESWLECDLPEADTVVVPSNWQMHGYDAPIYTNVT
1196FT                   YPITVNPPFVPTENPTGCYSLTFNVDESWLQEGQTRIIFDGVNSAFHLWCNGRWVGYGQ
1197FT                   DSRLPSEFDLSAFLRAGENRLAVMVLRWSDGSYLEDQDMWRMSGIFRDVSLLHKPTTQI
1198FT                   SDFHVATRFNDDFSRAVLEAEVQMCGELRDYLRVTVSLWQGETQVASGTAPFGGEIIDE
1199FT                   RGGYADRVTLRLNVENPKLWSAEIPNLYRAVVELHTADGTLIEAEACDVGFREVRIENG
1200FT                   LLLLNGKPLLIRGVNRHEHHPLHGQVMDEQTMVQDILLMKQNNFNAVRCSHYPNHPLWY
1201FT                   TLCDRYGLYVVDEANIETHGMVPMNRLTDDPRWLPAMSERVTRMVQRDRNHPSVIIWSL
1202FT                   GNESGHGANHDALYRWIKSVDPSRPVQYEGGGADTTATDIICPMYARVDEDQPFPAVPK
1203FT                   WSIKKWLSLPGETRPLILCEYAHAMGNSLGGFAKYWQAFRQYPRLQGGFVWDWVDQSLI
1204FT                   KYDENGNPWSAYGGDFGDTPNDRQFCMNGLVFADRTPHPALTEAKHQQQFFQFRLSGQT
1205FT                   IEVTSEYLFRHSDNELLHWMVALDGKPLASGEVPLDVAPQGKQLIELPELPQPESAGQL
1206FT                   WLTVRVVQPNATAWSEAGHISAWQQWRLAENLSVTLPAASHAIPHLTTSEMDFCIELGN
1207FT                   KRWQFNRQSGFLSQMWIGDKKQLLTPLRDQFTRAPLDNDIGVSEATRIDPNAWVERWKA
1208FT                   AGHYQAEAALLQCTADTLADAVLITTAHAWQHQGKTLFISRKTYRIDGSGQMAITVDVE
1209FT                   VASDTPHPARIGLNCQLAQVAERVNWLGLGPQENYPDRLTAACFDRWDLPLSDMYTPYV
1210FT                   FPSENGLRCGTRELNYGPHQWRGDFQFNISRYSQQQLMETSHRHLLHAEEGTWLNIDGF
1211FT                   HMGIGGDDSWSPSVSAEFQLSAGRYHYQLVWCQK"
1212FT   mat_peptide     1..3069
1213XX
1214SQ   Sequence 3078 BP; 682 A; 841 C; 886 G; 669 T; 0 other;
1215     accatgatta cggattcact ggccgtcgtt ttacaacgtc gtgactggga aaaccctggc        60
1216     gttacccaac ttaatcgcct tgcagcacat ccccctttcg ccagctggcg taatagcgaa       120
1217     gaggcccgca ccgatcgccc ttcccaacag ttgcgcagcc tgaatggcga atggcgcttt       180
1218     gcctggtttc cggcaccaga agcggtgccg gaaagctggc tggagtgcga tcttcctgag       240
1219     gccgatactg tcgtcgtccc ctcaaactgg cagatgcacg gttacgatgc gcccatctac       300
1220     accaacgtaa cctatcccat tacggtcaat ccgccgtttg ttcccacgga gaatccgacg       360
1221     ggttgttact cgctcacatt taatgttgat gaaagctggc tacaggaagg ccagacgcga       420
1222     attatttttg atggcgttaa ctcggcgttt catctgtggt gcaacgggcg ctgggtcggt       480
1223     tacggccagg acagtcgttt gccgtctgaa tttgacctga gcgcattttt acgcgccgga       540
1224     gaaaaccgcc tcgcggtgat ggtgctgcgt tggagtgacg gcagttatct ggaagatcag       600
1225     gatatgtggc ggatgagcgg cattttccgt gacgtctcgt tgctgcataa accgactaca       660
1226     caaatcagcg atttccatgt tgccactcgc tttaatgatg atttcagccg cgctgtactg       720
1227     gaggctgaag ttcagatgtg cggcgagttg cgtgactacc tacgggtaac agtttcttta       780
1228     tggcagggtg aaacgcaggt cgccagcggc accgcgcctt tcggcggtga aattatcgat       840
1229     gagcgtggtg gttatgccga tcgcgtcaca ctacgtctga acgtcgaaaa cccgaaactg       900
1230     tggagcgccg aaatcccgaa tctctatcgt gcggtggttg aactgcacac cgccgacggc       960
1231     acgctgattg aagcagaagc ctgcgatgtc ggtttccgcg aggtgcggat tgaaaatggt      1020
1232     ctgctgctgc tgaacggcaa gccgttgctg attcgaggcg ttaaccgtca cgagcatcat      1080
1233     cctctgcatg gtcaggtcat ggatgagcag acgatggtgc aggatatcct gctgatgaag      1140
1234     cagaacaact ttaacgccgt gcgctgttcg cattatccga accatccgct gtggtacacg      1200
1235     ctgtgcgacc gctacggcct gtatgtggtg gatgaagcca atattgaaac ccacggcatg      1260
1236     gtgccaatga atcgtctgac cgatgatccg cgctggctac cggcgatgag cgaacgcgta      1320
1237     acgcgaatgg tgcagcgcga tcgtaatcac ccgagtgtga tcatctggtc gctggggaat      1380
1238     gaatcaggcc acggcgctaa tcacgacgcg ctgtatcgct ggatcaaatc tgtcgatcct      1440
1239     tcccgcccgg tgcagtatga aggcggcgga gccgacacca cggccaccga tattatttgc      1500
1240     ccgatgtacg cgcgcgtgga tgaagaccag cccttcccgg ctgtgccgaa atggtccatc      1560
1241     aaaaaatggc tttcgctacc tggagagacg cgcccgctga tcctttgcga atacgcccac      1620
1242     gcgatgggta acagtcttgg cggtttcgct aaatactggc aggcgtttcg tcagtatccc      1680
1243     cgtttacagg gcggcttcgt ctgggactgg gtggatcagt cgctgattaa atatgatgaa      1740
1244     aacggcaacc cgtggtcggc ttacggcggt gattttggcg atacgccgaa cgatcgccag      1800
1245     ttctgtatga acggtctggt ctttgccgac cgcacgccgc atccagcgct gacggaagca      1860
1246     aaacaccagc agcagttttt ccagttccgt ttatccgggc aaaccatcga agtgaccagc      1920
1247     gaatacctgt tccgtcatag cgataacgag ctcctgcact ggatggtggc gctggatggt      1980
1248     aagccgctgg caagcggtga agtgcctctg gatgtcgctc cacaaggtaa acagttgatt      2040
1249     gaactgcctg aactaccgca gccggagagc gccgggcaac tctggctcac agtacgcgta      2100
1250     gtgcaaccga acgcgaccgc atggtcagaa gccgggcaca tcagcgcctg gcagcagtgg      2160
1251     cgtctggcgg aaaacctcag tgtgacgctc cccgccgcgt cccacgccat cccgcatctg      2220
1252     accaccagcg aaatggattt ttgcatcgag ctgggtaata agcgttggca atttaaccgc      2280
1253     cagtcaggct ttctttcaca gatgtggatt ggcgataaaa aacaactgct gacgccgctg      2340
1254     cgcgatcagt tcacccgtgc accgctggat aacgacattg gcgtaagtga agcgacccgc      2400
1255     attgacccta acgcctgggt cgaacgctgg aaggcggcgg gccattacca ggccgaagca      2460
1256     gcgttgttgc agtgcacggc agatacactt gctgatgcgg tgctgattac gaccgctcac      2520
1257     gcgtggcagc atcaggggaa aaccttattt atcagccgga aaacctaccg gattgatggt      2580
1258     agtggtcaaa tggcgattac cgttgatgtt gaagtggcga gcgatacacc gcatccggcg      2640
1259     cggattggcc tgaactgcca gctggcgcag gtagcagagc gggtaaactg gctcggatta      2700
1260     gggccgcaag aaaactatcc cgaccgcctt actgccgcct gttttgaccg ctgggatctg      2760
1261     ccattgtcag acatgtatac cccgtacgtc ttcccgagcg aaaacggtct gcgctgcggg      2820
1262     acgcgcgaat tgaattatgg cccacaccag tggcgcggcg acttccagtt caacatcagc      2880
1263     cgctacagtc aacagcaact gatggaaacc agccatcgcc atctgctgca cgcggaagaa      2940
1264     ggcacatggc tgaatatcga cggtttccat atggggattg gtggcgacga ctcctggagc      3000
1265     ccgtcagtat cggcggaatt ccagctgagc gccggtcgct accattacca gttggtctgg      3060
1266     tgtcaaaaat aataataa                                                    3078
1267//
1268ID   V00307; SV 1; linear; genomic DNA; STD; PRO; 2271 BP.
1269XX
1270AC   V00307; J01654;
1271XX
1272DT   09-JUN-1982 (Rel. 01, Created)
1273DT   01-OCT-1996 (Rel. 49, Last updated, Version 8)
1274XX
1275DE   E. coli ompA gene (codes for the outer membrane protein II*).
1276XX
1277KW   membrane protein; unidentified reading frame.
1278XX
1279OS   Escherichia coli
1280OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
1281OC   Enterobacteriaceae; Escherichia.
1282XX
1283RN   [1]
1284RP   1-2271
1285RX   DOI; 10.1093/nar/8.13.3011.
1286RX   PUBMED; 6253901.
1287RA   Beck E., Bremer E.;
1288RT   "Nucleotide sequence of the gene ompA coding the outer membrane protein II
1289RT   of Escherichia coli K-12";
1290RL   Nucleic Acids Res. 8(13):3011-3027(1980).
1291XX
1292RN   [2]
1293RP   783-1317
1294RX   DOI; 10.1073/pnas.77.7.3845.
1295RX   PUBMED; 7001445.
1296RA   Movva N.R., Nakamura K., Inouye M.;
1297RT   "Regulatory region of the gene for the ompA protein, a major outer membrane
1298RT   protein of Escherichia coli";
1299RL   Proc. Natl. Acad. Sci. U.S.A. 77(7):3845-3849(1980).
1300XX
1301DR   GOA; P0A8N0.
1302DR   InterPro; IPR009390; Ter_macrodom_MatS-bd_MatP.
1303DR   UniProtKB/Swiss-Prot; P0A8N0; MATP_ECOLI.
1304XX
1305CC   KST ECO.OMPA
1306XX
1307FH   Key             Location/Qualifiers
1308FH
1309FT   source          1..2271
1310FT                   /organism="Escherichia coli"
1311FT                   /mol_type="genomic DNA"
1312FT                   /db_xref="taxon:562"
1313FT   CDS             172..669
1314FT                   /transl_table=11
1315FT                   /note="reading frame (unknown protein)"
1316FT                   /db_xref="GOA:P0AFZ5"
1317FT                   /db_xref="InterPro:IPR004596"
1318FT                   /db_xref="UniProtKB/Swiss-Prot:P0AFZ5"
1319FT                   /protein_id="CAA23587.1"
1320FT                   /translation="MYTSGYAHRSSSFSSAASKIARVSTENTTAGLISEVVYREDQPMM
1321FT                   TQLLLLPLLQQLGQQSRWQLWLTPQQKLSREWVQASGLPLTKVMQISQLSPCHTVESMV
1322FT                   RALRTGNYSVVIGWLADDLTEEEHAEVVDAANEGNAMGFIIHSGKRILSRHETTFRAKN
1323FT                   SL"
1324FT   misc_difference 906..906
1325FT                   /note="may be missing [2]"
1326FT                   /note="conflict"
1327FT                   /citation=[2]
1328FT   CDS             1037..2077
1329FT                   /transl_table=11
1330FT                   /gene="ompA"
1331FT                   /product="ompA protein"
1332FT                   /db_xref="GOA:P0A910"
1333FT                   /db_xref="InterPro:IPR000498"
1334FT                   /db_xref="InterPro:IPR002368"
1335FT                   /db_xref="InterPro:IPR006664"
1336FT                   /db_xref="InterPro:IPR006665"
1337FT                   /db_xref="InterPro:IPR006690"
1338FT                   /db_xref="InterPro:IPR011250"
1339FT                   /db_xref="PDB:1BXW"
1340FT                   /db_xref="PDB:1G90"
1341FT                   /db_xref="PDB:1QJP"
1342FT                   /db_xref="PDB:2GE4"
1343FT                   /db_xref="PDB:2JMM"
1344FT                   /db_xref="PDB:3NB3"
1345FT                   /db_xref="UniProtKB/Swiss-Prot:P0A910"
1346FT                   /protein_id="CAA23588.1"
1347FT                   /translation="MKKTAIAIAVALAGFATVAQAAPKDNTWYTGAKLGWSQYHDTGFI
1348FT                   NNNGPTHENQLGAGAFGGYQVNPYVGFEMGYDWLGRMPYKGSVENGAYKAQGVQLTAKL
1349FT                   GYPITDDLDIYTRLGGMVWRADTKSNVYGKNHDTGVSPVFAGGVEYAITPEIATRLEYQ
1350FT                   WTNNIGDAHTIGTRPDNGMLSLGVSYRFGQGEAAPVVAPAPAPAPEVQTKHFTLKSDVL
1351FT                   FNFNKATLKPEGQAALDQLYSQLSNLDPKDGSVVVLGYTDRIGSDAYNQGLSERRAQSV
1352FT                   VDYLISKGIPADKISARGMGESNPVTGNTCDNVKQRAALIDCLAPDRRVEIEVKGIKDV
1353FT                   VTQPQA"
1354XX
1355SQ   Sequence 2271 BP; 567 A; 552 C; 548 G; 604 T; 0 other;
1356     gatccgttaa ctacgaaaat aggcaactta ttcttaaggg gcaagattaa tttatgtttt        60
1357     cccgtcacca acgacaaaat ttgcgaggct ctttccgaaa atagggttga tctttgttgt       120
1358     cactggatgt actgtacatc catacagtaa ctcacagggg ctggattgat tatgtacact       180
1359     tcaggctatg cacatcgttc ttcgtcgttc tcatccgcag caagtaaaat tgcgcgtgtc       240
1360     tctacggaaa acactacagc cgggcttatc agtgaagttg tctatcgcga agatcagccc       300
1361     atgatgacgc aacttctact gttgccattg ttacagcaac tcggtcagca atcgcgctgg       360
1362     caactctggt taacaccgca acaaaaactg agtcgggaat gggttcaggc atctgggcta       420
1363     cccttaacga aagtaatgca gattagccag ctctcccctt gccacactgt ggagtcaatg       480
1364     gttcgcgctt tacgcacggg caattacagt gtggtgatcg gttggttggc agatgatttg       540
1365     actgaagaag agcatgctga agttgttgat gcggcaaatg aaggtaacgc tatggggttt       600
1366     attatacatt ccggtaagcg catcctctca cgccacgaga caactttccg ggctaaaaat       660
1367     tcactctaat ttgtatcatt aagtaaattt aggattaatc ctggaacttt ttttgtcgcc       720
1368     cagccaatgc tttcagtcgt gactaatttc cttgcggagg cttgtctgag cggtttccgc       780
1369     gattctcttc tgtaaattgt cgctgacaaa aaagattaaa cataccttat acaagacttt       840
1370     tttttcatat gcctgacgga gttcacactt gtaagttttc aactacgttg tagactttac       900
1371     atcgccaagg gtgctcggca taagccgaag atatcggtag agttaatatt gagcagatcc       960
1372     cccggtgaag gatttaaccg tgttatctcg ttggagatat tcatggcgta ttttggatga      1020
1373     taacgaggcg caaaaaatga aaaagacagc tatcgcgatt gcagtggcac tggctggttt      1080
1374     cgctaccgta gcgcaggccg ctccgaaaga taacacctgg tacactggtg ctaaactggg      1140
1375     ctggtcccag taccatgata ctggtttcat caacaacaat ggcccgaccc atgaaaacca      1200
1376     actgggcgct ggtgcttttg gtggttacca ggttaacccg tatgttggct ttgaaatggg      1260
1377     ttacgactgg ttaggtcgta tgccgtacaa aggcagcgtt gaaaacggtg catacaaagc      1320
1378     tcagggcgtt caactgaccg ctaaactggg ttacccaatc actgacgacc tggacatcta      1380
1379     cactcgtctg ggtggcatgg tatggcgtgc agacactaaa tccaacgttt atggtaaaaa      1440
1380     ccacgacacc ggcgtttctc cggtcttcgc tggcggtgtt gagtacgcga tcactcctga      1500
1381     aatcgctacc cgtctggaat accagtggac gaacaacatc ggtgacgcac acaccatcgg      1560
1382     cactcgtccg gacaacggca tgctgagcct gggtgtttcc taccgtttcg gtcagggcga      1620
1383     ggcagctcca gtagttgctc cggctccagc tccggcaccg gaagtacaga ccaagcactt      1680
1384     cactctgaag tctgacgttc tgttcaactt caacaaagca accctgaaac cggaaggtca      1740
1385     ggctgctctg gatcagctgt acagccagct gagcaacttg gatccgaaag acggttccgt      1800
1386     agttgttctg ggttacaccg accgcatcgg ttctgacgct tacaaccagg gtctgtccga      1860
1387     gcgccgtgct cagtctgttg ttgattacct gatctccaaa ggtatcccgg cagacaagat      1920
1388     ctccgcacgt ggtatgggcg aatccaaccc ggttactggc aacacctgtg acaacgtgaa      1980
1389     acagcgtgct gcactgatcg actgcctggc tccggatcgt cgcgtagaga tcgaagttaa      2040
1390     aggtatcaaa gacgttgtaa ctcagccgca ggcttaagtt ctcgtctggt agaaaaacgc      2100
1391     tgctgcgggt ttttttttgc ctttagtaaa ttgaactgac tttcgtcagt tattccttac      2160
1392     ccagcaatgc ctgcagatcc tgcttcagag aagacatttt attcgcgtat ttctctttgt      2220
1393     tttccgcatc ttcaatcagc tgaacaatcg tttcagaaag cgttttaccg c               2271
1394//
1395ID   X77160; SV 1; linear; genomic DNA; STD; PRO; 1212 BP.
1396XX
1397AC   X77160;
1398XX
1399DT   13-APR-1994 (Rel. 39, Created)
1400DT   18-APR-2005 (Rel. 83, Last updated, Version 8)
1401XX
1402DE   Pseudomonas aeruginosa (PAC1) amiB gene.
1403XX
1404KW   amiB gene.
1405XX
1406OS   Pseudomonas aeruginosa
1407OC   Bacteria; Proteobacteria; Gammaproteobacteria; Pseudomonadales;
1408OC   Pseudomonadaceae; Pseudomonas.
1409XX
1410RN   [1]
1411RA   Wilson S.A., Wachira S.M., Drew R.E., Jones D., Pearl L.H.;
1412RT   "Identification of a putative ABC transporter in the Pseudomonas aeruginosa
1413RT   amidase operon";
1414RL   Unpublished.
1415XX
1416RN   [2]
1417RP   1-1212
1418RA   Wilson S.A.;
1419RT   ;
1420RL   Submitted (17-JAN-1994) to the INSDC.
1421RL   S.A. Wilson, University College London, Dept of Biochemistry, Gower Street,
1422RL   London WC1E 6BT, UK
1423XX
1424RN   [3]
1425RP   1-1212
1426RX   DOI; 10.1074/jbc.270.32.18818.
1427RX   PUBMED; 7642533.
1428RA   Wilson S.A., Williams R.J., Pearl L.H., Drew R.E.;
1429RT   "Identification of two new genes in the Pseudomonas aeruginosa amidase
1430RT   operon, encoding an ATPase (AmiB) and a putative integral membrane protein
1431RT   (AmiS)";
1432RL   J Biol Chem 270(32):18818-18824(1995).
1433XX
1434DR   StrainInfo; 345027; 0.
1435XX
1436FH   Key             Location/Qualifiers
1437FH
1438FT   source          1..1212
1439FT                   /organism="Pseudomonas aeruginosa"
1440FT                   /strain="PAC1"
1441FT                   /mol_type="genomic DNA"
1442FT                   /clone="plasmid pAS20"
1443FT                   /db_xref="taxon:287"
1444FT   CDS             97..1212
1445FT                   /transl_table=11
1446FT                   /gene="amiB"
1447FT                   /db_xref="GOA:Q51416"
1448FT                   /db_xref="InterPro:IPR001270"
1449FT                   /db_xref="InterPro:IPR003593"
1450FT                   /db_xref="InterPro:IPR013093"
1451FT                   /db_xref="InterPro:IPR019489"
1452FT                   /db_xref="UniProtKB/Swiss-Prot:Q51416"
1453FT                   /protein_id="CAA54405.1"
1454FT                   /translation="MPFLSDMLDQSRRQQDEEQALARENLAEASLLQAHLSHRSALHSR
1455FT                   FRFDPAAVMDCLRAEVLGQEPALQAVEDMLKVVRADIADPRRPLFSALFLGPTGVGKTE
1456FT                   IVRALARALHGDAEGFCRVDMNTLSQEHYAAALTGAPPGYVGAKEGTTLLEQDKLDGSP
1457FT                   GRPGIVLFDELEKASPEVVHALLNVLDNGLLRVASGERTYHFRNTLVFMTSNLCAHEIQ
1458FT                   RYDERRQRLPWRLLPVGGERRRRDIDGMVRARLLKTFSPEFVNRLDSVVTFNWIERDVV
1459FT                   ARLVELEVQRLNRRLEKHRCRLEATPEVLAKIARAGFDRQFGARALRRSVRHHLEVPLA
1460FT                   EHLLDHHQPGDGNCTIYLASLEHERVRFVRR"
1461XX
1462SQ   Sequence 1212 BP; 193 A; 426 C; 403 G; 190 T; 0 other;
1463     gaaggaagcc tgacggcaga cgccgccagc ccggcgtgcc gtcgtgcggc acgccgtctc        60
1464     cgccatttcc cccctgtggc agaaggagtt tcatccatgc cttttctgag cgacatgctc       120
1465     gaccagtccc gccggcagca ggacgaggaa caggccctgg cgcgggagaa tcttgccgag       180
1466     gcaagtctgc tccaggccca cctgagtcac cgcagcgccc tgcacagccg tttccgtttc       240
1467     gacccggcgg cggtgatgga ctgcctgcgc gccgaggtgc tcggccagga accggcgcta       300
1468     caggccgtcg aggacatgct caaggtggtt cgcgcggaca tcgccgaccc gcgccgtccg       360
1469     ctgttcagcg cgctgttcct cggccccacc ggagtcggca agaccgagat cgtgcgcgcc       420
1470     ctggccaggg ccctgcacgg cgacgccgag gggttctgcc gggtggacat gaacaccctg       480
1471     tcccaggagc actatgccgc cgccctcacc ggtgcgccgc cgggctacgt cggggcgaag       540
1472     gagggcacca ccctgttgga gcaggacaag ctggacggca gtcccgggcg ccccggcatc       600
1473     gttctcttcg acgaactgga aaaggccagc ccggaagtgg tccatgcgtt gctcaacgta       660
1474     ctcgacaacg gcctgctacg ggtcgcttcc ggcgaacgca cctaccattt ccgcaacacc       720
1475     ctggtgttca tgaccagcaa tctctgcgcc catgagatcc agcgctacga cgagcgtcgc       780
1476     cagcgcctgc cctggcgcct gctgccggtc ggcggcgagc gccggcggcg ggacatcgac       840
1477     gggatggtcc gggcccggct gctgaagacc ttctcgccgg agttcgtcaa tcgtctcgat       900
1478     agcgtggtca ccttcaactg gatcgaacgc gacgtcgtcg cgcgcctggt cgagctggag       960
1479     gtgcagcggc tcaaccggcg cctggagaag catcgctgcc gcctggaggc gaccccggag      1020
1480     gtgctggcga agatcgcccg cgccggcttc gaccggcagt tcggcgcccg tgcgttgcgc      1080
1481     cgcagcgtcc gtcatcatct cgaggtaccg ctggccgagc atctgctcga tcaccaccag      1140
1482     ccgggcgacg ggaactgcac gatctacctg gcgagcctgg agcacgagcg ggttcgcttc      1200
1483     gtacggcgct ga                                                          1212
1484//
1485ID   M27612; SV 1; linear; genomic DNA; STD; PRO; 1065 BP.
1486XX
1487AC   M27612;
1488XX
1489DT   02-FEB-1990 (Rel. 22, Created)
1490DT   22-APR-2002 (Rel. 71, Last updated, Version 4)
1491XX
1492DE   Pseudomonas aeruginosa aliphatic amidase (amiE) gene, complete cds.
1493XX
1494KW   .
1495XX
1496OS   Pseudomonas aeruginosa
1497OC   Bacteria; Proteobacteria; Gammaproteobacteria; Pseudomonadales;
1498OC   Pseudomonadaceae; Pseudomonas.
1499XX
1500RN   [1]
1501RP   1-1065
1502RX   DOI; 10.1016/0014-5793(87)80164-3.
1503RX   PUBMED; 3108030.
1504RA   Brammar W.J., Charles I.G., Matfield M., Liu C.P., Drew R.E., Clarke P.H.;
1505RT   "The nucleotide sequence of the amiE gene of Pseudomonas aeruginosa";
1506RL   FEBS Lett. 215(2):291-294(1987).
1507XX
1508FH   Key             Location/Qualifiers
1509FH
1510FT   source          1..1065
1511FT                   /organism="Pseudomonas aeruginosa"
1512FT                   /strain="PAC433"
1513FT                   /mol_type="genomic DNA"
1514FT                   /db_xref="taxon:287"
1515FT   CDS             25..1065
1516FT                   /codon_start=1
1517FT                   /transl_table=11
1518FT                   /gene="amiE"
1519FT                   /product="aliphatic amidase"
1520FT                   /EC_number="3.5.1.4"
1521FT                   /db_xref="GOA:P11436"
1522FT                   /db_xref="InterPro:IPR003010"
1523FT                   /db_xref="InterPro:IPR023719"
1524FT                   /db_xref="PDB:1K17"
1525FT                   /db_xref="PDB:2UXY"
1526FT                   /db_xref="UniProtKB/Swiss-Prot:P11436"
1527FT                   /protein_id="AAA25697.1"
1528FT                   /translation="MRHGDISSSNDTVGVAVVNYKMPRLHTAAEVLDNARKIADMIVGM
1529FT                   KQGLPGMDLVVFPEYSLQGIMYDPAEMMETAVAIPGEETEIFSRACRKANVWGVFSLTG
1530FT                   ERHEEHPRKAPYNTLVLIDNNGEIVQKYRKIIPWCPIEGWYPGGQTYVSEGPKGMKISL
1531FT                   IICDDPNYPEIWRDCAMKGAELIVRCQGYMYPAKDQQVMMAKAMAWANNCYVAVANAAG
1532FT                   FDGVYSYFGHSAIIGFDGRTLGECGEEEMGIQYAQLSLSQIRDARANDQSQNHLFKILH
1533FT                   RGYSGLQASGDGDRGLAECPFEFYRTWVTDAEKARDNVERLTRSTTGVAQCPVGRLPYE
1534FT                   GLEKEA"
1535XX
1536SQ   Sequence 1065 BP; 220 A; 337 C; 343 G; 165 T; 0 other;
1537     aaataacaac aggaggtgat acccatgcgt cacggcgata tttccagcag caacgacacc        60
1538     gtcggagtgg ccgtggtcaa ctacaagatg ccgcgcctgc acaccgcggc ggaggtcctg       120
1539     gacaacgccc ggaagatcgc cgacatgatc gtcggcatga agcagggcct gcccggcatg       180
1540     gacctggtgg tgttcccgga gtacagcctg cagggcatca tgtacgatcc ggcggagatg       240
1541     atggaaaccg cggtggcgat ccccggcgag gaaaccgaga tattctcccg cgcctgccgc       300
1542     aaggccaacg tctggggcgt attctccctc accggcgaac ggcacgagga gcatccgcgc       360
1543     aaggcgccgt acaacaccct ggtgctgatc gacaacaacg gcgagatcgt ccagaagtac       420
1544     cgcaagatca ttccctggtg ccccatcgag ggctggtatc ccggtggcca gacctacgtc       480
1545     agcgaagggc cgaagggcat gaagatcagc ctgatcatct gcgacgaccc caattacccg       540
1546     gagatctggc gcgactgcgc gatgaagggc gccgagctga tcgtgcgctg ccagggctac       600
1547     atgtacccgg ccaaggacca gcaggtgatg atggccaagg ccatggcctg ggccaacaac       660
1548     tgctatgtgg cggtggccaa cgcggccggc ttcgacggtg tctattccta cttcggccac       720
1549     tcggcgatca tcggcttcga cggccgtacc ctcggtgagt gcggcgagga ggaaatgggt       780
1550     atccagtacg cccagctgtc cctttcgcag atccgcgatg cgcgcgccaa cgatcagtcg       840
1551     cagaaccacc tgttcaagat cctccaccgc ggctacagcg gcttgcaggc gtccggcgac       900
1552     ggcgaccggg gcctggcgga gtgtccgttc gagttctacc gcacctgggt caccgacgcc       960
1553     gagaaggcgc gcgacaatgt cgagcgactg acccgctcga ccaccggcgt ggcgcaatgc      1020
1554     ccggtcggcc ggctgcccta tgagggactg gagaaggaag cctga                      1065
1555//
1556ID   X13776; SV 1; linear; genomic DNA; STD; PRO; 2167 BP.
1557XX
1558AC   X13776; M43175;
1559XX
1560DT   19-APR-1989 (Rel. 19, Created)
1561DT   14-NOV-2006 (Rel. 89, Last updated, Version 24)
1562XX
1563DE   Pseudomonas aeruginosa amiC and amiR gene for aliphatic amidase regulation
1564XX
1565KW   aliphatic amidase regulator; amiC gene; amiR gene.
1566XX
1567OS   Pseudomonas aeruginosa
1568OC   Bacteria; Proteobacteria; Gammaproteobacteria; Pseudomonadales;
1569OC   Pseudomonadaceae; Pseudomonas.
1570XX
1571RN   [1]
1572RP   1167-2167
1573RA   Rice P.M.;
1574RT   ;
1575RL   Submitted (16-DEC-1988) to the INSDC.
1576RL   Rice P.M., EMBL, Postfach 10-2209, Meyerhofstrasse 1, 6900 Heidelberg, FRG.
1577XX
1578RN   [2]
1579RP   1167-2167
1580RX   DOI; 10.1016/0014-5793(89)80249-2.
1581RX   PUBMED; 2495988.
1582RA   Lowe N., Rice P.M., Drew R.E.;
1583RT   "Nucleotide sequence of the aliphatic amidase regulator gene (amiR) of
1584RT   Pseudomonas aeruginosa";
1585RL   FEBS Lett. 246(1-2):39-43(1989).
1586XX
1587RN   [3]
1588RP   1-1292
1589RX   PUBMED; 1907262.
1590RA   Wilson S., Drew R.;
1591RT   "Cloning and DNA sequence of amiC, a new gene regulating expression of the
1592RT   Pseudomonas aeruginosa aliphatic amidase, and purification of the amiC
1593RT   product";
1594RL   J. Bacteriol. 173(16):4914-4921(1991).
1595XX
1596RN   [4]
1597RP   1-2167
1598RA   Rice P.M.;
1599RT   ;
1600RL   Submitted (04-SEP-1991) to the INSDC.
1601RL   Rice P.M., EMBL, Postfach 10-2209, Meyerhofstrasse 1, 6900 Heidelberg, FRG.
1602XX
1603DR   GOA; Q51417.
1604DR   InterPro; IPR003211; AmiSUreI_transpt.
1605DR   UniProtKB/Swiss-Prot; Q51417; AMIS_PSEAE.
1606XX
1607CC   Data kindly reviewed (04-SEP-1991) by Rice P. M.
1608XX
1609FH   Key             Location/Qualifiers
1610FH
1611FT   source          1..2167
1612FT                   /organism="Pseudomonas aeruginosa"
1613FT                   /map="38 min"
1614FT                   /strain="PAC"
1615FT                   /isolate="PAC 1"
1616FT                   /mol_type="genomic DNA"
1617FT                   /db_xref="taxon:287"
1618FT   CDS             1289..1879
1619FT                   /transl_table=11
1620FT                   /gene="amiR"
1621FT                   /note="aliphatic amidase regulator, positive  regulator of
1622FT                   amiE"
1623FT                   /db_xref="GOA:P10932"
1624FT                   /db_xref="InterPro:IPR005561"
1625FT                   /db_xref="InterPro:IPR008327"
1626FT                   /db_xref="InterPro:IPR011006"
1627FT                   /db_xref="InterPro:IPR011991"
1628FT                   /db_xref="PDB:1QO0"
1629FT                   /db_xref="UniProtKB/Swiss-Prot:P10932"
1630FT                   /protein_id="CAA32023.1"
1631FT                   /translation="MSANSLLGSLRELQVLVLNPPGEVSDALVLQLIRIGCSVRQCWPP
1632FT                   PEAFDVPVDVVFTSIFQNGHHDEIAALLAAGTPRTTLVALVEYESPAVLSQIIELECHG
1633FT                   VITQPLDAHRVLPVLVSARRISEEMAKLKQKTEQLQDRIAGQARINQAKVLLMQRHGWD
1634FT                   EREAHQHLSREAMKRREPILKIAQELLGNEPSA"
1635FT   CDS             135..1292
1636FT                   /transl_table=11
1637FT                   /gene="amiC"
1638FT                   /note="negative regulator of amiR"
1639FT                   /db_xref="GOA:P27017"
1640FT                   /db_xref="InterPro:IPR000709"
1641FT                   /db_xref="PDB:1PEA"
1642FT                   /db_xref="PDB:1QNL"
1643FT                   /db_xref="PDB:1QO0"
1644FT                   /db_xref="UniProtKB/Swiss-Prot:P27017"
1645FT                   /protein_id="CAA32024.1"
1646FT                   /translation="MGSHQERPLIGLLFSETGVTADIERSHAYGALLAVEQLNREGGVG
1647FT                   GRPIETLSQDPGGDPDRYRLCAEDFIRNRGVRFLVGCYMSHTRKAVMPVVERADALLCY
1648FT                   PTPYEGFEYSPNIVYGGPAPNQNSAPLAAYLIRHYGERVVFIGSDYIYPRESNHVMRHL
1649FT                   YRQHGGTVLEEIYIPLYPSDDDLQRAVERIYQARADVVFSTVVGTGTAELYRAIARRYG
1650FT                   DGRRPPIASLTTSEAEVAKMESDVAEGQVVVAPYFSSIDTPASRAFVQACHGFFPENAT
1651FT                   ITAWAEAAYWQTLLLGRAAQAAGNWRVEDVQRHLYDIDIDAPQGPVRVERQNNHSRLSS
1652FT                   RIAEIDARGVFQVRWQSPEPIRPDPYVVVHNLDDWSASMGGGPLP"
1653FT   promoter        8..24
1654FT                   /note="proposed rpoN-dependent promoter"
1655FT   promoter        65..81
1656FT                   /note="proposed rpoN-dependent promoter"
1657FT   RBS             121..126
1658FT                   /note="proposed Shine-Dalgarno sequence"
1659FT   variation       912..1167
1660FT                   /gene="amiC"
1661FT                   /replace=""
1662FT                   /note="ClaI fragment deleted in pSW36,  constitutive
1663FT                   phenotype"
1664FT   misc_feature    1
1665FT                   /note="last base of an XhoI site"
1666FT   misc_feature    648..653
1667FT                   /note="end of 658bp XhoI fragment, deletion in  pSW3 causes
1668FT                   constitutive expression of amiE"
1669FT   misc_difference 1281
1670FT                   /replace="g"
1671FT                   /note="conflict"
1672FT                   /citation=[3]
1673XX
1674SQ   Sequence 2167 BP; 363 A; 712 C; 730 G; 362 T; 0 other;
1675     ggtaccgctg gccgagcatc tgctcgatca ccaccagccg ggcgacggga actgcacgat        60
1676     ctacctggcg agcctggagc acgagcgggt tcgcttcgta cggcgctgag cgacagtcac       120
1677     aggagaggaa acggatggga tcgcaccagg agcggccgct gatcggcctg ctgttctccg       180
1678     aaaccggcgt caccgccgat atcgagcgct cgcacgcgta tggcgcattg ctcgcggtcg       240
1679     agcaactgaa ccgcgagggc ggcgtcggcg gtcgcccgat cgaaacgctg tcccaggacc       300
1680     ccggcggcga cccggaccgc tatcggctgt gcgccgagga cttcattcgc aaccgggggg       360
1681     tacggttcct cgtgggctgc tacatgtcgc acacgcgcaa ggcggtgatg ccggtggtcg       420
1682     agcgcgccga cgcgctgctc tgctacccga ccccctacga gggcttcgag tattcgccga       480
1683     acatcgtcta cggcggtccg gcgccgaacc agaacagtgc gccgctggcg gcgtacctga       540
1684     ttcgccacta cggcgagcgg gtggtgttca tcggctcgga ctacatctat ccgcgggaaa       600
1685     gcaaccatgt gatgcgccac ctgtatcgcc agcacggcgg cacggtgctc gaggaaatct       660
1686     acattccgct gtatccctcc gacgacgact tgcagcgcgc cgtcgagcgc atctaccagg       720
1687     cgcgcgccga cgtggtcttc tccaccgtgg tgggcaccgg caccgccgag ctgtatcgcg       780
1688     ccatcgcccg tcgctacggc gacggcaggc ggccgccgat cgccagcctg accaccagcg       840
1689     aggcggaggt ggcgaagatg gagagtgacg tggcagaggg gcaggtggtg gtcgcgcctt       900
1690     acttctccag catcgatacg cccgccagcc gggccttcgt ccaggcctgc catggtttct       960
1691     tcccggagaa cgcgaccatc accgcctggg ccgaggcggc ctactggcag accttgttgc      1020
1692     tcggccgcgc cgcgcaggcc gcaggcaact ggcgggtgga agacgtgcag cggcacctgt      1080
1693     acgacatcga catcgacgcg ccacaggggc cggtccgggt ggagcgccag aacaaccaca      1140
1694     gccgcctgtc ttcgcgcatc gcggaaatcg atgcgcgcgg cgtgttccag gtccgctggc      1200
1695     agtcgcccga accgattcgc cccgaccctt atgtcgtcgt gcataacctc gacgactggt      1260
1696     ccgccagcat gggcggggga ccgctcccat gagcgccaac tcgctgctcg gcagcctgcg      1320
1697     cgagttgcag gtgctggtcc tcaacccgcc gggggaggtc agcgacgccc tggtcttgca      1380
1698     gctgatccgc atcggttgtt cggtgcgcca gtgctggccg ccgccggaag ccttcgacgt      1440
1699     gccggtggac gtggtcttca ccagcatttt ccagaatggc caccacgacg agatcgctgc      1500
1700     gctgctcgcc gccgggactc cgcgcactac cctggtggcg ctggtggagt acgaaagccc      1560
1701     cgcggtgctc tcgcagatca tcgagctgga gtgccacggc gtgatcaccc agccgctcga      1620
1702     tgcccaccgg gtgctgcctg tgctggtatc ggcgcggcgc atcagcgagg aaatggcgaa      1680
1703     gctgaagcag aagaccgagc agctccagga ccgcatcgcc ggccaggccc ggatcaacca      1740
1704     ggccaaggtg ttgctgatgc agcgccatgg ctgggacgag cgcgaggcgc accagcacct      1800
1705     gtcgcgggaa gcgatgaagc ggcgcgagcc gatcctgaag atcgctcagg agttgctggg      1860
1706     aaacgagccg tccgcctgag cgatccgggc cgaccagaac aataacaaga ggggtatcgt      1920
1707     catcatgctg ggactggttc tgctgtacgt tggcgcggtg ctgtttctca atgccgtctg      1980
1708     gttgctgggc aagatcagcg gtcgggaggt ggcggtgatc aacttcctgg tcggcgtgct      2040
1709     gagcgcctgc gtcgcgttct acctgatctt ttccgcagca gccgggcagg gctcgctgaa      2100
1710     ggccggagcg ctgaccctgc tattcgcttt tacctatctg tgggtggccg ccaaccagtt      2160
1711     cctcgag                                                                2167
1712//
1713ID   X77161; SV 1; linear; genomic DNA; STD; PRO; 1130 BP.
1714XX
1715AC   X77161;
1716XX
1717DT   13-APR-1994 (Rel. 39, Created)
1718DT   31-JUL-2003 (Rel. 76, Last updated, Version 7)
1719XX
1720DE   Pseudomonas aeruginosa (PAC1) amiS gene.
1721XX
1722KW   amiS gene.
1723XX
1724OS   Pseudomonas aeruginosa
1725OC   Bacteria; Proteobacteria; Gammaproteobacteria; Pseudomonadales;
1726OC   Pseudomonadaceae; Pseudomonas.
1727XX
1728RN   [1]
1729RA   Wilson S.A., Wachira S.M., Drew R.E., Jones D., Pearl L.H.;
1730RT   "Identification of a putative ABC transporter in the Pseudomonas aeruginosa
1731RT   amidase operon";
1732RL   Unpublished.
1733XX
1734RN   [2]
1735RP   1-1130
1736RA   Wilson S.A.;
1737RT   ;
1738RL   Submitted (17-JAN-1994) to the INSDC.
1739RL   S.A. Wilson, University College London, Dept of Biochemistry, Gower Street,
1740RL   London WC1E 6BT, UK
1741XX
1742RN   [3]
1743RP   1-1130
1744RX   DOI; 10.1074/jbc.270.32.18818.
1745RX   PUBMED; 7642533.
1746RA   Wilson S.A., Williams R.J., Pearl L.H., Drew R.E.;
1747RT   "Identification of two new genes in the Pseudomonas aeruginosa amidase
1748RT   operon, encoding an ATPase (AmiB) and a putative integral membrane protein
1749RT   (AmiS)";
1750RL   J Biol Chem 270(32):18818-18824(1995).
1751XX
1752DR   StrainInfo; 345027; 0.
1753XX
1754FH   Key             Location/Qualifiers
1755FH
1756FT   source          1..1130
1757FT                   /organism="Pseudomonas aeruginosa"
1758FT                   /strain="PAC1"
1759FT                   /mol_type="genomic DNA"
1760FT                   /clone="plasmid pAS20"
1761FT                   /db_xref="taxon:287"
1762FT   CDS             61..576
1763FT                   /transl_table=11
1764FT                   /gene="amiS"
1765FT                   /db_xref="GOA:Q51417"
1766FT                   /db_xref="InterPro:IPR003211"
1767FT                   /db_xref="UniProtKB/Swiss-Prot:Q51417"
1768FT                   /protein_id="CAA54406.1"
1769FT                   /translation="MLGLVLLYVGAVLFLNAVWLLGKISGREVAVINFLVGVLSACVAF
1770FT                   YLIFSAAAGQGSLKAGALTLLFAFTYLWVAANQFLEVDGKGLGWFCLFVSLTACTVAIE
1771FT                   SFAGASGPFGLWNAVNWTVWALLWFCFFLLLGLSRGIQKPVAYLTLASAIFTAWLPGLL
1772FT                   LLGQVLKA"
1773XX
1774SQ   Sequence 1130 BP; 167 A; 335 C; 377 G; 251 T; 0 other;
1775     gagccgtccg cctgagcgat ccgggccgac cagaacaata acaagagggg tatcgtcatc        60
1776     atgctgggac tggttctgct gtacgttggc gcggtgctgt ttctcaatgc cgtctggttg       120
1777     ctgggcaaga tcagcggtcg ggaggtggcg gtgatcaact tcctggtcgg cgtgctgagc       180
1778     gcctgcgtcg cgttctacct gatcttttcc gcagcagccg ggcagggctc gctgaaggcc       240
1779     ggagcgctga ccctgctatt cgcttttacc tatctgtggg tggccgccaa ccagttcctc       300
1780     gaggtggacg gcaagggcct cggctggttc tgcctgttcg tcagcctcac cgcctgcacc       360
1781     gtggcgatcg agtcgttcgc cggcgccagt ggtccgttcg gcctgtggaa cgcggtcaac       420
1782     tggacagtct gggcgttgct ctggttctgt ttcttcctgc tgctggggct gtcccgcggc       480
1783     atccagaagc cggtggccta cctgaccctg gccagcgcca tattcaccgc ctggttgccc       540
1784     ggcctgctgc tgctcggaca ggtgctcaag gcatagcagg aagtcggaaa gggatgacgg       600
1785     cttgccgcca tcccgtccct tccgaacgcc tagccgagcg gccagttgat caccacgacg       660
1786     gcgtcgttgt agtcgttgtc ggtgccgtct tcagagccga ccagggcgaa gttcagctcg       720
1787     ttggtcagga ttacctgtgc cgagaccaga tccgaggggc ggccgttgac gctgacctgg       780
1788     acctgtacct tgccactgct gccggagttg agcacctggg tgccgatgac ggcgttattg       840
1789     gtgctttgcc cgctgaaggt cgcggccgtg ctcgttgttg accagcacgt tcaccgtctg       900
1790     ggttccggac gagttggcga aggcggtgac gccggaacct ggttgttggc gggaagggtg       960
1791     aacactcctt gtggttgcca tggtggtatc tccactgaat acctggcccc ttccttttca      1020
1792     ggcagccgtc tggcgcgcgg tatggcgtgt cgggagaaat ccgcagtcct tggcggcagg      1080
1793     cgatgcgcag gcaggaagga cgcatcgttc agccaatcta cgccgtcgac                 1130
1794//
1795