spacer
spacer

EBI Dbfetch

ID   U89712; SV 1; linear; genomic DNA; STD; PRO; 6040 BP.
XX
AC   U89712;
XX
DT   26-MAR-1997 (Rel. 51, Created)
DT   18-APR-2005 (Rel. 83, Last updated, Version 4)
XX
DE   Rhodococcus globerulus hpp operon, 3-(3-hydroxyphenyl) propionate
DE   hydroxylase (hppA), 2-hydroxy-6-ketonona-2,4-dienoate hydrolase (hppC),
DE   2,3-dihydroxyphenylpropionate 1,2-dioxygenase (hppB), putative
DE   3-(3-hydroxyphenyl) propionate transport protein (hppK) and putative
DE   regulatory protein (hppR) genes, complete cds.
XX
KW   .
XX
OS   Rhodococcus globerulus
OC   Bacteria; Actinobacteria; Actinobacteridae; Actinomycetales;
OC   Corynebacterineae; Nocardiaceae; Rhodococcus.
XX
RN   [1]
RP   1-6040
RX   PUBMED; 9324265.
RA   Barnes M.R., Duetz W.A., Williams P.A.;
RT   "A 3-(3-hydroxyphenyl)propionic acid catabolic pathway in Rhodococcus
RT   globerulus PWD1: cloning and characterization of the hpp operon";
RL   J. Bacteriol. 179(19):6145-6153(1997).
XX
RN   [2]
RP   1-6040
RA   Williams P.A., Barnes M.R.;
RT   ;
RL   Submitted (14-FEB-1997) to the EMBL/GenBank/DDBJ databases.
RL   School of Biological Sciences, University of Wales, Bangor, Memorial
RL   Building, Deiniol Road, Bangor, Gwynedd LL57 2UW, United Kingdom
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..6040
FT                   /organism="Rhodococcus globerulus"
FT                   /strain="PWD1"
FT                   /mol_type="genomic DNA"
FT                   /note="NCIMB 13325; hpp operon"
FT                   /db_xref="taxon:33008"
FT   stem_loop       14..54
FT   gene            268..1587
FT                   /gene="hppA"
FT   CDS             268..1587
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="hppA"
FT                   /product="3-(3-hydroxyphenyl) propionate hydroxylase"
FT                   /note="HppA"
FT                   /db_xref="GOA:O05144"
FT                   /db_xref="HSSP:1FOH"
FT                   /db_xref="InterPro:IPR003042"
FT                   /db_xref="UniProtKB/TrEMBL:O05144"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT                   /protein_id="AAB81312.1"
FT                   /translation="MKTTQDTEVLIVGAGPAGLMLANILGMYGKQVTVLEAMDTLIDYP
FT                   RGVGLDDESFRTIQTVGLVDAIRPHTNPQHIMRLVNGAGKVMLVNNPQTVEFGWERKHG
FT                   FIQPEADKALYEGLSRFGNVQVLFGHRVENVEEDGQSVTAIALVSRPDGTIEERRFSAQ
FT                   YLVGCEGGKSPTRKRLGVSFEGESPSTRWLVVDVNNDPLGTPNVFLGADPKRPYVSIGL
FT                   PHAVRRWEFMLHDDETEEQVTDPDYVNALLADHVPNPAELDFIRRRVFTHHGRVASDFR
FT                   KGRQLIAGDAAHLMPVWMGQGWNSGMRDATNLGWKLAAVLSGQADDALLDTYTSERKDH
FT                   AQAMVDLSLTFGRLIKITNPVGAVLRDAASSVLNLFPQVKSYFADMRFKPMPRYTRGVL
FT                   ADPNTRESGSAAAKLTSKLIPVLTANVKNSPVGVQFRSRV"
FT   stem_loop       1653..1668
FT   stem_loop       1695..1705
FT   stem_loop       1933..1941
FT   stem_loop       1942..1953
FT   gene            2030..2896
FT                   /gene="hppC"
FT   CDS             2030..2896
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="hppC"
FT                   /product="2-hydroxy-6-ketonona-2,4-dienoate hydrolase"
FT                   /note="HppC"
FT                   /db_xref="GOA:O05145"
FT                   /db_xref="HSSP:1IUN"
FT                   /db_xref="InterPro:IPR000073"
FT                   /db_xref="UniProtKB/TrEMBL:O05145"
FT                   /experiment="experimental evidence, no additional details
FT                   recorded"
FT                   /protein_id="AAB81313.1"
FT                   /translation="MTTTEIPAYITDDFFGLEDKWIETADGELTHYHELGEGTPILFLH
FT                   GSGTGVTAAANWWLNLPVLSEQGRCIAIDSIGYGQSVVAPNTEYGIKEWVRHAVRVLDA
FT                   LGIEKTWIVGNSLGGWLAFQFAIDFPERLLGIVSMGTGGAKLTGALAGHSNPNLTEAGI
FT                   RKTLELFVVDKSLVTDELVSLRYQSALNDTASDRLAEVVAARDRDRTELPLDFDVLSRL
FT                   DVPVLLIHGVQDVVIPVSRTWELLNVIPNADVHIFSQCGHWSQVERAEEFNTVITQYLS
FT                   ARGVSRS"
FT   gene            2893..3837
FT                   /gene="hppB"
FT   CDS             2893..3837
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="hppB"
FT                   /product="2,3-dihydroxyphenylpropionate 1,2-dioxygenase"
FT                   /note="HppB"
FT                   /db_xref="GOA:O05146"
FT                   /db_xref="InterPro:IPR004183"
FT                   /db_xref="UniProtKB/Swiss-Prot:O05146"
FT                   /experiment="experimental evidence, no additional details
FT                   recorded"
FT                   /protein_id="AAB81314.1"
FT                   /translation="MKQALLCMSHSPLLHHLDPPADVKASVEAAFDQARAFVHNFDPDV
FT                   IVNFGPDHYNGFFYDLMPPFCIGYKAKGSGDYDSFAGELNVPEAMAEDLAQFVMDQGLD
FT                   IAISRQMEVDHGAVQPMEIIYGDVASKPLIPVFVNSVARPFVKVARVRKFGEAVGAYFK
FT                   NSDKKVLFIGSGGLSHDPPVPQIATADEAQRKMLTDGRNPTPQARAARQQRVIDTAVKF
FT                   AADEADIMDLNPEWDRGFLDVCASGRIEDFDRYTADDMDAVAGHSSHEVRNWVAAYSAL
FT                   RACGEYEIAYEFYRPIKEYISGFAVTTAILRDI"
FT   stem_loop       3851..3862
FT   gene            3888..5249
FT                   /gene="hppK"
FT   CDS             3888..5249
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="hppK"
FT                   /product="putative 3-(3-hydroxyphenyl) propionate transport
FT                   protein"
FT                   /note="contains sugar transport proteins signature 2
FT                   (PROSITE  PS00217); HppK"
FT                   /db_xref="GOA:O05147"
FT                   /db_xref="InterPro:IPR011701"
FT                   /db_xref="UniProtKB/TrEMBL:O05147"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT                   /protein_id="AAB81315.1"
FT                   /translation="MDVREAIRTQPMRRYQISTIAICLILSMIDGFEILVMAFVAPHLG
FT                   KSWDISSVEIGYLLSAGIIGTALGAIFISPLADKIGRRRLAIWCLVGITVGMALSACAV
FT                   NVPQLIAFRAFAGLGIGGLVANLNVLVSEFSSDKRRGTALGIYGVGYPLGGAVGGAISG
FT                   VLISVFDWRSAFIFGTIITAIMLVVVIKTLPESIEFLIEKRPVGALERYNEIADRLGYE
FT                   QSSELPVPIRKTERVVRDGLFKGIMLRRTVFLWLGYSCLIASFYFANTWTPKLLSDATG
FT                   DSNMGVTAGVLVNVGGVIGSIIFAGLSIVLRPRVVTVLLMFGGVFAFIGYASGFHIVAL
FT                   ALTLAVLVGIFANGGITGFYAISPPIYPAAARGTGVGWMIGCGRTVSIIAPILTGYLLD
FT                   GGWTPKSVYMMFGGVLVIAGIATLLLDATYRGRSENPETPEARREEDLAAAATA"
FT   misc_feature    3930..4016
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 1"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    4044..4121
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 2"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    4131..4202
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 3"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    4203..4256
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 4"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    4302..4376
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 5"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    4392..4469
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 6"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    4626..4709
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 7"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    4752..4820
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 8"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    4830..4895
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 9"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    4902..4970
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 10"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    5028..5114
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 11"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   misc_feature    5112..5174
FT                   /gene="hppK"
FT                   /note="Region: Transmembrane region 12"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT   gene            5252..5872
FT                   /gene="hppR"
FT   CDS             5252..5872
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="hppR"
FT                   /product="putative regulatory protein"
FT                   /note="similar to IclR type regulators; HppR"
FT                   /db_xref="GOA:O05148"
FT                   /db_xref="InterPro:IPR014757"
FT                   /db_xref="UniProtKB/TrEMBL:O05148"
FT                   /inference="non-experimental evidence, no additional
FT                   details recorded"
FT                   /protein_id="AAB81316.1"
FT                   /translation="MCRSGVKPRENRVKGVASESNGSSGKQPGSQTLARGLQALELVAT
FT                   TPDGMTIQEVADALGVHRTIASRLLTTVADFRLIKRGADGKYRAGGGLAALARDLYAGL
FT                   RDEATPLLRRLANSLGASVALFVAEGSEAVAVAVVEPKNARYWVSFREGGRHPIDRGAA
FT                   GYALLAGQPPVPGESSRVTDARRDGYVVSYGEVEPGYWGLGYR"
XX
SQ   Sequence 6040 BP; 1122 A; 1799 C; 1862 G; 1257 T; 0 other;
     agaggatctg cgcaatggcc gcgccggagg tgaacaacct ccggcgcggc cattttgtgt        60
     ctcgggcaca tggagaaggc cggcaaacca tgctctagct gcagttttga tgccgcgcca       120
     ttctgtctga gcgatcccat cgggcaccaa atgcggcccc ggtcacaaaa gctcattgac       180
     gtaccccgct tcgtggtttc taatagacgc atcgtgcata tagtgtgcta aggcacgcga       240
     tagttgcatt agcgcagata ggaagccatg aaaaccactc aggacaccga agtactcatc       300
     gtcggcgccg gtcccgccgg cctgatgttg gcgaacatcc tcggcatgta cggcaagcag       360
     gtcaccgtgc tcgaggccat ggatacgctg atcgactacc cgcgtggtgt gggactcgac       420
     gacgagtcgt tccgcaccat tcagacggtg ggcctggtgg atgcgatccg tccgcacaca       480
     aatccgcagc acatcatgcg tctggtcaac ggtgccggaa aggtcatgct ggtcaacaac       540
     ccgcagaccg tggaattcgg ctgggaacgt aagcacggct tcatccagcc ggaagccgac       600
     aaggcgctgt atgagggact gtcccggttc gggaacgttc aggtgttgtt cggtcatcgc       660
     gtcgagaacg tcgaagaaga tggccagtcg gttaccgcta tcgcgttggt ttctcgcccc       720
     gacggaacca tcgaagaacg gcgattcagt gcgcagtacc tggtggggtg tgaaggtggt       780
     aagtctccga cccgcaagcg tctcggtgtc agcttcgagg gtgaatcacc ttctacacgt       840
     tggcttgtcg tggacgtcaa caacgatccg ctgggaaccc ccaacgtgtt cctgggtgcc       900
     gatccgaagc gtccgtacgt gtccatcggt ctgccccacg cggttcggcg ctgggaattc       960
     atgctgcacg acgacgaaac cgaagagcag gtcacggacc ccgactacgt gaatgctctt      1020
     ctggcagatc atgttcccaa cccggcggaa ctcgatttca ttcgacgacg cgtcttcacc      1080
     catcacggcc gcgtcgcttc cgacttccgc aagggccgcc aattgatcgc gggcgacgcc      1140
     gcgcacctga tgccggtgtg gatgggtcag ggctggaatt cgggtatgcg cgacgcaacc      1200
     aatcttgggt ggaagttggc cgccgtactt tccggtcagg cggacgacgc actgctcgat      1260
     acctatacgt cggagcgcaa ggatcacgcc caggcaatgg tggatctgtc gctgacgttc      1320
     ggacggctca tcaagatcac caatccggtc ggtgctgtac tccgcgacgc tgcgtcgtcg      1380
     gtgctcaatc tcttccctca ggtcaagagc tacttcgcgg acatgcgctt caagccgatg      1440
     ccgcgctaca ccaggggagt gctggccgac ccgaacactc gggaatcggg aagtgcagca      1500
     gcgaaactca cgagcaagct catcccggtg ctgaccgcca acgtcaagaa ctcaccggtt      1560
     ggcgtccagt tccgcagccg cgtgtgaact cgcgggatgc gtcggaccaa ctgctcgacg      1620
     acgcgatcgg caactggtgg tcggtaatcg tgtggggcaa cagccccaag gacgtgctcc      1680
     cacaggattc gctcgacaag ttgtctctac tcggtgcccg ccttgttgcg gtagttccgg      1740
     agacccagcg cgaatgggct cagaagcaca tggatccgga cgttatggtc ctcggcgatc      1800
     acaccggccg actcaagaag tggttcgacg accgtcccac tcccttggtc ttccttcgcc      1860
     cggaccgttt tgttgccggc gcctgcctga cgcagcatgc cccggcgacg ttggacgcga      1920
     tcctggccgc aatgaagttc acgccggccg gcgctgtcgc ggacgcagtc gcagtgccgg      1980
     tcgcgctcta accatccgcc acacacactc ttacgagaaa gccagatata tgactacaac      2040
     cgagattccc gcgtacatca ccgacgattt cttcggcctc gaagacaagt ggatcgagac      2100
     cgcagacggt gaactcaccc actaccacga actgggcgaa ggtaccccga tcctgttcct      2160
     gcacggttcg ggcaccggcg tcaccgccgc cgccaactgg tggctcaatc ttccggttct      2220
     cagcgagcag ggtcgatgca tcgcaatcga ttccatcggc tacgggcaga gcgttgttgc      2280
     tccgaacacc gagtacggca tcaaggaatg ggttcgccac gcggtgcgcg ttctcgacgc      2340
     cctcggcatc gagaagacgt ggattgtcgg aaactccctc ggtggttggc ttgcattcca      2400
     gtttgccatc gatttcccgg aacgccttct ggggatcgtc tcgatgggca cgggcggcgc      2460
     aaagttgacg ggcgccctgg ccggtcactc caacccgaac ctgactgaag ccggcattcg      2520
     caagaccctc gaactctttg ttgtcgacaa gtcgcttgtc actgacgaat tggtgtccct      2580
     gcgctaccaa tccgcgctca acgatacggc ctcggatcgc ctcgccgagg tggtcgcagc      2640
     ccgagaccgt gaccgcaccg aactaccgct cgatttcgat gtgctctctc gtttggatgt      2700
     tccggttctg ctgatccacg gtgtccagga cgtggtgatc cccgtctcgc gtacgtggga      2760
     gttactcaac gtcatcccga atgccgacgt gcatatcttc agccagtgtg gccactggtc      2820
     acaggtcgag cgggcagaag agttcaatac cgttatcacg cagtatcttt ccgctcgggg      2880
     tgtgagtcgg tcatgaagca ggctttgctg tgcatgtcgc acagcccact gttgcaccac      2940
     ctcgacccgc cggccgatgt caaagcatcg gtggaagcag cgttcgacca ggcccgcgca      3000
     tttgttcaca atttcgatcc cgatgtgatc gttaacttcg gacccgatca ctacaacgga      3060
     ttcttctacg atctgatgcc gccgttctgc atcggctaca aggcaaaggg cagtggcgat      3120
     tacgactcgt ttgccggtga actgaacgtg ccggaagcta tggccgagga cttggcgcag      3180
     ttcgtgatgg atcaggggct cgacattgcg atttcacgtc agatggaggt cgatcacggt      3240
     gcggtgcaac cgatggagat catctacgga gacgtagcgt ccaaaccgct gatcccagtc      3300
     ttcgtcaatt cggttgccag gccgttcgtg aaggttgccc gcgtgcgtaa gttcggcgag      3360
     gccgtcggcg cgtatttcaa gaattccgac aagaaggtgc tgttcatcgg ttccggtggg      3420
     ctgtcacatg atccgccggt tccgcagatc gccaccgccg acgaggctca gcgcaagatg      3480
     ctgaccgacg gccggaatcc gacgccgcag gcgcgtgcgg ccaggcaaca gcgagtcatc      3540
     gacacggccg tcaagttcgc ggcggacgag gccgacatca tggatctgaa tccggagtgg      3600
     gacagaggat ttctcgacgt gtgcgcgtcc gggcggatcg aggatttcga tcgctacacc      3660
     gcagacgaca tggatgcggt agccgggcac tcctcgcatg aggtgcgcaa ctgggtggct      3720
     gcctactctg ccctacgggc ctgcggtgaa tacgagatcg cctacgagtt ctaccggccg      3780
     atcaaggaat acatctccgg ctttgccgtc acgaccgcga ttctgcggga tatctgattc      3840
     ttgctactcc ggggaagccc cctcccatct tatgaaagta gacctcgatg gatgttcgtg      3900
     aagcgattcg gacgcaaccg atgcgccgat atcagatttc gacaatcgcg atctgtctga      3960
     tcctcagcat gatcgacggt ttcgagatcc tggtcatggc gttcgtagcg cctcacctcg      4020
     gaaagtcctg ggacatcagc tccgtcgaga tcggctacct gctcagtgcc ggcatcatcg      4080
     gcacggctct gggtgcaatt ttcatctccc cattggcgga caagatcggt aggcgccggc      4140
     ttgcgatctg gtgtctcgtc ggtatcaccg tcggaatggc gttgtctgcc tgcgccgtca      4200
     acgttcccca gctcatcgca ttccgtgcgt ttgccggctt ggggatcggc ggactggtcg      4260
     cgaacctgaa tgttcttgta tcggagttca gttcggacaa gcgtcgtggt accgccctgg      4320
     gaatctatgg tgtcggctac cccctcggtg gagccgtggg tggcgcgatt tccggcgtcc      4380
     tgatttccgt gttcgactgg cggtcggcgt tcatcttcgg cacgatcatc accgcaatca      4440
     tgctggttgt cgtgatcaag accctgccgg aatccatcga gttcctcatc gagaagcggc      4500
     cggtcggggc actggagcgg tacaacgaga tcgcggatcg gctcggctac gagcagtcgt      4560
     cggaactgcc cgttccgatt cgaaagaccg aacgtgttgt gcgggacggc cttttcaagg      4620
     gaatcatgct gcgtcgcacg gttttcctct ggctcgggta ctcatgcttg atcgcgtcgt      4680
     tctacttcgc caatacctgg acgccgaagt tgctgtccga tgcaacgggg gattcgaaca      4740
     tgggcgtcac tgccggtgtg ctcgtcaacg tcggtggtgt catcggatcg atcatttttg      4800
     cgggcctgtc gatcgtgttg cggccgagag ttgtgacagt tctcttgatg ttcggtggag      4860
     tatttgcgtt catcggttac gcctccggat tccacatcgt cgccctggct ttgacgctcg      4920
     cggtactggt cggcattttt gccaatggcg gcatcaccgg tttctacgcg atcagcccgc      4980
     ccatctaccc ggcggcggcc cggggcaccg gtgtgggctg gatgatcggg tgcggtcgca      5040
     cggtctcgat tatcgctccg attctgaccg gctacctgct cgatggtggc tggactccga      5100
     agagcgtcta catgatgttc ggtggggtgt tggtgatcgc cggaatcgcg acgttgcttc      5160
     tcgacgcgac ctaccgcggc cgcagtgaga atccggagac tccggaggcg agacgggaag      5220
     aggacctggc cgccgcagcc actgcttgag gatgtgccga tccggcgtca agccccgaga      5280
     gaatagagtc aagggcgtgg cttcagaatc gaatgggtcg tccggcaaac aaccgggctc      5340
     gcaaacactg gcgaggggat tgcaggccct cgaattggtt gccaccactc ccgatggaat      5400
     gacaattcag gaagtagccg atgccctggg tgttcaccgg accattgcat cgcggttgct      5460
     caccactgtg gctgacttcc ggctcatcaa gcgcggtgcg gacggcaagt accgggccgg      5520
     gggcggattg gcggcgctcg ctcgggactt gtacgcaggc cttcgagacg aggcgacacc      5580
     gttgttgcgt cggctcgcga attccttggg cgcgagtgtt gcgctgtttg tcgcggaggg      5640
     ctccgaagcg gtggccgtcg ccgtcgtcga gccgaagaat gctcggtact gggtgtcgtt      5700
     ccgtgagggt ggtcgccacc ctatcgaccg cggcgccgcc ggctatgcgt tgttggccgg      5760
     gcagccgccc gtccccgggg aatcgagtcg agtcaccgat gcccgccggg acggctacgt      5820
     cgtcagttac ggcgaagtcg agccgggata ctggggcctc gggtaccgtt gacacacggc      5880
     caatgagccg gccggttgcc tgacgttgat taccgcgtcc gaggatctgg cccgcggcgc      5940
     agtgcgcgaa ttgatggatg ctgctgaaaa gatcagcggc acaacacact agctacaagt      6000
     gcggcagtat tcccacgaag aacgatgcgc tcaggcaagc                            6040
//


  
spacer
spacer