spacer
spacer

EBI Dbfetch

ID   M35107; SV 1; linear; genomic DNA; STD; PRO; 5120 BP.
XX
AC   M35107;
XX
DT   19-JUL-1990 (Rel. 24, Created)
DT   17-APR-2005 (Rel. 83, Last updated, Version 6)
XX
DE   C.acetobutylicum beta-D-galactosidase (cbgA) and beta-D-galactosidase
DE   regulatory protein (cbgR) genes, complete cds.
XX
KW   beta-D-galactosidase; beta-D-galactosidase regulatory protein.
XX
OS   Clostridium acetobutylicum
OC   Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae;
OC   Clostridium.
XX
RN   [1]
RP   1-5120
RA   Scott D.B., Hancock K.R., Pearce L., Maddox I.S.;
RT   ;
RL   Unpublished.
XX
RN   [2]
RP   1260-5120
RX   PUBMED; 1850729.
RA   Hancock K.R., Rockman E., Young C.A., Pearce L., Maddox I.S., Scott D.B.;
RT   "Expression and nucleotide sequence of the Clostridium acetobutylicum
RT   beta-galactosidase gene cloned in Escherichia coli";
RL   J. Bacteriol. 173(10):3084-3095(1991).
XX
CC   Draft entry and computer-readable sequence for [1] kindly submitted
CC   by D.B.Scott, 11-JUN-1990.
CC   Author address:D.B.Scott:
CC   Molecular Genetics Unit
CC   Department of Microbiology and Genetics
CC   Massey University
CC   Palmerston North, New Zealand
CC   E-mail:D.B.Scott@massey.ac.nz.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..5120
FT                   /organism="Clostridium acetobutylicum"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:1488"
FT   CDS             1560..4253
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /note="beta-D-galactosidase (cbgA)"
FT                   /db_xref="GOA:P24131"
FT                   /db_xref="HSSP:1JZ8"
FT                   /db_xref="InterPro:IPR013781"
FT                   /db_xref="UniProtKB/Swiss-Prot:P24131"
FT                   /protein_id="AAA23216.1"
FT                   /translation="MINNKPSLDWLENPEIFRVNRIDAHSDTWFYEKFEDVKLEDTMPL
FT                   KQNLNGKWRFSYSENSSLRIKEFYKDEFDVSWIDYIEVPGHIQLQGYDKCQYINTMYPW
FT                   EGHDELRPPHISKTYNPVGSYVTFFEVKDELKNKQTFISFQGVETAFYVWVNGEFVGYS
FT                   EDTFTPSEFDITDYLREGENKLAVEVYKRSSASWIEDQDFWRFSGIFRDVYLYAVPETH
FT                   VNDIFIKTDLYDDFKNAKLNAELKMIGNSETTVETYLEDKEGNKIAISEKIPFSDELTL
FT                   YLDAQNINLWSAEEPNLYTLYILVNKKDGNLIEVVTQKIGFRHFEMKDKIMCLKWKRII
FT                   FKGVNRHEFSARRGRSITKEDMLWDIKFLKQHNINAVRTSHYPNQSLWYRLCDEYGIYL
FT                   IDETNLESHGSWQKMGQIEPSWNVPGSLPQWQAAVLDRASSMVERDKNHPSVLIWSCGN
FT                   ESYAGEDIYQMSKYFRKKDPSRLVHYEGVTRCREFMTRRHESRMYAKAAEIEEYLNDNP
FT                   KKPYISCEYMHSMGNSTGGMMKYTELEDKYLMYQGGFIWDYGDQALYRKLPDGKEVLAY
FT                   GGDFTDRPTDYNFSGNGLIYADRTISPKAQEVKYLYQNVKLEPDEKGVTIKNQNLFVNT
FT                   DKYDLYYIVERDGKLIKDGYLNVSVAPDEEKYIELPIGNYNFPEEIVLTTSLRLAQATL
FT                   WAEKGYEIAFGQKVIKEKSDMNNHNSESKMKIIHGDVNIGVHGKDFKAIFSKQEGGIVS
FT                   LRYNNKEFITRTPKTFYWRATTDNDRGNRHEFRCSQWLAATMGQKYVDFSVEEFDEKIT
FT                   LYYTYQLPTVPSTNVKITYEVSGEGIIKVNVKYKGVSGLPELPVLGMDFKLLAEFNSFS
FT                   WYGMGPEENYIDRCEGAKLGIYESTQ"
FT   CDS             4500..4805
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /note="beta-D-galactosidase regulatory protein (cbgR)"
FT                   /db_xref="UniProtKB/Swiss-Prot:P24132"
FT                   /protein_id="AAA23217.1"
FT                   /translation="MLGSTMIPKFCIDSSKDLEYSFIISKIILRTYGNYRYPKQNLDLC
FT                   NNLRKDRYSVVSVTKNKLRLSNIISCTISACSRDKLVTSKNGTTYDEEMPATYSLM"
XX
SQ   Sequence 5120 BP; 1921 A; 683 C; 876 G; 1640 T; 0 other;
     gaattccttt tcatatatat ctttaatatt tctactggaa tagaagaggt tgctcaatac        60
     aaaaaatgct tctttaaaac tatttgaaac tacttctgaa atattttcta gcttactaaa       120
     tagagaatta taatttttat catcaaaatt tagaattaca actatgattt cgttttcaat       180
     attagcaatt tgtatattat aattgctatt taatccgtct aaagaaaatt ctttgccgat       240
     ttctgaaatt gtaaaatcaa taatttcatg gcgtttgcta taattatcat atatttcttt       300
     gcgtttaaac caaataagca aaatgattga aaagtaaata tgtatcaaag tagttaaagt       360
     caggatcatg tcaaaacctg atataaggcg atttaaggcg ctattagtga gacttaaaga       420
     gtttccttct aaagtatttc ttttcatttt tattgaaatc ttttttagag tacttaataa       480
     ctcagaagga tttagagaag gttttaaaat ataatcaaca gcaccatttt gaaaagatga       540
     tttaacatat tcaaaatcgc tataactact taagatgata attcttatct taggatattt       600
     gtcctgcaca aatttagcta attcaacccc atttatttgg ggcattacaa catcagaaat       660
     tataatgtca ggaatatcct tttttatcat ttccagagct tcttgaccat tagaagcctg       720
     tcctataatt tgaaagcctt ctttttccca atcaatcata tgagttatgc cttgccgcat       780
     aataaattca tcatcaacaa ctaaattttt actatattcg ttcaatagta tagcacccct       840
     tattctaaaa ttaccacaac atagataaat attgcttaat actattatac cttatagatt       900
     tattgtatgt atctgtatac gttacgttaa ttcatctaca aatttatatg agttttggtt       960
     gcacttttag agaaaatctt tttgtctatg gtcttattgt cctataatgg tcaaatcatc      1020
     tttaccaaag tctcttgatt taaagagata aaaacaccac tgatccatta ttcctcattt      1080
     tggtaatgaa cctatgcggt tgaagatatt aatcagatgt ctaaatactt tagaaaaaaa      1140
     gacctttact aatatcttca atatttacac ccctattcta aaattaccac aagatagata      1200
     aatattgctt aatactgatt ataccttata gattaaaggt tttcaattaa acaataaatt      1260
     actttagtaa agtttagtaa aatataattg attttttact aaaaagataa taaaatgaaa      1320
     ctataaattt agttaatagc ataaatctaa catcagaaga taggataaat taaagaagta      1380
     atgtaattga ttacgaaaca aaatctcata ttaatattag cccataattt ttttattctc      1440
     atatatgttt aagtattaat taaatgtgac tttataaaaa ggttgcattt agttaatacg      1500
     attaacaact ttaatttaaa aaagcaataa ctctacaaag tgaaagtgag ggggtaagta      1560
     tgattaataa taaaccgtca ttagattggc tagaaaatcc ggaaatattt agagttaata      1620
     gaatagatgc tcattctgat acttggtttt atgaaaaatt tgaggatgtt aaattagaag      1680
     acaccatgcc tcttaagcaa aatttaaatg gaaaatggag attttcatat agtgaaaatt      1740
     catcattaag aattaaagag ttttataagg atgagtttga cgtaagttgg attgattata      1800
     ttgaagttcc aggtcatatt cagcttcaag gatatgataa atgtcaatat attaatacta      1860
     tgtatccttg ggaaggtcac gatgaattaa gaccacctca tatttcaaaa acatataatc      1920
     cggtgggaag ctatgtaaca ttttttgaag ttaaagatga actcaaaaat aagcagactt      1980
     ttatttcttt tcaaggtgtt gaaacagcat tttacgtatg ggtaaatgga gaatttgtag      2040
     gatatagcga agatacattt acaccatcag aatttgatat tactgattat ttaagagagg      2100
     gagaaaataa acttgcagtt gaggtttata aaaggagtag cgcaagttgg atagaagatc      2160
     aagatttctg gagattttca ggcatcttta gagatgtata tttatatgca gttccagaaa      2220
     ctcatgtaaa tgatatattt ataaaaacag atttatatga cgatttcaaa aacgcaaagt      2280
     taaatgctga acttaaaatg attggaaatt cagaaacaac agttgaaaca tatttagaag      2340
     ataaagaagg aaataaaata gctatatctg aaaagattcc gttctctgat gagttgactt      2400
     tatatttaga tgcgcaaaat ataaacctat ggagtgcaga agagcctaac ttatatacac      2460
     tttatatttt agtgaataaa aaagatggta atttaattga ggttgtaact caaaagatag      2520
     ggtttaggca ctttgaaatg aaggataaaa ttatgtgtct aaaatggaaa cgtattatct      2580
     ttaaaggcgt aaaccgtcac gaatttagcg caagacgtgg acgctcaatt acgaaagagg      2640
     acatgttgtg ggatattaag ttcttgaaac aacacaatat taatgctgtt agaacatcac      2700
     attatccaaa tcaaagttta tggtacagac tttgcgatga atacgggatt tatttaatag      2760
     atgaaacaaa tttagaaagc catggttcat ggcaaaagat ggggcagatt gaaccatcat      2820
     ggaatgtgcc aggaagtctt ccacagtggc aggcagcagt tttagatcga gcatcatcaa      2880
     tggttgaaag agataaaaat catccatctg tacttatttg gtcatgtggt aatgaatcct      2940
     atgcgggtga agatatttat cagatgtcta aatactttag aaaaaaagat ccttcacgtt      3000
     tagtgcacta tgaaggggta actagatgca gagaatttat gacacgacga catgaaagta      3060
     gaatgtatgc aaaggcagca gaaatagaag aatatcttaa tgataatccg aagaaacctt      3120
     atatcagctg cgaatacatg cactcaatgg gtaactcaac tggtggaatg atgaaataca      3180
     cagaacttga agataaatat ttgatgtatc aaggtggatt catttgggat tacggcgatc      3240
     aggcgttgta tagaaaactt ccagatggaa aagaagttct agcttatgga ggagacttta      3300
     cagatcgtcc aacagactat aatttctctg gaaatggttt gatttatgca gatagaacta      3360
     tatcacctaa agcacaggaa gttaagtatc tatatcaaaa cgtaaaatta gaaccagatg      3420
     aaaaaggggt gactattaag aatcaaaatc tttttgttaa tactgataaa tatgatttat      3480
     actatatcgt tgaaagagat ggaaaactaa taaaagatgg ttatctaaat gtatctgtag      3540
     ctccagatga agaaaaatat atagaacttc caataggaaa ttacaatttt cctgaagaaa      3600
     ttgtacttac aacctcatta agattagcac aagctacact ttgggcagaa aaaggatatg      3660
     aaatagcatt tggacaaaag gttattaaag aaaaatcaga tatgaataat cataattcag      3720
     agtctaaaat gaagatcatt catggagatg taaacatagg ggttcacgga aaagatttca      3780
     aggctatatt ctctaaacaa gagggaggaa tcgtatcctt gagatataat aataaggagt      3840
     ttataacgag aacgccaaaa actttctatt ggagagcaac aacagataat gatagaggaa      3900
     atagacatga atttagatgc agtcaatggc tggctgctac tatggggcag aagtatgtgg      3960
     atttttcagt tgaggaattt gatgagaaga ttacattata ttatacttat caattgccaa      4020
     cagtgccatc tactaatgtt aagataactt atgaagtatc tggagaagga ataattaaag      4080
     taaatgttaa gtataaagga gttagcggat tacctgaatt gcctgtacta ggaatggatt      4140
     ttaaattatt agccgaattt aattcattta gctggtatgg aatggggcca gaagaaaact      4200
     atatagacag atgtgaaggt gcaaaacttg gaatatatga gagtacacaa tagaaaatct      4260
     atcaaggtat ttagtaccac aagaatgtgg taacaggata ggaactagat gggtagtagt      4320
     taaaaatcat aagaatgaag gtcttaaatt tacttatgtt aaagttccat ttgaatttag      4380
     tgttttacca tacagcagca tggaattaga aaattcactt catatagaag aattaccatc      4440
     tgttaatttt acacattgtg aatataatag gtaaacaaat gggtgttggc ggagatgcaa      4500
     tgctggggag caccatgata cctaaattct gtatagattc aagtaaggat ttagaatata      4560
     gttttataat ttctaaaatt atactacgca catatgggaa ctatagatat ccaaaacaaa      4620
     acttagactt atgcaataat ttacgaaagg acaggtactc tgttgtttcg gttactaaga      4680
     ataagttgag gctttctaac atcataagtt gcaccatttc agcatgctcc cgagacaagc      4740
     tcgtgacaag caaaaatgga acaacttatg atgaagaaat gcctgcaaca tattctttaa      4800
     tgtaacactg cacaaaagag tacctgtcct ttctgatata gcagattttt caagctataa      4860
     gtatatctca cgaaatcata aatattttga ttccgaaaag ctatgaaaat atcgctgaag      4920
     gttctaagca gctggttgtg tgcaccttag catgctccaa ctttcagttt gacaagctaa      4980
     aatggaacaa tctacagctc aagaaacttt aacagctcat tttcaaatgt tttctacaca      5040
     aatatattta tatttctagt gaagatatga aattaaattt ttagcgactt tgtaaatatg      5100
     ttaatctaat atacgaattc                                                  5120
//


  
spacer
spacer