spacer
spacer

EBI Dbfetch

ID   U34793; SV 3; linear; genomic DNA; STD; PRO; 4652 BP.
XX
AC   U34793;
XX
DT   22-MAY-1998 (Rel. 55, Created)
DT   17-APR-2005 (Rel. 83, Last updated, Version 5)
XX
DE   Clostridium cellulovorans exoglucanase S (exgS) and endoglucanase H (engH)
DE   genes, complete cds.
XX
KW   .
XX
OS   Clostridium cellulovorans
OC   Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae;
OC   Clostridium.
XX
RN   [1]
RP   1-334, 401-4652
RX   DOI; 10.1016/S0378-1119(98)00081-X
RX   PUBMED; 9643978.
RA   Liu C.C., Doi R.H.;
RT   "Properties of exgS, a gene for a major subunit of the Clostridium
RT   cellulovorans cellulosome";
RL   Gene 211(1):39-47(1998).
XX
RN   [2]
RP   1-4652
RX   DOI; 10.1128/JB.182.20.5906-5910.2000
RX   PUBMED; 11004194.
RA   Tamaru Y., Karita S., Ibrahim A., Chan H., Doi R.H.;
RT   "A large gene cluster for the Clostridium cellulovorans cellulosome";
RL   J. Bacteriol. 182(20):5906-5910(2000).
XX
RN   [3]
RP   1-334, 401-4652
RA   Liu C.C., Doi R.H.;
RT   ;
RL   Submitted (23-AUG-1995) to the EMBL/GenBank/DDBJ databases.
RL   Chichi Liu, Molecular and Cellular Biology, University of California,
RL   Davis, Davis, CA 95616, USA
XX
RN   [4]
RC   Sequence update by submitter
RP   1-334, 401-4652
RA   Liu C.C., Doi R.H.;
RT   ;
RL   Submitted (09-MAR-1999) to the EMBL/GenBank/DDBJ databases.
RL   Chichi Liu, Molecular and Cellular Biology, University of California,
RL   Davis, Davis, CA 95616, USA
XX
RN   [5]
RC   Sequence update by submitter
RP   1-4652
RA   Liu C.C., Doi R.H.;
RT   ;
RL   Submitted (05-AUG-1999) to the EMBL/GenBank/DDBJ databases.
RL   Chichi Liu, Molecular and Cellular Biology, University of California,
RL   Davis, Davis, CA 95616, USA
XX
CC   On Aug 5, 1999 this sequence version replaced gi:4388626.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..4652
FT                   /organism="Clostridium cellulovorans"
FT                   /map="3' and linked to cbpA"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:1493"
FT   CDS             70..2253
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="exgS"
FT                   /product="exoglucanase S"
FT                   /EC_number="3.2.1.91"
FT                   /note="ExgS; cellobiohydrolase; similar to Clostridium
FT                   thermocellum CelS"
FT                   /db_xref="GOA:O65986"
FT                   /db_xref="HSSP:1FAE"
FT                   /db_xref="InterPro:IPR016134"
FT                   /db_xref="UniProtKB/TrEMBL:O65986"
FT                   /protein_id="AAC38571.3"
FT                   /translation="MRKRLNKIVAVALTATTISSVAATVNTAQVSAAPVVPNNEYVQHF
FT                   KDMYAKIHNANNGYFSDEGIPYHAVETLMVEAPDYGHETTSEAFSYYMWLEAMNAKLTG
FT                   DFSGFKKAWDVTEKYIIPGETDQPSASMSNYDPNKPATYAAEHPDPSMYPSQLQFGAAV
FT                   GKDPLYNELKSTYGTSQVYGMHWLLDVDNWYGFGGATSTSPVYINTFQRGVQESCWETV
FT                   PQPCKDEMKYGGRNGFLDLFTGDSQYATQFKYTNAPDADARAVQATYYAQLAAKEWGVD
FT                   ISSYVAKSTKMGDFLRYSFFDKYFRKVGNSTQAGTGYDSAQYLLNWYYAWGGGISSNWS
FT                   WRIGSSHNHFGYQNPMAAWILSNTSDFKPKSPNAATDWNNSLKRQIEFYQWLQSAEGGI
FT                   AGGASNSNGGSYQAWPAGTRTFYGMGYTPHPVYEDPGSNEWFGMQAWSMQRVAEYYYSS
FT                   KDPAAKSLLDKWAKWACANVQFDDAAKKFKIPAKLVWTGQPDTWTGSYTGNSNLHVKVE
FT                   AYGEDLGVAGSLSNALSYYAKALESSTDAADKVAYNTAKETSRKILDYLWASYQDDKGI
FT                   AVTETRNDFKRFNQSVYIPSGWTGKMPNGDVIQSGATFLSIRSKYKQDPSWPNVEAALA
FT                   NGTGVDMTYHRFWGQSDIAIAFGTYGTLFTDPTPGLKGDVNSDAKVNAIDLAILKKYIL
FT                   DSTTKINTANSDMNGDGKVNAMDLALLKKALLA"
FT   CDS             2505..4652
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="engH"
FT                   /product="endoglucanase H"
FT                   /note="EngH; member of family E2"
FT                   /db_xref="GOA:O65987"
FT                   /db_xref="HSSP:1G87"
FT                   /db_xref="InterPro:IPR016134"
FT                   /db_xref="UniProtKB/TrEMBL:O65987"
FT                   /protein_id="AAC38572.2"
FT                   /translation="MFNISKKKAQALLLSGILGATSFTPAVLVKGETTATPTFNYGEAL
FT                   QKSIMFYEFQRSGKLPTDIRSNWRGDSGTKDGSDVGVDLTGGWYDAGDHVKFNLPMSYT
FT                   VAMLAWSLSEDKAAYEKSGQLDYLVKEIKWATDYLMKCHTAPNEYYYQVGDGGADHKWW
FT                   GPAEVMQMARPAYKVDLQKPGSSVVAETAAALASTAFALKDIDKAYSEQCIQHAKELYN
FT                   FADTTKSDAGYTAANTYYNSWSGYYDELSWAAAWLYMATNDASYLEKAESYVPFWKVEQ
FT                   QTTTIAYRWAHCWDDVHFGAQLLLARLTGKSIYKESVERNLDYWTTGYDGNKIKYTPKG
FT                   LAWMDSWGSLRYATTTAFLADVYASSDVCSISKVDTYKNFAKSQADYALGSTGRSFVVG
FT                   FGENAPKKPHHRTAHSSWSDQQVNPTDHRHVLYGALVGGPDASDGYTDAIDNFTNNEVA
FT                   CDYNAGFVGLLARQYSKYGGDPIPDFKAIEKPTNDEFFVEAGVNCTGPNFVEIKALVNN
FT                   RTGWPARMGDKLSFKYFINVSEFVNAGYSADDLKVTVGYNTGGTVSNLIPWDKENNIYY
FT                   VNVDFTGVKIYPGGQSDYKKEIQFRISGIQNVNIWDNSDDFSYEGITKTPGETPVKVTN
FT                   IPVYDNGVKVFGNEPGTTKPPVIAGDVNNNGIVNSMDLAMLKKYILGYEVEMNKEASDL
FT                   NKDGKINAIDFALLKKLLLSQ"
XX
SQ   Sequence 4652 BP; 1660 A; 733 C; 946 G; 1313 T; 0 other;
     taatatataa ataatattta aaatcaataa atcaatcggg gaaaatttaa aaaaagagag        60
     ggataatcaa tgagaaaaag attaaataag atcgttgctg ttgctttaac tgcaacaact       120
     atatcatcag tagcagctac tgttaataca gctcaagttt cagctgcacc agtagtgcca       180
     aataatgagt atgttcaaca ctttaaggat atgtacgcta agatccataa tgcaaacaat       240
     ggatacttca gtgatgaagg aataccttat cacgcagttg aaacattaat ggttgaagca       300
     ccagactatg gtcatgaaac tacaagtgaa gctttcagtt actatatgtg gcttgaagct       360
     atgaacgcta agcttactgg agatttctca ggattcaaaa aagcttggga tgtaactgaa       420
     aagtacataa ttccaggtga gactgatcaa ccaagcgcaa gtatgagcaa ttatgatcca       480
     aataagccag ctacatatgc agctgaacat ccagatccaa gcatgtaccc atctcaatta       540
     caatttggtg ctgctgtagg taaggatcca ttatacaatg aattaaaatc tacttatgga       600
     actagccaag tatatggtat gcattggtta ctagatgttg ataactggta tggttttggt       660
     ggtgcaacaa gcacaagccc agtatacatc aacactttcc aaagaggtgt tcaagaatct       720
     tgttgggaaa ctgtgccaca accatgtaaa gacgaaatga agtacggtgg aagaaacggt       780
     ttcttagatc tattcactgg tgattcacaa tacgcaactc aatttaaata tactaacgct       840
     ccagacgcag atgctcgtgc agttcaagct acttactatg cacaattagc tgctaaagaa       900
     tggggagtag acatcagctc atatgtagca aaatctacta agatgggtga cttcttaaga       960
     tattcattct ttgataaata ctttagaaaa gttggaaatt caacacaagc aggaactgga      1020
     tatgattcag ctcaatacct attaaactgg tactatgctt ggggtggtgg aatcagctca      1080
     aactggtctt ggagaattgg atcaagccat aaccatttcg gataccaaaa cccaatggca      1140
     gcatggatat tatcaaatac atctgacttt aaaccaaagt caccaaatgc tgctacagat      1200
     tggaataaca gtttaaagag acaaatagaa ttctatcaat ggttacaatc tgctgaaggt      1260
     ggtatcgctg gaggagctag taactcaaat ggaggaagct atcaagcatg gccagcaggt      1320
     actcgaacat tctacggaat gggatatact cctcacccag tatacgaaga tccaggtagt      1380
     aacgaatggt ttggtatgca agcatggtca atgcaacgtg tggctgaata ctactacagt      1440
     tcaaaagatc cagcagctaa atcattactt gataaatggg ctaaatgggc ttgtgcaaat      1500
     gttcaattcg atgatgcagc taagaaattt aagattcctg ctaaattagt atggactgga      1560
     caaccagata cttggactgg atcatataca ggaaattcaa atcttcatgt taaagttgaa      1620
     gcttatggag aagatcttgg agtagcaggt tcactttcta atgcattatc atattatgca      1680
     aaagctcttg aatctagcac agatgctgca gataaagtag catataacac tgcaaaagaa      1740
     acttctagaa agatacttga ttacttatgg gcaagctacc aagatgataa gggtatagca      1800
     gttactgaaa caagaaatga tttcaaacgt ttcaatcaat ctgtatatat tccatcaggt      1860
     tggacaggaa aaatgcctaa tggagatgta atccaaagtg gagctacttt cttaagcata      1920
     cgttcaaaat acaaacaaga tccatcatgg ccaaatgttg aagctgcttt agcaaatggt      1980
     actggtgttg atatgacata ccacagattc tggggtcaaa gtgatatcgc tatagcattt      2040
     ggaacatacg gtacattatt cacagaccct actccaggat taaaaggtga tgttaactct      2100
     gatgctaaag taaatgctat agatttagct atattaaaga aatacatctt agattcaaca      2160
     actaaaatta acactgctaa ttctgatatg aacggtgatg gaaaagttaa tgcaatggat      2220
     ttagctttat taaagaaagc acttcttgct taagattaaa taactttaga tcgaaattgt      2280
     aaggttattt aaggctggac aatatcaagt atattgtcca gctactttaa aaaatattgg      2340
     gaaacactgt gtaaggtaaa cttaaaccat ggatatgaaa tatagtaaga ttaatgccat      2400
     tgctatggca aacttaaaat aaatatatta gagcataaac atgaaattta agtaaaaggc      2460
     gaataaataa attccctaat caaaaaaatt aaggggtgga actagtgttt aacatatcta      2520
     agaaaaaagc gcaagctctt cttttatcag gaatcttggg tgcaacttca tttacaccag      2580
     ctgtattggt aaaaggtgaa acaacagcga ctccaacatt caattatgga gaagcattac      2640
     aaaagtcaat aatgttttat gaattccaac gttctggaaa gttaccaacg gatattcgta      2700
     gtaattggcg tggtgattct ggaacaaaag atggctctga tgtaggagtt gatttaactg      2760
     gtggatggta tgatgctgga gaccacgtta aatttaatct gccaatgtct tatactgtgg      2820
     caatgcttgc atggtcatta agtgaagaca aagcagctta cgaaaaaagc ggccaattag      2880
     attaccttgt taaggaaata aaatgggcta cagattatct aatgaagtgc catacggcac      2940
     caaatgaata ctattatcaa gttggtgatg gtggagctga tcacaaatgg tggggacctg      3000
     cagaagtaat gcagatggca agaccggctt ataaagtaga tttgcaaaaa ccaggatcat      3060
     cagttgtcgc tgaaacagca gcagcattag cttctacagc ttttgcatta aaagacatag      3120
     ataaagcgta ttcagaacaa tgtattcagc atgcaaaaga actttataac tttgctgata      3180
     caacaaagag tgatgctggt tatacagcag caaatacata ttacaattca tggagtggat      3240
     actatgatga attatcatgg gctgcagcat ggctttacat ggcaacaaat gatgcatcat      3300
     atctagaaaa agcggaatca tatgttccat tttggaaggt tgaacagcaa acaaccacta      3360
     tagcatatag atgggcgcat tgttgggatg atgtacattt cggagctcaa ttactccttg      3420
     ccagattaac aggaaaatca atatacaaag aatcagttga aagaaacctt gattattgga      3480
     caactggtta tgatggaaat aaaataaagt acactccaaa aggtttagct tggatggatt      3540
     cttggggctc attaagatat gcaactacaa cggcattcct tgccgatgtt tatgcaagct      3600
     cagatgtttg ttctatttct aaggtagata catataagaa ttttgctaag agtcaagctg      3660
     attatgcttt aggaagtact ggaagaagtt ttgtggtagg atttggtgaa aatgctccaa      3720
     agaaaccaca tcatagaact gcccatagtt catggtcaga tcaacaagta aatccaacag      3780
     accatagaca tgttttatat ggtgctttag ttggaggacc agatgccagt gatggttata      3840
     ctgatgctat tgacaatttt actaataatg aggtggcttg tgattataat gcaggatttg      3900
     taggactttt agctagacaa tattctaaat atggcggaga tccaatacct gattttaaag      3960
     cgatagaaaa gccaaccaac gatgagttct ttgtcgaagc aggagtaaat tgtacaggtc      4020
     caaattttgt agaaattaaa gctttagtta ataatagaac aggatggcca gcaagaatgg      4080
     gagataaact ttcattcaaa tacttcataa atgtaagtga atttgttaat gctggttaca      4140
     gtgcagatga tttaaaggtt actgttggtt acaatactgg cggaactgta tcaaacctaa      4200
     tcccatggga taaggaaaat aatatttatt atgtaaatgt tgatttcaca ggggtaaaga      4260
     tttatccagg tggacaatca gattataaaa aagaaattca atttagaatt tcaggaattc      4320
     aaaatgttaa tatttgggat aattctgatg acttctctta tgaggggatt acaaaaactc      4380
     caggtgaaac acctgtgaag gttacaaaca tcccagttta tgataatgga gttaaggtat      4440
     tcggaaatga accaggaact actaagccac ctgttatagc tggtgatgta aacaataatg      4500
     gtatcgtgaa ttcaatggat ttagcgatgt taaagaaata tatacttgga tacgaagtag      4560
     aaatgaataa agaggcttca gatttaaata aagatggtaa gattaatgcc attgatttcg      4620
     ctcttttaaa gaaactactt ttatcacagt ag                                    4652
//


  
spacer
spacer