spacer
spacer

EBI Dbfetch

ID   X13602; SV 1; linear; genomic DNA; STD; PRO; 4241 BP.
XX
AC   X13602;
XX
DT   16-FEB-1989 (Rel. 18, Created)
DT   14-NOV-2006 (Rel. 89, Last updated, Version 5)
XX
DE   Caldocellum saccharolyticum celB gene for cellobiohydrolase/endocellulase
XX
KW   cellobiohydrolase; endocellulase.
XX
OS   Caldicellulosiruptor saccharolyticus
OC   Bacteria; Firmicutes; Clostridia; Thermoanaerobacterales;
OC   Thermoanaerobacterales Family III. Incertae Sedis; Caldicellulosiruptor.
XX
RN   [1]
RP   1-4241
RA   Saul D.J.;
RT   ;
RL   Submitted (18-NOV-1988) to the EMBL/GenBank/DDBJ databases.
RL   Saul D.J., Department of Cellular and Molecular Biology, University of
RL   Auckland, Private Bag, Auckland, New Zealand.
XX
RN   [2]
RP   1-4241
RX   DOI; 10.1093/nar/17.1.439
RX   PUBMED; 2789517.
RA   Saul D.J.;
RT   "Nucleotide sequence of a gene from Caldocellum saccharolyticum encoding
RT   for exocellulase and endocellulase activity";
RL   Nucleic Acids Res. 17(1):439-439(1989).
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..4241
FT                   /organism="Caldicellulosiruptor saccharolyticus"
FT                   /mol_type="genomic DNA"
FT                   /clone="pNZ1087"
FT                   /db_xref="taxon:44001"
FT   promoter        623..628
FT                   /note="put. -35 region"
FT   promoter        646..651
FT                   /note="put. -10 region"
FT   RBS             661..667
FT                   /note="pot. rRNA binding site"
FT   CDS             679..3798
FT                   /transl_table=11
FT                   /product="celB polypeptide precursor"
FT                   /db_xref="GOA:P10474"
FT                   /db_xref="HSSP:1NBC"
FT                   /db_xref="InterPro:IPR013781"
FT                   /db_xref="UniProtKB/Swiss-Prot:P10474"
FT                   /protein_id="CAA31936.1"
FT                   /translation="MKRNLFRIVSRVVLIAFIASISLVGAMSYFPVETQAAPDWSIPSL
FT                   CESYKDDFMIGVAIPARCLSNDTDKRMVLKHFNSITAENEMKPESLLAGQTSTGLSYRF
FT                   STADAFVDFASTNKIGIRGHTLVWHNQTPDWFFKDSNGQRLSKDALLARLKQYIYDVVG
FT                   RYKGKVYAWDVVNEAIDENQPDSYRRSTWYEICGPEYIEKAFIWAHEADPNAKLFYNDY
FT                   NTEISKKRDFIYNMVKNLKSKGIPIHGIGMQCHINVNWPSVSEIENSIKLFSSIPGIEI
FT                   HITELDMSLYNYGSSENYSTPPQDLLQKQSQKYKEIFTMLKKYKNVVKSVTFWGLKDDY
FT                   SWLRSFYGKNDWPLLFFEDYSAKPAYWAVIEASGVTTSSPTPTPTPTVTVTPTPTPTPT
FT                   PTVTATPTPTPTPVSTPATGGQIKVLYANKETNSTTNTIRPWLKVVNSGSSSIDLSRVT
FT                   IRYWYTVDGERAQSAVSDWAQIGASNVTFKFVKLSSSVSGADYYLEIGFKSGAGQLQPG
FT                   KDTGEIQIRFNKSDWSNYNQGNDWSWLQSMTSYGENEKVTAYIDGVLVWGQEPSGATPA
FT                   PTMTVAPTATPTPTLSPTVTPTPAPTQTAIPTPTLTPNPTPTSSIPDDTNDDWLYVSGN
FT                   KIVDKDGRPVWLTGINWFGYNTGTNVFDGVWSCNLKDTLAEIANRGFNLLRVPISAELI
FT                   LNWSQGIYPKPNINYYVNPELEGKNSLEVFDIVVQTCKEVGLKIMLDIHSIKTDAMGHI
FT                   YPVWYDEKFTPEDFYKACEWITNRYKNDDTIIAFDLKNEPHGKPWQDTTFAKWDNSTDI
FT                   NNWKYAAETCAKRILNINPNLLIVIEGIEAYPKDDVTWTSKSSSDYYSTWWGGNLRGVR
FT                   KYPINLGKYQNKVVYSPHDYGPSVYQQPWFYPGFTKESLLQDCWRPNWAYIMEENIAPL
FT                   LIGEWGGHLDGADNEKWMKYLRDYIIENHIHHTFWCFNANSGDTGGLVGYDFTTWDEKK
FT                   YSFLKPALWQDSQGRFVGLDHKRPLGTNGKNINITTYYNNNEPEPVPASK"
FT   sig_peptide     679..762
FT                   /note="signal peptide"
FT   mat_peptide     763..3795
FT                   /note="mat. cellobiohydrolase/endocellulase"
FT   misc_feature    1804..1932
FT                   /note="TP box"
FT   misc_feature    2398..2532
FT                   /note="TP box"
FT   RBS             4024..4030
FT                   /note="pot. rRNA binding site"
FT   CDS             4043..4241
FT                   /partial
FT                   /transl_table=11
FT                   /note="unkown ORF"
FT                   /db_xref="GOA:P21481"
FT                   /db_xref="HSSP:1G87"
FT                   /db_xref="InterPro:IPR001701"
FT                   /db_xref="UniProtKB/Swiss-Prot:P21481"
FT                   /protein_id="CAA31937.1"
FT                   /translation="MLKLKKAIKRITLCVAVVFLLQILFLFSGYNNSDVKAATTFNYGE
FT                   ALQKAIMFYEFQMSGKLPSWI"
XX
SQ   Sequence 4241 BP; 1524 A; 636 C; 920 G; 1161 T; 0 other;
     cggtgtatca catagtatta cgttagattt caatgtaagc ataaaaatta tacaaaatga        60
     ggttataaaa ttcataagga atttggtttt tatgagggct ctggtgtaat gccaaagtgg       120
     caattgataa tgtaacttgg acgtaagaat tgtgtcaaat atgttgatag tatttttgca       180
     acagaggttg aaatattttc aaaatgagca ttgttaattt aaatagactg agagcacaaa       240
     tgtgaagctt aaaatttgga aaaagagcga taattacaaa ataaggtttt taaaattaga       300
     tactgtcgaa gaaaaaacag taactgagtt tttaatgatg ttaaattcta taaagtcaaa       360
     tgtaccacat atggtatata tgaaattaac ataagaaaaa atgcaaaaaa gaataaatta       420
     taatttaatt ataggtttaa aaaagccgaa aaaaatattt aagtttacgc tgcacgatgt       480
     gctgggagcc tttcggcaac accagagcct ttgtttaaag ttttgctcat attaagaatt       540
     ttttaatcac aaataagctt tcaaaaaatg gtaacatata gcgtctaaat tgaacaatta       600
     tatagtgtcg ccaatttgtt tttcgacaaa atgtaaaata aaaaatttaa aaataagaag       660
     agggggttag tggataaaat gaagagaaat ctatttagga ttgtatctcg agttgtatta       720
     atagcgttta ttgctagtat ttctctggtt ggtgcaatga gttattttcc agttgaaact       780
     caagctgcgc cagactggag tattccaagt ttatgtgaga gttataaaga cgattttatg       840
     ataggcgtgg caatacctgc aagatgtttg agcaatgata ctgacaaacg aatggtattg       900
     aaacatttta acagtataac agcagagaat gaaatgaagc cggaaagctt attagctggt       960
     cagaccagta ctgggttaag ttatagattt agtactgctg atgcttttgt tgactttgcg      1020
     agtacaaaca agataggtat aagaggtcat acattagttt ggcataatca gacacctgat      1080
     tggttcttta aagatagcaa tggtcaaagg ttatccaaag atgcattatt agcaagacta      1140
     aagcaatata tttatgatgt tgttggaaga tataaaggga aagtgtatgc atgggacgtt      1200
     gtcaatgaag ctatcgatga gaatcagcca gatagttata gacgttcgac atggtatgaa      1260
     atttgtggtc ctgagtacat tgaaaaagca tttatatggg ctcatgaagc agaccctaac      1320
     gcaaagctat tctacaatga ctataatacc gagatttcta agaaaagaga ttttatatac      1380
     aacatggtaa aaaacctgaa atctaaaggt atacctattc atggtattgg tatgcaatgt      1440
     catataaatg ttaactggcc atctgttagc gaaatagaaa acagtattaa gttatttagt      1500
     tcgataccag gtattgagat tcacattaca gaacttgata tgagcctata caactacggc      1560
     tccagcgaaa attattccac accaccacag gatttgcttc aaaagcagtc tcagaaatac      1620
     aaagagattt ttacaatgct gaaaaaatac aaaaatgtag taaaaagtgt tactttttgg      1680
     ggattgaaag atgattattc atggttaaga tcattctacg gtaagaatga ttggccgttg      1740
     ttgttttttg aagattacag tgcaaagcca gcctattggg cagtaattga agcttctggg      1800
     gtaacaacat catctccgac acctacacct acgccgacag taacagtaac accaactcca      1860
     acaccgacac cgacaccgac agtaacagcg actccaacac ctacacctac acctgttagc      1920
     acacctgcga caggtgggca gataaaggta ctgtatgcta acaaggagac aaacagcacg      1980
     acaaacacga taaggccatg gttgaaggta gtgaatagtg gcagcagtag catagatttg      2040
     agcagggtaa cgataaggta ctggtacacg gtagatggtg aaagggcaca gagtgcggta      2100
     tcagactggg cacagatagg agcaagcaat gtaacattca agtttgtgaa gctgagcagt      2160
     agtgtaagtg gagcggatta ttacttggag ataggattta agagtggagc agggcagtta      2220
     cagcctggga aggacacagg agagatacag ataaggttta acaagagtga ctggagcaat      2280
     tacaatcagg ggaatgactg gtcatggtta cagagcatga cgagttatgg agagaatgag      2340
     aaggtaacag cgtatataga tggagtgctg gtatggggac aggagccgag tggagcgacg      2400
     cctgcgccga cgatgacggt tgcaccgaca gcgaccccga caccaactct gagtccgacg      2460
     gtaacgccga cgccggcacc gacgcagaca gcaataccaa cgccaacatt aactccaaat      2520
     ccaacgccaa catcgagtat tcctgatgat acaaatgatg attggcttta tgtaagtggt      2580
     aataaaatag ttgataaaga cggtagacca gtatggttaa caggtattaa ctggtttgga      2640
     tataatactg gtacaaatgt atttgatggt gtatggagtt gtaatctgaa agatactctt      2700
     gctgaaatag ctaatagagg ctttaacttg ctaagagttc caatatctgc agagcttata      2760
     ttgaactggt cgcaaggtat ttatccaaaa ccaaatataa actactacgt aaatccagag      2820
     cttgaaggca aaaacagctt ggaagtattt gacatagtag tgcaaacatg taaagaagtt      2880
     ggtttgaaaa ttatgttgga tattcacagt ataaaaacag acgcgatggg acatatctat      2940
     ccggtatggt atgatgaaaa atttactcca gaggattttt ataaagcgtg cgaatggatt      3000
     acaaatagat ataaaaatga tgacactatt atagcttttg acctaaagaa tgagccacat      3060
     ggaaaaccgt ggcaagatac aacatttgca aaatgggata attcaacaga tattaataat      3120
     tggaaatatg cagctgaaac atgtgcaaaa cgtatactga atataaatcc aaaccttcta      3180
     attgtaattg aaggaattga agcctatcca aaggacgacg tcacatggac atcaaaatcc      3240
     tccagcgact actattcaac atggtggggc ggtaacttgc gaggtgttag aaagtatcct      3300
     attaatctgg gtaaatatca aaataaagtt gtatattcgc cacatgatta cgggccatct      3360
     gtttaccagc agccgtggtt ttatccaggg ttcacaaaag agtctttact acaagattgt      3420
     tggcgtccga attgggcgta cattatggaa gaaaacattg cgccacttct gataggtgag      3480
     tggggtggtc atctggatgg agccgataac gaaaagtgga tgaagtattt acgagattat      3540
     atcatagaaa atcatattca tcacacattt tggtgcttta atgctaactc gggtgacact      3600
     ggaggattgg ttggatatga ttttacgaca tgggatgaga aaaaatactc atttttgaaa      3660
     ccggctctat ggcaagacag tcaaggtagg tttgttggat tagatcacaa aagaccctta      3720
     ggtacaaatg ggaaaaacat taatattaca acatattaca acaataatga gcctgagcca      3780
     gttccagctt caaaatgata aaatacatta aataggaatt tatggatata tgagaaaaat      3840
     ttaaggtcag taggggaatg tatagttaaa gtcattaagc aagcgaatta aaggaaaaag      3900
     gggggtgata aaaaacggct aaaaacataa gtaattatta aacatttatt gtaggaacta      3960
     agtataagtt tcaaaatcat accgtccaat acgattaatt gaagttaact atcaaatcaa      4020
     aaagaggggg ttagggttaa aaatgcttaa actaaaaaaa gcaataaaaa ggataacact      4080
     gtgtgttgct gtggtatttc tattgcagat tttatttcta ttttcaggat acaataacag      4140
     tgatgtgaaa gcagcaacaa cctttaacta tggtgaagct cttcaaaaag caattatgtt      4200
     ttatgaattc cagatgtcag gtaaactgcc atcatggatc c                          4241
//


  
spacer
spacer