spacer
spacer

EBI Dbfetch

ID   L20094; SV 1; linear; genomic DNA; STD; PRO; 3289 BP.
XX
AC   L20094;
XX
DT   08-JUL-1993 (Rel. 36, Created)
DT   17-APR-2005 (Rel. 83, Last updated, Version 4)
XX
DE   Thermomonospora fusca beta-1,4-endoglucanase precursor (E1) gene, complete
DE   cds.
XX
KW   .
XX
OS   Thermobifida fusca
OC   Bacteria; Actinobacteria; Actinobacteridae; Actinomycetales;
OC   Streptosporangineae; Nocardiopsaceae; Thermobifida.
XX
RN   [1]
RA   Lin E., Wilson D.B.;
RT   "Identification of a celE binding protein and its potential role in
RT   induction of the celE gene in Thermomonospora fusca";
RL   J. Bacteriol. 170:3843-3846(1988).
XX
RN   [2]
RX   PUBMED; 1904434.
RA   Lao G., Ghangas G.S., Jung E.D., Wilson D.B.;
RT   "DNA sequences of three beta-1,4-endoglucanase genes from Thermomonospora
RT   fusca";
RL   J. Bacteriol. 173(11):3397-3407(1991).
XX
RN   [3]
RP   1-3289
RX   DOI; 10.1002/bit.260420811.
RX   PUBMED; 18613149.
RA   Irwin D.C., Spezio M., Walker L.P., Wilson D.B.;
RT   "Activity studies of eight purified cellulases: Specificity, synergism, and
RT   binding domain effects";
RL   Biotechnol. Bioeng. 42(8):1002-1013(1993).
XX
RN   [4]
RP   1-3289
RX   PUBMED; 8215374.
RA   Jung E.D., Lao G., Irwin D., Barr B.K., Benjamin A., Wilson D.B.;
RT   "DNA sequences and expression in Streptomyces lividans of an exoglucanase
RT   gene and an endoglucanase gene from Thermomonospora fusca";
RL   Appl. Environ. Microbiol. 59(9):3032-3043(1993).
XX
RN   [5]
RP   1-3289
RA   Irwin D.;
RT   ;
RL   Submitted (26-JUL-1993) to the EMBL/GenBank/DDBJ databases.
RL   Biochemistry, Cornell University, 460 Biotechnology Bldg., Ithaca, NY
RL   14853, USA
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..3289
FT                   /organism="Thermobifida fusca"
FT                   /strain="YX"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:2021"
FT   protein_bind    104..117
FT                   /bound_moiety="regulatory protein"
FT                   /citation=[2]
FT                   /citation=[1]
FT   RBS             168..172
FT                   /note="complementary to the 3' end of the 16S RNA of S.
FT                   lividans and E. coli"
FT   sig_peptide     178..273
FT                   /gene="E1"
FT   CDS             178..3102
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="E1"
FT                   /product="beta-1,4-endoglucanase precursor"
FT                   /note="the cellulose binding domain includes residues
FT                   870-974"
FT                   /db_xref="GOA:Q08166"
FT                   /db_xref="HSSP:1K85"
FT                   /db_xref="InterPro:IPR001701"
FT                   /db_xref="InterPro:IPR001919"
FT                   /db_xref="InterPro:IPR003305"
FT                   /db_xref="InterPro:IPR003961"
FT                   /db_xref="InterPro:IPR004197"
FT                   /db_xref="InterPro:IPR008928"
FT                   /db_xref="InterPro:IPR008957"
FT                   /db_xref="InterPro:IPR008965"
FT                   /db_xref="InterPro:IPR008979"
FT                   /db_xref="InterPro:IPR012291"
FT                   /db_xref="InterPro:IPR012341"
FT                   /db_xref="InterPro:IPR013783"
FT                   /db_xref="InterPro:IPR014756"
FT                   /db_xref="InterPro:IPR018221"
FT                   /db_xref="UniProtKB/TrEMBL:Q08166"
FT                   /protein_id="AAC06387.1"
FT                   /translation="MLRRPRSRSPLVALTAATCRVALGGTAVPAQADEVNQIRNGDFSS
FT                   GTAPWWGTENIQLNVTDGMLCVDVPGGTVNPWDVIIGQDDIPLIEGESYAFSFTASSTV
FT                   PVSIRALVQEPVEPWTTQMDERALLGPEAETYEFVFTSNVDWDDAQVAFQIGGSDEPWT
FT                   FCLDDVALLGRAEPPVYEPDTGPRVRVNQVGYLPHGPKKATVVTDATSALTWELADADG
FT                   NVVASGQTKPHGADSSSGLNVHTVDFSSYTTKGSDYTLTVDGETSYPFDIDESVYEELR
FT                   VDALSFYYPQRSGIEILDSIAPGYGRPAGHIGVPPNQGDTDVPCAPGTCDYSLDVSGGW
FT                   YDAGDHGKYVVNGGISVHQIMSIYERSQLADTAQPDKLADSTLRLPETGNGVPDVLDEA
FT                   RWEMEFLLKMQVPEGEPLAGMAHHKIHDEQWTGLPLLPSADPQPRYLQPPSTAATLNLA
FT                   ATAAQCARVFEPFDEDFAAECLAAAETAWDAAKANPNIYAPAFGEGGGPYNDNNVTDEF
FT                   YWAAAELFLTTGKEEYRDAVTSSPLHTDDEEVFRDGAFDWGWTAALARLQLATIPNDLA
FT                   DRDRVRQSVVDAADMYLANVETSPWGLAYKPNNGVFVWGSNSAVLNNMVILAVAFDLTG
FT                   DTKYRDGVLEGMDYIFGRNALNQSYVTGYGDKDSRNQHSRWYAHQLDPRLPNPPKGTLA
FT                   GGPNSDSTTWDPVAQSKLTGCAPQMCYIDHIESWSTNELTINWNAPLSWIASFIADQDD
FT                   AGEPGGEEPGPGDDETPPSKPGNLKASDITATSATLTWDASTDNVGVVGYKVSLVRDGD
FT                   AEEVGTTAQTSYTLTGLSADQEYTVQVVAYDAAGNLSTPATVTFTTEKEDETPTPSASC
FT                   AVTYQTNDWPGGFTASVTLTNTGSTPWDSWELRFTFPSGQTVSHGWSANWQQSGSDVTA
FT                   TSLPWNGSVPPGGGSVNIGFNGTWGGSNTKPEKFTVNGAVCSIG"
FT   mat_peptide     274..3099
FT                   /gene="E1"
FT                   /product="beta-1,4-endoglucanase"
FT                   /EC_number="3.2.1.4"
FT   misc_feature    370..735
FT                   /gene="E1"
FT                   /note="encodes cellulose binding domain; family IV"
FT   misc_feature    1006..2427
FT                   /gene="E1"
FT                   /note="encodes catalytic domain; family 9"
FT   misc_feature    2782..3099
FT                   /gene="E1"
FT                   /note="encodes cellulose binding domain; family II"
XX
SQ   Sequence 3289 BP; 621 A; 1237 C; 961 G; 470 T; 0 other;
     ttttgttgtt acagggagga aagagcagcc ggaaagttct attccgagcg taactattga        60
     caccgctgag tgatcctgtt tttatgtcat aggtcacatg aaatgggagc gctcccatgg       120
     tgggcctccg ctgtgaggtc atcctcccag ttcgaatccc cctacggaag gacttccgtg       180
     cttaggagac ccagatctcg atcccccctt gtcgccctca ccgcggcgac ttgccgagtc       240
     gcgctcgggg gtacggcggt tcccgcccag gcagacgaag tcaaccagat tcgcaacggc       300
     gacttcagct ccggcaccgc accctggtgg ggaaccgaga acatccaact caacgtcacc       360
     gacgggatgc tgtgcgtcga cgtccccggc ggcaccgtca acccgtggga cgtgatcatc       420
     ggccaggacg acatccccct catcgaaggt gagtcctacg ccttctcctt cactgcctcc       480
     agcaccgtcc ccgtctccat ccgcgccctg gtgcaagagc ccgtggagcc gtggaccacc       540
     cagatggacg agcgtgccct gctcggcccc gaggcagaaa cctacgaatt cgtcttcacc       600
     tccaacgtcg actgggacga cgcccaagtc gccttccaga tcggcggctc cgacgaaccg       660
     tggaccttct gcctcgacga cgtcgccctg ctcggccgcg ccgaaccccc ggtctacgaa       720
     cccgacaccg gaccgcgggt ccgcgtcaac caggtcggct acctcccgca cggtcccaag       780
     aaggcgaccg tggtcaccga cgccaccagc gcgctcacct gggagcttgc cgacgccgac       840
     ggtaacgtgg tcgccagcgg ccagaccaag ccgcacggcg cggactccag ctccgggctc       900
     aacgtccaca ccgtcgactt cagctcctac accacgaagg gaagcgacta cacgctcacc       960
     gtcgacggtg aaaccagcta ccccttcgac atcgacgaaa gcgtctacga ggaactgcgc      1020
     gtcgacgcgc tgtcgttcta ctacccgcag cgcagcggca tcgagatcct cgactccatc      1080
     gcccccggct acggacgccc ggccggccac atcggcgtgc cccccaacca gggcgatacc      1140
     gacgtgccgt gcgcgcccgg cacctgcgac tactccctgg acgtctccgg cggctggtac      1200
     gacgcgggcg accacggcaa atacgtggtc aacggcggta tctcggtgca ccagatcatg      1260
     agcatctacg agcgctccca gctcgccgac accgcccagc ccgacaagct ggccgactcc      1320
     accctgcgcc tgcccgaaac cggcaacggc gtgcccgacg tgctcgacga agcacgctgg      1380
     gagatggagt tcctcctcaa gatgcaggtg cccgaaggcg aaccgctcgc cggcatggcg      1440
     caccacaaga tccacgacga acagtggacc gggctgccgc tgctgccctc cgctgacccg      1500
     cagccgcgct acctgcagcc gccgtccacc gcggccacgc tgaacctggc cgccaccgcc      1560
     gcccagtgcg ctcgcgtgtt cgaacccttc gacgaggatt tcgccgccga gtgcctggct      1620
     gccgcggaaa ccgcgtggga cgccgccaag gccaacccga acatctacgc gcctgccttc      1680
     ggtgaaggcg gcggcccgta caacgacaac aacgtcaccg acgagttcta ctgggccgcg      1740
     gccgaactgt tcctcaccac cggcaaggag gagtaccgcg acgcggtgac ctcgtcgccg      1800
     ctgcacaccg acgacgaaga ggtcttccgc gacggcgcct tcgactgggg atggactgct      1860
     gcgctggccc gcctccagct ggccacgatc cccaacgacc tcgccgaccg cgaccgggtg      1920
     cgccagtccg tggtcgatgc cgccgacatg tacctcgcca acgtcgagac cagcccgtgg      1980
     ggcctggcct acaagccgaa caacggcgtg ttcgtctggg gctccaacag cgctgtcctc      2040
     aacaacatgg tgatcctggc ggtcgccttc gacctcaccg gtgacaccaa ataccgcgac      2100
     ggcgtgctgg aaggcatgga ctacatcttc ggccgcaacg cgctgaacca gtcctacgtc      2160
     accggctacg gcgacaagga ctcccgcaac cagcacagcc gctggtacgc ccaccagctc      2220
     gacccccggt tgcccaaccc gcccaagggc acgctggccg gtggacccaa ctccgactcc      2280
     accacctggg acccggtggc ccagtccaag ctgaccgggt gcgcccccca gatgtgctac      2340
     atcgaccaca tcgagtcgtg gtccaccaac gagctgacca tcaactggaa cgcccccctg      2400
     tcgtggatcg cgtccttcat cgccgaccag gacgacgccg gcgagcccgg cggagaagag      2460
     cccggaccgg gcgacgacga gaccccgccg agcaagcctg ggaacctgaa ggccagcgac      2520
     atcaccgcga ccagcgccac cctgacctgg gacgcctcca ccgacaacgt cggagtggtc      2580
     ggctacaagg tctccctggt ccgcgacggt gacgctgaag aggtgggcac caccgcgcag      2640
     accagctaca cgctcaccgg gctgagcgcg gaccaggagt acaccgtcca ggtggtcgcc      2700
     tacgacgcgg caggcaacct ctccacgcca gccaccgtca ccttcaccac cgagaaggag      2760
     gacgagactc ccacgcccag cgcctcctgc gcggtgacgt accagaccaa cgactggccg      2820
     ggcggcttca ccgcctcggt gacgctgacc aacaccggca gcaccccgtg ggactcctgg      2880
     gaactgcgct tcaccttccc gtcgggacag actgtcagcc acggctggag cgccaactgg      2940
     cagcagagcg gcagtgacgt gaccgccacc tccttgccgt ggaacggatc agttccgccg      3000
     ggcggcggct cagtcaacat cggcttcaac ggaacctggg gcggttcgaa caccaaacct      3060
     gagaagttca ccgtcaacgg cgcggtctgc tccatcggct gaacctcgcc ctggattcgg      3120
     atgtaagccg ccgtggcccc tgtcatcggc gggggccaca cccggcacca tccccgcaca      3180
     ccccctgtgc ggggatggtg ctcccctcat tggtctggta agacgaggaa ggcgccaacg      3240
     tgacctccga gagccccgtg cgcgcggccc cccgtgccgg acggatgac                  3289
//


  
spacer
spacer