spacer
spacer

EBI Dbfetch

ID   AF144563; SV 1; linear; genomic DNA; STD; PRO; 5971 BP.
XX
AC   AF144563;
XX
DT   28-JUN-1999 (Rel. 60, Created)
DT   15-APR-2005 (Rel. 83, Last updated, Version 2)
XX
DE   Thermobifida fusca beta-1,4-exocellulase E6 precursor (celF) gene, complete
DE   cds; and unknown genes.
XX
KW   .
XX
OS   Thermobifida fusca
OC   Bacteria; Actinobacteria; Actinobacteridae; Actinomycetales;
OC   Streptosporangineae; Nocardiopsaceae; Thermobifida.
XX
RN   [1]
RP   1-5971
RA   Irwin D.I., Zhang S., Wilson D.B.;
RT   "Characterization of a Thermomonospora fusca family 48 exocellulase E6";
RL   Unpublished.
XX
RN   [2]
RP   1-5971
RA   Irwin D.I., Zhang S., Wilson D.B.;
RT   ;
RL   Submitted (20-APR-1999) to the EMBL/GenBank/DDBJ databases.
RL   Biochemistry, Cornell University, 460 Biotechnology, Ithaca, NY 14853, USA
XX
DR   StrainInfo; 501250; YX.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..5971
FT                   /organism="Thermobifida fusca"
FT                   /strain="YX"
FT                   /mol_type="genomic DNA"
FT                   /clone="pE6-91"
FT                   /db_xref="taxon:2021"
FT   protein_bind    join(540..551,633..646)
FT                   /bound_moiety="CelR transcriptional regulator"
FT                   /note="CelR transcriptional regulator encoded by GenBank
FT                   Accession Number AF086819"
FT   RBS             880..884
FT                   /gene="celF"
FT   CDS             897..3851
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="celF"
FT                   /product="beta-1,4-exocellulase E6 precursor"
FT                   /note="family 48 exocellulase"
FT                   /db_xref="GOA:Q9XCD4"
FT                   /db_xref="HSSP:1FAE"
FT                   /db_xref="InterPro:IPR000556"
FT                   /db_xref="InterPro:IPR000601"
FT                   /db_xref="InterPro:IPR001919"
FT                   /db_xref="InterPro:IPR008928"
FT                   /db_xref="InterPro:IPR008965"
FT                   /db_xref="InterPro:IPR012291"
FT                   /db_xref="InterPro:IPR012341"
FT                   /db_xref="UniProtKB/TrEMBL:Q9XCD4"
FT                   /protein_id="AAD39947.1"
FT                   /translation="MRSLLSPRRWRTLASGALAAALAAAVLSPGVAHAAVACSVDYDDS
FT                   NDWGSGFVAEVKVTNEGSDPIQNWQVGWTFPGNQQITNGWNGVFSQSGANVTVRYPDWN
FT                   PNIAPGATISFGFQGTYSGSNDAPTSFTVNGVTCSGSQPANLPPDVTLTSPANNSTFLV
FT                   NDPIELTAVASDPDGSIDRVEFAADNTVIGIDTTSPYSFTWTDAAAGSYSVTAIAYDDQ
FT                   GARTVSAPIAIRVLDRAAVIASPPTVRVPQGGTADFEVRLSNQPSGNVTVTVARTSGSS
FT                   DLTVSSGSQLQFTSSNWNQPQKVTIASADNGGNLAEAVFTVSAPGHDSAEVTVREIDPN
FT                   TSSYDQAFLEQYEKIKDPASGYFREFNGLLVPYHSVETMIVEAPDHGHQTTSEAFSYYL
FT                   WLEAYYGRVTGDWKPLHDAWESMETFIIPGTKDQPTNSAYNPNSPATYIPEQPNADGYP
FT                   SPLMNNVPVGQDPLAQELSSTYGTNEIYGMHWLLDVDNVYGFGFCGDGTDDAPAYINTY
FT                   QRGARESVWETIPHPSCDDFTHGGPNGYLDLFTDDQNYAKQWRYTNAPDADARAVQVMF
FT                   WAHEWAKEQGKENEIAGLMDKASKMGDYLRYAMFDKYFKKIGNCVGATSCPGGQGKDSA
FT                   HYLLSWYYSWGGSLDTSSAWAWRIGSSSSHQGYQNVLAAYALSQVPELQPDSPTGVQDW
FT                   ATSFDRQLEFLQWLQSAEGGIAGGATNSWKGSYDTPPTGLSQFYGMYYDWQPVWNDPPS
FT                   NNWFGFQVWNMERVAQLYYVTGDARAEAILDKWVPWAIQHTDVDADNGGQNFQVPSDLE
FT                   WSGQPDTWTGTYTGNPNLHVQVVSYSQDVGVTAALAKTLMYYAKRSGDTTALATAEGLL
FT                   DALLAHRDSIGIATPEQPSWDRLDDPWDGSEGLYVPPGWSGTMPNGDRIEPGATFLSIR
FT                   SFYKNDPLWPQVEAHLNDPQNVPAPIVERHRFWAQVEIATAFAAHDELFGAGAP"
FT   sig_peptide     897..998
FT                   /gene="celF"
FT   mat_peptide     999..3848
FT                   /gene="celF"
FT                   /product="beta-1,4-exocellulase E6"
FT   misc_feature    999..1313
FT                   /gene="celF"
FT                   /note="Region: family II cellulose binding domain"
FT   misc_feature    1338..1604
FT                   /gene="celF"
FT                   /note="Region: FNIII-like domain"
FT   misc_feature    1923..3848
FT                   /gene="celF"
FT                   /note="catalytic domain; Region: family 48 glycosyl
FT                   hydrolase"
FT   terminator      3931..3968
FT                   /gene="celF"
FT                   /note="putative"
FT   CDS             4044..4430
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /product="unknown"
FT                   /note="Orf 2"
FT                   /db_xref="UniProtKB/TrEMBL:Q9XCD3"
FT                   /protein_id="AAD39948.1"
FT                   /translation="MPLEPRLDIGADRTHPQPAGPHIIQRLPHQPAAHPLPLERAVHPS
FT                   VEEDHPITGNRLVFRETGDFLPGTDLVPVLCRIVDHRDIHGVPLPFPRRRRISHPAACP
FT                   GLSSSPGQPEHAPARRTPATALAW"
FT   CDS             4473..5480
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /product="unknown"
FT                   /note="Orf 3; similar to SuA5 superfamily related proteins"
FT                   /db_xref="HSSP:1JCU"
FT                   /db_xref="InterPro:IPR004388"
FT                   /db_xref="InterPro:IPR005145"
FT                   /db_xref="InterPro:IPR006070"
FT                   /db_xref="InterPro:IPR010923"
FT                   /db_xref="InterPro:IPR017945"
FT                   /db_xref="UniProtKB/TrEMBL:Q9XCD2"
FT                   /protein_id="AAD39949.1"
FT                   /translation="MGDGGTVRHPSVRAVSPAALDEAVRVLRAGGLVAFPTETVYGLGA
FT                   DAANPAAVARIFAAKGRPADHPLIVHVASAESARDWAATFPPLARTLADAFWPGPLTLI
FT                   LPRSAQVPDAVTGGRATVGLRVPDQPVALALLERFGGGIAAPSANRFGRVSPTTAAHVA
FT                   ADLGDRVDLVLDGGPCTVGVESTIVEVADGRLTVLRTGGITPDDLAAVTGAPVDTTPTG
FT                   PARAPGMLAAHYAPAARVVLAEAAEAADTVAQWVEKGHRVAVLAETATVPENLPEGVVV
FT                   LPSPASARDYARVLYQRLRDVDAAGADVVVAIPPEPAGIGLAVRDRLLRASRAH"
FT   CDS             5654..>5971
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /product="unknown"
FT                   /note="Orf 4"
FT                   /db_xref="InterPro:IPR015035"
FT                   /db_xref="InterPro:IPR015057"
FT                   /db_xref="UniProtKB/TrEMBL:Q9XCD1"
FT                   /protein_id="AAD39950.1"
FT                   /translation="MLKVQGDNGGPPYWVRWEDEGRETLVYPGPDARIEPRHPVPQARQ
FT                   EHTEARQPQPGQSLKRIQIDVAVSEVHENGSVRTLAEAQLPSTKWNLRGHGEARKHPTD
FT                   AD"
XX
SQ   Sequence 5971 BP; 1023 A; 2244 C; 1836 G; 868 T; 0 other;
     gcggccgcca ggtggggcgg ccgagtccga cggtggcgag gacttcgacc ccgtggtcgt        60
     cagcgaagca tgcttcgctg acgttggcgg cggtgagcag gcctaccccg gtgccggtca       120
     tcccgaagtg ggtggcgagt tcttcgaggt ggttgtccgg gtcggtccgc cggtagtcgc       180
     cgtcgacttg ggcgttgatg acgtagtccc gtggtccgag gccgccgccg agcacgctgg       240
     aggcggccat gcgccagccg gggccgcact gccagagcac tgcggcaagg gcgcggccgt       300
     tgtcgcgccg ccagcgcagg tgcgcggtga ggagggtgcc gtcgccgatc gtctccgtgt       360
     ccactccgct ctccagggtc ggttccgcgg ggccacttta acgagtccgc atcgggcggc       420
     agcggggtca tgcttccatc tgggcgaatg ccacgcggag tactgcgagt ctcacgcttc       480
     gtcccattgt ctttttacgg agggtttaca cggcacatcc ggaacgttac cctcctactg       540
     ggagcgctcc cgtgactcag gccacaggcc cccttcccgg ggcgagcccc caccaccccg       600
     ggaaggccac tgcgacccct gagctcaatt catgggagcg ctcccatgcc agtgctcccg       660
     gcagaaagga gagaaccgga acccggtacc gctggtttca ctgatccccc tgttttcacc       720
     cggcatcgcc ccgacaccag cgatgccacc cccgcggcgg ctgcagtcca cacccggcac       780
     gccgcacacc cctctcctgt gtgacacgcg gttccgaacg gccttgccgg ttctcggtat       840
     gccgacgaac ggcacggctg ctccggaacc ggaagatccg gaggttattt ccaagcatga       900
     gatcgttact gtctccccgg cgctggcgca cgctggcctc gggggcgctc gcagcggccc       960
     tggccgccgc tgtactctcc cccggcgtcg cgcacgccgc cgtcgcctgc tcggtggact      1020
     acgacgactc caacgactgg ggtagcgggt tcgtcgccga agtcaaggtg accaacgaag      1080
     gcagcgaccc catccagaac tggcaagtag gctggacctt ccccggtaac cagcagatca      1140
     ccaacggctg gaacggcgtg ttcagccaga gcggcgccaa cgtcaccgtc cgctacccgg      1200
     actggaaccc caatatcgcc cccggagcca ccatctcctt cggcttccag ggcacctaca      1260
     gcggctccaa cgacgccccg accagcttca ccgtcaacgg cgtcacctgc agcggatccc      1320
     agcccgccaa cctgccgccc gatgtcaccc tgacatcccc ggccaacaac tcgaccttcc      1380
     tggtcaacga cccgatcgag ctgaccgcgg tcgcctccga ccccgacggc tcgatcgacc      1440
     gggtggaatt cgccgccgac aacaccgtca tcggcatcga caccacctcc ccctacagct      1500
     tcacctggac ggacgctgcc gccggctcct actcggtgac cgcgatcgcc tacgacgacc      1560
     agggagccag gaccgtctcc gctcccatcg ccatccgagt gctggaccgg gccgccgtca      1620
     tcgcctcacc gcccaccgtc cgcgtgccgc agggcggcac cgccgacttc gaggtgcggc      1680
     tgtccaacca gccctccggc aacgtcacgg tcaccgtggc gcgcacgtcg ggcagctccg      1740
     acctgaccgt ctccagcggc tcccaactcc agttcacctc cagcaactgg aaccagccgc      1800
     agaaggtgac catcgcctcc gctgacaacg gcggaaacct ggccgaggcg gtcttcaccg      1860
     tcagcgcccc cggccacgac tcggccgagg tgacggtccg ggagatcgac ccgaacacca      1920
     gctcctacga ccaggccttc ctggagcagt acgagaagat caaggacccc gccagcggct      1980
     acttccgcga attcaacggg ctcctggtcc cctaccactc ggtggagacc atgatcgtcg      2040
     aggctccgga ccacggccac cagaccacgt ccgaggcgtt cagctactac ctgtggctgg      2100
     aggcgtacta cggccgggtc accggtgact ggaagccgct ccacgacgcc tgggagtcga      2160
     tggagacctt catcatcccc ggcaccaagg accagccgac caactccgcc tacaacccga      2220
     actccccggc gacctacatc cccgagcagc ccaacgctga cggctacccg tcgcctctca      2280
     tgaacaacgt cccggtgggt caagacccgc tcgcccagga gctgagctcc acctacggga      2340
     ccaacgagat ctacggcatg cactggctgc tcgacgtgga caacgtctac ggcttcgggt      2400
     tctgcggcga cggcaccgac gacgcccccg cctacatcaa cacctaccag cgtggtgcgc      2460
     gcgagtcggt gtgggagacc attccgcacc cgtcctgcga cgacttcacg cacggcggcc      2520
     ccaacggcta cctggacctg ttcaccgacg accagaacta cgccaagcag tggcgctaca      2580
     ccaacgcccc cgacgctgac gcgcgggccg tccaggtgat gttctgggcg cacgaatggg      2640
     ccaaggagca gggcaaggag aacgagatcg cgggcctgat ggacaaggcg tccaagatgg      2700
     gcgactacct ccggtacgcg atgttcgaca agtacttcaa gaagatcggc aactgcgtcg      2760
     gcgccacctc ctgcccgggt ggccaaggca aggacagcgc gcactacctg ctgtcctggt      2820
     actactcctg gggcggctcg ctcgacacct cctctgcgtg ggcgtggcgt atcggctcca      2880
     gctcctcgca ccagggctac cagaacgtgc tcgctgccta cgcgctctcg caggtgcccg      2940
     aactgcagcc tgactccccg accggtgtcc aggactgggc caccagcttc gaccgccagt      3000
     tggagttcct ccagtggctg cagtccgctg aaggtggtat cgccggtggc gccaccaaca      3060
     gctggaaggg aagctacgac accccgccga ccggcctgtc gcagttctac ggcatgtact      3120
     acgactggca gccggtctgg aacgacccgc cgtccaacaa ctggttcggc ttccaggtct      3180
     ggaacatgga gcgcgtcgcc cagctctact acgtgaccgg cgacgcccgg gccgaggcca      3240
     tcctcgacaa gtgggtgccg tgggccatcc agcacaccga cgtggacgcc gacaacggcg      3300
     gccagaactt ccaggtcccc tccgacctgg agtggtcggg ccagcctgac acctggaccg      3360
     gcacctacac cggcaacccg aacctgcacg tccaggtcgt ctcctacagc caggacgtcg      3420
     gtgtgaccgc cgctctggcc aagaccctga tgtactacgc gaagcgttcg ggcgacacca      3480
     ccgccctcgc caccgcggag ggtctgctgg acgccctgct ggcccaccgg gacagcatcg      3540
     gtatcgccac ccccgagcag ccgagctggg accgtctgga cgacccgtgg gacggctccg      3600
     agggcctgta cgtgccgccg ggctggtcgg gcaccatgcc caacggtgac cgcatcgagc      3660
     cgggcgcgac cttcctgtcc atccgctcgt tctacaagaa cgacccgctg tggccgcagg      3720
     tcgaggcaca cctgaacgac ccgcagaacg tcccggcgcc gatcgtggag cgccaccgct      3780
     tctgggctca ggtggaaatc gcgaccgcgt tcgcagccca cgacgaactg ttcggggccg      3840
     gagctccctg atcctgaaca gtccgtctcc tgaccggcgg tccgtggcgg cgtagtgctc      3900
     ccccgccgcg gaccgccctc caccaccccc ctggggccgt ccggcgcacc aacaccggac      3960
     ggccccagac tcctttcacg gcctgctact cggcccgacg ccccgcccta tccagcccga      4020
     tcaaccaggt cagcgtagtc cgggtgccgc tcgagccacg ccttgacata ggggcagacc      4080
     gcacgcaccc gcagcccgcg ggcccgcaca tcatccaacg cctcccgcac cagccggctg      4140
     cccatcccct tcccctggaa agagccgtcc acccgagtgt ggaagaagac cacccgatca      4200
     ccggcaacag gctggtattc cgtgaaaccg gcgattttct ccccggcacg gatctcgtac      4260
     cggtgctgtg ccggattgtc gatcaccgtg acatccatgg cgttcccctc ccgttcccca      4320
     ggcggcggcg catctctcat ccggcggcct gcccaggact gtcctcttcc ccaggacagc      4380
     ctgagcacgc gcccgcacgg cgaaccccag ccacagccct agcatggtga acggccacgg      4440
     tcgcagggcg accacgacac cgaggaggag tgatgggcga cggcggcaca gtacgccacc      4500
     cttccgtacg tgccgtatca ccggcagcgt tggacgaggc ggtacgcgtc ctgcgggcag      4560
     gcggcctcgt agctttcccc accgaaaccg tctacggcct aggcgcggac gccgcgaacc      4620
     cggccgcggt agcgcgcatt ttcgccgcca aaggccgtcc cgctgaccac cccctgatcg      4680
     tgcacgtcgc ttccgcggag agcgcgcgcg actgggctgc tacctttcct cctctcgccc      4740
     gcacgctggc ggacgcgttc tggcccggcc cgctgaccct catcctcccc cgctccgccc      4800
     aagtgccgga cgcagtgacc ggtggacgcg ccacggtagg gctgcgggtc cccgaccagc      4860
     cggtcgcgct cgcactcctg gaacgcttcg gcggcggaat cgccgcacct tccgcgaacc      4920
     ggttcggccg agtgagcccg accacggccg cgcacgttgc cgctgacctc ggggaccggg      4980
     tcgacctggt gttggacggc ggaccgtgca cggtcggcgt ggaatcgacg atcgtcgaag      5040
     tggccgacgg ccggctcacc gtgctccgca ccggaggcat cacccccgac gaccttgccg      5100
     cggtcaccgg agcccccgtc gacaccaccc ccaccggacc ggcccgggca cccggcatgc      5160
     tcgccgccca ctacgcaccc gccgcacggg tcgtgctagc cgaagcagca gaagccgcgg      5220
     acacggtcgc ccagtgggtg gagaaaggac accgggtggc tgtgctggcg gagaccgcta      5280
     ccgtgcccga aaacctgccg gaaggcgtgg tggtgctacc gtcccctgct tcggctcggg      5340
     actatgcccg cgtgctgtac cagcggctgc gggacgtgga cgcggcggga gccgacgtgg      5400
     tcgtcgcgat cccccccgaa cccgcgggga tcggcttggc ggtacgggac cggctgctgc      5460
     gcgcatcccg ggcgcactga cctctccccc tggggcaagg gatttttccg catagacgag      5520
     cccgtttccg ggatctcttt ctgtggagac agaaagagag caccgacacc agggagggcc      5580
     gatgaaagct caagccggag accggatcgt tgtggaacgc ccccgcgatg acctgcccgc      5640
     gcgcaaaggc gtcgtgctca aagtgcaggg ggacaacggg ggcccgccct actgggtgcg      5700
     gtgggaggac gaaggccggg aaaccctcgt ctacccggga ccggacgccc gtatcgagcc      5760
     ccgccacccc gtcccccaag cccgccagga gcatacggag gcccgtcaac cgcagccggg      5820
     acagtccctg aaacggatac agatcgacgt cgcagtgtcg gaggtgcacg agaacggctc      5880
     cgtgcgcacc ctcgccgaag cgcaactgcc gtccaccaag tggaacctgc gcggccacgg      5940
     agaagcacgc aagcatccca ccgacgccga t                                     5971
//


  
spacer
spacer