spacer
spacer

EBI Dbfetch

ID   X02425; SV 1; linear; genomic DNA; STD; FUN; 4235 BP.
XX
AC   X02425;
XX
DT   02-JUL-1986 (Rel. 09, Created)
DT   23-OCT-2008 (Rel. 97, Last updated, Version 7)
XX
DE   Hansenula polymorpha MOX gene for methanol oxidase
XX
KW   inverted repeat; methanol oxidase; unidentified reading frame.
XX
OS   Pichia angusta
OC   Eukaryota; Fungi; Dikarya; Ascomycota; Saccharomycotina; Saccharomycetes;
OC   Saccharomycetales; Saccharomycetaceae; Pichia.
XX
RN   [1]
RP   1-4235
RX   DOI; 10.1093/nar/13.9.3063
RX   PUBMED; 2582370.
RA   Ledeboer A.M., Edens L., Maat J., Visser C., Bos J.W., Verrips C.T.;
RT   "Molecular cloning and characterization of a gene coding for methanol
RT   oxidase in Hansenula polymorpha";
RL   Nucleic Acids Res. 13(9):3063-3082(1985).
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..4235
FT                   /organism="Pichia angusta"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:4905"
FT   CDS             3..509
FT                   /note="unidentified reading frame (aa 1-168)"
FT                   /db_xref="UniProtKB/TrEMBL:Q00920"
FT                   /protein_id="CAA26277.1"
FT                   /translation="MEEPRHLQQLGRVENEPDVVERGGHKPAFADGAALVLDVEGLFQR
FT                   QSREEAANARNQLHEPRQFGGAGFGHFNVVVDEEFEVVEDFRVAAFCLRVYHEVVHCRD
FT                   AVALHRVQDERRGQQALDPFYEAISTVFLECVLHSVATGHLETGLAVLDAPINCCRMHP
FT                   CTASF"
FT   misc_feature    458..490
FT                   /note="pot. stem-loop structure"
FT   repeat_region   458..464
FT                   /note="inverted repeat A"
FT   repeat_region   484..490
FT                   /note="inverted repeat A'"
FT   misc_feature    499..542
FT                   /note="pot. stem-loop structure"
FT   repeat_region   499..506
FT                   /note="inverted repeat B"
FT   repeat_region   535..542
FT                   /note="inverted repeat B'"
FT   misc_feature    851..857
FT                   /note="pot. transcription initiation region"
FT   promoter        915..923
FT                   /note="put. TATA box (MOX gene)"
FT   promoter        962..971
FT                   /note="pot. promoter sequence"
FT   CDS             972..2966
FT                   /note="methanol oxidase (aa 1-664)"
FT                   /db_xref="GOA:P04841"
FT                   /db_xref="InterPro:IPR000172"
FT                   /db_xref="InterPro:IPR007867"
FT                   /db_xref="InterPro:IPR012132"
FT                   /db_xref="UniProtKB/Swiss-Prot:P04841"
FT                   /protein_id="CAA26278.1"
FT                   /translation="MAIPDEFDIIVVGGGSTGCCIAGRLANLDDQNLTVALIEGGENNI
FT                   NNPWVYLPGVYPRNMRLDSKTATFYSSRPSKALNGRRAIVPCANILGGGSSINFLMYTR
FT                   ASASDYDDWESEGWSTDELLPLIKKIETYQRPCNNRDLHGFDGPIKVSFGNYTYPTCQD
FT                   FLRAAESQGIPVVDDLEDFKTSHGAEHWLKWINRDLGRRSDSAHAYVHPTMRNKQSLFL
FT                   ITSTKCDKVIIEDGKAVAVRTVPMKPLNPKKPVSRTFRARKQIVISCGTISSPLVLQRS
FT                   GIGAAHHLRSVGVKPIVDLPGVGENFQDHYCFFTPYYVKPDVPTFDDFVRGDPVAQKAA
FT                   FDQWYSNKDGPLTTNGIEAGVKIRPTEEELATADEDFRRGYAEYFENKPDKPLMHYSVI
FT                   SGFFGDHTKIPNGKFMTMFHFLEYPFSRGFVRITSANPYDAPDFDPGFLNDERDLWPMV
FT                   WAYKKSRETARRMESFAGEVTSHHPLFKVDSPARARDLDLETCSAYAGPKHLTANLYHG
FT                   SWTVPIDKPTPKNDFHVTSNQVQLHSDIEYTEEDDEAIVNYIKEHTETTWHCLGTCSMA
FT                   PREGSKIAPKGGVLDARLNVYGVQNLKVADLSVCPDNVGCNTYSTALTIGEKAATLVAE
FT                   DLGYSGSDLDMTIPNFRLGTYEETGLARF"
FT   CDS             complement(1341..>2675)
FT                   /note="unidentified reading frame (aa 1-444)"
FT                   /db_xref="UniProtKB/TrEMBL:Q00921"
FT                   /protein_id="CAA26279.1"
FT                   /translation="VPSGLGVFLNVVDDGLVVLLGVLDVGVQLDLVGGHVEIVLRRWLV
FT                   DRNGPRAVVQVGSEVLRTGICTACLEVQVSGSGWRVNLEQWVVRGDLSCKALHSSGRLS
FT                   GLLVCPDHRPQVSFVIEEAGIEVRSVVWVCRGDSNKSSGEWILQEVEHGHELAVRNLGV
FT                   VSKEAGDDRVVHQRLVWLVLEVLCVAASEVLVRGSQLLFGRSDLDSGFNTVGGQWTVLV
FT                   GVPLVESGLLGNWVAPDKVVERRNVRLDVVWSEETVVVLEILTHTWQVDDWLDPHGSQV
FT                   VSCTNTRSLEHQRRRDGSAGDHNLLSGSEGSGHRLLRVQRLHWHCSHGHSLAVLDDHLV
FT                   TLGGGDEEQALLVSHSWVDVGVRRIRSSAQVSVNPLQPVLCTMRCLEVLQVVHNRNSLR
FT                   LCCSQEVLARRIRVVSKGNLDWAVKAVQISVVARTLVSFDFFDQR"
FT   misc_signal     3081..3100
FT                   /note="pot. stem loop structure; pot. transcription
FT                   terminator"
FT   repeat_region   3081..3088
FT                   /note="inverted repeat C"
FT   repeat_region   3093..3100
FT                   /note="inverted repeat C'"
FT   misc_feature    3106..3109
FT                   /note="T stretch"
FT   CDS             3134..3886
FT                   /note="unidentified reading frame (aa 1-230)"
FT                   /db_xref="GOA:P09575"
FT                   /db_xref="InterPro:IPR000991"
FT                   /db_xref="InterPro:IPR001317"
FT                   /db_xref="InterPro:IPR001468"
FT                   /db_xref="InterPro:IPR006220"
FT                   /db_xref="InterPro:IPR006221"
FT                   /db_xref="InterPro:IPR011060"
FT                   /db_xref="InterPro:IPR011702"
FT                   /db_xref="InterPro:IPR013785"
FT                   /db_xref="InterPro:IPR013798"
FT                   /db_xref="InterPro:IPR017926"
FT                   /db_xref="UniProtKB/Swiss-Prot:P09575"
FT                   /protein_id="CAA26280.1"
FT                   /translation="MPAASKNVVMIDNYDSFTWNLYEYLCQEGANVEVFRNDQITIPEI
FT                   EQLKPDVVVISPGPGHPRTDSGISRDVISHFKGKIPVFGVCMGQQCIFEEFGGDVEYAG
FT                   EIVHGKTSTVKHDNKGMFKNVPQDVAVTRYHSLAGTLKSLPDCLEITARTDNGIIMGVR
FT                   HKKYTIEGVQFHPESILTEEGHLMIQNILNVSGGYWEENANGAAQRKESILEKIYAQRR
FT                   KDYEFEMNRPGRRFADLELYLSMGLHRR"
XX
SQ   Sequence 4235 BP; 1071 A; 1115 C; 1113 G; 936 T; 0 other;
     gaatggaaga accgcgacat ctccaacagc tgggccgtgt tgagaatgag ccggacgtcg        60
     ttgaacgagg gggccacaag ccggcgtttg ctgatggcgc ggcgctcgtc ctcgatgtag       120
     aaggcctttt ccagaggcag tctcgtgaag aagctgccaa cgctcggaac cagctgcacg       180
     agccgagaca attcgggggt gccggctttg gtcatttcaa tgttgtcgtc gatgaggagt       240
     tcgaggtcgt ggaagatttc cgcgtagcgg cgttttgcct cagagtttac catgaggtcg       300
     tccactgcag agatgccgtt gctcttcacc gcgtacagga cgaacggcgt ggccagcagg       360
     cccttgatcc attctatgag gccatctcga cggtgttcct tgagtgcgta ctccactctg       420
     tagcgactgg acatctcgag actgggcttg ctgtgctgga tgcaccaatt aattgttgcc       480
     gcatgcatcc ttgcaccgca agtttttaaa acccactcgc tttagccgtc gcgtaaaact       540
     tgtgaatctg gcaactgagg gggttctgca gccgcaaccg aacttttcgc ttcgaggacg       600
     cagctggatg gtgtcatgtg aggctctgtt tgctggcgta gcctacaacg tgaccttgcc       660
     taaccggacg gcgctaccca ctgctgtctg tgcctgctac cagaaaatca ccagagcagc       720
     agagggccga tgtggcaact ggtggggtgt cggacaggct gtttctccac agtgcaaatg       780
     cgggtgaacc ggccagaaag taaattctta tgctaccgtg cagcgactcc gacatcccca       840
     gtttttgccc tacttgatca cagatggggt cagcgctgcc gctaagtgta cccaaccgtc       900
     cccacacggt ccatctataa atactgctgc cagtgcacgg tggtgacatc aatctaaagt       960
     acaaaaacaa aatggccatt cctgacgaat tcgatatcat tgttgttggt ggaggttcca      1020
     ccggctgctg cattgcgggc agactcgcaa acctcgacga ccaaaacctc acagttgccc      1080
     tgatcgaggg tggtgagaac aacatcaaca acccttgggt ctaccttccc ggagtgtatc      1140
     ctagaaacat gagactcgac tccaagacgg ccaccttcta ctcgtccaga ccatcgaagg      1200
     ctctgaacgg cagaagagcg atcgttcctt gcgccaacat ccttggaggc ggctcgtcga      1260
     tcaactttct gatgtacacc agagcctctg cttccgacta cgacgactgg gagtccgagg      1320
     gatggagcac cgacgagttg ctacctctga tcaaaaaaat cgaaacttac cagcgtcctt      1380
     gcaacaacag agatctgcac ggctttgacg gcccaatcaa ggtttccttt ggaaactaca      1440
     cgtatcctac gtgccaggac ttcctgagag cagcagagtc gcagggaatt cctgttgtgg      1500
     acgacctgga ggacttcaag acatcgcatg gtgcagagca ctggctgaag tggattaaca      1560
     gagacctggg cagaagatcg gattctgcgc acgcctacgt ccacccaact atgagaaaca      1620
     agcagagcct gttcctcatc acctccacca agtgtgacaa ggtgatcatc gaggacggca      1680
     aggctgtggc cgtgagaaca gtgccaatga agcctctgaa ccctaagaag cctgtgtcca      1740
     gaaccttcag agccagaaag cagattgtga tctcctgcgg aaccatctcg tctcctctgg      1800
     tgctccagag atctggtatt ggtgcagctc accacttgag atccgtgggg gtcaagccaa      1860
     tcgtcgacct gccaggtgtg ggtgagaatt tccaggacca ctactgtttc ttcactccat      1920
     actacgtcaa gcctgacgtt cctacgttcg acgactttgt caggggcgac ccagttgccc      1980
     agaaggccgc tttcgaccag tggtactcca acaaggacgg tccattgacc accaacggta      2040
     ttgaagccgg agtcaagatc agacctaccg aagaggagct ggctaccgcg gacgaggact      2100
     tcagacgcgg ctacgcagag tacttcgaga acaagccaga caagcctctg atgcactact      2160
     ctgtcatctc cggcttcttt ggagaccaca ccaagattcc taacggcaag ttcatgacca      2220
     tgttccactt cctggagtat ccattctcca gaggatttgt tagaatcacc tcggcaaacc      2280
     catacgacgc tcctgacttc gatcccggct tcctcaatga cgaaagagac ctgtggccta      2340
     tggtctgggc atacaagaag tccagagaga cggccagaag aatggagagc tttgcaggag      2400
     aggtcacctc gcaccaccca ttgttcaagg ttgactcgcc agccagagcc agagacctgg      2460
     acctcgagac atgcagtgca tatgccggtc ctaagcacct cactgccaac ctgtaccacg      2520
     gctcgtggac cgttcctatc gacaagccaa cgcctaagaa cgatttccac gtgacctcca      2580
     accaagtcca actgcactcc gacatcgagt acaccgagga ggacgacgag gccatcgtca      2640
     actacattaa ggaacacacc gagaccactt ggcactgtct gggtacctgc tcgatggccc      2700
     caagagaggg tagtaagatt gctcctaagg gaggtgtctt ggacgccaga ctgaacgttt      2760
     acggagtcca gaacctcaag gttgcggacc tttctgtttg tcccgacaac gttggatgca      2820
     acacctactc tactgcattg accatcggtg agaaggctgc cactcttgtt gctgaagatc      2880
     ttggctactc aggctccgac ctggacatga cgattccaaa cttcagactc ggaacttacg      2940
     aggagaccgg acttgccaga ttctaaggag acgtggaagg acataccgct tttgagaagc      3000
     gtgtttgaaa atagttcttt ttctggttta tatcgtttat gaagtgatga gatgaaaagc      3060
     tgaaatagcg agtataggaa aatttaatga aaattaaatt aaatattttc ttaggctatt      3120
     agtcaccttc aaaatgccgg ccgcttctaa gaacgttgtc atgatcgaca actacgactc      3180
     gtttacctgg aacctgtacg agtacctgtg tcaggaggga gccaatgtcg aggttttcag      3240
     gaacgatcag atcaccattc cggagattga gcagctcaag ccggacgttg tggtgatatc      3300
     ccctggtcct ggccatccaa gaacagactc gggaatatct cgcgacgtga tcagccattt      3360
     taaaggcaag attcctgtct ttggtgtctg tatgggccag cagtgtatct tcgaggagtt      3420
     tggcggagac gtcgagtatg cgggcgagat tgtccatgga aaaacgtcca ctgttaagca      3480
     cgacaacaag ggaatgttca aaaacgttcc gcaagatgtt gctgtcacca gataccactc      3540
     gctggccgga acgctcaagt cgcttccgga ctgtctagag atcactgctc gcacagacaa      3600
     cgggatcatt atgggtgtga gacacaagaa gtacaccatc gagggcgtcc agtttcatcc      3660
     agagagcatt ctgaccgagg agggccatct gatgatccag aatatcctca acgtttccgg      3720
     tggttactgg gaggaaaatg ccaacggcgc ggctcagaga aaggaaagca tattggagaa      3780
     aatatacgcg cagagacgaa aagactacga gtttgagatg aacagaccgg ggcgcagatt      3840
     tgctgatcta gaactgtact tgtccatggg actgcaccgc cgctaatcaa tttttacgac      3900
     agattggagc agaacatcag cgccggcaag gttgcaattc tcagcgaaat caagagagcg      3960
     tcgccttcta aaggcgtcat cgacggagac gctaacgctg ccaaacaggc cctcaactac      4020
     gccaaggctg gagttgccac aatttctgtt ttgaccgagc caacctggtt taaaggaaat      4080
     atccaggacc tggaggtggc cagaaaagcc attgactctg tggccaatag accgtgtatt      4140
     ttgcggaagg agtttatctt caacaagtac caaattctag aggcccgact ggcgggagca      4200
     gacacggttc tgctgattgt caagatgctg agctc                                 4235
//


  
spacer
spacer