spacer
spacer

EBI Dbfetch

ID   AJ005644; SV 1; linear; genomic DNA; STD; FUN; 5616 BP.
XX
AC   AJ005644;
XX
DT   29-APR-1998 (Rel. 55, Created)
DT   15-APR-2005 (Rel. 83, Last updated, Version 5)
XX
DE   Encephalitozoon cuniculi dhfr, ts, shmt genes and gene encoding
DE   aminopeptidase
XX
KW   aminopeptidase; dhfr gene; dihydrofolate reductase; metalloprotease;
KW   N-terminal exopeptidase; serine hydroxymethyltransferase; shmt gene;
KW   thymidylate synthase; ts gene.
XX
OS   Encephalitozoon cuniculi
OC   Eukaryota; Fungi; Microsporidia; Unikaryonidae; Encephalitozoon.
XX
RN   [1]
RP   1-5616
RA   Duffieux F.;
RT   ;
RL   Submitted (16-APR-1998) to the EMBL/GenBank/DDBJ databases.
RL   Duffieux F., Protistologie Moleculaire et Cellulaire des Parasites Opport,
RL   Universite Blaise Pascal - Upresa 6023, Bat. Biologie A, Campus des
RL   Cezeaux, 24 Avenue des Landais, 63177 Aubiere Cedex, FRANCE.
XX
RN   [2]
RP   1-4296
RX   PUBMED; 11013707.
RA   Duffieux F., Peyret P., Roe B.A., Vivares C.P.;
RT   "First report on the systematic sequencing of the small genome of
RT   Encephalitozoon cuniculi (Protozoa, Microspora): gene organization of a 4.3
RT   kbp region on chromosome I";
RL   Microb. Comp. Genomics 3(1):1-11(1998).
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..5616
FT                   /organism="Encephalitozoon cuniculi"
FT                   /chromosome="1"
FT                   /lab_host="mouse"
FT                   /mol_type="genomic DNA"
FT                   /cell_line="MDCK "
FT                   /cell_type="resistant spores"
FT                   /db_xref="taxon:6035"
FT   CDS             complement(1..2595)
FT                   /codon_start=1
FT                   /product="aminopeptidase"
FT                   /function="zinc-dependent metalloprotease"
FT                   /function="N-terminal exopeptidase"
FT                   /EC_number="3.4.11.7"
FT                   /db_xref="GOA:Q8SQI6"
FT                   /db_xref="InterPro:IPR014782"
FT                   /db_xref="UniProtKB/Swiss-Prot:Q8SQI6"
FT                   /protein_id="CAA06646.1"
FT                   /translation="MRWIKVMAGLLPMIGSKGADEKDSSQQRRLSRVVVPEHYDLHVKI
FT                   LDAGFCGSVGIRVMISQDVSEIVLNAKELEIRDAGIVVEGARIPGRVVVGEAEKELEVV
FT                   RIVFPSSLRAGPGYLTMEFCGDYSNGLVGLYKSGGPKEVYSTHFEPTDARRAFPCFDQP
FT                   DMKATFKISIDAGSKFTVLANTQAIPSLREEYGDRKIEYFEETCKMSTYLVAFVVGELS
FT                   YIEDWSKDGVRLRVYGDSSEVEWGRYGLEVGKRCLEYFSEYFGVGYEFPRAGSAKIDMV
FT                   GIPNFSSGAMENWGLITFRRESLLYVPGKSNVEDMKNVAGTVCHELGHMWFGNLVTMSW
FT                   WDDLWLNEGFATWVSFKGMENIGSVVSWDVWGEFVLWNVVRGMVDDGLGKSHQIRMNVT
FT                   DPGEIGEIFDSISYCKGASVIRMIERYVGESVFMLGIRRYIKEHMYGNGNAMSLWKAIG
FT                   EEYGEDISEMVEGWISQAGYPVVSVQDCGSSLVLSQSRYSMLGKSDDSLWTIPVVVSWE
FT                   GKGQERIELRGRETTVRKRSSVYKVNAEYGGFYRVLYDSAGLSGLESRIDSLSVVDRVN
FT                   VIEDVFGLGFGLYGGLEHGLRRISEYYSDSYHVARSGIEKLLRLRSVFYDDAEIVSLID
FT                   KKVRKMILPCVGRIDVFDIGTSVESVSMNKYVLSVGVEVGIREAVEKVQELWRRHVEAG
FT                   EELGELRWIVYKAVVDENLGYMMDKHKYGDTPGMRREVMNGFSGIKREENFLDVVGNLS
FT                   QFSVEDIGVVIGSISRGGAFRDAMVEYVVSHGEELYLMVHKNAMLYNMIIMSLRHVSGD
FT                   LIVEKVERFLSGIKHSGSNLSIEKVRNEIQWRRRMRGIREEVLRGLLPEAEK"
FT   CDS             2632..3249
FT                   /codon_start=1
FT                   /gene="dhfr"
FT                   /product="dihydrofolate reductase"
FT                   /function="reduction of DHF into THF"
FT                   /EC_number="1.5.1.3"
FT                   /db_xref="GOA:O62583"
FT                   /db_xref="HSSP:1J3J"
FT                   /db_xref="InterPro:IPR017925"
FT                   /db_xref="UniProtKB/Swiss-Prot:O62583"
FT                   /protein_id="CAA06647.1"
FT                   /translation="MLALVVALASHRGIGNANALPWPRPLAADMAWFRTLSQSIPLISP
FT                   DRIALAPSASNAVVMGRRTWDSIPSRFRPLANRINVVLSRGPARSTENTFFIQTFEALD
FT                   SLPLPPSSMTFVIGGRDVYSLALESGRPHLIFATEVFESPECDVFFPHIDWASYEKRDI
FT                   TRDVSRLIDRTLASAFYSPETATFTENGTSFKMFLYTKPETR"
FT   CDS             3285..4169
FT                   /codon_start=1
FT                   /gene="ts"
FT                   /product="thymidylate synthase"
FT                   /function="reductive methylation of dUMP to dTMP with
FT                   conversion of N5,N10-methylene THF"
FT                   /EC_number="2.1.1.45"
FT                   /db_xref="GOA:O62584"
FT                   /db_xref="HSSP:1RTS"
FT                   /db_xref="InterPro:IPR000398"
FT                   /db_xref="UniProtKB/Swiss-Prot:O62584"
FT                   /protein_id="CAA06648.1"
FT                   /translation="MPQDPRHPEHQYLDLVKHILENGARRMDRTGTGALSVFGATMRFS
FT                   LEDNTFPLLTTRRVFYRGVVEELLFFLRGETDSKVLEKKGVRIWEKNGAKQFLQSVGID
FT                   REEGDLGPIYGFQWRHFGARYETSASSYEGKGVDQIASAIAAIRANPASRRIVVSAWNP
FT                   TDLGSMALPPCHVLFQFNVTDGKLSCAMYQRSGDMGLGVPFNIASYSLLTILVAHLTGL
FT                   QPGEFVHFLGDAHVYLDHVDSLRQQIQRPPRAFPKLFVSPKGPRTEPEHFQYEDFELVG
FT                   YDPHPAIKMNMSA"
FT   CDS             4220..5602
FT                   /codon_start=1
FT                   /gene="shmt"
FT                   /product="serine hydroxymethyltransferase"
FT                   /function="interconversion of serine and glycine"
FT                   /EC_number="2.1.2.2"
FT                   /db_xref="GOA:O62585"
FT                   /db_xref="HSSP:1CJ0"
FT                   /db_xref="InterPro:IPR019798"
FT                   /db_xref="UniProtKB/Swiss-Prot:O62585"
FT                   /protein_id="CAA06649.1"
FT                   /translation="MTDAREKGFWTGPLEMADPELHALICGEVERQKKTINLIASENYA
FT                   HQSAMEACGSVLTNKYSEGRVGERYYGGTHWVDRIELLCQKRALELFGLDPDAWGVYVQ
FT                   PYSGSPANFAIYTAVVPPGGRIMGLDLPSGGHLTHGYKTKTRKISASSVYFDSRPYTVG
FT                   SNGLIDYEGLEKTFTDFLPHILICGYSAYSRDIDYKRLQSIAGRNGAFLFADISHISPL
FT                   VASGLMNSPFEHCDIVMTTTQKGLRGPRGALIFYRRAVTKNGETVDLDARINFAVFPML
FT                   QGGPHNHTIAGIASALLHAGTPEFAEYTRRVVENSRELCSRLQSLGLDILTGGTDNHML
FT                   LVDLRSTGVDGAAVEHMCDALGISLNRNAIVGNSSPLSPSGIRVGTYAVTARGFGPEEM
FT                   REVGDIIGGVVKLCREMTGGRKMSKADLHRVTSDARVMGSEQVLVLRRRVCALAEAYPI
FT                   YE"
XX
SQ   Sequence 5616 BP; 1317 A; 1877 C; 1301 G; 1121 T; 0 other;
     ttacttctca gcctccggca gaagcccacg aaggacctcc tctcttatcc cccgcatcct        60
     ccttctccac tggatctcgt tccgcacctt ctcaatgctc aggttgcttc cagagtgctt       120
     gatcccagaa agaaaccttt cgaccttctc cacaatcaaa tccccgctca catgccgcag       180
     cgacatgata atcatgttgt acagcatcgc attcttgtgc accatcaggt acagctcctc       240
     cccatgcgac acaacatact cgaccatcgc gtcccggaac gctcctcccc tgctgatgct       300
     ccctatcacc actccaatat cctcaacact gaactgagag agattcccaa ccacatcaag       360
     aaagttctcc tccctcttta tcccgctgaa tccgttcatg acctcccgcc gcatcccagg       420
     cgtatccccg tacttgtgct tgtccatcat gtatccaaga ttctcgtcga caactgcctt       480
     gtacacaatc caccggagct ctccaagctc ctctcctgcc tccacatgcc gcctccacag       540
     ctcctggacc ttctcaaccg cttcccggat tcccacctca acccccacag acagcacata       600
     cttgttcatg ctgacactct caacagacgt cccaatatca aacacatcaa tcctcccaac       660
     acagggcaaa atcatcttcc tgaccttctt gtcaatcaga gacacaatct ctgcgtcgtc       720
     gtagaacaca ctcctcaacc gaagcaactt ctcaatcccg ctccgagcaa catggtacga       780
     gtcagaatag tactcagata tccgccgaag cccatgctca agacccccat acagcccaaa       840
     ccctagccca aacacatcct caataacatt caccctgtca accacactca gggaatcaat       900
     ccgagactca agcccagata gcccggcaga gtcatacaga accctgtaga accccccgta       960
     ctcggcattc accttgtaca cactgctcct cttccgaaca gtcgtctccc gtcccctaag      1020
     ctcaatcctc tcctgcccct ttccttccca cgataccaca acaggaatcg tccacaggct      1080
     gtcatcactc ttccctagca tcgagtatct gctctgcgac agaacaagag acgacccgca      1140
     gtcctgcaca gacacaacag gataccctgc ctgcgaaatc catccctcaa ccatctcaga      1200
     aatgtcctct ccatactcct ccccaatcgc cttccacagg ctcattgcat tcccgttccc      1260
     atacatgtgc tccttgatgt accgccggat cccaagcata aacacagact cgccgacata      1320
     cctctcaatc atccggataa cactcgctcc cttgcagtag ctgatgctgt cgaaaatctc      1380
     cccaatctcc ccgggatccg tcacattcat ccggatctgg tggctcttcc caagcccgtc      1440
     gtcgaccatc ccgcgcacca cattccacag cacaaactcc ccccacacgt cccatgaaac      1500
     aacagatccg atgttctcca tccccttgaa cgacacccac gtcgcaaacc cctcgttcag      1560
     ccacaggtcg tcccaccacg acatcgtcac aagattccca aaccacatgt gtccaagctc      1620
     gtggcacacc gtccctgcca cattcttcat gtcctccaca ttgctcttcc caggcacata      1680
     cagaaggctc tcccttcgga acgtgatcag cccccagttc tccatcgccc cgctgctaaa      1740
     gttcgggatc ccaaccatgt caatcttcgc agaccccgca cgaggaaact catatccaac      1800
     cccaaagtac tccgaaaaat actccaggca cctcttccca acctcaagcc cataccgtcc      1860
     ccactcaacc tcagagctgt ccccgtacac acggaggcgc accccgtcct tgctccagtc      1920
     ctcaatgtac gaaagctcgc caaccacaaa tgcaacaaga tacgtcgaca tcttgcacgt      1980
     ctcctcaaag tactcgatct tcctgtctcc atactcctcc cggagagacg gaatcgcctg      2040
     tgtgttcgcc agcacagtaa acttcgaccc cgcgtcaatc gaaatcttga acgtcgcctt      2100
     catatcgggc tggtcaaagc acggaaacgc ccgccgtgca tcagtcggct caaagtgtgt      2160
     gctgtacacc tccttcggcc ctccgctctt gtacagcccc acaagcccat tgctatagtc      2220
     tccacaaaac tccatcgtaa gatatccagg ccctgcacgc agagaggacg gaaacacaat      2280
     ccgcacaacc tccaactcct tctccgcctc cccgacaacc acacgccccg gaatccgtgc      2340
     gccctcaaca acaatccctg catcccgtat ctcaagctcc ttggcattca gaactatctc      2400
     ggaaacatcc tgcgaaatca tcacccggat ccccacagac ccgcagaacc ctgcatcaag      2460
     gatcttcaca tgcagatcat agtgctcggg aacaacaacc ctgctcagcc ttctttgctg      2520
     cgacgagtcc ttctcgtcgg cacccttact tccaatcatg ggcagaagcc ctgccattac      2580
     tttaatccac ctcatttttt cacaatacta ttcataataa ataatttccc catgcttgca      2640
     ttggtcgttg cccttgctag ccaccgcgga ataggaaatg ccaatgccct tccatggcca      2700
     cggcccctgg ctgctgacat ggcctggttc aggacactct cccagagcat cccgctcatc      2760
     tccccagacc gcatcgccct tgccccgtct gcatccaatg ccgttgtcat gggcaggagg      2820
     acgtgggact ccatcccctc caggttcagg ccccttgcca accgcatcaa cgtcgtcctg      2880
     tcgagaggcc ctgccagaag cacagaaaac accttcttca tccagacctt cgaggccctc      2940
     gactccctgc ccctcccgcc gtcgtccatg acatttgtga tcggagggcg cgacgtctac      3000
     agccttgcac tcgagagcgg caggccccac cttatatttg ccaccgaggt cttcgagtct      3060
     cccgagtgcg acgtgttctt cccccacatc gactgggcat cctacgaaaa gcgagacatc      3120
     acccgggacg tctccaggct catagaccgc acactcgcga gtgccttcta cagccccgag      3180
     acggccacct ttacagagaa cgggacctcc ttcaagatgt ttctctacac taaaccggag      3240
     acccgctaga cctgccatat ataacccctg cccatgcctg ccaaatgccc caggacccgc      3300
     gccacccaga gcaccagtat cttgacctgg tgaagcacat actggaaaac ggcgccagaa      3360
     ggatggacag gacaggcacg ggagcgctgt ccgtcttcgg agcaacaatg aggttttccc      3420
     tcgaagacaa caccttcccg ctgctgacga caaggagggt cttctacaga ggcgttgtcg      3480
     aggagctcct gttcttcctg agaggcgaga cagactcgaa ggtccttgag aagaaaggag      3540
     tccggatctg ggaaaagaac ggggccaagc agttcctgca gtccgtgggg atagacaggg      3600
     aggagggcga cctcggcccg atatacggct tccagtggag gcacttcggc gcccggtacg      3660
     agacatcggc ctcgagctac gagggcaagg gggtcgacca gatcgcgagc gccatcgcag      3720
     caatcagggc caaccccgcc agcaggagga ttgttgtgag tgcatggaac cccacagacc      3780
     tcgggagcat ggcccttccc ccgtgccacg tgctcttcca gttcaacgtg acggacggga      3840
     agctcagctg tgcaatgtac cagaggtctg gagacatggg cctgggcgtt cccttcaaca      3900
     ttgcctcgta ctcgctgctc acaatactcg tggcgcatct gacaggcctg cagcccgggg      3960
     agtttgttca ctttctgggc gacgcccacg tgtatctgga ccacgtcgac tctcttcggc      4020
     agcagatcca gagacccccg agagcatttc caaagctctt tgtcagccca aaggggccga      4080
     gaacagagcc ggagcacttc cagtacgagg acttcgagct tgtgggatac gacccgcacc      4140
     ctgcaatcaa gatgaacatg agtgcttgag gacccgacgg ttccctccaa gatatttaat      4200
     cttctggagg ggaggaggca tgacagatgc aagagaaaag ggtttctgga caggcccgct      4260
     ggagatggca gaccccgagc tccatgccct gatctgcgga gaggtcgaga ggcagaagaa      4320
     gacaataaac ctgatagcaa gcgagaacta tgcgcatcag agcgcgatgg aggcctgtgg      4380
     gtctgtcctc accaacaagt attcagaagg cagggtggga gagcgatact acggggggac      4440
     gcactgggtc gacaggatcg agctcctctg ccagaagagg gctctcgagc tcttcgggct      4500
     ggatcctgac gcctggggcg tctatgtcca gccatactcg gggagcccag ccaactttgc      4560
     aatctacacg gccgttgtcc ctccgggcgg gaggatcatg ggccttgacc tgccgtctgg      4620
     aggacacctg acccatggat acaagacgaa gaccaggaag atatctgcct caagcgtcta      4680
     cttcgactca aggccataca cagtggggag caacggcctc atcgactacg agggcctcga      4740
     gaagaccttc acggactttc tgccgcacat cctgatctgc ggatacagcg catactccag      4800
     agacatcgac tacaagaggc tgcagtcgat agccggcagg aacggtgcct ttctgtttgc      4860
     agacatctcg cacatctcgc cgctggttgc gtctgggctg atgaacagcc cgttcgagca      4920
     ctgcgacatt gtcatgacga caacgcagaa ggggctccgg ggacctcgag gggcgctcat      4980
     cttctacagg agggccgtga caaagaatgg ggagactgtg gatctggatg cccggatcaa      5040
     ctttgccgtg tttccgatgc tgcagggagg cccccacaac cacacgattg cagggattgc      5100
     ctctgcactt ctccatgcag gaactcccga gtttgcggag tacacaaggc gcgtggtgga      5160
     gaactcgagg gagctgtgca gccgcttgca gtctctgggc cttgacatcc tgacgggggg      5220
     aacggacaac cacatgctcc ttgtggatct ccggagcacg ggtgtcgacg gggcggctgt      5280
     ggagcacatg tgcgatgccc tgggcatcag cctgaacaga aacgccattg tcggaaactc      5340
     cagcccgctg agcccgtctg gaatacgtgt gggcacatat gcagtcactg ccaggggatt      5400
     tggccccgag gagatgaggg aggttggaga cataatcggc ggggtagtca agctctgcag      5460
     ggagatgacg ggcggcagga agatgtcgaa ggccgatctc cacagagtga cgtccgatgc      5520
     ccgggtcatg ggcagcgagc aggttttagt gctgagaaga agagtgtgtg ccctggcaga      5580
     ggcatatccc atctacgaat gatttattaa acggct                                5616
//


  
spacer
spacer