Dbfetch

ID   AJ717547; SV 1; circular; genomic DNA; STD; VRL; 2801 BP.
XX
AC   AJ717547;
XX
DT   09-MAR-2006 (Rel. 87, Created)
DT   14-SEP-2006 (Rel. 89, Last updated, Version 3)
XX
DE   East African cassava mosaic virus segment DNA A, complete sequence, isolate
DE   EACMV-[K312]
XX
KW   AC1 gene; AC1 protein; AC2 gene; AC2 protein; AC3 gene; AC3 protein;
KW   AC4 gene; AC4 protein; AV1 gene; AV1 protein; AV2 gene; AV2 protein.
XX
OS   East African cassava mosaic virus
OC   Viruses; Geminiviridae; Begomovirus.
XX
RN   [1]
RP   1-2801
RA   Bull S.E.;
RT   ;
RL   Submitted (19-MAY-2004) to the INSDC.
RL   Bull S.E., Department of Disease & Stress Biology, John Innes Centre,
RL   Colney Lane, Norwich, Norfolk, NR4 7UH, UNITED KINGDOM.
XX
RN   [2]
RA   Bull S.E.;
RT   "Diversity of cassava-infecting geminiviruses in Kenya";
RL   Thesis (2005), MSc (Research), University of East Anglia, Norwich, UK.
XX
RN   [3]
RX   DOI; 10.1099/vir.0.82013-0.
RX   PUBMED; 16963765.
RA   Bull S.E., Briddon R.W., Sserubombwe W.S., Ngugi K., Markham P.G.,
RA   Stanley J.;
RT   "Genetic diversity and phylogeography of cassava mosaic viruses in Kenya";
RL   J. Gen. Virol. 87(Pt 10):3053-3065(2006).
XX
DR   MD5; f78f2dfea61aa36196ad8a30407bc04e.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..2801
FT                   /organism="East African cassava mosaic virus"
FT                   /segment="DNA A"
FT                   /host="Manihot esculenta"
FT                   /isolate="EACMV-[K312]"
FT                   /mol_type="genomic DNA"
FT                   /country="Kenya:Machakos, Migwani/Tiuuni"
FT                   /clone="K312FA-2[2002]"
FT                   /db_xref="taxon:62079"
FT   CDS             174..539
FT                   /codon_start=1
FT                   /gene="AV2"
FT                   /product="AV2 protein"
FT                   /db_xref="GOA:Q2A8U4"
FT                   /db_xref="InterPro:IPR002511"
FT                   /db_xref="InterPro:IPR005159"
FT                   /db_xref="UniProtKB/TrEMBL:Q2A8U4"
FT                   /protein_id="CAJ78124.1"
FT                   /translation="MWDPLLNDFPETVHGFRSMLAVKYLLHLEQEYDRGSVGAEYIRDL
FT                   IGVLRCKSYVEATRRYNNLNTRIQGAEEAELRQPIHEPCCCPHCPRHQKQNMGQQAHVS
FT                   EAQDVQNVSKPRCPEGL"
FT   CDS             334..1107
FT                   /codon_start=1
FT                   /gene="AV1"
FT                   /product="AV1 protein"
FT                   /db_xref="GOA:Q2A8U3"
FT                   /db_xref="InterPro:IPR000263"
FT                   /db_xref="InterPro:IPR000650"
FT                   /db_xref="UniProtKB/TrEMBL:Q2A8U3"
FT                   /protein_id="CAJ78125.1"
FT                   /translation="MSKRPGDIIISTPVSKVRRRLNFDSPYTNRVVAPTVRVTRSKIWA
FT                   NRPMYRKPKMYRMYRSPDVPKGCEGPCKVQSYEQRDDVKHTGMVRCVSDVTRGSGITHR
FT                   VGKRFCVKSIYILGKIWMDENIKKQNHTNHVMFFLVRDRRPYGPSPQDFGQVFNMFDNE
FT                   PTTATVKNDLRDRYQVLRKFYATVVGGPSGMKEQSLVKRFFRINNHVVYNHQEQAKYEN
FT                   HTENALLLYMACTHASNPVYATLKIRIYFYDAVTN"
FT   CDS             complement(1104..1508)
FT                   /codon_start=1
FT                   /gene="AC3"
FT                   /product="AC3 protein"
FT                   /db_xref="GOA:Q2A8U2"
FT                   /db_xref="InterPro:IPR000657"
FT                   /db_xref="UniProtKB/TrEMBL:Q2A8U2"
FT                   /protein_id="CAJ78126.1"
FT                   /translation="MDSRTGELITAPQATNGVFTWEITNPLYFAITNHDKRPGNMTHDI
FT                   ITLQIRFNHNIRKALGIHKCFLNFKVWTTLRPPTGLFLKVFRYQVLKYLDMIGVISINT
FT                   VLQAVDHVLYDVLLNTLQVTEQHAIKFNLY"
FT   CDS             complement(1249..1656)
FT                   /codon_start=1
FT                   /gene="AC2"
FT                   /product="AC2 protein"
FT                   /db_xref="GOA:Q2A8U1"
FT                   /db_xref="InterPro:IPR000942"
FT                   /db_xref="UniProtKB/TrEMBL:Q2A8U1"
FT                   /protein_id="CAJ78127.1"
FT                   /translation="MPPSSPSTSHCSQVPIKVQHRTAKTRALRRRRVDLECGCSFYLHI
FT                   DCINHGFSHRGTHHCASSNEWRFYLGNNKSPLFRNHQPRQEAREHDPRHHHTPDTVQPQ
FT                   HSEGIGDSQVFSQLQGLDDLTASDWSFFKSI"
FT   CDS             complement(1565..2644)
FT                   /codon_start=1
FT                   /gene="AC1"
FT                   /product="AC1 protein"
FT                   /db_xref="GOA:Q2A8U0"
FT                   /db_xref="InterPro:IPR001191"
FT                   /db_xref="InterPro:IPR001301"
FT                   /db_xref="InterPro:IPR022690"
FT                   /db_xref="InterPro:IPR022692"
FT                   /db_xref="UniProtKB/TrEMBL:Q2A8U0"
FT                   /protein_id="CAJ78128.1"
FT                   /translation="MPRAGRFQINAKNYFITYPRCSLTKEEALSQLKAFSYPTNIKFIR
FT                   VCRELHQDGVPHLHVLIQFEGKFQCTNPRFFDLISPSRSTHFHPNIQGAKSSSDVKAYI
FT                   EKGGEFLDDGIFQVDARSARGEGQHLAQVYAEALNASSKSEALQIIKEKDPKSFFLQFH
FT                   NISANAGRIFQAPPQTYVSPFLSSSFTQVPEEIEVWVSENICSPAARPWRPISIVLEGD
FT                   SRTGKTMWARSLGPHNYLCGHLDLSPKIYSNDAWYNVIDDVDPHYLKHFKEFMGAQRDW
FT                   QSNTKYGKPIQIKGGIPTIFLCNPGPTSSYKEFLEEEKNQSLKAWALKNATFVTLYEPL
FT                   FSSANQSPTPHSEDQGTQT"
FT   CDS             complement(2254..2487)
FT                   /codon_start=1
FT                   /gene="AC4"
FT                   /product="AC4 protein"
FT                   /db_xref="InterPro:IPR002488"
FT                   /db_xref="UniProtKB/TrEMBL:Q2A8R5"
FT                   /protein_id="CAJ78129.1"
FT                   /translation="MGCLISMFSSNSKASSNVPTPDSSISFPHPDQHISIRTFRELNHR
FT                   PMSRLTLKREGNFLTMEFSKSMPEVPGGRASI"
XX
SQ   Sequence 2801 BP; 732 A; 553 C; 722 G; 794 T; 0 other;
     accggatggc cgcgcccgaa aaagcaggtg gaccccaccg gatggccgca ctcgtgaaag        60
     aaagtggtcc ccgcgcactt gtttcggtcg gccagtcata ttcacgcgtg aaagtctaga       120
     tatttctggt ttgactttat atacttcgtc gcgaagtagt ggagcgcgtc aacatgtggg       180
     atccattgtt aaacgatttt cccgaaaccg ttcacggttt ccgttctatg cttgctgtta       240
     aatacctgtt acatctggaa caggaatacg accgcggttc tgtcggggct gagtatatac       300
     gggatctaat aggggttcta cggtgtaaga gttatgtcga agcgaccagg agatataata       360
     atctcaacac ccgtatccaa ggtgcggagg aggctgaact tcgacagccc atacacgaac       420
     cgtgttgttg cccccactgt ccgcgtcacc agaagcaaaa tatgggccaa caggcccatg       480
     tatcggaagc ccaagatgta cagaatgtat cgaagcccag atgtcccgaa gggctgtgaa       540
     ggcccatgta aggttcagtc ctatgaacag agggatgatg ttaagcatac gggtatggtc       600
     cgatgtgtca gtgatgttac gcgtgggtca ggcattaccc atagagttgg gaagaggttt       660
     tgtgtgaagt ccatatatat attgggcaag atctggatgg atgagaatat caagaagcaa       720
     aatcatacga accatgttat gttctttctc gttcgagata gaaggcctta tggtccgagc       780
     cctcaagatt ttggacaagt gttcaacatg tttgataatg aacctactac ggcaactgtg       840
     aagaatgatc ttagggaccg gtatcaggtg ttacgtaaat tctatgcgac tgttgttggt       900
     ggaccctctg ggatgaagga acaatcgctg gttaagaggt tttttaggat caataatcat       960
     gtagtgtata atcatcagga acaggccaag tatgagaatc atactgagaa tgcgttgtta      1020
     ttatatatgg catgtacaca tgcctcaaat cctgtgtacg ctacgctgaa aatacgcatc      1080
     tatttctatg atgcagtgac aaattaataa aggttgaatt ttattgcatg ttgctccgta      1140
     acttggagtg tgtttagtaa tacatcgtac agaacatgat caacagcttg aagtacagtg      1200
     ttaattgaaa taacgcctat catatctaaa tacttgagca cttgatatct aaatactttt      1260
     aaaaaaagac cagtcggagg ccgtaaggtc gtccagacct tgaagttgag aaaacacttg      1320
     tgaatcccca atgccttccg aatgttgtgg ttgaaccgta tctggagtgt gatgatgtcg      1380
     tgggtcatgt tccctggcct cttgtcgtgg ttggtgattg cgaaatagag gggatttgtt      1440
     atttcccagg taaaaacgcc attcgttgct tgaggcgcag tgatgagttc ccctgtgcga      1500
     gaatccatgg ttgatgcagt cgatatggag atagaacgag cagccgcatt cgaggtctac      1560
     ccgcctacgt ctgagtgccc tggtcttcgc tgtgcggtgt tggactttga ttggcacttg      1620
     agaacaatgg ctcgtagagg gtgacgaagg tggcattctt taaagcccag gctttaaggg      1680
     actgattctt ttcctcttct agaaactctt tatatgatga agttggtcct ggattgcaga      1740
     ggaagatagt gggaatgccg cctttaattt gaattggctt cccgtacttt gtattgcttt      1800
     gccagtccct ttgggccccc atgaattctt tgaagtgttt gaggtagtgg gggtcgacgt      1860
     catcaatgac gttgtaccag gcgtcgtttg aatatatctt tggagacaga tccaggtgtc      1920
     cacataaata attatgtggg cccagtgaac gagcccacat ggtcttcccg gttcggctat      1980
     caccttctag aacaatactg atcggtctcc atggccgcgc agcgggactg catatatttt      2040
     cggataccca tacttcgatt tcctctggga cttgtgtaaa tgaggaggat aagaacggac      2100
     taacgtaggt ttggggcgga gcctggaaga ttctacctgc gttagcagat atgttatgaa      2160
     actgtaaaaa aaaggacttt ggatcttttt ccttgataat ttgaagagct tcggatttag      2220
     aagaagcatt caacgcttct gcatatacct gagctaaatg ctggccctcc cccctggcac      2280
     ttctggcatc gacttggaaa attccatcgt caagaaattc ccctcccttt tcaatgtaag      2340
     ccttgacatc ggacgatgat ttagctccct gaatgttcgg atggaaatgt gttgatctgg      2400
     atggggaaat gagatcgaag aatctggggt tggtacattg gaacttgcct tcgaattgga      2460
     tgagaacatg gagatgaggc accccatcct gatgtagttc tctgcaaacc ctaatgaatt      2520
     tgatattcgt cgggtaagaa aaggctttta attgggaaag ggcctcttcc tttgttagtg      2580
     agcatcgggg ataggtgatg aaataatttt tggcatttat ttgaaaacga ccggctcgtg      2640
     gcatatttgt tgtcgttttg gatcggggga cactcaaaac tccaggggaa cggtggaatg      2700
     gggggcatta tataggatgt cccccaatgg catatgtgta aataggtaga tttccattca      2760
     aaatttgaat tgcgaatatt ggcggccatc cgattaatat t                          2801
//