Dbfetch

ID   JF909075; SV 1; circular; genomic DNA; STD; VRL; 2801 BP.
XX
AC   JF909075;
XX
DT   21-JUN-2012 (Rel. 113, Created)
DT   05-DEC-2012 (Rel. 115, Last updated, Version 3)
XX
DE   East African cassava mosaic virus-Kenya isolate
DE   Comoros:Anjouan:AJ26BP1:2009 segment DNA-A, complete sequence.
XX
KW   .
XX
OS   East African cassava mosaic virus-Kenya
OC   Viruses; Geminiviridae; Begomovirus.
XX
RN   [1]
RC   Publication Status: Online-Only
RP   1-2801
RX   DOI; 10.1186/1471-2148-12-228.
RX   PUBMED; 23186303.
RA   De Bruyn A., Villemot J., Lefeuvre P., Villar E., Hoareau M.,
RA   Harimalala M., Abdoul-Karime A.L., Abdou-Chakour C., Reynaud B.,
RA   Harkins G.W., Varsani A., Martin D.P., Lett J.M.;
RT   "East African cassava mosaic-like viruses from Africa to Indian ocean
RT   islands: molecular diversity, evolutionary history and geographical
RT   dissemination of a bipartite begomovirus";
RL   BMC Evol. Biol. 12(1):228-228(2012).
XX
RN   [2]
RP   1-2801
RA   Villemot J., Lefeuvre P., Villar E., Hoareau M., Harimalala M.,
RA   Abdoul-Karime A.L., Abdou-Chakour C., Reynaud B., Varsani A., Martin D.P.,
RA   Lett J.-M.;
RT   ;
RL   Submitted (24-MAR-2011) to the INSDC.
RL   UMR PVBMT, CIRAD, 7, chemin de l'IRAT, Saint-Pierre, Reunion 97410, France
XX
DR   MD5; 840f6fe777a024f1360d0beba529b2f4.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..2801
FT                   /organism="East African cassava mosaic virus-Kenya"
FT                   /segment="DNA-A"
FT                   /host="Manihot esculenta (cassava)"
FT                   /isolate="Comoros:Anjouan:AJ26BP1:2009"
FT                   /mol_type="genomic DNA"
FT                   /country="Comoros:Anjouan"
FT                   /lat_lon="12.19 S 44.51 E"
FT                   /collection_date="2009"
FT                   /db_xref="taxon:1229189"
FT   gene            174..530
FT                   /gene="AV2"
FT   CDS             174..530
FT                   /codon_start=1
FT                   /gene="AV2"
FT                   /product="movement protein"
FT                   /db_xref="GOA:I6LX59"
FT                   /db_xref="InterPro:IPR002511"
FT                   /db_xref="InterPro:IPR005159"
FT                   /db_xref="UniProtKB/TrEMBL:I6LX59"
FT                   /protein_id="AEG89784.1"
FT                   /translation="MWDPLLNDFPETVHGFRSMLAVKYLLHLEQEYDRGTVGAEYIRDL
FT                   IGVLRCKSYVEATRRYNNLNTRIQGAEEAELRQPIHEPCCCPHCPRHQKQNMGQQAHVS
FT                   EAQDVQNVSKPRCP"
FT   gene            334..1107
FT                   /gene="AV1"
FT   CDS             334..1107
FT                   /codon_start=1
FT                   /gene="AV1"
FT                   /product="coat protein"
FT                   /db_xref="GOA:I6LX52"
FT                   /db_xref="InterPro:IPR000263"
FT                   /db_xref="InterPro:IPR000650"
FT                   /db_xref="UniProtKB/TrEMBL:I6LX52"
FT                   /protein_id="AEG89783.1"
FT                   /translation="MSKRPGDIIISTPVSKVRRRLNFDSPYTNRVVAPTVRVTRSKIWA
FT                   NRPMYRKPKMYRMYRSPDVPKGCEGPCKVQSYEQRDDVKHTGMVRCVSDVTRGSGITHR
FT                   VGKRFCVKSIYILGKIWMDENIKKQNHTNHVMFFLVRDRRPYGPSPQDFGQVFNMFDNE
FT                   PTTATVKNDLRDRYQVLRKFYATVVGGPSGMKEQALVKRFFRINNHVVYNHQEQAKYEN
FT                   HTENALLLYMACTHASNPVYATLKIRIYFYDAVTN"
FT   gene            complement(1104..1508)
FT                   /gene="AC3"
FT   CDS             complement(1104..1508)
FT                   /codon_start=1
FT                   /gene="AC3"
FT                   /product="replication enhancer"
FT                   /db_xref="GOA:I6LYZ8"
FT                   /db_xref="InterPro:IPR000657"
FT                   /db_xref="UniProtKB/TrEMBL:I6LYZ8"
FT                   /protein_id="AEG89787.1"
FT                   /translation="MDFRTGELITAPQAKNGVFTWEITNPLYFDITNHDKRPGNMNHDI
FT                   ITLQIRFNHNLRKALAIHKCFLNFKVWTTLRPQTGLFLRVFRYQVLKYLDMIGVISINT
FT                   VITAVDHVLYDVLLNTLQVTEQHAIKFNLY"
FT   gene            complement(1249..1656)
FT                   /gene="AC2"
FT   CDS             complement(1249..1656)
FT                   /codon_start=1
FT                   /gene="AC2"
FT                   /product="transcription activator protein"
FT                   /db_xref="GOA:I6LX79"
FT                   /db_xref="InterPro:IPR000942"
FT                   /db_xref="UniProtKB/TrEMBL:I6LX79"
FT                   /protein_id="AEG89786.1"
FT                   /translation="MPPSSPSTSHCSQVPIKVQHRTAKTRALRRSRVDLECGCSFYLHI
FT                   DCINHGFSHRGTHHCASSKEWRFYLGNNKSPLFRHHQPRQEAREHEPRHHHTPDTFQPQ
FT                   PPEGIGDSQVFSQLQGLDDLTASDWSFLKSI"
FT   gene            complement(1565..2644)
FT                   /gene="AC1"
FT   CDS             complement(1565..2644)
FT                   /codon_start=1
FT                   /gene="AC1"
FT                   /product="replication associated protein"
FT                   /db_xref="GOA:I6LX78"
FT                   /db_xref="InterPro:IPR001191"
FT                   /db_xref="InterPro:IPR001301"
FT                   /db_xref="InterPro:IPR022690"
FT                   /db_xref="InterPro:IPR022692"
FT                   /db_xref="UniProtKB/TrEMBL:I6LX78"
FT                   /protein_id="AEG89785.1"
FT                   /translation="MPRAGRFQINAKNYFITYPRCSLTKEEALSQLKALSYPTNIKFIR
FT                   VCRELHQDGVPHLHVLIQFEGKFQCTNQRFFDLISPSRSTHFHPNIQGAKSSSDVKAYI
FT                   EKGGEFLDDGIFQVDARSARGEGQHLAQVYADALNASSKSEALQIIKEKDPKSFFLQFH
FT                   NISANADRIFQAPPQTYVSPFLSSSFTHVPEELEVWVSENICSPAARPWRPISIVLEGD
FT                   SRTGKTMWARSLGPHNYLCGHLDLSPKVYSNDAWYNVIDDVDPHYLKHFKEFMGAQRDW
FT                   QSNTKYGKPIQIKGGIPTIFLCNPGPTSSYKEFLDEEKNQSLNAWALKNATFVTLHEPL
FT                   FSSAHQSPTPHSEDQGPQT"
FT   gene            complement(2254..2487)
FT                   /gene="AC4"
FT   CDS             complement(2254..2487)
FT                   /codon_start=1
FT                   /gene="AC4"
FT                   /product="C4 protein"
FT                   /db_xref="InterPro:IPR002488"
FT                   /db_xref="UniProtKB/TrEMBL:I6LX81"
FT                   /protein_id="AEG89788.1"
FT                   /translation="MGCLISMFSSNSKASSNVQTKDSSISFPHPDQHISIRIFRELNRR
FT                   PMSRLTLKREGNFLTMEFSKSMPEVQGGRASI"
XX
SQ   Sequence 2801 BP; 738 A; 554 C; 718 G; 791 T; 0 other;
     accggatggc cgcgcccgaa aaagcaggtg gaccccactg tatgaccgcg tccatgaaat        60
     aaagtggtcc ccgcgcactg gggttggtcg gccagtcata ttcacgcgtg aaagtctaga       120
     tatttgttgt ttgtctttat agacttcgtc acgaagtagt ggaacgcgtc aacatgtggg       180
     atccattgtt gaatgatttt cccgaaactg ttcacggttt ccgttctatg cttgctgtta       240
     aatacctgtt acatctggaa caggaatacg atcgcggtac tgtcggggcg gagtatatac       300
     gggatctaat aggggttcta cggtgtaaga gttatgtcga agcgaccagg agatataata       360
     atctcaacac ccgtatccaa ggtgcggagg aggctgaact tcgacagccc atacacgaac       420
     cgtgttgttg cccccactgt ccgcgtcacc agaagcaaaa tatgggccaa caggcccatg       480
     tatcggaagc ccaagatgta cagaatgtat cgaagcccag atgtccctaa gggctgtgaa       540
     ggcccatgta aggttcagtc gtatgaacag agggatgatg ttaagcacac tggtatggtc       600
     cgatgtgtca gtgatgttac tcgtggatca ggcatcaccc atagagtcgg gaagaggttt       660
     tgtgtgaagt ccatatatat attgggcaag atctggatgg atgagaatat caagaagcaa       720
     aatcatacga accatgttat gttctttctc gttcgagata gaaggcctta tgggccgagc       780
     ccgcaagatt ttggacaagt gttcaacatg tttgataatg aacctactac ggcaacggtg       840
     aagaatgatc tgagggatcg gtatcaggtg ttacgaaaat tctatgcgac cgttgttggt       900
     ggaccctccg ggatgaagga acaagcgctg gttaagaggt tttttaggat caataatcat       960
     gtagtgtata atcatcagga acaggccaag tatgagaatc atacggagaa tgcgttgtta      1020
     ttgtatatgg catgtacaca tgcctcaaat cctgtgtacg ccactctgaa aatacgcatc      1080
     tatttctatg atgcagtgac aaattaataa aggttgaatt ttattgcatg ttgctccgta      1140
     acttggagtg tgtttagtaa tacatcgtac agaacatgat caacagctgt aattacagtg      1200
     ttaatggaaa taacgcctat catatctaaa tacttgagca cttgatatct aaatactctt      1260
     aagaaaagac cagtctgagg ccgtaaggtc gtccagacct tgaagttgag aaaacacttg      1320
     tgaatcgcca atgccttccg gaggttgtgg ttgaaacgta tctggagtgt gatgatgtcg      1380
     tggttcatgt tccctggcct cttgtcgtgg ttggtgatgt cgaaatagag gggatttgtt      1440
     atttcccagg taaaaacgcc attctttgct tgaggcgcag tgatgagttc ccctgtgcga      1500
     aaatccatgg ttgatgcagt cgatatggag atagaacgag cagccacatt cgaggtctac      1560
     ccggctacgt ctgagggccc tggtcttcgc tgtgcggtgt tggactttga tgggcacttg      1620
     agaacaatgg ctcgtggagg gtgacgaagg tggcattctt taaagcccag gcgttaaggg      1680
     actgattctt ttcctcgtcc agaaactctt tatatgatga tgttggtcct ggattgcaga      1740
     ggaagatagt gggaatgccg cctttaattt gaataggctt cccgtacttt gtattgcttt      1800
     gccagtccct ttgggccccc atgaattctt tgaagtgttt gagataatgc gggtctacgt      1860
     cgtcaatgac gttgtaccat gcgtcgtttg aatatacctt tggagacaga tccaggtgtc      1920
     cacatagata attatggggt cccagtgaac gagcccacat ggttttcccg gttcggctat      1980
     caccttcgag aacaatactg atcggtctcc atggccgcgc agcgggactg catatatttt      2040
     ctgataccca tacctctagt tcttcgggaa cgtgtgtaaa tgatgatgat aagaatggac      2100
     taacgtaagt ttgtggcgga gcctggaaga ttctatctgc gttagcagat atgttatgga      2160
     actgtaaaaa aaaggacttt ggatcttttt ctttaataat ttgaagagct tctgatttag      2220
     aagaagcatt caacgcgtct gcatatacct gagctaaatg ctggccctcc ccccttgcac      2280
     ttctggcatc gacttggaaa attccatcgt caagaaattc ccctcccttt tcaatgtaag      2340
     ccttgacatc ggacgacgat ttagctccct gaatattcgg atggaaatgt gttgatcggg      2400
     atggggaaat gagatcgaag aatctttggt ttgtacattg gaacttgcct tcgaattgga      2460
     tgagaacatg gagatgaggc accccatcct gatgtagttc tctgcaaacc ctaatgaatt      2520
     tgatattcgt cgggtaagaa agggctttta attgggaaag ggcctcttcc ttggttaatg      2580
     agcatcgggg ataggtgatg aaataatttt tggcatttat ttgaaaacga cctgctcttg      2640
     gcatatttgc tgtcgtattg gatcggggga cactcaaaac tccaggggaa cggtggaatg      2700
     gggggcaata tatatgatgt cccccaatgg catatgtgta aatacgtcga cctccattca      2760
     aattttgaat tgcgaatatt ggcggccatc cgattaatat t                          2801
//