Dbfetch

ID   GU723749; SV 1; circular; genomic DNA; STD; VRL; 2744 BP.
XX
AC   GU723749;
XX
DT   01-APR-2010 (Rel. 104, Created)
DT   01-APR-2010 (Rel. 104, Last updated, Version 1)
XX
DE   Tomato yellow leaf curl Thailand virus isolate H6-4 segment DNA-A, complete
DE   sequence.
XX
KW   .
XX
OS   Tomato yellow leaf curl Thailand virus
OC   Viruses; Geminiviridae; Begomovirus.
XX
RN   [1]
RP   1-2744
RA   Tsai W.S., Shih S.L., Green S.K., Kenyon L., Jan F.-J.;
RT   "Molecular diversity and pathogenicity of tomato-infecting begomoviruses in
RT   Taiwan";
RL   Unpublished.
XX
RN   [2]
RP   1-2744
RA   Tsai W.S., Shih S.L., Green S.K., Kenyon L., Jan F.-J.;
RT   ;
RL   Submitted (08-FEB-2010) to the INSDC.
RL   Virology Unit, AVRDC-The World Vegetable Center, PO Box 42, Shanhua,
RL   Tainan, Taiwan 74199, ROC
XX
DR   MD5; 677e33c4326f8f61f48d1c95411e430f.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..2744
FT                   /organism="Tomato yellow leaf curl Thailand virus"
FT                   /segment="DNA-A"
FT                   /host="tomato"
FT                   /isolate="H6-4"
FT                   /mol_type="genomic DNA"
FT                   /country="Taiwan:Shoufong, Hualian"
FT                   /collection_date="2007"
FT                   /db_xref="taxon:85752"
FT   CDS             87..473
FT                   /codon_start=1
FT                   /product="V2 protein"
FT                   /db_xref="GOA:A5JH98"
FT                   /db_xref="InterPro:IPR002511"
FT                   /db_xref="InterPro:IPR005159"
FT                   /db_xref="UniProtKB/TrEMBL:A5JH98"
FT                   /protein_id="ADE09285.1"
FT                   /translation="MVPYLRLSHQVSAKFKMWDPLLNEFPENVHGFRCMLAVKYLQAVE
FT                   KTYSPDTLGFDLIRDLIGVIRAKNYVEASSRYSHFHARLESTSPSELRQPIQQPCCCPH
FT                   CPRHKRADMEEPTCIQKAQVLQNV"
FT   CDS             295..1065
FT                   /codon_start=1
FT                   /product="V1 protein"
FT                   /note="coat protein"
FT                   /db_xref="GOA:Q6R4D4"
FT                   /db_xref="InterPro:IPR000263"
FT                   /db_xref="InterPro:IPR000650"
FT                   /db_xref="InterPro:IPR029053"
FT                   /db_xref="UniProtKB/TrEMBL:Q6R4D4"
FT                   /protein_id="ADE09282.1"
FT                   /translation="MSKRPADILISTPVSKVRRRLNFDSPYNSRAAVPTVRVTKGQIWK
FT                   NRPAYRKPRFYRMYRSPDVPKGCEGPCKVQSFDAKNDIGHMGKVICLSDVTRGIGLTHR
FT                   VGKRFCVKSLYFVGKIWMDENIKVKNHTNTVLFWIVRDRRPTGTPNDFQQVFNVYDNEP
FT                   STATVKNDQRDRFQVIRRFQATVTGGQYAAKEQAIIRKFYRVNNYVVYNHQEAGKYENH
FT                   TENALLLYMACTHASNPVYATLKVRSYFYDSVTN"
FT   CDS             complement(1062..1466)
FT                   /codon_start=1
FT                   /product="C3 protein"
FT                   /db_xref="GOA:D5KYY6"
FT                   /db_xref="InterPro:IPR000657"
FT                   /db_xref="UniProtKB/TrEMBL:D5KYY6"
FT                   /protein_id="ADE09284.1"
FT                   /translation="MDLRTGELLTATQLESGVYIWTVKNPLYFKITKHLESPFQRNHDI
FT                   ITLQIQFNHNLRKALGIHKCFLVCKIWTHLHPQTSRFLILFKYQCIKYLDRLGVISINN
FT                   VIRAMSHVLYNVLEGTIDVIEEHDIKFNIY"
FT   CDS             complement(1207..1611)
FT                   /codon_start=1
FT                   /product="C2 protein"
FT                   /db_xref="GOA:D5KYY7"
FT                   /db_xref="InterPro:IPR000942"
FT                   /db_xref="UniProtKB/TrEMBL:D5KYY7"
FT                   /protein_id="ADE09283.1"
FT                   /translation="MRSSSPSKAHSTQVPIKVQHRIAKRATRRRRVDLPCGCSYFVAIG
FT                   CHNNGFTHRGTTHCNSIREWRVYLDGQKSPIFQDNQAPREPIPEEPRHNHVTNPVQPQP
FT                   EESVGDTQMFSSLQNLDSFTSSDLAFLNII"
FT   CDS             complement(1514..2599)
FT                   /codon_start=1
FT                   /product="C1 protein"
FT                   /note="replication-associated protein"
FT                   /db_xref="GOA:D5KYY8"
FT                   /db_xref="InterPro:IPR001191"
FT                   /db_xref="InterPro:IPR001301"
FT                   /db_xref="InterPro:IPR022690"
FT                   /db_xref="InterPro:IPR022692"
FT                   /db_xref="UniProtKB/TrEMBL:D5KYY8"
FT                   /protein_id="ADE09281.1"
FT                   /translation="MAPPNKFRINAKNYFLTYPHCSLTKEEALSQIQALETPTNKLFIR
FT                   ICRELHEDGTPHLHVLIQFEGKFQCKNQRFFDLTSPTRSAHFHPNIQGAKSSTDVKTYM
FT                   EKDGDVLDHGIFQIDGRSARGGCQSANDAYAEAINSGSKASALTILREKAPKDFVLQFH
FT                   NLNSNLDRIFTPPMEEYISPFSSSSFNQVPEELKEWACNNVLSAAARPLRPIGIVIEGD
FT                   SRTGKTMWARSLGPHNYLCGHLDLSPKVYNNNVWYNVIDDVDPHYLKHFKEFMGAQRDW
FT                   QSNTKYGKPVQIKGGIPTIFLCNPGPNSSYKEYLEEEKNSALRNWAIRNAIFVTLKGPL
FT                   YSGSNQGATPNSQEGNQTTES"
FT   CDS             complement(2149..2448)
FT                   /codon_start=1
FT                   /product="C4 protein"
FT                   /db_xref="InterPro:IPR002488"
FT                   /db_xref="UniProtKB/TrEMBL:A5JH97"
FT                   /protein_id="ADE09286.1"
FT                   /translation="MKMGLLTCMSSSNSKENSNVKIKDSSISHPQPGQHISIRTFRELK
FT                   AQQMLKHTWKKTETCLIMEFSRSMEDRLEEVANLPTTHMPRQSIQGPKLRPSLY"
XX
SQ   Sequence 2744 BP; 736 A; 540 C; 602 G; 865 T; 1 other;
     accggatggc cgcgattttt tttaaagtgg tccccttgat gtgatgtttc atccaattaa        60
     aacgctcggc caaagcttaa ttatttatgg tcccctattt aagacttagt caccaagttt       120
     cggcgaaatt caaaatgtgg gatccactcc taaacgaatt tccagaaaac gtccacggtt       180
     tccgttgtat gttagcggtt aagtatctgc aagcggtcga gaagacgtat tcacctgata       240
     ccctagggtt tgatctcatc cgtgatctca tcggtgtaat tcgtgcgaag aactatgtcg       300
     aagcgtccag cagatattct catttccacg cccgtctcga aagtacgtcg ccgtctgaac       360
     ttcgacagcc catacaacag ccgtgctgct gtccccactg tccgcgtcac aaaagggcag       420
     atatggaaga accgacctgc atacagaaag cccaggttct acagaatgta tagaagtcct       480
     gatgtcccta agggatgtga gggtccatgt aaagtgcaat ctttcgatgc gaagaacgac       540
     attggtcata tgggcaaggt aatctgtctg tctgacgtta cccgtggtat tgggcttact       600
     catcgagttg gcaagcgttt ctgtgtcaag tcactttatt ttgtcgggaa gatctggatg       660
     gatgaaaata ttaaggttaa gaatcacact aataccgttt tattttggat agttagggat       720
     cggcgtccta ctggaacgcc taatgatttt cagcaggtct ttaatgtata tgataatgaa       780
     cccagcactg ctactgtaaa gaacgaccag cgtgatcgtt tccaggttat aaggaggttt       840
     caggcaacgg tgactggtgg acaatatgca gctaaggagc aggcgattat tagaaagttt       900
     tatcgtgtta ataattatgt agtttacaat caccaggaag ctgggaagta cgagaaccat       960
     actgaaaatg ctttgttgtt gtatatggca tgtactcatg cctctaatcc tgtgtatgct      1020
     actttgaaag tcaggagtta tttctatgac tcagtgacga attaataaat attaaatttt      1080
     atatcgtgtt cttcaattac atcaattgtt ccttctaata cattgtacag tacatgagac      1140
     attgccctaa ttacattatt tatactaatc acgcctaatc tatctaaata tttaatacat      1200
     tgatatttaa ataatattaa gaaacgcgag gtctgaggat gtaaatgagt ccagattttg      1260
     cagactagaa aacatttgtg tatccccaac gctttcctca ggttgtggtt gaactggatt      1320
     tgtaacgtga ttatgtcgtg gttcctctgg aatgggctct ctaggtgctt ggttatcttg      1380
     aaatataggg gatttttgac cgtccagata tacacgccac tctctaattg agttgcagtg      1440
     agtagttccc cggtgcgtaa atccattatt gtgacatcct attgcgacga agtacgaaca      1500
     tccacaaggt agatcaactc tccgtcgtct ggttgccctc ttggctattc ggtgttgcac      1560
     cttgattgga acctgagtag agtgggcctt tgagggtgac gaagatcgca tttcttatag      1620
     cccagtttct aagtgckgag ttcttttctt cttccaagta ctctttataa ctggagttgg      1680
     gtccaggatt gcagagaaag atagtgggaa ttccgccttt aatttgaact ggctttccgt      1740
     actttgtgtt tgattgccag tccctttggg cccccatgaa ttctttaaag tgttttagat      1800
     agtgcggatc gacgtcatcg atgacgttgt accacacatt attattgtac acttttggac      1860
     ttaaatctaa atggccacac agataattat gtggtcccaa tgacctagcc cacatcgtct      1920
     tccccgttct gctatcaccc tcaattacta taccaatggg tctcaatggc cgcgcagcgg      1980
     cactgagaac attattacaa gcccattctt taagttcttc tggaacttga ttaaaagaag      2040
     aagaagaaaa tggagaaata tattcctcca ttggaggagt aaaaatccta tctaaattag      2100
     aatttaaatt atgaaattgc aaaacaaaat ctttaggggc tttttccctc agtatagtga      2160
     gggccgaagc tttggaccct gaattgattg cctcggcata tgcgtcgttg gcagattggc      2220
     aacctcctct agccgatctt ccatcgatct ggaaaattcc atgatcaagc acgtctccgt      2280
     ctttttccat gtatgtttta acatctgttg agcttttagc tccctgaatg ttcggatgga      2340
     aatgtgctga cctggttggg gatgtgagat cgaagaatct ttgattttta cattggaatt      2400
     ttccttcgaa ttggatgagg acatgcaggt gaggagtccc atcttcatgg agttccctgc      2460
     agattctgat gaataattta ttagttggtg tttctagtgc ttgaatttgg gaaagtgctt      2520
     cctctttagt gagagaacaa tgtgggtatg tcaggaaata gttcttggca tttattctga      2580
     atttattagg aggagccatt gactggtcaa tcggtgtctc tcaaacttgg ctatgcaatc      2640
     ggtgtctggg gtcttattta tacctggaca ccaaatggca taattgtaat ttagtaaatg      2700
     tgatttaaaa ttcaaaatcc aaaagcggcc atccgtataa tatt                       2744
//