spacer

EBI Dbfetch

ID   FR692336; SV 1; circular; genomic DNA; STD; VRL; 5064 BP.
XX
AC   FR692336;
XX
DT   01-DEC-2010 (Rel. 107, Created)
DT   01-DEC-2010 (Rel. 107, Last updated, Version 1)
XX
DE   Chimpanzee polyomavirus complete genome, isolate Azzie
XX
KW   complete genome.
XX
OS   Chimpanzee polyomavirus
OC   Viruses; dsDNA viruses, no RNA stage; Polyomaviridae; Polyomavirus;
OC   unclassified Polyomavirus.
XX
RN   [1]
RP   1-5064
RA   Verschoor E.J.;
RT   ;
RL   Submitted (21-SEP-2010) to the INSDC.
RL   Verschoor E.J., Virology, Biomedical Primate Research Centre, Lange Kleiweg
RL   161 Rijswijk, 2288GJ, NETHERLANDS.
XX
RN   [2]
RX   PUBMED; 21110837.
RA   Deuzing I., Fagrouch Z., Groenewoud M.J., Niphuis H., Kondova I.,
RA   Bogers W., Verschoor E.J.;
RT   "Detection and characterization of two chimpanzee polyomavirus genotypes
RT   from different subspecies";
RL   Virol J 7:347-347(2010).
XX
DR   MD5; f5bf50b768c26525469408cc33f96f80.
DR   EuropePMC; PMC3003640; 21110837.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..5064
FT                   /organism="Chimpanzee polyomavirus"
FT                   /host="Pan troglodytes troglodytes"
FT                   /isolate="Azzie"
FT                   /mol_type="genomic DNA"
FT                   /isolation_source="host blood"
FT                   /db_xref="taxon:305677"
FT   CDS             156..350
FT                   /gene="agnogene"
FT                   /product="agnoprotein"
FT                   /db_xref="UniProtKB/TrEMBL:E5AX39"
FT                   /protein_id="CBX23447.1"
FT                   /translation="MFTCLGVKPRFRACSQVIISNRRRRTAACQRSFNWRKLTVCVRTV
FT                   TCQANKSSGDQAGENKLLL"
FT   CDS             382..1089
FT                   /gene="VP2"
FT                   /product="VP2 protein"
FT                   /function="structural protein"
FT                   /db_xref="GOA:E5AX40"
FT                   /db_xref="InterPro:IPR001070"
FT                   /db_xref="UniProtKB/TrEMBL:E5AX40"
FT                   /protein_id="CBX23448.1"
FT                   /translation="MGGLLSSLVDMIVMASELSAASGLTIEALLTGEALAALEAEVFSL
FT                   MAVEGLSGIEALAQLGWTAEQFSNMAFISTTFSNAIGYGVLFQTVSGISSLVSAGIRLG
FT                   TSVSSVNRHQTEQELETLFGKIAHFLHVNLAFHLDPFDWCGSIGTTMPSEFSNLTLDQL
FT                   SKLALIIENGRWVVQRSPTHDPLFESGDVIDIFGPPGGARQRVTPDWMLPLILRLNGAP
FT                   EEKSSLCVNTNQS"
FT   CDS             517..1089
FT                   /gene="VP3"
FT                   /product="VP3 protein"
FT                   /function="structural protein"
FT                   /db_xref="GOA:E5AX41"
FT                   /db_xref="InterPro:IPR001070"
FT                   /db_xref="UniProtKB/TrEMBL:E5AX41"
FT                   /protein_id="CBX23449.1"
FT                   /translation="MAVEGLSGIEALAQLGWTAEQFSNMAFISTTFSNAIGYGVLFQTV
FT                   SGISSLVSAGIRLGTSVSSVNRHQTEQELETLFGKIAHFLHVNLAFHLDPFDWCGSIGT
FT                   TMPSEFSNLTLDQLSKLALIIENGRWVVQRSPTHDPLFESGDVIDIFGPPGGARQRVTP
FT                   DWMLPLILRLNGAPEEKSSLCVNTNQS"
FT   CDS             1037..2506
FT                   /gene="VP1"
FT                   /product="VP1 protein"
FT                   /function="structural protein"
FT                   /db_xref="GOA:E5AX42"
FT                   /db_xref="InterPro:IPR000662"
FT                   /db_xref="InterPro:IPR011222"
FT                   /db_xref="UniProtKB/TrEMBL:E5AX42"
FT                   /protein_id="CBX23450.1"
FT                   /translation="MAPPRKRARCVSTPTKVKCVPKKCPVPTPVPKLLVKGGVEVLNII
FT                   TGPDSTTEIELYLEPRMGINSPTGDKKEWYGYSEVIHHADGYDNNLLSIQMPQYSCARV
FT                   QLPMLNTDMTCDTLMMWEAVSCKTEIVGIGSLISVHLLEAKMAAKEGGDGPSQPIEGMN
FT                   YHMFAVGGEPLDLQGIESNALTKYASAIPPKTIHPNDIAKLAEEEKPQLQGLVPKAKAR
FT                   LDKDGFYPIEEWSPDPSRNENSRYFGSFVGGLNTPPNLQFTNAVTTVLLDENGVGPLCK
FT                   GDGLFVSAADICGVMVKADNGAIRYRGLPRYFKVTLRKRAVKNPYPITSLLGSLFTGLM
FT                   PKMDGQPMTGPDAQIEEVRIYQGKEGLPADPDMKRYIDQFGQEQTPTPTPAAPAAVAAL
FT                   LEKWREKFSEEHKYDTIQHWGSSYPGHLFTEESQKIPKPQETPTQTIPVVTEHHIIDED
FT                   YTSTPTPAPTLTSFGGTTNLEKLPGKDSEEA"
FT   CDS             complement(2548..5064)
FT                   /gene="small t"
FT                   /product="small t antigen"
FT                   /db_xref="GOA:E5AX43"
FT                   /db_xref="InterPro:IPR001623"
FT                   /db_xref="InterPro:IPR003133"
FT                   /db_xref="InterPro:IPR003354"
FT                   /db_xref="InterPro:IPR003593"
FT                   /db_xref="InterPro:IPR010932"
FT                   /db_xref="InterPro:IPR014015"
FT                   /db_xref="InterPro:IPR017910"
FT                   /db_xref="InterPro:IPR027417"
FT                   /db_xref="UniProtKB/TrEMBL:E5AX43"
FT                   /protein_id="CBX23451.1"
FT                   /translation="MDKVLEKSDREILIELLGIPSYAFGNFPIMKTAYKRASKIYHPDK
FT                   GGSSEKMMLLNSLWQKFQEGLVDIRGSEVCHVSFSDCYDVKLLRNCGTVKHFHEIFLRS
FT                   PQCLQKGAAVCNCITSTLFNQHRQIKLLCNKRCLSWGECFCFFCFLTWFGMEDKWESFD
FT                   MWKYVIAEMPTGLLQLPTSKYKFSLLALFLSELLIISLFQIFSESYGSPSFRRRYASWC
FT                   SSVYTNERADNRGDLHCDESPISSSDEEDTQSSGYNSFPFSSTPSTSTASQEVPPSFSE
FT                   PQFPETSSTSGSSSSGRNTEAERESPPKRRRSPEDLDGSYTDSQASFASTPPKQKRQNP
FT                   DSPSDLPSCLFDFVSHAIFSNKTVNAFILYSNFEKASLLFEKIDKFKIEFKSLHKLIEG
FT                   VAIGGGLVLVMTSGKHRLSAVKNYCQQFCTISFLIIKAVLKPLECYQCLCKPPFSQIKA
FT                   NKDGLFSYDFEDRKEENCNWNKVAEFAVSADLDDPLLILAHYLDFAQPFPCLKCENQKT
FT                   KAHDFHKAHHDNAVLFEMCKSQRSICNQASDVVLAKRRLLLQESSREELLAMCFQKQLK
FT                   ALKALDTLDIFDHMAGVAWYANLFENCDELLFQILKLLTQNIPKQRNILFRGPVNSGKT
FT                   TLAAALVDLLGGRSLNVNCPADKINFELGCAIDRFFVVFEDVKGQTMLNKKLQPGQGIS
FT                   NLDNMRDYLDGAVPINLERKHMNKRSQVFPPCVMTMNEYILPQTLYVRFTLKLEFISRP
FT                   NLQAAIEKTPGLTAKRILQKGLTLFLLLIWYTPVSKFTVSLQEEIANWKAIIEKTVSHS
FT                   DFCKMLENIEVGESPLTDIIDEGDIA"
FT   CDS             complement(join(2548..4176,4846..5064))
FT                   /gene="large T"
FT                   /product="large T antigen"
FT                   /db_xref="GOA:E5AX44"
FT                   /db_xref="InterPro:IPR001623"
FT                   /db_xref="InterPro:IPR003133"
FT                   /db_xref="InterPro:IPR003593"
FT                   /db_xref="InterPro:IPR010932"
FT                   /db_xref="InterPro:IPR014015"
FT                   /db_xref="InterPro:IPR016392"
FT                   /db_xref="InterPro:IPR017910"
FT                   /db_xref="InterPro:IPR027417"
FT                   /db_xref="UniProtKB/TrEMBL:E5AX44"
FT                   /protein_id="CBX23452.1"
FT                   /translation="MDKVLEKSDREILIELLGIPSYAFGNFPIMKTAYKRASKIYHPDK
FT                   GGSSEKMMLLNSLWQKFQEGLVDIRGSEGRNTEAERESPPKRRRSPEDLDGSYTDSQAS
FT                   FASTPPKQKRQNPDSPSDLPSCLFDFVSHAIFSNKTVNAFILYSNFEKASLLFEKIDKF
FT                   KIEFKSLHKLIEGVAIGGGLVLVMTSGKHRLSAVKNYCQQFCTISFLIIKAVLKPLECY
FT                   QCLCKPPFSQIKANKDGLFSYDFEDRKEENCNWNKVAEFAVSADLDDPLLILAHYLDFA
FT                   QPFPCLKCENQKTKAHDFHKAHHDNAVLFEMCKSQRSICNQASDVVLAKRRLLLQESSR
FT                   EELLAMCFQKQLKALKALDTLDIFDHMAGVAWYANLFENCDELLFQILKLLTQNIPKQR
FT                   NILFRGPVNSGKTTLAAALVDLLGGRSLNVNCPADKINFELGCAIDRFFVVFEDVKGQT
FT                   MLNKKLQPGQGISNLDNMRDYLDGAVPINLERKHMNKRSQVFPPCVMTMNEYILPQTLY
FT                   VRFTLKLEFISRPNLQAAIEKTPGLTAKRILQKGLTLFLLLIWYTPVSKFTVSLQEEIA
FT                   NWKAIIEKTVSHSDFCKMLENIEVGESPLTDIIDEGDIA"
FT   exon            complement(2548..4176)
FT                   /gene="large T"
FT                   /number=2
FT   intron          complement(4177..4845)
FT                   /gene="large T"
FT                   /number=1
FT   exon            complement(4846..5064)
FT                   /gene="large T"
FT                   /number=1
XX
SQ   Sequence 5064 BP; 1583 A; 986 C; 967 G; 1528 T; 0 other;
     tttacctgcc tagaagacct gtcctgcgcg cctgctgaag caagtaagtg caagtgtccc        60
     taattaggcc tctctccttt ttataagatg aggtggaggc aagaggcctc ctgcctcacc       120
     acaattagta aaaaaaagca tccccttgtc tatgcatgtt tacatgtctg ggagtaaagc       180
     caaggtttag ggcatgcagc caagtaatta ttagcaaccg caggcggcgc acggcagcct       240
     gccaaagaag ttttaattgg aggaagttga ctgtgtgtgt tcgcacggtg acctgccagg       300
     caaacaaaag cagcggggac caggcaggcg aaaacaagct tttactgtaa gtaaactctg       360
     tactttttaa ttttttctag aatgggaggt cttttatcat ctttggtgga tatgattgtg       420
     atggcttcag aactaagtgc agcatctgga ttgactattg aagccctctt aactggagaa       480
     gccctagctg ctttagaagc cgaagttttt tctctcatgg ctgtagaagg cttatcagga       540
     atagaagctt tagctcagtt gggctggact gcggaacaat tttccaacat ggcattcatt       600
     tcaactacat tttctaatgc cataggatat ggagtattgt ttcaaacagt ctcaggaatt       660
     agttcacttg tttccgccgg gataaggttg ggaacaagtg tttcatctgt aaatagacat       720
     caaacagagc aagaattgga gactttattt ggtaaaatag cccattttct tcatgtgaat       780
     ttagcgttcc atctggatcc gtttgattgg tgtggttcca ttggaacaac aatgccttct       840
     gaattttcaa atttaaccct tgatcagctt tcaaaattag ccctaataat tgaaaatggg       900
     agatgggtag ttcaaaggtc ccctactcat gatcctcttt ttgaaagtgg ggatgttatt       960
     gatatttttg ggcctcctgg gggagccaga caaagagtta cacctgactg gatgctccct      1020
     ttaattttaa ggttaaatgg cgcccccgag gaaaagagct cgttgtgtgt caacaccaac      1080
     caaagttaaa tgtgttccca agaagtgtcc tgtgcctaca ccagttccta aacttcttgt      1140
     gaaaggagga gtagaagtcc tcaatataat tactggtcca gattccacta cagaaattga      1200
     actttattta gaacccagga tgggtataaa tagtcctaca ggagataaaa aggaatggta      1260
     tggttacagt gaagttattc atcatgcaga tggttatgac aataatttgc tgagtattca      1320
     aatgcctcaa tatagttgtg caagagttca attacctatg ttgaacacgg acatgacctg      1380
     tgacacatta atgatgtggg aagctgtgtc atgtaaaaca gagatagtag gtattggatc      1440
     tttaattagt gttcacttac tagaagcaaa aatggctgct aaagaaggag gagatggacc      1500
     ctcgcaaccc atagagggta tgaattatca catgtttgca gtaggaggtg aacctctaga      1560
     tttacaaggc atagagagta atgccttaac taaatatgct tcagctatac cacccaaaac      1620
     tatccatcct aatgatatag ctaaattagc tgaagaagaa aagccccagc tgcaaggcct      1680
     agttcctaaa gctaaagcaa gactagataa agatggcttt tatcctattg aagagtggag      1740
     ccctgatcca tctagaaatg aaaattctag atattttgga tcatttgtgg gagggctcaa      1800
     tacacctccc aatttacagt ttacaaatgc tgttacaact gttttgctag acgaaaatgg      1860
     agtaggcccc ttgtgtaaag gagatgggtt gtttgtttca gctgctgata tttgtggtgt      1920
     catggtaaag gcagataatg gggccattag ataccgaggg ctccccagat actttaaagt      1980
     aactttgaga aagagggcag ttaaaaatcc ttacccaata actagtctcc tgggaagcct      2040
     cttcacaggc cttatgccta aaatggatgg acagcctatg acaggaccag atgctcaaat      2100
     tgaagaagtg agaatttatc aagggaaaga aggattgcca gctgacccag acatgaagag      2160
     atacatagat caatttggcc aggaacaaac tcccacaccc acaccagctg cgcctgctgc      2220
     agtagctgct ttgctagaaa agtggaggga aaaattctca gaagagcata agtatgacac      2280
     tattcagcat tggggttcta gttacccagg gcatttattc acagaggaat cccagaaaat      2340
     tcctaaacct caagagacac ccacccaaac tattccagtt gtcactgaac atcacataat      2400
     tgacgaagat tacaccagca ctccaacccc cgcccctacc ttaactagtt tcggcgggac      2460
     tactaacttg gaaaaacttc caggcaaaga ctcagaagaa gcttaaatgt ttattgtcac      2520
     atatcatttc aataaactgt ctttatatca agcaatatct ccttcatcta ttatatcagt      2580
     taaaggactt tctcccactt caatattttc caacatttta caaaaatcag aatgacttac      2640
     agttttttca ataatagctt tccaattggc aatttcttct tgtaaagaaa ctgtgaattt      2700
     actgacagga gtataccaaa ttaacagcaa aaacagagtt agcccctttt gtaaaattct      2760
     tttagcagtt aagccaggag ttttttcaat agctgcttga agattaggcc tgctgataaa      2820
     ttctaatttt aaagtgaatc ttacatataa ggtttgaggt aaaatatatt cattcattgt      2880
     cataacacat ggaggaaaaa cctgacttct tttattcata tgttttcttt ctaaattaat      2940
     aggcactgcg ccatctaaat aatctctcat attatccaga ttagaaatcc cctggcctgg      3000
     ttgcaatttt ttatttaaca tagtttgccc tttcacatct tcaaacacta caaagaatct      3060
     atcaattgca cagccaagtt caaagtttat tttatctgct ggacaattaa cattcaaaga      3120
     tctgcctcct aaaaggtcaa ccagagctgc agctaaagta gtttttccac tgttaactgg      3180
     gcctctaaat aaaatatttc tttgcttagg aatattttga gttagtaatt ttaaaatttg      3240
     aaacagtagt tcatcacaat tttcaaacaa atttgcatac caagctactc cagccatatg      3300
     atcaaatata tctaatgtat ctaaggcctt caaggctttc agttgttttt gaaagcacat      3360
     agctaacaat tcctctcttg aactttcttg taataatagc cttcgtttag ctaacactac      3420
     atcactagcc tgattacaga ttgacctttg acttttacac atttcaaaca gcacagcatt      3480
     atcatggtgg gctttatgaa agtcatgcgc tttagttttc tgattttcac atttgagaca      3540
     aggaaagggc tgagcaaaat ctaaatagtg agctaaaatt aacaaaggat catctaaatc      3600
     tgctgatact gcaaattcag caactttatt ccaattacag ttttcttctt ttctatcttc      3660
     aaagtcataa ctaaataatc catccttatt agctttaatt tgagaaaatg gaggtttgca      3720
     taagcattga taacattcca aaggcttaag tactgctttt attatcagaa aactaatagt      3780
     acaaaattgc tgacagtaat ttttaacagc agaaagccta tgtttaccac tagtcataac      3840
     taaaacaagg cctcctccta ttgctacacc ttctattaat ttatgcaagc tcttaaattc      3900
     tattttaaat ttatcaattt tttcaaataa taaggaggcc ttttcaaagt tactatatag      3960
     aataaatgca tttactgttt tattactaaa tatagcgtga ctgacaaaat caaacaaaca      4020
     agaaggaagg tcagaagggc tatcagggtt ttgccttttt tgttttggtg gtgtacttgc      4080
     aaaacttgct tgcgagtcag tataagatcc atccaaatct tcaggacttc gtcgtctctt      4140
     tggaggagac tctctctcag cctctgtatt tcttcctgaa gaagaacttc cagatgtgga      4200
     agacgtctcg gggaattgag gctcactgaa cgacgggggt acttcttggg aggcagtgga      4260
     ggtggaaggg gtggaagaga aggggaaaga attgtaccca gagctttggg tgtcttcttc      4320
     atcagaagag gagattgggg actcatcgca gtgtaaatct cctctgttgt cagctctttc      4380
     attggtatat actgaggagc accagctggc atatcgtctc ctgaagcttg ggctgccata      4440
     ggactcagag aatatctgaa aaagagaaat tataagtaat tcacttaaaa acagggctaa      4500
     cagtgaaaac ttatacttac tagtaggcaa ttgaagtaaa cctgtaggca tctcagcaat      4560
     cacatatttc cacatatcaa agctctccca tttgtcctcc atgccaaacc atgtcagaaa      4620
     gcaaaaaaag cagaagcatt ctccccagct aagacacctt ttgttacata acaattttat      4680
     ttgtctgtgt tggttaaaca gagtactagt tatgcaattg caaactgcag ctcctttctg      4740
     caagcattga gggcttctaa gaaatatctc atgaaaatgt tttacagttc cacaatttct      4800
     taaaagtttt acatcataac aatcagaaaa agaaacatga catacctctg agcctcttat      4860
     atcaacaaga ccctcttgga atttttgcca cagtgaattt aaaagcatca ttttttcact      4920
     gctgcctcct ttgtcaggat gatatatttt agaagccctt ttataagctg ttttcattat      4980
     aggaaaattt ccaaaagcat agcttggaat tcctaaaagt tctataagta tttctctatc      5040
     acttttttct agtactttgt ccat                                             5064
//


spacer
spacer