ID M18752; SV 1; circular; genomic DNA; STD; VRL; 3323 BP. XX AC M18752; XX DT 01-DEC-1990 (Rel. 26, Created) DT 17-APR-2005 (Rel. 83, Last updated, Version 5) XX DE Woodchuck hepatitis virus (WHV), complete genome, clone WHV 7. XX KW coat protein; complete genome; core protein; DNA polymerase; KW envelope-associated protein; origin of replication; polymerase. XX OS Woodchuck hepatitis virus OC Viruses; Hepadnaviridae; Orthohepadnavirus. XX RN [1] RP 1-3323 RX DOI; 10.1016/0042-6822(88)90389-3. RX PUBMED; 3336938. RA Cohen J.I., Miller R.H., Rosenblum B., Denniston K., Gerin J.L., RA Purcell R.H.; RT "Sequence comparison of woodchuck hepatitis virus replicative forms shows RT conservation of the genome"; RL Virology 162(1):12-20(1988). XX DR MD5; 2433731dab60c73401e0f6987f3e8db1. DR EuropePMC; PMC2643773; 19073743. DR EuropePMC; PMC5341730; 27903772. DR GOA; P0C6J5. DR InterPro; IPR002006; Hepatitis_core. DR InterPro; IPR013195; Hepatitis_B_virus_capsid_N. DR RFAM; RF01047; HBV_epsilon. DR UniProtKB/Swiss-Prot; P0C6J5; HBEAG_WHV4. XX FH Key Location/Qualifiers FH FT source 1..3323 FT /organism="Woodchuck hepatitis virus" FT /mol_type="genomic DNA" FT /db_xref="taxon:35269" FT CDS join(2427..3323,1..1758) FT /codon_start=1 FT /product="DNA polymerase" FT /db_xref="GOA:P12898" FT /db_xref="InterPro:IPR000201" FT /db_xref="InterPro:IPR000477" FT /db_xref="InterPro:IPR001462" FT /db_xref="InterPro:IPR037531" FT /db_xref="UniProtKB/Swiss-Prot:P12898" FT /protein_id="AAA46767.1" FT /translation="MHPFSRLFRNIQSLGEEEVQELLGPPEDALPLLAGEDLNHRVADA FT LNLHLPTADLQWVHKTNAITGLYSNQAAQFNPHWIQPEFPELHLHNDLIQKLQQYFGPL FT TINEKRKLQLNFPARFFPKATKYFPLIKGIKNNYPNFALEHFFATANYLWTLWEAGILY FT LRKNQTTLTFKGKPYSWEHRQLVQHNGQQHKSHLQSRQNSSMVACSGHLLHNHLSSESV FT SVSTRNLSNNISDKSQKSTRTGLCSYKQIQTDRLEHLARISCGSKITIGQQGSSPKTLY FT KSISSNFRNQTWAYNSSRNSGHTTWFSSASNSNKSRSREKAYSSNSTSKRYSPPLNYEK FT SDFSSPGVRRRITRLDNNGTPTQCLWRSFYNTKPCGSYCIHHIVSSLDDWGPCTVTGDV FT TIKSPRTPRRITGGVFLVDKNPNNSSESRLVVDFSQFSRGHTRVHWPKFAVPNLQTLAN FT LLSTNLQWLSLDVSAAFYHIPISPAAVPHLLVGSPGLERFNTCLSSSTHNRNNSQLQTM FT HNLCTRHVYSSLLLLFKTYGRKLHLLAHPFIMGFRKLPMGVGLSPFLLAQFTSALASMV FT RRNFPHCVVFAYMDDLVLGARTSEHLTAIYSHICSVFLDLGIHLNVNKTKWWGNHLHFM FT GYVITSSGVLPQDKHVKKISRYLRSVPVNQPLDYKICERLTGILNYVAPFTLCGYAALM FT PLYHAITSRTAFIFSSLYKSWLLSLYEELWPVVRQRGVVCTVFADATPTGWGIATTYQL FT LSGTFAFPLPIATAELIAACLARCWTGARLLGTDNSVVLSGKLTSFPWLLACVANWILR FT GTSFCYVPSALNPADLPSRGLLPVLRPLPRLRLRPQTSRISLWAASPPVSPRRPVRVAW FT SSPVQNCEPWIPP" FT sig_peptide join(2992..3323,1..295) FT /note="pre-surface protein" FT CDS join(2992..3323,1..964) FT /codon_start=1 FT /product="surface protein" FT /note="precursor" FT /db_xref="GOA:P12909" FT /db_xref="InterPro:IPR000349" FT /db_xref="UniProtKB/Swiss-Prot:P12909" FT /protein_id="AAA46766.1" FT /translation="MGNNIKVTFNPDKIAAWWPAVGTYYTTTYPQNQSVFQPGIYQTTS FT LINPKNQQELDSVLINRYKQIDWNTWQGFPVDQKLPLVSRDPPPKPYINQSAQTFEIKP FT GPIIVPGIRDIPRGLVPPQTPTNRDQGRKPTPPTPPLRDTHPHLTMKNQTFHLQGFVDG FT LRDLTTTERQHNAYGDPFTTLSPAVPTVSTILSPPSTTGDPALSPEMSPSSLLGLLAGL FT QVVYFLWTKILTIAQNLDWWWTSLSFPGGIPECTGQNSQFQTCKHLPTSCPPTCNGFRW FT MYLRRFIIYLLVLLLCLIFLLVLLDWKGLIPVCPLQPTTETTVNCRQCTISAQDMYTPP FT YCCCLKPTAGNCTCWPIPSSWALGNYLWEWALARFSWLNLLVPLLQWLGGISLIAWFLL FT IWMIWFWGPALLSILPPFIPIFVLFFLIWVYI" FT mat_peptide 296..961 FT /product="surface protein" FT CDS 1503..1928 FT /codon_start=1 FT /product="X protein" FT /db_xref="GOA:P12913" FT /db_xref="InterPro:IPR000236" FT /db_xref="UniProtKB/Swiss-Prot:P12913" FT /protein_id="AAA46768.1" FT /translation="MAARLCCQLDSARDVLLLRPFGPQSSGPSFPRPAAGSAASSASSP FT SPSDESDLPLGRLPACFASASGPCCLVFTCAELRTMDSTVNFVSWHANRQLGMPSKDLW FT TPYIKDQLLTKWEEGSIDPRLSIFVLGGCRHKCMRLL" FT CDS 2021..2587 FT /codon_start=1 FT /product="core protein" FT /db_xref="GOA:P69710" FT /db_xref="InterPro:IPR002006" FT /db_xref="InterPro:IPR036459" FT /db_xref="UniProtKB/Swiss-Prot:P69710" FT /protein_id="AAA46769.1" FT /translation="MDIDPYKEFGSSYQLLNFLPLDFFPDLNALVDTATALYEEELTGR FT EHCSPHHTAIRQALVCWDELTKLIAWMSSNITSEQVRTIIVNHVNDTWGLKVRQSLWFH FT LSCLTFGQHTVQEFLVSFGVWIRTPAPYRPPNAPILSTLPEHTVIRRRGGARASRSPRR FT RTPSPRRRRSQSPRRRRSQSPSANC" XX SQ Sequence 3323 BP; 845 A; 817 C; 661 G; 1000 T; 0 other; aattcgggac ataccacgtg gtttagttcc gcctcaaact ccaacaaatc gagatcaagg 60 gagaaagcct actcctccaa ctccacctct aagagatact cacccccact taactatgaa 120 aaatcagact tttcatctcc aggggttcgt agacggatta cgagacttga caacaacgga 180 acgccaacac aatgcctatg gagatccttt tacaacacta agccctgcgg ttcctactgt 240 atccaccata ttgtctcctc cctcgacgac tggggaccct gcactgtcac cggagatgtc 300 accatcaagt ctcctaggac tcctcgcagg attacaggtg gtgtatttct tgtggacaaa 360 aatcctaaca atagctcaga atctagattg gtggtggact tctctcagtt ttccaggggg 420 cataccagag tgcactggcc aaaattcgca gttccaaact tgcaaacact tgccaacctc 480 ctgtccacca acttgcaatg gctttcgttg gatgtatctg cggcgtttta tcatatacct 540 attagtcctg ctgctgtgcc tcatcttctt gttggttctc ctggactgga aaggtttaat 600 acctgtctgt cctcttcaac ccacaacaga aacaacagtc aattgcagac aatgcacaat 660 ctctgcacaa gacatgtata ctcctcctta ctgttgttgt ttaaaaccta cggcaggaaa 720 ttgcacttgt tggcccatcc cttcatcatg ggctttagga aattacctat gggagtgggc 780 cttagcccgt ttctcttggc tcaatttact agtgcccttg cttcaatggt taggaggaat 840 ttccctcatt gcgtggtttt tgcttatatg gatgatttgg ttttgggggc ccgcacttct 900 gagcatctta ccgccattta ttcccatatt tgttctgttt ttcttgattt gggtatacat 960 ttgaatgtca ataaaacaaa atggtggggc aatcatctac atttcatggg atatgtgatt 1020 actagttcag gtgtattgcc acaagacaaa catgttaaga aaatttcccg ttatttgcgc 1080 tctgttcctg ttaatcaacc tctggattac aaaatttgtg aaagattgac tggtattctt 1140 aactatgttg ctccttttac gctatgtgga tacgctgctt taatgccttt gtatcatgct 1200 attacttccc gtacggcttt cattttctcc tccttgtata aatcctggtt gctgtctctt 1260 tatgaggagt tgtggcccgt tgtcaggcaa cgtggcgtgg tgtgcactgt gtttgctgac 1320 gcaaccccca ctggttgggg cattgccacc acctatcaac tcctttccgg gactttcgct 1380 ttccccctcc ctattgccac ggcggaactc attgccgcct gccttgcccg ctgctggaca 1440 ggggctcggc tgttgggcac tgacaattcc gtggtgttgt cggggaagct gacgtccttt 1500 ccatggctgc tcgcctgtgt tgccaactgg attctgcgcg ggacgtcctt ctgctacgtc 1560 ccttcggccc tcaatccagc ggaccttcct tcccgcggcc tgctgccggt tctgcggcct 1620 cttccgcgtc ttcgccttcg ccctcagacg agtcggatct ccctttgggc cgcctccccg 1680 cctgtttcgc ctcggcgtcc ggtccgtgtt gcttggtctt cacctgtgca gaattgcgaa 1740 ccatggattc caccgtgaac tttgtctcct ggcatgcaaa tcgtcaactt ggcatgccaa 1800 gtaaggacct ttggactcct tatataaaag atcaattatt aactaaatgg gaggagggca 1860 gcattgatcc tagattatca atatttgtat taggaggctg taggcataaa tgcatgcgac 1920 ttctgtaacc atgtatcttt ttcacctgtg ccttgttttt gcctgtgttc catgtcctac 1980 ttttcaagcc tccaagctgt gccttggatg gctttggggc atggacatag atccctataa 2040 agaatttggt tcatcttatc agttgttgaa ttttcttcct ttggacttct ttcctgacct 2100 taatgctttg gtggacactg ctactgcctt gtatgaagaa gagctaacag gtagggaaca 2160 ttgctctccg caccatacag ctattagaca agctttagta tgctgggatg aattaactaa 2220 attgatagct tggatgagct ctaacataac ttctgaacaa gtaagaacaa tcatagtaaa 2280 tcatgtcaat gatacctggg gacttaaggt gagacaaagt ttatggtttc atttgtcatg 2340 tctcactttt ggacaacata cagttcaaga atttttagta agttttggag tatggatcag 2400 aactccagct ccatatagac ctcctaatgc acccattctc tcgactcttc cggaacatac 2460 agtcattagg agaagaggag gtgcaagagc ttctaggtcc cccagaagac gcactccctc 2520 tcctcgcagg agaagatctc aatcaccgcg tcgcagacgc tctcaatctc catctgccaa 2580 ctgctgatct tcaatgggta cataaaacta atgctattac aggtctttac tctaaccaag 2640 ctgctcagtt caatccgcat tggattcaac ctgagtttcc tgaacttcat ttacataatg 2700 atttaattca aaaattgcaa cagtattttg gtcctttgac tataaatgaa aagagaaaat 2760 tgcaattaaa ttttcctgcc agatttttcc ccaaagctac taaatatttc cctttaatta 2820 aaggcataaa aaacaattat cctaattttg ctttagaaca tttctttgct accgcaaatt 2880 atttgtggac tttatgggaa gctggaattt tgtatttaag gaagaatcaa acaactttga 2940 cttttaaagg taaaccatat tcttgggaac acagacagct agtgcaacat aatgggcaac 3000 aacataaaag tcaccttcaa tccagacaaa atagcagcat ggtggcctgc agtgggcact 3060 tattacacaa ccacttatcc tcagaatcag tcagtgtttc aaccaggaat ttatcaaaca 3120 acatctctga taaatcccaa aaatcaacaa gaactggact ctgttcttat aaacagatac 3180 aaacagatag actggaacac ttggcaagga tttcctgtgg atcaaaaatt accattggtc 3240 agcagggatc ctcccccaaa accttatata aatcaatcag ctcaaacttt cgaaatcaaa 3300 cctgggccta taatagttcc cgg 3323 //