spacer
spacer

EBI Dbfetch

ID   GQ477520; SV 1; linear; genomic DNA; STD; VRL; 1203 BP.
XX
AC   GQ477520;
XX
DT   19-OCT-2009 (Rel. 102, Created)
DT   19-OCT-2009 (Rel. 102, Last updated, Version 1)
XX
DE   Hepatitis B virus isolate P62 large S protein, middle S protein, and S
DE   protein genes, complete cds.
XX
KW   .
XX
OS   Hepatitis B virus
OC   Viruses; Retro-transcribing viruses; Hepadnaviridae; Orthohepadnavirus.
XX
RN   [1]
RP   1-1203
RA   Grabarczyk P., Garmiri P., Liszewski G., Doucet D., Sulkowska E.,
RA   Brojer E., Allain J.-P.;
RT   "Molecular and serological characterization of Hepatitis B virus genotype A
RT   and D infected blood donors in Poland";
RL   Unpublished.
XX
RN   [2]
RP   1-1203
RA   Grabarczyk P., Garmiri P., Liszewski G., Doucet D., Sulkowska E.,
RA   Brojer E., Allain J.-P.;
RT   ;
RL   Submitted (13-AUG-2009) to the EMBL/GenBank/DDBJ databases.
RL   Department of Immunohaematology, Institute of Haematology and Transfusion
RL   Medicine, 5 Chocimska Street, Warsaw 00-957, Poland
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1203
FT                   /organism="Hepatitis B virus"
FT                   /host="Homo sapiens"
FT                   /isolate="P62"
FT                   /mol_type="genomic DNA"
FT                   /country="Poland"
FT                   /isolation_source="blood donor"
FT                   /collection_date="2006"
FT                   /note="subtype: A2; genotype: A"
FT                   /db_xref="taxon:10407"
FT   CDS             1..1203
FT                   /codon_start=1
FT                   /product="large S protein"
FT                   /note="pre-S1/pre-S2/S"
FT                   /db_xref="UniProtKB/TrEMBL:D0EEV3"
FT                   /protein_id="ACX69667.1"
FT                   /translation="MGGWSSKPRKGMGTNLSVPNPLGFFPDHQLDPAFGANSNNPDWDF
FT                   NPIKDHWPAANQVGVGAFGPGLTPPHGGILGWSPQAQGILTTMSTIPPPASTNRQSGRQ
FT                   PTPISPPLRDSHPQAMQWNSTAFHQALQDPRVRGLHSPAGGSSSGTVNPAPNIASHISS
FT                   ISARTGDPVTNMENITSGFLGPLLVLQAGFFLLTRILTIPQSLDSWWTSLNFLGGSPVC
FT                   LGQNSQSPTSNHSPTSCPPICPGYRWMCLRRFIIFLFILLLCLIFLLVLLDYQGMLPVC
FT                   PLIPGSTTTSTGPCKTCTTPAQGNSMFPSCCCTKPTDGNCTCIPIPSSWAFAKYLWEWA
FT                   SVRFSWLSLLVPFVQWFVGLSPTVWLSAIWMMWYWGPSLYSIVSPFIPLLPIFFCLWVY
FT                   I"
FT   CDS             358..1203
FT                   /codon_start=1
FT                   /product="middle S protein"
FT                   /note="preS2/S"
FT                   /db_xref="UniProtKB/TrEMBL:D0EEV4"
FT                   /protein_id="ACX69668.1"
FT                   /translation="MQWNSTAFHQALQDPRVRGLHSPAGGSSSGTVNPAPNIASHISSI
FT                   SARTGDPVTNMENITSGFLGPLLVLQAGFFLLTRILTIPQSLDSWWTSLNFLGGSPVCL
FT                   GQNSQSPTSNHSPTSCPPICPGYRWMCLRRFIIFLFILLLCLIFLLVLLDYQGMLPVCP
FT                   LIPGSTTTSTGPCKTCTTPAQGNSMFPSCCCTKPTDGNCTCIPIPSSWAFAKYLWEWAS
FT                   VRFSWLSLLVPFVQWFVGLSPTVWLSAIWMMWYWGPSLYSIVSPFIPLLPIFFCLWVYI
FT                   "
FT   CDS             523..1203
FT                   /codon_start=1
FT                   /product="S protein"
FT                   /note="HBsAg"
FT                   /db_xref="InterPro:IPR000349"
FT                   /db_xref="UniProtKB/TrEMBL:Q773S4"
FT                   /protein_id="ACX69669.1"
FT                   /translation="MENITSGFLGPLLVLQAGFFLLTRILTIPQSLDSWWTSLNFLGGS
FT                   PVCLGQNSQSPTSNHSPTSCPPICPGYRWMCLRRFIIFLFILLLCLIFLLVLLDYQGML
FT                   PVCPLIPGSTTTSTGPCKTCTTPAQGNSMFPSCCCTKPTDGNCTCIPIPSSWAFAKYLW
FT                   EWASVRFSWLSLLVPFVQWFVGLSPTVWLSAIWMMWYWGPSLYSIVSPFIPLLPIFFCL
FT                   WVYI"
XX
SQ   Sequence 1203 BP; 259 A; 349 C; 266 G; 329 T; 0 other;
     atgggaggtt ggtcatcaaa acctcgcaaa ggcatgggga cgaatctttc tgttcccaac        60
     cctctgggat tctttcccga tcatcagttg gacccggcat tcggagccaa ctcaaacaat       120
     ccagattggg acttcaaccc catcaaggac cactggccag cagccaacca ggtaggagtg       180
     ggagcattcg ggccagggct cacccctcca cacggcggta ttttggggtg gagccctcag       240
     gctcagggca tattgaccac aatgtcaaca attcctcctc ctgcctccac caatcggcag       300
     tcaggaaggc agcctactcc catctctcca cctctaagag acagtcatcc tcaggccatg       360
     cagtggaatt ccactgcctt ccaccaagct ctacaggatc ccagagtcag gggtctgcat       420
     tctcctgctg gtggctccag ttcaggaaca gtaaaccctg ctccgaatat tgcctctcac       480
     atctcgtcaa tctccgcgag gactggggac cctgtgacga acatggagaa catcacatca       540
     ggattcctag gacccctgct cgtgttacag gcggggtttt tcttgttgac aagaatcctc       600
     acaataccgc agagtctaga ctcgtggtgg acttctctca attttctagg gggatcaccc       660
     gtgtgtcttg gccaaaattc gcagtcccca acctccaatc actcaccaac ctcctgtcct       720
     ccaatttgtc ctggttatcg ctggatgtgt ctgcggcgtt ttatcatatt cctcttcatc       780
     ctgctgctat gcctcatctt cttattggtt cttctggatt atcaaggtat gttgcccgtt       840
     tgtcctctaa ttccaggatc aacaacaacc agtacgggac catgcaaaac ctgcacgact       900
     cctgctcaag gcaactctat gtttccctca tgttgctgta caaaacctac ggatggaaat       960
     tgcacctgta ttcccatccc atcgtcctgg gctttcgcaa aatacctatg ggagtgggcc      1020
     tcagtccgtt tctcttggct cagtttacta gtgccatttg ttcagtggtt cgtagggctt      1080
     tcccccactg tttggctttc agctatatgg atgatgtggt attgggggcc aagtctgtac      1140
     agcatcgtga gtccctttat accgctgtta ccaattttct tttgtctctg ggtatacatt      1200
     taa                                                                    1203
//


  
spacer
spacer