Dbfetch

ID   ON263102; SV 1; linear; genomic DNA; STD; HUM; 4094 BP.
XX
AC   ON263102;
XX
DT   14-JUN-2023 (Rel. 144, Created)
DT   15-JUN-2023 (Rel. 144, Last updated, Version 1)
XX
DE   Homo sapiens MHC class I protein (HLA-B) gene, HLA-B-B*15extended allele,
DE   complete cds.
XX
KW   .
XX
OS   Homo sapiens (human)
OC   Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Mammalia;
OC   Eutheria; Euarchontoglires; Primates; Haplorrhini; Catarrhini; Hominidae;
OC   Homo.
XX
RN   [1]
RP   1-4094
RA   Khor S.-S., Ito I., Sato T., Tokunaga K.;
RT   ;
RL   Submitted (17-APR-2022) to the INSDC.
RL   Genome Medical Science Project, National Center for Global Health and
RL   Medicine, Toyama 1-21-1, Shinjuku Ward, Tokyo 162-8655, Japan
XX
DR   MD5; 87b7ce735c456d38e99179410edec425.
XX
CC   ##Assembly-Data-START##
CC   Assembly Method       :: NGSengine v. 2.25.0.25342
CC   Sequencing Technology :: PacBio
CC   ##Assembly-Data-END##
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..4094
FT                   /organism="Homo sapiens"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:9606"
FT   gene            <1..>4094
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT   mRNA            join(<1..357,487..756,1002..1277,1853..2128,2233..2349,
FT                   2791..2823,2930..>4094)
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT                   /product="MHC class I protein"
FT   exon            <1..357
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT                   /number=1
FT   5'UTR           <1..284
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT   CDS             join(285..357,487..756,1002..1277,1853..2128,2233..2349,
FT                   2791..2823,2930..2973)
FT                   /codon_start=1
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT                   /product="MHC class I protein"
FT                   /protein_id="WCC58481.1"
FT                   /translation="MRVTAPRTVLLLLSGALALTETWAGSHSMRYFYTAMSRPGRGEPR
FT                   FIAVGYVDDTQFVRFDSDAASPRMAPRAPWIEQEGPEYWDRETQISKTNTQTYRESLRN
FT                   LRGYYNQSEAGSHTLQRMYGCDVGPDGRLLRGHDQSAYDGKDYIALNEDLSSWTAADTA
FT                   AQITQRKWEAAREAEQWRAYLEGLCVEWLRRYLENGKETLQRADPPKTHVTHHPISDHE
FT                   ATLRCWALGFYPAEITLTWQRDGEDQTQDTELVETRPAGDRTFQKWAAVVVPSGEEQRY
FT                   TCHVQHEGLPKPLTLRWEPSSQSTIPIVGIVAGLAVLAVVVIGAVVATVMCRRKSSGGK
FT                   GGSYSQAASSDSAQGSDVSLTA"
FT   exon            487..756
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT                   /number=2
FT   exon            1002..1277
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT                   /number=3
FT   exon            1853..2128
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT                   /number=4
FT   exon            2233..2349
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT                   /number=5
FT   exon            2791..2823
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT                   /number=6
FT   exon            2930..>4094
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
FT                   /number=7
FT   3'UTR           2974..>4094
FT                   /gene="HLA-B"
FT                   /allele="B*15extended"
XX
SQ   Sequence 4094 BP; 770 A; 1151 C; 1240 G; 933 T; 0 other;
     gatcaggacg aagtcccagg tcccggacgg ggctctcagg gtctcaggct ccgagagcct        60
     tgtctgcatt ggggaggcgc agcgttgggg attccccact cccacgagtt tcacttcttc       120
     tcccaaccta tgtcgggtcc ttcttccagg atactcgtga cgcgtcccca tttcccactc       180
     ccattgggtg tcgggtgtct agagaagcca atcagtgtcg ccggggtccc agttctaaag       240
     tccccacgca cccacccgga ctcaaaatct cctcagacgc cgagatgcgg gtcacggcgc       300
     cccgaaccgt cctcctgctg ctctcgggag ccctggccct gaccgagacc tgggccggtg       360
     agtgcggggt cggcagggaa atggcctctg tggggaggag cgaggggacc gcaggcgggg       420
     gcgcaggacc cggggagccg cgccgggagg agggtcgggc gggtctcagc ccctcctcgc       480
     ccccaggctc ccactccatg aggtatttct acaccgccat gtcccggccc ggccgcgggg       540
     agccccgctt catcgcagtg ggctacgtgg acgacaccca gttcgtgagg ttcgacagcg       600
     acgccgcgag tccgaggatg gcgccccggg cgccatggat agagcaggag gggccggagt       660
     attgggaccg ggagacacag atctccaaga ccaacacaca gacttaccga gagagcctgc       720
     ggaacctgcg cggctactac aaccagagcg aggccggtga gtgaccccgg cctggggcgc       780
     aggtcacgac tccccatccc ccacgtacgg cccgggtcgc cccgagtctc cgggtccgag       840
     atccgccccc ctgaggccgc gggacccgcc caaaccctcg accggcgaga gccccaggcg       900
     cgtttacccg gtttcatttt cagttgaggc caaaatcccc gcgggttggt cggggcgggg       960
     cggggctcgg gggacggggc tgaccgcggg gcctgggcca gggtctcaca ccctccagag      1020
     gatgtacggc tgcgacgtgg ggccggacgg gcgcctcctc cgcgggcatg accagtccgc      1080
     ctacgacggc aaggattaca tcgccctgaa cgaggacctg agctcctgga ccgcggcgga      1140
     cacggcggct cagatcaccc agcgcaagtg ggaggcggcc cgtgaggcgg agcagtggag      1200
     agcctacctg gagggcctgt gcgtggagtg gctccgcaga tacctggaga acgggaagga      1260
     gacgctgcag cgcgcgggta ccaggggcag tggggagcct tccccatctc ctataggtcg      1320
     ccggggatgg cctcccacga gaagaggagg aaaatgggat cagcgctaga atgtcgccct      1380
     cccttgaatg gagaatggca tgagttttcc tgagtttcct ctgagggccc cctcttctct      1440
     ctaggacaat taagggatga cgtctctgag gaaatggagg ggaagacagt ccctaggata      1500
     gtgatcaggg gtcccctttg acccctgcag cagccttggg aaccgtgact tttcctctca      1560
     ggccttgttc tctgcctcac actcagtgtg tttggggctc tgattccagc acttctgagt      1620
     cactttacct ccactcagat caggagcaga agtccctgtt ccccgctcag agactcgaac      1680
     tttccaatga ataggagatt atcccaggtg cctgcgtcca ggctggtgtc tgggttctgt      1740
     gccccttccc caccccaggt gtcctgtcca ttctcaggct ggtcacatgg gtggtcctag      1800
     ggtgtcccat gagagatgca aagcgcctga attttctgac tcttcccatc agacccccca      1860
     aagacacatg tgacccacca ccccatctct gaccatgagg ccaccctgag gtgctgggcc      1920
     ctgggcttct accctgcgga gatcacactg acctggcagc gggatggcga ggaccaaact      1980
     caggacaccg agcttgtgga gaccagacca gcaggagata gaaccttcca gaagtgggca      2040
     gctgtggtgg tgccttctgg agaagagcag agatacacat gccatgtaca gcatgagggg      2100
     ctgccgaagc ccctcaccct gagatggggt aaggaggggg atgaggggtc atatctgttc      2160
     tcagggaaag caggagccct tctggagccc ttcagcaggg tcagggcccc tcatcttccc      2220
     ctcctttccc agagccatct tcccagtcca ccatccccat cgtgggcatt gttgctggcc      2280
     tggctgtcct agcagttgtg gtcatcggag ctgtggtcgc tactgtgatg tgtaggagga      2340
     agagctcagg tagggaaggg gtgaggggtg gggtctgggt tttcttgtcc cactgggggt      2400
     ttcaagcccc aggtagaagt gttccctgcc tcattactgg gaagcagcat ccacacaggg      2460
     gctaacgcag cctgggaccc tgtgtgccag cacttactct tttgtgcagc acatgtgaca      2520
     atgaaggaca gatgtatcgc cttgatggtt gtggtgttgg ggtcctgatt ccagcattca      2580
     tgagtcaggg gaaggtccct gctaaggaca gaccttagga gggcagttgg tccaggaccc      2640
     acacttgctt tcctcgtgtt tcctgatcct gccctgggtc tgtagtcata cttctggaaa      2700
     ttccttttgg ttccaagacg aggaggttcc tctaagatct catggtcctg cttcctccca      2760
     gtcccctcac aggacatttt cttcccacag gtggaaaagg agggagctac tctcaggctg      2820
     cgtgtaagtg gtgggggtgg gagtgtggag gagctcaccc accccataat tcctcctgtc      2880
     ccacgtctcc tgcgggctct gaccaggtcc tgtttttgtt ctactccagc cagcgacagt      2940
     gcccagggct ctgatgtgtc tctcacagct tgaaaaggtg agattcttgg ggtctagagt      3000
     gggtggggtg gcgggtctgg gggtgggtgg ggcagtgggg aaaggcctgg gtaatggaga      3060
     ttctttgatt gggatgtttc gcgtgtgtcg tgggctgttc agagtgtcat cacttaccat      3120
     gactaaccag aatttgttca tgactgttgt tttctgtagc ctgagacagc tgtcttgtga      3180
     gggaccgaga tgcaggattt cttcacgcct cccctttgtg acttcaagag cctctggcat      3240
     ctctttctgc aaaggcacct gaatgtgtct gcgtccctgt tagcataatg tgaggaggtg      3300
     gagagacagc ccacccttgt gtccactgtg acccctgttc ccatgctgat ctgtgtttcc      3360
     tccccagtca tctttcttgt tccagagagg tggggctgga tgtctccatc tctgtctcaa      3420
     ctttatgtgc actgagctgc aacttcttac ttccctactg aaaataagaa tctgaatata      3480
     aatttgtttt ctcaaatatt tgctatgaga ggttgatgga ttaattaaat aagtcaattc      3540
     ctggaatttg aaagagcaaa taaagacctg agaaccttcc agaatctgca tgttcgctgt      3600
     gctgagtctg ttgcaggtgg ggtgtggaga aggctgtggg gggccgagtg tggatggggc      3660
     ctgtgcccat ttggtgttga gtccatcatg ggctttatgt ggttagtcgt cagctgggtc      3720
     accttcactg ctccattgtc cttgtccctt cagtggaaac ttgtccagtg ggagctgtga      3780
     ccacagaggc tcacacatcg cccagggcgg cccctgcaca cgggggtctc tgtgcattct      3840
     gagacaaatt ttcagagcca ttcacctcct gctctgcttc tagagctcct tttctgctct      3900
     gctcttctgc cctctctccc tgccctggtt ctagtgatct tggtgctgaa tccaatccca      3960
     actcatgaat ctgtaaagca gagtctaatt tagacttaca tttgtctgtg aaattggacc      4020
     catcatcaag gactgttctt tcctgaagag agaacctgat tgtgtgctgc agtgtgctgg      4080
     ggcagggggt gcgg                                                        4094
//