Dbfetch

ID   HLA00401; SV 1; standard; DNA; HUM; 4304 BP.
XX
AC   HLA00401;
XX
SV   HLA00401.1
XX
DT   14-NOV-1991 (Rel. 1.0.0, Created, Version 1)
DT   16-JAN-2024 (Rel. 3.55.0, Last Updated, Version 1)
XX
DE   HLA-C*01:02:01:01, Human MHC Class I sequence
XX
KW   Human MHC; HLA; Class I; HLA-C; Allele; HLA-C*01:02:01:01;
XX
OS   Homo Sapiens (human)
OC   Eukaryota; Metazoa; Chordata; Vertebrata; Mammalia; Eutheria; Primates;
OC   Catarrhini; Hominidae; Homo.
XX
CC   --------------------------------------------------------------------------
CC   IPD-IMGT/HLA Release Version 3.55.0
CC   --------------------------------------------------------------------------
CC   Copyrighted by the IPD-IMGT/HLA Database, Distributed under the Creative
CC   Commons Attribution-NoDerivs License, see;
CC   http://www.ebi.ac.uk/ipd/imgt/hla/licence/ for further details.
CC   --------------------------------------------------------------------------
XX
RN   [1]
RP   1-4304
RX   PUBMED; 3032784.
RA   Gussow D, Rein RS, Meijer I, de Hoog W, Seemann GH, Hochstenbach FM, Ploegh
RA   HL;
RT   "Isolation, expression, and the primary structure of HLA-Cw1 and HLA-Cw2
RT   genes: evolutionary aspects.";
RL   Immunogenetics 25:313-322(1987).
XX
RN   [2]
RP   1-4304
RX   PUBMED; 1384166.
RA   Zemmour J, Gumperz JE, Hildebrand WH, Ward FE, Marsh SGE, Williams RC,
RA   Parham P;
RT   "The molecular basis for reactivity of anti-Cw1 and anti-Cw3 alloantisera
RT   with HLA-B46 haplotypes.";
RL   Tissue Antigens 39:249-257(1992).
XX
RN   [3]
RP   1-4304
RX   PUBMED; 7871529.
RA   Steinle A, Schendel DJ;
RT   "HLA class I alleles of LCL 721 and 174 x CEM.T2 (T2).";
RL   Tissue Antigens 44:268-270(1994).
XX
RN   [4]
RP   1-4304
RX   PUBMED; 9062969.
RA   Wang H, Tokunaga K, Akaza T, Tadokoro K, Shibata Y, Juji T;
RT   "Identification of HLA-C alleles using PCR-single-strand-conformation
RT   polymorphism and direct sequencing.";
RL   Tissue Antigens 49:134-140(1997).
XX
RN   [5]
RP   1-4304
RX   PUBMED; 12622774.
RA   Cox ST, McWhinnie AJ, Robinson J, Marsh SGE, Parham P, Madrigal JA, Little
RA   AM;
RT   "Cloning and sequencing full-length HLA-B and -C genes.";
RL   Tissue Antigens 61:20-48(2003).
XX
RN   [6]
RP   1-4304
RX   PUBMED; 20196829.
RA   Xu YP, Yang B, Zeng J, Wang D, Deng Z;
RT   "Characterization of the genomic full-length sequence of HLA-Cw*010201,
RT   Cw*0706 and Cw*0801 in Chinese individuals.";
RL   Tissue Antigens 75:179-181(2010).
XX
RN   [7]
RP   1-4304
RX   PUBMED; 21585707.
RA   Zhu F, He Y, Zhang W, He J, He J, Xu X, Lv H, Yan L;
RT   "Analysis for complete genomic sequence of HLA-B and HLA-C alleles in the
RT   Chinese Han population.";
RL   International Journal of Immunogenetics 38:281-284(2011).
XX
RN   [8]
RP   1-4304
RX   PUBMED; 21658009.
RA   Xu Y, Deng Z, OhUign C, Wang D, Gao S, Zend J, Yang B, Jin S, Zou H;
RT   "Charaterization and polymorphic analysis of 4.5 kb genomic full-length
RT   HLA-C in Chinese Han population.";
RL   Tissue Antigens 78:102-114(2011).
XX
RN   [9]
RP   1-4304
RX   PUBMED; 30337930.
RA   Suzuki S, Ranade S, Osaki K, Iyo S, Shigenari A, Ohnuki Y, Oka A, Masuya A,
RA   Harting J, Baybayan P, Kitazume M, Sunaga J, Morishima S, Morishima Y,
RA   Inoko H, Kulski JK, Shiina T;
RT   "Reference grade characterization of polymorphisms in full-length HLA class
RT   I and II genes with short-read sequencing on the ION PGM system and
RT   long-reads generated by single molecule, real-time sequencing on the PacBio
RT   platform.";
RL   Frontiers in Immunology 9:2294(2018).
XX
CC   --------------------------------------------------------------------------
CC   The sequence below is the official allele sequence as approved by the
CC   WHO Nomenclature Committee for Factors of the HLA System.
CC   Any cross references may differ from the sequence shown below.
CC   --------------------------------------------------------------------------
XX
DR   EMBL; AJ420242; AJ420242.1.
DR   EMBL; D50852; D50852.1.
DR   EMBL; FJ515900; FJ515900.1.
DR   EMBL; FJ827032; FJ827032.1.
DR   EMBL; HG794388; HG794388.1.
DR   EMBL; HM543696; HM543696.1.
DR   EMBL; KU319215; KU319215.1.
DR   EMBL; LC257747; LC257747.1.
DR   EMBL; M16272; M16272.1.
DR   EMBL; M84171; M84171.1.
DR   EMBL; Z46809; Z46809.1.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..4304
FT                   /organism="Homo sapiens"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:9606"
FT                   /ethnic="Asian, European, Native American, Undefined"
FT                   /cell_line="009386"
FT                   /cell_line="08009391"
FT                   /cell_line="AP"
FT                   /cell_line="BRUG"
FT                   /cell_line="H10021"
FT                   /cell_line="JM44"
FT                   /cell_line="KRC-005"
FT                   /cell_line="LATIF"
FT                   /cell_line="LCL721"
FT                   /cell_line="PACO752792"
FT                   /cell_line="T7527"
FT                   /cell_line="TTY"
FT   CDS             join(496..568,699..968,1215..1490,2078..2353,2475..2594,
FT                   3034..3066,3174..3221,3386..3390)
FT                   /codon_start=1
FT                   /gene="HLA-C"
FT                   /allele="HLA-C*01:02:01:01"
FT                   /product="MHC Class I HLA-C*01:02:01:01 sequence"
FT                   /translation="MRVMAPRTLILLLSGALALTETWACSHSMKYFFTSVSRPGRGEPR
FT                   FISVGYVDDTQFVRFDSDAASPRGEPRAPWVEQEGPEYWDRETQKYKRQAQTDRVSLRN
FT                   LRGYYNQSEAGSHTLQWMCGCDLGPDGRLLRGYDQYAYDGKDYIALNEDLRSWTAADTA
FT                   AQITQRKWEAAREAEQRRAYLEGTCVEWLRRYLENGKETLQRAEHPKTHVTHHPVSDHE
FT                   ATLRCWALGFYPAEITLTWQWDGEDQTQDTELVETRPAGDGTFQKWAAVMVPSGEEQRY
FT                   TCHVQHEGLPEPLTLRWEPSSQPTIPIVGIVAGLAVLAVLAVLGAVVAVVMCRRKSSGG
FT                   KGGSCSQAASSNSAQGSDESLIACKA"
FT   UTR             1..495
FT   exon            496..568
FT                   /number="1"
FT   intron          569..698
FT                   /number="1"
FT   exon            699..968
FT                   /number="2"
FT   intron          969..1214
FT                   /number="2"
FT   exon            1215..1490
FT                   /number="3"
FT   intron          1491..2077
FT                   /number="3"
FT   exon            2078..2353
FT                   /number="4"
FT   intron          2354..2474
FT                   /number="4"
FT   exon            2475..2594
FT                   /number="5"
FT   intron          2595..3033
FT                   /number="5"
FT   exon            3034..3066
FT                   /number="6"
FT   intron          3067..3173
FT                   /number="6"
FT   exon            3174..3221
FT                   /number="7"
FT   intron          3222..3385
FT                   /number="7"
FT   exon            3386..3390
FT                   /number="8"
FT   UTR             3391..4304
SQ   Sequence 4304 BP; 832 A; 1204 C; 1297 G; 971 T; 0 other;
     ttattttgct ggatgtagtt taatattacc tgaggtaagg taaggcaaag agtgggaggc        60
     agggagtcca gttcagggac ggggattcca ggagaagtga aggggaaggg gctgggcgca       120
     gcctgggggt ctctccctgg tttccacaga cagatccttg gccaggactc aggcacacag       180
     tgtgacaaag atgcttggtg taggagaaga gggatcagga cgaagtccca ggtcccgggc       240
     ggggttctca gggtctcagg ctccaagggc cgtgtctgca ctggggaggc gccgcgttga       300
     ggattctcca ctcccctgag tttcacttct tctcccaacc tgcgtcgggt ccttcttcct       360
     gaatactcat gacgcgtccc caattcccac tcccattggg tgtcgggttc tagagaagcc       420
     aatcagcgtc tccgcagtcc cggttctaaa gtccccagtc acccacccgg actcagattc       480
     tccccagacg ccgagatgcg ggtcatggcg ccccgaaccc tcatcctgct gctctcggga       540
     gccctggccc tgaccgagac ctgggcctgt gagtgcgggg ttgggaggga aacggcctct       600
     gcggagagga acgaggtgcc cgcccggcga gggcgcagga cccggggagc cgcgcaggga       660
     ggagggtcgg gcgggtctca gcccctcctc gcccccaggc tcccactcca tgaagtattt       720
     cttcacatcc gtgtcccggc ctggccgcgg agagccccgc ttcatctcag tgggctacgt       780
     ggacgacacg cagttcgtgc ggttcgacag cgacgccgcg agtccgagag gggagccgcg       840
     ggcgccgtgg gtggagcagg aggggccgga gtattgggac cgggagacac agaagtacaa       900
     gcgccaggca cagactgacc gagtgagcct gcggaacctg cgcggctact acaaccagag       960
     cgaggccggt gagtgacccc ggcccggggc gcaggtcacg acccctcctc atcccccacg      1020
     gacggcccgg gtcgccccaa gtctcccggt ctgagatcca ccccgaggct gcggaacccg      1080
     cccagaccct cgaccggaga gagccccagt cacctttacc cggtttcatt ttcagtttag      1140
     gccaaaatcc ccgcgggttg gtcgggactg gggcggggct cgggggacgg ggctgaccac      1200
     gggggcgggg ccagggtctc acaccctcca gtggatgtgt ggctgcgacc tggggcccga      1260
     cgggcgcctc ctccgcgggt atgaccagta cgcctacgac ggcaaggatt acatcgccct      1320
     gaacgaggac ctgcgctcct ggaccgccgc ggacaccgcg gctcagatca cccagcgcaa      1380
     gtgggaggcg gcccgtgagg cggagcagcg gagagcctac ctggagggca cgtgcgtgga      1440
     gtggctccgc agatacctgg agaacgggaa ggagacgctg cagcgcgcgg gtaccagggg      1500
     cagtggggag ccttccccat ctcccgtaga tctcccggca tggcctccca cgaggagggg      1560
     aggaaaatgg gatcagcgct agaatatcgc cctcccttga atggagaatg ggatgagttt      1620
     tcctgagttt cctctgaggg ccccctctgc tctctaggac aattaaggga tgaagtcctt      1680
     gaggaaatgg aggggaagac agtccctgga atactgatca ggggtcccct ttgaccactt      1740
     tgaccactgc agcagctgtg gtcaggctgc tgacctttct ctcaggcctt gttctctgcc      1800
     tcacgctcaa tgtgtttgaa ggtttgattc cagcttttct gagtccttcg gcctccactc      1860
     aggtcaggac cagaagtcgc tgttcctccc tcagagacta gaactttcca atgaatagga      1920
     gattatccca ggtgcctgtg tccaggctgg cgtctgggtt ctgtgccccc ttccccaccc      1980
     caggtgtcct gtccattctc aggatggtca catgggcgct gttggagtgt cgcaagagag      2040
     atacaaagtg tctgaatttt ctgactcttc ccgtcagaac acccaaagac acacgtgacc      2100
     caccatcccg tctctgacca tgaggccacc ctgaggtgct gggccctggg cttctaccct      2160
     gcggagatca cactgacctg gcagtgggat ggggaggacc aaactcagga caccgagctt      2220
     gtggagacca ggccagcagg agatggaacc ttccagaagt gggcagctgt gatggtgcct      2280
     tctggagaag agcagagata cacgtgccat gtgcagcacg aggggctgcc ggagcccctc      2340
     accctgagat ggggtaagga gggggatgag gggtgatgtg tcttctcagg gaaagcagaa      2400
     gtcctggagc ccttcagccg ggtcagggct gaggcttgga ggtcagggcc cctcaccttc      2460
     ccctcctttc ccagagccgt cttcccagcc caccatcccc atcgtgggca tcgttgctgg      2520
     cctggctgtc ctggctgtcc tagctgtcct aggagctgtg gtggctgttg tgatgtgtag      2580
     gaggaagagc tcaggtaggg aaggggtgag gagtggggtc tgggttttct tgttccactg      2640
     ggagtttcaa gccccaggta gaagtgtgcc ccacctcgtt actggaagca ccatccacac      2700
     atgggccatc ccagcctggg accctgtgtg ccagcactta ctctgttgtg aagcacatga      2760
     caatgaagga cagatgtatc accttgatga ttatggtgtt ggggtccttg attccagcat      2820
     tcatgagtca ggggaaggtc cctgctaagg acagacctta ggagggcagt tgcttcagaa      2880
     cccacagctg ctttccccgt gtttcctgat cctgccctgg gtctgcagtc atagttctgg      2940
     aaacttctct tgggtccaag actaggaggt tcccctaaga tcgcatggcc ctgcctcctc      3000
     cctgtcccct cacagggcat tttcttccca caggtggaaa aggagggagc tgctctcagg      3060
     ctgcgtgtaa gtgatggcgg tgggcgtgtg gaggagctca cccaccccat aattcctctt      3120
     gtcccacatc tcctgcgggc tctgaccagg tctttttttt tgttctaccc cagccagcaa      3180
     cagtgcccag ggctctgatg agtctctcat cgcttgtaaa ggtgagattc tggggagctg      3240
     aagtggtcgg gggtggggca gagggaaaag gcctaggtaa tggggatcct ttgattggga      3300
     cgtttcgaat gtgtggtgag ctgttcagag tgtcatcact taccatgact gacctgaatt      3360
     tgttcatgac tattgtgttc tgtagcctga gacagctgcc tgtgtgggac tgagatgcag      3420
     gatttcttca cacctctcct ttgtgacttc aagagcctct ggcatctctt tctgcaaagg      3480
     catctgaatg tgtctgcgtt cctgttagca taatgtgagg aggtggagag acagcccacc      3540
     cccgtgtcca ccgtgacccc tgtccccaca ctgacctgtg ttccctcccc gatcatcttt      3600
     cctgttccag agaagtgggc tggatgtctc catctctgtc tcaacttcat ggtgcgctga      3660
     gctgcaactt cttacttccc taatgaagtt aagaacctga atataaattt gttttctcaa      3720
     atatttgcta tgaagggttg atggattaat taaataagtc aattcctgga agttgagaga      3780
     gcaaataaag acctgagaac cttccagaat ccgcatgttc gctgtgctga gtctgttgca      3840
     ggtgggggtg gggaaggctg tgaggagacg agtgtggacg gggcctgtgc ctagttgctg      3900
     ttcagttctt catgggcttt atgtggtcag tcctcagctg ggtcaccttc actgctccat      3960
     tgtccttgtc ccttcagtgg aaacttgtcc agcgggagct gtgaccacag aggctcacac      4020
     atcgcccagg gcagcccctg cacacgggag tccctgtgct ttctgagaca aattttcaga      4080
     cccagtcagc tcctgccctc cttctagggc tcctcttctg ctttggtctc ctgccctctc      4140
     tcccttccct gattccagtg atcttcgtgc tgactccaat cccaactcat gaatctaaag      4200
     cagagcctaa tttagattta tatttgtttg taaaattggg tccatagtct agaattgttc      4260
     cttcctgaag agagaaacct gattgtgtgc tgcagtgtgc gggg                       4304
//