Dbfetch

ID   J00191; SV 1; linear; genomic DNA; STD; HUM; 4123 BP.
XX
AC   J00191; V00526;
XX
DT   24-SEP-1992 (Rel. 33, Created)
DT   17-JUN-2008 (Rel. 96, Last updated, Version 10)
XX
DE   Human MHC class I transplantation antigen (hla) gene.
XX
KW   antigen; cell surface antigen; cell surface glycoprotein; class I gene;
KW   integral membrane protein; major histocompatibility complex.
XX
OS   Homo sapiens (human)
OC   Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Mammalia;
OC   Eutheria; Euarchontoglires; Primates; Haplorrhini; Catarrhini; Hominidae;
OC   Homo.
XX
RN   [1]
RP   1-4123
RX   DOI; 10.1073/pnas.79.3.893.
RX   PUBMED; 6461010.
RA   Malissen M., Malissen B., Jordan B.R.;
RT   "Exon/intron organization and complete nucleotide sequence of an HLA gene";
RL   Proc. Natl. Acad. Sci. U.S.A. 79(3):893-897(1982).
XX
DR   MD5; 29848b123126af2fc2aea03d722c1eda.
DR   IMGT/HLA; HLA-H*02:06; HLA02555.
XX
CC   sequence contains 7 exons. the structure of the protein encoded by
CC   this unit is closely homologous with known class i transplantation
CC   antigens. putative polyadenylation signal aataaa at 3514.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..4123
FT                   /organism="Homo sapiens"
FT                   /map="chromosome 6"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:9606"
FT   gene            245..308
FT                   /gene="HLA"
FT   exon            <245..308
FT                   /gene="HLA"
FT                   /number=1
FT                   /note="hla antigen (signal peptide)"
FT   CDS             join(245..308,434..703,946..1221,1792..2067,2171..2287,
FT                   2729..2761,2904..2947)
FT                   /partial
FT                   /codon_start=1
FT                   /note="hla antigen"
FT                   /db_xref="GOA:P01893"
FT                   /db_xref="HGNC:HGNC:4965"
FT                   /db_xref="InterPro:IPR001039"
FT                   /db_xref="InterPro:IPR003006"
FT                   /db_xref="InterPro:IPR003597"
FT                   /db_xref="InterPro:IPR007110"
FT                   /db_xref="InterPro:IPR010579"
FT                   /db_xref="InterPro:IPR011161"
FT                   /db_xref="InterPro:IPR011162"
FT                   /db_xref="InterPro:IPR013783"
FT                   /db_xref="InterPro:IPR036179"
FT                   /db_xref="InterPro:IPR037055"
FT                   /db_xref="UniProtKB/Swiss-Prot:P01893"
FT                   /protein_id="AAA36218.1"
FT                   /translation="MAPRTLLLLLSGALALTQTWARSHSMRYFYTTMSRPGAGEPRFIS
FT                   VGYVDDTQFVRFDSDDASPREEPRAPWMEREGPKYWDRNTQICKAQAQTERENLRIALR
FT                   YYNQSEGGSHTMQVMYGCDVGPDGPFLRGYEQHAYDGKDYIALNEDLRSWTAADMAAQI
FT                   TKRKWEAARRAEQRRVYLEGEFVEWLRRYLENGKETLQRADPPKTHMTHHPISDHEATL
FT                   RCWALGFYPAEITLTWQRDGEDQTQDTELVETRPAGDGTFQKWAAVVVPSGEEQRYTCH
FT                   VQHEGLPEPLTLRWEPSSQPTVPIVGIVAGLVLLVAVVTGAVVAAVMWRKKSSDRKGGS
FT                   YSQAASSNSAQGSDVSLTA"
FT   intron          309..433
FT                   /note="myoglobin cds intron B"
FT   exon            434..703
FT                   /number=2
FT                   /note="hla antigen (alpha1 domain)"
FT   intron          704..945
FT                   /note="myoglobin cds intron B"
FT   exon            946..1221
FT                   /number=3
FT                   /note="hla antigen (alpha2 domain)"
FT   intron          1222..1791
FT                   /note="LMW ppk cds intron J"
FT   exon            1792..2067
FT                   /number=4
FT                   /note="hla antigen (alpha3 domain)"
FT   intron          2068..2170
FT                   /note="LMW ppk cds intron I"
FT   exon            2171..2287
FT                   /number=5
FT                   /note="hla antigen (membrane segment)"
FT   intron          2288..2728
FT                   /note="50kd cds intron E"
FT   exon            2729..2761
FT                   /number=6
FT                   /note="hla antigen (cytoplasmic segment)"
FT   intron          2762..2903
FT                   /note="50kd cds intron F"
FT   exon            2904..>2947
FT                   /number=7
FT                   /note="hla antigen (cytoplasmic segment)"
XX
SQ   Sequence 4123 BP; 839 A; 1125 C; 1173 G; 984 T; 2 other;
     cccgaaggcg gtgtatggat tggggatgcc ccgccttggg gattcgccac ctccgcagtt        60
     tctcttcttc tcacaacctg cgacgggtcc ttcttcctcg atactcacga agcggacaca       120
     gttctcattc ccactaggtg tcgggtttct agagaagcca atcggtgccg ccgcggtccc       180
     ggttctaaag tccccacgca cccaccggga ctcagattct ccccagacgc cgaggatggt       240
     gctcatggcg ccccgaaccc tcctcctgct gctctcaggg gccctggccc tgacccagac       300
     ctgggcgcgt gagtgcaggg tctgcaggga aatggtcggg aggagngagg ggcccgcccg       360
     gcggggtgcg caggacccag ggagccgcgc agggaggagg gtcgggcggg tctcagctcc       420
     tcctcgctcc caggttccca ctccatgagg tatttctaca ccaccatgtc ccggcccggc       480
     gccggggagc cccgcttcat ctccgtcggc tacgtggacg atacgcagtt cgtgcggttc       540
     gacagcgacg acgcgagtcc gagagaggag ccgcgggcgc cgtggatgga gcgggagggg       600
     ccaaagtatt gggaccggaa cacacagatc tgcaaggccc aggcacagac tgaacgagag       660
     aacctgcgga tcgcgctccg ctactacaac cagagcgagg gcggtgagtt gaccccggcc       720
     cggggcgcag gtcacgaccc ctccccatcc cccacggagg gccgggtcgc ctcgagtctc       780
     tgggtccgag atccaccccg aaaccgcggg atcccgagac ccttgacctg ggagaggccc       840
     aggcgccttt acccggtttc attttcagtt taggccaaaa tccccgcggg ttggtcgggg       900
     cggggctggg ctcgggggac cgggctgacc gcgggggcgg gccaggttct cacaccatgc       960
     aggtgatgta tggctgcgac gtggggcccg acgggccttt cctccgcggg tatgaacagc      1020
     acgcctacga cggcaaggat tacatcgccc tgaacgagga cctgcgctcc tggaccgcgg      1080
     cggacatggc agctcagatc accaagcgca agtgggaggc ggcccgtcgg gcggagcagc      1140
     ggagagtcta cttggagggc gagttcgtgg agtggctccg cagatacttg gagaacggga      1200
     aggagacgct gcagcgcgcg ggtaccaggg ccacagggcg cctccctgat cgcctgtaga      1260
     tctccggggc tggcctccca caagaaaggg agacaaatgg gaccaacact ataatatcgc      1320
     cctccctctg gtcttgaggg agaagaatcc tcttgggttt ccagagagtg actctgaggg      1380
     tccgccctgc tctctgacac aattaaggga tgaaatctgt gaggaaatga agggaagaca      1440
     atccctggaa tactgatgag tggttccctt tgacactggc agcagccttg ggccccgtga      1500
     cttttcctct caggccttgt tctctgcttc acactcaatg tgcgtggggg tctgagtccc      1560
     tcagcctcca ctcaggtcag gaccagaagt cgctgttccc tcttcaggga ctagaatttt      1620
     ccacggaata ggagattatt ctaggtgcct ctgtctaggc tgttgtctgg gttctgtgct      1680
     cccttcccca ccctaggcat cctgtcaatt ctcaagatgg ccacatgcgt gctggtggag      1740
     tgtcccatga cagatgcaaa atgcctgaat tttctgactc tttcccgtca gaccccccca      1800
     agacacatat gacccaccac cccatctctg accatgaggc caccctgagg tgctgggccc      1860
     tgggcttcta ccctgcggag atcacactga cctggcagcg ggatggggag gaccagaccc      1920
     aggacacgga gctcgtggag accaggcctg caggggatgg aaccttccag aagtgggcgg      1980
     ctgtggtggt gccttctgga gaggagcaga gatacacctg ccatgtgcag catgagggtc      2040
     tgcccgagcc cctcaccctg agatggggta aggagggaga tgggggtgtc atgtctctta      2100
     gggaaagccg gagacctctc tggagagctt agcagggtca gggttccctc accttccccc      2160
     cttttcccag agccatcttc ccagcccacc gtccccatcg tgggcatcgt tgctggcttg      2220
     gttctacttg tagctgtggt cactggagct gtggtcgctg ctgtaatgtg gaggaagaag      2280
     agctcaggta aggaaggggt gaggagtgtg gtctgagaat ttcttgtctc actgagagtt      2340
     ccaagcccca agtagaagtg ccctgcctag ttactgggaa gcaccatcca cactcatggg      2400
     cctacccagc ctgggccctg tgtgccagca cttactcttt tgtaaagcac ctgttacaat      2460
     gagggacaga tttattacct tgatgactgt ggtgatggga cctgatccca gcagtcacaa      2520
     gtcacagggg aaggtccccg aggacagacc tcagaagggc ggttggtcna ggacccacat      2580
     ctgctttctt catgtttcct gatcccgccc tgggtctgca gttgcacatt tctggaaact      2640
     tctctggggt ccgagacttg gaggttcctc taggacctta tggccctggc ttctttctgg      2700
     catctcacag gacattttct tcccacagat agaaaaggag ggagctactc tcaggctgca      2760
     agtaagtatg aaggaggctg atccctgaaa tcctttggat attgtgtttg ggagcccatg      2820
     ggggagctca cccaccccac aattcttcct ctagccacat ctactgtggg atctgaccag      2880
     gtcctgtttt tattctactc caggcagcaa cagtgcccag ggctctgatg tgtctctcac      2940
     ggcttgaaac ctgagacctt ggggggcctg atgtgtgggg gatgttgggg gggaacagtg      3000
     gacacagctg tgctatgggg ttctttgaat ttgatgtttt gagcatgcga tgggctgcca      3060
     aagtgtcatc cattactggg acagatatga atttgttcat gaatattttt tctatagtgt      3120
     gagacagctg ccttgtgtgg gactgagagg caagagttgt tcctgccttc cctttgtgac      3180
     ttgaagaacc ctgactttct ttctacaaag gcacctgaat gtgtctgtgt tcctgtaggc      3240
     ataatgtgtg gaggagggga gaccaaccca ccctcatgtc caccatgacc ctcttcccca      3300
     cgctgactgt gttccctccc caatcatctt tcctgttcca gagaggaggg gctgagatgt      3360
     ctccatcttt ttctcaactt tatgtgcact gagctgtaat tcttacttcc ctcttaaaat      3420
     tgaatcttga gtaaacattt actttttcaa attcttgcca tgagagggtt gatgacttaa      3480
     ttaaaggaga agattcctaa aatttgagag acaaaataaa tggaacacat gagaaccttc      3540
     cagagtccat gtgtttcttg tgctgatttg ttgcagggga ggagaatagg tggggctgtg      3600
     cctagtgggt gctcaggccc agtatggact ttatgtggtc actgctcagc tgggtcatct      3660
     ttgctccttc attctccttg gcccttcagt agaaccttgt cctaccacca cctgtgatca      3720
     cagggacttg gatgtcacct acagtggtcc ctgcatacaa atctcattgt agtatcaaga      3780
     gactaatttt cagacctgtc cagctcttgc cctcctccta gggctctttc ctggattgta      3840
     tttttcatct tgcctccaat ctttttaaag gaagcagatt ctaaaatttg cagagaggag      3900
     gggcccatag tttctcatca tagtgaactt tctgttggag ctcctcttct gctctcttac      3960
     tcttcttcct tccctgagtt gtagtaatcc tagtgctggc tccagtccaa actcatggat      4020
     ttacaaagca gagtctaatt tagattcata cgtggttgga aaattggacc cataagccta      4080
     gggttatctt tcctgaagag aaaaatatgg ttgtgtgctg cag                        4123
//