Dbfetch

ID   AJ242600; SV 1; linear; mRNA; STD; INV; 3234 BP.
XX
AC   AJ242600;
XX
DT   07-JAN-2000 (Rel. 62, Created)
DT   15-APR-2005 (Rel. 83, Last updated, Version 4)
XX
DE   Loligo opalescens mRNA for glutamate receptor (gluR gene), splice variant 1
XX
KW   alternative splicing; gluR gene; glutamate receptor.
XX
OS   Doryteuthis opalescens
OC   Eukaryota; Metazoa; Lophotrochozoa; Mollusca; Cephalopoda; Coleoidea;
OC   Neocoleoidea; Decapodiformes; Teuthida; Myopsina; Loliginidae; Doryteuthis.
XX
RN   [1]
RP   1-3234
RA   Battaglia A.A.;
RT   ;
RL   Submitted (25-MAY-1999) to the INSDC.
RL   Battaglia A.A., Neurobiology Laboratory, Stazione Zoologica "Anton Dohrn",
RL   Villa Comunale Naples, 80121, ITALY.
XX
RN   [2]
RA   Battaglia A.A., Nardi G., Iaccarino P., Gentile S., de Santis A.,
RA   Gilly W.F.;
RT   "Cloning and functional characterization of an AMPA-selective receptor
RT   subunit in squid (Loligo opalescens) giant fiber motor system";
RL   Unpublished.
XX
DR   MD5; c5c15961326ac84079524d93a4dbc6ab.
XX
CC   splice variant 2 (AJ534693)
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..3234
FT                   /organism="Doryteuthis opalescens"
FT                   /mol_type="mRNA"
FT                   /country="USA:California"
FT                   /dev_stage="adult"
FT                   /tissue_lib="stellate ganglion"
FT                   /tissue_type="nervous system"
FT                   /db_xref="taxon:1051066"
FT   5'UTR           1..141
FT                   /gene="gluR"
FT                   /function="promoter"
FT   CDS             142..2916
FT                   /gene="gluR"
FT                   /product="glutamate receptor"
FT                   /db_xref="GOA:Q9U0T0"
FT                   /db_xref="InterPro:IPR001320"
FT                   /db_xref="InterPro:IPR001508"
FT                   /db_xref="InterPro:IPR001828"
FT                   /db_xref="InterPro:IPR019594"
FT                   /db_xref="InterPro:IPR028082"
FT                   /db_xref="UniProtKB/TrEMBL:Q9U0T0"
FT                   /experiment="experimental evidence, no additional details
FT                   recorded"
FT                   /protein_id="CAB65182.1"
FT                   /translation="MAPAIGLPPASTFPQLCFVILALSGSAIAAKGSTKRISIGSVFDV
FT                   ESEKIQTAFRFAVDRFNTIENSAQLKLNPLSRGNRRTDSFSLGNALCSIMSKGVFAVFG
FT                   KANSSMLATVKSYSDTFQIPYLTTSMAMNTTDQSPYMLFLRPINIRAIVDLIEHLGWRV
FT                   VHYIYISNEGLMRVQQLFQVMGKSDLQMTLNVKRASDVTSYVILKELHHTNPELDIHAV
FT                   LDMSIPMASELMNLLSEDPRVHNRRFHFLLVEPGIQELDFAKIGLYGYNVSGFQLVDFN
FT                   NMTVRLFLSDWTKIDPAEWPGAGVKTITYEAALAVDAVSLFTRAMKNLSNLGLFESLFI
FT                   RARSGANSSKTCAAERLNVWNKGKHVLKAMKETEFDGLTGRVAFDDRGHRKEFTLDVLD
FT                   IGITRGAVKIGYWTPRDGLTMLKRKMVRPINAPSSENRTRIVTTIQTPPYIMKKPKPID
FT                   GHPLIGNDKYEGYCVDLARKVAHEVGFDYVFQMVKDGAYGSKLANDSWNGMVGELIRLE
FT                   ADMAIAPLTISAVRERVIDFSKPFMSLGISIMIKKPADQKAHVFSFLDPLSYEIWMCIL
FT                   FAFIGVSVVLFLVSRFSPSGWHVEDESNITNDFTISNSLWFSLGAFMQQGCDFSPRSIS
FT                   GRIVGSVWWFFTLIIISSYTANLAAFLTVERMSTPIESAEDLAKQTEIEYGTLRSGTTE
FT                   AFFKTSKVAVYERMWAYMTSKTPSVFTDKIQDGITSVRDSNGKYAFLVESSTNDYINNR
FT                   LPCDTMKVGSNLDSKGFGIATPAGSDLGDKLTLAVLKLREDGELDKLQKFWWVGKGQCT
FT                   PQDKNTDGGQSALTLSNVAGIFYILIGGLILAIIVAVAEFLYKSKVDSKKSKTSFGLAL
FT                   KSKARLSFRSHPAREDSSSGTLLRKSMSRYTYTGPSQSMGFDTVPEGNTHTQV"
FT   sig_peptide     142..237
FT                   /gene="gluR"
FT   mat_peptide     238..2913
FT                   /gene="gluR"
FT                   /product="glutamate receptor"
FT   3'UTR           2917..3217
FT                   /gene="gluR"
FT   regulatory      3218..3234
FT                   /gene="gluR"
FT                   /regulatory_class="polyA_signal_sequence"
XX
SQ   Sequence 3234 BP; 903 A; 747 C; 773 G; 811 T; 0 other;
     cacgagcgag catgtaacgt cacgaaggca ccacccagac tatggaggat ctgatcccag        60
     tttttccgcg tgacccttac gaccagtgac aacgattaca acaccgtgta gttctactgt       120
     ggtaccacca acagacccag gatggctcca gccatcggac taccaccggc cagcacgttc       180
     ccccagctgt gtttcgttat tctcgctcta tccggatctg caatagcagc taaggggtct       240
     acaaaacgca tatcaatagg ctcagtattc gacgttgaat cggaaaaaat ccagacggcg       300
     tttcgctttg ctgtggatcg ctttaacaca atcgagaatt ccgcccaact gaaattgaac       360
     cccctttcgc gaggaaatcg acgaacagat agtttctccc tcggcaatgc actctgttcc       420
     attatgtcca agggtgtttt tgctgtattc ggaaaggcga actcttcaat gctggcgaca       480
     gtcaagtcgt acagtgacac cttccaaatt ccgtatctaa ctacaagtat ggccatgaac       540
     acaacagatc agtcgcccta catgctattt ttgcgtccca ttaacatccg ggctattgtc       600
     gacctcatag agcacttggg gtggagggtg gttcattaca tatatatttc gaacgaaggt       660
     ttaatgcgtg ttcagcaact gtttcaggtg atggggaaga gcgatcttca aatgaccctg       720
     aacgtcaaac gtgcgtccga tgtcactagt tacgtaattc ttaaagaact tcatcatacc       780
     aaccccgagt tggacattca tgccgtgctg gatatgtcaa tacctatggc gagtgaacta       840
     atgaatctgc tgagtgagga tccacgagtc cacaacagac gatttcactt cttgctagta       900
     gagccaggaa tccaagaatt ggactttgcc aagattggat tgtatggcta caatgtaagt       960
     ggcttccaac tggtcgactt caataatatg actgttcggc tatttctctc ggactggacg      1020
     aaaatcgacc cagcagaatg gcccggggct ggggtgaaaa caatcacgta cgaggcggcg      1080
     ttggcagtcg acgccgtcag cttgtttacg cgtgcaatga agaatttgtc caatctcggt      1140
     ttatttgagt cccttttcat ccgcgctagg agtggagcca acagcagcaa aacttgtgca      1200
     gccgagcgtc tgaatgtgtg gaacaaaggt aaacatgtgc tcaaggcaat gaaagagacg      1260
     gagtttgatg gccttactgg tcgagtggca tttgacgata gaggtcaccg caaagagttc      1320
     actctggatg ttcttgatat aggaattacc cgcggcgcag tcaagattgg ttactggacc      1380
     ccgagggatg gattgactat gctcaagcgt aaaatggtcc gccctattaa tgcgcccagc      1440
     tctgagaaca gaacaaggat tgtgactacg atccagactc ctccttacat aatgaagaaa      1500
     ccgaagccga tagacggtca ccctcttata ggcaatgaca agtacgaagg atattgtgta      1560
     gaccttgctc gaaaggttgc gcatgaagtt ggctttgact acgtgttcca gatggtaaaa      1620
     gatggcgcct acggttcgaa gctcgcaaat gattcgtgga atggtatggt aggagaacta      1680
     ataaggctgg aggcggatat ggccattgcc ccactgacga tctcagctgt gcgggagagg      1740
     gtcattgatt tctccaaacc ctttatgagc ctgggaatca gtatcatgat aaaaaaacca      1800
     gcggaccaga aagctcacgt gttctcgttc ctcgacccgt tatcctacga gatctggatg      1860
     tgcatcttgt ttgccttcat tggagtcagc gtggtcttgt ttttggtcag tcgcttcagc      1920
     cctagcgggt ggcacgtgga agatgagtcg aatattacga atgattttac catttccaac      1980
     agcctctggt tttcgctggg cgccttcatg caacagggat gtgatttctc acctcgatcg      2040
     atttctggac gtatagtcgg aagcgtatgg tggttcttca ccctgatcat tatttcgtct      2100
     tacactgcca acctggccgc cttcctcaca gtggaaagaa tgtccactcc gattgaatcc      2160
     gctgaggatc ttgccaaaca gacggaaatc gaatatggaa ctttaaggtc aggcacaaca      2220
     gaagctttct ttaagacttc taaggtagcg gtctatgagc gaatgtgggc ttatatgaca      2280
     tcaaagaccc ctagtgtctt tacggataaa atccaagatg gcataaccag cgttcgagat      2340
     tccaacggaa agtatgcttt cctcgtcgaa tcctctacta acgattatat caacaaccgt      2400
     ttgccctgtg atacaatgaa agtcggatca aatcttgact caaaaggttt cggcatcgct      2460
     acaccagccg gctccgactt aggagataaa ctcacacttg ctgttctcaa gttgcgcgaa      2520
     gatggagagt tagataagct gcaaaaattc tggtgggtgg ggaaaggtca gtgtacgcca      2580
     caggacaaga atactgatgg aggccaaagt gcccttacat tgtccaacgt ggctggcatt      2640
     ttctacatcc ttatcggagg actcatatta gccatcatcg tcgcagtcgc ggaattcctt      2700
     tataaatcta aagttgacag taaaaaatca aagacatcat ttggacttgc cctgaaatca      2760
     aaagccagac tttctttccg aagccatcct gctcgggaag atagcagctc gggaaccctt      2820
     ctcagaaagt ccatgtcaag gtatacctac acgggcccat cccagagtat gggatttgac      2880
     acggtaccgg aaggtaacac tcacactcaa gtgtgagatg ttaaattgac caactgcagt      2940
     gaaccagcga gtgacactca gtcgttacct gccattcagg acattttttt gctcattata      3000
     aacacaattc agaacgaaag aagaaaaaat tgtttaatga aaggaagaaa agaaacagga      3060
     tcgaaaccct gttcgtaaat gctcactgga aagggagaca cttgttcgcc taaaacaaaa      3120
     gggaattcta atgttcaggt ggaaacacga atgagtgtat ccgcgtgtgg gtcagctggg      3180
     attattgtta gcaagatggc agcgtaccca cactggcaaa aaaaaaaaaa aaaa            3234
//
ID   D87894; SV 1; linear; genomic DNA; STD; FUN; 1674 BP.
XX
AC   D87894;
XX
DT   27-SEP-1996 (Rel. 49, Created)
DT   14-NOV-2006 (Rel. 89, Last updated, Version 4)
XX
DE   Rhizopus oligosporus DNA for chitinase, complete cds.
XX
KW   chi3; chitinase.
XX
OS   Rhizopus microsporus var. oligosporus
OC   Eukaryota; Fungi; Fungi incertae sedis; Mucoromycotina; Mucorales;
OC   Mucorineae; Rhizopodaceae; Rhizopus.
XX
RN   [1]
RP   1-1674
RA   Yamazaki D.;
RT   ;
RL   Submitted (14-SEP-1996) to the INSDC.
RL   Daisuke Yamazaki, The University of Tokyo, Department of Agricultural
RL   Chemistry; 1-1-1 Yayoi, Bunkyo-ku, Tokyo 113, Japan
RL   (Tel:03-3812-2111(ex.5170), Fax:03-3812-9246)
XX
RN   [2]
RA   Takaya N., Yamazaki D., Horiuchi H., Ohta A., Takagi M.;
RT   "Intracellular chitinase gene from Rhizopus oligosporus: molecular cloning
RT   and characterization";
RL   Microbiology (Reading, Engl.) 144:2647-2654(1998).
XX
DR   MD5; aaffbb9c0c27696108c87fee57d3acb1.
DR   StrainInfo; 193640; 0.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1674
FT                   /organism="Rhizopus microsporus var. oligosporus"
FT                   /strain="IFO8631"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:4847"
FT   CDS             join(271..326,386..500,555..591,651..1645)
FT                   /codon_start=1
FT                   /gene="chi3"
FT                   /product="chitinase"
FT                   /db_xref="GOA:Q92270"
FT                   /db_xref="InterPro:IPR001223"
FT                   /db_xref="InterPro:IPR001579"
FT                   /db_xref="InterPro:IPR011583"
FT                   /db_xref="InterPro:IPR013781"
FT                   /db_xref="InterPro:IPR017853"
FT                   /db_xref="InterPro:IPR029070"
FT                   /db_xref="UniProtKB/TrEMBL:Q92270"
FT                   /protein_id="BAA13489.1"
FT                   /translation="MEPPPATNGPVIAGYFANWGIYDRKYNVVDVATQANKLTHILYAF
FT                   ANVQPDGQVVLGDAYADIEKHFPANQAVNRKEDGWNDPGKNLYGNFKQFYLLKQQHRHL
FT                   KVSLSIGGYTWSTHFGPVARDPQKRRLFVDSSIKHLANLGLDGLDIDWEYPKDDEEAFY
FT                   YVHLLYELRLALDRYQQQCQQLIQSRLLLTVAVPCGPDHYRKLRLTEMQPYVDLFYLMA
FT                   YDYAGSWDSFADHQAAVYGGRLNTEQAVQHYIACGIPPYKLVVGMPLYGRGFCNTAGPG
FT                   HPFQGLPRGTWEEGQFNYKTLPKPGAVEYHDFNRLASWSYDPQAREFITYDTPQMVAAK
FT                   CNYIQQRRLGGAMFWELSADCPQRSLINAAYDGLGRRLDQVPNHLDYPMSEYDNVRNGM
FT                   K"
FT   exon            271..326
FT                   /number=1
FT   intron          327..385
FT                   /number=1
FT   exon            386..500
FT                   /number=2
FT   intron          501..554
FT                   /number=2
FT   exon            555..591
FT                   /number=3
FT   intron          592..650
FT                   /number=3
FT   exon            651..1645
FT                   /number=4
XX
SQ   Sequence 1674 BP; 506 A; 331 C; 347 G; 490 T; 0 other;
     aataatgaaa ccactaattc aagagtattg tgtgtatgcc ttgttatttc ttcatgatcc        60
     aagggtttct cgcgtcaaca gtatgttctg agctttttgt tgttgtcata tctacttatt       120
     catgtttgga atgaaatgtc aattgtctca tcttcctaaa gtgtatacaa gtttttgttc       180
     tacaatagaa ctctacaaca gctgaatata atgataaaaa tagatatttt cttggctctt       240
     tttttcattt tacttttctt gacttctcat atggaaccac ctccagcaac aaacggacct       300
     gttattgcag gttactttgc taattggtaa cattgcataa caaaggcaaa aggggagctt       360
     aactcaacta actagaatgt aataggggaa tctacgatag aaaatacaat gttgttgatg       420
     tagctactca agccaataag ttgactcata ttttatatgc atttgctaat gtccaaccgg       480
     atggtcaagt tgttcttggg gtagtataaa ttattgcaag atatagaata taataataat       540
     aattataaat ataggacgct tatgcagata ttgaaaagca ttttccagca agtaaaaaaa       600
     taataataaa caaatataaa acctctccct aattcataca taatatgtag accaagcagt       660
     caaccgaaaa gaagatggat ggaatgatcc aggcaagaac ctttacggta actttaagca       720
     gttctattta ctcaagcaac aacaccgtca tctcaaagtg tcgcttagca ttggcggata       780
     tacatggtcc actcattttg gcccggttgc gcgtgatcct cagaaacgca gattgtttgt       840
     agatagcagc atcaaacacc tagccaactt gggtctggac gggctagata ttgactggga       900
     gtaccccaaa gatgatgagg aagcgtttta ttatgtgcat ctgctctatg agttgcgact       960
     ggcgcttgac agatatcaac aacagtgcca acaactgatt cagtcgcgac tattactcac      1020
     agtagccgtg ccttgtggcc ctgaccatta tcgtaaattg agattgaccg aaatgcaacc      1080
     ttacgtggac ctattttacc tcatggcata cgactatgct ggttcatggg attctttcgc      1140
     agatcatcaa gcggctgttt atggtggcag attgaataca gaacaagcag tacagcacta      1200
     tatcgcctgt ggtatccctc catataagct agtcgtaggc atgcctttat atggtcgagg      1260
     attctgcaat acggcggggc caggtcatcc tttccaagga ctgcctcgcg gtacctggga      1320
     agagggtcaa tttaattaca agacattgcc aaaaccgggc gctgtagaat accacgactt      1380
     taatcgacta gcctcatggt cttatgaccc tcaggctcgt gaatttatca cctatgatac      1440
     acctcagatg gttgctgcaa agtgcaatta catacaacaa agacggttgg gtggtgccat      1500
     gttttgggaa ctaagtgcgg attgtcctca gagaagcctg atcaacgcgg cctatgacgg      1560
     cttaggaagg cgattagatc aggtacctaa tcatttagat tatccaatga gtgagtatga      1620
     caatgtacga aacggtatga aataaagcat cccttttggc aggtggttct caaa            1674
//
ID   J00231; SV 1; linear; mRNA; STD; HUM; 1089 BP.
XX
AC   J00231;
XX
DT   13-JUN-1985 (Rel. 06, Created)
DT   17-APR-2005 (Rel. 83, Last updated, Version 9)
XX
DE   Human Ig gamma3 heavy chain disease OMM protein mRNA.
XX
KW   C-region; gamma heavy chain disease protein;
KW   gamma3 heavy chain disease protein; heavy chain disease; hinge exon;
KW   immunoglobulin gamma-chain; immunoglobulin heavy chain;
KW   secreted immunoglobulin; V-region.
XX
OS   Homo sapiens (human)
OC   Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Mammalia;
OC   Eutheria; Euarchontoglires; Primates; Haplorrhini; Catarrhini; Hominidae;
OC   Homo.
XX
RN   [1]
RP   1-1089
RX   DOI; 10.1073/pnas.79.10.3260.
RX   PUBMED; 6808505.
RA   Alexander A., Steinmetz M., Barritault D., Frangione B., Franklin E.C.,
RA   Hood L., Buxbaum J.N.;
RT   "gamma Heavy chain disease in man: cDNA sequence supports partial gene
RT   deletion model";
RL   Proc. Natl. Acad. Sci. U.S.A. 79(10):3260-3264(1982).
XX
DR   MD5; dbfb2a63ffcc88671722e91e641adcaa.
DR   CABRI; LMBP 2079.
DR   CABRI; LMBP 2146.
DR   CABRI; LMBP 2147.
DR   CABRI; LMBP 2151.
DR   CABRI; LMBP 2192.
DR   CABRI; LMBP 2193.
DR   CABRI; LMBP 2194.
DR   CABRI; LMBP 2211.
DR   CABRI; LMBP 2316.
DR   CABRI; LMBP 2586.
DR   CABRI; LMBP 2587.
DR   CABRI; LMBP 2589.
DR   CABRI; LMBP 2590.
DR   CABRI; LMBP 3306.
DR   EuropePMC; PMC2739203; 19682364.
DR   IMGT/LIGM; J00231.
XX
CC   The protein isolated from patient OMM is a gamma heavy chain
CC   disease (HCD) protein. It has a large 5' internal deletion
CC   consisting of most of the variable region and the entire ch1
CC   domain. [1] suggests that the protein abnormality is from a partial
CC   gene deletion rather than from defective splicing.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..1089
FT                   /organism="Homo sapiens"
FT                   /map="14q32.33"
FT                   /mol_type="mRNA"
FT                   /db_xref="taxon:9606"
FT   mRNA            <1..1089
FT                   /note="gamma3 mRNA"
FT   CDS             23..964
FT                   /codon_start=1
FT                   /gene="IGHG3"
FT                   /note="OMM protein (Ig gamma3) heavy chain"
FT                   /db_xref="GOA:P01860"
FT                   /db_xref="HGNC:HGNC:5527"
FT                   /db_xref="InterPro:IPR003006"
FT                   /db_xref="InterPro:IPR003597"
FT                   /db_xref="InterPro:IPR007110"
FT                   /db_xref="InterPro:IPR013783"
FT                   /db_xref="PDB:4WWI"
FT                   /db_xref="PDB:4ZNC"
FT                   /db_xref="UniProtKB/Swiss-Prot:P01860"
FT                   /protein_id="AAA52805.1"
FT                   /translation="MKXLWFFLLLVAAPRWVLSQVHLQESGPGLGKPPELKTPLGDTTH
FT                   TCPRCPEPKSCDTPPPCPRCPEPKSCDTPPPCPRCPEPKSCDTPPPCPXCPAPELLGGP
FT                   SVFLFPPKPKDTLMISRTPEVTCVVVDVSHEDPXVQFKWYVDGVEVHNAKTKLREEQYN
FT                   STFRVVSVLTVLHQDWLNGKEYKCKVSNKALPAPIEKTISKAKGQPXXXXXXXXXXXXE
FT                   EMTKNQVSLTCLVKGFYPSDIAVEWESNGQPENNYNTTPPMLDSDGSFFLYSKLTVDKS
FT                   RWQQGNIFSCSVMHEALHNRYTQKSLSLSPGK"
FT   sig_peptide     26..79
FT                   /gene="IGHG3"
FT                   /note="OMM protein signal peptide"
FT   mat_peptide     80..961
FT                   /gene="IGHG3"
FT                   /note="OMM protein mature peptide"
XX
SQ   Sequence 1089 BP; 240 A; 358 C; 271 G; 176 T; 44 other;
     cctggacctc ctgtgcaaga acatgaaaca nctgtggttc ttccttctcc tggtggcagc        60
     tcccagatgg gtcctgtccc aggtgcacct gcaggagtcg ggcccaggac tggggaagcc       120
     tccagagctc aaaaccccac ttggtgacac aactcacaca tgcccacggt gcccagagcc       180
     caaatcttgt gacacacctc ccccgtgccc acggtgccca gagcccaaat cttgtgacac       240
     acctccccca tgcccacggt gcccagagcc caaatcttgt gacacacctc ccccgtgccc       300
     nnngtgccca gcacctgaac tcttgggagg accgtcagtc ttcctcttcc ccccaaaacc       360
     caaggatacc cttatgattt cccggacccc tgaggtcacg tgcgtggtgg tggacgtgag       420
     ccacgaagac ccnnnngtcc agttcaagtg gtacgtggac ggcgtggagg tgcataatgc       480
     caagacaaag ctgcgggagg agcagtacaa cagcacgttc cgtgtggtca gcgtcctcac       540
     cgtcctgcac caggactggc tgaacggcaa ggagtacaag tgcaaggtct ccaacaaagc       600
     cctcccagcc cccatcgaga aaaccatctc caaagccaaa ggacagcccn nnnnnnnnnn       660
     nnnnnnnnnn nnnnnnnnnn nnnnngagga gatgaccaag aaccaagtca gcctgacctg       720
     cctggtcaaa ggcttctacc ccagcgacat cgccgtggag tgggagagca atgggcagcc       780
     ggagaacaac tacaacacca cgcctcccat gctggactcc gacggctcct tcttcctcta       840
     cagcaagctc accgtggaca agagcaggtg gcagcagggg aacatcttct catgctccgt       900
     gatgcatgag gctctgcaca accgctacac gcagaagagc ctctccctgt ctccgggtaa       960
     atgagtgcca tggccggcaa gcccccgctc cccgggctct cggggtcgcg cgaggatgct      1020
     tggcacgtac cccgtgtaca tacttcccag gcacccagca tggaaataaa gcacccagcg      1080
     ctgccctgg                                                              1089
//
ID   K00650; SV 1; linear; genomic DNA; STD; HUM; 6210 BP.
XX
AC   K00650; M16287;
XX
DT   26-JUL-1991 (Rel. 28, Created)
DT   14-NOV-2006 (Rel. 89, Last updated, Version 4)
XX
DE   Human fos proto-oncogene (c-fos), complete cds.
XX
KW   c-myc proto-oncogene; fos oncogene; proto-oncogene.
XX
OS   Homo sapiens (human)
OC   Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Mammalia;
OC   Eutheria; Euarchontoglires; Primates; Haplorrhini; Catarrhini; Hominidae;
OC   Homo.
XX
RN   [1]
RP   1-4165
RX   DOI; 10.1073/pnas.80.11.3183.
RX   PUBMED; 6574479.
RA   van Straaten F., Muller R., Curran T., Van Beveren C., Verma I.M.;
RT   "Complete nucleotide sequence of a human c-onc gene: deduced amino acid
RT   sequence of the human c-fos protein";
RL   Proc. Natl. Acad. Sci. U.S.A. 80(11):3183-3187(1983).
XX
RN   [2]
RX   DOI; 10.1016/0092-8674(85)90285-5.
RX   PUBMED; 2414012.
RA   Treisman R.;
RT   "Transient accumulation of c-fos RNA following serum stimulation requires a
RT   conserved 5' element and c-fos 3' sequences";
RL   Cell 42(3):889-902(1985).
XX
RN   [3]
RP   4166-6210
RX   PUBMED; 3555978.
RA   Verma I.M., Deschamps J., Van Beveren C., Sassone-Corsi P.;
RT   "Human fos gene";
RL   Cold Spring Harb. Symp. Quant. Biol. 51:0-0(0).
XX
DR   MD5; 2cdb1f2aa6c13c384c8522058c958a7c.
DR   EPD; EP11145; HS_FOS.
DR   Ensembl-Gn; ENSG00000170345; homo_sapiens.
DR   Ensembl-Tr; ENST00000303562; homo_sapiens.
DR   Ensembl-Tr; ENST00000535987; homo_sapiens.
DR   Ensembl-Tr; ENST00000555686; homo_sapiens.
DR   EuropePMC; PMC116128; 11711622.
DR   EuropePMC; PMC1752353; 9166000.
DR   EuropePMC; PMC19553; 9012824.
DR   EuropePMC; PMC3220474; 21937452.
XX
CC   [2]  sites; promoter region.
CC   C-fos is the human cellular homolog of the v-fos oncogene of
CC   Finkel-Biskis-Jinkins murine osteosarcoma virus (FBJ-MuSV).  [2] It
CC   was found that both human and murine c-fos genes contained an
CC   enhancer-like element in their 5' noncoding regions that was
CC   necessary for increased transcription following serum activation.
CC   The FBJ-MuSV v-fos oncogene contains a deletion relative to murine
CC   and human c-fos proto-oncogenes that causes complete divergence of
CC   the COOH terminal protein sequences encoded.  That deletion
CC   corresponds to positions 3182-3285 inclusive of this sequence.  The
CC   FBJ-MuSV v-fos sequence is more closely related to murine than
CC   human c-fos sequences.  The FBJ-MuSV v-fos coding sequence ends at
CC   a 'tag' stop codon corresponding to positions 3434-3436 of this
CC   sequence [1].  [1] notes two alu repeats beginning approximately 500
CC   and 1700 nucleotides downstream of the last base in this sequence.
CC   A TATA box is located at positions 701-707.  Two potential
CC   polyadenylation signals are present in the 3' untranslated region.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..6210
FT                   /organism="Homo sapiens"
FT                   /map="14q24.3"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:9606"
FT   misc_feature    402..453
FT                   /note="transcriptional activator region [2]"
FT   prim_transcript 734..>3329
FT                   /note="c-fos mRNA [1]"
FT   gene            889..1029
FT                   /gene="FOS"
FT   CDS             join(889..1029,1783..2034,2466..2573,2688..3329)
FT                   /codon_start=1
FT                   /note="c-fos protein"
FT                   /db_xref="GOA:P01100"
FT                   /db_xref="HGNC:HGNC:3796"
FT                   /db_xref="InterPro:IPR000837"
FT                   /db_xref="InterPro:IPR004827"
FT                   /db_xref="InterPro:IPR029816"
FT                   /db_xref="PDB:1A02"
FT                   /db_xref="PDB:1FOS"
FT                   /db_xref="PDB:1S9K"
FT                   /db_xref="UniProtKB/Swiss-Prot:P01100"
FT                   /protein_id="AAA52471.1"
FT                   /translation="MMFSGFNADYEASSSRCSSASPAGDSLSYYHSPADSFSSMGSPVN
FT                   AQDFCTDLAVSSANFIPTVTAISTSPDLQWLVQPALVSSVAPSQTRAPHPFGVPAPSAG
FT                   AYSRAGVVKTMTGGRAQSIGRRGKVEQLSPEEEEKRRIRRERNKMAAAKCRNRRRELTD
FT                   TLQAETDQLEDEKSALQTEIANLLKEKEKLEFILAAHRPACKIPDDLGFPEEMSVASLD
FT                   LTGGLPEVATPESEEAFTLPLLNDPEPKPSVEPVKSISSMELKTEPFDDFLFPASSRPS
FT                   GSETARSVPDMDLSGSFYAADWEPLHSGSLGMGPMATELEPLCTPVVTCTPSCTAYTSS
FT                   FVFTYPEADSFPSCAAAHRKGSSSNEPSSDSLSSPTLLAL"
FT   exon            <889..1029
FT                   /gene="FOS"
FT                   /number=1
FT                   /note="c-fos protein; G00-119-917"
FT   intron          1030..1782
FT                   /note="c-fos intron A"
FT   exon            1783..2034
FT                   /number=2
FT   intron          2035..2465
FT                   /note="c-fos intron B"
FT   exon            2466..2573
FT                   /number=3
FT   intron          2574..2687
FT                   /note="c-fos intron C"
FT   exon            2688..>3329
FT                   /number=4
FT                   /note="c-fos protein"
XX
SQ   Sequence 6210 BP; 1497 A; 1571 C; 1619 G; 1523 T; 0 other;
     gcaggaacag tgctagtatt gctcgagccc gagggctgga ggttagggga tgaaggtctg        60
     cttccacgct ttgcactgaa ttagggctag aattggggat gggggtaggg gcgcattcct       120
     tcgggagccg aggcttaagt cctcggggtc ctgtactcga tgccgtttct cctatctctg       180
     agcctcagaa ctgtcttcag tttccgtaca agggtaaaaa ggcgctctct gccccatccc       240
     ccccgacctc gggaacaagg gtccgcattg aaccaggtgc gaatgttctc tctcattctg       300
     cgccgttccc gcctcccctc ccccagccgc ggcccccgcc tccccccgca ctgcaccctc       360
     ggtgttggct gcagcccgcg agcagttccc gtcaatccct ccccccttac acaggatgtc       420
     catattagga catctgcgtc agcaggtttc cacggccttt ccctgtagcc ctggggggag       480
     ccatccccga aacccctcat cttggggggc ccacgagacc tctgagacag gaactgcgaa       540
     atgctcacga gattaggaca cgcgccaagg cgggggcagg gagctgcgag cgctggggac       600
     gcagccgggc ggccgcagaa gcgcccaggc ccgcgcgcca cccctctggc gccaccgtgg       660
     ttgagcccgt gacgtttaca ctcattcata aaacgcttgt tataaaagca gtggctgcgg       720
     cgcctcgtac tccaaccgca tctgcagcga gcaactgaga agccaagact gagccggcgg       780
     ccgcggcgca gcgaacgagc agtgaccgtg ctcctaccca gctctgcttc acagcgccca       840
     cctgtctccg cccctcggcc cctcgcccgg ctttgcctaa ccgccacgat gatgttctcg       900
     ggcttcaacg cagactacga ggcgtcatcc tcccgctgca gcagcgcgtc cccggccggg       960
     gatagcctct cttactacca ctcacccgca gactccttct ccagcatggg ctcgcctgtc      1020
     aacgcgcagg taaggctggc ttcccgtcgc cgcggggccg ggggcttggg gtcgcggagg      1080
     aggagacacc gggcgggacg ctccagtaga tgagtagggg gctcccttgt gcctggaggg      1140
     aggctgccgt ggccggagcg gtgccggctc gggggctcgg gacttgctct gagcgcacgc      1200
     acgcttgcca tagtaagaat tggttccccc ttcgggaggc aggttcgttc tgagcaacct      1260
     ctggtctgca ctccaggacg gatctctgac attagctgga gcagacgtgt cccaagcaca      1320
     aactcgctaa ctagagcctg gcttcttcgg ggaggtggca gaaagcggca atcccccctc      1380
     ccccggcagc ctggagcacg gaggagggat gagggaggag ggtgcagcgg gcgggtgtgt      1440
     aaggcagttt cattgataaa aagcgagttc attctggaga ctccggagcg gcgcctgcgt      1500
     cagcgcagac gtcagggata tttataacaa accccctttc aagcaagtga tgctgaaggg      1560
     ataacgggaa cgcagcggca ggatggaaga gacaggcact gcgctgcgga atgcctggga      1620
     ggaaaagggg gagacctttc atccaggatg agggacattt aagatgaaat gtccgtggca      1680
     ggatcgtttc tcttcactgc tgcatgcggc actgggaact cgccccacct gtgtccggaa      1740
     cctgctcgct cacgtcggct ttccccttct gttttgttct aggacttctg cacggacctg      1800
     gccgtctcca gtgccaactt cattcccacg gtcactgcca tctcgaccag tccggacctg      1860
     cagtggctgg tgcagcccgc cctcgtctcc tctgtggccc catcgcagac cagagcccct      1920
     caccctttcg gagtccccgc cccctccgct ggggcttact ccagggctgg cgttgtgaag      1980
     accatgacag gaggccgagc gcagagcatt ggcaggaggg gcaaggtgga acaggtgagg      2040
     aactctagcg tactcttcct gggaatgtgg gggctgggtg ggaagcagcc ccggagatgc      2100
     aggagcccag tacagaggat gaagccactg atggggctgg ctgcacatcc gtaactggga      2160
     gccctggctc caagcccatt ccatcccaac tcagactctg agtctcaccc taagaagtac      2220
     tctcatagtt tcttccctaa gtttcttacc gcatgctttc agactgggct cttctttgtt      2280
     ctcttgctga ggatcttatt ttaaatgcaa gtcacaccta ttctgcaact gcaggtcaga      2340
     aatggtttca cagtggggtg ccaggaagca gggaagctgc aggagccagt tctactgggg      2400
     tgggtgaatg gaggtgatgg cagacacttt tactgaatgt cggtcttttt ttgtgattat      2460
     tctagttatc tccagaagaa gaagagaaaa ggagaatccg aagggaaagg aataagatgg      2520
     ctgcagccaa atgccgcaac cggaggaggg agctgactga tacactccaa gcggtaggta      2580
     ctctgtgggt tgctcctttt taaaacttaa gggaaagttg gagattgagc ataagggccc      2640
     ttgagtaaga ctgtgtctta tgctttcctt tatccctctg tatacaggag acagaccaac      2700
     tagaagatga gaagtctgct ttgcagaccg agattgccaa cctgctgaag gagaaggaaa      2760
     aactagagtt catcctggca gctcaccgac ctgcctgcaa gatccctgat gacctgggct      2820
     tcccagaaga gatgtctgtg gcttcccttg atctgactgg gggcctgcca gaggttgcca      2880
     ccccggagtc tgaggaggcc ttcaccctgc ctctcctcaa tgaccctgag cccaagccct      2940
     cagtggaacc tgtcaagagc atcagcagca tggagctgaa gaccgagccc tttgatgact      3000
     tcctgttccc agcatcatcc aggcccagtg gctctgagac agcccgctcc gtgccagaca      3060
     tggacctatc tgggtccttc tatgcagcag actgggagcc tctgcacagt ggctccctgg      3120
     ggatggggcc catggccaca gagctggagc ccctgtgcac tccggtggtc acctgtactc      3180
     ccagctgcac tgcttacacg tcttccttcg tcttcaccta ccccgaggct gactccttcc      3240
     ccagctgtgc agctgcccac cgcaagggca gcagcagcaa tgagccttcc tctgactcgc      3300
     tcagctcacc cacgctgctg gccctgtgag ggggcaggga aggggaggca gccggcaccc      3360
     acaagtgcca ctgcccgagc tggtgcatta cagagaggag aaacacatct tccctagagg      3420
     gttcctgtag acctagggag gaccttatct gtgcgtgaaa cacaccaggc tgtgggcctc      3480
     aaggacttga aagcatccat gtgtggactc aagtccttac ctcttccgga gatgtagcaa      3540
     aacgcatgga gtgtgtattg ttcccagtga cacttcagag agctggtagt tagtagcatg      3600
     ttgagccagg cctgggtctg tgtctctttt ctctttctcc ttagtcttct catagcatta      3660
     actaatctat tgggttcatt attggaatta acctggtgct ggatattttc aaattgtatc      3720
     tagtgcagct gattttaaca ataactactg tgttcctggc aatagtgtgt tctgattaga      3780
     aatgaccaat attatactaa gaaaagatac gactttattt tctggtagat agaaataaat      3840
     agctatatcc atgtactgta gtttttcttc aacatcaatg ttcattgtaa tgttactgat      3900
     catgcattgt tgaggtggtc tgaatgttct gacattaaca gttttccatg aaaacgtttt      3960
     attgtgtttt taatttattt attaagatgg attctcagat atttatattt ttattttatt      4020
     tttttctacc ttgaggtctt ttgacatgtg gaaagtgaat ttgaatgaaa aatttaagca      4080
     ttgtttgctt attgttccaa gacattgtca ataaaagcat ttaagttgaa tgcgaccaac      4140
     cttgtgctct tttcattctg gaagtcttgt aagtttctga aaggtattat tggagaccag      4200
     tttgtcaaga agggtagctg ctggaggggg acacaccctc tgtctgatcc cttatcaaag      4260
     aggacaagga aactatagag ctgattttag aatattttac aaatacatgc cttccattgg      4320
     aatgctaaga ttttctactg cttctgggga cgggaaaccg ctgtgtaaca gcttttgtgg      4380
     gaatacattt tttctgtttc agtactcgca gggggaaata tttaaatttt gttgtgctaa      4440
     tattaaattc agatgttttg atcttaaagg aaccctttaa gcaaacagaa cctagctttg      4500
     tacagactat tttaactttt tattctcaca aaatcacgtg gagggttatt ctacttcaaa      4560
     gatgagcaaa ttgaagaatg gttagaataa acaactttct tgatattccg ttatcggcat      4620
     tagaatcttc ctgctcgtta tcgtatccag caggctgaac tgcctcttga tacttggtta      4680
     aaaaaaattt tcaggccggg cgcggtggcc catgcctgta atcctagcac tttgggaggc      4740
     cgaggcaggc ggatcacctg aggtcgggag ttcgagacca gcctgaccaa catggagaaa      4800
     ccccgtcttt actaaaaata caaaattagc ctggtgtggt ggtgcatgcc tgtaatccta      4860
     gctacttgag aggctgagac aggaaaatca cttgaactcg ggaggcggat gttgcagcga      4920
     actgagattg cgccattgca ctccagcctg ggcaacaaga ttgaaactct gtttaaaaaa      4980
     aaaagttttc actaatgtgt acattttttt gtactctttt attctcgaaa gggaaggagg      5040
     gctattgccc tatcccttat taataaatgc attgtggttt ctggtttctc taataccata      5100
     tgcccttcat tcagtttata gtgggcggaa gtgggggaga aaaagttgct cagaaatcaa      5160
     aagatatctc aaacagcaca aataatggct gatcgttctg caaacaaaaa gttacataat      5220
     agctcaagaa ggagaagtca acatgactct gaacaagctt taacttagaa actttatcat      5280
     cttaaggaag aacgtgacct ttgtccagga cgtctctggt aatggggcac ttacacacac      5340
     atgcacacgt acaaaccaca gggaaaggag accgcccttc tgcctctgct cgcgagtatc      5400
     acgcaggcac catgcactat gttttcacac acactgggtg gaagaagagc ttcagcgcca      5460
     gtcttctaat gctttggtga taatgaaaat cactgggtgc ttatggggtg tcatattcaa      5520
     tcgagttaaa agttttaatt caaaatgaca gttttactga ggttgatgtt ctcgtctatg      5580
     atatctctgc ccctcccata aaaatggaca tttaaaagca acttaccgct ctttagatca      5640
     ctcctatatc acacaccact tggggtgctg tttctgctag acttgtgatg acagtggcct      5700
     taggatccct gtttgctgtt caaagggcaa atattttata gcctttaaat atacctaaac      5760
     taaatacaga attaatataa ctaacaaaca cctggtctga aataacaagg tgatctaccc      5820
     tggaaggaac ccagctggtg ggccaggagc ggtggctcac acctgtaatt ccagcacttt      5880
     gggaggctga gacaggagga tcactggagt ccaggagttt gagaccagcc tgggcaacat      5940
     ggcaaaaccc agtgtgcttc tgttgtccca gctacactac tcaggaggct gaggcaggag      6000
     tatgacttga gcctgggagg gggaggttgc agagaactga tattgcacca ccactgcact      6060
     ccagcctggg tgacacagca aaaccctatc tcaaaaaaaa aaaaaaaaaa aaggaaccca      6120
     gctggttcct gtaggtgtgc aataataaca accagaggaa gaaaaggaag acgatttccc      6180
     agatgaagaa gggcagctgg accttcggac                                       6210
//