Dbfetch

LOCUS       NM_001029045            2189 bp    mRNA    linear   INV 22-NOV-2023
DEFINITION  Caenorhabditis elegans Polypeptide
            N-acetylgalactosaminyltransferase 4 (gly-4), mRNA.
ACCESSION   NM_001029045
VERSION     NM_001029045.6
DBLINK      BioProject: PRJNA158
KEYWORDS    RefSeq.
SOURCE      Caenorhabditis elegans
  ORGANISM  Caenorhabditis elegans
            Eukaryota; Metazoa; Ecdysozoa; Nematoda; Chromadorea; Rhabditida;
            Rhabditina; Rhabditomorpha; Rhabditoidea; Rhabditidae; Peloderinae;
            Caenorhabditis.
REFERENCE   1  (bases 1 to 2189)
  AUTHORS   Sulson,J.E. and Waterston,R.
  CONSRTM   Caenorhabditis elegans Sequencing Consortium
  TITLE     Genome sequence of the nematode C. elegans: a platform for
            investigating biology
  JOURNAL   Science 282 (5396), 2012-2018 (1998)
   PUBMED   9851916
  REMARK    Erratum:[Science 1999 Jan 1;283(5398):35]
REFERENCE   2  (bases 1 to 2189)
  CONSRTM   NCBI Genome Project
  TITLE     Direct Submission
  JOURNAL   Submitted (22-NOV-2023) National Center for Biotechnology
            Information, NIH, Bethesda, MD 20894, USA
REFERENCE   3  (bases 1 to 2189)
  AUTHORS   WormBase.
  CONSRTM   WormBase Consortium
  TITLE     Direct Submission
  JOURNAL   Submitted (29-OCT-2023) WormBase Group, European Bioinformatics
            Institute, Cambridge, CB10 1SA, UK. Email: help@wormbase.org
REFERENCE   4  (bases 1 to 2189)
  AUTHORS   Sulson,J.E. and Waterston,R.
  TITLE     Direct Submission
  JOURNAL   Submitted (03-MAR-2003) Nematode Sequencing Project: Sanger
            Institute, Hinxton, Cambridge CB10 1SA, UK and The Genome Institute
            at Washington University, St. Louis, MO 63110, USA
COMMENT     REVIEWED REFSEQ: This record has been curated by WormBase. This
            record is derived from an annotated genomic sequence (NC_003283).
            
            On Feb 2, 2021 this sequence version replaced NM_001029045.5.
FEATURES             Location/Qualifiers
     source          1..2189
                     /organism="Caenorhabditis elegans"
                     /mol_type="mRNA"
                     /strain="Bristol N2"
                     /db_xref="taxon:6239"
                     /chromosome="V"
     gene            1..2189
                     /gene="gly-4"
                     /locus_tag="CELE_Y116F11B.12"
                     /db_xref="GeneID:180302"
                     /db_xref="WormBase:WBGene00001629"
     CDS             138..1907
                     /gene="gly-4"
                     /locus_tag="CELE_Y116F11B.12"
                     /standard_name="Y116F11B.12a"
                     /note="Confirmed by transcript evidence"
                     /codon_start=1
                     /product="Polypeptide N-acetylgalactosaminyltransferase 4"
                     /protein_id="NP_001024216.1"
                     /db_xref="EnsemblGenomes-Gn:WBGene00001629"
                     /db_xref="EnsemblGenomes-Tr:Y116F11B.12a.1"
                     /db_xref="EnsemblGenomes-Tr:Y116F11B.12a.2"
                     /db_xref="GeneID:180302"
                     /db_xref="WormBase:WBGene00001629"
                     /translation="MLPRMLKMKTVGTVLAVIWLFGLAFIYVQSTSSSLRPPGRHPPP
                     LPQLDPLIPQNPPQNDEIRPKKSAPPIPTINLAEDTTIHERTEKDVTWKTFDVEKFLN
                     KGKWHQGEDKYKANSFNQEASDALNPTRKIPDSREPQCRDVDYSKVGMQPTTVIITYH
                     NEARSSLLRTVFSVFNQSPEELLLEIVLVDDNSQDVEIGKELAQIQRITVLRNNQREG
                     LIRSRVKGAQVARAPVLTFLDSHIECNQKWLEPLLARIAENPKAVVAPIIDVINVDNF
                     NYVGASADLRGGFDWTLVFRWEFMNEQLRKERHAHPTAPIRSPTMAGGLFAISKEWFN
                     ELGTYDLDMEVWGGENLEMSFRVWQCGGSLEIMPCSRVGHVFRKKHPYTFPGGSGNVF
                     QKNTRRAAEVWMDEYKAIYLKNVPSARFVNFGDITDRLAIRDRLQCKSFKWYLENVYP
                     QLEIPRKTPGKSFQMKIGNLCLDSMARKESEAPGLFGCHGTGGNQEWVFDQLTKTFKN
                     AISQLCLDFSSNTENKTVTMVKCENLRPDTMVVEKNGWLTQGGKCLTVNQGSGGDWLI
                     YGAHCELNNGAQRWIFEKLDTYE"
ORIGIN      
        1 tactcactca tgtccaccgc cgggacgaga aactgagctt cttgtgcggg aaattttcaa
       61 cttttcacac atttcttttt ggtttaatta ttggataaag acacagaaga aagcattcat
      121 taaaaaaaat tgccaaaatg ctgccgagaa tgctgaaaat gaagacggtg ggcaccgttt
      181 tggcagtcat ttggctgttt ggattggcat tcatttatgt gcaatctacg agctcaagct
      241 taaggccacc gggacgtcat ccaccaccac taccacagct cgacccttta ataccccaaa
      301 acccgccgca aaacgacgaa attcggccga aaaagagcgc gccgcccatt ccaacgataa
      361 atttggcaga agataccaca attcatgaga gaaccgaaaa agatgtcact tggaagacat
      421 tcgatgtgga aaagtttttg aataagggga aatggcatca gggagaggac aaatacaagg
      481 ccaactcatt caaccaagaa gcctccgacg cgctaaaccc cacccgaaaa attccggatt
      541 cccgtgagcc ccaatgccgt gacgtggatt attcgaaagt tggcatgcag ccaactacag
      601 taatcattac ttaccataat gaagcccgga gctcactttt acggacggtc tttagtgttt
      661 tcaatcagtc accggaggaa ttgctgctgg aaattgtgct agtcgacgat aattcccagg
      721 atgtcgaaat tggaaaagag ttggctcaaa ttcaacgaat tacagtactc cgtaataatc
      781 aacgggaggg tctgattcgg agccgggtta aaggagccca agtggctcgg gctccggtgc
      841 tcacattcct cgatagtcat attgagtgta atcagaaatg gcttgaaccc ctgttggcta
      901 gaattgccga gaatccgaaa gccgtcgttg caccgattat cgatgttatc aatgttgata
      961 attttaatta tgttggagcg agtgccgatt tgaggggagg attcgactgg accctagtct
     1021 tccgctggga attcatgaac gaacagctcc gcaaggaacg ccacgcccat ccgacggcgc
     1081 ctattcggtc gcctacaatg gccggaggcc tattcgcaat ctcaaaagaa tggttcaacg
     1141 aactgggaac ctatgacctc gatatggaag tatggggtgg cgaaaatctg gaaatgtcat
     1201 tcagagtctg gcagtgcggc ggctcactgg aaattatgcc atgctcccgg gttgggcatg
     1261 ttttccggaa gaaacatcct tatacattcc ccgggggatc cggaaacgtg ttccagaaaa
     1321 atacgagaag agccgctgaa gtatggatgg acgagtataa ggcgatttat ttgaaaaatg
     1381 taccttcggc cagatttgtc aattttggag acataaccga ccgcctggcc attcgagacc
     1441 gcctacagtg taaatcgttc aaatggtacc tggaaaatgt gtacccacag ttggaaatcc
     1501 cgcgaaaaac gcctggaaaa tcgttccaaa tgaaaatcgg caacctctgc ttggattcga
     1561 tggctcgaaa agaatcagaa gctccggggc tcttcggttg tcatggtacc ggtggaaatc
     1621 aggaatgggt ctttgatcag ctcaccaaga catttaaaaa tgcgatttct cagttgtgcc
     1681 tcgatttttc gtcaaacacc gagaataaga cggtgacaat ggtcaaatgt gaaaatctga
     1741 gacccgacac aatggtcgtg gagaaaaacg gatggctaac gcaaggcgga aaatgcctta
     1801 cggtgaatca gggctccggc ggcgattggc tcatctacgg agctcactgt gagcttaaca
     1861 atggtgctca gcgatggatt ttcgagaaat tggatactta tgaataaaaa atcgattttt
     1921 tttcgcattt cccatctcaa taatatcatt tttcccttaa ttttcctgtg attttcccaa
     1981 ttttttactc cgttttcccc ttaaaaatgt gccttttttc ctgccttttc cccccctatg
     2041 aaattccaat ttttcaatcg atacttgccc ttattaactt tctttttttt caatttttct
     2101 acttaatact ttaatttata tgttttaatt gtcatacatg acactgaaaa atttttgcca
     2161 aaaatttgaa ttaataaatt ttgtttttt
//