Dbfetch

LOCUS       NM_001129118            2002 bp    mRNA    linear   INV 22-NOV-2023
DEFINITION  Caenorhabditis elegans SUZ domain-containing protein (szy-20),
            mRNA.
ACCESSION   NM_001129118
VERSION     NM_001129118.4
DBLINK      BioProject: PRJNA158
KEYWORDS    RefSeq.
SOURCE      Caenorhabditis elegans
  ORGANISM  Caenorhabditis elegans
            Eukaryota; Metazoa; Ecdysozoa; Nematoda; Chromadorea; Rhabditida;
            Rhabditina; Rhabditomorpha; Rhabditoidea; Rhabditidae; Peloderinae;
            Caenorhabditis.
REFERENCE   1  (bases 1 to 2002)
  AUTHORS   Sulson,J.E. and Waterston,R.
  CONSRTM   Caenorhabditis elegans Sequencing Consortium
  TITLE     Genome sequence of the nematode C. elegans: a platform for
            investigating biology
  JOURNAL   Science 282 (5396), 2012-2018 (1998)
   PUBMED   9851916
  REMARK    Erratum:[Science 1999 Jan 1;283(5398):35]
REFERENCE   2  (bases 1 to 2002)
  CONSRTM   NCBI Genome Project
  TITLE     Direct Submission
  JOURNAL   Submitted (22-NOV-2023) National Center for Biotechnology
            Information, NIH, Bethesda, MD 20894, USA
REFERENCE   3  (bases 1 to 2002)
  AUTHORS   WormBase.
  CONSRTM   WormBase Consortium
  TITLE     Direct Submission
  JOURNAL   Submitted (29-OCT-2023) WormBase Group, European Bioinformatics
            Institute, Cambridge, CB10 1SA, UK. Email: help@wormbase.org
REFERENCE   4  (bases 1 to 2002)
  AUTHORS   Sulson,J.E. and Waterston,R.
  TITLE     Direct Submission
  JOURNAL   Submitted (03-MAR-2003) Nematode Sequencing Project: Sanger
            Institute, Hinxton, Cambridge CB10 1SA, UK and The Genome Institute
            at Washington University, St. Louis, MO 63110, USA
COMMENT     REVIEWED REFSEQ: This record has been curated by WormBase. This
            record is derived from an annotated genomic sequence (NC_003280).
            
            On Apr 15, 2020 this sequence version replaced NM_001129118.3.
FEATURES             Location/Qualifiers
     source          1..2002
                     /organism="Caenorhabditis elegans"
                     /mol_type="mRNA"
                     /strain="Bristol N2"
                     /db_xref="taxon:6239"
                     /chromosome="II"
     gene            1..2002
                     /gene="szy-20"
                     /locus_tag="CELE_C18E9.3"
                     /db_xref="GeneID:174430"
                     /db_xref="WormBase:WBGene00004105"
     CDS             35..1726
                     /gene="szy-20"
                     /locus_tag="CELE_C18E9.3"
                     /standard_name="C18E9.3d"
                     /note="Confirmed by transcript evidence"
                     /codon_start=1
                     /product="SUZ domain-containing protein"
                     /protein_id="NP_001122590.1"
                     /db_xref="EnsemblGenomes-Gn:WBGene00004105"
                     /db_xref="EnsemblGenomes-Tr:C18E9.3a"
                     /db_xref="EnsemblGenomes-Tr:C18E9.3d"
                     /db_xref="GeneID:174430"
                     /db_xref="GOA:B2D6L4"
                     /db_xref="InterPro:IPR024771"
                     /db_xref="UniProtKB/TrEMBL:B2D6L4"
                     /db_xref="WormBase:WBGene00004105"
                     /translation="MSKENVSLVVADSWDDADADPVKELMDKVEKVKLLQRKEEKKEA
                     FFEKVKAEESSGVVSKLQTEEGLGPSAEEPKRVFLRRPKDGFAASENVIEASPPTSAD
                     TEEQPVTNVRSRSHHKLNQKEKQPAPTYEERQAAYQAARNRILGTEYKPDNQEIKEIK
                     FIDRSKSPETLKMTQQNMVEHYGEELSRELMEQPAEIVPPERQYTPDFTLQQPPPSVS
                     ESGGVYNGPPGFQQKQPNFQPTLQQQSLHQQQYLDNQYMMQMNVQIPIQYHNQTQHQF
                     VPHEASAISTTSQNSNGDGQNDQAIYYYQAPTQQPMNYIPYNLPNMAYPPPNFQPQGQ
                     LHHQMNAGQLHQIQQQQQQCQQIQHQPPQQHQQVINGQVMNQQNQRNQVNSYPQQNGA
                     GRGQNRQPMMYQMPCNSGPTAKPPPLMNQMQNRCMTNNGQNYQNRNMQQQGQQRSYSS
                     QPQNGQFYQNGNSNQNNPNNGRKQQHQPQQQQNKSGKFGQNRNDMQKNNYQPNLQQPP
                     MSQNPIPFGCPPRNVNAIREQHANNGSPNTGAGILGPHPMMSASQWPALQQNRPQ"
ORIGIN      
        1 agccacacac atttcctctg tttctaattg cgttatgagt aaagaaaatg tttctctagt
       61 tgtcgccgat agctgggatg atgcagatgc ggatccagtc aaggaattaa tggataaggt
      121 tgagaaggta aaacttcttc agcggaagga agaaaagaag gaagcatttt ttgagaaagt
      181 aaaagcagaa gagagtagcg gtgtcgtttc gaaactccag acagaagaag gtctcggacc
      241 atcagctgaa gagcctaaac gagtgttcct tcggcgccct aaagatggtt ttgctgcatc
      301 tgaaaatgtc atcgaagcat cgccaccaac atctgcagat acagaagaac agccagtgac
      361 aaacgtccga tctcgctctc accacaaatt aaatcaaaag gaaaaacaac ctgctcctac
      421 ttatgaggaa cgacaagctg cataccaagc agctcgtaac agaattttgg gaaccgagta
      481 caaacccgat aatcaggaaa tcaaagaaat caagtttatt gatcgctcca aatcacctga
      541 aactctcaaa atgactcaac aaaacatggt agagcactat ggagaggaat tgagccgcga
      601 attaatggag cagccagctg aaattgtccc tcctgaacgg caatatactc cagattttac
      661 gcttcagcag ccaccaccat cggtatcgga gagcggcgga gtttacaatg gaccgcctgg
      721 gtttcaacag aagcaaccaa atttccagcc aacgttacaa caacaatcgc ttcatcaaca
      781 acagtatttg gataatcagt atatgatgca gatgaacgta caaattccga tacagtatca
      841 taatcagacc caacatcagt ttgttccgca tgaagcctca gctatttcca caacatcaca
      901 aaacagcaac ggtgatggtc aaaatgatca agcgatatat tattatcagg cgcctaccca
      961 acagccaatg aactacattc cgtacaatct accaaacatg gcctacccac ctccaaactt
     1021 ccaaccccaa ggacaactgc accatcaaat gaatgcagga caactacacc aaattcaaca
     1081 acaacagcaa caatgccaac agattcaaca tcaaccgcct cagcaacacc aacaggttat
     1141 aaatggccaa gtgatgaatc aacagaacca aagaaatcag gtgaatagtt atccacagca
     1201 gaatggtgct ggtcgtggac agaatcgaca gccgatgatg tatcagatgc catgcaacag
     1261 tgggccgaca gcaaagcccc cgccgttgat gaatcaaatg cagaatagat gtatgaccaa
     1321 caatggtcaa aactatcaga ataggaatat gcagcagcaa ggtcagcagc gatcatattc
     1381 gtcacagcct cagaatggtc agttctacca aaacggaaat tccaaccaga acaatccgaa
     1441 taatggtaga aaacagcagc atcagccaca gcagcagcag aacaaatcag gaaaattcgg
     1501 acagaataga aatgatatgc aaaagaacaa ttatcaacca aatctacagc aacctccgat
     1561 gagtcaaaat ccaattccat ttggatgccc accacgtaat gtgaatgcga ttcgagaaca
     1621 acacgcaaac aatggatccc caaacactgg cgctggaatt cttggaccac atccaatgat
     1681 gtctgcatcc caatggccag cgttgcagca gaatcggcct caatagtttg ttattccatt
     1741 ctacgaacac tctatagaca attcatgctt taaccacgtc tttttgatgt gctgtgatgg
     1801 tcatcttttc acatttatct cccttttctt gttccatcag tccgattcgg aattgtgtta
     1861 atcaacacgg gtcgtacttc ctctttctcc ccccatctcc acatatttat atcattattt
     1921 tctacattca ttttggcatg tttcaagtta ttcaattttc tattgttata tgagccaagt
     1981 ttgatgaaga aattatcttg tt
//