Dbfetch

LOCUS       NM_001356738            1140 bp    mRNA    linear   INV 22-NOV-2023
DEFINITION  Caenorhabditis elegans Homeobox domain-containing protein (ceh-22),
            partial mRNA.
ACCESSION   NM_001356738
VERSION     NM_001356738.3
DBLINK      BioProject: PRJNA158
KEYWORDS    RefSeq.
SOURCE      Caenorhabditis elegans
  ORGANISM  Caenorhabditis elegans
            Eukaryota; Metazoa; Ecdysozoa; Nematoda; Chromadorea; Rhabditida;
            Rhabditina; Rhabditomorpha; Rhabditoidea; Rhabditidae; Peloderinae;
            Caenorhabditis.
REFERENCE   1  (bases 1 to 1140)
  AUTHORS   Sulson,J.E. and Waterston,R.
  CONSRTM   Caenorhabditis elegans Sequencing Consortium
  TITLE     Genome sequence of the nematode C. elegans: a platform for
            investigating biology
  JOURNAL   Science 282 (5396), 2012-2018 (1998)
   PUBMED   9851916
  REMARK    Erratum:[Science 1999 Jan 1;283(5398):35]
REFERENCE   2  (bases 1 to 1140)
  CONSRTM   NCBI Genome Project
  TITLE     Direct Submission
  JOURNAL   Submitted (22-NOV-2023) National Center for Biotechnology
            Information, NIH, Bethesda, MD 20894, USA
REFERENCE   3  (bases 1 to 1140)
  AUTHORS   WormBase.
  CONSRTM   WormBase Consortium
  TITLE     Direct Submission
  JOURNAL   Submitted (29-OCT-2023) WormBase Group, European Bioinformatics
            Institute, Cambridge, CB10 1SA, UK. Email: help@wormbase.org
REFERENCE   4  (bases 1 to 1140)
  AUTHORS   Sulson,J.E. and Waterston,R.
  TITLE     Direct Submission
  JOURNAL   Submitted (03-MAR-2003) Nematode Sequencing Project: Sanger
            Institute, Hinxton, Cambridge CB10 1SA, UK and The Genome Institute
            at Washington University, St. Louis, MO 63110, USA
COMMENT     REVIEWED REFSEQ: This record has been curated by WormBase. This
            record is derived from an annotated genomic sequence (NC_003283).
            
            On Apr 15, 2020 this sequence version replaced NM_001356738.2.
            COMPLETENESS: incomplete on both ends.
FEATURES             Location/Qualifiers
     source          1..1140
                     /organism="Caenorhabditis elegans"
                     /mol_type="mRNA"
                     /strain="Bristol N2"
                     /db_xref="taxon:6239"
                     /chromosome="V"
     gene            <1..>1140
                     /gene="ceh-22"
                     /locus_tag="CELE_F29F11.5"
                     /db_xref="GeneID:179485"
                     /db_xref="WormBase:WBGene00000445"
     CDS             1..1140
                     /gene="ceh-22"
                     /locus_tag="CELE_F29F11.5"
                     /standard_name="F29F11.5d"
                     /note="Partially confirmed by transcript evidence"
                     /codon_start=1
                     /product="Homeobox domain-containing protein"
                     /protein_id="NP_001343841.1"
                     /db_xref="GeneID:179485"
                     /db_xref="GOA:A0A2C9C3N2"
                     /db_xref="InterPro:IPR001356"
                     /db_xref="InterPro:IPR009057"
                     /db_xref="InterPro:IPR017970"
                     /db_xref="InterPro:IPR020479"
                     /db_xref="UniProtKB/TrEMBL:A0A2C9C3N2"
                     /db_xref="WormBase:WBGene00000445"
                     /translation="MFNVSALAAATPSIASVSSVASPSEQHGLSTSVGVGVNDTTSRT
                     GDGGAASSASSASAAPQQQSQSALHNKTFHFYIHNFSIRVIHFYSIISKKFFGENSKS
                     LEAKWDTLLPTDTNLQCSTWPDSIPLLAVSGYSATPTFSFDPCTYGSYDPSAYFASNG
                     IAGSMYTLPDQFPRSENDMLDNSNTSNGNKSDKDGIKLEDEDEILEDEENDEEDDGTG
                     KRKKRKRRVLFTKAQTYELERRFRSQKYLSAPEREALAMQIRLTPTQVKIWFQNHRYK
                     TKKSHTDKPINAALLTTMPNAFSSQSTAASFPTRAMPIPMLVRDSSARSSDISSTSPY
                     TVAFGSANSGYLPTPSAYLPATSGYFSNGPSAASSYMTNTQWWPS"
ORIGIN      
        1 atgttcaacg tgtcggcgct agcagcagcg acgccttcta tcgcttcggt ttcatccgtt
       61 gcaagcccat cggagcaaca tggattgtct acaagtgttg gcgtcggagt gaatgatacc
      121 acttctcgaa ctggagatgg cggcgccgct tcatcggctt caagtgcatc agcggcgcca
      181 caacagcagt cacaatcggc acttcataac aagacgtttc atttctatat ccacaacttt
      241 tccattcgcg ttattcattt ctactcaatt atttccaaga agttttttgg cgaaaattcc
      301 aaatcactcg aagctaaatg ggacactcta cttcccaccg acaccaattt acaatgttcc
      361 acgtggcctg atagcattcc attacttgca gtttcaggat attctgctac tcccacattt
      421 tccttcgatc cttgcacata cggcagctat gatccatctg catattttgc ttcaaacgga
      481 attgctggtt ccatgtacac tctacctgat caatttccac gttctgagaa tgatatgcta
      541 gataacagca atacatcaaa tggaaacaaa agcgataaag atggaatcaa acttgaagat
      601 gaagatgaaa ttctggaaga tgaagagaat gacgaagaag atgatggaac tggaaaacgg
      661 aaaaagagaa agcgtcgcgt tttgttcaca aaagcacaaa cttatgaact tgaacgacga
      721 ttccgctcgc aaaaatatct gagcgcgcct gaacgtgaag ctcttgcaat gcaaattcga
      781 cttactccga ctcaagtaaa aatttggttc caaaatcatc gatacaaaac aaaaaaaagt
      841 catacggata agccaataaa cgcggcgctt cttaccacaa tgcccaatgc attttcaagt
      901 caatcgacag cggccagttt tccaacaaga gcaatgccga taccaatgct agtccgtgac
      961 tcttctgctc gttcttcgga catttcctca acatctccat acacggtagc atttggaagt
     1021 gccaattcag gatacctacc aacaccttcc gcctacctcc cagccacttc cgggtatttt
     1081 tcaaacggac cttcagcagc ttcttcctac atgaccaata ctcaatggtg gccttcttga
//