spacer
spacer

EBI Dbfetch

ID   U48404; SV 2; linear; genomic DNA; STD; PRO; 2898 BP.
XX
AC   U48404;
XX
DT   14-MAR-1996 (Rel. 47, Created)
DT   07-DEC-2006 (Rel. 90, Last updated, Version 2)
XX
DE   Azotobacter chroococcum strain MCD1 HisI (hisI), HisE (hisE), TatA (tatA),
DE   TatB (tatB), and tatC (tatC) genes, complete cds; and unknown genes.
XX
KW   .
XX
OS   Azotobacter chroococcum
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Pseudomonadales;
OC   Pseudomonadaceae; Azotobacter.
XX
RN   [1]
RP   1-2898
RA   Yates M., Souza E.M.;
RT   "A second DNA region involved in H2-dependent respiration in Azotobacter
RT   chroococcum";
RL   Unpublished.
XX
RN   [2]
RP   1-2898
RA   Yates M.G., Souza E.M.;
RT   ;
RL   Submitted (05-FEB-1996) to the EMBL/GenBank/DDBJ databases.
RL   Department of Biochemistry, Universidade Federal do Parana, Centro
RL   Politecnico - Jardim das Americas, Curitiba, Pr 81531-990, Brazil
XX
RN   [3]
RC   Sequence update by submitter
RP   1-2898
RA   Souza E.M.;
RT   ;
RL   Submitted (04-DEC-2006) to the EMBL/GenBank/DDBJ databases.
RL   Department of Biochemistry, Universidade Federal do Parana, Centro
RL   Politecnico - Jardim das Americas, Curitiba, Pr 81531-990, Brazil
XX
CC   On Dec 5, 2006 this sequence version replaced gi:1224003.
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..2898
FT                   /organism="Azotobacter chroococcum"
FT                   /strain="MCD1"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:353"
FT   CDS             <1..534
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /product="unknown"
FT                   /note="ORF1"
FT                   /db_xref="GOA:Q43924"
FT                   /db_xref="UniProtKB/Swiss-Prot:Q43924"
FT                   /protein_id="AAA92105.1"
FT                   /translation="EFEAAIRTVCEPIFEKPLKDISFGQLLLRLFQTARRFNMEVQPQL
FT                   VLLQKTLLNIEGLGRQLYPELDLWTTAKPFLERWMRKRMSPKAMLDNLQGQLEQLPHLA
FT                   QMTRAALEGMARPAHGAPPPRDRHILRLLGAALLAGGVLLASRAPLNVADAWPGWLMLA
FT                   SGLYLLVRRQRFPD"
FT   gene            566..976
FT                   /gene="hisI"
FT   RBS             566..569
FT                   /gene="hisI"
FT   CDS             575..976
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="hisI"
FT                   /product="HisI"
FT                   /note="ORF2; similar to the N-terminal of phosphoribosyl
FT                   c-AMP hydrolase"
FT                   /db_xref="GOA:Q43925"
FT                   /db_xref="InterPro:IPR002496"
FT                   /db_xref="UniProtKB/Swiss-Prot:Q43925"
FT                   /protein_id="AAA92106.1"
FT                   /translation="MKDWLDEIHWNADGLVPAIAQDHKTGRILMMAWMNRESLALTVRE
FT                   NRAIYWSRSRGKLWRKGEESGHLQKVHEVRLDCDADVIVLQVEQLGGIACHTGRESCFY
FT                   RVFEDGAWKVVEPILKDPDAIYHAGHRHE"
FT   gene            958..1301
FT                   /gene="hisE"
FT   RBS             958..961
FT                   /gene="hisE"
FT   CDS             969..1301
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="hisE"
FT                   /product="HisE"
FT                   /note="ORF3; similar to the C-terminal of phosphoribosyl
FT                   c-AMP hydrolase"
FT                   /db_xref="GOA:Q43926"
FT                   /db_xref="InterPro:IPR008179"
FT                   /db_xref="UniProtKB/Swiss-Prot:Q43926"
FT                   /protein_id="AAA92107.1"
FT                   /translation="MSDTLNQLAEVLEARKNAAPDSSYVASLYHKGLNKILEKVGEESV
FT                   ETILAAKDAAASGDCSELIYETADLWFHSLVMLAALGQHPQAVLDELERRFGLSGHAEK
FT                   AARPKS"
FT   gene            1341..1585
FT                   /gene="tatA"
FT   RBS             1341..1345
FT                   /gene="tatA"
FT   CDS             1352..1585
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="tatA"
FT                   /product="TatA"
FT                   /note="ORF4"
FT                   /db_xref="GOA:A1EHP9"
FT                   /db_xref="InterPro:IPR006312"
FT                   /db_xref="UniProtKB/TrEMBL:A1EHP9"
FT                   /protein_id="ABL10099.1"
FT                   /translation="MGFGGISIWQLLIILLIVVMLFGTKRLKSLGSDLGDAIKGFRKSM
FT                   DNEENKAPPVEEQKGQTIEAQARKVEEPARKD"
FT   gene            1574..1929
FT                   /gene="tatB"
FT   RBS             1574..1577
FT                   /gene="tatA"
FT   CDS             1588..1929
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="tatB"
FT                   /product="TatB"
FT                   /note="ORF5"
FT                   /db_xref="GOA:A1EHQ0"
FT                   /db_xref="InterPro:IPR003998"
FT                   /db_xref="UniProtKB/TrEMBL:A1EHQ0"
FT                   /protein_id="ABL10100.1"
FT                   /translation="MFDIGFSELLLVGLVALLVLGPERLPVAARMAGLWIGRLKRSFNT
FT                   LKTEVEREIGADEIRRQLHNERILELEREMKQSLQPPAPSAPDETAASPATPPQPASPA
FT                   AHSDKTPSP"
FT   gene            1913..2693
FT                   /gene="tatC"
FT   RBS             1913..1917
FT                   /gene="tatB"
FT   CDS             1926..2693
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /gene="tatC"
FT                   /product="tatC"
FT                   /note="ORF6; mutations in this gene affect the culture pH"
FT                   /db_xref="GOA:P54085"
FT                   /db_xref="InterPro:IPR019822"
FT                   /db_xref="UniProtKB/Swiss-Prot:P54085"
FT                   /protein_id="AAA92109.2"
FT                   /translation="MTARPDSDQDMPLVAHLTELRSRLLRSVAAVLLIFAALFYFAQDI
FT                   YALVSAPLRAYLPEGATMIATGVASPFLAPFKLTLMISLFLAMPVVLHQVWGFIAPGLY
FT                   QHEKRIAMPLMASSVLLFYAGMAFAYFVVFPIMFGFFASVTPEGVAMMTDIGQYLDFVL
FT                   TLFFAFGVAFEVPVATFLLIWVGIVDVASLRNSRPYVIVGCFVVGMVLTPPDVFSQTLL
FT                   AVPMWLLFEIGVFFGARIRHREEPAASDGPSQP"
FT   sig_peptide     1926..2021
FT                   /gene="tatC"
FT   mat_peptide     2022..2660
FT                   /gene="tatC"
FT                   /product="TatC"
FT   CDS             2690..>2898
FT                   /codon_start=1
FT                   /transl_table=11
FT                   /product="unknown"
FT                   /note="ORF7"
FT                   /db_xref="UniProtKB/TrEMBL:A1EHP8"
FT                   /protein_id="ABL10101.1"
FT                   /translation="MNLLLLDDADFVAADRVILRDRRLRHLQEVHRAEAGDGLRIGRLG
FT                   GVMGEGRLLRLEAAEAELQVAFDR"
XX
SQ   Sequence 2898 BP; 481 A; 1030 C; 918 G; 469 T; 0 other;
     gaattcgagg cggcgatccg caccgtctgc gagccgatct tcgagaagcc cttgaaggac        60
     atctccttcg gccagctgct gctgcgcctg ttccagaccg cccggcgctt caacatggag       120
     gtccagccgc agctggtgct gctgcagaag accctgctca acatcgaggg gctcggccgc       180
     cagctctatc cggagctgga cctgtggacc accgccaagc ccttcctcga gcgctggatg       240
     cgcaagcgca tgagcccgaa ggccatgctc gacaacctgc agggccagct cgaacagctg       300
     ccgcatctgg cgcagatgac ccgcgcggcg ctggaaggca tggcccggcc ggcgcacggc       360
     gccccgccgc cccgcgaccg gcacatcctg cgcctgctcg gcgccgccct gctggccggc       420
     ggcgtgctgc tcgccagccg ggcgccgctg aacgtcgcgg acgcctggcc gggctggctg       480
     atgctcgcca gcggcctcta tctgctggta cgccgccagc gcttccccga ctgacccggt       540
     tgtcgcgacg cccgcacgtc gcaacggagt ggatatgaaa gactggctgg acgagattca       600
     ctggaacgcc gatggcctgg taccggccat cgcccaggat cacaagaccg ggcgcatcct       660
     gatgatggcc tggatgaacc gcgagtccct ggccctgacc gtccgggaaa atcgcgccat       720
     ctactggtca cgctcgcgtg gtaagctctg gcgcaaaggc gaggaatcgg gccacctgca       780
     gaaggtgcac gaagtgcgcc tggactgcga cgccgacgtg atcgtcctgc aggtcgagca       840
     gctcggcggc atcgcctgcc acaccggccg cgaaagctgc ttctaccgcg ttttcgaaga       900
     cggcgcctgg aaggtcgtcg agccgatcct caaggacccc gacgccatct accatgcagg       960
     acaccgtcat gagtgacacc ctcaaccagc tggccgaagt gctagaggcg cgcaagaacg      1020
     ccgccccgga cagctcctac gtggccagcc tgtaccacaa gggcctgaac aagatcctcg      1080
     agaaggtcgg cgaggaatcg gtggaaacca tcctcgccgc caaggacgcc gccgccagcg      1140
     gcgactgcag cgagctgatc tacgagaccg ccgacctctg gttccacagc ctggtcatgc      1200
     tcgccgccct cggccagcat ccccaggccg tgctcgacga actggagcgg cgcttcggcc      1260
     tgtccgggca tgcggaaaag gccgcacggc cgaagtcctg agcacggccg ggacacggca      1320
     atttcttcac gtctttacgg agcgaaccat catgggtttt ggcggtatca gcatctggca      1380
     acttctgatc atcctgctca tcgtcgtcat gctgttcggc accaagcgcc tgaagagcct      1440
     tggctcggac ctgggcgatg cgatcaaggg cttccgcaag tcgatggaca acgaggagaa      1500
     caaggcgccg cccgtcgaag agcagaaagg ccagaccatc gaggcccagg cccgcaaggt      1560
     cgaggaaccg gccaggaaag actgagcatg ttcgacatcg gcttcagcga actcctgctg      1620
     gtcggcctgg tcgccctgct ggtgctcggc cccgagcgcc tgccggtcgc cgcgcgcatg      1680
     gccgggctgt ggatcggccg cctgaaacgc agcttcaaca ccctcaagac agaagtggag      1740
     cgcgagatcg gcgccgacga gattcgccgc cagctgcata acgagcgaat cctcgagctg      1800
     gagcgggaga tgaagcagag cctgcagccg ccggcgccga gcgcgccgga cgagaccgcg      1860
     gccagccctg cgacgccccc tcagccggcc tcccctgccg cccactccga caagacgccc      1920
     agcccatgac agcccgaccg gacagcgacc aggacatgcc cctggtcgcg cacctgaccg      1980
     agctgcgctc gcgcctgctg cgcagcgtgg cggcagtgct gctgatcttc gccgcactct      2040
     tctacttcgc ccaggacatc tacgccctgg tctcggcgcc cctgcgcgcc tacctgccgg      2100
     aaggcgcgac catgatcgcc accggcgtgg cctcgccgtt cctcgcgccg ttcaagctga      2160
     ccctgatgat ctcgctgttc ctcgccatgc cggtggtcct ccaccaggtc tggggcttca      2220
     tcgcgccggg gctgtaccag cacgagaaac gcatcgccat gccgttgatg gcctccagcg      2280
     tgctgctctt ctatgccggc atggccttcg cctacttcgt ggtcttcccg atcatgttcg      2340
     gcttcttcgc cagcgtgacc ccggaaggcg tggcgatgat gaccgatatc ggccagtacc      2400
     tggacttcgt gctcaccctg ttcttcgcct tcggtgtggc cttcgaggtg ccggtggcga      2460
     ccttcctgct gatctgggtg ggcatcgtcg acgtggcaag cctgcgcaac agtcgcccct      2520
     acgtgatcgt cggctgcttc gtggtcggca tggtcctcac cccgccagac gtgttctccc      2580
     agaccctgct cgccgtgccc atgtggctgc tgttcgagat cggcgtgttc ttcggcgcgc      2640
     ggatccgcca ccgcgaggag ccggccgcct ccgacggccc gtcgcaaccg tgaacctgct      2700
     gctgctcgac gacgccgact tcgtcgccgc cgaccgggtg atcctgcgcg accgccgcct      2760
     gcgccacctg caggaagtgc atcgcgccga ggccggcgac ggcctgcgca tcggccgtct      2820
     gggcggggtc atgggcgaag gccgactgct gcgcctggag gcggcggagg ccgaactgca      2880
     ggtagccttc gaccggga                                                    2898
//


  
spacer
spacer