spacer
spacer

EBI Dbfetch

ID   AL513383; SV 1; circular; genomic DNA; STD; PRO; 218160 BP.
XX
AC   AL513383;
XX
PR   Project:236;
XX
DT   26-OCT-2001 (Rel. 69, Created)
DT   13-MAY-2009 (Rel. 100, Last updated, Version 7)
XX
DE   Salmonella enterica subsp. enterica serovar Typhi str. CT18 plasmid pHCM1
XX
KW   .
XX
OS   Salmonella enterica subsp. enterica serovar Typhi str. CT18
OC   Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacteriales;
OC   Enterobacteriaceae; Salmonella;
OC   Salmonella enterica subsp. enterica serovar Typhi.
OG   Plasmid pHCM1
XX
RN   [1]
RP   1-218160
RX   DOI; 10.1038/35101607
RX   PUBMED; 11677608.
RA   Parkhill J., Dougan G., James K.D., Thomson N.R., Pickard D., Wain J.,
RA   Churcher C., Mungall K.L., Bentley S.D., Holden M.T.G., Sebaihia M.,
RA   Baker S., Basham D., Brooks K., Chillingworth T., Connerton P., Cronin A.,
RA   Davis P., Davies R.M., Dowd L., White N., Farrar J., Feltwell T.,
RA   Hamlin N., Haque A., Hien T.T., Holroyd S., Jagels K., Krogh A.,
RA   Larsen T.S., Leather S., Moule S., O'Gaora P., Parry C., Quail M.,
RA   Rutherford K., Simmonds M., Skelton J., Stevens K., Whitehead S.,
RA   Barrell B.G.;
RT   "Complete genome sequence of a multiple drug resistant Salmonella enterica
RT   serovar Typhi CT18";
RL   Nature 413(6858):848-852(2001).
XX
RN   [2]
RP   1-218160
RA   Parkhill J.;
RT   ;
RL   Submitted (25-OCT-2001) to the EMBL/GenBank/DDBJ databases.
RL   Submitted on behalf of the Salmonalla sequencing team, Sanger Centre,
RL   Wellcome Trust Genome Campus, Hinxton, Cambridge CB10 1SA E-mail:
RL   parkhill@sanger.ac.uk
XX
DR   GR; AL513383_GR.
DR   RFAM; RF00240; RNA-OUT.
DR   Sample; ERS000058.
XX
CC   Notes:
CC   Details of S. typhi sequencing at the Sanger Centre
CC   are available on the World Wide Web.
CC   (URL, http://www.sanger.ac.uk/Projects/S_typhi/)
XX
FH   Key             Location/Qualifiers
FH
FT   source          1..218160
FT                   /organism="Salmonella enterica subsp. enterica serovar
FT                   Typhi str. CT18"
FT                   /plasmid="pHCM1"
FT                   /strain="CT18"
FT                   /mol_type="genomic DNA"
FT                   /db_xref="taxon:220341"
FT   CDS             complement(join(218131..218160,1..528))
FT                   /transl_table=11
FT                   /gene="HCM1.01c"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.01c, possible membrane protein, len: 185 aa;
FT                   unknown function, contains hydrophobic, possible
FT                   membrane-spanning regions. Spans sequence end"
FT                   /db_xref="UniProtKB/TrEMBL:Q935S6"
FT                   /protein_id="CAD09619.2"
FT                   /translation="MNQTETGPSGFTETTVDEERIAIRVMIGDVVGRYRKQVPPDRVQK
FT                   ATFEVNGGLLMALLLALLMLVCIIQRLATGDRLMSFTGEPDVRDIQFTLMLVIEFALGM
FT                   VVWFLIATGEFSRPWLYRLTPAKPVWLFDEVEDADLVLLSGNPFIKRWLHKEILKIRRL
FT                   TYTRLDEELEKIAPLPGQPPAQ"
FT   RBS             complement(536..540)
FT                   /note="possible RBS"
FT   CDS             complement(742..1053)
FT                   /transl_table=11
FT                   /gene="HCM1.02c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.02c, hypothetical protein, len: 103 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935S5"
FT                   /protein_id="CAD09620.1"
FT                   /translation="MMYPDITGVKMKLSQLEVGMTVWSLSRTKMGNTTIKTVTLHSVVI
FT                   KEVHDNHVIASWNGNAPRRFGETAITGWKKEKPLLIRDRSGSARLATREEKARILDTK"
FT   CDS             complement(1367..1690)
FT                   /transl_table=11
FT                   /gene="HCM1.03c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.03c, hypothetical protein, len: 107 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5P4"
FT                   /protein_id="CAD09621.1"
FT                   /translation="MNKPLVSFAELSGNAINVARQSVIDMEMDATREKIGKARSLFHSG
FT                   IHRAVNGYPLIQSAANQLAVIKRLLGDTKYLDACITENLCMFSPEGYLYLFMQRRFINE
FT                   PVA"
FT   RBS             complement(1697..1702)
FT                   /note="possible RBS"
FT   repeat_region   1871..1883
FT                   /note="13 bp inverted repeat flanking IS1"
FT   repeat_region   complement(1871..2585)
FT                   /note="IS1"
FT   CDS             complement(1876..2346)
FT                   /transl_table=11
FT                   /gene="insB"
FT                   /gene_synonym="HCM1.04c"
FT                   /product="putative IS1 transposase"
FT                   /note="HCM1.04c, insB, possible IS1 transposase, len: 156
FT                   aa; highly similar to many from Enterobacteriaceae e.g.
FT                   SW:ISB_ECOLI (EMBL:D10483), insB, Escherichia coli
FT                   insertion element IS1 protein InsB (167 aa), fasta scores;
FT                   E(): 0, 91.6% identity in 167 aa overlap"
FT                   /db_xref="GOA:Q935S4"
FT                   /db_xref="InterPro:IPR005063"
FT                   /db_xref="UniProtKB/TrEMBL:Q935S4"
FT                   /protein_id="CAD09622.1"
FT                   /translation="MPGNRPHYGRWPQHDFTSFKKLRPQSVTSRIQPGSDVIVCAKSRQ
FT                   RWLFYAYDRLRKTVVAHVFGERTMATLGRLMSLLSPFDVVIWMTDGWPLYESRLKGKLH
FT                   VISKRYTQRIERHNLNLRQHLARLGRKSLSFSKSVELHDKVIGHYLNIKHYQ"
FT   CDS             complement(2265..2540)
FT                   /transl_table=11
FT                   /gene="insA"
FT                   /gene_synonym="HCM1.05c"
FT                   /product="putative IS1 transposase"
FT                   /note="HCM1.05c, insA, probable IS1 transposase, len: 91
FT                   aa; highly similar to many from Enterobacteriaceae e.g.
FT                   SW:ISA1_ECOLI (EMBL:X52534), insA, Escherichia coli
FT                   insertion element IS1 protein InsA (91 aa), fasta scores;
FT                   E(): 0, 98.9% identity in 91 aa overlap. Contains PS00017
FT                   ATP/GTP-binding site motif A (P-loop). Contains probable
FT                   helix-turn-helix motif at aa 67-88"
FT                   /db_xref="GOA:P0ADH1"
FT                   /db_xref="InterPro:IPR003220"
FT                   /db_xref="UniProtKB/Swiss-Prot:P0ADH1"
FT                   /protein_id="CAD09623.1"
FT                   /translation="MASVSISCPSCSATDGVVRNGKSTAGHQRYLCSHCRKTWQLQFTY
FT                   TASQPGTHQKIIDMAMNGVGCRATARIMGVGLNTILRHLKNSGRSR"
FT   misc_feature    complement(2284..2289)
FT                   /note="possible translational frameshift site, similar to
FT                   that determined experimentally (EMBL:X52534)"
FT   misc_feature    complement(2472..2495)
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   repeat_region   complement(2573..2585)
FT                   /note="13 bp inverted repeat flanking IS1"
FT   CDS             complement(2694..3644)
FT                   /transl_table=11
FT                   /gene="corA"
FT                   /gene_synonym="HCM1.07c"
FT                   /product="putative magnesium and cobalt transport protein"
FT                   /note="HCM1.07c, corA, probable magnesium and cobalt
FT                   transport protein, len: 316 aa; similar to many e.g.
FT                   SW:CORA_ECOLI (EMBL:L11042), corA, Escherichia coli
FT                   magnesium and cobalt transport protein (316 aa), fasta
FT                   scores; E(): 0, 99.1% identity in 316 aa overlap. Contains
FT                   Pfam match to entry PF01544 CorA, CorA-like Mg2+
FT                   transporter protein. Contains hydrophobic, possible
FT                   membrane-spanning regions"
FT                   /db_xref="GOA:Q9L5P6"
FT                   /db_xref="InterPro:IPR002523"
FT                   /db_xref="InterPro:IPR004488"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5P6"
FT                   /protein_id="CAD09624.1"
FT                   /translation="MLSAFQLENNRLTRLEVEESQPLVNAVWIDLVEPDDDERLRLQSE
FT                   LGQSLATRPELEDIEASARFFEDDDGLHIHSFFFFEDAEDHAGNSTVAFTIRDGRLFTL
FT                   RERELPAFRLYRMRARSQSMVDGNAYELLLDLFETKIEQLADEIENIYSDLEQLSRVIM
FT                   EGHQGDEYDEALSTLAELEDIGWKVRLCLMDTQRALNFLVRKARLPGGQLEQAREILRD
FT                   IESLLPHNESLFQKVNFLMQAAMGFINIEQNRIIKIFSVVSVVFLPPTLVASSYGMNFE
FT                   FMPELKWRFGYPAAIIFMILAGLAPYLYFKRKNWL"
FT   misc_feature    complement(2697..3584)
FT                   /note="Pfam match to entry PF01544 CorA, CorA-like Mg2+
FT                   transporter protein, score 432.90, E-value 2.8e-126"
FT   RBS             complement(3653..3656)
FT                   /note="possible RBS"
FT   RBS             4004..4007
FT                   /note="possible RBS"
FT   CDS             4014..4343
FT                   /transl_table=11
FT                   /gene="HCM1.08"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.08, hypothetical protein, len: 109 aa; similar
FT                   to the N-terminal half of SW:YIGE_ECOLI (EMBL:L02122),
FT                   yigE, Escherichia coli hypothetical protein (254 aa), fasta
FT                   scores; E(): 0, 97.9% identity in 95 aa overlap"
FT                   /db_xref="InterPro:IPR018711"
FT                   /db_xref="UniProtKB/TrEMBL:Q935S3"
FT                   /protein_id="CAD09625.1"
FT                   /translation="MAHQLLIGKGMITLNLKRIFLALTLLPLFAVAADDCALSDPTLTV
FT                   QAYTVNPQTERVKMYWQKANGEAWGTLHALLADINSQGQVQMAMNGGILNLTVFDIKYR
FT                   KKEVF"
FT   CDS             complement(4363..4569)
FT                   /transl_table=11
FT                   /gene="HCM1.10c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.10c, hypothetical protein, len: 68 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5P8"
FT                   /protein_id="CAD09626.1"
FT                   /translation="MGHVDYTRTLRVQLYDASRFHDGATAEQAGELHTVAFSKPAIADD
FT                   IQKIVDTTAEVLGKRYSVNVFSN"
FT   RBS             complement(4577..4581)
FT                   /note="possible RBS"
FT   CDS             complement(4604..4828)
FT                   /transl_table=11
FT                   /gene="HCM1.13c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.13c, hypothetical protein, len: 74 aa; unknown
FT                   function. Similar to HCM1.30c, hypothetical protein (74
FT                   aa), fasta scores; E(): 8.7e-18, 57.1% identity in 63 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5P9"
FT                   /protein_id="CAD09627.1"
FT                   /translation="MHNLEISTIAIFSAQYKNIEEAENAGALYSVDIEYPMTLNDLSLL
FT                   CESVAKAVGVPNGVKYQFVTQPQPEESDY"
FT   RBS             complement(4836..4840)
FT                   /note="possible RBS"
FT   CDS             complement(4882..5088)
FT                   /transl_table=11
FT                   /gene="HCM1.15c"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.15c, putative membrane protein, len: 68 aa;
FT                   unknown function. Contains hydrophobic, possible
FT                   membrane-spanning regions"
FT                   /db_xref="UniProtKB/TrEMBL:Q935S2"
FT                   /protein_id="CAD09628.1"
FT                   /translation="MKLFYSKPVRFIVIICVFLLGVDNLSDMFVDISRPVFYGGLAALL
FT                   AAAVVIARVDYNKNAEKKASQVH"
FT   RBS             complement(5098..5102)
FT                   /note="possible RBS"
FT   CDS             complement(5484..5744)
FT                   /transl_table=11
FT                   /gene="HCM1.17c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.17c, hypothetical protein, len: 86 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5Q1"
FT                   /protein_id="CAD09629.1"
FT                   /translation="MVIDAENSEMHQVRDFIAANWSLFTSHIREKSMTDEQAEEEAQRI
FT                   FVVVGGGRVKAFASLRDSARCWICTLFSGLSANLSAGQPSL"
FT   RBS             complement(5753..5756)
FT                   /note="possible RBS"
FT   CDS             complement(5833..6324)
FT                   /transl_table=11
FT                   /gene="HCM1.20c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.20c, hypothetical protein, len: 163 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935S1"
FT                   /protein_id="CAD09630.1"
FT                   /translation="MTTLTFEIAGVKKLLEELRSAERFNATIEQLFEPSNYPGGTPLNE
FT                   EGKTEVEMNQTGGIFWPSSKHIDPARLTPQILLVKDHGVYLITNASLDGTPVSRDTVVY
FT                   ARGMNPSVDDEWYDEAEEALGGDDSSVSIPVAWFELALKKKFNAFSIKVSPTKITLVNG
FT                   "
FT   CDS             complement(6329..6637)
FT                   /transl_table=11
FT                   /gene="HCM1.21c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.21c, hypothetical protein, len: 102 aa; shares
FT                   a region of similarity with TR:Q9X5P0 (EMBL:AF127177)
FT                   Escherichia coli hypothetical protein (208 aa), fasta
FT                   scores; E(): 0.00012, 34.9% identity in 83 aa overlap and
FT                   TR:O85616 (EMBL:AF071034), L0009, Escherichia coli O157:H7
FT                   hypothetical protein from a pathogenicity island (65 aa),
FT                   fasta scores; E(): 0.00047, 43.1% identity in 58 aa
FT                   overlap"
FT                   /db_xref="InterPro:IPR009301"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5Q3"
FT                   /protein_id="CAD09631.1"
FT                   /translation="MQINKVMSLLDILTSWLEDNINMESDLFFDNDVDNTTSESLYPAV
FT                   EKANAVLSKLASLSSETIQATRQRLQDAVEGKGEVSTADVKELLLATRYLMLTTDGE"
FT   RBS             complement(6334..6337)
FT                   /note="possible RBS"
FT   CDS             complement(6845..7225)
FT                   /transl_table=11
FT                   /gene="HCM1.22c"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.22c, possible membrane protein, len: 126 aa;
FT                   unknown function, contains hydrophobic, possible
FT                   membrane-spanning regions. Contains PS00044 Bacterial
FT                   regulatory proteins, lysR family signature"
FT                   /db_xref="UniProtKB/TrEMBL:Q935S0"
FT                   /protein_id="CAD09632.1"
FT                   /translation="MKFILMFFILAILIWGFTGLTFKDAILFTSVGLSISVVALSALLV
FT                   VALTFVMAAMYAAHELGSLGKMIISQVVLVGFWNLIFSVIPDGKLISFFGVNVWQSGSY
FT                   LVYFMTVLVAVFAAYIALQKQR"
FT   misc_feature    complement(7088..7180)
FT                   /note="PS00044 Bacterial regulatory proteins, lysR family
FT                   signature"
FT   CDS             complement(7312..7596)
FT                   /transl_table=11
FT                   /gene="HCM1.23c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.23c, hypothetical protein, len: 94 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935R9"
FT                   /protein_id="CAD09633.1"
FT                   /translation="MVPFCHKLEEKLMTSNRCREIKTPPEHIIADYILRFMKNNKEAKL
FT                   YEAMSRLESKINLFVADGHDELHIRALLNQAAHSHTKESLKQACERICN"
FT   CDS             complement(7598..7918)
FT                   /transl_table=11
FT                   /gene="HCM1.24c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.24c, hypothetical protein, len: 106 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935R8"
FT                   /protein_id="CAD09634.1"
FT                   /translation="MIPFFILKDISLVTRFSIINLNPIHSITCKDMNMDKYLALDRALN
FT                   EILTPVPTPFSTLFAGEIKAECHRIAAGESNPQPSHILDRRLLALCKAGQINYTTGKGW
FT                   LK"
FT   CDS             complement(7995..8348)
FT                   /transl_table=11
FT                   /gene="HCM1.25c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.25c, hypothetical protein, len: 117 aa; unknown
FT                   function. Contains PS00044 Bacterial regulatory proteins,
FT                   lysR family signature"
FT                   /db_xref="UniProtKB/TrEMBL:Q935R7"
FT                   /protein_id="CAD09635.1"
FT                   /translation="MSLLRLTDISMDIYDMTEKEVRMDEDKVLSFINSGDGDAGDLLDD
FT                   AMPTAARRFYRLTQSMHTLLGEVREHFPDAMFYSANGKVSLLLGSSHNKHDQPMQEMVA
FT                   VSATQLHIEGGDW"
FT   misc_feature    complement(8121..8213)
FT                   /note="PS00044 Bacterial regulatory proteins, lysR family
FT                   signature"
FT   CDS             complement(8364..8972)
FT                   /transl_table=11
FT                   /gene="HCM1.26c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.26c, hypothetical protein, len: 202 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935R6"
FT                   /protein_id="CAD09636.1"
FT                   /translation="MFLHLVPKILHPMGNLCTLDSVSVPELSLRLTGNDLVAMRPYPNK
FT                   QYLVGMLKGRRALNGFLVKSPRAFEEFTMVSVWNIEGFGKITHTLKTFVEDTDYDLVSH
FT                   DVLLAQGSYRAQASEQCRVHPVYKNIAPVHIEPKMESLLSTEPNFENDVCETHSWGMLV
FT                   RSRDEGFKAMTMPSARLQESVALRGDRQPQLEQAIVITG"
FT   RBS             complement(8980..8984)
FT                   /note="possible RBS"
FT   CDS             complement(9003..9527)
FT                   /transl_table=11
FT                   /gene="HCM1.27c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.27c, hypothetical protein, len: 174 aa; unknown
FT                   function"
FT                   /db_xref="GOA:Q935R5"
FT                   /db_xref="InterPro:IPR002711"
FT                   /db_xref="InterPro:IPR003615"
FT                   /db_xref="UniProtKB/TrEMBL:Q935R5"
FT                   /protein_id="CAD09637.1"
FT                   /translation="MKVLNNKGAVIELPNFSELLPKVESDDGRFSKPKNKISKEQRAEL
FT                   RLKFGGRCAYCGCPLPEKGWHADHVEPVRRDFEMVRAPAGSRVTHRARSTGKVMHPELH
FT                   AIENLFPACAPCNLFKGALSVEGMRKEISRQVERARAYSVNFRTAERFGLIEVTEKPVV
FT                   FWFEIHQATAQ"
FT   CDS             complement(9558..9869)
FT                   /transl_table=11
FT                   /gene="HCM1.28c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.28c, hypothetical protein, len: 103 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935R4"
FT                   /protein_id="CAD09638.1"
FT                   /translation="MNNEMSSLGTQKAEGPFVLLTLVGEGFIFDERHEIVRINGRPKQI
FT                   GVKRNYFESDLGEGKAKYWTLDINEAHVFPTLDAATEQLCKLSRPHLIKIRKLIQENK"
FT   CDS             complement(9866..10597)
FT                   /transl_table=11
FT                   /gene="HCM1.29c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.29c, hypothetical protein, len: 243 aa; shows
FT                   weak similarity to TR:O03965 (EMBL:U64984) Myxococcus
FT                   xanthus bacteriophage Mx8 hypothetical protein (222 aa),
FT                   fasta scores; E(): 2.6e-06, 36.4% identity in 242 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q935R3"
FT                   /protein_id="CAD09639.1"
FT                   /translation="MCEPCVKGVSTVKTRGMLFNDEMVRAILADQKTQTRRIIKPQYSS
FT                   DEWSIRPAQTPRHRGHTHDWWLPTGTQPYSALRPCPYGVVGDRITVREAFSLLGNEDAC
FT                   AVDWNDNIVMDRTEAARIYRASCEQRSGDYGLWSIPDEADWKPRTENMKFEGAWTPSIH
FT                   MPRWASRIALEITDLRVERLNTISEEDAKAEGAPTECCVLGDKHFLGFRSLWKNTYGED
FT                   SWQANPWVWVVNFKRITGEVV"
FT   RBS             complement(9873..9878)
FT                   /note="possible RBS"
FT   CDS             complement(10705..10929)
FT                   /transl_table=11
FT                   /gene="HCM1.30c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.30c, hypothetical protein, len: 74 aa; unknown
FT                   function. Similar to HCM1.13c, hypothetical protein (74
FT                   aa), fasta scores; E(): 1.3e-16, 57.1% identity in 63 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5Q9"
FT                   /protein_id="CAD09640.1"
FT                   /translation="MPIQEKTTVFVFNACHADKAAAASANALHSLEVEYPMTLNDLSLL
FT                   CESVAKALDVPGGVKYEITTEPVVDGEYD"
FT   RBS             complement(10938..10941)
FT                   /note="possible RBS"
FT   CDS             complement(11016..11480)
FT                   /transl_table=11
FT                   /gene="HCM1.31c"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.31c, possible membrane protein, len: 154 aa;
FT                   unknown function, contains hydrophobic, possible
FT                   membrane-spanning regions"
FT                   /db_xref="UniProtKB/TrEMBL:Q935R2"
FT                   /protein_id="CAD09641.1"
FT                   /translation="MTDIKEKQNHFSKLKCIAISWHFNKPTGKEHLLLFVAIVAWIFPG
FT                   LVFFKHSLWGGLLFFFFVAGSYAFLAFPHFTHRKKIWKERLDQSLKEYQPLDLQAWAYF
FT                   KDRVREEGMTYKACESWMSTEASALYKSPKQEWSFLDSTSVGENDKSQPD"
FT   RBS             complement(11488..11493)
FT                   /note="possible RBS"
FT   CDS             complement(11663..14092)
FT                   /transl_table=11
FT                   /gene="HCM1.32c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.32c, hypothetical protein, len: 809 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935R1"
FT                   /protein_id="CAD09642.1"
FT                   /translation="MDLINIATIQRKPNSGNNMYIEMKETFLELPSEIQFSEAANAAIL
FT                   TQDKWGDVWQTLKTDADLNYTDAGEPVSLASRVTTATSAIYHAITEGWTMCVGYSGGKD
FT                   SHSLLHLFLMALIRAVRNGSNVSQHHFIQMSDTLIENPEMHHQATQVLSQLRAFIAEQE
FT                   LPLTVLVARPSMTQSWVGRILTGRGLPTWTNSSTRQCATDLKRSPLRQAKARYLKNAPA
FT                   SVRNKVCLMLGSRDDESARRADNILRMGGQADSVSLTEHGGELYPVKEWRAQDIWSFLM
FT                   ACGSLARFPLPSFLPDNFSLATLYKDATGECIWTPEKSTVRSSACGARYGCSLCCAVGI
FT                   DHSMETLLRTDPEKYGYQAGLNRLQRFLTKIQYDWSLRDYIGRKVFEGGYVRLQPNVFS
FT                   SSLTERLFHICCSLDYVEAQRAAAVHEKLLSGEIEDTAHNRRMSEPQFRLVQEANVLHI
FT                   DFLWSLHCFNPRPFRAIELYRQVWEGGALDLLDDEPAMQPVPRTPMPAPRWMKLPEGRI
FT                   GTSFDGLSDPSSEIAYFDGREDERASRSLMSSGEGLNIVAFEEEDELTVDEDTASWIIW
FT                   HEYDGLRQRVSDGEFTPVAAAQYLLRYGAVRISRGKGAVYHRLAQRGQAYSRLGINDQT
FT                   PLPSLLASRRFKILTDSDYRLLVARKLRGQRQKLRFWCCVAACVALHTYNKTPLGGWIT
FT                   TQLETEQQLHLARTGDELKARTLDAVLTLCNLRISSQQPEERLYYRAVRKRFLETLAGC
FT                   ISPEREGTLREVIWELRMLSGPQSSKKTGFRHVDECRERTAALLRPLLKRMVRLLA"
FT   CDS             complement(14215..14727)
FT                   /transl_table=11
FT                   /gene="HCM1.33c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.33c, hypothetical protein, len: 170 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935R0"
FT                   /protein_id="CAD09643.1"
FT                   /translation="MPRDCLIIPDCHRNSRWHGELKMTNKILILSASCINEFASDVPQS
FT                   VFFSIDTSLAKRIRELAAYVKENDLYAAEFFFYDCHWSETLEEDIEVLMSQAAFIESDS
FT                   SGQETMLRDVMPSCRTETTSIRVMKESFHLTAVPRHCGDDMMLNTPLIPLAELESNATV
FT                   LITQQYS"
FT   CDS             complement(14709..15515)
FT                   /transl_table=11
FT                   /gene="HCM1.34c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.34c, hypothetical protein, len: 268 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935Q9"
FT                   /protein_id="CAD09644.1"
FT                   /translation="MANNYTQASFTILCSQEQAQMALDAIAYVTDTDVAEGEHLLSKPV
FT                   SECSLTELLVLGIIQNHPECDPFEPTFGQSESPENNYELELKAEITGKGLAICHDESIN
FT                   LDHAIAVTTAVLSVFNLPEMVTINAAFVCDRPRENEFGGATIVVTKDTHHYEEGFNFSR
FT                   LMNEAHDAGVQYALVKVNQYNHEYTYTQCYLMSCKKSESAYDVARHRLASDESTPDNPG
FT                   EDGVIILSEEDNTSMALHSVTELMPVVYESLSKLLPSLDELCPVTA"
FT   RBS             complement(15523..15529)
FT                   /note="possible RBS"
FT   CDS             complement(15743..15934)
FT                   /transl_table=11
FT                   /gene="HCM1.35c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.35c, hypothetical protein, len: 63 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935Q8"
FT                   /protein_id="CAD09645.1"
FT                   /translation="MMFDDEEEVMLVEADSCGEAEAAFQQHIDEGVAHLDQVLVISSAS
FT                   LQSLLPDRLIASSLTHTV"
FT   CDS             complement(16063..16395)
FT                   /transl_table=11
FT                   /gene="HCM1.36c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.36c, hypothetical protein, len: 110 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5R5"
FT                   /protein_id="CAD09646.1"
FT                   /translation="MESEQLITKITQTLKRPDGSEVRIVVEQAFGSGLTPSLGVYVLRR
FT                   PTTANNWQLCKTAPHKDWRTMSVDEYQKHGRSEMLRYVSIGEILRLSAAIGKPMSYVDT
FT                   CPGLQG"
FT   CDS             complement(16895..18076)
FT                   /transl_table=11
FT                   /gene="HCM1.38c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.38c, hypothetical protein, len: 393 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935Q7"
FT                   /protein_id="CAD09647.1"
FT                   /translation="MKLFGISSRDSGMDAMFYIQASTKQQASFIFDFLATRLYAHCQLI
FT                   EPLNETIIPSLSRTTLSLQPWSQNSQTRTSEMQMVTHGLTLSGAVMVEHSRQIVDFCDN
FT                   LGLRLDAPTGKPGWTELINADCEQLNSPRLYPVLIQPGTEGQFQIYVPAPAVIDADTVI
FT                   ASVIDECFSDVTSYCLAGTPFPMTEKPVIRMEAHLSDAHTRVFELTFISYNLALSATVY
FT                   DKNLRQVLMLCEDFGVTLQGRAGASCHAYMRNEYRRLAHVGVYSRSGAENDVRAYSSDK
FT                   EETLIRQLMTQATAGSALIPARHGKQFNGVLMNANPSSATTGFIYLSPEFPQGQFMMTA
FT                   EVVKSSCTPRGISYIETVDGYRFIVTAYDTKAMHSLTEFLAVNEDYFTPYRWE"
FT   CDS             complement(18085..18381)
FT                   /transl_table=11
FT                   /gene="HCM1.39c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.39c, hypothetical protein, len: 98 aa; unknown
FT                   function"
FT                   /db_xref="InterPro:IPR007711"
FT                   /db_xref="UniProtKB/TrEMBL:Q935Q6"
FT                   /protein_id="CAD09648.1"
FT                   /translation="MIHSFKDRRLEKFFRNGKSTAGIPAELINAISCRLETLNNVKNER
FT                   ELLSGSLRYERLRMTANRYSSIRVNSKYRLFFEWNDGVHNVHLSAHDYKSLIH"
FT   RBS             complement(18387..18391)
FT                   /note="possible RBS"
FT   CDS             complement(18445..18912)
FT                   /transl_table=11
FT                   /gene="HCM1.40c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.40c, hypothetical protein, len: 155 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5R8"
FT                   /protein_id="CAD09649.1"
FT                   /translation="MDKYFDRSGMAIDNAKIKCIDSVKGTGEYIYRVTCNKCNGRGERN
FT                   HFYKSRCIACNATGYSLVTTRTCYTLTALYRIYPEAARKISAAQAAERQRAVQSKTSAF
FT                   NLWCQNHQELVDAITQQDGENSFLNSLKSTLSRKFPLSDKQLTVAARILGM"
FT   RBS             complement(18920..18924)
FT                   /note="possible RBS"
FT   repeat_region   18961..18997
FT                   /note="inverted repeat; 34/36 (94%) matches, 1 gaps"
FT   CDS             19211..19537
FT                   /transl_table=11
FT                   /gene="HCM1.41"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.41, hypothetical protein, len: 108 aa;
FT                   improbable CDS"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5R9"
FT                   /protein_id="CAD09650.1"
FT                   /translation="MPVRHLNDALLPVAETVHMADMYNTHGLTQFRGVAQRRDAALIWK
FT                   TQASTGASGSRHSQAETPEPVRLPAVSLVPVYKTRLIRRYRWRTPRRLEAFGNCLGQRT
FT                   PAFR"
FT   RBS             19759..19763
FT                   /note="possible RBS"
FT   CDS             19772..20548
FT                   /transl_table=11
FT                   /gene="HCM1.42"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.42, hypothetical protein, len: 258 aa; unknown
FT                   function. Similar to HCM1.43, hypothetical protein (258
FT                   aa), fasta scores; E(): 1.7e-27, 32.8% identity in 262 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5S0"
FT                   /protein_id="CAD09651.1"
FT                   /translation="MPKYLLPAELAEIVCGLLVQPALLNELKTPATHKAFMQDIGELVA
FT                   KHCGGQIDGVIMPEVRDEDSQADYLTSPDETPYIVVSPGQDMHSLTDNVWRHHARDGWL
FT                   DHIKGSVEESPDELPTHKECAVRRYTLQRLLLQEETSHANLPVQVVRMCEYSTDDVEQT
FT                   DSSAEFNVTMALGGHAMLAVKDTDSRLVMALTLLIENGVPSVHVNAGDTDPSVLHIRAA
FT                   HGGLVLSTDSLNHDFSISPSDQYTYGRPGLLLKAAY"
FT   repeat_region   complement(20616..20651)
FT                   /note="inverted repeat; 34/36 (94%) matches, 1 gaps"
FT   CDS             20698..21474
FT                   /transl_table=11
FT                   /gene="HCM1.43"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.43, hypothetical protein, len: 258 aa; unknown
FT                   function. Similar to HCM1.43, hypothetical protein (258
FT                   aa), fasta scores; E(): 2.7e-29, 32.8% identity in 262 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q935Q5"
FT                   /protein_id="CAD09652.1"
FT                   /translation="MAKLISTRELATIITALLVKPELLGELDSPEKHRALMEDLGRVVA
FT                   EHCGGNVTEIALPETDGTAAEGALQNGQPVRYLETKESSPYLIVHPDASLPSVTQNVWM
FT                   HADHDGWEEHFNGETDALTPEMSEQFRQQVYALLTPESHTTSSEMRLTLQDWQLGEAEI
FT                   PEEDCQPYQVKVLAENKNVQCEVTNETGTTCFGLILEIDRGVPTLHIDTGSDSLLHIHA
FT                   AHDGLVLTPDAPSHRFEDAPVDRFSYNSPSLLVPGV"
FT   RBS             21526..21530
FT                   /note="possible RBS"
FT   CDS             21539..21661
FT                   /transl_table=11
FT                   /gene="HCM1.43a"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.43a, hypothetical protein, len: 40 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935Q4"
FT                   /protein_id="CAD09653.1"
FT                   /translation="MGDVATLPPKINDGVLRRWNARGKADKEALADYGVSVKEE"
FT   RBS             21650..21656
FT                   /note="possible RBS"
FT   CDS             21663..22004
FT                   /transl_table=11
FT                   /gene="HCM1.44"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.44, hypothetical protein, len: 113 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5S2"
FT                   /protein_id="CAD09654.1"
FT                   /translation="MRELLGMAGAEHQASVMYQTFGHLDAKLGEKHKGHFVFINGQHGD
FT                   LCVVHSEFSSFDEGPGYFSDRADFIWELVKNDGPCSKVGIYRFDGEYALPKRRNGRRFS
FT                   GSVTCLQAF"
FT   CDS             22009..22368
FT                   /transl_table=11
FT                   /gene="HCM1.45"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.45, hypothetical protein, len: 119 aa; unknown
FT                   function. Contains PS00017 ATP/GTP-binding site motif A
FT                   (P-loop)"
FT                   /db_xref="UniProtKB/TrEMBL:Q935Q3"
FT                   /protein_id="CAD09655.1"
FT                   /translation="MLHERRQVFRTTGGGTVRVQPSPHNNSTEYIIMTNANANDGKTSP
FT                   VLPTLEQVYALLKANYKPARFADRDGEIWGHEYSWNLARSSLQDLEKYGKSYVSKHSDR
FT                   MGDGFSFGPDLVIIR"
FT   misc_feature    22114..22137
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   CDS             22596..23300
FT                   /transl_table=11
FT                   /gene="HCM1.46"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.46, hypothetical protein, len: 234 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935Q2"
FT                   /protein_id="CAD09656.1"
FT                   /translation="MTMKNTVIPTVTENEMGEVITRHSAYGLVSVSRTSTTGQRLYASD
FT                   LSHKEVVTMTFSESEQIERDGVIRHRLAEGRRRSPLLQVSLSPAQWATMITSFGMSDGV
FT                   PCTINSLIRGDYERQPEIGYIESTRERYERQIREAAEREMAKLHEKLEVLRLLAVKGKA
FT                   GKRELDEAYQSLLSVINNLPVNLAFTNQLIQESMVNIVSHGKAELEATAMGVAARLGMK
FT                   EMSSLASLEEKK"
FT   CDS             complement(23333..23752)
FT                   /transl_table=11
FT                   /gene="HCM1.48c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.48c, hypothetical protein, len: 139 aa; unknown
FT                   function. Contains g{8} repeat"
FT                   /db_xref="UniProtKB/TrEMBL:Q935Q1"
FT                   /protein_id="CAD09657.1"
FT                   /translation="MSELAEKPLITRVAPLERIYYCASRAEGLKPDRHEIRMQSQFLLL
FT                   GVIWLPPALAMAELERLLKGYDADHSRLLENVLETAHQQFLKFCEPQKREGGGVENHVE
FT                   CPRQDDALQCLRFMSTRYALAVDLCAAYVCSRYGR"
FT   repeat_region   complement(23460..23467)
FT                   /note="(g)8"
FT   CDS             complement(23840..26224)
FT                   /transl_table=11
FT                   /gene="HCM1.49c"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.49c, possible periplasmic protein, len: 794 aa;
FT                   unknown function, contains probable N-terminal signal
FT                   sequence and PS00017 ATP/GTP-binding site motif A (P-loop).
FT                   Similar to HCM1.56c, possible periplasmic protein (818 aa),
FT                   fasta scores; E(): 0, 35.4% identity in 831 aa overlap.
FT                   Also similar in parts to HCM1.50, HCM1.51, HCM1.52 and
FT                   HCM1.53 (in that order), suggesting that together they
FT                   represent a pseudogene"
FT                   /db_xref="UniProtKB/TrEMBL:Q7WZD9"
FT                   /protein_id="CAD09658.1"
FT                   /translation="MKFCRRPLIVAVYTALLFPLYSQAQLYNYSYTDTRGTKVNAEPTR
FT                   EYLNPGSAITLNLISGLDRYERVTVTRSSDNVQMFQSVTGLVTVADRITAADGSEYYGK
FT                   SMTLPVLGEGTFSLKSETLDNKSNVVATTSYSFSIDITPPVLPDPMQWIRAGFQYGSLD
FT                   IFGDRTATQAISLSNVSDARSGLDKAEWFAIDSSGVRRTVNAQLNALTGVVQALAAVAA
FT                   GSTVAPVSPAYYTVGFRVYDKAGNWTETSHRSGIDRTIPSYIQHQVRNAKTGVWEDYVP
FT                   GMTIFENPVKFRYKRLKSDSTNFNGTDFGWVDQITNSDNTYFYTEATVSYPETYMYYEL
FT                   HTKAGLNVNLQYKTLKFTPGNGVAEAPRYLSGQYHFRDANTWTSSDIVRFTGPDCVDLG
FT                   RVNVEPRSYVQTATIVGIGSCNVSVGESSCQVSMNYCKTSGKGYVPYQIHIRGTGSYAN
FT                   LGGLQSHFYTYWDMNAPVINSIVSSPLDKTVVMLVTDSDVTNDWTNYMWATNIFNLTLK
FT                   DTSNKVSTLSPKNVTVLNYQLKQVTFDYSALPSGKYTATGAATDTYNNTAELTLSNTIL
FT                   HDVTPPVVDISFEGKQADGALVKGLENLVITLADDMTKASLKSITLSGGPTSDKVSVGW
FT                   YSQGTDKYGLNYPRIFPATDDADSYQLTAVAVDEAGNTTTKVSRFRYVPNNLIEFNTLK
FT                   TLAVGMGLKTSDNQPLAYLRTNSIRKKDGSLITGAQTGTLTVRKDAAFAVSMNGVAVVP
FT                   GDSKDITIDFGQGDGVLIPIFPATSGNVGESSFMIELPQIQ"
FT   misc_feature    complement(25910..25933)
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   RBS             complement(26232..26236)
FT                   /note="possible RBS"
FT   CDS             26475..27077
FT                   /transl_table=11
FT                   /gene="HCM1.50"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.50, possible periplasmic protein, len: 200 aa;
FT                   unknown function, contains probable N-terminal signal
FT                   sequence. Similar to the N-termini of HCM1.49c and
FT                   HCM1.56c. HCM1.51, HCM1.52 and HCM1.53 (in that order) are
FT                   also similar to the corresponding regions of HCM1.49c and
FT                   HCM1.56c, suggesting that together they represent a
FT                   pseudogene"
FT                   /db_xref="UniProtKB/TrEMBL:Q7WZD8"
FT                   /protein_id="CAD09659.1"
FT                   /translation="MKNQAIALAMAMLGVSVPASAQIYESIFTDTNGIEVHAPSTRLLL
FT                   NPASPVTLTLIAGLDRYVNVKITSATGTQLLNTTTTRTSVSDRLKAGDGSEFYGKKVTL
FT                   PVLGEGRSVVQVSILDLNQSVVATYSYNWLVDTTPLSGNALTGNAAYGSTAGSVWKMGL
FT                   EATGQFDFTSTNVTDVNGIEKGMFYVYHSNGSLFSTT"
FT   misc_feature    26475..28076
FT                   /note="extent of possible pseudogene"
FT   CDS             27180..27476
FT                   /transl_table=11
FT                   /gene="HCM1.51"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.51, hypothetical protein, len: 98 aa; unknown
FT                   function. Similar to parts of HCM1.49c and HCM1.56c.
FT                   HCM1.50, HCM1.52 and HCM1.53 (in that order) are also
FT                   similar to the corresponding regions of HCM1.49c and
FT                   HCM1.56c, suggesting that together they represent a
FT                   pseudogene"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5S9"
FT                   /protein_id="CAD09660.1"
FT                   /translation="MTTQETPEPFRCSSFDMITIWAVRDPQSSASVVPGVSGYPAYSAG
FT                   MTVNENPIHLVYRVPKSNYRSYAEGGLLFYNLYSSPTEIATDSTYTYVEMILP"
FT   CDS             27481..27894
FT                   /transl_table=11
FT                   /gene="HCM1.52"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.52, hypothetical protein, len: 137 aa; unknown
FT                   function. Similar to parts of HCM1.49c and HCM1.56c.
FT                   HCM1.50, HCM1.51 and HCM1.53 (in that order) are also
FT                   similar to the corresponding regions of HCM1.49c and
FT                   HCM1.56c, suggesting that together they represent a
FT                   pseudogene"
FT                   /db_xref="UniProtKB/TrEMBL:Q7WZD6"
FT                   /protein_id="CAD09661.1"
FT                   /translation="MVYGLENIRIALADNLTTPRITRLQITGGPTADNVELTWSPAGTN
FT                   VYAPEYPRLFPSFEPSENYALSVTVSDSQSNSKTYTQKFSYLPNNLVQLHNLRTLSVSS
FT                   ALKTSLNEPLAYLSTNVLRKSNGEIAKTSRVRR"
FT   CDS             27936..28076
FT                   /transl_table=11
FT                   /gene="HCM1.53"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.53, hypothetical protein, len: 46 aa; unknown
FT                   function. Similar to parts of HCM1.49c and HCM1.56c.
FT                   HCM1.50, HCM1.51 and HCM1.52 (in that order) are also
FT                   similar to the corresponding regions of HCM1.49c and
FT                   HCM1.56c, suggesting that together they represent a
FT                   pseudogene"
FT                   /db_xref="UniProtKB/TrEMBL:Q7WZD5"
FT                   /protein_id="CAD09662.1"
FT                   /translation="MQAALGESVEVKIDMGLGDNLLVPIYPAENGKVGTSEFMIQIDEL
FT                   K"
FT   repeat_region   complement(28329..28345)
FT                   /note="iteron associated with repA; 83% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   complement(28350..28366)
FT                   /note="iteron associated with repA; 84% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   complement(28371..28387)
FT                   /note="iteron associated with repA; 89% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   complement(28392..28408)
FT                   /note="iteron associated with repA; 100% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   complement(28415..28431)
FT                   /note="iteron associated with repA; 90% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   CDS             28468..29349
FT                   /transl_table=11
FT                   /gene="repA"
FT                   /gene_synonym="HCM1.54"
FT                   /product="replication initiation protein"
FT                   /note="HCM1.54, repA, replication initiation protein, len:
FT                   293 aa; highly similar to many RepHI1B repA proteins e.g.
FT                   TR:Q08088 (EMBL:X68824), repA, Escherichia coli replication
FT                   initiation protein from plasmid pIP522 (293 aa), fasta
FT                   scores; E(): 0, 100.0% identity in 293 aa overlap. Contains
FT                   Pfam match to entry PF01651 RepA, RepA family. Similar to
FT                   HCM1.64, repA2, replication initiation protein (291 aa),
FT                   fasta scores; E(): 7.2e-34, 35.2% identity in 290 aa
FT                   overlap"
FT                   /db_xref="GOA:Q7AQZ8"
FT                   /db_xref="InterPro:IPR000525"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQZ8"
FT                   /protein_id="CAD09663.1"
FT                   /translation="MSSNNNKLSLVIEESLKDSGEVIQLFPTLKQTIQPKVLLRLGVFV
FT                   PTLKSTDKGGRKSHHIDATEPLSRLSIVEGEGYSQIQIYGPRLDMDTDFKSWCGIVYAL
FT                   SNRPLDSEGQLELNFPEFAKFCGFDTKRIDKQLKERFDASLTRIARTNISFIKKIPGTD
FT                   DQITINMHLVESTYYDSSTGKIIIKPNSKLNTLYRVDGKTRLYLKTLQKLARKESAQAL
FT                   YLYLAELPSTFYRIGFDRLRGRLQLSSHLGNQNATVKKALGQLKEIGFLEYSIDKENGD
FT                   YVLNILKRNMKP"
FT   misc_feature    28582..29331
FT                   /note="Pfam match to entry PF01651 RepA, RepA family, score
FT                   603.30, E-value 1.5e-177"
FT   repeat_region   29394..29410
FT                   /note="iteron associated with repA; 96% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   29435..29451
FT                   /note="iteron associated with repA; 91% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   complement(29452..29468)
FT                   /note="iteron associated with repA; 91% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   29556..29572
FT                   /note="iteron associated with repA; 94% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   29591..29607
FT                   /note="iteron associated with repA; 100% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   29662..29678
FT                   /note="iteron associated with repA; 100% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   29729..29745
FT                   /note="iteron associated with repA; 100% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   29796..29812
FT                   /note="iteron associated with repA; 87% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   repeat_region   29851..29867
FT                   /note="iteron associated with repA; 92% identity to
FT                   consensus TACCCGGTATAGTGGAT"
FT   CDS             complement(29935..30432)
FT                   /transl_table=11
FT                   /gene="HCM1.55c"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.55c, possible periplasmic protein, len: 165 aa;
FT                   unknown function, contains a possible N-terminal signal
FT                   sequence"
FT                   /db_xref="UniProtKB/TrEMBL:Q935Q0"
FT                   /protein_id="CAD09664.1"
FT                   /translation="MMKSNAPLIILICLMIAFSAYVKSWSLLYTLLAASVSLTVMISLP
FT                   FIVSPLQHSKFIALRILRLLVITLWTIGLVGVFFSVVERLVWVNADSYPAWLAKELDSP
FT                   AITDGENFIKATESFEKICGKNKGYLSVVTKHNGIFMRCDDSLSFDSWWKGVYRLKTPE
FT                   TR"
FT   CDS             complement(30447..30650)
FT                   /transl_table=11
FT                   /gene="HCM1.55ac"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.55ac, hypothetical protein, len: 67 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935P9"
FT                   /protein_id="CAD09665.1"
FT                   /translation="MIHFAEREARERKAHASSGPIVTLSSVIEAFFGIRFTPVQNDGNF
FT                   SKAADDYKRSLSKLVQNGAPKE"
FT   CDS             complement(31101..33557)
FT                   /transl_table=11
FT                   /gene="HCM1.56c"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.56c, possible periplasmic protein, len: 818 aa;
FT                   unknown function, contains a probable N-terminal signal
FT                   sequence. Similar to HCM1.49c, possible periplasmic protein
FT                   (749 aa), fasta scores; E(): 0, 35.4% identity in 831 aa
FT                   overlap. Also similar in parts to HCM1.50, HCM1.51, HCM1.52
FT                   and HCM1.53 (in that order), suggesting that together they
FT                   represent a pseudogene"
FT                   /db_xref="UniProtKB/TrEMBL:Q7WZD4"
FT                   /protein_id="CAD09666.1"
FT                   /translation="MRKILTGCIIATAIASVYPAAAQIFSYSYTDTNQLAKTLKPATQS
FT                   YLNPASTMTLNLISGLDRYERVSVTRDSDKKVMYSAVTGKISVADRIVAADGTEYYGKD
FT                   LALPALGEGAFTVINDTLDLQQAVVSSSTYHFTIDTTAPKYTSIYPSQNAGYEMVLSGP
FT                   VWGLGRGGSGQFSIFADGVDDANGIDKIRLVIKRGNGTVVSDNTLSYDTAAKRAFYPWI
FT                   KDSVTQPGMPTSDLNEEFTFNFIITDKAGNTLNIPPQRFLFDDQIGEYTPFAVHDSRVS
FT                   TSVVPGISSGYVPFVRGLSVLENPYRMVIRIPRTNWKPYRNGGITILNNYGGAKVISED
FT                   TTYVYVEVKLPQGALDINYYRPVNTYQWSGGDLTQYASWLNWDPASVKSPAWGSPAIER
FT                   QMSDGTWFNSVNWKYFKASDMPVNLTQIRFNVQARPYDQKITGGATCNIPAGSTSCTVA
FT                   LTQAITNGTTGYLHSGYEVRSTTESTFFMPIWENVVWHTLGPSVTGYDYNDTTNILQVY
FT                   INQPGDGSYFDTVKLSRVWLSDKSRNNADINVTGTLTGRNTATGNYTYEFNLKLIPEGS
FT                   YNVQLNAQDSFNNTGSLDYKTVTVDNTPPSISISYETKPITSSVTVYGLENIRIQLADT
FT                   LTKPSLTRMTLRGGPVSDAVELSWVNLGNNLYAPNYPKIFPSLNDGETYTLTVQAKDEM
FT                   NNVKESAVEFSYLPNNLVRLENLKTISVSTALKTSDDTPLAVLYASQLRKKDGSIATGK
FT                   QDAILTVRKDAAFGVTVNGVSAAPGESKNVQLDLGLGDSRSFPIFPSTSGVVGTSEFML
FT                   NIEELK"
FT   RBS             complement(33564..33567)
FT                   /note="possible RBS"
FT   CDS             complement(34003..34179)
FT                   /transl_table=11
FT                   /gene="HCM1.56ac"
FT                   /product="hypothetical protein"
FT                   /note="HCM.56ac, hypothetical protein, len: 58 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5T5"
FT                   /protein_id="CAD09667.1"
FT                   /translation="MSKSSPVLPEDRDDIEFVMDDFQRSLGKSKPVREVQFLGESQQSE
FT                   ESANSADSPWFES"
FT   RBS             complement(34186..34190)
FT                   /note="possible RBS"
FT   CDS             complement(34194..35948)
FT                   /transl_table=11
FT                   /gene="HCM1.57c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.57c, hypothetical protein, len: 584 aa; shares
FT                   a region of similarity with TR:O37396 (EMBL:AF021249),
FT                   M.CviQIII, Chlorella virus NY-2A DNA probable adenine
FT                   methyltransferase (372 aa), fasta scores; E(): 0.15, 29.4%
FT                   identity in 119 aa overlap. C-terminal half similar to
FT                   TR:Q52611 (EMBL:U03474) Proteus vulgaris ORF associated
FT                   with restriction endonuclease PvuRts1 I (290 aa), fasta
FT                   scores; E(): 2.5e-19, 29.1% identity in 292 aa overlap.
FT                   Highly similar to TR:P95799 (EMBL:U60283), traG1, Serratia
FT                   marcescens hypothetical restriction methylase from plasmid
FT                   R478 (563 aa), fasta scores; E(): 0, 70.8% identity in 558
FT                   aa overlap. Contains PS00092 N-6 Adenine-specific DNA
FT                   methylases signature"
FT                   /db_xref="GOA:Q935P8"
FT                   /db_xref="HSSP:2ADM"
FT                   /db_xref="InterPro:IPR002052"
FT                   /db_xref="InterPro:IPR002296"
FT                   /db_xref="UniProtKB/TrEMBL:Q935P8"
FT                   /protein_id="CAD09668.1"
FT                   /translation="MSANLLAFCSRLLSWYQINPSKRTGAMSAVESDSLPMGAPGSSLV
FT                   AYMPHTGLLINDDNFLPEMREELDVINRQVESYNDELSLLRSMSAQFLKCGNQKLYSYL
FT                   SGYNHLISEADASYAENALRSEYWKRVMALTDVLSVMSDEKKKEWDKQFTADRYHLPPQ
FT                   EIPDFTLDAVVTTVVALLNDRHQFIKDRVYAVFQSLSRQHKTNKAFGFSTRMITSGVCE
FT                   GVKDKWVKLKVEFKESGLMPLSELRVICSYFRGETVKPVYDTKKMVENMVGHVGFRNWI
FT                   SLDGNSIRFRVYKNGSMHIDVHPDIAERLNNILAAIVPLALPAERVAHTKATLQEFPAL
FT                   KRCIDFHSRMQLAELDFTQNEKEWSSWTSLGYAGENADKTRQVNADVLRFLGARVTSYH
FT                   VTFDYDPTEVMRFIGHMGAMPDIKSHQFYPSSARLSEYVASIIAAGEGERLLEPNIGHG
FT                   DLLQCFPKSVNVTGIELDTLNCLVSRAKGYETTEADFLAWSAANQIQKFDCVVMNPPFA
FT                   DNRAKLHLLAAASHLVPGGRLAAVLPLSLQGIDNLLGEGFRTEWMDTFDNEFDNTAVSV
FT                   RVLYAERF"
FT   misc_feature    complement(34401..34421)
FT                   /note="PS00092 N-6 Adenine-specific DNA methylases
FT                   signature"
FT   CDS             complement(36134..37291)
FT                   /transl_table=11
FT                   /gene="HCM1.58c"
FT                   /product="putative DNA-binding protein"
FT                   /note="HCM1.58c, possible DNA-binding protein, len: 385 aa;
FT                   contains a region of weak similarity to putative chromosome
FT                   partitioning proteins e.g. TR:O84694 (EMBL:AE001339), parB,
FT                   Chlamydia trachomatis chromosome partitioning protein (281
FT                   aa), fasta scores; E(): 0.0018, 26.7% identity in 135 aa
FT                   overlap. Contains a possible helix-turn-helix motif at aa
FT                   184-205 (Score 1105, +2.95 SD). Similar to HCM1.286c,
FT                   possible DNA-binding protein (401 aa), fasta scores; E():
FT                   1.1e-19, 31.9% identity in 298 aa overlap and HCM1.63c,
FT                   hypothetical protein (358 aa), fasta scores; E(): 3e-16,
FT                   28.6% identity in 290 aa overlap"
FT                   /db_xref="GOA:Q9L5T7"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5T7"
FT                   /protein_id="CAD09669.1"
FT                   /translation="MSDLMTDSQQQTNSRVFKSPLVSFSTVTGSGRFVSGMKQFRDANP
FT                   DLCNEVTEQKAWAISPTVVQITEGFNSREMGMGEAYYQLPEVADHLNNIKNAYIRGDYV
FT                   DPIRVLIKDGIPYVRQGHCRLKAALMAVAEGHSNLTILCIEMKADEISCELTTIDGNRG
FT                   LALSPVALGESYRRLQALGGWSLDRIAEREGKSNTTIAALIRLTGCCVYLKKLIHADAI
FT                   SYVAVLSLIDEFGETEAVARIEKMIADLEKADSSGIQIKKTPRGQIRVVPSDFKPARVP
FT                   PVLATKAVEGVKLITTSLLQKLGDIELPEVTDSSEDEEITFTLNRSMLEMLKNLQSEIT
FT                   ESENKQLRRAENRQARLKGEKVTYKTKKNDKNGGEPQSETPPAQA"
FT   RBS             complement(37297..37300)
FT                   /note="possible RBS"
FT   RBS             37639..37642
FT                   /note="possible RBS"
FT   CDS             37651..38475
FT                   /transl_table=11
FT                   /gene="HCM1.59"
FT                   /product="putative DNA modification methylase"
FT                   /note="HCM1.59, possible DNA modification methylase, len:
FT                   274 aa; similar to many modification methylases e.g.
FT                   SW:ML21_LACLC (EMBL:U16027), LlaIIA, Lactococcus lactis
FT                   modification methylase (284 aa), fasta scores; E():
FT                   1.1e-26, 36.5% identity in 271 aa overlap. Contains PS00092
FT                   N-6 Adenine-specific DNA methylases signature"
FT                   /db_xref="GOA:Q935P7"
FT                   /db_xref="HSSP:2DPM"
FT                   /db_xref="InterPro:IPR002052"
FT                   /db_xref="InterPro:IPR002294"
FT                   /db_xref="InterPro:IPR012326"
FT                   /db_xref="InterPro:IPR012327"
FT                   /db_xref="UniProtKB/TrEMBL:Q935P7"
FT                   /protein_id="CAD09670.1"
FT                   /translation="MRKHTPIIKWAGGKTKLMPFLSKHFPHDKSRRWVEPFIGGGAVFL
FT                   NMFATEALLADSNPDLINLYRNIQRNKPAFIREVQLLAERHFEEEDYYVLRNTFNSTSF
FT                   DDAPLQRAAIFYAMNRLGYNGLCRYNLKRKFSVPWGKRYQFSLDIQKVDYLSFRLSSVE
FT                   LKTADFGQTLEFAGGGDQIYCDPPYDKISKTSFVSYDGIPFDKSAHVKLADMLVDANRK
FT                   GASVAISNSMTPFTLELYEERGFDIHTHNAYRSVGSQSKSRKKEIEILAVLR"
FT   misc_feature    38194..38214
FT                   /note="PS00092 N-6 Adenine-specific DNA methylases
FT                   signature"
FT   CDS             complement(38490..39311)
FT                   /transl_table=11
FT                   /gene="HCM1.60c"
FT                   /product="hypothetical protein"
FT                   /note="HCM.60c, hypothetical protein, len: 273 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5T9"
FT                   /protein_id="CAD09671.1"
FT                   /translation="MQNDLGLGFIRKSARTSAKIISRKVTFPLDDLDNAKLTLTGLQCH
FT                   PSCRFPFYQLSMLIHNQLAEHGVISADENAPFTVSISIHEWLSRARVAFIDYHGLRNSD
FT                   KTVMITRAHLEELLTYLSTTLAVYVPYSKKRLNFSFLTSFTLVKTSQSYTLTFPGVLRP
FT                   FLMLLGGLIQEFMTEKLLKRRNAQFVIFDYLRKSRRHSHKITDIVNDLQLHTVNVRIMN
FT                   VLTQLADQGFISFICEGKRGERSIEELQFIPYASRDHSEVLSFEEWISPID"
FT   RBS             complement(39318..39321)
FT                   /note="possible RBS"
FT   CDS             complement(39594..40301)
FT                   /transl_table=11
FT                   /gene="HCM1.61c"
FT                   /product="hypothetical protein"
FT                   /note="HCM.61c, hypothetical protein, len: 235 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5U0"
FT                   /protein_id="CAD09672.1"
FT                   /translation="MKHSLFFTQDGYLLPSSVKPIYGKDGHYYAVITRECFECGGTGKI
FT                   ANAVCVTCNGSKTSPATEEKLVLKECIEFLETIPELRCNPDLEAWKRRHSEQLALLQAD
FT                   NSKFAASIAQQLNNNLFLTVRQLESFYSTYQPVSEAFSENAGFPIEHSFNIGDVVSFDI
FT                   IFTEVRAAFSKGSHSYFFTFTGKKQNDGFALTGNVQDHVLLGHSYHLSGKVRKIHYFDS
FT                   VPYALLTVFKLTA"
FT   CDS             complement(40298..40498)
FT                   /transl_table=11
FT                   /gene="HCM1.62c"
FT                   /product="hypothetical protein"
FT                   /note="HCM.62c, hypothetical protein, len: 66 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935P6"
FT                   /protein_id="CAD09673.1"
FT                   /translation="MDKIAQFTVINTYNDLLITKGTLDRNIEEIKAGKRFDHFEEGHDQ
FT                   YVQKVTDALQLVEARLENLKK"
FT   RBS             complement(40313..40316)
FT                   /note="possible RBS"
FT   RBS             complement(40505..40510)
FT                   /note="possible RBS"
FT   CDS             complement(40516..41592)
FT                   /transl_table=11
FT                   /gene="HCM1.63c"
FT                   /product="hypothetical protein"
FT                   /note="HCM.63c, hypothetical protein, len: 358 aa; unknown
FT                   function. Similar to HCM1.58c, possible DNA-binding protein
FT                   (385 aa), fasta scores; E(): 7.5e-20, 28.6% identity in 290
FT                   aa overlap and HCM1.286c, possible DNA-binding protein (401
FT                   aa), fasta scores; E(): 1.6e-14, 32.8% identity in 189 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5U2"
FT                   /protein_id="CAD09674.1"
FT                   /translation="MNHCDYQIIEISPKALFIESGFNPREAVIGELCYEQEPVKSTIVS
FT                   IKQAYKEGRRVDLIKVVKKDSNYVVRQGHCRYRALSLALAEGADIQLISVVVMNYKNKS
FT                   EEYLENLDGNRNNGLNPVALAYALAEALKLGSTVESLAMRYQRSSTAIRNQLKILDMPL
FT                   ELQRLISLNLIKKTLAIEIMLKYSNDHAKVLAHLESCSLLVPSTEPEPVLSKTSSVQTS
FT                   SNDEKLDNPETLPVHVIPKEVKTKSITRSSLGIKRLSHKKTERLKTEFIGLIDTVRPAL
FT                   NDSNKLTELIFDGQHSNLFTNISSTSITKTTESVKITLDEAKLQLLLSLLNDENTAIII
FT                   PKSKVTELHEIRDLLTSE"
FT   RBS             complement(41598..41603)
FT                   /note="possible RBS"
FT   repeat_region   41991..42009
FT                   /note="iteron associated with repA2; 93% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   42012..42030
FT                   /note="iteron associated with repA2; 88% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   42033..42051
FT                   /note="iteron associated with repA2; 83% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   42056..42074
FT                   /note="iteron associated with repA2; 92% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   CDS             42127..43002
FT                   /transl_table=11
FT                   /gene="repA2"
FT                   /gene_synonym="HCM1.64"
FT                   /product="replication initiation protein"
FT                   /note="HCM1.64, repA2, replication initiation protein, len:
FT                   291 aa; identical to TR:Q07464 (EMBL:M95772), repA,
FT                   Salmonella typhi replication protein from plasmid R27 (291
FT                   aa), fasta scores; E(): 0, 100.0% identity in 291 aa
FT                   overlap. Contains Pfam match to entry PF01651 RepA, RepA
FT                   family. Contains probable helix-turn-helix motif at aa
FT                   113-134 (Score 1269, +3.51 SD). Similar to HCM1.54, repA,
FT                   replication initiation protein (293 aa), fasta scores; E():
FT                   0, 35.2% identity in 290 aa overlap"
FT                   /db_xref="GOA:Q7BRX0"
FT                   /db_xref="InterPro:IPR000525"
FT                   /db_xref="UniProtKB/TrEMBL:Q7BRX0"
FT                   /protein_id="CAD09675.1"
FT                   /translation="MSDNNEVTHPFDVTNTETGKTYQLSPNSSKSVQPIALLRLSVFTP
FT                   VGTKEKRYRNFEVDASDELSSMELARSEGYDDIRITGLKLSMSTDFKCWLGCIMAFSKY
FT                   GFASDKITLSFNEFAKMCGISSTNINKRTRSRFQEALANLASVVISFRDSKTERFTVTH
FT                   LVQKAVIDPKKDTVELVGDPSMWELYRYDHKTLLSLQVLSVLAKKEAAQSLYIYFEAMP
FT                   AGTLFVSMKRLRERLLLTTPVRTQNQIIRKAMLELKSIGYLEYQEVKKGRDIQFQIFKR
FT                   SPKLALAKHS"
FT   misc_feature    42127..77106
FT                   /note="98.1% identical to Salmonella typhi plasmid R27 tra2
FT                   region (EMBL:AF105019) bases 2880..38245"
FT   misc_feature    42238..42966
FT                   /note="Pfam match to entry PF01651 RepA, RepA family, score
FT                   558.90, E-value 3.4e-164"
FT   repeat_region   complement(43057..43075)
FT                   /note="iteron associated with repA2; 98% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   complement(43151..43169)
FT                   /note="iteron associated with repA2; 88% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   complement(43235..43253)
FT                   /note="iteron associated with repA2; 89% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43476..43494
FT                   /note="iteron associated with repA2; 89% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43495..43515
FT                   /note="repeat associated with repA2; 91% identity to
FT                   consensus GGGCGCTGAAAGGTGCCTTTG"
FT   repeat_region   43520..43538
FT                   /note="iteron associated with repA2; 90% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43538..43558
FT                   /note="repeat associated with repA2; 91% identity to
FT                   consensus GGGCGCTGAAAGGTGCCTTTG"
FT   repeat_region   43563..43581
FT                   /note="iteron associated with repA2; 94% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43581..43601
FT                   /note="repeat associated with repA2; 91% identity to
FT                   consensus GGGCGCTGAAAGGTGCCTTTG"
FT   repeat_region   43605..43623
FT                   /note="iteron associated with repA2; 99% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43624..43644
FT                   /note="repeat associated with repA2; 85% identity to
FT                   consensus GGGCGCTGAAAGGTGCCTTTG"
FT   repeat_region   43667..43687
FT                   /note="repeat associated with repA2; 93% identity to
FT                   consensus GGGCGCTGAAAGGTGCCTTTG"
FT   repeat_region   43692..43710
FT                   /note="iteron associated with repA2; 92% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43711..43731
FT                   /note="repeat associated with repA2; 88% identity to
FT                   consensus GGGCGCTGAAAGGTGCCTTTG"
FT   repeat_region   43736..43754
FT                   /note="iteron associated with repA2; 94% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43755..43775
FT                   /note="repeat associated with repA2; 92% identity to
FT                   consensus GGGCGCTGAAAGGTGCCTTTG"
FT   repeat_region   43780..43798
FT                   /note="iteron associated with repA2; 95% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43799..43819
FT                   /note="repeat associated with repA2; 83% identity to
FT                   consensus GGGCGCTGAAAGGTGCCTTTG"
FT   repeat_region   43824..43842
FT                   /note="iteron associated with repA2; 100% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43867..43885
FT                   /note="iteron associated with repA2; 94% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43910..43928
FT                   /note="iteron associated with repA2; 89% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43953..43971
FT                   /note="iteron associated with repA2; 90% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   43997..44015
FT                   /note="iteron associated with repA2; 99% identity to
FT                   consensus AAAAGCATTTGCATGAATG"
FT   repeat_region   44055..44075
FT                   /note="repeat associated with repA2; 81% identity to
FT                   consensus GGGCGCTGAAAGGTGCCTTTG"
FT   RBS             44347..44350
FT                   /note="possible RBS"
FT   CDS             44356..44709
FT                   /transl_table=11
FT                   /gene="trhA"
FT                   /gene_synonym="HCM1.67"
FT                   /product="putative pilin precursor"
FT                   /note="HCM1.67, trhA, probable pilin precursor, len: 117
FT                   aa; highly similar to TR:AAD54053 (EMBL:AF105019), trhA,
FT                   Salmonella typhi putative pilin from plasmid R27 (117 aa),
FT                   fasta scores; E(): 0, 99.1% identity in 117 aa overlap. R27
FT                   trhA shown to be involved in plasmid transfer by mini-Tn10
FT                   knockout. Contains a probable signal sequence similar to
FT                   that of SW:P04737 (EMBL:K01147), traA, Escherichia coli
FT                   F-plasmid pilus. Very weak similarity to and conservation
FT                   of gene order with Escherichia coli F-plasmid traALE genes"
FT                   /db_xref="UniProtKB/TrEMBL:Q935P5"
FT                   /protein_id="CAD09676.1"
FT                   /translation="MELTLNTNVERGKTNAFAFLKSKHAKVPLFILLVLANCSFAYAGS
FT                   DDGAFGDIWAYMSEALTGAPGKIIACGMLFSVAYFGVVKPNLGLALVSALMMLVMANGE
FT                   KIISSFLDAGIPL"
FT   CDS             44728..45078
FT                   /transl_table=11
FT                   /gene="trhL"
FT                   /gene_synonym="HCM1.69"
FT                   /product="putative plasmid transfer protein"
FT                   /note="HCM1.69, trhL, probable plasmid transfer protein,
FT                   len: 116 aa; identical to TR:AAD54052 (EMBL:AF105019),
FT                   trhL, Salmonella typhi putative pilus synthesis and
FT                   assembly protein from plasmid R27 (116 aa), fasta scores;
FT                   E(): 0, 100.0% identity in 116 aa overlap. R27 trhL shown
FT                   to be involved in plasmid transfer by mini-Tn10 knockout.
FT                   Contains hydrophobic, possible membrane-spanning regions.
FT                   Very weak similarity to and conservation of gene order with
FT                   Escherichia coli F-plasmid traALE genes"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGT2"
FT                   /protein_id="CAD09677.1"
FT                   /translation="MRGIFPLSGVFMTSQYEIPPHTYRFPYRINMPLLILFWDAKQLGI
FT                   TFVTIASGNIFDFFITSVVVAVVFWFAYKKAAEEGIRGKLKHKLWWYGFFPGKSVFSSR
FT                   YFTDPFIRNLYS"
FT   CDS             45078..45875
FT                   /transl_table=11
FT                   /gene="HCM1.70"
FT                   /gene_synonym="trhE"
FT                   /product="putative pilus assembly protein"
FT                   /note="HCM1.70, trhE, probable pilus assembly protein, len:
FT                   265 aa; identical to TR:AAD54051 (EMBL:AF105019), trhE,
FT                   Salmonella typhi putative pilus assembly protein from
FT                   plasmid R27 (265 aa), fasta scores; E(): 0, 100.0% identity
FT                   in 265 aa overlap. R27 trhE shown to be involved in plasmid
FT                   transfer by mini-Tn10 knockout. Very weak similarity to and
FT                   conservation of gene order with Escherichia coli F-plasmid
FT                   traALE genes, however traE (and homologues) have a strong
FT                   predicted hydrophobic region near the N-terminus absent
FT                   from this predicted CDS"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGT3"
FT                   /protein_id="CAD09678.1"
FT                   /translation="MELRMKLLSRLKIPFIKNSSNGDFDNKDETSQKGGEEVKGSFLDS
FT                   KARFSKEIEGSEIGITYSALIKRDEKLLRVNTVAMIIIGVLVVKNQFLTDPVTIVLPPN
FT                   MTEEVKVVGNKASESYKTQWALFFSTLIGNINPTNIGFVTTTILDALSPDLQAKTRESL
FT                   QQQTNIMQARGVEQSFKPIDMYYDTKNDMVYVWGTKSTRLINVPDKTESSKWTFEWVLG
FT                   MKNGRPRIAYVNQYSGTPNIKKITINGKEQLATLDNPPPSIGN"
FT   CDS             45878..47110
FT                   /transl_table=11
FT                   /gene="HCM1.71"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.71, possible periplasmic protein, len: 410 aa;
FT                   identical to TR:AAD54050 (EMBL:AF105019) Salmonella typhi
FT                   hypothetical protein from plasmid R27 (410 aa), fasta
FT                   scores; E(): 0, 100.0% identity in 410 aa overlap. Contains
FT                   a probable N-terminal signal sequence"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGT4"
FT                   /protein_id="CAD09679.1"
FT                   /translation="MTSKKVFHCTAITAVILLATSNVVFAEDYQLPATVNNPVVMPVGA
FT                   DEFQNGVKNAIIKDTGTTTETVQATKPTTALPSLSPASSASPAVNEITGALSNNPTLAG
FT                   YQQQVKSGNFDSYGRPAGKEPQQNAQSTGSPSKADELYVEARNRYKEVQRVNVPPGGNI
FT                   VLPVSRGLQNRISTSFKNASVSTSTPADEASIFVNGGDVFISTNTDKPIGIMLSEDSVP
FT                   ESTYNLTLVPLDVPGAMISVTTSLSPTMQAKRETSLDKQNYDEMLARSQSEELTPSDPR
FT                   QDDHKQRIIDLLTPVALGEVPSGFSLQEDRLSRIPSSEQSPCNFNMYAKLGQRLVGSRE
FT                   LIDVVLVKNDKPYGQVVADQQCITEGVVASALFDKAFLQPGEETELYIVRDKLFKERQT
FT                   RVTTRPSLIKR"
FT   CDS             47112..47552
FT                   /transl_table=11
FT                   /gene="HCM1.72"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.72, possible membrane protein, len: 146 aa;
FT                   identical to TR:AAD54049 (EMBL:AF105019) Salmonella typhi
FT                   hypothetical protein from plasmid R27 (146 aa), fasta
FT                   scores; E(): 0, 100.0% identity in 146 aa overlap. Contains
FT                   hydrophobic, possible membrane-spanning region near the
FT                   N-terminus"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGT5"
FT                   /protein_id="CAD09680.1"
FT                   /translation="MRKATFLTVISFGLVVFLGTSYYYQTKYIPKGTVNIFPDVHRQGE
FT                   IVDDAFEKSTIVISDPTLADKFVGSSTESVGRHEVNVIKELGTQNNGSKFIHDESDKSG
FT                   LTVGDKWPRAGEPYIVPQMTEYERNLKVKRFQQPKNGVNNGH"
FT   RBS             47532..47535
FT                   /note="possible RBS"
FT   CDS             47542..48900
FT                   /transl_table=11
FT                   /gene="trhB"
FT                   /gene_synonym="HCM1.73"
FT                   /product="putative plasmid transfer protein"
FT                   /note="HCM1.73, trhB, probable plasmid transfer protein,
FT                   len: 452 aa; identical to TR:AAD54048 (EMBL:AF105019),
FT                   trhB, Salmonella typhi putative pilus assembly protein from
FT                   plasmid R27 (456 aa), fasta scores; E(): 0, 100.0% identity
FT                   in 452 aa overlap. R27 trhB shown to be involved in plasmid
FT                   transfer by mini-Tn10 knockout. Also similar to transfer
FT                   genes from other plasmids e.g. TR:Q9Z4H6 (EMBL:AF030442),
FT                   htdB, Serratia marcesans pilus assembly protein homolog
FT                   from plasmid R478 (388 aa), fasta scores; E(): 0, 82.2%
FT                   identity in 388 aa overlap. Contains a possible N-terminal
FT                   signal sequence"
FT                   /db_xref="InterPro:IPR010501"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5U6"
FT                   /protein_id="CAD09681.1"
FT                   /translation="MDIKKAWENKTVRISVIGAALMVLIVVISQSIFTTPVKKEKKTQK
FT                   KDMQTGFLIDDSQMNKLSNEESQKTYNEMVRQNRIDQNAAKADRDKAEKAQQENKAQIA
FT                   SLASQVQQLTTQLTEMQTSRNGNRNLDAGGPRNNVNEQAPAKPYQLNPNAAVNGVSSGY
FT                   APISPTRNSPMRTITQSSIKTNGTDGVIQVMPISENRIREGREVVAGSEKAPTRTIRGD
FT                   GTAPVDSKARHAARKDEMFLPATSIITGVLITGLEAPTSLSSKAEPMPVTMRIKKDIIM
FT                   PNNYTMDLRDCNLLGSAVGDLASQRAYIRATSISCVNSKGKAFDVIVEAYAVSENDGKN
FT                   GIRGNLISRNGNAIAGSAFAGGLSALAGSLSPSKVSSLNIDPNSTAQYQSPNIGALGAL
FT                   AGAGAAQGGLNRLVDYYTSIAEQQWPIVEISPGRPITFVVQKGATIPTNLTSR"
FT   CDS             48909..49421
FT                   /transl_table=11
FT                   /gene="HCM1.74"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.74, hypothetical protein, len: 170 aa;
FT                   identical to TR:AAD54047 (EMBL:AF105019) Salmonella typhi
FT                   hypothetical protein from plasmid R27 (170 aa), fasta
FT                   scores; E(): 0, 100.0% identity in 170 aa overlap"
FT                   /db_xref="InterPro:IPR000595"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGT7"
FT                   /protein_id="CAD09682.1"
FT                   /translation="MENNNDNESPKKSESADSLNIDAAKPVGGIRTTKKVTLEIDIEKT
FT                   LKYLMVAGLAVLIVIYGYKGGRFVYDNFKAMSQPAYQIAVLDMQTLRKVFNKQNPVLDS
FT                   QQSKTNFENYFKALMKVYRERGYLVIDASLAVTIPENVEIVSYIDLGGSFGEVQSLPGE
FT                   PKESEIR"
FT   CDS             49422..50279
FT                   /transl_table=11
FT                   /gene="HCM1.75"
FT                   /product="putative plasmid transfer protein"
FT                   /note="HCM1.75, possible plasmid transfer protein, len: 285
FT                   aa; identical to TR:AAD54046 (EMBL:AF105019) Salmonella
FT                   typhi hypothetical protein from plasmid R27 (250 aa), fasta
FT                   scores; E(): 0, 100.0% identity in 250 aa overlap.
FT                   N-terminal half is highly similar to TR:Q9Z4H5
FT                   (EMBL:AF030442), htdT, Serratia marcesans putative transfer
FT                   associated protein from plasmid R478 (157 aa), fasta
FT                   scores; E(): 0, 69.0% identity in 142 aa overlap, shown by
FT                   Tn7 insertion to be involved in transfer"
FT                   /db_xref="InterPro:IPR012336"
FT                   /db_xref="UniProtKB/TrEMBL:Q935P4"
FT                   /protein_id="CAD09683.1"
FT                   /translation="MKKLLLSLLISITSACPPLTLAVENVLNNRDAAALMEKAKEGGVS
FT                   TKPLDGVLAKMKSYKPKDAIYIPTGGLYLFQDERSQLMAVTTDGRYTITGGSVMDILQR
FT                   KSVLSVEDIRKSFFINLDDAPFPLETVASIPLGNPKLKRQAAIFITLDCDGCQDLIKKF
FT                   YDEREKYRVDIVLIPSPGEPKQELRQLWCSKEKGKVNDLDILRWLMGNKADIEKRLLTK
FT                   EEAEACPAEPLVASLMLAGIYKLQGVPSVVRQDGLAGNGIPKDFDYWLKQSVEPLLKNP
FT                   FDTN"
FT   CDS             50289..51239
FT                   /transl_table=11
FT                   /gene="trhV"
FT                   /gene_synonym="HCM1.76"
FT                   /product="putative plasmid transfer protein"
FT                   /note="HCM1.76, trhV, probable plasmid transfer protein,
FT                   len: 316 aa; identical to TR:AAD54045 (EMBL:AF105019),
FT                   trhV, Salmonella typhi probable plasmid transfer protein
FT                   from plasmid R27 (316 aa), fasta scores; E(): 0, 100.0%
FT                   identity in 316 aa overlap. R27 trhV shown to be involved
FT                   in plasmid transfer by mini-Tn10 knockout. Highly similar
FT                   to TR:Q9Z4H4 (EMBL:AF030442), htdD, Serratia marcesans
FT                   putative transfer associated protein from plasmid R478 (324
FT                   aa), fasta scores; E(): 0, 79.2% identity in 313 aa
FT                   overlap, shown by Tn7 insertion to be involved in transfer.
FT                   Contains PS00017 ATP/GTP-binding site motif A (P-loop)"
FT                   /db_xref="InterPro:IPR014118"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGT9"
FT                   /protein_id="CAD09684.1"
FT                   /translation="MNIKKVIFSALVVGSSSYLAGCTIGSAESECPGIEKGVICKGPRE
FT                   VMELTNNRDDLSGLGEEEANSGKGKSAVNDSQYPAQLTPPGAVQYPKSSVLVNKPVTYT
FT                   TTEVKPVGQLPVMYDQTLKMGAPTSTIGPRPISGNPVNSNVRMTTSYNSNGSSVNPFLH
FT                   PSAEVVKKTTQVVTPAPAPRYVAPNSDINASKDLYSINNGQPVNPTLSSGQVQQYRTQG
FT                   YKQAVVAPEPLAVLQQGRVMRITFAPYTDDNDALNLPGFVYVNVKPQTWIAGKNSTSNP
FT                   ARIVPLEVQDAARENMQQQQRATKAVSSNGIVRQL"
FT   misc_feature    50478..50501
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   RBS             51238..51241
FT                   /note="possible RBS"
FT   CDS             51248..53929
FT                   /transl_table=11
FT                   /gene="trhC"
FT                   /gene_synonym="HCM1.77"
FT                   /product="plasmid transfer protein"
FT                   /note="HCM1.77, trhC, plasmid transfer protein, len: 893
FT                   aa; highly similar to TR:AAD54044 (EMBL:AF105019), trhC,
FT                   Salmonella typhi plasmid transfer protein from plasmid R27
FT                   (887 aa), fasta scores; E(): 0, 99.2% identity in 893 aa
FT                   overlap. Also similar to SW:TRAC_ECOLI (EMBL:M30936), traC,
FT                   Escherichia coli transfer protein from the F plasmid (875
FT                   aa), fasta scores; E(): 9.1e-15, 22.8% identity in 893 aa
FT                   overlap and to other traC homologues. Contains PS00017
FT                   ATP/GTP-binding site motif A (P-loop)"
FT                   /db_xref="UniProtKB/TrEMBL:Q935P3"
FT                   /protein_id="CAD09685.1"
FT                   /translation="MRSANVYNKELSRHQLGGFIPVYDQIPGTHYFLLDGNRLGFMFIC
FT                   SPSPGVFDNQQDVLTELFKMDFPTDTICQTSLTALPDLILHLSAWSAVRGGRMEGHDKL
FT                   KGDLLTAYQLDYYDRSLNEPLKPDHDKLMLRDFQVWISFSIPLKSALPSEIEKSRIDAL
FT                   YSDLISKLNTVGLFPHKVGAENWLYCMDKLLHPGKTSRWSEGHVEASTMRRLNEQINVP
FT                   GRKYTVTENHFSSTTQSNDISEHRYFKQLSVVKFPEFVNFGCMYELVVNWLNGRKTIFS
FT                   PFMITQTVHFADPLKLSRENVRYKAITNKQASIPTVLTFCPRLKDMDNDYMTITRELED
FT                   GARLLHSYLTFTVMGNSAVDVQSAADQLKSFYLESRVNVADDSYIVFPSFVSSLPMCND
FT                   PKTILELDRFEVVSNTGAAHMTPIFGPWKGNTDRPVLNLVSREGQLLGLDIFKTSASYN
FT                   MVVGATSGAGKSFWVAYIINNYLGAGPRSNNLIHYRDTFEGFKNNSYDAFDPDGAQIFV
FT                   VDVGRSYQGISEQYTNSQFIDFGKKPDFTLNPFAFLTDVTVGERVFDEAPVFNDDSNNH
FT                   DDDKDKVAQTIMVLNQLKIMASEKGNIDDFQQSVMLQLISEEYNESRKVGRTGSITGFA
FT                   RRCSNHEDKRIKDIGDQLGQWCEGGIYGNRFTENLPPINFDSRFIVLELEELKGTPHLQ
FT                   TVVLMSIIQAAQHAMFIKKDGRRRLFILDEAWEYIRPDNASGSSNHSNQFFSSFLEAAW
FT                   RRFRKTNCAGICITQSFEDYFTSSVGRALTANSPWKIIMKQEKESIEAMKVNNYFSTTD
FT                   AEYERMKNIRTVKRAFSEMLVRFENFQEICRLYVDRKMELCFTTDSTDRGKLWEIQSRL
FT                   DCSYGEAIEILYEQEVASKSAA"
FT   misc_feature    52634..52657
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   repeat_region   54578..54631
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   54632..54685
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   54686..54739
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   54740..54793
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   54794..54847
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   54848..54901
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   54902..54954
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   55753..55806
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   55807..55860
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   55863..55911
FT                   /note="54 bp direct repeat (bases 5 - 54)"
FT   repeat_region   55912..55965
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   55966..56018
FT                   /note="54 bp direct repeat (bases 2 - 54)"
FT   repeat_region   56019..56072
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   56073..56126
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   56127..56180
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   56183..56231
FT                   /note="54 bp direct repeat (bases 5 - 54)"
FT   repeat_region   56232..56283
FT                   /note="54 bp direct repeat (bases 3 - 54)"
FT   repeat_region   56284..56335
FT                   /note="54 bp direct repeat (bases 3 - 54)"
FT   repeat_region   56336..56387
FT                   /note="54 bp direct repeat (bases 3 - 54)"
FT   repeat_region   56388..56441
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   repeat_region   56442..56495
FT                   /note="54 bp direct repeat (bases 1 - 54)"
FT   CDS             56742..57995
FT                   /transl_table=11
FT                   /gene="HCM1.86"
FT                   /product="putative plasmid partition protein"
FT                   /note="HCM1.86, possible plasmid partition protein, len:
FT                   417 aa; identical to TR:AAD54041 (EMBL:AF105019), parB,
FT                   Salmonella typhi putative partition protein from plasmid
FT                   R27 (417 aa), fasta scores; E(): 0, 100.0% identity in 417
FT                   aa overlap. Shows weak similarity to TR:Q44030
FT                   (EMBL:X90708), parA28, Alcaligenes eutrophus protein
FT                   involved in plasmid partitioning and stability (306 aa),
FT                   fasta scores; E(): 8.6e-07, 27.3% identity in 278 aa
FT                   overlap. Contains a probable helix-turn-helix motif at aa
FT                   50-71 (Score 1015, +2.64 SD)"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGU3"
FT                   /protein_id="CAD09686.1"
FT                   /translation="MNLIDKIALVGQRMKSEQISLKESLLVSSRVSVSDDSVDGVDRLI
FT                   YNHCLNKKNLSDFFGKSRVTFNKILADLEEKELVGAPIYQNKNHLYTRWDVQKIMDALN
FT                   YPRYSDYYCSRTIVTQNHKGGTGKSTTSGVLAVAAALDLHLNARILLIEWDPQGSIGSG
FT                   MIQSVAEDDVFLTAIDAILGVYEEDSDYRKYLDLGYSEEQIIEGMPFSTHLPNLDVITA
FT                   FPTDARFKDKYWQCSREERTELLLRFKEVILPVLKSKYDLIIIDTPPEDSPITWAADEA
FT                   ADGILVAVSPREYDYASTTDFMLTISERFKQSPSKGENLSWFKVLAVNVDDKSPYEKIV
FT                   LDKLVRTVQELFMSANIKNSEAFKAAASRGRTVLDIKKSEELCSPKQLDVAEESVMAVY
FT                   QQFINEIKSFSVKQGGNV"
FT   CDS             57992..58999
FT                   /transl_table=11
FT                   /gene="HCM1.87"
FT                   /product="putative plasmid partition protein"
FT                   /note="HCM1.87, possible plasmid partition protein, len:
FT                   335 aa; identical to TR:AAD54040 (EMBL:AF105019), repA,
FT                   Salmonella typhi putative replication protein from plasmid
FT                   R27 (335 aa), fasta scores; E(): 0, 100.0% identity in 335
FT                   aa overlap. Similar to plasmid partition proteins (some
FT                   putative) e.g. SW:PARB_ECOLI (EMBL:X02954), parB,
FT                   Escherichia coli plasmid partition protein (343 aa), fasta
FT                   scores; E(): 1.1e-15, 27.9% identity in 315 aa overlap.
FT                   Contains a probable helix-turn-helix motif at aa 174-195
FT                   (Score 1336, +3.74 SD)"
FT                   /db_xref="GOA:Q9RGU4"
FT                   /db_xref="InterPro:IPR003115"
FT                   /db_xref="InterPro:IPR014884"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGU4"
FT                   /protein_id="CAD09687.1"
FT                   /translation="MSDEQHIGNDKSRYINAPKRTEVIHRSGLQGLKGQPRLKKLFTLH
FT                   NGRKLEAEHIIVPAEKVELETTVHPLNPRNQEALSVNAVRDILKDIEARGVDTEGVAVK
FT                   RNGVYLLIEGSRRRFCCIQSAKELPLWVLPDDVNADDINSIISATQTSRRFSYREVGLK
FT                   YLREMEEHGFVTNEELANYHGISHVSVSKRVQAAKINSTLIALFPDYEAIPNSYYNRLF
FT                   RLQKYIEKNLFSLEEVVENTREEIRDLDISDIAEAQKTVMEKITTVVEKLDIKPPSKGW
FT                   DTRELATFTNKDKYARISKSSSGRKIRFEFNRMNRELIDEIEKFIKSKLSEMNN"
FT   CDS             complement(59182..59574)
FT                   /transl_table=11
FT                   /gene="HCM1.88c"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.88c, possible periplasmic protein, len: 130 aa;
FT                   identical to TR:AAD54039 (EMBL:AF105019) Salmonella typhi
FT                   hypothetical protein from plasmid R27 (130 aa), fasta
FT                   scores; E(): 0, 100.0% identity in 130 aa overlap. Contains
FT                   a probable N-terminal signal sequence"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGU5"
FT                   /protein_id="CAD09688.1"
FT                   /translation="MKYILTVLCIFFCQTASAYPYRIYTAPEGAIVKNILTNEVIGKTP
FT                   VEVDVSNTEAGSTFGISMYRHENVAIKIFTVMPNAENNFTVSGPDVATMSLPGKAPLNV
FT                   TNDSNAAAVHIDLRPFLSEPAHHPVQ"
FT   CDS             complement(59571..60092)
FT                   /transl_table=11
FT                   /gene="HCM1.89c"
FT                   /product="putative lipoprotein"
FT                   /note="HCM1.89c, possible lipoprotein, len: 173 aa; highly
FT                   similar to TR:AAD54038 (EMBL:AF105019) Salmonella typhi
FT                   hypothetical protein from plasmid R27 (173 aa), fasta
FT                   scores; E(): 0, 99.4% identity in 173 aa overlap. Contains
FT                   a possible N-terminal signal sequence and an appropriately
FT                   positioned PS00013 Prokaryotic membrane lipoprotein lipid
FT                   attachment site"
FT                   /db_xref="UniProtKB/TrEMBL:Q935P2"
FT                   /protein_id="CAD09689.1"
FT                   /translation="MIKVSAFILTLLVTGCQSVGSKIAVLPSVGFDPIMSNRTEAYTDG
FT                   KVTFLIESSGTDVWLLAKNGTKEFIELSDLNLGGSRCTYSSRGKQLISPSSVTIFTVPT
FT                   VGLLGLCYDNNDQLTFINNSFKNISQSSRDGLTLPLLFSIKYKFPGSFDSKQIVVTQSF
FT                   DLEFLQKEQS"
FT   RBS             complement(59580..59585)
FT                   /note="possible RBS"
FT   misc_feature    complement(60045..60077)
FT                   /note="PS00013 Prokaryotic membrane lipoprotein lipid
FT                   attachment site"
FT   CDS             complement(60085..60924)
FT                   /transl_table=11
FT                   /gene="HCM1.90c"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.90c, possible periplasmic protein, len: 279 aa;
FT                   identical to TR:AAD54037 (EMBL:AF105019) Salmonella typhi
FT                   putative surface exclusion protein from plasmid R27 (279
FT                   aa), fasta scores; E(): 0, 100.0% identity in 279 aa
FT                   overlap. Contains a probable N-terminal signal sequence"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGU7"
FT                   /protein_id="CAD09690.1"
FT                   /translation="MLKLELIILPLLAFLGPSNITNASTKTPIPSSQLSDAKTGVNYEF
FT                   ITIAANYVNGMWLVDGRQRPVIKTSMTKRNYLQIENDSASTPLNLVIPKIEFSIIAKNG
FT                   VFISKFISLDEDASGKRILWLEPGSSMTISFVNDLSSTPLQALVSVTKQKKEVIAIFGP
FT                   DQGKKFTLPLPSDSQQSSIDYVPSPEIALRINAPKKLQPAIAIPEDASASLLPSHTYKI
FT                   RAAEKVRTFKFSSFVWVGKRNNLLGGSDYFTKELKIYPGENFDISTIQKTTMRTEND"
FT   CDS             complement(60924..61895)
FT                   /transl_table=11
FT                   /gene="HCM1.91c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.91c, hypothetical protein, len: 323 aa;
FT                   identical to TR:AAD54036 (EMBL:AF105019) Salmonella typhi
FT                   putative surface exclusion protein from plasmid R27 (323
FT                   aa), fasta scores; E(): 0, 100.0% identity in 323 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGU8"
FT                   /protein_id="CAD09691.1"
FT                   /translation="MQFQKEAFMASEHVQTIDLTNFSGRVFFLADPHGHYSTLCNLIHS
FT                   ISEPDEELIVFSTGNLFDYGPEPMELMTAINTGIFDGRSVRVFSAAGAGEEMLKKLLPI
FT                   NKDRRTYYPSTFLNERWCARGGRWHKQINRNYLEEEICKLLSTQLATVMKVLFKGNISI
FT                   GICPSDYTDIRQGFNNTYNALLAFNQANVNIFQSQFLYGMDHAVRPVNVSDVNLVVLGR
FT                   NPVNSIRKAHGLPLTNLPVLIGNCLHINTGSLYMSEISSPALLAPGIPPTTVPAITLVE
FT                   LILASTPTLICHQMILNKNGIYTQNTAPLNLDSNDNNIEATL"
FT   RBS             complement(60935..60938)
FT                   /note="possible RBS"
FT   CDS             62245..63279
FT                   /transl_table=11
FT                   /gene="HCM1.92"
FT                   /product="putative plasmid stability/partition protein"
FT                   /note="HCM1.92, possible plasmid stability/partition
FT                   protein, len: 344 aa; identical to TR:AAD54035
FT                   (EMBL:AF105019), stbA, Salmonella typhi putative
FT                   stability/partitioning protein from plasmid R27 (344 aa),
FT                   fasta scores; E(): 0, 100.0% identity in 344 aa overlap.
FT                   Similar to others e.g. SW:STBA_ECOLI (EMBL:X12777), stbA,
FT                   Escherichia coli StbA protein from the stability locus of
FT                   IncFII plasmid NR1 (320 aa), fasta scores; E(): 7.9e-28,
FT                   33.2% identity in 316 aa overlap"
FT                   /db_xref="InterPro:IPR009440"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGU9"
FT                   /protein_id="CAD09692.1"
FT                   /translation="MTELAKTKLAVAESNSTELETLKVVIDDGSKAAKLVCTNNQGDLV
FT                   PLLTQNSFVADFRVSHDGLIPFNYLIDGLQRFSHHSESSNALETTDVAHQYDEISRLNV
FT                   HHALHSSGLMPQDVHLYVTLPLSQFYTALGETNNENIQRKKDNLMKPVERYIDGKRVSF
FT                   NVVSVTVFPESLPAVTRADEIESIESFESSLVIDLGGTTLDVASITGQLEQISSVRGFD
FT                   RIGCSIVYDEIRRYLDSAKLNASNAYIHHLVDNRENKASLKVSPEDLDGVFNAVNGAVA
FT                   QLQEKVIKAVTQVEERPHNVFLVGGGSYLIEPAVRKHFDKSKIIMVDNPQFALSLAIAD
FT                   TVFA"
FT   RBS             63313..63316
FT                   /note="possible RBS"
FT   CDS             63323..64000
FT                   /transl_table=11
FT                   /gene="HCM1.93"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.93, hypothetical protein, len: 225 aa;
FT                   identical to TR:AAD54034 (EMBL:AF105019), orf B, Salmonella
FT                   typhi hypothetical protein from plasmid R27 (225 aa), fasta
FT                   scores; E(): 0, 99.1% identity in 225 aa overlap.
FT                   N-terminal half similar to corresponding region of
FT                   TR:P95794 (EMBL:U59131), orf B, Serratia marcescens
FT                   hypothetical protein from plasmid R478 (206 aa), fasta
FT                   scores; E(): 2.3e-20, 58.2% identity in 110 aa overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q935P1"
FT                   /protein_id="CAD09693.1"
FT                   /translation="MTKKSEKENDRIQISAFWLSERQSPYAYNFLKKNSLTHRGEQISL
FT                   IRSAITTGLVLNNLFPELSSFINGLNERLTAADLNRFFNDEFNKDKLNNENLKEQISFM
FT                   LDSKFNELFSMINGCDFSKATFSTTSQSDVSETLKAERVRDQRLELIPKELTVNPKPET
FT                   LEILTPIESAKKNDSGLNTSHGSAAVSASQSENTVLSEHAQIQGVTRKPKKKANANLAN
FT                   LAK"
FT   CDS             64566..65018
FT                   /transl_table=11
FT                   /gene="htdA"
FT                   /gene_synonym="HCM1.94"
FT                   /product="transfer repressor"
FT                   /note="HCM1.94, htdA, transfer repressor, len: 150 aa;
FT                   identical to TR:Q52322 (EMBL:L20342), htdA, IncHI1 transfer
FT                   repressor (150 aa), fasta scores; E(): 0, 100.0% identity
FT                   in 150 aa overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q7BRX1"
FT                   /protein_id="CAD09694.1"
FT                   /translation="MLSRNSLIHGLRRDQLIEVLSISEFPVVLVENPFIQPKSTGKKPV
FT                   IFNIDEFHVSIAPISSLKYDWEWAPIDTILIEVVIPPAEADLVSAENDFLRDAGIGHIQ
FT                   CEPGGVSIRRTVTFVGGITADNLLYQLRLMCVSALHLIGEELEDES"
FT   RBS             64996..64999
FT                   /note="possible RBS"
FT   CDS             65008..65442
FT                   /transl_table=11
FT                   /gene="htdF"
FT                   /gene_synonym="HCM1.95"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.95, htdF, possible periplasmic protein, len:
FT                   144 aa; identical to TR:AAD54032 (EMBL:AF105019), htdF,
FT                   Salmonella typhi protein from plasmid R27 (144 aa), fasta
FT                   scores; E(): 0, 100.0% identity in 144 aa overlap. Contains
FT                   a possible N-terminal signal sequence"
FT                   /db_xref="UniProtKB/TrEMBL:Q7BRX2"
FT                   /protein_id="CAD09695.1"
FT                   /translation="MKVNFKKVIPLLMVGLTVAGSYSIFNAKPSKPDLYDFTGKVLKTT
FT                   SVFQPCDKESTPSLNIQIADNGSVHINGVASKVTFVERVPGNEIAVKCTGLQVKNSRLV
FT                   HTSSYTMIISEGKGGFVISDLTHTKDNEVMSGTWFFKKRV"
FT   CDS             65439..66002
FT                   /transl_table=11
FT                   /gene="htdK"
FT                   /gene_synonym="HCM1.96"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.96, htdK, hypothetical protein, len: 187 aa;
FT                   identical to TR:AAD54031 (EMBL:AF105019), htdK, Salmonella
FT                   typhi protein from plasmid R27 (187 aa), fasta scores; E():
FT                   0, 100.0% identity in 187 aa overlap and similar to
FT                   TR:P95792 (EMBL:U59129), htdK, Serratia marcescens protein
FT                   from plasmid R478 (177 aa), fasta scores; E(): 0, 51.1%
FT                   identity in 178 aa overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGV1"
FT                   /protein_id="CAD09696.1"
FT                   /translation="MTMSDLSATGAKPQRVRVFSQSVAMAFEVNLDKSRSADNSAFVTE
FT                   TEKYYLSLQFAPPSDNREYGWNSEGSILMKLSQNEAMALASVFLRIKPTLKFEKRKTTH
FT                   RTHQAYKNINIGPNDRGGLLVSASIVPVKMGTFKPLNYNLPVTQMDCVSTGLFLLGFLT
FT                   LKMPWVSSESIITALRLSESKSGQ"
FT   CDS             66122..70420
FT                   /transl_table=11
FT                   /gene="HCM1.97"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.97, possible periplasmic protein, len: 1432 aa;
FT                   N-terminal 960 aa highly similar to TR:AAD54030
FT                   (EMBL:AF105019) Salmonella typhi hypothetical protein from
FT                   plasmid R27 (960 aa), fasta scores; E(): 0,99.8% identity
FT                   in 950 aa overlap and C-terminal 439 aa highly similar to
FT                   the adjacent R27 ORF TR:AAD54029 (EMBL:AF105019) Salmonella
FT                   typhi hypothetical protein from plasmid R27 (439 aa), fasta
FT                   scores; E(): 0, 99.8% identity in 439 aa overlap. Contains
FT                   a possible N-terminal signal sequence"
FT                   /db_xref="UniProtKB/TrEMBL:Q935P0"
FT                   /protein_id="CAD09697.1"
FT                   /translation="MRKSGLCLTLLFSLIASIKSVQAEAIMISGKLQADMPAVTFNPGP
FT                   GDFVAFVNNNTITASGTGNACNVTVDDRATSSVDNLVCFFEWLPNTSGFTANGFNLTGI
FT                   PNAAGELKLPYKISYFSGSERQKVEVVNGEYTVNALVPVKPTITGLKSSMNGVVQDGYT
FT                   LKSYLKDEAIRNVTVSVEPRNYVQYISIGSGSACEVAIGGNGCTIDVGSIKVSDSDLLM
FT                   GSREITVTANSKNNYFAPPEAQKLTLTWDYRPPVVDHTLWNFTDEAKTISVGGQEIYTG
FT                   ARTVAVAVKVPQEGTEGEWWLPTAMTLTMNPDGVFKPTTKVTLEDGTVIDFKQSWATPL
FT                   RRTLQPVSGPQKVGDEYLYIFDLTDLTNGSYAASFTVENNSKNTSTYNEPESKLMLSDN
FT                   PTLMVLKDGAALAKRAPVYFLNEIIVAAFQGQAGVADIKAVTIDNKLVELTPTNHKGIY
FT                   YLPVGDDLEVNADHEITVIAENLYGKIVTFNTTFTYQPTGFTLKNFEKDITLYSRVRQY
FT                   TDLMSQTAGDKCTLFTTEENALAYLEWYGDKSDITACYPQWNNVPDGLEFYFKGRTPGL
FT                   TGFFNKTGDNLLDYQVYMINGKGSKAVSSRNRHVLITQLPYNPVLTYKKNKVLTGINDN
FT                   TALAYTTGGEAARLLAKVVPADVTVYVSQNGGESVKTTFKNRSSNNDATTFVQRLKVAS
FT                   APLWTKNVFDIAVEYSKEPTMRTVDTLNVYTVPDFNIRAAMEIEDKKTATTMELPLKVS
FT                   VGRYNNSTRKSSFSRTTMGDWDVTIYAQKSVYGKDPETGRYKTTYERTPLTEALPVNDA
FT                   GVVETKIKIENMDLGNVRLVGIAKVRSPFADFELTRETSAVSIRVYKGEELEGNLSKSL
FT                   IIGRIPLSTLVNFKSASTANSDALAPTEWQESSDNGQTWTMLQDMTGKRSISIRKTEVG
FT                   KWLYRAKMTNKFTSKESYSDVLTVVTYKQPKLSIDVAEILEGDDLPVTLLDNDEPIPQG
FT                   TAEVMWSEDKVNWVQGDTTYNVSAADTLPPTIYARMRYLDSDELAEESSWKETSARLTV
FT                   AKPKRLSVSVSGISSVEVGSKVTLDGKYTNPNSRFKNGNDVIEEWTAPDGQKIRGANLS
FT                   ITLTEQMLDKQGYAAFEYSAWLADSKDSTISTRKVSVKSWVYKFPEMKVSTKLKYTMAP
FT                   STLHVALSGIKDGGYPGVTYSREWIYDKDNISVLKDDGDTKEFAIAKPGKYTLVIVFRD
FT                   NRNNEQRIENTFVVDEQTPMTVEMTPKFSNKFMRAPLDVTLRSNIKLAHSADSIDTVTY
FT                   KVNGEVVPGSKNYWAQLISGLTEKKYEVTLDVVSKMGQRGTASVDFEVVKNAAPQCALS
FT                   YTESNMSWSFTNKCIDTDGKLVRYEWYINDELRNVFGSTATLSKNLNRGKQDIRVVAYD
FT                   DSGDSATQRTTVYGPDEGASKSVDSVETSQ"
FT   CDS             70694..71206
FT                   /transl_table=11
FT                   /gene="trhF"
FT                   /gene_synonym="HCM1.98"
FT                   /product="putative pilin maturation protein"
FT                   /note="HCM1.98, trhF, possible pilin maturation protein,
FT                   len: 170 aa; highly similar to TR:AAD54027 (EMBL:AF105019),
FT                   trhF, Salmonella typhi plasmid transfer protein from
FT                   plasmid R27 (170 aa), fasta scores; E(): 0, 99.4% identity
FT                   in 170 aa overlap. Shows weak similarity to signal
FT                   peptidases e.g. SW:LEPC_BACCL (EMBL:Z27457), sipC, Bacillus
FT                   caldolyticus signal peptidase I from plasmids pTA1015 and
FT                   pTA1040 (182 aa), fasta scores; E(): 0.013, 25.1% identity
FT                   in 171 aa overlap. Appears to be missing the proposed
FT                   catalytic serine residue of IncP transfer system signal
FT                   peptidases, therefore may not be active. Contains Pfam
FT                   match to entry PF00461 Peptidase_S26, Signal peptidase I.
FT                   Contains hydrophobic, possible membrane-spanning region
FT                   near the N-terminus"
FT                   /db_xref="InterPro:IPR011056"
FT                   /db_xref="InterPro:IPR015927"
FT                   /db_xref="UniProtKB/TrEMBL:Q935N9"
FT                   /protein_id="CAD09698.1"
FT                   /translation="MREYIPKKRGLLSFDWYVPINLGILILVMLIFFNRFTFGHGLLNG
FT                   CLPADFYMIDLKDKSVSSGNIIAFHMPKSVRFIRENEKVIKIVAGVGGDRLRVTLDGVY
FT                   NGNKFYKANARRISVKYGIPAETIERELTIPEGEVFLIGQTDHSWDSRFWGPVKLTSVI
FT                   GKTYAIF"
FT   misc_feature    71096..71185
FT                   /note="Pfam match to entry PF00461 Peptidase_S26, Signal
FT                   peptidase I, score 15.50, E-value 0.0009"
FT   CDS             71193..72701
FT                   /transl_table=11
FT                   /gene="trhW"
FT                   /gene_synonym="HCM1.99"
FT                   /product="plasmid transfer protein"
FT                   /note="HCM1.99, trhW, plasmid transfer protein, len: 506
FT                   aa; highly similar to TR:AAD54026 (EMBL:AF105019), trhW,
FT                   Salmonella typhi plasmid transfer protein from plasmid R27
FT                   (502 aa), fasta scores; E(): 0, 99.8% identity in 502 aa
FT                   overlap. R27 trhW shown to be involved in plasmid transfer
FT                   by mini-Tn10 knockout. C-terminal half shows weak
FT                   similarity to SW:TRAW_ECOLI (EMBL:M93106), traW,
FT                   Escherichia coli F-pilus assembly protein (210 aa), fasta
FT                   scores; E(): 1.8e-05, 25.4% identity in 193 aa overlap.
FT                   Contains a probable N-terminal signal sequence"
FT                   /db_xref="InterPro:IPR019106"
FT                   /db_xref="UniProtKB/TrEMBL:Q935N8"
FT                   /protein_id="CAD09699.1"
FT                   /translation="MRSFELKTTIKPLASCLAFYALISTAVASPQYQQVADDIARQAQV
FT                   LGAQIPVPHASEGPLPSGSLDSPDTKKYIRQAEAMKKNGDLSQQTNRGYVPGMNADSVQ
FT                   AVIDHTQAIRAQSNNSEAVNDIIRRRDEIQGNSQLSESALKSVENKPEVMRSQSSNIEK
FT                   MFGSSGITAADFERKIDSSREEVLSTENGITIFASFSLPDYVLEDLLRTASEHKARVVF
FT                   NGLKKGTTRLPETQAAINQLVVKGKFDSPLITIDPDAFNQYQITQVPTIISREQSRFAK
FT                   MVGSFNVDFFQRELARKPDQDLFPIAGTTYPVEEKSIIKELEERAQKYDWDGAKKRAVA
FT                   DTWKNQYMVNLPPAQEHKEWLIDPTIRVTQDVKDKQGRVIASAGELINPLARFPQNLTM
FT                   IIFDPMNPGQLEWAEKQYRQRLGSGQVMPMFTRIKQENGWDHLNDLREKFNGKVFKVNE
FT                   QIIARFQIKNTPALISTEKEKFRITQFSEAEIRGIGTKIAAEEN"
FT   CDS             72891..73898
FT                   /transl_table=11
FT                   /gene="trhU"
FT                   /gene_synonym="HCM1.100"
FT                   /product="plasmid transfer protein"
FT                   /note="HCM1.100, trhU, plasmid transfer protein, len: 335
FT                   aa; identical to TR:AAD54025 (EMBL:AF105019), trhU,
FT                   Salmonella typhi plasmid transfer protein from plasmid R27
FT                   (335 aa), fasta scores; E(): 0, 100.0% identity in 335 aa
FT                   overlap. R27 trhU shown to be involved in plasmid transfer
FT                   by mini-Tn10 knockout. Similar to others e.g. SW:TRAU_ECOLI
FT                   (EMBL:M34695), traU, Escherichia coli F-plasmid conjugative
FT                   transfer protein (330 aa), fasta scores; E(): 0, 32.9%
FT                   identity in 322 aa overlap"
FT                   /db_xref="InterPro:IPR009649"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGV7"
FT                   /protein_id="CAD09700.1"
FT                   /translation="MLSLSLPAMTMAADTGVPGAMCQSAGVWQGLIKNICWSCIFPMRI
FT                   MGIGAAPEGAAPSRPGCYCTDQNGIPEIGWQLSFFQPVKIVEVVKSPWCSPFLEGTMLQ
FT                   KSQFDIGKSNTNQPMTATEAGFYDVHLWEFPIMTMLKLLVIGECTAEPYVDASLTYISE
FT                   VDPMWESDLLTLVLNPEAVVFANPIASMVCAADCVAVTAGKDNLAAYFCAGCDGNLYPL
FT                   TGHIYANDDAVRTSSLITQRLLTKLHRQGMLMRTMGADAMCEKTWEYFTPRSQYRLSML
FT                   YPTPEANGPDCCHRLGDSVHDWSTLKGGRKKIGIDNYVYMLWRYNDCCVRYIPN"
FT   CDS             73921..77097
FT                   /transl_table=11
FT                   /gene="trhN"
FT                   /gene_synonym="HCM1.101"
FT                   /product="plasmid transfer protein"
FT                   /note="HCM1.101, trhN, plasmid transfer protein, len: 1058
FT                   aa; identical to TR:AAD54024 (EMBL:AF105019), trhN,
FT                   Salmonella typhi plasmid transfer protein from plasmid R27
FT                   (1058 aa), fasta scores; E(): 0, 100.0% identity in 1058 aa
FT                   overlap. R27 trhN shown to be involved in plasmid transfer
FT                   by mini-Tn10 knockout. Contains a possible N-terminal
FT                   signal sequence"
FT                   /db_xref="InterPro:IPR009726"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGV8"
FT                   /protein_id="CAD09701.1"
FT                   /translation="MKHRKIISSAIIASMIANTMSWAFYVSLINIALTPKIFAADAIFD
FT                   QLENNFNLANPNANRNATTSAQDIVEKYKNADSGENLSGKISEKYVGKAESTNLNVGKY
FT                   GTPNSNESVMSNAVSDGKSIGKAVQLPSMSGGTINSNYTKEGAKLLSRDSSGNIGISNN
FT                   PNTTAGTKTSTGELFSSEQKHSDVQFNAGGRYGDENGFINDIKNRKSQLFEAQSYDGVA
FT                   YRTLVNANKENPASTIKPNDPMFNAGRNEIGNAVAGTGNWLQNCNTETSKQTITTHYPD
FT                   YKEFYCNSPKKDNFNSCTITRDFSVPVYISGGNGDMSMCGDNCVRVWFGRRDDNYWNDG
FT                   VYDNSLTLKFHPDAKLATAKIINAEWDDHMRVTLDGTQIFAHIDGAYRSSNYPSPQGQW
FT                   ELKKSWKLDKVYDITEQVKTSVYQEQDREVTMASRVWVGGGGEGYFEVEMTFENMKLED
FT                   KHIQEPAGCFDAVQTPNSFCRFDRFVNMDVGTKRLPESVLKMATPLYKGDTGYLTWKTN
FT                   LEGYFCDPLAKEKLCSYDAKGNIMKDPTGKDLCYNYDDIKNMPDACSTYKNDAACVLDN
FT                   QTCAEGWFDEGTNTCYMYEQKYTCDRGKDVVREVESQTNSCVGMIPCSGGTCETGPKEE
FT                   NKDFGKVAAYSNMVQYMQGEAKCEDPNDPNSCSVFEGKAEWCGRSVGFVNGLAKTDCCE
FT                   KPQGAAGSLEAIMLAGSMIRNTNWTRVNAQLVNWTGGESGTWASMANSVGEWTASAGKT
FT                   VGQMWNNVTSSITSVYENVAGNLGRTVGSSAAGESGQLAKETMSSFGLGKLKQMAMEKA
FT                   YDLLPDTVRDFVFKNVATTGGEIVFSAAVQNFMLALNVIGWIYTAYQVTKMLLEMLVAC
FT                   DQKEMEASIHKNQKSCFTLDTNRCVKYLNLGFTKKCVKKATDMCCYNSMLSRVIMQQAY
FT                   PQLGIDPVTSNCVGLSIGQIQKLDFDKIDLTEWINDAVQVGEVPDQYATFSESSITANL
FT                   PFKNENYQLPSERTKDAMGGEENMIKARQENAQAIKEENVDCSYLPRPAICEVGSTYVD
FT                   PITGKEIPKY"
FT   RBS             77418..77422
FT                   /note="possible RBS"
FT   CDS             77433..78419
FT                   /transl_table=11
FT                   /gene="HCM1.102"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.102, hypothetical protein, len: 328 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935N7"
FT                   /protein_id="CAD09702.1"
FT                   /translation="MTTQSSSIQYAYALDGEGTLTHIGAALRSHTYTCPGCKSPLTPVM
FT                   GEFNAKHFRHSEECCALETYLHKCGKEAFFYRYQQALSREMPISLELERRVACNGSHLA
FT                   LVRDEARQCVKSVPARYNLTQFFDQAELEKHDKVTGLRPDVMLYDTTGERRCYVEICVT
FT                   HPCSQDKIEAGIPILEFKVQSASDIQMLLTGAYSIKEKILRVFNWLPPFQSVDTCSGVC
FT                   SVGNVYMSVWSLSGSGRLYEQTMPLAEVDLTINSDVNTWPRSLGAAELADNLRAFIRHA
FT                   DPHSLFPNCIMCEQAGRWEDGYLQCHSKAKIVPYTEARQCANYKVKA"
FT   CDS             78416..80455
FT                   /transl_table=11
FT                   /gene="HCM1.103"
FT                   /product="putative DNA helicase"
FT                   /note="HCM1.103, possible DNA helicase, len: 679 aa;
FT                   similar to several e.g. TR:O24736 (EMBL:AB001291), uvrD,
FT                   Thermus aquaticus DNA helicase (692 aa), fasta scores; E():
FT                   6.5e-21, 28.1% identity in 627 aa overlap. Contains Pfam
FT                   match to entry PF00580 UvrD-helicase, UvrD/REP helicase and
FT                   PS00017 ATP/GTP-binding site motif A (P-loop). Similar to
FT                   HCM1.107, trhI, probable DNA helicase (618 aa), fasta
FT                   scores; E(): 1.1e-08, 23.2% identity in 621 aa overlap"
FT                   /db_xref="GOA:Q935N6"
FT                   /db_xref="HSSP:1PJR"
FT                   /db_xref="InterPro:IPR000212"
FT                   /db_xref="InterPro:IPR014016"
FT                   /db_xref="InterPro:IPR014017"
FT                   /db_xref="UniProtKB/TrEMBL:Q935N6"
FT                   /protein_id="CAD09703.1"
FT                   /translation="MTKRLTWEQKSIVNHDTGHALVKAVPGSGKTTTLVKRVERLVKTG
FT                   TDPRSILILMYNKSAQVSFTEKLKTALMSSVIPEIRTFHSLALKIVGYGERQQIIKKKD
FT                   LITPSDYRYEQLVKQAYRYGFDHEANYIDPNEIENFELFIARCRAAAVTPVDAANDPTF
FT                   SNIKRGFIHAYGRYCELLEENSLRTFDDCLIEAVALLRNDSSLGAHFKHIIVDEYQDVN
FT                   LIQHDMTRLLSKSDTSVMAVGDVNQCIYEWRGARPDFIGGLFERHYPNTKVFQLSCTFR
FT                   FGHELSLMANSVIRRNSTKLTKLCVSHPSTPKTEVRLHFDNCLSKVLSNLSVSSGTQAI
FT                   LSRTKANLAEAEIVLRLCGLPYRYLNGSSALHTRTEIGILVVGVLLSVYGDLRLLENHP
FT                   NKQAIVYGFLKEAGFSWQKGQFKAALSGLMAPHADLWSALGQLFEGAQYQKDRLGRLAT
FT                   ICQKDGEETPAIDVLRRLSMEGFIDSVGSEGVTRTGSNDQQRGVVRIGELLDSSKIDSR
FT                   TFLNLILNPGEAATDCDPFILSTLHGSKGLEWDNVILIGLNEQEFPGGKPDDVYSVRTS
FT                   MNTPPAEEEIEEERRLFYVGITRTKQQLNLVVPLDEGLARWLKNRWDSTPKKSPIATRF
FT                   VYEAGWTACAVTSDAIYNSTVEKQKADFSKFHQWYLRDLQRLKV"
FT   misc_feature    78431..79864
FT                   /note="Pfam match to entry PF00580 UvrD-helicase, UvrD/REP
FT                   helicase, score 19.30, E-value 3.2e-09"
FT   misc_feature    78485..78508
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   CDS             complement(80458..80712)
FT                   /transl_table=11
FT                   /gene="HCM1.104c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.104c, hypothetical protein, len: 84 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935N5"
FT                   /protein_id="CAD09704.1"
FT                   /translation="MLALGVSYPPKSGWIERLIGTEVSDEQYERFLGHSTSKQAEQILR
FT                   GEQPAKGLQYAKRAKKLASERKATIDLDNEHLSEIEKYR"
FT   CDS             complement(81234..82106)
FT                   /transl_table=11
FT                   /gene="HCM1.106c"
FT                   /product="putative lipoprotein"
FT                   /note="HCM1.106c, possible lipoprotein, len: 290 aa;
FT                   identical to TR:AAD54023 (EMBL:AF105019) Salmonella typhi
FT                   hypothetical protein from plasmid R27 (290 aa), fasta
FT                   scores; E(): 0, 100.0% identity in 290 aa overlap. Contains
FT                   a probable N-terminal signal sequence and an appropriately
FT                   positioned PS00013 Prokaryotic membrane lipoprotein lipid
FT                   attachment site"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGV9"
FT                   /protein_id="CAD09705.1"
FT                   /translation="MKNKRFVSLVSALVASASLVGCAGNAGQSPNSAQHSDTHGLYWHA
FT                   NAKDSVAKNAYSLAGFDVSFNEETVQPGGDADNFLSKLLISGSMGYVTGGLSGLSIMSL
FT                   GSLYSSSDAEYIQVNQYVVFVPNPKKLPYNDESLVRAGAAYVYNHTKESQVMLGFNPSK
FT                   QSAALASCKIDRAVINKWSTCELTSKPAPDVMPTNSMYSFQAIRPATGTEIPQLNLPAG
FT                   EYSVIRYVFIPFKGNESSNNFSGIIFRSDSPKFTMPGGAAASINGKDYYLFSGEYGQKG
FT                   FPEKTLKSK"
FT   misc_feature    complement(82041..82073)
FT                   /note="PS00013 Prokaryotic membrane lipoprotein lipid
FT                   attachment site"
FT   CDS             82216..84072
FT                   /transl_table=11
FT                   /gene="trhI"
FT                   /gene_synonym="HCM1.107"
FT                   /product="putative DNA helicase"
FT                   /note="HCM1.107, trhI, probable DNA helicase, len: 618 aa;
FT                   identical to TR:AAD54022 (EMBL:AF105019), trhI, Salmonella
FT                   typhi putative ATP-dependent helicase from plasmid R27 (618
FT                   aa), fasta scores; E(): 0, 100.0% identity in 618 aa
FT                   overlap. Similar to others e.g. TR:O24736 (EMBL:AB001291),
FT                   uvrD, Thermus aquaticus DNA helicase (692 aa), fasta
FT                   scores; E(): 1.1e-13, 25.0% identity in 645 aa overlap.
FT                   Contains Pfam match to entry PF00580 UvrD-helicase,
FT                   UvrD/REP helicase and PS00017 ATP/GTP-binding site motif A
FT                   (P-loop). Similar to HCM1.103, possible DNA helicase (679
FT                   aa), fasta scores; E(): 1.4e-08, 23.2% identity in 621 aa
FT                   overlap"
FT                   /db_xref="GOA:Q9RGW0"
FT                   /db_xref="HSSP:1UAA"
FT                   /db_xref="InterPro:IPR000212"
FT                   /db_xref="InterPro:IPR014016"
FT                   /db_xref="InterPro:IPR014017"
FT                   /db_xref="UniProtKB/TrEMBL:Q9RGW0"
FT                   /protein_id="CAD09706.1"
FT                   /translation="MSLVKKNPSNLNRIIKGTKYSEAFMGKPTDEQRVIIENANANNMV
FT                   IAAPGSGKSFTMIEAVISILRQFPYAKVGMVTFTRAATNSLAEKLKRRLSKKDQDRVLV
FT                   NTFHGFIRMQLDMVNWKGKMLISSAQRSVIHRALKESGAPFRYPDAEFAIDAIGREMDT
FT                   DIISVRHTRQQIHLFNTYQAICQKDHVADLNALSRFVVGQMYSGKMQPLNLTHLVVDEV
FT                   QDTDSIQYAWISLHTRAGVNTSIVGDDDQAIYSFRASGGVKIFQQFEKQFRPNIFYLNT
FT                   CFRCEPEILKVAGALIEKNVYRYAKDLRSAKGGGGKVHFRSYVDMDEQIQGILNLINQD
FT                   PIGWAILSRGNAHLDQLESLIEQPVLRYGGKSFWDEKETSDVLHLMAFFRHSNDVRLMK
FT                   RVLALFGENEEVLDQTALSMKGRKVTFGELNIPNESSLETRTLHSNFTRFTQETREKVE
FT                   IEKRFANLIKWMELSSIKMRTQKGSPSLSRIALDTCKQWAEKTGWQNMINRAAAMCLGP
FT                   KKKDEEYTPDKVVLSTLHGSKGLEWKNVIIMSCNADQIPSKRSVGQEAIEEERRLLFVG
FT                   FTRAEQQLHVMWYGDPSFFLSECAEDKLKEAAKSRTESPLTE"
FT   misc_feature    82300..83610
FT                   /note="Pfam match to entry PF00580 UvrD-helicase, UvrD/REP
FT                   helicase, score -7.10, E-value 2.9e-08"
FT   misc_feature    82354..82377
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   CDS             84470..85345
FT                   /transl_table=11
FT                   /gene="HCM1.108"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.108, possible membrane protein, len: 291 aa;
FT                   unknown function, Contains hydrophobic, possible
FT                   membrane-spanning region near C-terminus"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5V4"
FT                   /protein_id="CAD09707.1"
FT                   /translation="MSKSKARSKALLIAFADLIPDMDKVVNKKLLDSLNVYSGHDNDLI
FT                   VIMNEDGPTIIELNSLKSVSMLAQKLSAFSTYYHVEMQQILVNPIDFEKAYTLLKEAPA
FT                   IPMFKTLADLDKFLNEEFEKYGLNTFLDVDNLDYSLAKSRELKNDQLVAWVSEIIEKRE
FT                   KLALRNRFNEVTKAHYETVDAMYAAVRPLMKELGFPDELMLHTFSELSVFDSKGWDYAI
FT                   KSKIEFLTKREEQCLDYQMKADKRQATVDELLAQINNAKTVKAPRSFGQLFGFSVIAMM
FT                   TFMFIVNKFI"
FT   RBS             85392..85396
FT                   /note="possible RBS"
FT   CDS             85404..85781
FT                   /transl_table=11
FT                   /gene="HCM1.109"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.109, hypothetical protein, len: 125 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5V5"
FT                   /protein_id="CAD09708.1"
FT                   /translation="MSYLEYVNEVKVSGIVISAMEKEMTSGNVGLLIKLKNRMKTEING
FT                   EITEREFSIQIKVSPEMYSGCFTGINQGDELMVSGYLVVDTITLEGREHPLDYMRVVAT
FT                   SKLAHIPKPPKGFGQSSFRQI"
FT   RBS             85832..85836
FT                   /note="possible RBS"
FT   CDS             85842..86828
FT                   /transl_table=11
FT                   /gene="HCM1.110"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.110, hypothetical protein, len: 328 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5D8"
FT                   /protein_id="CAD09709.1"
FT                   /translation="MKQKIRPTAFCSKQMDFFSIFDFEEEEKEIITIVESPLDYINDAI
FT                   AAQQSIQSEDKHSGPELEPSVSEDVALPGNCPKLLKNQILHDISFAAETDYLFTLEEYS
FT                   AELGGLVFDWAPEDVYQLYVVAMEESLENVRHLVITKSLYSTDEFGNITVNPLLEAETR
FT                   WYMSKSFELTCATHGIDAIEFRSELKKSLYEYTHSYGGENAELARYHQDKEVILHDCKE
FT                   EMGWDIFFEQDYLLQENKLAMKWTDRDIMDVYSKVFKSTINLFEKLVVNNKLTLRDTFG
FT                   WVIVNPTFERQFEWIESEVFEIVGTHLGYNVAAIRTQMATACRMTFH"
FT   RBS             86876..86879
FT                   /note="possible RBS"
FT   CDS             86888..87940
FT                   /transl_table=11
FT                   /gene="HCM1.111"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.111, hypothetical protein, len: 350 aa; shows
FT                   weak similarity SW:COBS_PSEDE (EMBL:M62869), cobS,
FT                   Pseudomonas denitrificans cobalamin biosynthesis protein
FT                   (332 aa), fasta scores; E(): 8.4e-06, 21.4% identity in 308
FT                   aa overlap and its homologues. Contains PS00017
FT                   ATP/GTP-binding site motif A (P-loop)"
FT                   /db_xref="GOA:Q935N4"
FT                   /db_xref="InterPro:IPR003593"
FT                   /db_xref="InterPro:IPR011704"
FT                   /db_xref="UniProtKB/TrEMBL:Q935N4"
FT                   /protein_id="CAD09710.1"
FT                   /translation="MTNAATVLKSDNSVQEEIIGNLLPANVISSKMFANKEQYYLVKAK
FT                   DLFGIPEMDEDMIVPVFKKFSPYRANLNKDYIPNSRILEQVVKLLVSNDIDLSVCLKGE
FT                   SGSGKTEMAMYISHMLNWPLTIKQINSNIRADELEGERSLINGNTSFVPSELVTAFQEG
FT                   HLILLDEVDKIDPDTAAKLHMPIERKPWSLAANGGEVVKANKFTRFMGTSNTNMSGGSR
FT                   KFVSSQRQDAAFIKRFLIVEMERPSEVALTNVLLKRYNNLPMLVIEKFVSVAVAVNNTG
FT                   TDDSVMDIRQLVAWVGTSMTLKTMSLLDTFKIAFASALPAHATGMVLEAIDLILGDDKN
FT                   RTMEYYTAKK"
FT   misc_feature    87194..87217
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   CDS             87979..88248
FT                   /transl_table=11
FT                   /gene="HCM1.112"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.112, hypothetical protein, len: 89 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5E0"
FT                   /protein_id="CAD09711.1"
FT                   /translation="MTDFAHLTFYGFLSANGTETFVIAQDGNQYIGLKQHNNDYSFICY
FT                   EVCNKDMEAMIKGLESKGFMYQGSIQSADVENEFPGILLTTLEK"
FT   RBS             88308..88311
FT                   /note="possible RBS"
FT   CDS             88319..89446
FT                   /transl_table=11
FT                   /gene="HCM1.114"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.114, hypothetical protein, len: 375 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5E1"
FT                   /protein_id="CAD09712.1"
FT                   /translation="MTFNTSKLNKVSAKEISENFIKAYPDLQEGAVITKIEISGCQGSR
FT                   RTDKIELSYGGDDITDQKSVSKSEVRWIDIKALSFKSTITSRISTLCSRLCIRYSNMWI
FT                   LPVERMEEFLEEAQEIEREFQAGIQNVVDNYDTHIQAEKDRSPLMSDLIDQLKLTKDDF
FT                   VKSFRFNLAHFIPFSPISVEGDETQDFYQEQLITDLADEAMKVYTKISKNDNLRSSTID
FT                   RLKQMQDKIISFMFIHKEAVVLAEAIKHIMNNLPKGAISSPRDVAVLKQWFYFMSDASM
FT                   LKRIISGEQKVTDWLDSITRSFNIDSQVTAANSLNTAEDDVFSSANVFREDPVEDLENK
FT                   AVNAPEPAVGPDEDVSIQASGSNRAFDCELELTGW"
FT   CDS             89524..91536
FT                   /transl_table=11
FT                   /gene="HCM1.116"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.116, hypothetical protein, len: 670 aa; unknown
FT                   function"
FT                   /db_xref="InterPro:IPR002035"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5E2"
FT                   /protein_id="CAD09713.1"
FT                   /translation="MKFDLKSSPRHIQRLTNIASVISGINGIYVIIDNKVSTPYFNTQN
FT                   NVCVLPNGDYSDERFVKLIEGFICHEAGHGRYTEHEVYREAFVGELINADGFISIDDDL
FT                   KADFQNLKQKQKAYARACRLKGLINLFDDVQMEEKTGIDYQEAKKRLAVTYALMVEAGR
FT                   MTVDISSTPQNPVQFIEMYLLNTLRVNVLQQEGHKETLDPFFDYAKKILAPVTSEVDEI
FT                   IHQALSCKSTQNCDSLARKTLALLERLRDEAKEKQQEEEQSKDPHDDTDESSGSENEPD
FT                   TEPNGDSQGEGDGDKEGQGDDSGDGKAPAEGNGLPDQSGGDEQNAENSNGEPDGESEGD
FT                   ESATPGSDDADSTPSLNDSSNGNSSDGESNFSPEQWDMLAKLLDDFLNSDEESEDFHEV
FT                   LAKEISVIAASVSDEVKAEFGASEWDVPDLNIDLNVYNEALNISQTLGADLSVLQQVKM
FT                   RGQFKTRDRGLSFDINRLIQSPMGVRDVFRSQSESKNRGHVGLVIVRDISGSMSLEHRY
FT                   IHAIKTDLALTLAIEAISKMHVANVIYPFVDKDFEVIKTFDENAEEKLSKFSLGCKGNN
FT                   TPTGSALNAALELLLESQFDRKIVFLITDGYPTESAYTINDVFSVAESNGIEIAGVGIK
FT                   TDVLMGFNEGTFVNVDDISLLPNEVSKLVHQILSN"
FT   RBS             91595..91601
FT                   /note="possible RBS"
FT   CDS             91608..91829
FT                   /transl_table=11
FT                   /gene="HCM1.116a"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.116a, hypothetical protein, len: 73 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5E3"
FT                   /protein_id="CAD09714.1"
FT                   /translation="MTQIKTYRVEYEKVGTMHRVRIFGRMGEIVKSELPEERILRDVSI
FT                   PEGNGEMATSMVDGFIQRLENIGFKTEA"
FT   CDS             91923..93176
FT                   /transl_table=11
FT                   /gene="HCM1.117"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.117, hypothetical protein, len: 417 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935N3"
FT                   /protein_id="CAD09715.1"
FT                   /translation="MPDKREQMTYASQAVKRTPHEVTDHFIKMVHARIAEVSGWRYVFD
FT                   RIPAFKDACDKAPGQVPCPFSGVGKSKFRFRKKDLFTGCAIHNDFPVNAFCDGIDVLAE
FT                   YYKLSKTQTCKKILTDFFGMDLYAPLTDADLESERRYKSTVRATETLDSDEVEKRGRKL
FT                   EVIYHYTGEIKPESPVWVYLRNRGLNRVLSNLPKDLGLNKRLYYMDKSLEKPTIYPGMI
FT                   AIYRDTRGRPLTIHRTFVELNGDKAHVENPKLMMKPPADMTGGSIQLYDPHFNPGTRTW
FT                   TLGVAEGIENALSVTEATSTPCWAASSAWCLENVEVPDSLLPPPGVKVIQFYIWADKDL
FT                   VNTKGTSPGMESAKRLQERMKEFFAKRYPTSELTIKVFEPDFDIPVGKKGVDWNDVLKL
FT                   TGPDGFPVKWAPECLAQL"
FT   RBS             93438..93441
FT                   /note="possible RBS"
FT   CDS             93451..93975
FT                   /transl_table=11
FT                   /gene="HCM1.118"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.118, hypothetical protein, len: 174 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5E5"
FT                   /protein_id="CAD09716.1"
FT                   /translation="MNIENQDLFNTFAAVISSHIVEQPSSCYYLHDNEIDFTILKHSII
FT                   DKDKNLLYVIRPSGTCLLRCDKYFFPNYYLTSRGDYKAFKYVHFNLATREAEEITWQQA
FT                   FEILSKPGRPPLRGSLGKFDYLKLVIDDLRARGYADFLPAYNLDGLRHFAVKDERPSLV
FT                   SYIDNVMALCA"
FT   CDS             93966..94931
FT                   /transl_table=11
FT                   /gene="HCM1.119"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.119, hypothetical protein, len: 321 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935N2"
FT                   /protein_id="CAD09717.1"
FT                   /translation="MRIKITHIFTTSLMAPPIGVALRVESGGLMKLATDLVNAVLIKNG
FT                   IVPTSINELPVTSLVKPLTQVHLSLYLKTTHLSQFVPDYVESLKDCPVSYDIGLELQQC
FT                   INSAELLCEDMESLEFISVWIELYTCNSKQQRFEKSNFSFRTEDIELAKMLSCSHEILI
FT                   SQAACFWLLYFEDFMKYVRNRLCALLRQVLILIAGLRNVYLQRNEDQLIKRVKHGNEML
FT                   EVTLKAVALCSIERYLKSYASLRTEAAASGFIKCIQSYISTGWRHGYIVCQYSKNGRSL
FT                   GKSLPLFIKETSEHNIQKRVNRLISSTISGRNKDLGLYDF"
FT   RBS             94993..94996
FT                   /note="possible RBS"
FT   CDS             95002..95937
FT                   /transl_table=11
FT                   /gene="HCM1.120"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.120, hypothetical protein, len: 311 aa; unknown
FT                   function. Similar to HCM1.121, hypothetical protein (306
FT                   aa), fasta scores; E(): 2.8e-07, 22.4% identity in 254 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5E7"
FT                   /protein_id="CAD09718.1"
FT                   /translation="MKIIEKIINAFLISRKHSVKVSNVICLSGTDGKFTGICCDADVSF
FT                   DFLYSYAPAYSSTFLDIPFPGFEDQDIADCVKCQLDVVKNKRNRSFLIDHIRFPVSSRE
FT                   GFTLTRGDSYDVTECEYNKERLLHLTRQGRFCEDYLTFKDGLSSFFSFVNFELHEIVKE
FT                   GIRLALDVLNKITSDQPDRLIKDFKYHDCFGSYNVQIFSKGLPVDILETMIAPDRLLSN
FT                   LSGSRQIMKNASRYLKGFALSNRVYMKYGWRLADVDTSDYAKVMSDREMHARDDLKAFC
FT                   SVFFKECFASGKYEYEAYLSERQHAIRNGY"
FT   RBS             96003..96006
FT                   /note="possible RBS"
FT   CDS             96015..96935
FT                   /transl_table=11
FT                   /gene="HCM1.121"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.121, hypothetical protein, len: 306 aa; unknown
FT                   function. Similar to HCM1.120, hypothetical protein (311
FT                   aa), fasta scores; E(): 7.1e-06, 22.4% identity in 254 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5E8"
FT                   /protein_id="CAD09719.1"
FT                   /translation="MKAIYKIIEAMLVKMGFEGAVIQSVNLETGVIQSLVVKADIPVRT
FT                   LMPHLRRYLRDCEPLWGHDVDYHPIAQYCSGAALLKAGPVTLETFRFEVSVSTAHLRLV
FT                   DVEPDCLNEGVNREKLEYVYYRSSNADKDLILGMVEKGHNFINHLHELLRSRLSTALPL
FT                   IFAVTEKIAESSVPQVVTSFFSVDHQINAQIVVEPVPVSVADQIISADWNVCSVSGADK
FT                   FLNHVNRYLSGRVMKRRIYAVIEACDGGSLSLNANLGCFTSPLLVTEYKMVQSHSSSLY
FT                   RKAINNSLKQVNSYAPEHSDDLLSM"
FT   RBS             96996..96999
FT                   /note="possible RBS"
FT   CDS             97008..97943
FT                   /transl_table=11
FT                   /gene="HCM1.122"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.122, hypothetical protein, len: 311 aa; unknown
FT                   function. Similar to HCM1.123, hypothetical protein (318
FT                   aa), fasta scores; E(): 4.3e-28, 27.6% identity in 312 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q935N1"
FT                   /protein_id="CAD09720.1"
FT                   /translation="MFNESDDKNFVSAMLKCQLGLNISQEDITIYDKENHFEQLSFKAN
FT                   VALDDLLFYLDLYISELIKHNAPYSETEVLRTKIKYFLKVYEKSGFQNIRIRGYHNAHS
FT                   TIDIVDIASLILAGSVPESEHDSIDPVLRKEIYQNRMSVEGKVLIARFALKQFFHSDFG
FT                   DFILEFEKSISKCLNTSLQIIKSVKNSFNRLGQYQYQRRVKDDLTLHLDLNTDEYPACM
FT                   PDLYIGFKESEGTTGVYRDDEKIIRLYTGVSSGKDVPVMMTVRFTGCDGSVLSESSHGT
FT                   FCSVGPTGRVQVCDRVALVQEAVEELRDVV"
FT   RBS             98108..98111
FT                   /note="possible RBS"
FT   CDS             98120..99076
FT                   /transl_table=11
FT                   /gene="HCM1.123"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.123, hypothetical protein, len: 318 aa; unknown
FT                   function. Similar to HCM1.122, hypothetical protein (311
FT                   aa), fasta scores; E(): 2.7e-30, 27.6% identity in 312 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q935N0"
FT                   /protein_id="CAD09721.1"
FT                   /translation="MTNSTDNQNYVRAVLAGIGIDFDETEMFISVSHCQSDEVSFTCSI
FT                   SASELRESAGHYVDTLNDTQLAGLDADALKKRLVYFLEVFDLVSGQYLDISGKHFATSR
FT                   FEYDDVCSEILSNSADSAQPGGYDREEYKRLMEVDGQVLIARFALEKFWDTHFIGLINY
FT                   VSDEITSGLYEVYRTFSDINMAGYTFSEYSYTRRITDELSLHISLKEDDFEEQLTDCYM
FT                   DETTLPSGKVVLRRNNESIIGIYEGYASKSYFPMVANVRVLDTDGEVVTELYQGVNVSE
FT                   LAGGRIKIHDRQELISEVFANLREFIPASEDKIFDAA"
FT   RBS             99478..99483
FT                   /note="possible RBS"
FT   CDS             99489..99758
FT                   /transl_table=11
FT                   /gene="HCM1.124"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.124, hypothetical protein, len: 89 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5F2"
FT                   /protein_id="CAD09722.1"
FT                   /translation="MPATTILSNNPVNSVFSNDNSHFTYRHIDFSIELLLSSGTDSQLE
FT                   YLFLKPAAEVKIDLQRRLASGERYVTTESCDNFSEVDGCMGHDC"
FT   CDS             99813..100403
FT                   /transl_table=11
FT                   /gene="HCM1.125"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.125, possible membrane protein, len: 196 aa;
FT                   unknown function, contains hydrophobic, possible
FT                   membrane-spanning regions"
FT                   /db_xref="UniProtKB/TrEMBL:Q935M9"
FT                   /protein_id="CAD09723.1"
FT                   /translation="MMTESFFDWVVYCITGVILASAFLEGKRTRFPAAFFYGSIVLLVV
FT                   LIVAGALNWWFYRSKFGSVVVIFAATTLLMTRFRLVIYAFRFRTLVADLQSHVAKGFRI
FT                   ILVLPENEDEKTVLLSKLSKVIHSGTLFYTRTALGPYSGDLLHALGQKHRNGEGYLLLC
FT                   EQQLPARTWLSTVENGQPEKSIAVNFHSIPDME"
FT   RBS             100397..100400
FT                   /note="possible RBS"
FT   CDS             100411..100668
FT                   /transl_table=11
FT                   /gene="HCM1.126"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.126, hypothetical protein, len: 85 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5F4"
FT                   /protein_id="CAD09724.1"
FT                   /translation="MSNTDSQTVPADALCENSSQVKIQLSRSASRALTTAKEILETRGL
FT                   VSVSTEDLVQACLEENQPLDLASIYLEHRLKQKGTSICEF"
FT   CDS             100742..101278
FT                   /transl_table=11
FT                   /gene="HCM1.127"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.127, hypothetical protein, len: 178 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5F5"
FT                   /protein_id="CAD09725.1"
FT                   /translation="MKSKIHSSGTSGTKRVLKTDIALPLLCWVFTSPFSNWTDKFFTGT
FT                   EVPEGSLPGLEQAPEAIFRFVLNDEGFDVGFDAVGMDLCCFSIPLSTMPTKNLDDEETL
FT                   SRLTGDVIHGVLLSLPEYIEMPDRLVYQLTDEVMAFNSHCGNGILHGWTTAQELWRNEI
FT                   LPRTTILMQQTSVIH"
FT   CDS             101295..101750
FT                   /transl_table=11
FT                   /gene="HCM1.128"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.128, possible membrane protein, len: 151 aa;
FT                   unknown function, contains hydrophobic, possible
FT                   membrane-spanning regions"
FT                   /db_xref="UniProtKB/TrEMBL:Q935M8"
FT                   /protein_id="CAD09726.1"
FT                   /translation="MKKRLYLLEWKLRETRAWLGWMVFWIIISFMFLSAMFMTGHLLNK
FT                   VVLQPVWLCIWSLPWLGFLLKVRVTEMDKGLVNTLQLGDLPVFRWSRSVVPGTWSVDRI
FT                   NGRYRLNRIGTDGLTVHYPWRLYYQPLFLTPDKQISDINGREHERKF"
FT   CDS             101965..102243
FT                   /transl_table=11
FT                   /gene="HCM1.130"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.130, hypothetical protein, len: 92 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935M7"
FT                   /protein_id="CAD09727.1"
FT                   /translation="MMHLLVEGKGVIPDVSVSDLGNVQNIRNELIGLGWWVKFGVKQDW
FT                   QRINLQRQPVSFGLLNDLNRCFRHDGQQVEPLPLYTTGNPGELRKVL"
FT   RBS             102322..102325
FT                   /note="possible RBS"
FT   CDS             102332..103291
FT                   /transl_table=11
FT                   /gene="HCM1.131"
FT                   /product="putative DNA replication terminus site-binding
FT                   protein"
FT                   /note="HCM1.131, possible DNA replication terminus
FT                   site-binding protein, len: 319 aa; shows weak similarity to
FT                   TUS proteins from the Enterobacteriaceae e.g. SW:TUS_ECOLI
FT                   (EMBL:D90037), tus, Escherichia coli DNA replication
FT                   terminus site-binding protein (309 aa), fasta scores; E():
FT                   0.01, 25.5% identity in 208 aa overlap and SW:TUS_SALTY
FT                   (EMBL:AF045242), tus, Salmonella typhimurium DNA
FT                   replication terminus site-binding protein (309 aa), fasta
FT                   scores; E(): 0.012, 25.6% identity in 203 aa overlap"
FT                   /db_xref="GOA:Q9L5F9"
FT                   /db_xref="InterPro:IPR008865"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5F9"
FT                   /protein_id="CAD09728.1"
FT                   /translation="MASEDLLFYRDRILERIEKLRSFLNDHQPVMAELMTVGTVTRHEE
FT                   RLKEVNPIEVSTISDASVDEIIRVIQDFCIDDIDVLSRNSTKVTTKYPGLIIVPEGAEQ
FT                   LSGIICDINDAKSDFASAMKRVNSEKHIRFKEVHRKLPGLVTAHSTRKILFVEEQLKKV
FT                   TFAWRLNRNQVKTNASDLIAMLDKRRLVAVKSPVTTDLTVVANIDRAKALLERKVLRDG
FT                   EGYRLCRTNTFPVPIAHLFTYRPEGKERGSSKYAETDYKVVKASLPIFGVGQKPTIKRL
FT                   QDWVPAQDEALSNGRRSNHSYTELVPGADLGIFIMRKV"
FT   RBS             103291..103295
FT                   /note="possible RBS"
FT   CDS             103302..104210
FT                   /transl_table=11
FT                   /gene="HCM1.132"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.132, hypothetical protein, len: 302 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5G0"
FT                   /protein_id="CAD09729.1"
FT                   /translation="MQWISTTSQKLDERLYRVCVWVKKYHEDAINRVVLTVDLSKARHD
FT                   PIEDQVRAELLCGHYFLMRKENNAKSAPADQNFEFLPDGRNLSWQTSTPGLQHLLLNSN
FT                   VPESLRPLADYIQMRLAKLTMVPMSGTIMKAALEDSISWVKVDLRYYWQYELVNSHLGP
FT                   VQVTHKALVRFGRLAKHDENASAIRMLRQRLSSPFIQEFEMPGEELKRKQKIMNTVDVK
FT                   MLFHTHYPGQKLLLARYANGWVLVDCFLFHHIKPKKKAKNKTKAGKSETQNIKSTGSED
FT                   HGTGHYGVHRVVTLTGSGVDQ"
FT   RBS             104139..104142
FT                   /note="possible RBS"
FT   CDS             104146..104490
FT                   /transl_table=11
FT                   /gene="HCM1.133"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.133, possible membrane protein, len: 114 aa;
FT                   unknown function, contains hydrophobic, possible
FT                   membrane-spanning regions"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5G1"
FT                   /protein_id="CAD09730.1"
FT                   /translation="MELGIMVCIVLLLSLAAVWISNKTVGLLEIHYFKRPLSMEYAAWL
FT                   RVMCAGLLFIFIQMVPAFTFLYTLKLVALLNLGVQTMKLNGVYKFKRTGMMPPKDAPHD
FT                   LGRFNPFRKK"
FT   CDS             complement(104515..105696)
FT                   /transl_table=11
FT                   /gene="HCM1.134c"
FT                   /product="putative recombinase"
FT                   /note="HCM1.134c, possible recombinase, len: 393 aa; shows
FT                   weak similarity to SW:RECR_BPP1 (EMBL:X03453), cre,
FT                   bacteriophage P1 recombinase (343 aa), fasta scores; E():
FT                   2.7e-05, 25.9% identity in 352 aa overlap. The 4 active
FT                   site residues identified in cre appear to be conserved.
FT                   Contains Pfam match to entry PF00589 Phage_integrase,
FT                   'Phage' integrase family"
FT                   /db_xref="GOA:Q9L5G2"
FT                   /db_xref="HSSP:2CRX"
FT                   /db_xref="InterPro:IPR002104"
FT                   /db_xref="InterPro:IPR010998"
FT                   /db_xref="InterPro:IPR011010"
FT                   /db_xref="InterPro:IPR013762"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5G2"
FT                   /protein_id="CAD09731.1"
FT                   /translation="MNSKPVTRQFEDSDLHQELVTFEVPNNDLKELIFYFSHMKYNTAK
FT                   TYLQWLRSWNEWYQANAGKEGNEAWPASSLPVTEPPLLAYLDYLQGSLSHSSIKGCLHA
FT                   LNSIHRKALDRPGIITSKVKSILASLEQAEAREQKVTRQATPFLVSDLKALIKAHGTTQ
FT                   SVRKLRDLCIIWTGFETLLRSAELRRIRMQDLVLNEQTGSFTLTVYRTKSTVSTLLTYH
FT                   LTPHLTATLIRLMDMVKRDQQSHPKDYLFQAVNYQDSGYMPPGWGLRSKGNEINTLLKN
FT                   HNMPYRPTRPPIGKNGKPIIVDDEGMLSKNTLLRAFEAFWDELHPQEAGTRCWTGHSVR
FT                   VGGAIELANAGYTHLQIMEMGNWSNPEMVSRYIRNIDAGKKAMTKFMREALDE"
FT   misc_feature    complement(104551..105276)
FT                   /note="Pfam match to entry PF00589 Phage_integrase, 'Phage'
FT                   integrase family, score 9.80, E-value 3.7e-05"
FT   CDS             105911..106123
FT                   /transl_table=11
FT                   /gene="HCM1.135"
FT                   /product="putative regulatory protein"
FT                   /note="HCM1.135, probable regulatory protein, len: 70 aa;
FT                   similar to Hha/YmoA class of bacterial regulators e.g.
FT                   SW:HHA_ECOLI (EMBL:X57977), hha, Escherichia coli
FT                   haemolysin expression modulating protein (72 aa), fasta
FT                   scores; E(): 2.6e-10, 48.6% identity in 72 aa overlap and
FT                   SW:YMOA_YEREN (EMBL:X58058), ymoA, Yersinia enterocolitica
FT                   gene modulating the expression of virulence functions (67
FT                   aa), fasta scores; E(): 1e-09, 50.7% identity in 67 aa
FT                   overlap. Plasmid-borne homologue exists in Escherichia coli
FT                   plasmid pO157 TR:Q9ZGV7 (EMBL:AF074613), L7004, Escherichia
FT                   coli putative hemolysin expression modulating protein (69
FT                   aa), fasta scores; E(): 2.3e-08, 40.6% identity in 69 aa
FT                   overlap and plasmid R100 TR:O32581 (EMBL:Y13856), rmoA,
FT                   Escherichia coli RmoA protein (69 aa), fasta scores; E():
FT                   2.7e-08, 40.6% identity in 69 aa overlap"
FT                   /db_xref="HSSP:1JW2"
FT                   /db_xref="InterPro:IPR007985"
FT                   /db_xref="UniProtKB/TrEMBL:Q935M6"
FT                   /protein_id="CAD09732.1"
FT                   /translation="MSETKQAYLMKFRKCSSFDTLEKVFERLCEKNAGIASLEISGAYD
FT                   HRKAELTMKKLYDKVPASVWTLVRQ"
FT   repeat_region   106385..106397
FT                   /note="13 bp inverted repeat flanking IS1"
FT   repeat_region   106385..107132
FT                   /note="IS1"
FT   CDS             106430..106705
FT                   /transl_table=11
FT                   /gene="insA"
FT                   /gene_synonym="HCM1.136"
FT                   /product="putative IS1 transposase"
FT                   /note="HCM1.136, insA, probable IS1 transposase, highly
FT                   similar to many e.g. SW:ISA1_ECOLI (EMBL:X52534), insA,
FT                   Escherichia coli insertion element IS1 protein InsA (91
FT                   aa), fasta scores; E(): 0, 96.7% identity in 91 aa overlap.
FT                   Contains PS00017 ATP/GTP-binding site motif A (P-loop).
FT                   Contains a probable helix-turn-helix motif at aa 64-85
FT                   (Score 1364, +3.83 SD)"
FT                   /db_xref="GOA:Q935M5"
FT                   /db_xref="InterPro:IPR003220"
FT                   /db_xref="UniProtKB/TrEMBL:Q935M5"
FT                   /protein_id="CAD09733.1"
FT                   /translation="MASVSISRPSCSATDGVVRNGKSTAGHQRYLCSHCRKTWQLQFTY
FT                   TASQPGTHQKIIDMAINGVGCRATARIMGVGLNTILRHLKNSGRSR"
FT   misc_feature    106475..106498
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   CDS             106624..107127
FT                   /transl_table=11
FT                   /gene="insB"
FT                   /gene_synonym="HCM1.136a"
FT                   /product="putative IS1 transposase"
FT                   /note="HCM1.136a, insB, possible IS1 transposase, len: 167
FT                   aa; highly similar to many from Enterobacteriaceae e.g.
FT                   SW:ISB_ECOLI (EMBL:D10483), insB, Escherichia coli
FT                   insertion element IS1 protein InsB (167 aa), fasta scores;
FT                   E(): 0, 98.8% identity in 167 aa overlap"
FT                   /db_xref="GOA:Q935M4"
FT                   /db_xref="InterPro:IPR005063"
FT                   /db_xref="UniProtKB/TrEMBL:Q935M4"
FT                   /protein_id="CAD09734.1"
FT                   /translation="MPGNCPHYGRWPQHDFTSLKKLRPQSVTSRIQPGSDVIVCAEMDE
FT                   QWGYVGAKSRQRWLFYAYDRLRKTVVAHVFGERTMATLGRLMSLLSPFDVVIWMTDGWP
FT                   LYESRLKGKLHVISKRYTQRIERHNLNLRQHLARLGRKSLSFSKSVELHDKVIGHYLNI
FT                   KHYQ"
FT   misc_feature    106681..106686
FT                   /note="possible translational frameshift site, similar to
FT                   that determined experimentally (EMBL:X52534)"
FT   repeat_region   complement(107120..107132)
FT                   /note="13 bp inverted repeat flanking IS1"
FT   misc_feature    107404..107616
FT                   /note="86% identity to F-plasmid origin of replication in
FT                   EMBL:J01724"
FT   repeat_region   107518..107537
FT                   /note="similar to incB repeats; 86% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   107539..107558
FT                   /note="similar to incB repeats; 98% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   107572..107591
FT                   /note="similar to incB repeats; 91% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   107594..107613
FT                   /note="similar to incB repeats; 93% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   CDS             107709..108464
FT                   /transl_table=11
FT                   /gene="rep"
FT                   /gene_synonym="HCM1.137"
FT                   /product="putative replication initiation protein"
FT                   /note="HCM1.137, rep, probable replication initiation
FT                   protein, len: 251 aa; similar to many e.g. SW:REPE_ECOLI
FT                   (EMBL:J01724), rep, Escherichia coli rep protein from the F
FT                   plasmid (251 aa), fasta scores; E(): 0, 94.8% identity in
FT                   249 aa overlap. Contains Pfam match to entry PF01051
FT                   RepB_protein, Initiator RepB protein"
FT                   /db_xref="GOA:P62539"
FT                   /db_xref="InterPro:IPR000525"
FT                   /db_xref="InterPro:IPR011991"
FT                   /db_xref="UniProtKB/Swiss-Prot:P62539"
FT                   /protein_id="CAD09735.1"
FT                   /translation="MAEIAVINHKKRKNSPRIVQSNELTEAAYSLSRDQKRLLYLFVHQ
FT                   IRKSDGSLQEHDGICEIHVAKYAETFGLTSAEASKDIRQALKGFAGKEVVFYRPEEDAG
FT                   DEKGYESFPWFIKRAHSPSRGLYSVHINPYLIPFFIGLQNRFTQFRLSETKEITNPYAM
FT                   RLYESLCQYRKPDGSGVVSLKIDWIMERYQLPQSYQRMPDFRRRFLKASVDEINSRTPM
FT                   RLSYIEKKKGRQTTHIVFSFRDITSMTIE"
FT   misc_feature    108300..108428
FT                   /note="Pfam match to entry PF01051 RepB_protein, Initiator
FT                   RepB protein, score 21.30, E-value 2.5e-05"
FT   repeat_region   complement(108465..108484)
FT                   /note="similar to incB repeats; 90% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   complement(108487..108506)
FT                   /note="similar to incB repeats; 94% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   complement(108520..108539)
FT                   /note="similar to incB repeats; 90% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   complement(108542..108561)
FT                   /note="similar to incB repeats; 94% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   complement(108575..108594)
FT                   /note="similar to incB repeats; 100% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   complement(108597..108616)
FT                   /note="similar to incB repeats; 94% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   complement(108630..108649)
FT                   /note="similar to incB repeats; 100% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   complement(108722..108741)
FT                   /note="similar to incB repeats; 86% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   complement(108746..108765)
FT                   /note="similar to incB repeats; 93% identity to consensus
FT                   CTGTGACAAATCACCCTCAA"
FT   repeat_region   108797..108809
FT                   /note="13 bp inverted repeat flanking IS1"
FT   misc_feature    108797..109544
FT                   /note="IS1"
FT   CDS             108842..109117
FT                   /transl_table=11
FT                   /gene="insA"
FT                   /gene_synonym="HCM1.138"
FT                   /product="putative IS1 transposase"
FT                   /note="HCM1.138, insA, probable IS1 transposase, len: 91
FT                   aa; highly similar to many e.g. SW:ISA1_ECOLI
FT                   (EMBL:X52534), insA, Escherichia coli insertion element IS1
FT                   protein InsA (91 aa), fasta scores; E(): 0, 97.8% identity
FT                   in 91 aa overlap. Contains PS00017 ATP/GTP-binding site
FT                   motif A (P-loop). Contains a probable helix-turn-helix
FT                   motif at aa 64-85 (Score 1462, +4.17 SD)"
FT                   /db_xref="GOA:Q7AQV4"
FT                   /db_xref="InterPro:IPR003220"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQV4"
FT                   /protein_id="CAD09736.1"
FT                   /translation="MASVSISCPSCSATDGVVRNGKSTAGHQRYLCSHCRKTWQLQFTY
FT                   TASQPGTHQKIIDMAMNGVGCRATARIMGVGLNTIFRHLKNSGRSR"
FT   misc_feature    108887..108910
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   CDS             109036..109539
FT                   /transl_table=11
FT                   /gene="insB"
FT                   /gene_synonym="HCM1.136a"
FT                   /product="putative IS1 transposase"
FT                   /note="HCM1.139, insB, possible IS1 transposase, len: 167
FT                   aa; highly similar to many from Enterobacteriaceae e.g.
FT                   SW:ISB_ECOLI (EMBL:D10483), insB, Escherichia coli
FT                   insertion element IS1 protein InsB (167 aa), fasta scores;
FT                   E(): 0, 89.8% identity in 167 aa overlap"
FT                   /db_xref="GOA:Q935M3"
FT                   /db_xref="InterPro:IPR005063"
FT                   /db_xref="UniProtKB/TrEMBL:Q935M3"
FT                   /protein_id="CAD09737.1"
FT                   /translation="MPGNRPHYGRWPQHDFPPFKKLRPQSVTSRIQPGSDVIVCAEMDE
FT                   QWGYVGAKSRQLWLFYAYDRIRRTVVAHVFGERTLATLERLPGLLSAFEVVVWMTDDWP
FT                   LYESRLKGKLHVISKRYTQRIERHNLNLRQHLARLGRKSLSFSKSVELHDKVIGHYLTI
FT                   KHYQ"
FT   misc_feature    109093..109098
FT                   /note="possible translational frameshift site, similar to
FT                   that determined experimentally (EMBL:X52534)"
FT   repeat_region   complement(109532..109544)
FT                   /note="13 bp inverted repeat flanking IS1"
FT   CDS             109949..111022
FT                   /transl_table=11
FT                   /gene="HCM1.141"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.141, hypothetical protein, len: 357 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5G8"
FT                   /protein_id="CAD09738.1"
FT                   /translation="MRKSYTYGIPFGLHRETGRFLDITEVSRGSACNCICPGCRTDLIA
FT                   RQGEVKLWHYSHSTDLLGDCDGLMEAIRGKIIEIIQEKQLLGFPHLLAGYDGGTVPLDE
FT                   VSGSGSMFGATADLFVKVNDLCVAVFLDIDRSVAGKLTFDHLHASEMVAALRIDLPDIE
FT                   YEISQVQLGRRDGTYSECIEKIIIDATESREWLYHPMMQELGTEPLKVYEGREPAEAGP
FT                   LLQRLSDCPLKLPDNLPQSMNVLIRMQQATIVCLCRLTVRASDIAQTDEFPLFMRYFRL
FT                   HCLDTSEHVNYEKLLNWQDMITKSKEGQLLTVEERDYLQEIVRIGLYNHRLKSVCLTAC
FT                   EDSRVGESEGPNNYSLL"
FT   CDS             complement(111100..111243)
FT                   /transl_table=11
FT                   /gene="HCM1.141ac"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.141ac, hypothetical protein, len: 47 aa;
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935M2"
FT                   /protein_id="CAD09739.1"
FT                   /translation="MRPLALSEDGLIQDAFTKEEPLGLVLMAVPIYITGLIMIGTLFTC
FT                   KK"
FT   CDS             complement(111279..111767)
FT                   /transl_table=11
FT                   /gene="HCM1.142c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.142c, hypothetical protein, len: 162 aa;
FT                   similar to TR:Q9Z4G2 (EMBL:AB021078), yadA, Escherichia
FT                   coli hypothetical protein from plasmid IncI1 ColIb-P9 (149
FT                   aa), fasta scores; E(): 1.2e-28, 54.9% identity in 142 aa
FT                   overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q935M1"
FT                   /protein_id="CAD09740.1"
FT                   /translation="MVSPMEKTQSPAERFYESIYYSDESLEEDYLAELRNFSSDHWDTA
FT                   LRAARLSAAVKRFKTSEMLRFILEFVVPENAQEDAPDLTPLAAKRLCNSLFGRSGSQSI
FT                   LVYVFGQAGRVHRSATCSPKTIEAIAALYRSDAERYWNSTLATIERVKHTYRAKIRNS"
FT   CDS             111903..112178
FT                   /transl_table=11
FT                   /gene="HCM1.143"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.143, hypothetical protein, len: 91 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935M0"
FT                   /protein_id="CAD09741.1"
FT                   /translation="MSVKCLPLQSGLDEKDQGLFQNGRNTRNVEENVALNNMIAIFKKV
FT                   GVTHYVYSIYHFQIVIKIRLPERQKQKKSIKQKCMVSILPPATLAP"
FT   CDS             112168..112368
FT                   /transl_table=11
FT                   /gene="HCM1.144"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.144, hypothetical protein, len: 66 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935L9"
FT                   /protein_id="CAD09742.1"
FT                   /translation="MRPDNFILGEGALIITYPIRKAGNQNVTRISKMQRFNISVFSVSW
FT                   QQSRSAGTGKLYSTSPGLAGD"
FT   RBS             112424..112429
FT                   /note="possible RBS"
FT   CDS             112435..112827
FT                   /transl_table=11
FT                   /gene="HCM1.145"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.145, hypothetical protein, len: 130 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935L8"
FT                   /protein_id="CAD09743.1"
FT                   /translation="MDDKEQFTSLVAKHASRFTEEQLAGYDACSQYGECVSPSYEVFRG
FT                   YRTRHTLDEFLELAISLNAIHPDEYLTDMLLKPHEVIGALADEGDQLNNATPVYFFPDT
FT                   GVYAAAVSETRVLDAWLCWPCYPANW"
FT   repeat_region   112896..112912
FT                   /note="inverted repeat; 17/17 (100%) matches, 0 gaps"
FT   repeat_region   complement(113131..113147)
FT                   /note="inverted repeat; 17/17 (100%) matches, 0 gaps"
FT   CDS             113240..113443
FT                   /transl_table=11
FT                   /gene="HCM1.146"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.146, hypothetical protein, len: 67 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935L7"
FT                   /protein_id="CAD09744.1"
FT                   /translation="MFSTEKKSEHLGQIIVIDPALLGQGIEVGPVVVFDLGHASKGVAD
FT                   LMRDAEKLDGLSPTTIANRLSR"
FT   RBS             113587..113590
FT                   /note="possible RBS"
FT   CDS             113598..114524
FT                   /transl_table=11
FT                   /gene="HCM1.149"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.149, hypothetical protein, len: 308 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935L6"
FT                   /protein_id="CAD09745.1"
FT                   /translation="MRSEIPSGRFFCLDEFHNFHMSDDVLRERLRSIDGIPAVSYQVNG
FT                   ENVFVFEKLVQLVKQNGHNLESALALVPKATMTAAEAIEAWSVFPEPYSRETNTIDHSQ
FT                   AIYHPYLNAYLPRKYPDRESCNADAARLLLGNPVEGEGDFVYRGQSMVLRQPFTLDRLP
FT                   PRPEWDVPVSEDASAYTHLWNTDFVSGFAPVTESLFNGIKSAEWEWNHAIAATYAYMGN
FT                   PECISSLWSRAGEFGLEQLELKSWDVDEQDPEHYQQFQALYPELSMLSPAIIQKAYDEY
FT                   CESMWENPERCDGFLYHLIGVVSEFGK"
FT   CDS             complement(114531..114986)
FT                   /transl_table=11
FT                   /gene="merR"
FT                   /gene_synonym="HCM1.151c"
FT                   /product="putative mercuric resistance operon regulatory
FT                   protein"
FT                   /note="HCM1.151c, merR, probable mercuric resistance operon
FT                   regulatory protein, len: 151 aa; highly similar to many
FT                   e.g. SW:MERR_PSEAE (EMBL:Z00027), merR, Pseudomonas
FT                   aeruginosa mercuric resistance operon regulatory protein
FT                   from plasmid pVS1 (144 aa), fasta scores; E(): 0, 92.3%
FT                   identity in 142 aa overlap. Contains Pfam match to entry
FT                   PF00376 merR, Bacterial regulatory proteins, merR family
FT                   and PS00552 Bacterial regulatory proteins, merR family
FT                   signature. Contains a probable helix-turn-helix motif at aa
FT                   8-29 (Score 1571, +4.54 SD). Similar to HCM1.245, merR,
FT                   probable mercuric resistance operon regulatory protein (144
FT                   aa), fasta scores; E(): 0, 89.4% identity in 142 aa
FT                   overlap"
FT                   /db_xref="GOA:Q935L5"
FT                   /db_xref="HSSP:1Q0A"
FT                   /db_xref="InterPro:IPR000551"
FT                   /db_xref="InterPro:IPR009061"
FT                   /db_xref="InterPro:IPR011794"
FT                   /db_xref="InterPro:IPR015358"
FT                   /db_xref="UniProtKB/TrEMBL:Q935L5"
FT                   /protein_id="CAD09746.1"
FT                   /translation="MQINFENLTIGVFAKAAGVNVETIRFYQRKGLLPEPDKPYGSIRR
FT                   YGEADVTRVRFVKSAQRLGFSLDEIAELLRLEDGTHCEEASGLAEHKLKDVREKMADLA
FT                   RMEAVLSELVCACHARKGNVFCPLIASLQDGTKLAASARGSHGVTTP"
FT   misc_feature    complement(114849..114956)
FT                   /note="Pfam match to entry PF00376 merR, Bacterial
FT                   regulatory proteins, merR family, score 66.90, E-value
FT                   4.2e-16"
FT   misc_feature    complement(114888..114956)
FT                   /note="PS00552 Bacterial regulatory proteins, merR family
FT                   signature"
FT   misc_feature    complement(114900..114956)
FT                   /note="Pfam match to entry PF00376 merR, Bacterial
FT                   regulatory proteins, merR family, score 29.10, E-value
FT                   7.8e-05"
FT   RBS             complement(114996..114999)
FT                   /note="possible RBS"
FT   RBS             115046..115050
FT                   /note="possible RBS"
FT   CDS             115058..115423
FT                   /transl_table=11
FT                   /gene="merT"
FT                   /gene_synonym="HCM1.152"
FT                   /product="putative mercuric transport protein"
FT                   /note="HCM1.152, merT, probable mercuric transport protein,
FT                   len: 121 aa; highly similar to many e.g. SW:MERT_SERMA
FT                   (EMBL:M24940), merT, Serratia marcescens mercuric transport
FT                   protein from plasmid pDU1358 (116 aa), fasta scores; E():
FT                   0,96.5% identity in 115 aa overlap. Contains hydrophobic,
FT                   probable membrane-spanning regions. Similar to HCM1.234c,
FT                   merT, probable mercuric transport protein (116 aa), fasta
FT                   scores; E(): 0, 93.0% identity in 115 aa overlap"
FT                   /db_xref="GOA:Q935L4"
FT                   /db_xref="InterPro:IPR003457"
FT                   /db_xref="UniProtKB/TrEMBL:Q935L4"
FT                   /protein_id="CAD09747.1"
FT                   /translation="MSEPQKSEPQNGRGALFAGGLAAILASACCLGPLVLIALGFSGAW
FT                   IGNLTVLEPYRPIFIGAALVALFFAWRRIYRPAQACKPGEVCAIPQVRATYKLIFWIVA
FT                   ALVLVSLGFPYVMPFFY"
FT   RBS             115428..115432
FT                   /note="possible RBS"
FT   CDS             115439..115714
FT                   /transl_table=11
FT                   /gene="merP"
FT                   /gene_synonym="HCM1.153"
FT                   /product="putative mercuric transport protein periplasmic
FT                   binding protein"
FT                   /note="HCM1.153, merP, probable mercuric transport protein
FT                   periplasmic binding protein, len: 91 aa; highly similar to
FT                   many e.g. SW:MERP_PSEAE (EMBL:Z00027), merP, Pseudomonas
FT                   aeruginosa mercuric transport protein periplasmic component
FT                   precursor from plasmid pVS1 (91 aa), fasta scores; E():
FT                   2.5e-27, 84.4% identity in 90 aa overlap. Contains Pfam
FT                   match to entry PF00403 HMA, Heavy-metal-associated domain
FT                   and PS01047 Heavy-metal-associated domain. Contains a
FT                   probable N-terminal signal sequence. Similar to HCM1.233c,
FT                   merP, probable mercuric transport protein periplasmic
FT                   binding protein (91 aa), fasta scores; E(): 6.4e-31, 82.4%
FT                   identity in 91 aa overlap"
FT                   /db_xref="GOA:P0A216"
FT                   /db_xref="InterPro:IPR001757"
FT                   /db_xref="InterPro:IPR001802"
FT                   /db_xref="InterPro:IPR006121"
FT                   /db_xref="InterPro:IPR011795"
FT                   /db_xref="InterPro:IPR017969"
FT                   /db_xref="UniProtKB/Swiss-Prot:P0A216"
FT                   /protein_id="CAD09748.1"
FT                   /translation="MKKLFAALALAAVVAPVWAATQTVTLSVPGMTCASCPITVKHALS
FT                   KVEGVSKTDVSFDKRQAVVTFDDAKTNVQKLTKATEDAGYPSSLKR"
FT   misc_feature    115508..115705
FT                   /note="Pfam match to entry PF00403 HMA,
FT                   Heavy-metal-associated domain, score 101.20, E-value
FT                   1.8e-27"
FT   misc_feature    115520..115609
FT                   /note="PS01047 Heavy-metal-associated domain"
FT   RBS             115732..115735
FT                   /note="possible RBS"
FT   CDS             115742..116167
FT                   /transl_table=11
FT                   /gene="merC"
FT                   /gene_synonym="HCM1.157"
FT                   /product="putative mercury transport protein"
FT                   /note="HCM1.157, merC, probable mercury transport protein,
FT                   len: 141 aa; highly similar to many e.g. TR:O66048
FT                   (EMBL:U90263), merC, Pseudomonas stutzeri MerC protein from
FT                   plasmid pPB (141 aa), fasta scores; E(): 0, 80.1% identity
FT                   in 141 aa overlap. Contains hydrophobic, probable
FT                   membrane-spanning regions. Similar to HCM1.232c, merC,
FT                   probable mercury transport protein (140 aa), fasta scores;
FT                   E(): 0, 73.0% identity in 141 aa overlap"
FT                   /db_xref="InterPro:IPR004891"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQV2"
FT                   /protein_id="CAD09749.1"
FT                   /translation="MGLITRIAGKTGALGSVVSAMGCAACFPAIASFGAAIGLGFLSQY
FT                   EGLFIGILLPMFAGIALLANAIAWLNHRQWRRTALGTIGPILVLAAVFLMRAYGWQSGG
FT                   LLYVGLALMVGVSVWDFISPAHRRCGPDSCELPEQRG"
FT   RBS             116194..116198
FT                   /note="possible RBS"
FT   CDS             116206..117891
FT                   /transl_table=11
FT                   /gene="merA"
FT                   /gene_synonym="HCM1.158"
FT                   /product="putative mercuric reductase"
FT                   /EC_number="1.16.1.1"
FT                   /note="HCM1.158, merA, probable mercuric reductase, len:
FT                   561 aa; highly similar to many e.g. SW:MERA_PSEAE
FT                   (EMBL:Z00027), merA, Pseudomonas aeruginosa mercuric
FT                   reductase from plasmid pVS1 (EC 1.16.1.1) (561 aa), fasta
FT                   scores; E(): 0, 93.0% identity in 561 aa overlap. Contains
FT                   Pfam matches to entry PF00403 HMA, Heavy-metal-associated
FT                   domain and to entry PF00070 pyr_redox, Pyridine
FT                   nucleotide-disulphide oxidoreductase class-I. Contains
FT                   PS01047 Heavy-metal-associated domain and PS00076 Pyridine
FT                   nucleotide-disulphide oxidoreductases class-I active site.
FT                   Similar to HCM1.231c, merA, probable mercuric reductase
FT                   (564 aa), fasta scores; E(): 0, 85.0% identity in 565 aa
FT                   overlap"
FT                   /db_xref="GOA:Q935L3"
FT                   /db_xref="HSSP:1AW0"
FT                   /db_xref="InterPro:IPR000815"
FT                   /db_xref="InterPro:IPR001327"
FT                   /db_xref="InterPro:IPR004099"
FT                   /db_xref="InterPro:IPR006121"
FT                   /db_xref="InterPro:IPR011796"
FT                   /db_xref="InterPro:IPR012999"
FT                   /db_xref="InterPro:IPR013027"
FT                   /db_xref="InterPro:IPR016156"
FT                   /db_xref="InterPro:IPR017969"
FT                   /db_xref="UniProtKB/TrEMBL:Q935L3"
FT                   /protein_id="CAD09750.1"
FT                   /translation="MTTLKITGMTCDSCAAHVKEALEKVPGVQSALVSYPKGTAQLAIE
FT                   AGTSSDALTTAVAGLGYEATLADAPPTDNRAGLLDKMRGWIGAADKPSGNERPLQVVVI
FT                   GSGGAAMAAALKAVEQGAQVTLIERGTIGGTCVNVGCVPSKIMIRAAHIAHLRRESPFD
FT                   GGMPPTPPTILRERLLAQQQARVEELRHAKYEGILDGNSAITVLHGEARFKDDQSLIVS
FT                   LNEGGERVVMFDRCLVATGASPAVPPIPGLKESPYWTSTEALASDTIPERLAVIGSSVV
FT                   ALELAQAFARLGSKVTALARNTLFFREDPAIGEAVTAAFRAEGIEVLEHTQASQVAHMD
FT                   GEFVLTTTHGELRADKLLVATGRTPNTRSLALEAAGVAVNAQGAIVIDKGMRTSSPNIY
FT                   AAGDCTDQPQFVYVAAAAGTRAAINMTGGDAALDLTAMPAVVFTDPQVATVGYSEAEAH
FT                   HDGIETDSRLLTLDNVPRALANFDTRGFIKLVIEEGSGRLIGVQAVAPEAGELIQTAVL
FT                   AIRNRMTVQELADQLFPYLTMVEGLKLAAQTFSKDVKQLSCCAG"
FT   misc_feature    116209..116403
FT                   /note="Pfam match to entry PF00403 HMA,
FT                   Heavy-metal-associated domain, score 90.10, E-value
FT                   2.8e-24"
FT   misc_feature    116221..116310
FT                   /note="PS01047 Heavy-metal-associated domain"
FT   misc_feature    116506..117870
FT                   /note="Pfam match to entry PF00070 pyr_redox, Pyridine
FT                   nucleotide-disulphide oxidoreductase class-I, score 757.30,
FT                   E-value 6.3e-224"
FT   misc_feature    116602..116634
FT                   /note="PS00076 Pyridine nucleotide-disulphide
FT                   oxidoreductases class-I active site"
FT   RBS             117896..117903
FT                   /note="possible RBS"
FT   CDS             117909..118274
FT                   /transl_table=11
FT                   /gene="merD"
FT                   /gene_synonym="HCM1.159"
FT                   /product="putative mercuric resistance operon coregulator"
FT                   /note="HCM1.159, merD, probable mercuric resistance operon
FT                   coregulator, len: 121 aa; highly similar to many e.g.
FT                   SW:MERD_PSEA (EMBL:Z00027), merD, Pseudomonas aeruginosa
FT                   mercuric resistance protein from plasmid pVS1 (121 aa),
FT                   fasta scores; E(): 0, 88.4% identity in 121 aa overlap.
FT                   Similar to HCM1.230c, merD, probable mercuric resistance
FT                   operon coregulator (120 aa), fasta scores; E(): 0, 82.6%
FT                   identity in 121 aa overlap"
FT                   /db_xref="GOA:P0A2Q6"
FT                   /db_xref="InterPro:IPR000551"
FT                   /db_xref="InterPro:IPR009061"
FT                   /db_xref="InterPro:IPR011797"
FT                   /db_xref="UniProtKB/Swiss-Prot:P0A2Q6"
FT                   /protein_id="CAD09751.1"
FT                   /translation="MSAYTVSRLALDAGVSVHIVRDYLLRGLLRPVAYTTGGYGLFDDT
FT                   ALQRLRFVRAAFEAGIGLDALARLCRALDAADGDGASAQLAVLRQLVERRREALASLEM
FT                   QLAAMPTEPAQHAESLP"
FT   RBS             118259..118262
FT                   /note="possible RBS"
FT   CDS             118271..118507
FT                   /transl_table=11
FT                   /gene="HCM1.160"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.160, hypothetical protein, len: 78 aa; highly
FT                   similar to ORFs from transposable elements containing
FT                   mer-operons e.g. TR:Q52111 (EMBL:L04303), urf1,
FT                   Acinetobacter calcoaceticus unassigned open reading frame
FT                   from plasmid pKLH2 (78 aa), fasta scores; E(): 6.4e-32,
FT                   98.7% identity in 78 aa overlap"
FT                   /db_xref="InterPro:IPR007746"
FT                   /db_xref="UniProtKB/TrEMBL:Q935L2"
FT                   /protein_id="CAD09752.1"
FT                   /translation="MNSPEHLPSETHKPITGYLWGALAVLTCPCYLPILAIVLAGTTAG
FT                   AFIGEHWGIAALTLTGLFVLSVTRLLRAFKGRS"
FT   RBS             118561..118565
FT                   /note="possible RBS"
FT   CDS             118573..118785
FT                   /transl_table=11
FT                   /gene="HCM1.161"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.161, hypothetical protein, len: 70 aa; similar
FT                   to part of SW:TNPM_ECOLI (EMBL:M10791), tnpM, Escherichia
FT                   coli transposon Tn21 modulator protein (116 aa), fasta
FT                   scores; E(): 8.8e-19, 71.0% identity in 69 aa overlap and
FT                   to hypothetical proteins from many transposable elements"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQV1"
FT                   /protein_id="CAD09753.1"
FT                   /translation="MNANAPNTASCTTCCVCCKEIPLDAAFTPEGAEYVEHFCGLDCYE
FT                   RFQARAKAATESDIAPVPGGSQPSD"
FT   repeat_region   118817..118939
FT                   /note="123 bp inverted repeat flanking IS6100"
FT   repeat_region   complement(118817..119971)
FT                   /note="IS6100"
FT   CDS             complement(119023..119787)
FT                   /transl_table=11
FT                   /gene="HCM1.162c"
FT                   /product="putative transposase"
FT                   /note="HCM1.162c, probable transposase, len: 254 aa;
FT                   identical to TR:Q49185 (EMBL:X53635), tnp, Mycobacterium
FT                   fortuitum Tn610 transposase (254 aa), fasta scores; E(): 0,
FT                   100.0% identity in 254 aa overlap. Highly similar to many
FT                   other transposases. Contains Pfam match to entry PF01438
FT                   Transposase_3, Transposase"
FT                   /db_xref="GOA:Q7AQV0"
FT                   /db_xref="InterPro:IPR001584"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQV0"
FT                   /protein_id="CAD09754.1"
FT                   /translation="MTDFKWRHFQGDVILWAVRWYCRYPISYRDLEEMLAERGISVDHT
FT                   TIYRWVQCYAPEMEKRLRWFWRRGFDPSWRLDETYVKVRGKWTYLYRAVDKRGDTIDFY
FT                   LSPTRSAKAAKRFLGKALRGLKHWEKPATLNTDKAPSYGAAITELKREGKLDRETAHRQ
FT                   VKYLNNVIEADHGKLKILIKPVRGFKSIPTAYATIKGFEVMRALRKGQARPWCLQPGIR
FT                   GEVRLVERAFGIGPSALTEAMGMLNHHFAAAA"
FT   misc_feature    complement(119188..119787)
FT                   /note="Pfam match to entry PF01438 Transposase_3,
FT                   Transposase, score 502.60, E-value 2.9e-147"
FT   repeat_region   complement(119849..119971)
FT                   /note="123 bp inverted repeat flanking IS6100"
FT   CDS             119966..120250
FT                   /transl_table=11
FT                   /gene="HCM1.163"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.163, hypothetical protein, len: 94 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935L1"
FT                   /protein_id="CAD09755.1"
FT                   /translation="MTIVPPAPGLIEQLRHMVQMLVDPFGQFFDGLLLELVTFPELDVQ
FT                   GPGHLVEVPADSSKLPARFPYGVHFFISEDRHPVQRPQSFLYLNSPANM"
FT   CDS             complement(120417..120899)
FT                   /transl_table=11
FT                   /gene="dhfR"
FT                   /gene_synonym="HCM1.165c"
FT                   /product="putative dihydrofolate reductase"
FT                   /EC_number="1.5.1.3"
FT                   /note="HCM1.165c, dhfR, probable dihydrofolate reductase,
FT                   len: 160 aa; highly similar to many e.g. SW:DYR5_ECOLI
FT                   (EMBL:X12868), dhfRV, Escherichia coli dihydrofolate
FT                   reductase type V (EC 1.5.1.3) (157 aa), fasta scores; E():
FT                   0, 89.8% identity in 157 aa overlap. Contains Pfam match to
FT                   entry PF00186 DiHfolate_red, Dihydrofolate reductase and
FT                   PS00075 Dihydrofolate reductase signature"
FT                   /db_xref="GOA:Q935L0"
FT                   /db_xref="HSSP:1DHI"
FT                   /db_xref="InterPro:IPR001796"
FT                   /db_xref="InterPro:IPR012259"
FT                   /db_xref="InterPro:IPR017925"
FT                   /db_xref="UniProtKB/TrEMBL:Q935L0"
FT                   /protein_id="CAD09756.1"
FT                   /translation="MRTLKVSLMAAKAKNGVIGCGPDIPWSAKGEQLLFKALTYNQWLL
FT                   VGRKTFESMGALPNRKYAVVTRSGWTSNDDNVVVFQSIEEAMDRLAEFTGHVIVSGGGE
FT                   IYRETLPMASTLHLSTIDIEPEGDVFFPSIPNTFEVVFEQHFTSNINYCYQIWKKG"
FT   misc_feature    complement(120504..120881)
FT                   /note="Pfam match to entry PF00186 DiHfolate_red,
FT                   Dihydrofolate reductase, score 136.60, E-value 9.8e-39"
FT   misc_feature    complement(120783..120851)
FT                   /note="PS00075 Dihydrofolate reductase signature"
FT   CDS             complement(<120907..120963)
FT                   /transl_table=11
FT                   /gene="HCM1.166c"
FT                   /product="putative aminoglycoside acetyltransferase"
FT                   /note="HCM1.166c, possible aminoglycoside
FT                   acetyltransferase, partial CDS, len: 19 aa; highly similar
FT                   to the N-termini of aminoglycoside 3' N-acetyltransferases
FT                   e.g. SW:AAC1_PSEAE (EMBL:U12338), aacC1, Pseudomonas
FT                   aeruginosa gentamicin 3'-acetyltransferase from plasmid
FT                   R1033 (177 aa), fasta scores; E(): 1.4e-07, 94.7% identity
FT                   in 19 aa overlap"
FT                   /db_xref="GOA:Q935K9"
FT                   /db_xref="UniProtKB/TrEMBL:Q935K9"
FT                   /protein_id="CAD09757.1"
FT                   /translation="MLWSSNDVTQQGSRPKTKL"
FT   CDS             121046..122059
FT                   /transl_table=11
FT                   /gene="int"
FT                   /gene_synonym="HCM1.167"
FT                   /product="putative integrase"
FT                   /note="HCM1.167, int, probable integrase, len: 337 aa;
FT                   identical to SW:INT2_ECOLI (EMBL:U12338), int, Escherichia
FT                   coli integrase/recombinase (E2 protein) from plasmid pLM020
FT                   (337 aa), fasta scores; E(): 0, 100.0% identity in 337 aa
FT                   overlap. Highly similar to many others. Contains Pfam match
FT                   to entry PF00589 Phage_integrase, 'Phage' integrase family"
FT                   /db_xref="GOA:P62592"
FT                   /db_xref="InterPro:IPR002104"
FT                   /db_xref="InterPro:IPR004107"
FT                   /db_xref="InterPro:IPR010998"
FT                   /db_xref="InterPro:IPR011010"
FT                   /db_xref="InterPro:IPR011946"
FT                   /db_xref="InterPro:IPR013762"
FT                   /db_xref="UniProtKB/Swiss-Prot:P62592"
FT                   /protein_id="CAD09758.1"
FT                   /translation="MKTATAPLPPLRSVKVLDQLRERIRYLHYSLRTEQAYVHWVRAFI
FT                   RFHGVRHPATLGSSEVEAFLSWLANERKVSVSTHRQALAALLFFYGKVLCTDLPWLQEI
FT                   GRPRPSRRLPVVLTPDEVVRILGFLEGEHRLFAQLLYGTGMRISEGLQLRVKDLDFDHG
FT                   TIIVREGKGSKDRALMLPESLAPSLREQLSRARAWWLKDQAEGRSGVALPDALERKYPR
FT                   AGHSWPWFWVFAQHTHSTDPRSGVVRRHHMYDQTFQRAFKRAVEQAGITKPATPHTLRH
FT                   SFATALLRSGYDIRTVQDLLGHSDVSTTMIYTHVLKVGGAGVRSPLDALPPLTSER"
FT   misc_feature    121313..122011
FT                   /note="Pfam match to entry PF00589 Phage_integrase, 'Phage'
FT                   integrase family, score 201.70, E-value 1.1e-56"
FT   RBS             122356..122359
FT                   /note="possible RBS"
FT   CDS             122365..122922
FT                   /transl_table=11
FT                   /gene="tnpR"
FT                   /gene_synonym="HCM1.168"
FT                   /product="resolvase"
FT                   /note="HCM1.168, tnpR, resolvase, len: 185 aa; highly
FT                   similar to many e.g. SW:TNP2_ECOLI (EMBL:X01298), tnpR,
FT                   Escherichia coli transposon Tn21 resolvase (186 aa), fasta
FT                   scores; E(): 0, 82.7% identity in 185 aa overlap. Contains
FT                   Pfam match to entry PF00239 recombinase, Site-specific
FT                   recombinases, PS00397 Site-specific recombinases active
FT                   site and PS00398 Site-specific recombinases signature 2.
FT                   Contains a probable helix-turn-helix motif at aa 162-183
FT                   (Score 1545, +4.45 SD)"
FT                   /db_xref="GOA:Q7AQU9"
FT                   /db_xref="InterPro:IPR006118"
FT                   /db_xref="InterPro:IPR006119"
FT                   /db_xref="InterPro:IPR006120"
FT                   /db_xref="InterPro:IPR009057"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQU9"
FT                   /protein_id="CAD09759.1"
FT                   /translation="MQGQRIGYVRVSSFDQNPERQLEGVQVARVFTDKASGKDTQRPEL
FT                   ERLLAFVREGDTVVVHSMDRLARNLDDLRRIVQGLTQRGVRMEFVKEGLKFTGEDSPMA
FT                   NLMLSVMGAFAEFERALIRERQREGIVLAKQRGAYRGRKKSLNSEQIAELKRRVAAGDQ
FT                   KTLVARDFGISRETLYQYLRED"
FT   misc_feature    122380..122904
FT                   /note="Pfam match to entry PF00239 recombinase,
FT                   Site-specific recombinases, score 285.50, E-value 6.8e-82"
FT   misc_feature    122386..122412
FT                   /note="PS00397 Site-specific recombinases active site"
FT   misc_feature    122527..122565
FT                   /note="PS00398 Site-specific recombinases signature 2"
FT   misc_feature    122925..125828
FT                   /note="Pfam match to entry PF01526 Transposase_7,
FT                   Transposase, score 2053.90, E-value 0"
FT   CDS             122925..125897
FT                   /transl_table=11
FT                   /gene="tnpA"
FT                   /gene_synonym="HCM1.169"
FT                   /product="transposase"
FT                   /note="HCM1.169, tnpA, transposase, len: 990 aa; highly
FT                   similar to many e.g. SW:TRA7_ECOLI (EMBL:X14236), tnpA,
FT                   Escherichia coli transposase for transposon Tn3926 (990
FT                   aa), fasta scores; E(): 0, 99.9% identity in 990 aa
FT                   overlap. Contains Pfam match to entry PF01526
FT                   Transposase_7, Transposase"
FT                   /db_xref="GOA:Q7AQU8"
FT                   /db_xref="InterPro:IPR002513"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQU8"
FT                   /protein_id="CAD09760.1"
FT                   /translation="MPRRSILSATERESLLALPDAKDELIRHYTFNETDLSVIRQRRGA
FT                   ANRLGFAVQLCYLRFPGTFLGVDEPPFPPLLRMVAAQLKMPVESWSEYGQREQTRREHL
FT                   VELQTVFGFKPFTMSHYRQAVHTLTELALQTDKGIVLASALVENLRRQSIILPAMNAIE
FT                   RASAEAITRANRRIYAALTDSLLSPHRQRLDELLKRKDGSKVTWLAWLRQSPAKPNSRH
FT                   MLEHIERLKSWQALDLPAGIERQVHQNRLLKIAREGGQMTPADLAKFEVQRRYATLVAL
FT                   AIEGMATVTDEIIDLHDRIIGKLFNAAKNKHQQQFQASGKAINDKVRMYGRIGQALIEA
FT                   KQSGSDPFAAIEAVMPWDTFAASVTEAQTLARPADFDFLHHIGESYATLRRYAPQFLGV
FT                   LKLRAAPAAKGVLDAIDMLRGMNSDSARKVPADAPTAFIKPRWAKLVLTDDGIDRRYYE
FT                   LCALSELKNALRSGDVWVQGSRQFKDFDEYLVPVEKFATLKLASELPLAVATDCDQYLH
FT                   DRLELLEAQLATVNRMAAANDLPDAIITTASGLKITPLDAAVPDAAQAMIDQTAMLLPH
FT                   LKITELLMEVDEWTGFTRHFTHLKTSDTAKDKTLLLTTILADAINLGLTKMAESCPGTT
FT                   YAKLSWLQAWHIRDETYSTALAELVNAQFRQPFAGNWGDGTTSSSDGQNFRTGSKAEST
FT                   GHINPKYGSSPGRTFYTHISDQYAPFSAKVVNVGIRDSTYVLDGLLYHESDLRIEEHYT
FT                   DTAGFTDHVFGLMHLLGFRFAPRIRDLGETKLFIPKGDAAYDALKPMISSDRLNIKQIR
FT                   AHWDEILRLATSIKQGTVTASLMLRKLGSYPRQNGLAVALRELGRIERTLFILDWLQSV
FT                   ELRRRVHAGLNKGEARNALARAVFFYRLGEIRDRSFEQQRYRASGLNLVTAAIVLWNTV
FT                   YLERATSALRGNGTALDDTLLQYLSPLGWEHINLTGDYLWRSSAKVGAGKFRPLRPLPP
FT                   A"
FT   repeat_region   125916..125927
FT                   /note="12 bp inverted repeat flanking IS"
FT   misc_feature    125916..127167
FT                   /note="IS"
FT   RBS             125965..125968
FT                   /note="possible RBS"
FT   CDS             125976..126915
FT                   /pseudo
FT                   /transl_table=11
FT                   /gene="HCM1.170"
FT                   /product="putative transposase (pseudogene)"
FT                   /note="HCM1.170, probable transposase (pseudogene), len: ;
FT                   highly similar to many e.g. SW:TRA8_YEREN (EMBL:Z48244),
FT                   Yersinia enterocolitica transposase for insertion sequence
FT                   element IS1328 (334 aa), fasta scores; E(): 7e-31, 69.2%
FT                   identity in 104 aa overlap and E(): 0, 63.5% identity in
FT                   211 aa overlap"
FT   repeat_region   complement(127156..127167)
FT                   /note="12 bp inverted repeat flanking IS"
FT   CDS             127673..128164
FT                   /transl_table=11
FT                   /gene="HCM1.174"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.174, possible periplasmic protein, len: 163 aa;
FT                   unknown function, contains a probable N-terminal signal
FT                   sequence"
FT                   /db_xref="UniProtKB/TrEMBL:Q935K8"
FT                   /protein_id="CAD09762.1"
FT                   /translation="MKLTKMMATLFLLIPLTSFSQELGQRISQDDSAELANKAGTALTE
FT                   MLLLKVQQLPQVKKNSGMDLAAANDAVASLLSKEFFIFKPVDEISIKTSAQKLKELNDD
FT                   ADALAKGYTIIQPDDVGSSYISYKVTSSSRTCFIRLSKDLSSSLNTRIVTVNSMECSNP
FT                   "
FT   RBS             128593..128596
FT                   /note="possible RBS"
FT   CDS             128603..129409
FT                   /transl_table=11
FT                   /gene="HCM1.175"
FT                   /product="putative DNA-binding protein"
FT                   /note="HCM1.175, possible DNA-binding protein, len: 268 aa;
FT                   unknown function, contains PS00017 ATP/GTP-binding site
FT                   motif A (P-loop). Contains a probable helix-turn-helix
FT                   motif at aa 210-231 (Score 1104, +2.95 SD)"
FT                   /db_xref="GOA:Q9L5H4"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5H4"
FT                   /protein_id="CAD09763.1"
FT                   /translation="MREPRPRHTLQVVCVPSLNIQDLGLTSFHSWLLSKGYDTTNARNN
FT                   RTCWAREGGWHLKRCRHLATGEDHFWFIAFNGTGGDIFPVKTQQDYRAAYRKLEAYGYA
FT                   PAVIEQLNTGVAYNLAYSRTPLKRPESATSELKRKPDVNIQGEPCERFVTERSSAAQNK
FT                   FKTLLIENFAGRCAVTGWVNGGVLVAAHIEHGTRYNPSNGILLTPTMHALFDADLMGID
FT                   PSTLTVHFKPGIEAGELFEGKTLNPLVYDLDTDRLAARWADFIGAE"
FT   misc_feature    129311..129334
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   CDS             129515..129934
FT                   /transl_table=11
FT                   /gene="HCM1.176"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.176, hypothetical protein, len: 139 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935K7"
FT                   /protein_id="CAD09764.1"
FT                   /translation="MIQQMQNCLSGYLKATIVILSAGLTGCDLANGTAESGVYQKYTNG
FT                   PFKEPTIVMSPGWRMDDHGREALIFGSSHCPDVNGNNTSEGGCVLIEEHSATVAVTVVD
FT                   ATNQSRRQETWTIERKKDRVIVKRPDNSFVMPWGK"
FT   CDS             129981..130691
FT                   /transl_table=11
FT                   /gene="HCM1.177"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.177, hypothetical protein, len: 236 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935K6"
FT                   /protein_id="CAD09765.1"
FT                   /translation="MCVERPDGAFDIYTGRFIQFHQIDNSRRKIVEISDPDLVGMTYSI
FT                   PMVFNGGKFSGQGVTCLSLPAVTLIKVTFPSRTYQEGQEQITMSSPDLALFSEDVRKNC
FT                   AGTCVLTGVRGRQRTEAAHIKPRHAGGEPDVTNGILLRSDINTLFDNWHFSIDPDSMKA
FT                   RFSPDVLSVDKDLLQLEGKQIDFSRLQMPINIEHLRHHWNKFFNRHVNPVIKNALNKKI
FT                   NNYEKRPVSSNIHY"
FT   RBS             130750..130754
FT                   /note="possible RBS"
FT   CDS             130761..130943
FT                   /transl_table=11
FT                   /gene="HCM1.178"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.178, hypothetical protein, len: 60 aa;
FT                   hydrophobic protein"
FT                   /db_xref="UniProtKB/TrEMBL:Q935K5"
FT                   /protein_id="CAD09766.1"
FT                   /translation="MNLKSIVPKAAGLAAWIVGIIYSGFALSVLWGGFCASRCGADHNS
FT                   MGYWNLLLGRHNKRQ"
FT   repeat_region   130852..130859
FT                   /note="(g)8"
FT   CDS             complement(131457..131861)
FT                   /transl_table=11
FT                   /gene="HCM1.178ac"
FT                   /product="putative DNA-binding protein"
FT                   /note="HCM1.178ac, probable DNA-binding protein, len: 134
FT                   aa; similar to many histone-like proteins e.g.
FT                   SW:STPA_ECOLI (EMBL:X69210), stpA, Escherichia coli
FT                   DNA-binding protein (134 aa), fasta scores; E(): 4.7e-26,
FT                   61.9% identity in 134 aa overlap. Contains Pfam match to
FT                   entry PF00816 Histone_HNS, H-NS histone family"
FT                   /db_xref="GOA:Q935K4"
FT                   /db_xref="HSSP:1NI8"
FT                   /db_xref="InterPro:IPR001801"
FT                   /db_xref="UniProtKB/TrEMBL:Q935K4"
FT                   /protein_id="CAD09767.1"
FT                   /translation="MSEALKSLNNIRTLRAQGRELPLEILEELLEKLSVVVEERRQEES
FT                   SKEAELKARLEKIESLRQLMLEDGIDPEELLSSFSAKSGAPKKVREPRPAKYKYTDVNG
FT                   ETKTWTGQGRTPKALAEQLEAGKTLDDFLI"
FT   misc_feature    complement(131475..131861)
FT                   /note="Pfam match to entry PF00816 Histone_HNS, H-NS
FT                   histone family, score 222.70, E-value 5.3e-63"
FT   RBS             complement(131866..131869)
FT                   /note="possible RBS"
FT   CDS             complement(132123..132395)
FT                   /transl_table=11
FT                   /gene="HCM1.179c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.179c, hypothetical protein, len: 90 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935K3"
FT                   /protein_id="CAD09768.1"
FT                   /translation="MNRTDDSITQLSSLYERLGAVAHELEYCKILLPEHSEQLDLDAAA
FT                   TYAMMLRIEQWAANVKNAYNTNTYDPFHINEKDKQLRNQEEENQY"
FT   CDS             complement(132392..133060)
FT                   /transl_table=11
FT                   /gene="HCM1.180c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.180c, hypothetical protein, len: 222 aa;
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5I1"
FT                   /protein_id="CAD09769.1"
FT                   /translation="MAASRITHLITSCTKGKHSQCGSMPELSIRSGQTPEEAMSSWAAT
FT                   IKRSQSASPVPALSLYAGNHWSTAKEILRTTENLELWVISAGLGFLNSRDLVDAYEATF
FT                   HDLPFSHRQWWRELTNTFGKERTAKSIETLMAARPFDDYVIAASPVYIEATEDDILAGA
FT                   SKLNNHIAQLTVVTSGEYSGLLESYLIRSESRMMRQLSSNMVCLNIKLAQYIIGSRRYS
FT                   "
FT   repeat_region   133176..133199
FT                   /note="inverted repeat; 21/24 (87%) matches, 0 gaps"
FT   repeat_region   complement(133454..133477)
FT                   /note="inverted repeat; 21/24 (87%) matches, 0 gaps"
FT   RBS             133555..133559
FT                   /note="possible RBS"
FT   CDS             133567..134022
FT                   /transl_table=11
FT                   /gene="HCM1.181"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.181 hypothetical protein, len: 151 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5I2"
FT                   /protein_id="CAD09770.1"
FT                   /translation="MSMNSQPELKLSTRTEQLASSRDAAMQKFLDGMTLIAEASAICGF
FT                   SLFNSKIMAPNAFGLPASLAASIEEGRQQIDRKTWNNLFEETGIDRFWNHNQRAEFRES
FT                   LRNAPPIASLTVIRSTLRQAVAMRSITLAEGFVDLLCQLDRRYKTNA"
FT   CDS             134029..134379
FT                   /transl_table=11
FT                   /gene="HCM1.182"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.182 hypothetical protein, len: 116 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935K2"
FT                   /protein_id="CAD09771.1"
FT                   /translation="MMPKKLVLRGIFPDSNMMRYNGFSQDNLFYLNDFENVVCICSNAA
FT                   TPPVGSGMNMYDRLAVLRKTDFTGDITDPKGWKFRLFGNGNVHISVECESLHNALNDLI
FT                   SIYFANQIPAKG"
FT   RBS             134372..134376
FT                   /note="possible RBS"
FT   CDS             134382..135602
FT                   /transl_table=11
FT                   /gene="HCM1.183"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.183, hypothetical protein, len: 406 aa; unknown
FT                   function, rich in Ser, Thr, Glu and Gln"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5I4"
FT                   /protein_id="CAD09772.1"
FT                   /translation="MMTDNVNLMNGDEQTASSLSEETSKTPPLSPELLKNSPYSSIAKV
FT                   KYFTEIEQICLDKSISTENLDQFFKAHWLRDKMGGSFARAQEMLAAYKQYVDEVPEEAR
FT                   AIEIPDQIKDAFSDFTAFITWYFRLSYTAIQSDSVKIAKAEITQLRQRNAEILEELSQS
FT                   KEQATVLNNEKVNLINLLEQQRELSSKLEDSLQEAEETLAGTQSELQHAQNEIQLLQQT
FT                   VGTLNQQLSERKQELASQQEYQKQLNDENKAQQVELTALKSQNDHLQRTVSDLKVSVSQ
FT                   LEQDLSSVQTHSSELSSSLAEKDTTLTLVRSELSTAKGENDQLRAEAQRLADESLVAKK
FT                   VQTDQTEELQQLRNQMISMEATLNAEKTIAESLRGTIKQLTEAMTGAVAIKPKSSGASK
FT                   PRNKKTT"
FT   CDS             complement(135657..135860)
FT                   /transl_table=11
FT                   /gene="HCM1.184c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.184c, hypothetical protein, len: 67 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935K1"
FT                   /protein_id="CAD09773.1"
FT                   /translation="MAYILSMSEQVKLKAFLAAVLDDYKLGAISQQQAVGGITSLVDAI
FT                   EISDSGKISLMLSEGRKLLRTG"
FT   CDS             complement(135898..137193)
FT                   /transl_table=11
FT                   /gene="HCM1.185c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.185c, hypothetical protein, len: 431 aa;
FT                   similar to TR:O85897 (EMBL:AF079317) Sphingomonas
FT                   aromaticivorans hypothetical protein from plasmid pNL1 (450
FT                   aa), fasta scores; E(): 3.1e-14, 25.3% identity in 372 aa
FT                   overlap"
FT                   /db_xref="InterPro:IPR009553"
FT                   /db_xref="UniProtKB/TrEMBL:Q935K0"
FT                   /protein_id="CAD09774.1"
FT                   /translation="MGQKFAVFIAYDDEPNTKRYSAEFQTQDEYVKGWQSALKKAHHTS
FT                   GQKSVISCGCRGKGAKRLYVRSLPNSDTFILIKAANTGTEHDPSCVFFDLDARHTGLKG
FT                   YASNVVRINNEGTMSIRLGIGMTEKDPPEKSEVPSLPQIQRPEGGQASMTLSGLLSLLW
FT                   TEAGLNVWYPNMAGKRNDSLVRYRMLEAAKQIRSGRACIGDHLFIGVADSKSKVASEQV
FT                   QLLSSAELSDKRLLLLSVLPRYDAEKHEKPLKFLPMRNFGGMPLTFFNSDGHWDSVKRR
FT                   FPLEYAAWKNGGKVVVFALTSPVSVTSRGISARAHQIVLMLVSDNWIPLDSSYEAIVSR
FT                   KLDAEHRHYVKPMRYDASASDVFPDFYLLDTRSDKPFPMEVFGMSTPAYLARKELKKAY
FT                   YNQEYGAYGWWHWDATEKTEYQELPHFPEARR"
FT   RBS             complement(137197..137203)
FT                   /note="possible RBS"
FT   CDS             complement(137218..137388)
FT                   /transl_table=11
FT                   /gene="HCM1.186c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.186c, hypothetical protein, len: 56 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935J9"
FT                   /protein_id="CAD09775.1"
FT                   /translation="MMTYFDSAEDLTISKQRALQELAKHGVVASDIDVFFSELGEREEY
FT                   NAQEVLIWLGY"
FT   RBS             complement(137390..137396)
FT                   /note="possible RBS"
FT   CDS             complement(137517..138944)
FT                   /transl_table=11
FT                   /gene="HCM1.187c"
FT                   /product="putative DNA modification methylase"
FT                   /note="HCM1.187c, probable DNA modification methylase, len:
FT                   475 aa; similar to many e.g. SW:MTE2_ECOLI (EMBL:X05050)
FT                   Escherichia coli modification methylase EcoRII (EC
FT                   2.1.1.73) from plasmid N3 (477 aa), fasta scores; E(): 0,
FT                   66.7% identity in 442 aa overlap. Contains Pfam match to
FT                   entry PF00145 DNA_methylase, C-5 cytosine-specific DNA
FT                   methylase, PS00094 C-5 cytosine-specific DNA methylases
FT                   active site and two PS00095 C-5 cytosine-specific DNA
FT                   methylases C-terminal signature"
FT                   /db_xref="GOA:Q935J8"
FT                   /db_xref="HSSP:6MHT"
FT                   /db_xref="InterPro:IPR001525"
FT                   /db_xref="InterPro:IPR018117"
FT                   /db_xref="UniProtKB/TrEMBL:Q935J8"
FT                   /protein_id="CAD09776.1"
FT                   /translation="MYNDRTEPAITALLNDETPSSIHKLLVQVASIYDVKDLAAQLNAA
FT                   TGSDWSRASLIRQIKGSVNECRITQEEYHYLRSLLPSRPADYDQKFFRFIDLFAGIGGL
FT                   RSGFDAIGGKCVFTSEWNQFSRRTYSANWYCDETEHYFNSDIRDITLSNLPDVSDDQAY
FT                   ASIDASIPDHDVLLAGFPCQPFSIAGVSKKNSLGRKHGFECDTQGTLFFDVARIIRAKQ
FT                   PAIFVLENVKNLKSHDKGNTFRIIMKALDELGYDVADCDAHGSKDPKIIDGKNFRPQHR
FT                   ERIVLVGFRRDLKLHDGFSLSGVSALYPSRRPTLGELLDAEVDSRYILSPKLWEYLYNY
FT                   AKKHQAKGNGFGFGLVNPLDKSVVCRTLSARYYRDGSEILLDRGWDHSIGEKDFNDPVN
FT                   MARRPRRLTPRECARLMGFEQPGKVTFRIPVSDTQAYRQFGNSVIVDVFAAVASLLRSR
FT                   IEIAVAARLKGEFEAAS"
FT   misc_feature    complement(137574..138671)
FT                   /note="Pfam match to entry PF00145 DNA_methylase, C-5
FT                   cytosine-specific DNA methylase, score 273.90, E-value
FT                   2e-78"
FT   misc_feature    complement(137580..137636)
FT                   /note="PS00095 C-5 cytosine-specific DNA methylases
FT                   C-terminal signature"
FT   misc_feature    complement(137856..137912)
FT                   /note="PS00095 C-5 cytosine-specific DNA methylases
FT                   C-terminal signature"
FT   misc_feature    complement(138387..138425)
FT                   /note="PS00094 C-5 cytosine-specific DNA methylases active
FT                   site"
FT   RBS             complement(138950..138953)
FT                   /note="possible RBS"
FT   RBS             139159..139162
FT                   /note="possible RBS"
FT   CDS             139168..139683
FT                   /transl_table=11
FT                   /gene="HCM1.188"
FT                   /product="putative nuclease"
FT                   /note="HCM1.188, possible nuclease, len: 171 aa; similar to
FT                   SW:NUC_SHIFL (EMBL:U30471), nuc, Shigella flexneri
FT                   micrococcal nuclease precursor (174 aa), fasta scores; E():
FT                   9e-07, 38.8% identity in 152 aa overlap and to many
FT                   bacterial hypothetical proteins e.g. SW:YC96_HAEIN
FT                   (EMBL:U32809), HI1296, Haemophilus influenzae hypothetical
FT                   protein (179 aa), fasta scores; E(): 2.1e-20, 41.1%
FT                   identity in 158 aa overlap. Contains Pfam match to entry
FT                   PF00565 SNase, Staphylococcal nuclease homologues. Contains
FT                   a possible N-terminal signal sequence"
FT                   /db_xref="GOA:Q935J7"
FT                   /db_xref="HSSP:1EYC"
FT                   /db_xref="InterPro:IPR006021"
FT                   /db_xref="InterPro:IPR016071"
FT                   /db_xref="UniProtKB/TrEMBL:Q935J7"
FT                   /protein_id="CAD09777.1"
FT                   /translation="MTLLKKLLLPTLIVLFPAATLAAQSSFEAKVVKIIDGDTITALDG
FT                   QNTSIKIRLYGIDAPESKQAFGQKSKQALSAAIAAQNITVIDHGPDIYGRMLGTIWLDG
FT                   YDINASMVDSGYAWVYRFDGNAIVPNYLKFEASAQKAVKGLWVDPNPVAPWEWRQQNQK
FT                   PQKTKSRG"
FT   misc_feature    139240..139611
FT                   /note="Pfam match to entry PF00565 SNase, Staphylococcal
FT                   nuclease homologues, score 120.60, E-value 2.9e-32"
FT   CDS             139680..140612
FT                   /transl_table=11
FT                   /gene="HCM1.189"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.189, hypothetical protein, len: 310 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935J6"
FT                   /protein_id="CAD09778.1"
FT                   /translation="MTAMTRQHPLLKIALNSDGHLSWPILPGETHRCPTCLRHVTTGPD
FT                   GDLVHSMEEGGNVCIPSASVVISKAIIEMLSAGERLYVNPIKNGNKTLAPSFIFLHTDQ
FT                   QLRPFINSDYQPAGASWRSDKGFRLGLFFMNERASKINKDQFDFIAVIDPLTFQSEFDA
FT                   TWSRGEFDDPLKALRYSIVSENLSSVWVKWPVKNLQPRKETVMADYWYDYYSPHSPAQQ
FT                   AACTATVTGIDGNVSGETIYMLQIALERSTVEYQLVKSLGVILLLDNTGNLVSEAQPHF
FT                   DIIIKACISGVRDFVLQNPRTLGFENKVA"
FT   CDS             140668..141447
FT                   /transl_table=11
FT                   /gene="HCM1.190"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.190, hypothetical protein, len: 259 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935J5"
FT                   /protein_id="CAD09779.1"
FT                   /translation="MVQVLNTTGLNYQLEKTITEAEERIILISPYLKLSNRIKELIEDK
FT                   NRLKVDIRIVYGKSELNSKEYEWLTNLPFVRLSFCKNLHAKLYANENQCIVCSLNLYDF
FT                   SQINNHEIGVLIIKEQEKDAYTSSLNEAQRLIRISTDNIQPLTTDKETTGSKESEKTNK
FT                   ESSDFTSAFHEEPLTNQNGLITDLNTNSKLTSTNLAKNHKTDLLSLYKKLIEAGYLMDV
FT                   EGKYILTDAGIAAGAEAKPNRYKKGENYFLWPDNLAL"
FT   CDS             141444..141731
FT                   /transl_table=11
FT                   /gene="HCM1.191"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.191, hypothetical protein, len: 95 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935J4"
FT                   /protein_id="CAD09780.1"
FT                   /translation="MILHHVLCPCVAMRDIEGSMKNSLFSTDSNTGVTFTISPHGQGCK
FT                   LSVEPEYRRKGTQNYDGWFPRYYTKPQYAKAALTRFLGEPVNWLDCNDHN"
FT   CDS             141795..142094
FT                   /transl_table=11
FT                   /gene="HCM1.192"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.192, possible membrane protein, len: 99 aa;
FT                   unknown function. Contains hydrophobic, possible
FT                   membrane-spanning regions"
FT                   /db_xref="UniProtKB/TrEMBL:Q935J3"
FT                   /protein_id="CAD09781.1"
FT                   /translation="MENLDVVSAVDFYLEKAFYLFGFIMLGMAWLTFRAGSTYQHFKNA
FT                   DKLVSEGRGSVSSGKEPEMIRRLKFQTLIWYIANCVVLALSTIAFGYLFYLLHS"
FT   CDS             complement(142344..142952)
FT                   /transl_table=11
FT                   /gene="HCM1.193c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.193c, hypothetical protein, len: 202 aa;
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935J2"
FT                   /protein_id="CAD09782.1"
FT                   /translation="MKEKTLDSVSLLISKIRRLDWQRLKEFFGPLAFNHPDCIDAIMTD
FT                   GISTDASFTILNALISRTEMMSSGEYAIEHDRSKNLLTYNERLNFLINCDKEGEFKHSE
FT                   IATISFPLNLKKVYQIDSKESPSVQLCDVLIGACIESVYQLMDSKVLNQNSVLSLYQDS
FT                   QLIHFIPDIDFEGQKKFRKGSQSEEYLTFIQNEIYSSKL"
FT   repeat_region   142985..142999
FT                   /note="15 bp inverted repeat flanking IS10"
FT   repeat_region   142985..144299
FT                   /note="IS10"
FT   CDS             143085..144293
FT                   /transl_table=11
FT                   /gene="HCM1.194"
FT                   /product="transposase"
FT                   /note="HCM1.194, transposase, len: 402 aa; identical or
FT                   highly similar to Tn10 transposases e.g. TR:AAD50242
FT                   (EMBL:AF162223) Shigella flexneri IS10-left transposase
FT                   from Tn10 (402 aa), fasta scores; E(): 0, 100.0% identity
FT                   in 402 aa overlap"
FT                   /db_xref="GOA:Q7AQU3"
FT                   /db_xref="InterPro:IPR002559"
FT                   /db_xref="InterPro:IPR012337"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQU3"
FT                   /protein_id="CAD09783.1"
FT                   /translation="MCELDILHDSLYQFCPELHLKRLNSLTLACHALLDCKTLTLTELG
FT                   RNLPTKARTKHNIKRIDRLLGNRHLHKERLAVYRWHASFICSGNTMPIVLVDWSDIREQ
FT                   KRLMVLRASVALHGRSVTLYEKAFPLSEQCSKKAHDQFLADLASILPSNTTPLIVSDAG
FT                   FKVPWYKSVEKLGWYWLSRVRGKVQYADLGAENWKPISNLHDMSSSHSKTLGYKRLTKS
FT                   NPISCQILLYKSRSKGRKNQRSTRTHCHHPSPKIYSASAKEPWILATNLPVEIRTPKQL
FT                   VNIYSKRMQIEETFRDLKSPAYGLGLRHSRTSSSERFDIMLLIALMLQLTCWLAGVHAQ
FT                   KQGWDKHFQANTVRNRNVLSTVRLGMEVLRHSGYTITREDSLVAATLLTQNLFTHGYVL
FT                   GKL"
FT   repeat_region   complement(144285..144299)
FT                   /note="15 bp inverted repeat flanking IS10"
FT   CDS             144632..147967
FT                   /transl_table=11
FT                   /gene="HCM1.195"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.195, hypothetical protein, len: 1111 aa;
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935J1"
FT                   /protein_id="CAD09784.1"
FT                   /translation="MGDLVSKNNIDRLERFHSLLAGQYWSALVDIPAEAIVAGDTLLIN
FT                   SLRYVDNNLHTVILRAHPRHYGEWVSVEIVAENGSKSTKDKRLNEHRFLTADFLALFEY
FT                   QPDHEIIRQSELKGIQDEVADLQMRLTETLQDPSALRELAIKRVEDEEASKKGGATEDR
FT                   MLPAVRNAEDVAVTMALGTVQNALSQGISEAQVSLMAKVAEREGKIAGAVANIITSRTG
FT                   AITRALEKMHPYYAELAAAKLAGTQEGIEQASKIQAGVLTLELFVGKNVTVVDVAEGEP
FT                   ADSSIPLTLCQKKLVVDEEFSAWSDIDEHFDFRSLSAFLKALKDNQGLVEQIFPTERCV
FT                   LVMVTTRRFIDYGDTWANAENNEKNSIVFLMVRNGQNIKQIYSPVESHLGASRLFPSED
FT                   EQQGHFRGFDGTTIKFEDVAYTDRLKAHDLMALHYRRLLIMLFGLDQRLALFGQFYPQH
FT                   EKANFLNLSFQERYFHFLHDEDGTGLLASPDSQTLDEFISEKNSYIQPGSRLLCNWREL
FT                   MTPRTAPGAVKEDSGYSGYSFIADPEDNVSAAVVYRQGDTLAVDVAVKRFSTDKMFNCK
FT                   VNVSAYSPWRRGEAELAYLCLDAVGPEELTRFIQQRKFRSNHLFYIRFFKAAIKFLEQE
FT                   RENELPHRQYLLAAMQDSGMHLPGNIQELIHQCIASWKTGNRGVSLAVGMSTEKGRQAL
FT                   LNQLYRLTQGASEMVSVIQEHVAASGSQLLRAGVNSSGNYVAFIAPKPYECDNRLEAHA
FT                   WVHRVVYATGKRNIRETGRSWVSMPERSASEITLWEDEEQSRKWYSMTPVFSSWTEKQK
FT                   LFEMCEKGAGLLKGAMGTPDDEEYGDLLEMWGDAYIACNASGEHVTTPDMFLPVGLIKS
FT                   RKSLKLIALGTCSTEHWMYARAGDDDSRELLLELYTSWYEYPDKARARLLSMAEKNSGL
FT                   RFVLLEGKSRKLERFAVKRPEEIVNWHAGNLKEIPTMLNDQWACHMAMVSQNDKVYLTP
FT                   DLLDDDGLPNFNGVTRQVPGEGYQPVNVYEFESDYFNAVYDADGKKVALCHWYDVTDNS
FT                   YSAEELIGNMPHNAFKFLQYRLDNIEQAEAFIKYRNRNYQPRENADWPEPPEGVKRYVI
FT                   RARS"
FT   RBS             148723..148729
FT                   /note="possible RBS"
FT   CDS             148734..149120
FT                   /transl_table=11
FT                   /gene="HCM1.196"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.196, hypothetical protein, len: 128 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5K0"
FT                   /protein_id="CAD09785.1"
FT                   /translation="MGVDMNYEFQKKSPKGWDRVNDNFSNDRSYLLYSWLGLDARNTWG
FT                   VAAITPLRGLPDDIELQWDEDGCDDYWGEHSQTWLLSDEILASTSPVAIEDDEPGSVVA
FT                   EFCAEVQRLHGLHGTVRIVLGFTG"
FT   CDS             complement(149132..149557)
FT                   /transl_table=11
FT                   /gene="HCM1.197c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.197c, hypothetical protein, len: 141 aa;
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5J9"
FT                   /protein_id="CAD09786.1"
FT                   /translation="MTDQASIPVDTPVLALATDAYSSLKNILNDNGTSDTTGTCMFASL
FT                   LVCEFAHRRGMSAAVRGGNGTDDGGIFNESGGHGHYWCEVSAGEMIFYIDIAAEQFGYP
FT                   SFIIKNANDVSGWPRYIPGDQVTVDEHVRITLSGGIR"
FT   RBS             complement(149568..149571)
FT                   /note="possible RBS"
FT   CDS             complement(149591..150064)
FT                   /transl_table=11
FT                   /gene="HCM1.198c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.198c, hypothetical protein, len: 157 aa;
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935J0"
FT                   /protein_id="CAD09787.1"
FT                   /translation="MGSIKELLFDIQEEWRHEWISINYPEAEEETLEWDAAAQEYSWFR
FT                   DWMEEAAEQQHFEASLNCIPERLQEALDELHELQGLLETEQLIVSPNLLSELKNLSIQE
FT                   GYMLKIENVLPPNFRVFLVREGFIFPGESWVCGSGYWLPESEVLKNGINSLLV"
FT   CDS             complement(150147..150506)
FT                   /transl_table=11
FT                   /gene="HCM1.199c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.199c, hypothetical protein, len: 119 aa;
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935I9"
FT                   /protein_id="CAD09788.1"
FT                   /translation="MWHNGLPRTVIINNMDVVIRKLIMEISISLDVLFEALMILGHGRV
FT                   WMQEMEFENLPGYSCYRELRTWDNRIVAWWSDADDTWYLCVEVDVITAVPSHIPNKKGE
FT                   LSEEVCFQLMALGRY"
FT   RBS             151041..151045
FT                   /note="possible RBS"
FT   CDS             151052..152449
FT                   /transl_table=11
FT                   /gene="HCM1.201"
FT                   /product="putative transposase"
FT                   /note="HCM1.201, possible transposase, len: 465 aa; similar
FT                   to many e.g. SW:TRA2_STRPN (EMBL:U04047) Streptococcus
FT                   pneumoniae transposase for insertion sequence IS1202 (465
FT                   aa), fasta scores; E(): 8.9e-14, 26.8% identity in 332 aa
FT                   overlap and SW:Y4BF_RHISN (EMBL:AE000065), Y4BF, Rhizobium
FT                   sp. (strain NGR234) putative transposase from plasmid sym
FT                   pNGR234a (457 aa), fasta scores; E(): 0, 44.6% identity in
FT                   426 aa overlap. Contains a probable helix-turn-helix motif
FT                   at aa 28-49 (Score 1752, +5.15 SD)"
FT                   /db_xref="GOA:Q935I8"
FT                   /db_xref="InterPro:IPR001584"
FT                   /db_xref="InterPro:IPR009057"
FT                   /db_xref="InterPro:IPR012337"
FT                   /db_xref="UniProtKB/TrEMBL:Q935I8"
FT                   /protein_id="CAD09789.1"
FT                   /translation="MAIHDAGMFTVKEINRLKILQDVVERNLRPGQAAEMLGITPRHCS
FT                   RLLKRYRQSGPLGMNNQSRGRTGNRLLPTSLTDQALSIIRERYRDFGPTLAREKLEEVH
FT                   GLVLGKETIRRLMIKAGLWIPRRQRAPKIHQPRYRRPCTGELIQIDGCDHHWFENRGRP
FT                   CTALVYVDDATSRLMHLLFVKSESTFSYFEATRGYIEKYGKPMILYSDKASVFRVNNKH
FT                   ATTGPGETQFARAMRCLNITPLCAETSQAKGRVERAHLTLQDRLVKELRLKGISTIEAA
FT                   NAFAEEYMADYNRRFAKAPLHDFNAHRPLALDDDLDAEFTWREPRRVSKSLTVQYDKML
FT                   YLIEDSEYSRRAIGKYIDVWHYPDGHKELRLNGVLLPYSTYDRLSEVDPVAIVDNKRLG
FT                   HVLDVARQVQKKRDNNRSQSLPSGDEPSRRRHAPGINKSQRSLNEDDLLEAIIKLQGSS
FT                   EAIFGKR"
FT   CDS             152712..153518
FT                   /transl_table=11
FT                   /gene="HCM1.203"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.203, hypothetical protein, len: 268 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935I7"
FT                   /protein_id="CAD09790.1"
FT                   /translation="MYMTGQEINDKKKEYLELLDREENEQIYQTYLEENTMFIPREFEQ
FT                   NHGIHFSTVFRKLPLSSDYKPDFVYLSKSSDNWNVVLVEIEKPSSKYFKNNSTTFHADF
FT                   NLALQQMNTWRAWFDDESNRNHFKNNILQGFIEPAHMGRNPFNFKYVLVHGRRSEYENN
FT                   TQKTALIRGQQRSDFSIISFDSLAENIEKKYKLYVGVKKNSHYELISKEFVDEGIFSWM
FT                   NIDFLAITQSIYDDAIAKSDSWHHYIIKENGTVKTMDYALPRIKII"
FT   repeat_region   complement(153546..153558)
FT                   /note="13 bp inverted repeat flanking IS1"
FT   repeat_region   complement(153546..154293)
FT                   /note="IS1"
FT   CDS             complement(153551..154054)
FT                   /transl_table=11
FT                   /gene="insB"
FT                   /gene_synonym="HCM1.204c"
FT                   /product="putative IS1 transposase"
FT                   /note="HCM1.204c, insB, possible IS1 transposase, len: 167
FT                   aa; highly similar to many from Enterobacteriaceae e.g.
FT                   SW:ISB_ECOLI (EMBL:D10483), insB, Escherichia coli
FT                   insertion element IS1 protein InsB (167 aa), fasta scores;
FT                   E(): 0, 97.0% identity in 167 aa overlap"
FT                   /db_xref="GOA:Q7AQU0"
FT                   /db_xref="InterPro:IPR005063"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQU0"
FT                   /protein_id="CAD09791.1"
FT                   /translation="MPGNRPHYGRWPQHDFPPFKKLRPQSVTSRIQPGSDVIVCAEMDE
FT                   QWGYVGAKSRQRWLFYAYDRLRKTVVAHVFGERTMATLGRLMSLLSPFDVVIWMTDGWP
FT                   LYESRLKGKLHVISKRYTQRIERHNLNLRQHLARLGRKSLSFSKSVELHDKVIGHYLNI
FT                   KHYQ"
FT   CDS             complement(153973..154248)
FT                   /transl_table=11
FT                   /gene="insA"
FT                   /gene_synonym="HCM1.205c"
FT                   /product="putative IS1 transposase"
FT                   /note="HCM1.205c, insA, probable IS1 transposase, len: 91
FT                   aa; highly similar to many from Enterobacteriaceae e.g.
FT                   SW:ISA1_ECOLI (EMBL:X52534), insA, Escherichia coli
FT                   insertion element IS1 protein InsA (91 aa), fasta scores;
FT                   E(): 0, 97.8% identity in 91 aa overlap. Contains PS00017
FT                   ATP/GTP-binding site motif A (P-loop). Contains a probable
FT                   helix-turn-helix motif at aa 64-85 (Score 1462, +4.17 SD)"
FT                   /db_xref="GOA:Q7AQV4"
FT                   /db_xref="InterPro:IPR003220"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQV4"
FT                   /protein_id="CAD09792.1"
FT                   /translation="MASVSISCPSCSATDGVVRNGKSTAGHQRYLCSHCRKTWQLQFTY
FT                   TASQPGTHQKIIDMAMNGVGCRATARIMGVGLNTIFRHLKNSGRSR"
FT   misc_feature    complement(153992..153997)
FT                   /note="possible translational frameshift site, similar to
FT                   that determined experimentally (EMBL:X52534)"
FT   misc_feature    complement(154180..154203)
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   repeat_region   complement(154281..154293)
FT                   /note="13 bp inverted repeat flanking IS1"
FT   RBS             154514..154519
FT                   /note="possible RBS"
FT   CDS             154527..155186
FT                   /transl_table=11
FT                   /gene="cat"
FT                   /gene_synonym="HCM1.206"
FT                   /product="chloramphenicol acetyltransferase"
FT                   /EC_number="2.3.1.28"
FT                   /note="HCM1.206, cat, chloramphenicol acetyltransferase,
FT                   len: 219 aa; highly similar or identical to many e.g.
FT                   SW:CAT_ECOLI (EMBL:V00623), cat, Escherichia coli
FT                   chloramphenicol acetyltransferase (EC 2.3.1.28) (219 aa),
FT                   fasta scores; E(): 0, 100.0% identity in 219 aa overlap.
FT                   Contains Pfam match to entry PF00302 CAT, Chloramphenicol
FT                   acetyltransferase and PS00100 Chloramphenicol
FT                   acetyltransferase active site"
FT                   /db_xref="GOA:P62580"
FT                   /db_xref="InterPro:IPR001707"
FT                   /db_xref="InterPro:IPR018372"
FT                   /db_xref="UniProtKB/Swiss-Prot:P62580"
FT                   /protein_id="CAD09793.1"
FT                   /translation="MEKKITGYTTVDISQWHRKEHFEAFQSVAQCTYNQTVQLDITAFL
FT                   KTVKKNKHKFYPAFIHILARLMNAHPEFRMAMKDGELVIWDSVHPCYTVFHEQTETFSS
FT                   LWSEYHDDFRQFLHIYSQDVACYGENLAYFPKGFIENMFFVSANPWVSFTSFDLNVANM
FT                   DNFFAPVFTMGKYYTQGDKVLMPLAIQVHHAVCDGFHVGRMLNELQQYCDEWQGGA"
FT   misc_feature    154542..155153
FT                   /note="Pfam match to entry PF00302 CAT, Chloramphenicol
FT                   acetyltransferase, score 526.70, E-value 1.7e-154"
FT   misc_feature    155094..155126
FT                   /note="PS00100 Chloramphenicol acetyltransferase active
FT                   site"
FT   CDS             complement(155387..155764)
FT                   /transl_table=11
FT                   /gene="HCM1.207c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.207c, hypothetical protein, len: 125 aa;
FT                   identical to TR:Q9WTH2 (EMBL:AP000342), ybjA, Shigella
FT                   flexneri hypothetical protein from plasmid R100 (125 aa),
FT                   fasta scores; E(): 0, 100.0% identity in 125 aa overlap.
FT                   Also shows weak similarity to other hypothetical proteins
FT                   e.g. TR:O87371 (EMBL:AF051917) Staphylococcus aureus
FT                   hypothetical protein from plasmid pSK41 (130 aa), fasta
FT                   scores; E(): 0.0038, 31.2% identity in 109 aa overlap"
FT                   /db_xref="GOA:Q7AQT8"
FT                   /db_xref="InterPro:IPR000182"
FT                   /db_xref="InterPro:IPR016181"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQT8"
FT                   /protein_id="CAD09794.1"
FT                   /translation="MKDYLCKKLFNRLSGTLVIRARCGNNITGLACCNILYPSPRYSGQ
FT                   LHIKELYVSQCDRNKGTGKAIMRFIARLALEQECLSLSWNAEKSNPGANRFYQALGGRI
FT                   NDHIVNYYLHGESLSKLASGI"
FT   RBS             complement(155772..155775)
FT                   /note="possible RBS"
FT   repeat_region   155823..155834
FT                   /note="12 bp inverted repeat flanking IS4321"
FT   repeat_region   155823..157139
FT                   /note="IS4321"
FT   CDS             complement(156075..157079)
FT                   /transl_table=11
FT                   /gene="HCM1.209c"
FT                   /product="putative transposase"
FT                   /note="HCM1.209c, probable transposase, len: 334 aa; highly
FT                   similar to many e.g. SW:TRA8_YEREN (EMBL:Z48244) Yersinia
FT                   enterocolitica transposase for insertion sequence element
FT                   IS1328 (334 aa), fasta scores; E(): 0, 66.3% identity in
FT                   332 aa overlap and TR:P77600 (EMBL:U67194), tnpA,
FT                   Escherichia coli putative transposase from plasmid
FT                   IncP-beta R751 (334 aa), fasta scores; E(): 0, 99.4%
FT                   identity in 334 aa overlap"
FT                   /db_xref="GOA:Q935I6"
FT                   /db_xref="InterPro:IPR002525"
FT                   /db_xref="InterPro:IPR003346"
FT                   /db_xref="UniProtKB/TrEMBL:Q935I6"
FT                   /protein_id="CAD09795.1"
FT                   /translation="MENIALIGIDLGKNSFHIHCQDRRGKAVYRKKFTRPKLIEFLATC
FT                   PATTIAMEACGGSHFMARKLEELGHSPKLISPQFVRPFVKSNKNDFVDAEAICEAASRP
FT                   SMRFVQPRTESQQAMRALHRVRESLVQDKVKTTNQMHAFLLEFGISVPRGAAVISRLST
FT                   ILEDNSLPLYLSQLLLKLQQHYHYLVEQIKDLESQLKRKLDEDEVGQRLLSIPCVGTLT
FT                   ASTISTEIGDGKQYASSRDFAAATGLVPRQYSTGGRTTLLGISKRGNKKIRTLLVQCAR
FT                   VFIQKLEHQSGKLADWVRDLLCRKSNFVVTCALANKLARIAWALTARQQTYVA"
FT   RBS             complement(157087..157090)
FT                   /note="possible RBS"
FT   repeat_region   complement(157128..157139)
FT                   /note="12 bp inverted repeat flanking IS4321"
FT   CDS             complement(join(157158..159638,160461..>160654))
FT                   /pseudo
FT                   /codon_start=3
FT                   /transl_table=11
FT                   /gene="tnpA"
FT                   /gene_synonym="HCM1.210c"
FT                   /product="transposase (pseudogene)"
FT                   /note="HCM1.210c, tnpA, transposase (pseudogene), len: 2481
FT                   bp; highly similar to many e.g. SW:TRA3_ECOLI
FT                   (EMBL:X04891), tnpA, Escherichia coli transposase for
FT                   transposon TN21 (988 aa), fasta scores; E(): 0, 98.9%
FT                   identity in 826 aa overlap. The N-terminus is truncated.
FT                   Contains Pfam match to entry PF01526 Transposase_7,
FT                   Transposase"
FT                   /db_xref="PSEUDO:CAD09796.1"
FT   misc_feature    complement(157227..159638)
FT                   /note="Pfam match to entry PF01526 Transposase_7,
FT                   Transposase, score 1653.00, E-value 0"
FT   CDS             complement(159604..160230)
FT                   /transl_table=11
FT                   /gene="HCM1.211c"
FT                   /product="putative transposase"
FT                   /note="HCM1.211c, probable transposase, len: 208 aa; highly
FT                   similar to many e.g. TR:Q52625 (EMBL:X00011) Proteus
FT                   vulgaris transposon Tn 2680 (204 aa), fasta scores; E(): 0,
FT                   100.0% identity in 197 aa overlap. Has no stop codon within
FT                   the inverted repeats of the putative transposable unit"
FT                   /db_xref="UniProtKB/TrEMBL:Q935I5"
FT                   /protein_id="CAD09797.1"
FT                   /translation="MIAFNHVVPVLNLSVFNVRRAPAFAFEQSKRATIGGRFIRVDESR
FT                   DLPLLHVVEDFTQKPVCSFAVTTGGEIKIDSAAPAVDGPVQIRPAAIDLHVGFIHVPRA
FT                   KIGRVTPVPAQPFFHFRRITLNPAVNRGVIDIHSAFSQHLLQLTVTDAVFAVPAYGPQN
FT                   DVTLKMPAFEWVHVQLHQQKGMISLSPPTICNSARAGECRGDHPC"
FT   repeat_region   complement(159639..159653)
FT                   /note="15 bp inverted repeat flanking IS15/26"
FT   repeat_region   complement(159639..160460)
FT                   /note="IS15/26"
FT   repeat_region   complement(160446..160460)
FT                   /note="15 bp inverted repeat flanking IS15/26"
FT   misc_feature    complement(160461..160655)
FT                   /note="Pfam match to entry PF01526 Transposase_7,
FT                   Transposase, score 76.10, E-value 7.6e-20"
FT   repeat_region   complement(160655..160668)
FT                   /note="14 bp inverted repeat flanking IS15/26"
FT   repeat_region   complement(160655..161474)
FT                   /note="IS15/26"
FT   CDS             complement(160707..161411)
FT                   /transl_table=11
FT                   /gene="HCM1.213c"
FT                   /product="putative transposase"
FT                   /note="HCM1.213c, probable transposase, len: 234 aa; highly
FT                   similar to many e.g. TR:Q56369 (EMBL:M12900) probable
FT                   transposase from IS15-R (234 aa), fasta scores; E(): 0,
FT                   99.6% identity in 234 aa overlap. Contains Pfam match to
FT                   entry PF01438 Transposase_3, Transposase"
FT                   /db_xref="GOA:Q7AQT7"
FT                   /db_xref="InterPro:IPR001584"
FT                   /db_xref="InterPro:IPR012337"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQT7"
FT                   /protein_id="CAD09798.1"
FT                   /translation="MNPFKGRHFQRDIILWAVRWYCKYGISYRELQEMLAERGVNVDHS
FT                   TIYRWVQRYAPEMEKRLRWYWRNPSDLCPWHMDETYVKVNGRWAYLYRAVDSRGRTVDF
FT                   YLSSRRNSKAAYRFLGKILNNVKKWQIPRFINTDKAPAYGRALALLKREGRCPSDVEHR
FT                   QIKYRNNVIECDHGKLKRIIGATLGFKSMKTAYATIKGIEVMRALRKGQASAFYYGDPL
FT                   GEMRLVSRVFEM"
FT   misc_feature    complement(160809..161411)
FT                   /note="Pfam match to entry PF01438 Transposase_3,
FT                   Transposase, score 501.80, E-value 5.3e-147"
FT   RBS             complement(161418..161421)
FT                   /note="possible RBS"
FT   repeat_region   complement(161461..161474)
FT                   /note="14 bp inverted repeat flanking IS15/26"
FT   misc_feature    161477..161701
FT                   /note="Pfam match to entry PF00239 recombinase,
FT                   Site-specific recombinases, score 106.60, E-value 1.3e-28"
FT   CDS             161477..161728
FT                   /pseudo
FT                   /transl_table=11
FT                   /gene="HCM1.215"
FT                   /product="putative resolvase (pseudogene)"
FT                   /note="HCM1.215, probable resolvase (pseudogene), len: 252
FT                   bp; similar to many e.g. SW:TNP4_KLEPN (EMBL:M55547), tnpR,
FT                   Klebsiella pneumoniae transposon Tn1331 resolvase from
FT                   plasmid pJHC-MW1 (185 aa), fasta scores; E(): 2e-30, 89.5%
FT                   identity in 95 aa overlap. Contains Pfam match to entry
FT                   PF00239 recombinase, Site-specific recombinases"
FT                   /db_xref="PSEUDO:CAD09799.1"
FT   RBS             161900..161905
FT                   /note="possible RBS"
FT   CDS             161911..162771
FT                   /transl_table=11
FT                   /gene="bla"
FT                   /gene_synonym="HCM1.216"
FT                   /product="beta-lactamase"
FT                   /EC_number="3.5.2.6"
FT                   /note="HCM1.216, bla, beta-lactamase, len: 286 aa; highly
FT                   similar to many e.g. SW:BLAT_ECOLI (EMBL:J01749), bla,
FT                   Escherichia coli beta-lactamase precursor encoded by
FT                   several plasmids (EC 3.5.2.6) (286 aa), fasta scores; E():
FT                   0, 100.0% identity in 286 aa overlap. Contains Pfam match
FT                   to entry PF00144 beta-lactamase, Beta-lactamase and PS00146
FT                   Beta-lactamase class-A active site"
FT                   /db_xref="GOA:P62594"
FT                   /db_xref="InterPro:IPR000871"
FT                   /db_xref="InterPro:IPR001466"
FT                   /db_xref="InterPro:IPR012338"
FT                   /db_xref="UniProtKB/Swiss-Prot:P62594"
FT                   /protein_id="CAD09800.1"
FT                   /translation="MSIQHFRVALIPFFAAFCLPVFAHPETLVKVKDAEDQLGARVGYI
FT                   ELDLNSGKILESFRPEERFPMMSTFKVLLCGAVLSRVDAGQEQLGRRIHYSQNDLVEYS
FT                   PVTEKHLTDGMTVRELCSAAITMSDNTAANLLLTTIGGPKELTAFLHNMGDHVTRLDRW
FT                   EPELNEAIPNDERDTTMPAAMATTLRKLLTGELLTLASRQQLIDWMEADKVAGPLLRSA
FT                   LPAGWFIADKSGAGERGSRGIIAALGPDGKPSRIVVIYTTGSQATMDERNRQIAEIGAS
FT                   LIKHW"
FT   misc_feature    161992..162768
FT                   /note="Pfam match to entry PF00144 beta-lactamase,
FT                   Beta-lactamase, score 425.70, E-value 4.2e-124"
FT   misc_feature    162100..162147
FT                   /note="PS00146 Beta-lactamase class-A active site"
FT   CDS             162921..163322
FT                   /pseudo
FT                   /transl_table=11
FT                   /gene="HCM1.217"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.217, hypothetical protein, len: 133 aa; unknown
FT                   function, similar to parts of several bacterial
FT                   hypothetical proteins e.g. TR:AAA92748 (EMBL:L06418), sulI,
FT                   Escherichia coli hypothetical protein from plasmid pDGO100
FT                   (341 aa), fasta scores; E(): 1.3e-29, 76.3% identity in 93
FT                   aa overlap"
FT                   /db_xref="PSEUDO:CAD09801.1"
FT   repeat_region   163306..163319
FT                   /note="14 bp inverted repeat flanking IS15/26"
FT   repeat_region   163306..164125
FT                   /note="IS15/26"
FT   RBS             163359..163362
FT                   /note="possible RBS"
FT   misc_feature    163369..163971
FT                   /note="Pfam match to entry PF01438 Transposase_3,
FT                   Transposase, score 501.80, E-value 5.3e-147"
FT   CDS             163369..164073
FT                   /transl_table=11
FT                   /gene="HCM1.219"
FT                   /product="putative transposase"
FT                   /note="HCM1.219, probable transposase, len: 234 aa; highly
FT                   similar to many e.g. TR:Q56369 (EMBL:M12900) probable
FT                   transposase from IS15-R (234 aa), fasta scores; E(): 0,
FT                   99.6% identity in 234 aa overlap. Contains Pfam match to
FT                   entry PF01438 Transposase_3, Transposase"
FT                   /db_xref="GOA:Q7AQT7"
FT                   /db_xref="InterPro:IPR001584"
FT                   /db_xref="InterPro:IPR012337"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQT7"
FT                   /protein_id="CAD09802.1"
FT                   /translation="MNPFKGRHFQRDIILWAVRWYCKYGISYRELQEMLAERGVNVDHS
FT                   TIYRWVQRYAPEMEKRLRWYWRNPSDLCPWHMDETYVKVNGRWAYLYRAVDSRGRTVDF
FT                   YLSSRRNSKAAYRFLGKILNNVKKWQIPRFINTDKAPAYGRALALLKREGRCPSDVEHR
FT                   QIKYRNNVIECDHGKLKRIIGATLGFKSMKTAYATIKGIEVMRALRKGQASAFYYGDPL
FT                   GEMRLVSRVFEM"
FT   repeat_region   complement(164112..164125)
FT                   /note="14 bp inverted repeat flanking IS15/26"
FT   CDS             164126..164842
FT                   /pseudo
FT                   /transl_table=11
FT                   /gene="HCM1.220"
FT                   /product="putative replication initiation protein
FT                   (pseudogene)"
FT                   /note="HCM1.220, probable replication initiation protein
FT                   (pseudogene), len: 717 bp; highly similar to SW:REPJ_ECOLI
FT                   (EMBL:M28829), repA, Escherichia coli regulatory protein
FT                   from plasmid IncQ RSF1010 (279 aa), fasta scores; E(): 0,
FT                   100.0% identity in 235 aa overlap. N-terminus is truncated"
FT   CDS             164829..165680
FT                   /transl_table=11
FT                   /gene="HCM1.221"
FT                   /product="putative replication protein"
FT                   /note="HCM1.221, probable replication protein, len: 283 aa;
FT                   highly similar to TR:Q52351 (EMBL:M28829), repC,
FT                   Escherichia coli replication protein from plasmid IncQ
FT                   RSF1010 (283 aa), fasta scores; E(): 0, 98.6% identity in
FT                   283 aa overlap. Contains PS00017 ATP/GTP-binding site motif
FT                   A (P-loop)"
FT                   /db_xref="InterPro:IPR010522"
FT                   /db_xref="UniProtKB/TrEMBL:Q935I4"
FT                   /protein_id="CAD09804.1"
FT                   /translation="MVKPKNKHSLSHVRHDPAHCLAPGLFRALKRGERKRSKLDVTYDY
FT                   GDGKRIEFSGPEPLGADDLRILQGLVAMAGPNGLVLGPEPKTEGGRQLRLFLEPKWEAV
FT                   TADAMVVKGSYRALAKEIGAEVDSGGALKHIQDCIERLWKVSIIAQNGRKRQGFRLLSE
FT                   YASDEADGRLYVALNPLIAQAVMGGGQHVRISMDEVRALDSETARLLHQRLCGWIDPGK
FT                   TGKASIDTLCGYVWPSEASGSTMRKRRQRVREALPELVALGWTVTEFAAGKYDITRPKA
FT                   AG"
FT   misc_feature    165474..165497
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   CDS             165988..166803
FT                   /transl_table=11
FT                   /gene="HCM1.222"
FT                   /product="dihydropteroate synthase"
FT                   /EC_number="2.5.1.15"
FT                   /note="HCM1.222, dihydropteroate synthase, len: 271 aa;
FT                   highly similar to many e.g. SW:DHP2_ECOLI (EMBL:M36657),
FT                   sulII, Escherichia coli dihydropteroate synthase type II
FT                   encoded by several plasmids (EC 2.5.1.15) (271 aa), fasta
FT                   scores; E(): 0, 99.6% identity in 271 aa overlap. Contains
FT                   Pfam match to entry PF00809 DHPS, Dihydropteroate synthase
FT                   and PS00792 Dihydropteroate synthase signature 1"
FT                   /db_xref="GOA:Q935I3"
FT                   /db_xref="HSSP:1EYE"
FT                   /db_xref="InterPro:IPR000489"
FT                   /db_xref="InterPro:IPR006390"
FT                   /db_xref="InterPro:IPR011005"
FT                   /db_xref="UniProtKB/TrEMBL:Q935I3"
FT                   /protein_id="CAD09805.1"
FT                   /translation="MNKSLIIFGIVNITSDSFSDGGRYLAPDAAIAQARKLMAEGADVI
FT                   DLGPASSNPDAAPVSSDTEIERIAPVLDALKADGIPVSLDSYQPATQAYALSRGVAYLN
FT                   DIRGFPDAAFYPQLAKSSAKLVVMHSVQDGQADRREAPAGDIMDHIAAFFDARIAALTG
FT                   AGIKRNRLVLDPGMGFFLGAAPETSLSVLARFDELRLRFDLPVLLSVSRKSFLRALTGR
FT                   GPGDVGAATLAAELAAAAGGADFIRTHEPRPLRDGLAVLAALKETARIR"
FT   misc_feature    166006..166053
FT                   /note="PS00792 Dihydropteroate synthase signature 1"
FT   misc_feature    166009..166776
FT                   /note="Pfam match to entry PF00809 DHPS, Dihydropteroate
FT                   synthase, score 433.90, E-value 1.4e-126"
FT   misc_feature    166108..166149
FT                   /note="PS00793 Dihydropteroate synthase signature 2"
FT   RBS             166852..166856
FT                   /note="possible RBS"
FT   misc_feature    166864..167658
FT                   /note="Pfam match to entry PF01636 APH, Aminoglycoside
FT                   phosphotransferase, score 454.70, E-value 7.7e-133"
FT   CDS             166864..167667
FT                   /transl_table=11
FT                   /gene="strA"
FT                   /gene_synonym="HCM1.223"
FT                   /product="streptomycin phosphotransferase"
FT                   /note="HCM1.223, strA, streptomycin phosphotransferase,
FT                   len: 267 aa; highly similar to many e.g. TR:Q57009
FT                   (EMBL:M95402), strA, Erwinia amylovora streptomycin
FT                   phosphotransferase from plasmid pEa34 (267 aa), fasta
FT                   scores; E(): 0, 99.6% identity in 267 aa overlap and
FT                   SW:APHE_STRGR (EMBL:X53527), aphE, Streptomyces griseus
FT                   streptomycin 3''-kinase (EC 2.7.1.87) (272 aa), fasta
FT                   scores; E(): 0, 51.1% identity in 262 aa overlap. Contains
FT                   Pfam match to entry PF01636 APH, Aminoglycoside
FT                   phosphotransferase"
FT                   /db_xref="GOA:Q7AQT5"
FT                   /db_xref="InterPro:IPR002575"
FT                   /db_xref="InterPro:IPR011009"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQT5"
FT                   /protein_id="CAD09806.1"
FT                   /translation="MNRTNIFFGESHSDWLPVRGGESGDFVFRRGDGHAFAKIAPASRR
FT                   GELAGERDRLIWLKGRGVACPEVINWQEEQEGACLVITAIPGVPAADLSGADLLKAWPS
FT                   MGQQLGAVHSLSVDQCPFERRLSRMFGRAVDVVSRNAVNPDFLPDEDKSTPQLDLLARV
FT                   ERELPVRLDQERTDMVVCHGDPCMPNFMVDPKTLQCTGLIDLGRLGTADRYADLALMIA
FT                   NAEENWAAPDEAERAFAVLFNVLGIEAPDRERLAFYLRLDPLTWG"
FT   CDS             167667..168503
FT                   /transl_table=11
FT                   /gene="strB"
FT                   /gene_synonym="HCM1.224"
FT                   /product="streptomycin phosphotransferase"
FT                   /note="HCM1.224, strB, streptomycin phosphotransferase,
FT                   len: 278 aa; highly similar to many e.g. TR:Q57204
FT                   (EMBL:M95402), strB, Erwinia amylovora streptomycin
FT                   phosphotransferase from plasmid pEa34 (278 aa), fasta
FT                   scores; E(): 0, 100.0% identity in 278 aa overlap"
FT                   /db_xref="GOA:Q7AQT4"
FT                   /db_xref="InterPro:IPR006748"
FT                   /db_xref="InterPro:IPR011009"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQT4"
FT                   /protein_id="CAD09807.1"
FT                   /translation="MFMPPVFPAHWHVSQPVLIADTFSSLVWKVSLPDGTPAIVKGLKP
FT                   IEDIADELRGADYLVWRNGRGAVRLLGRENNLMLLEYAGERMLSHIVAEHGDYQATEIA
FT                   AELMAKLYAASEEPLPSALLPIRDRFAALFQRARDDQNAGCQTDYVHAAIIADQMMSNA
FT                   SELRGLHGDLHHENIMFSSRGWLVIDPVGLVGEVGFGAANMFYDPADRDDLCLDPRRIA
FT                   QMADAFSRALDVDPRRLLDQAYAYGCLSAAWNADGEEEQRDLAIAAAIKQVRQTSY"
FT   repeat_region   168511..168525
FT                   /note="15 bp inverted repeat flanking IS15/26"
FT   repeat_region   168511..169332
FT                   /note="IS15/26"
FT   CDS             168741..169361
FT                   /transl_table=11
FT                   /gene="HCM1.225"
FT                   /product="putative transposase"
FT                   /note="HCM1.225, probable transposase, len: 206 aa; highly
FT                   similar to many e.g. TR:Q52625 (EMBL:X00011) Proteus
FT                   vulgaris transposon Tn 2680 (204 aa), fasta scores; E(): 0,
FT                   99.5% identity in 197 aa overlap. Has no stop codon within
FT                   the inverted repeats of the putative transposable unit"
FT                   /db_xref="UniProtKB/TrEMBL:Q935I2"
FT                   /protein_id="CAD09808.1"
FT                   /translation="MIAFNHVVPVLNLSVFNVRRAPAFAFEQSKRATIGGRFIRVDESR
FT                   DLPLLHVVEDFTQKPVCSFAVTTGGEIKIDSAAPAVNGPVQIRPAAIDLHVGFIHVPRA
FT                   KIGRVTPVPAQPFFHFRRITLNPAVNRGVIDIHSAFSQHLLQLTVTDAVFAVPAYGPQN
FT                   DVTLKMPAFEWVHVQLHQQKGMISLSPPTICNSAHRRSSGCGR"
FT   repeat_region   complement(169318..169332)
FT                   /note="15 bp inverted repeat flanking IS15/26"
FT   CDS             complement(169333..170619)
FT                   /pseudo
FT                   /transl_table=11
FT                   /gene="HCM1.226c"
FT                   /product="putative transposase (pseudogene)"
FT                   /note="HCM1.226c, possible transposase (pseudogene), len:
FT                   429 aa; highly similar to many e.g. TR:Q56381
FT                   (EMBL:U42226), tniA, Shigella flexneri possible transposase
FT                   from plasmid R100 (571 aa), fasta scores; E(): 0, 100.0%
FT                   identity in 429 aa overlap. Truncated at the C-terminus"
FT   CDS             complement(170658..171365)
FT                   /transl_table=11
FT                   /gene="HCM1.227c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.227c, hypothetical protein, len: 235 aa;
FT                   similar to many hypothetical proteins e.g. TR:Q9WTI2
FT                   (EMBL:AP000342), yaeA, Shigella flexneri hypothetical
FT                   protein from plasmid R100 (235 aa), fasta scores; E(): 0,
FT                   100.0% identity in 235 aa overlap. Contains Pfam match to
FT                   entry PF00563 DUF2, Domain of unknown function 2"
FT                   /db_xref="InterPro:IPR001633"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQT3"
FT                   /protein_id="CAD09810.1"
FT                   /translation="MTSSQPAGWTAAELAQAAARGQLDLHYQPLVDLRDHRIAGAEALM
FT                   RWRHPRLGLLPPGQFLPLAESFGLMPEIGAWVLGEACRQMHKWQGPAWQPFRLAINVSA
FT                   SQVGPTFDDEVKRVLADMALPAELLEIELTESVAFGNPALFASFDALRAIGVRFAADDF
FT                   GTGYSCLQHLKCCPITTLKIDQSFVARLPDDARDQTIVRAVIQLAHGLGMDVIFRRRLH
FT                   QLIGRNGCCAASS"
FT   misc_feature    complement(170664..171338)
FT                   /note="Pfam match to entry PF00563 DUF2, Domain of unknown
FT                   function 2, score 197.30, E-value 2.4e-55"
FT   CDS             complement(171362..171598)
FT                   /transl_table=11
FT                   /gene="HCM1.229c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.229c, hypothetical protein, len: 78 aa; highly
FT                   similar to ORFs from transposable elements containing
FT                   mer-operons e.g. TR:Q57069 (EMBL:X03405), merE, Pseudomonas
FT                   aeruginosa hypothetical protein from plasmid R100 (78 aa),
FT                   fasta scores; E(): 1.3e-22, 98.7% identity in 78 aa
FT                   overlap"
FT                   /db_xref="InterPro:IPR007746"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQT2"
FT                   /protein_id="CAD09811.1"
FT                   /translation="MNAPDKLPPETRQPVSGYLWGALAVLTCPCHLPILAAVLAGTTAG
FT                   AFLGEHWGVAALALTGLFVLAVTRLLRAFRGGS"
FT   CDS             complement(171595..171957)
FT                   /transl_table=11
FT                   /gene="merD"
FT                   /gene_synonym="HCM1.230c"
FT                   /product="putative mercuric resistance operon coregulator"
FT                   /note="HCM1.230c, merD, probable mercuric resistance operon
FT                   coregulator, len: 120 aa; highly similar to many e.g.
FT                   SW:MERD_SHIFL (EMBL:L29404), merD, Shigella flexneri
FT                   mercuric resistance protein from plasmid IncFII NR1 (120
FT                   aa), fasta scores; E(): 0, 99.2% identity in 120 aa
FT                   overlap. Similar to HCM1.159, merD, probable mercuric
FT                   resistance operon coregulator (121 aa), fasta scores; E():
FT                   0, 82.6% identity in 121 aa overlap"
FT                   /db_xref="GOA:Q7AQT1"
FT                   /db_xref="InterPro:IPR000551"
FT                   /db_xref="InterPro:IPR009061"
FT                   /db_xref="InterPro:IPR011797"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQT1"
FT                   /protein_id="CAD09812.1"
FT                   /translation="MSAYTVSQLAHNAGVSVHIVRDYLVRGLLRPVACTTGGYGVFDDA
FT                   ALQRLCFVRAAFEAGIGLDALARLCRALDAADGAQAAAQLAVLRQLVERRRAALAHLDA
FT                   QLASMPAERAHEEALP"
FT   RBS             complement(171606..171611)
FT                   /note="possible RBS"
FT   RBS             complement(171963..171970)
FT                   /note="possible RBS"
FT   CDS             complement(171975..173669)
FT                   /transl_table=11
FT                   /gene="merA"
FT                   /gene_synonym="HCM1.231c"
FT                   /product="putative mercuric reductase"
FT                   /EC_number="1.16.1.1"
FT                   /note="HCM1.231c, merA, probable mercuric reductase, len:
FT                   564 aa; highly similar to many e.g. SW:MERA_SHIFL
FT                   (EMBL:J01730), merA, Shigella flexneri mercuric reductase
FT                   from plasmid IncFII NR1 (EC 1.16.1.1) (564 aa), fasta
FT                   scores; E(): 0, 99.6% identity in 564 aa overlap. Contains
FT                   Pfam matches to entry PF00403 HMA, Heavy-metal-associated
FT                   domain and to entry PF00070 pyr_redox, Pyridine
FT                   nucleotide-disulphide oxidoreductase class-I. Contains
FT                   PS01047 Heavy-metal-associated domain and PS00076 Pyridine
FT                   nucleotide-disulphide oxidoreductases class-I active site.
FT                   Similar to HCM1.158, merA, probable mercuric reductase (561
FT                   aa), fasta scores; E(): 0, 85.0% identity in 565 aa
FT                   overlap"
FT                   /db_xref="GOA:Q7AQT0"
FT                   /db_xref="HSSP:1AFJ"
FT                   /db_xref="InterPro:IPR000815"
FT                   /db_xref="InterPro:IPR001327"
FT                   /db_xref="InterPro:IPR004099"
FT                   /db_xref="InterPro:IPR006121"
FT                   /db_xref="InterPro:IPR011796"
FT                   /db_xref="InterPro:IPR012999"
FT                   /db_xref="InterPro:IPR013027"
FT                   /db_xref="InterPro:IPR016156"
FT                   /db_xref="InterPro:IPR017969"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQT0"
FT                   /protein_id="CAD09813.1"
FT                   /translation="MSTLKITGMTCDSCAVHVKDALEKVPGVQSADVSYAKGSAKLAIE
FT                   VGTSPDALTAAVAGLGYRATLADAPSVSTPGGLLDKMRDLLGRNDKTGSSGALHIAVIG
FT                   SGGAAMAAALKAVEQGARVTLIERGTIGGTCVNVGCVPSKIMIRAAHIAHLRRESPFDG
FT                   GIAATTPTIQRTALLAQQQARVDELRHAKYEGILEGNPAITVLHGSARFKDNRNLIVQL
FT                   NDGGERVVAFDRCLIATGASPAVPPIPGLKDTPYWTSTEALVSETIPKRLAVIGSSVVA
FT                   LELAQAFARLGAKVTILARSTLFFREDPAIGEAVTAAFRMEGIEVREHTQASQVAYING
FT                   EGDGEFVLTTAHGELRADKLLVATGRAPNTRKLALDATGVTLTPQGAIVIDPGMRTSVE
FT                   HIYAAGDCTDQPQFVYVAAAAGTRAAINMTGGDAALNLTAMPAVVFTDPQVATVGYSEA
FT                   EAHHDGIKTDSRTLTLDNVPRALANFDTRGFIKLVVEEGSGRLIGVQAVAPEAGELIQT
FT                   AALAIRNRMTVQELADQLFPYLTMVEGLKLAAQTFNKDVKQLSCCAG"
FT   misc_feature    complement(171996..173372)
FT                   /note="Pfam match to entry PF00070 pyr_redox, Pyridine
FT                   nucleotide-disulphide oxidoreductase class-I, score 736.50,
FT                   E-value 1.2e-217"
FT   misc_feature    complement(173244..173276)
FT                   /note="PS00076 Pyridine nucleotide-disulphide
FT                   oxidoreductases class-I active site"
FT   misc_feature    complement(173472..173666)
FT                   /note="Pfam match to entry PF00403 HMA,
FT                   Heavy-metal-associated domain, score 84.70, E-value
FT                   9.7e-23"
FT   misc_feature    complement(173565..173654)
FT                   /note="PS01047 Heavy-metal-associated domain"
FT   RBS             complement(173678..173683)
FT                   /note="possible RBS"
FT   CDS             complement(173721..174143)
FT                   /transl_table=11
FT                   /gene="merC"
FT                   /gene_synonym="HCM1.232c"
FT                   /product="putative mercury transport protein"
FT                   /note="HCM1.232c, merC, probable mercury transport protein,
FT                   len: 140 aa; highly similar to many e.g. TR:O66048
FT                   (EMBL:U90263), merC, Pseudomonas stutzeri MerC protein from
FT                   plasmid pPB (141 aa), fasta scores; E(): 0, 63.5% identity
FT                   in 137 aa overlap. Contains hydrophobic, probable
FT                   membrane-spanning regions. Similar to HCM1.157, merC,
FT                   probable mercury transport protein (141 aa), fasta scores;
FT                   E(): 0, 73.0% identity in 141 aa overlap"
FT                   /db_xref="InterPro:IPR004891"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQS9"
FT                   /protein_id="CAD09814.1"
FT                   /translation="MGLMTRIADKTGALGSVVSAMGCAACFPALASFGAAIGLGFLSQY
FT                   EGLFISRLLPLFAALAFLANALGWFSHRQWLRSLLGMIGPAIVFAATVWLLGNWWTANL
FT                   MYVGLALMIGVSIWDFVSPAHRRCGPDGCELPAKRL"
FT   CDS             complement(174179..174454)
FT                   /transl_table=11
FT                   /gene="merP"
FT                   /gene_synonym="HCM1.233c"
FT                   /product="putative mercuric transport protein periplasmic
FT                   binding protein"
FT                   /note="HCM1.233c, merP, probable mercuric transport protein
FT                   periplasmic binding protein, len: 91 aa; highly similar to
FT                   many e.g. SW:MERP_SHIFL (EMBL:J01730), merP, Shigella
FT                   flexneri mercuric transport protein periplasmic component
FT                   precursor from plasmid IncFII NR1 (91 aa), fasta scores;
FT                   E(): 5.1e-32, 98.9% identity in 91 aa overlap. Contains
FT                   Pfam match to entry PF00403 HMA, Heavy-metal-associated
FT                   domain and PS01047 Heavy-metal-associated domain. Contains
FT                   a probable N-terminal signal sequence. Similar to HCM1.153,
FT                   merP, probable mercuric transport protein periplasmic
FT                   binding protein (91 aa), fasta scores; E(): 6.4e-31, 82.4%
FT                   identity in 91 aa overlap"
FT                   /db_xref="GOA:Q935I1"
FT                   /db_xref="HSSP:1AFJ"
FT                   /db_xref="InterPro:IPR001757"
FT                   /db_xref="InterPro:IPR001802"
FT                   /db_xref="InterPro:IPR006121"
FT                   /db_xref="InterPro:IPR011795"
FT                   /db_xref="InterPro:IPR017969"
FT                   /db_xref="UniProtKB/TrEMBL:Q935I1"
FT                   /protein_id="CAD09815.1"
FT                   /translation="MKKLFASLALAAAVAPVWAATQTVTLAVPGMTCVACPITVKKALS
FT                   KVEGVSKVDVGFEKREAVVTFDDTKASVQKLTKATADAGYPSSVKQ"
FT   misc_feature    complement(174188..174385)
FT                   /note="Pfam match to entry PF00403 HMA,
FT                   Heavy-metal-associated domain, score 95.50, E-value
FT                   7.9e-26"
FT   misc_feature    complement(174284..174373)
FT                   /note="PS01047 Heavy-metal-associated domain"
FT   RBS             complement(174461..174465)
FT                   /note="possible RBS"
FT   CDS             complement(174468..174818)
FT                   /transl_table=11
FT                   /gene="merT"
FT                   /gene_synonym="HCM1.234c"
FT                   /product="putative mercuric transport protein"
FT                   /note="HCM1.234c, merT, probable mercuric transport
FT                   protein, len: 116 aa; highly similar to many e.g.
FT                   SW:MERT_SHIFL (EMBL:J01730), merT, Shigella flexneri
FT                   mercuric transport protein from plasmid IncFII NR1 (116
FT                   aa), fasta scores; E(): 0, 100.0% identity in 116 aa
FT                   overlap. Contains hydrophobic, probable membrane-spanning
FT                   regions. Similar to HCM1.152, merT, probable mercuric
FT                   transport protein (121 aa), fasta scores; E(): 0, 93.0%
FT                   identity in 115 aa overlap"
FT                   /db_xref="GOA:P0A219"
FT                   /db_xref="InterPro:IPR003457"
FT                   /db_xref="UniProtKB/Swiss-Prot:P0A219"
FT                   /protein_id="CAD09816.1"
FT                   /translation="MSEPQNGRGALFAGGLAAILASTCCLGPLVLVALGFSGAWIGNLT
FT                   VLEPYRPLFIGAALVALFFAWKRIYRPVQACKPGEVCAIPQVRATYKLIFWIVAVLVLV
FT                   ALGFPYVVPFFY"
FT   RBS             174877..174880
FT                   /note="possible RBS"
FT   CDS             174890..175324
FT                   /transl_table=11
FT                   /gene="merR"
FT                   /gene_synonym="HCM1.235"
FT                   /product="putative mercuric resistance operon regulatory
FT                   protein"
FT                   /note="HCM1.235, merR, probable mercuric resistance operon
FT                   regulatory protein, len: 144 aa; highly similar to many
FT                   e.g. SW:MERR_SHIFL (EMBL:K03089), merR, Shigella flexneri
FT                   mercuric resistance operon regulatory protein from plasmid
FT                   IncFII NR1 (144 aa), fasta scores; E(): 0, 100.0% identity
FT                   in 144 aa overlap. Contains Pfam match to entry PF00376
FT                   merR, Bacterial regulatory proteins, merR family and
FT                   PS00552 Bacterial regulatory proteins, merR family
FT                   signature. Contains a probable helix-turn-helix motif at aa
FT                   8-29 (Score 1571, +4.54 SD). Similar to HCM1.151c, merR,
FT                   probable mercuric resistance operon regulatory protein (151
FT                   aa), fasta scores; E(): 0, 89.4% identity in 142 aa
FT                   overlap"
FT                   /db_xref="GOA:P0A2Q8"
FT                   /db_xref="InterPro:IPR000551"
FT                   /db_xref="InterPro:IPR009061"
FT                   /db_xref="InterPro:IPR011794"
FT                   /db_xref="InterPro:IPR015358"
FT                   /db_xref="UniProtKB/Swiss-Prot:P0A2Q8"
FT                   /protein_id="CAD09817.1"
FT                   /translation="MENNLENLTIGVFAKAAGVNVETIRFYQRKGLLREPDKPYGSIRR
FT                   YGEADVVRVKFVKSAQRLGFSLDEIAELLRLDDGTHCEEASSLAEHKLKDVREKMADLA
FT                   RMETVLSELVCACHARKGNVSCPLIASLQGEAGLARSAMP"
FT   misc_feature    174920..174976
FT                   /note="Pfam match to entry PF00376 merR, Bacterial
FT                   regulatory proteins, merR family, score 29.10, E-value
FT                   7.8e-05"
FT   misc_feature    174920..174988
FT                   /note="PS00552 Bacterial regulatory proteins, merR family
FT                   signature"
FT   misc_feature    174920..175027
FT                   /note="Pfam match to entry PF00376 merR, Bacterial
FT                   regulatory proteins, merR family, score 64.40, E-value
FT                   2.4e-15"
FT   repeat_region   175343..175354
FT                   /note="12 bp inverted repeat flanking IS4321"
FT   repeat_region   175343..176659
FT                   /note="IS4321"
FT   RBS             175392..175395
FT                   /note="possible RBS"
FT   CDS             175403..176407
FT                   /transl_table=11
FT                   /gene="HCM1.236"
FT                   /product="putative transposase"
FT                   /note="HCM1.236, probable transposase, len: 334 aa; highly
FT                   similar to many e.g. SW:TRA8_YEREN (EMBL:Z48244) Yersinia
FT                   enterocolitica transposase for insertion sequence element
FT                   IS1328 (334 aa), fasta scores; E(): 0, 66.3% identity in
FT                   332 aa overlap and TR:P77600 (EMBL:U67194), tnpA,
FT                   Escherichia coli putative transposase from plasmid
FT                   IncP-beta R751 (334 aa), fasta scores; E(): 0, 97.3%
FT                   identity in 334 aa overlap"
FT                   /db_xref="GOA:Q934H6"
FT                   /db_xref="InterPro:IPR002525"
FT                   /db_xref="InterPro:IPR003346"
FT                   /db_xref="UniProtKB/TrEMBL:Q934H6"
FT                   /protein_id="CAD09818.1"
FT                   /translation="MENIALIGIDLGKNSFHIHCQDHRGKAVYRKKFTRPKLIEFLATC
FT                   PATTIAMEACGGSHFMARKLAELGHFPKLISPQFVRPFVKSNKNDFVDAEAICEAASRP
FT                   SMRFVQPRTESQQAMRALHRVRESLVQDKVKTTNQMHAFLLEFGISVPRGAAVISRLST
FT                   LLEDSSLPLYLSQLLLKLQQHYHYLVEQIKDLESQLKRKLDEDEVGQRLLSIPCVGTLT
FT                   ASTISTEIGDGKQYASSRDFAAATGLVPRQYSTGGRTTLLGISKRGNKKIRTLLVQCAR
FT                   VFIQKLEHQSGKLADWVRELLCRKSNFVVTCALANKLARIAWALTARQQTYEA"
FT   repeat_region   complement(176648..176659)
FT                   /note="12 bp inverted repeat flanking IS4321"
FT   repeat_region   complement(176752..177500)
FT                   /note="IS1"
FT   repeat_region   176753..176765
FT                   /note="13 bp inverted repeat flanking IS1"
FT   CDS             complement(176758..177261)
FT                   /transl_table=11
FT                   /gene="insB"
FT                   /gene_synonym="HCM1.238c"
FT                   /product="putative IS1 transposase"
FT                   /note="HCM1.238c, insB, possible IS1 transposase, len: 167
FT                   aa; highly similar to many from Enterobacteriaceae e.g.
FT                   SW:ISB_ECOLI (EMBL:D10483), insB, Escherichia coli
FT                   insertion element IS1 protein InsB (167 aa), fasta scores;
FT                   E(): 0, 97.0% identity in 167 aa overlap"
FT                   /db_xref="GOA:Q7AQU0"
FT                   /db_xref="InterPro:IPR005063"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQU0"
FT                   /protein_id="CAD09819.1"
FT                   /translation="MPGNRPHYGRWPQHDFPPFKKLRPQSVTSRIQPGSDVIVCAEMDE
FT                   QWGYVGAKSRQRWLFYAYDRLRKTVVAHVFGERTMATLGRLMSLLSPFDVVIWMTDGWP
FT                   LYESRLKGKLHVISKRYTQRIERHNLNLRQHLARLGRKSLSFSKSVELHDKVIGHYLNI
FT                   KHYQ"
FT   CDS             complement(177180..177455)
FT                   /transl_table=11
FT                   /gene="insA"
FT                   /gene_synonym="HCM1.239c"
FT                   /product="putative IS1 transposase"
FT                   /note="HCM1.239c, insA, probable IS1 transposase, len: 91
FT                   aa; highly similar to many from Enterobacteriaceae e.g.
FT                   SW:ISA1_ECOLI (EMBL:X52534), insA, Escherichia coli
FT                   insertion element IS1 protein InsA (91 aa), fasta scores;
FT                   E(): 0, 97.8% identity in 91 aa overlap. Contains PS00017
FT                   ATP/GTP-binding site motif A (P-loop). Contains a probable
FT                   helix-turn-helix motif at aa 64-85 (Score 1462, +4.17 SD)"
FT                   /db_xref="GOA:Q7AQV4"
FT                   /db_xref="InterPro:IPR003220"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQV4"
FT                   /protein_id="CAD09820.1"
FT                   /translation="MASVSISCPSCSATDGVVRNGKSTAGHQRYLCSHCRKTWQLQFTY
FT                   TASQPGTHQKIIDMAMNGVGCRATARIMGVGLNTIFRHLKNSGRSR"
FT   misc_feature    complement(177199..177204)
FT                   /note="possible translational frameshift site, similar to
FT                   that determined experimentally (EMBL:X52534)"
FT   misc_feature    complement(177387..177410)
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   repeat_region   complement(177488..177500)
FT                   /note="13 bp inverted repeat flanking IS1"
FT   CDS             177511..177822
FT                   /pseudo
FT                   /transl_table=11
FT                   /gene="HCM1.240"
FT                   /product="hypothetical protein (pseudogene)"
FT                   /note="HCM1.240, probable pseudogene, len: 312 bp; highly
FT                   similar to part of SW:TETC_ECOLI (EMBL:J01830), tetC,
FT                   Escherichia coli transposon Tn10 protein (197 aa), fasta
FT                   scores; E(): 0, 99.0% identity in 103 aa overlap. Truncated
FT                   at the N-terminus"
FT   CDS             complement(177935..179140)
FT                   /transl_table=11
FT                   /gene="tetA"
FT                   /gene_synonym="HCM1.241c"
FT                   /product="tetracycline resistance protein"
FT                   /note="HCM1.241c, tetA, tetracycline resistance protein,
FT                   len: 401 aa; highly similar to many e.g. SW:TCR2_ECOLI
FT                   (EMBL:V00611), tetA, Escherichia coli tetracycline
FT                   resistance protein, class B (401 aa), fasta scores; E(): 0,
FT                   99.8% identity in 401 aa overlap. Contains PS00216 Sugar
FT                   transport proteins signature 1. Contains hydrophobic,
FT                   probable membrane-spanning regions"
FT                   /db_xref="GOA:Q7BN13"
FT                   /db_xref="InterPro:IPR001958"
FT                   /db_xref="InterPro:IPR005829"
FT                   /db_xref="InterPro:IPR011701"
FT                   /db_xref="InterPro:IPR016196"
FT                   /db_xref="UniProtKB/TrEMBL:Q7BN13"
FT                   /protein_id="CAD09822.1"
FT                   /translation="MNSSTKIALVITLLDAMGIGLIMPVLPTLLREFIASEDIANHFGV
FT                   LLALYALMQVIFAPWLGKMSDRFGRRPVLLLSLIGASLDYLLLAFSSALWMLYLGRLLS
FT                   GITGATGAVAASVIADTTSASQRVKWFGWLGASFGLGLIAGPIIGGFAGEISPHSPFFI
FT                   AALLNIVAFLVVMFWFRETKNTRDNTDTEVGVETQSNSVYITLFKTMPILLIIYFSAQL
FT                   IGQIPATVWVLFTENRFGWNSMMVGFSLAGLGLLHSVFQAFVAGRIATKWGEKTAVLLG
FT                   FIADSSAFAFLAFISEGWLVFPVLILLAGGGIALPALQGVMSIQTKSHQQGALQGLLVS
FT                   LTNATGVIGPLLFAVIYNHSLPIWDGWIWIIGLAFYCIIILLSMTFMLTPQAQGSKQET
FT                   SA"
FT   misc_feature    complement(178910..178960)
FT                   /note="PS00216 Sugar transport proteins signature 1"
FT   CDS             179219..179845
FT                   /transl_table=11
FT                   /gene="tetR"
FT                   /gene_synonym="HCM1.243"
FT                   /product="tetracycline repressor protein"
FT                   /note="HCM1.243, tetR, tetracycline repressor protein, len:
FT                   208 aa; highly similar to many e.g. SW:TER2_ECOLI
FT                   (EMBL:X00694), tetR, Escherichia coli tetracycline
FT                   repressor protein (207 aa), fasta scores; E(): 0, 100.0%
FT                   identity in 207 aa overlap. Contains Pfam match to entry
FT                   PF00440 tetR, Bacterial regulatory proteins, tetR family
FT                   and PS01081 Bacterial regulatory proteins, tetR family
FT                   signature. Contains a probable helix-turn-helix motif at aa
FT                   26-47 (Score 2218, +6.74 SD)"
FT                   /db_xref="GOA:Q9S455"
FT                   /db_xref="HSSP:1A6I"
FT                   /db_xref="InterPro:IPR001647"
FT                   /db_xref="InterPro:IPR003012"
FT                   /db_xref="InterPro:IPR004111"
FT                   /db_xref="InterPro:IPR009057"
FT                   /db_xref="InterPro:IPR011075"
FT                   /db_xref="InterPro:IPR012287"
FT                   /db_xref="InterPro:IPR015893"
FT                   /db_xref="UniProtKB/TrEMBL:Q9S455"
FT                   /protein_id="CAD09823.1"
FT                   /translation="MMSRLDKSKVINSALELLNEVGIEGLTTRKLAQKLGVEQPTLYWH
FT                   VKNKRALLDALAIEMLDRHHTHFCPLEGESWQDFLRNNAKSFRCALLSHRDGAKVHLGT
FT                   RPTEKQYETLENQLAFLCQQGFSLENALYALSAVGHFTLGCVLEDQEHQVAKEERETPT
FT                   TDSMPPLLRQAIELFDHQGAEPAFLFGLELIICGLEKQLKCESGS"
FT   misc_feature    179246..179386
FT                   /note="Pfam match to entry PF00440 tetR, Bacterial
FT                   regulatory proteins, tetR family, score 88.40, E-value
FT                   8e-23"
FT   misc_feature    179282..179374
FT                   /note="PS01081 Bacterial regulatory proteins, tetR family
FT                   signature"
FT   misc_feature    179294..179359
FT                   /note="Pfam match to entry PF00440 tetR, Bacterial
FT                   regulatory proteins, tetR family, score 28.50, E-value
FT                   3.7e-06"
FT   CDS             complement(179823..180509)
FT                   /transl_table=11
FT                   /gene="HCM1.244c"
FT                   /product="putative transcriptional regulator"
FT                   /note="HCM1.244c, possible transcriptional regulator, len:
FT                   228 aa; similar to e.g. TR:AAD50245 (EMBL:AF162223), jemC,
FT                   Shigella flexneri hypothetical protein from transposon Tn10
FT                   (228 aa), fasta scores; E(): 0, 99.6% identity in 228 aa
FT                   overlap. Contains Pfam match to entry PF01022 HTH_5,
FT                   Bacterial regulatory protein, arsR family. Contains a
FT                   probable helix-turn-helix motif at aa 40-61 (Score 1172,
FT                   +3.18 SD)"
FT                   /db_xref="GOA:Q935I0"
FT                   /db_xref="InterPro:IPR001845"
FT                   /db_xref="InterPro:IPR011991"
FT                   /db_xref="UniProtKB/TrEMBL:Q935I0"
FT                   /protein_id="CAD09824.1"
FT                   /translation="MANLIRKEVTFESSIAAIGAAMSDISRVKILSALMDGRAWTATEL
FT                   SSVANISASTASSHLSKLLDCQLITVVAQGKHRYFRLAGKDIAELMESMMGISLNHGVH
FT                   ARVSTPVHLRKARTCYDHLAGEVAVKIYDSLCQQQWITENGSMITLSGIQYFHEMGIDV
FT                   PSKHSRKICCACLDWSERRFHLGGYVGAALFSLYESKGWLTRHLGYREVTITEKGYAAF
FT                   KTHFHI"
FT   misc_feature    complement(180219..180455)
FT                   /note="Pfam match to entry PF01022 HTH_5, Bacterial
FT                   regulatory protein, arsR family, score 46.40, E-value
FT                   6.2e-10"
FT   CDS             complement(180517..180903)
FT                   /transl_table=11
FT                   /gene="HCM1.245c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.245c, hypothetical protein, len: 128 aa;
FT                   unknown function, identical to TR:Q9WTF2 (EMBL:AP000342),
FT                   ydjB, Shigella flexneri hypothetical protein from plasmid
FT                   R100 (162 aa), fasta scores; E(): 0, 100.0% identity in 162
FT                   aa overlap"
FT                   /db_xref="UniProtKB/TrEMBL:Q935H9"
FT                   /protein_id="CAD09825.1"
FT                   /translation="MFDVHVVLDNQIGQLALLGKTLGNKGIGLEGGGIFTVGDECHAHF
FT                   LVEQGKEAKIALEQAGLLVLAIRTPLIRKLKQEKPGELGEIARVLAENNINILVQYSDH
FT                   ANQLILITDNDSMAASVTLPWAIK"
FT   CDS             complement(180896..181216)
FT                   /transl_table=11
FT                   /gene="HCM1.246c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.246c, hypothetical protein, len: 106 aa;
FT                   unknown function, identical to TR:Q9WTF3 (EMBL:AP000342),
FT                   ydjA, Shigella flexneri hypothetical protein from plasmid
FT                   R100 (106 aa), fasta scores; E(): 0, 100.0% identity in 106
FT                   aa overlap"
FT                   /db_xref="GOA:Q7BN17"
FT                   /db_xref="InterPro:IPR007138"
FT                   /db_xref="InterPro:IPR011008"
FT                   /db_xref="UniProtKB/TrEMBL:Q7BN17"
FT                   /protein_id="CAD09826.1"
FT                   /translation="MIAVIFEVQIQPDQQTRYLTLAEELRPLLSHVAGFISIERFQSLA
FT                   TEGKMLSLSWWENEYAVLQWKNHVLHAKAQQEGRESIFDFYKISIAHITREYSFKKDKD
FT                   NV"
FT   RBS             complement(180906..180910)
FT                   /note="possible RBS"
FT   RBS             complement(181223..181226)
FT                   /note="possible RBS"
FT   CDS             181660..182864
FT                   /pseudo
FT                   /transl_table=11
FT                   /gene="HCM1.247"
FT                   /product="putative glutamate permease (pseudogene)"
FT                   /note="HCM1.247, probable glutamate permease (pseudogene),
FT                   len: 1205 bp; highly similar to SW:GLTS_ECOLI
FT                   (EMBL:D00626), gltS, Escherichia coli sodium/glutamate
FT                   symport carrier protein (401 aa), fasta scores; E(): 0,
FT                   54.5% identity in 288 aa overlap and E(): 2.8e-11, 40.8%
FT                   identity in 103 aa overlap. The sequence contains a
FT                   frameshift and therefore appears to be a pseudogene"
FT   CDS             183095..183220
FT                   /transl_table=11
FT                   /gene="HCM1.248"
FT                   /product="putative transcriptional regulator (partial)"
FT                   /note="HCM1.248, possible transcriptional regulator remant,
FT                   len: 41 aa; similar to the N-termini of transcriptional
FT                   regulators e.g. SW:LYSR_ECOLI (EMBL:J01614), lysR,
FT                   Escherichia coli transcriptional activator of
FT                   diaminopimelate decarboxylase (311 aa), fasta scores; E():
FT                   1.3e-06, 53.5% identity in 43 aa overlap. The remainder of
FT                   the CDS has been truncated"
FT                   /db_xref="GOA:Q935H8"
FT                   /db_xref="InterPro:IPR000847"
FT                   /db_xref="InterPro:IPR011991"
FT                   /db_xref="UniProtKB/TrEMBL:Q935H8"
FT                   /protein_id="CAD09828.1"
FT                   /translation="MKLRHLDIFYAVMTCGSLTRAAEVLHISQPAASKALKHAEH"
FT   repeat_region   183224..183238
FT                   /note="15 bp inverted repeat flanking IS10"
FT   repeat_region   complement(183224..184538)
FT                   /note="IS10"
FT   CDS             complement(183230..184438)
FT                   /transl_table=11
FT                   /gene="HCM1.249c"
FT                   /product="transposase"
FT                   /note="HCM1.249c, transposase, len: 402 aa; identical or
FT                   highly similar to Tn10 transposases e.g. TR:AAD50242
FT                   (EMBL:AF162223) Shigella flexneri IS10-left transposase
FT                   from Tn10 (402 aa), fasta scores; E(): 0, 100.0% identity
FT                   in 402 aa overlap"
FT                   /db_xref="GOA:Q7AQU3"
FT                   /db_xref="InterPro:IPR002559"
FT                   /db_xref="InterPro:IPR012337"
FT                   /db_xref="UniProtKB/TrEMBL:Q7AQU3"
FT                   /protein_id="CAD09829.1"
FT                   /translation="MCELDILHDSLYQFCPELHLKRLNSLTLACHALLDCKTLTLTELG
FT                   RNLPTKARTKHNIKRIDRLLGNRHLHKERLAVYRWHASFICSGNTMPIVLVDWSDIREQ
FT                   KRLMVLRASVALHGRSVTLYEKAFPLSEQCSKKAHDQFLADLASILPSNTTPLIVSDAG
FT                   FKVPWYKSVEKLGWYWLSRVRGKVQYADLGAENWKPISNLHDMSSSHSKTLGYKRLTKS
FT                   NPISCQILLYKSRSKGRKNQRSTRTHCHHPSPKIYSASAKEPWILATNLPVEIRTPKQL
FT                   VNIYSKRMQIEETFRDLKSPAYGLGLRHSRTSSSERFDIMLLIALMLQLTCWLAGVHAQ
FT                   KQGWDKHFQANTVRNRNVLSTVRLGMEVLRHSGYTITREDSLVAATLLTQNLFTHGYVL
FT                   GKL"
FT   CDS             complement(184508..184858)
FT                   /transl_table=11
FT                   /gene="HCM1.250c"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.250c, possible periplasmic protein, len: 116
FT                   aa; unknown function, contains a probable N-terminal signal
FT                   sequence"
FT                   /db_xref="UniProtKB/TrEMBL:Q935H7"
FT                   /protein_id="CAD09830.1"
FT                   /translation="MKIKNIVLAGIISLVFSVHASDKQNIKRDPIPYLGYDAVTSNMCI
FT                   DAGGLTDPVEMRKKATETLLMILHKQPGDKLSKQSEDTIEAFVTRTRSSSDDISKCQFS
FT                   ADESPNDFYQNH"
FT   repeat_region   complement(184524..184538)
FT                   /note="15 bp inverted repeat flanking IS10"
FT   RBS             complement(184865..184868)
FT                   /note="possible RBS"
FT   CDS             complement(185006..185620)
FT                   /transl_table=11
FT                   /gene="HCM1.251c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.251c, hypothetical protein, len: 204 aa;
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935H6"
FT                   /protein_id="CAD09831.1"
FT                   /translation="MAIDTDDTDPVDAEACEKYLAQLRELEAYRAYRTTAAIDWFFDQA
FT                   TRAIHGELWLAACTTFLNGIETSLMVTMKLKASQAQPQAPTPLVDLSDMATLSNALLRR
FT                   AHQAGMPVTLLAFPDEQDLLTKIADGAPKLPYAEIVRVRHNLCHGNILEHIITASDGMG
FT                   EPVRLFTPECMRDLAQTLSAVSKVWIAGLHQYWCDNNLSMP"
FT   RBS             complement(185628..185631)
FT                   /note="possible RBS"
FT   CDS             185798..186232
FT                   /transl_table=11
FT                   /gene="mucA"
FT                   /gene_synonym="HCM1.252"
FT                   /product="putative DNA-repair modulator"
FT                   /note="HCM1.252, mucA, probable DNA-repair modulator, len:
FT                   144 aa; similar to members of the ImpA/MucA/UmuD/LexA
FT                   family e.g. SW:UMUD_SALTY (EMBL:M57431), umuD, Salmonella
FT                   typhimurium protein involved in UV protection and SOS
FT                   mutagenesis (139 aa), fasta scores; E(): 4.1e-21, 51.7%
FT                   identity in 120 aa overlap. Contains Pfam match to entry
FT                   PF00717 Peptidase_S24, Peptidase family S24"
FT                   /db_xref="GOA:Q935H5"
FT                   /db_xref="HSSP:1UMU"
FT                   /db_xref="InterPro:IPR006197"
FT                   /db_xref="InterPro:IPR011056"
FT                   /db_xref="InterPro:IPR015927"
FT                   /db_xref="InterPro:IPR019759"
FT                   /db_xref="UniProtKB/TrEMBL:Q935H5"
FT                   /protein_id="CAD09832.1"
FT                   /translation="MSVFPERFASPPRDTTPFFSDLLSCGVMSPCAGHEDNELNLHDFV
FT                   VRNRPATFFVRASGLSMVDAGINDGAILVVDRSLTAEHGSIVVALVDGEFTVKILQTFP
FT                   KLMLMPSNPAFKPIPVNPDTLEIWGVVTFALNQFPHVHAR"
FT   misc_feature    185813..186169
FT                   /note="Pfam match to entry PF00717 Peptidase_S24, Peptidase
FT                   family S24, score 135.40, E-value 1e-36"
FT   CDS             186216..187475
FT                   /transl_table=11
FT                   /gene="mucB"
FT                   /gene_synonym="HCM1.253"
FT                   /product="putative DNA-repair modulator"
FT                   /note="HCM1.253, mucB, probable DNA-repair modulator, len:
FT                   419 aa; similar to members of the ImpB/MucB/SamB family
FT                   e.g. SW:MUCB_ECOLI (EMBL:D90147), mucB, Escherichia coli
FT                   protein involved in UV protection and SOS mutagenesis from
FT                   plasmid IncN pKM101 (420 aa), fasta scores; E(): 0, 46.8%
FT                   identity in 412 aa overlap. Contains Pfam match to entry
FT                   PF00817 IMS, impB/mucB/samB family"
FT                   /db_xref="GOA:Q935H4"
FT                   /db_xref="InterPro:IPR001126"
FT                   /db_xref="InterPro:IPR017963"
FT                   /db_xref="UniProtKB/TrEMBL:Q935H4"
FT                   /protein_id="CAD09833.1"
FT                   /translation="MYMHVDINGAYAAFECAMDPKLAKSPLIIASNNDATIIAMNRLAK
FT                   NTGLKRGMPIFKCRDLIEQHHIAVRSSNFTLYEDYSNRFHETLEGFAEDTDRYSVDESF
FT                   MLLKNMDKIVDFEEYGCLIRRTLLHNLSLTCGIGVSTTKTLAKLCTYASKRWAATGGVV
FT                   VLTDPFRIKKLLSLISTREIWGIGRKISERLTAYGIITACDFYDSDVRFLRKAFGVEME
FT                   RTWRELHGESCFRLHESPPVRQQIIVSRSFGQRLNTFSKMHEAVSFFTGRAAEQLRNDG
FT                   SWTRQITVFIQSSPFARAEARYSSCGIEPLTATQDTRDLVSAAGAILTRIYKPGIDYAK
FT                   AGVMLSSMTDGTEQLSLFDERPARRGSEALMKVMDRFNKEHRGSLFLACEGIHQDFRGK
FT                   QAMLSPRYTTRWNELLVVKA"
FT   misc_feature    186228..187265
FT                   /note="Pfam match to entry PF00817 IMS, impB/mucB/samB
FT                   family, score 403.60, E-value 1.8e-117"
FT   CDS             complement(187527..188336)
FT                   /transl_table=11
FT                   /gene="HCM1.254c"
FT                   /product="putative outer membrane protein"
FT                   /note="HCM1.254c, possible outer membrane protein, len: 269
FT                   aa; shows weak similarity to TR:Q57333 (EMBL:Z11828), com1,
FT                   Coxiella burnetii outer membrane protein precursor (252
FT                   aa), fasta scores; E(): 2e-09, 28.6% identity in 266 aa
FT                   overlap. Also similar to TR:Q9X610 (EMBL:AF130422), bcfH,
FT                   Salmonella typhimurium hypothetical protein (269 aa), fasta
FT                   scores; E(): 6.3e-24, 31.4% identity in 258 aa overlap.
FT                   Contains a probable N-terminal signal sequence"
FT                   /db_xref="GOA:Q9L5K7"
FT                   /db_xref="InterPro:IPR001853"
FT                   /db_xref="InterPro:IPR012335"
FT                   /db_xref="InterPro:IPR012336"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5K7"
FT                   /protein_id="CAD09834.1"
FT                   /translation="MIKLNYLKPVASVLISAVIATAGSVYITSKYLKPDVPGNDEIGRV
FT                   AASYLVKNPQYLLEAGKALEKENTNASLERIIPYAPALFETKETPNIGPDNAAVAVIEF
FT                   FDYQCHFCMQVAPVVESVLSQSTDVKFFFKEFPIFAGSKPVSAMGAATGLHVYQTFGAE
FT                   AYRKYHNNLMTSAYVFFNNQRAFTLNDLDMVVNKSGFNSSFGDREKSRYENVISGNMQL
FT                   GEALGINGTPGFIIMNMQKPDAATTSFIPGAVDEATLKYAIQKARGG"
FT   CDS             188443..189054
FT                   /transl_table=11
FT                   /gene="HCM1.255"
FT                   /product="putative lipoprotein"
FT                   /note="HCM1.255, possible lipoprotein, len: 203 aa; unknown
FT                   function, contains a possible N-terminal signal sequence
FT                   (weak prediction) and an appropriately positioned PS00013
FT                   Prokaryotic membrane lipoprotein lipid attachment site"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5K8"
FT                   /protein_id="CAD09835.1"
FT                   /translation="MLRQFFLLTATTFLCGCGYHFGNDVDAYDLLPRPVGSKKFEIVAP
FT                   DDSIQSRMFAARFASGLTGKGFNISSHQPEYILRFSYSKTQENLQYSELPVTGITGYVI
FT                   EKKTTRKDKHGQTETDYDYKPVSGIVGTETVSQRHFWRRLDVEVYPAGKNAQQVLKVSM
FT                   QSNAPIPSDSVAYSAMIDALTGNLDAPLRSGNYVASVPWN"
FT   misc_feature    188461..188493
FT                   /note="PS00013 Prokaryotic membrane lipoprotein lipid
FT                   attachment site"
FT   CDS             complement(189113..189535)
FT                   /transl_table=11
FT                   /gene="HCM1.256c"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.256c, possible membrane protein, len: 140 aa;
FT                   unknown function, contains hydrophobic, probable
FT                   membrane-spanning regions"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5K9"
FT                   /protein_id="CAD09836.1"
FT                   /translation="MSLWLSIVTRATGLPDKRYLNDPVILRYYQQKIQKAPYALVGWTL
FT                   CFMATIGVSLGLDLSNQMLLLVLLILIFLMVVLQGRYQFMHPERCINAKFYQTVLDDAS
FT                   VSDIQKAQFEYLFVTKVDELTIGDLYRLYDFNRGGR"
FT   CDS             complement(189558..189950)
FT                   /transl_table=11
FT                   /gene="HCM1.257c"
FT                   /product="puatative periplasmic protein"
FT                   /note="HCM1.257c, possible periplasmic protein, len: 130
FT                   aa; unknown function, contains a probable N-terminal signal
FT                   sequence"
FT                   /db_xref="UniProtKB/TrEMBL:Q935H3"
FT                   /protein_id="CAD09837.1"
FT                   /translation="MKSAILTTLMLVAVGSQPVFAAKCQFGACDADTVASSESLVSAAQ
FT                   TDKDAVLKKLNDATSRSDVMSKRFESYLSNDRLKVNTDSTKKGPSNEIAKPRDELAPVR
FT                   QLKAIRPELVQTPIFQPIVAFYERLA"
FT   CDS             complement(189976..190725)
FT                   /transl_table=11
FT                   /gene="HCM1.258c"
FT                   /product="putative thiol:disulfide interchange protein"
FT                   /note="HCM1.258c, probable thiol:disulfide interchange
FT                   protein, len: 249 aa; similar to e.g. SW:DSBC_ERWCH
FT                   (EMBL:X76687), dsbC, Erwinia chrysanthemi thiol:disulfide
FT                   interchange protein precursor (238 aa), fasta scores; E():
FT                   8.2e-26, 36.2% identity in 218 aa overlap. Contains a
FT                   probable N-terminal signal sequence"
FT                   /db_xref="HSSP:1EEJ"
FT                   /db_xref="InterPro:IPR009094"
FT                   /db_xref="InterPro:IPR012335"
FT                   /db_xref="InterPro:IPR012336"
FT                   /db_xref="InterPro:IPR018950"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5L1"
FT                   /protein_id="CAD09838.1"
FT                   /translation="MNKTIKASLFLLASCTALSMNAQTANTDVLPDAALKKLREVGLSI
FT                   EHIEPSPVKDIYTVISREGVSYVSKDGDYIFTGSLFHVNGKDVENTTEQAILKGVREFA
FT                   TKTKSIEYKSANEKYRLAVFTDITCGFCQKLHQDLQSYLDAGISIKFLAFPRAGLNSVV
FT                   AGNMAKIWCAAKPNDALDAAMSPTSTIPEGRPDEACLDTIKSHFQVASTIPLQGTPTMV
FT                   TLSGKPQLFTGWMSPENLVTRMGAEQK"
FT   RBS             complement(190731..190736)
FT                   /note="possible RBS"
FT   RBS             190861..190864
FT                   /note="possible RBS"
FT   CDS             190873..191388
FT                   /transl_table=11
FT                   /gene="HCM1.259"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.259, hypothetical protein, len: 171 aa; similar
FT                   to CDS present in plasmid-borne type IV pilus biogenesis
FT                   clusters e.g. TR:Q47073 (EMBL:Z68186), bfpH, Escherichia
FT                   coli BfpH protein from plasmid pMAR2 (148 aa), fasta
FT                   scores; E(): 6.6e-11, 37.0% identity in 135 aa overlap.
FT                   Unlike BfpH, this CDS does not have a predicted N-terminal
FT                   signal sequence. Also similar to TR:P71189 (EMBL:U67194),
FT                   trbN, Enterobacter aerogenes protein possibly involved in
FT                   mating-pair formation from plasmid R751 (211 aa), fasta
FT                   scores; E(): 1.8e-08, 29.4% identity in 119 aa overlap and
FT                   to SW:IAGB_SALTI (EMBL:X80892), iagB, Salmonella typhi
FT                   invasion protein (160 aa), fasta scores; E(): 0.00031,
FT                   29.1% identity in 117 aa overlap. Contains Pfam match to
FT                   entry PF01464 SLT, Transglycosylase SLT domain"
FT                   /db_xref="InterPro:IPR008258"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5L2"
FT                   /protein_id="CAD09839.1"
FT                   /translation="MFIPPVDDVKPIPVPVEIYTQCITDASRFFGIDAELVFTLFDNEG
FT                   GKVGTFSRNKNGTYDIGPMQINSSNLPEIRDHFPSVTWRVLAYDACASFWVGTWWLYRK
FT                   IVDRKGNVFEGIADYNSKTPKVRATYIFNFMIKYNRRIQRRNGMDELYQWTQPKPQYNG
FT                   HIVKNLPE"
FT   misc_feature    190933..191298
FT                   /note="Pfam match to entry PF01464 SLT, Transglycosylase
FT                   SLT domain, score 13.10, E-value 0.0061"
FT   CDS             191440..192003
FT                   /transl_table=11
FT                   /gene="HCM1.261"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.261, hypothetical protein, len: 187 aa; unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935H2"
FT                   /protein_id="CAD09840.1"
FT                   /translation="MRLLENENVLRKRLTMLQSIYKFLFNLCSSPQLPKNKDVDGILSH
FT                   EEITAGLWGPLPSIHVVLFLDFDGVVHKCQNESFERMHLIERLLDASPSMFIVISSSWR
FT                   ECGSITYLKSLFRSPYRDRVIGATPSLYLPSGSIGVRAAECEDFVTRHKVKAFICLDDD
FT                   ATLFLQSTRTCFVQIITPGLMKRI"
FT   CDS             complement(192297..196286)
FT                   /transl_table=11
FT                   /gene="HCM1.262"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.262, probable membrane protein, len: 1329 aa;
FT                   unknown function, contains hydrophobic, possible
FT                   membrane-spanning regions. Contains {agg}5 motif which may
FT                   be a site for slipped-strand mispairing"
FT                   /db_xref="InterPro:IPR012931"
FT                   /db_xref="UniProtKB/TrEMBL:Q935H1"
FT                   /protein_id="CAD09841.1"
FT                   /translation="MDYNIYTVGDIEFVWSALNGIALIFSQYTGVKAFLTTAAVLAGAS
FT                   LFYKTWLWLLNPTKAEVPIFSWILGLILFSMAIVRVDVTIESVKSGEVRNVDGIPIFIA
FT                   AMGTVTTNLSQGLLKDYKTAFDPLAPIDFAATTLDDDITLGPMIRFVKFLQWGGDSQGY
FT                   CSAFPEPASGLGAMNVCATVQSLAYNCLKGTQNSSAKIAGKETIFNDIFSANIVDSMER
FT                   INQAMKGSLKNASANIVGVNSSKSATCEEVWSTVKQVTSTPEARQTIALIGQTNGILAP
FT                   DEAGGAASGASFTDVMASANGMYGKAIGAYDATLSLFIMNELRNGASKYKTPLGLASDM
FT                   QLFEASLKRTNTMASQGQLWLQLSGAAIAFLEMFAYMVAPFALLMLLALGGNGVAAAAK
FT                   YLQLILFVNMWPITAVMVNAYVKKVATADLDTWSTLNSQSNAVTWMGLPGLAETYSSYL
FT                   SVASALYALIPVLTLFLMTQSIHPMMNAMKGVTPPAPVDSSHLTPKVWDAPNSGKSSFG
FT                   DVNRTALTSTGQGFSGGGAMDSSNFRLGTWNAGSSIASSQGQGAAFTSSAMSAASNTFQ
FT                   QAFNQMSEVGRTGQSGQQFTSNLQSLKSFTDQAGANIANSVGAKHGINSQQLAGVVSNL
FT                   LLNGSLGLGGEEKLGKGGGGGLAQKVMDSLGIKAEGQVGSGITKSNSGNESLLTDLSKA
FT                   ITTQLTENSGLTDQMTKAAAQINSDQFAQTNAFKEAATKMNQSTQTMAENLSTSLSTNA
FT                   SANTGMTLDSRQAINLDRFSDSIRNKNFSDEDVRNFARKNGLDENAFMEKFNSYNDTFK
FT                   ASTQLGSQLQRTDALVATTRDFSEQKIAIDTARGETAESNKQDLRETSSLLKGLVADFG
FT                   GNAQQMLPITNQLDRITGDASGINTIAQAQDRTPEHVNTSSVMSADRVADVGQSMDAQA
FT                   KAGLVQNQQNANQHVGGQTESGVTPYNVDKISKEDIQGIHQGNVNKSYSEENQNVLSSL
FT                   EKNTPVVTNETVGRVQGAGVDVQHANQTFDQLQAGSGGKHATSGMGTISDKLNNMYGDN
FT                   QIRGISGNLPNYFGRIANDPTKKPDDKRAELAAQAVFTYGASTMATGAEKEQLKADTQN
FT                   ILSELSHYNVRWGMNDLQNIHEGFNMHNKASGSLDSVVRANLGEGGSGGGLVGQRTQTT
FT                   TDLLVGNKIESNTERGVIGSTLLSGQESVARGLDVIGAKPVNDMLSGMGILTTPSSLAN
FT                   DASNPQNMPSSLLGKVGNHLQMSDGVSEVTSRYKDMGGDGIKAYETASQNSERAIRQQL
FT                   TDDPRFGPDKADAFVSFMKSNLNNTNEPYQSRIEKAKSWLNENKK"
FT   repeat_region   complement(192497..192504)
FT                   /note="(g)8"
FT   repeat_region   complement(194320..194334)
FT                   /note="(agg)5"
FT   CDS             complement(196295..197710)
FT                   /transl_table=11
FT                   /gene="HCM1.263c"
FT                   /product="putative pilus-assembly protein"
FT                   /note="HCM1.263c, possible pilus-assembly protein, len: 471
FT                   aa; similar to e.g. SW:TRH1_ECOLI (EMBL:M59763), traH,
FT                   Escherichia coli TraH protein from the F-plasmid (458 aa),
FT                   fasta scores; E(): 2.8e-09, 26.5% identity in 452 aa
FT                   overlap. Contains a probable N-terminal signal sequence"
FT                   /db_xref="InterPro:IPR010927"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5L5"
FT                   /protein_id="CAD09842.1"
FT                   /translation="MRADFHVCAKKLLLSLAVCTAMIAPNAVADNAMRNIFNGMMTTTS
FT                   PASFETATRTGVVGGSFSYRTTNVNTNLVSMSFPKASVGCNGIDVFLGSFSMINGDQLV
FT                   QVARGIAQGAAIYAFNVAVSAICADCAATINDIQNKLQALNKFAKDSCNATYSFLTENV
FT                   GPPSQFANAVSSGPASMLGTLNGLLPDFGSSMTKSPETVTSQVKAKDPEEFAEKFSGNL
FT                   FYMSFMDIDKGSMNIGGVTELSGYRLAEQLMSLVGTVIINWDAKGEKAGMEVRPSTMTV
FT                   SDFIMGPPAGGSIKMLKCSPAPDPASARKSQCLVMSEVTDGGFKGLKDTISDLLIQVQT
FT                   KAISDVRISDDELRIISYIGIPTILDSLQTFDVPEGYAYIQDISAIAATSLVINMLRQV
FT                   EAKISAMNIPSESLSGRRQDLTRLSENLTNQVKAAYELTRSQVGNSSDVISAWDDRRLK
FT                   RKAFMESLRGTGN"
FT   CDS             complement(197700..198746)
FT                   /transl_table=11
FT                   /gene="HCM1.264c"
FT                   /product="putative pilus-assembly protein"
FT                   /note="HCM1.264c, possible pilus-assembly protein, len: 348
FT                   aa; shows weak similarity to e.g. SW:TRAF_ECOLI
FT                   (EMBL:M20787), traF, Escherichia coli TraF protein from the
FT                   F-plasmid (247 aa), fasta scores; E(): 2.1e-09, 24.5%
FT                   identity in 212 aa overlap. Contains a probable N-terminal
FT                   signal sequence"
FT                   /db_xref="InterPro:IPR012336"
FT                   /db_xref="InterPro:IPR014111"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5L6"
FT                   /protein_id="CAD09843.1"
FT                   /translation="MTRLTLIPSKMLVLLSLFITGVHANEEQALIKDTPFVSGQAFKKG
FT                   FFWYDDPTRKTEEEITETKPPVASSTQPEQEEKIELNSKWLKDNMPQLLTKAMDNPTPE
FT                   NLSRFYTAQRLMLDIGTRFSDKSKDYFLKNPMMSEKRRQPVEKVALDAHRTVVEKNQQS
FT                   VMKDIFTKSGLFFFFQSTCQFCHEESQILQFMENYYSVDILPVSMDGRPLQNGLFQDFS
FT                   VPNAQIIDQFKIREVPTIFLVSKDGSSAQRISEGMITAEELKNTIILAAKGMKLIDDAS
FT                   FQSTLDIKRQYTIGEDGVITVNKSEMDSDPFLLQRIMDKKLEGYDMPTADPVNYLNVGG
FT                   SLGGAYAR"
FT   RBS             complement(197715..197721)
FT                   /note="possible RBS"
FT   RBS             complement(198755..198759)
FT                   /note="possible RBS"
FT   CDS             complement(199358..199870)
FT                   /transl_table=11
FT                   /gene="HCM1.266c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.266c, hypothetical protein, len: 170 aa:
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5L8"
FT                   /protein_id="CAD09844.1"
FT                   /translation="MAKVDQTKANMLLSATKTMSLGANKNSIRILYGNHVAENIDFRSE
FT                   PQQNFKKGIRGWSRRTDNRRAFSAVIDVAVNYFGFDPIHPESSFRNIDFNRIMSVLHNL
FT                   GYFVCAPEVNKIIEILTSMKEIEELETCAKCKRPYIVPYTNDTHCPRCRLSSTSSAIAR
FT                   YSQEELD"
FT   CDS             complement(199873..200673)
FT                   /transl_table=11
FT                   /gene="HCM1.268c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.268c, hypothetical protein, len: 266 aa:
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5L9"
FT                   /protein_id="CAD09845.1"
FT                   /translation="MSESDNITRNLLGKLLRTEISIIRSYRAFLMLLPLHGSSKYQTGS
FT                   PLLQRRLFGNGFGAMIDNAFEVETRPGSFLVPRSLSKEISWDKFFVAVVDGDTNVIREY
FT                   DSEDTDFGIYNEGEKVTLLSGQEEFYNPRKIQQLRSKCVDIQNDYLMQVFFMSMLAPEF
FT                   VSIFFGLKPATVEAIKDVGMSSLKLINDVVLFPRTIPFTPGLGDDSATLKSKVFAWAYE
FT                   ISADIRLGKISDDLMELLRYDTMFTCHRQDVFNTLANKVLLKDY"
FT   RBS             complement(199880..199884)
FT                   /note="possible RBS"
FT   RBS             complement(200684..200688)
FT                   /note="possible RBS"
FT   repeat_region   201039..201103
FT                   /note="inverted repeat; 50/64 (78%) matches, 2 gaps"
FT   repeat_region   complement(201107..201171)
FT                   /note="inverted repeat; 50/64 (78%) matches, 2 gaps"
FT   RBS             201421..201426
FT                   /note="possible RBS"
FT   CDS             201431..201916
FT                   /transl_table=11
FT                   /gene="HCM1.269"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.269, hypothetical protein, len: 161 aa: unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5M0"
FT                   /protein_id="CAD09846.1"
FT                   /translation="MSKSKLLKSLEISRTLLRSQIDVLREEAEELITNYWIEWKERNHI
FT                   ERNLPRDSKTLKKEYLGSYAPKVELIGNARKVTITWHQFSPYKNRPPSHMSKRISPMKS
FT                   GKYTKSCFVNHASWEYEMIEKTEGLLEPYRELLEFYHAAYIELGRKVRQYSKSEVAQ"
FT   CDS             201913..202635
FT                   /transl_table=11
FT                   /gene="HCM1.270"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.270, hypothetical protein, len: 240 aa: unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5M1"
FT                   /protein_id="CAD09847.1"
FT                   /translation="MTDVTMNESEHKVPDVNTRSPHASDNSRRVVQSKNEHYGMATVTI
FT                   TPGTPDFNRFLTARNRSVIRGFDDVSIAISSLFRTVNAVKHPELVQAIQDWFNELHEEN
FT                   NLMKNNLERHIATIHIDESDPFFSSTEFSPFRFEPVQLNFNNQNTMRFYKHIFEMNNLL
FT                   TQMHKFNSLGQLPVSDYNVMAHNIIRSLNMYIERVKKTLNVSRRAKGAYSPDEFIEKVK
FT                   QYKSVQAYIAAELSGKRR"
FT   RBS             202633..202638
FT                   /note="possible RBS"
FT   CDS             202646..205681
FT                   /transl_table=11
FT                   /gene="HCM1.271"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.271, hypothetical protein, len: 1011 aa:
FT                   unknown function"
FT                   /db_xref="GOA:Q935H0"
FT                   /db_xref="InterPro:IPR003607"
FT                   /db_xref="InterPro:IPR011119"
FT                   /db_xref="UniProtKB/TrEMBL:Q935H0"
FT                   /protein_id="CAD09848.1"
FT                   /translation="MNFRALFLSMQRVFGIFSRRENDVSELMMKDAANFSPFAQIIGEQ
FT                   KYTVPDHPNPEVLKFIEYPTRPAGIQTFNEQSILSLYRDKLHSISMMLAISDGDIREDA
FT                   YTFTNLVLKPLIEYIRWIHLLPASENHHHNGIGGLLSHSLEVAMISLKNANHSELRPIG
FT                   YQDEEVVRRKVYLYAAFICGLVHDAGKVYDLDIVSLNLSETLTWAPSSQSLLDWARENN
FT                   VVEYEIHWRKRIHNQHNIWSSVFLERILDPVCMSFLDRVKKERVYAKMVTALNVYNDGN
FT                   DFLSKCVRTSDYYSTGTDLNVLRDPIMGLRSNDAAARAIGTIKHNFTSININNYKTKPM
FT                   HIIIVNGEVYLNENAFLDFVLSDFAAHKFNFPQGDAGKTVLVESLVQRGYVEPYDDERV
FT                   VHYFIPGTYSENEIASIFRNGIGKLEFYNLLKLRWIGLIFDSYKIPDSVPGLFSVNANK
FT                   DFIYIDEQKTVTEYRRPVPGRESVTRVTDTVNDAIENTPQYGLQLVNGPDADSNNIISS
FT                   ENTESITDSLEESGADISNEIFETQVVTAIDTAETVNADEPEQVEEHDDRSQIHLVEQL
FT                   HEMLLSAPLPHHAVINIDSVPYLDLDAAIALIPGIDEAAFCNGPFFQLTYRDGSLDGMW
FT                   IVRDVNNLRLIQLGDNCAGMQVSTSEPRNTSSLKSLFDTSMYQPLDIPEAPSVNEAASP
FT                   PQTPLELPQPRLNAPVAEEASSVAEQTNAHSEPDSVIATEYEQYGHLLEETLDSDGEAY
FT                   SDLIASDSTEAEYPATDPQSSDFAQLPRETALSVAPGDLDYSEGAIKPPAPDATGKETI
FT                   LTSPEPAEDVRETVAAVEKASHLSPALARLFAVSTHAEKKHEKTQEPSPVKEVKNPTSS
FT                   TTVKAPISIEPPGAEEKEAVEEFTLLNDGEVTELEYVEIATMLHQILTKLSGSFKRKRK
FT                   NRFMVLTQNTFYLTQSCIEKYGTQLNAPELFNQLPQYQVTSGAVVNTKCIAFNIPTLVA
FT                   ASDRAKVDIELIINKLKEVGNL"
FT   CDS             205681..207765
FT                   /transl_table=11
FT                   /gene="HCM1.272"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.272, possible membrane protein, len: 694 aa:
FT                   unknown function. Contains hydrophobic, possible
FT                   membrane-spanning regions. Contains PS00017 ATP/GTP-binding
FT                   site motif A (P-loop)"
FT                   /db_xref="UniProtKB/TrEMBL:Q935G9"
FT                   /protein_id="CAD09849.1"
FT                   /translation="MTKSKRTNLHAQENFYRPILEYRSASVLLICAVIMLVMGFRSDGV
FT                   NIAPIILYTAVFLLLVCLYRCKTAHPYLMAHWRVFQRQIMFISLKSLRTINKSNFFSNE
FT                   RKYRQLVQEYKKNNRPVPDRKTYFCNGFEWGPEHADRAYQIANLSSDKREIALPFVLSP
FT                   IARHFETMARSMGGNNAIFAVDRRAPIFVTEDNWFGHTLITGNVGTGKTVLQRLLSISM
FT                   LHLGHVIVVIDPKNDAEWRQSLMDEASELGLPFYKFHPAQPSSSVCIDVCNAYTNVSDL
FT                   TSRLLSLVSVPGEVNPFVQYAEALISTVITGLSYTDKKPSIYLIHKNMKSHMSVVNLTI
FT                   KVMECCFARHYGPDVWMEKVKYASNDTLQVRFKRLTEWFNAHFLNYEGAEPIEWIDTVG
FT                   RLVDYSMSDPEHMSKMTAGIMPLFSRLTEQPLNELLSPSPNTLTSREIVTSDGMFSTGG
FT                   VLYISLDGLSNPESARAISQLIMSDLTSCAGSRYNADDGDMSSHSRISIFVDEAHSAIN
FT                   NSMINLLAQGRAAQIALFICTQTISDFIAAANAETANRITGLCNNYISLRVNDTPTQTL
FT                   VVENFGKSPISTNMVTYTTGSETTLPHNNFSGSISERKQTTLEESIPKELLGQVPKFHI
FT                   VARLQDGRKVVGQIPIAVSEKAMKPNTTLLEMFLKPAGKVTLRQNVGLSYLNKYLRKLH
FT                   "
FT   misc_feature    206293..206316
FT                   /note="PS00017 ATP/GTP-binding site motif A (P-loop)"
FT   RBS             207749..207754
FT                   /note="possible RBS"
FT   CDS             207762..208868
FT                   /transl_table=11
FT                   /gene="HCM1.273"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.273, hypothetical protein, len: 368 aa: unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935G8"
FT                   /protein_id="CAD09850.1"
FT                   /translation="MMDEQITLTQNQIFSASLKVSKSRSLVKRRMQSLGLKFTESQDVR
FT                   NRLAGIEKGALKCVGQFCHDNDAESLSAMAIILSELFLLQGELSTSNEYGDHETSYWTV
FT                   AQGPCDEWVQSLLASENGRRTFNSFRITFDNSEERRSLVEKNAKMLGSYLLPYFVNFTN
FT                   AASAFITLPNSITFKQVQRNKPLIHPETTLSHILTIEDSAFLSRIKFKLISAIDRLPDP
FT                   SGQYANMFNHIMDRALLTHLNREQIDSPCVCKKVISTYADTMLTLPIFNTTITGKYRHW
FT                   TPWGINFVEFSRQAAKEKSCVYVPEPGQIHWKSPEHKELAEYSLINQIIPQQYHWLLGV
FT                   PTIWRSHYRDHSKRLDLFKEWRDANGCG"
FT   RBS             208843..208847
FT                   /note="possible RBS"
FT   CDS             208855..209517
FT                   /transl_table=11
FT                   /gene="HCM1.275"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.275, possible membrane protein, len: 220 aa:
FT                   unknown function. Contains hydrophobic, possible
FT                   membrane-spanning regions"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5M5"
FT                   /protein_id="CAD09851.1"
FT                   /translation="MAADNSARAIFIRGLLLLGMMLYLIYSLGFQNTDELKQQITQEVN
FT                   ASRSLISNDRWLSVIANSEATLSTLINDYKLIDYLNTILIPDTSTPARGMNYVAEKMTS
FT                   VNYTVAKNLPLLIYQSIFRWNLILGWLILFSPYLIAMLADGMYQWKLKRYVFGNVTVQF
FT                   YRIWFRAFWIIGALTFIYLSMPNMSLFNNIAQLFPPVALLILGIALNRLWSNFQKLM"
FT   CDS             209530..210711
FT                   /transl_table=11
FT                   /gene="HCM1.276"
FT                   /product="putative peptidase"
FT                   /note="HCM1.276, possible peptidase, len: 393 aa; shows
FT                   weak similarity to many putative peptidases (signal
FT                   peptidase-like) e.g. SW:PFAP_LEPBO (EMBL:L27482), pfaP,
FT                   Leptospira borgpetersenii putative peptidase which was
FT                   detected by reaction to mAbs raised against a periplasmic
FT                   flagaella-associated protein (204 aa), fasta scores; E():
FT                   5.3e-09, 33.5% identity in 179 aa overlap. Contains Pfam
FT                   match to entry PF01343 Peptidase_U7, Peptidase family U7.
FT                   Contains one hydrophobic, possible membrane-spanning region
FT                   near the N-terminus. Alternatively, assuming codon 27 as
FT                   the true start codon, this region could represent an
FT                   N-terminal signal sequence"
FT                   /db_xref="GOA:Q9L5M6"
FT                   /db_xref="InterPro:IPR002142"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5M6"
FT                   /protein_id="CAD09852.1"
FT                   /translation="MFKRNNKKSPANIKESLDENADRFYKMFRIHTTSKVVISLLALAA
FT                   AGVSAFNIYDKYQESEGRMDHIAVVRISGEMGTGSEVGDGSVIATALAKAYNNPHAKAV
FT                   IIEAESGGGGPSDAIIIYRQINALRSHQQKIERVSHAESTSKPRNTSDHSASRSQADSN
FT                   AELSKRNTLDVLSAGSGHFISDMENSYKPIIVSVKGICASACYYAVSPADAIYADSSAL
FT                   TGSIGVRMDHWNLSRVMDTVGVKNEPLTAGEFKDALDPYHPLSDATRDFMQKQILDAMH
FT                   EQFIADVEQGRGKKLLSRPEADAVALYSGRVWTTQQAIRYGLIDGDLTPVEVRSRLSQM
FT                   YSTTIFKTYNEPQRSLRSALGMLMSLSTNVETLAGTTSRILDSVQATSYPTVR"
FT   misc_feature    210082..210555
FT                   /note="Pfam match to entry PF01343 Peptidase_U7, Peptidase
FT                   family U7, score 104.50, E-value 2.1e-27"
FT   CDS             210728..211441
FT                   /transl_table=11
FT                   /gene="HCM1.277"
FT                   /product="putative periplasmic protein"
FT                   /note="HCM1.277, possible periplasmic protein, len: 237 aa;
FT                   unknown function, similar at the N-terminus to TR:Q9X2X2
FT                   (EMBL:AF065404), pXO1-01, Bacillus anthracis hypothetical
FT                   protein from virulence plasmid pX01 (167 aa), fasta scores;
FT                   E(): 2.9e-09, 28.1% identity in 146 aa overlap. Contains a
FT                   possible N-terminal signal sequence"
FT                   /db_xref="InterPro:IPR011528"
FT                   /db_xref="UniProtKB/TrEMBL:Q935G7"
FT                   /protein_id="CAD09853.1"
FT                   /translation="MVWRVIGISIIVLVLIVLYCLMGFVSSAIAERRTARQIEIYLPDD
FT                   AEGLLSDLTLPVNATGTTQIDHVLIASHGLYVIEQKNYAGKLYGKLEESHWRKWKSSGT
FT                   LKLQNPFRQNYGHIRAIQSTLRASELECINVVIINGPCKFEGEKPDWLCMGMEEFVRKV
FT                   TERRQLNVFKPEAVSFIRGELKLKRKPPGLYTDLNHIHNVTTRYKTTMRLEQRITYNLL
FT                   RFSRLILSKMFRSAK"
FT   CDS             complement(211468..211824)
FT                   /transl_table=11
FT                   /gene="HCM1.278c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.278c, hypothetical protein, len: 118 aa:
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5M8"
FT                   /protein_id="CAD09854.1"
FT                   /translation="MTTANVTTTTYRSDDIVPFRRPQGDLDNRYMPQAYALVRSWASKP
FT                   AEYGAGVLATYRQPVVNLGYKIKGTRVVLILVPIECEPVGVKMTDAALWPSLSIGEAMR
FT                   IMQEAWQNIPELNP"
FT   RBS             complement(211832..211836)
FT                   /note="possible RBS"
FT   CDS             complement(211911..212225)
FT                   /transl_table=11
FT                   /gene="HCM1.279c"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.279c, possible membrane protein, len: 104 aa:
FT                   unknown function. Contains hydrophobic, possible
FT                   membrane-spanning region"
FT                   /db_xref="UniProtKB/TrEMBL:Q935G6"
FT                   /protein_id="CAD09855.1"
FT                   /translation="MNTFLYVLVGWIIVLYLVNKVREKYSKPKTVNILVKRNGVYQEVE
FT                   AVVMPRSHNSDVGTGKTGNEAAPQWLNKEDDISELEYYSGGSLLKAARDFEAQQMEQKF
FT                   "
FT   RBS             complement(212230..212236)
FT                   /note="possible RBS"
FT   CDS             complement(212540..212776)
FT                   /transl_table=11
FT                   /gene="HCM1.279ac"
FT                   /product="putative membrane protein"
FT                   /note="HCM1.279ac, possible membrane protein, len: 78 aa:
FT                   unknown function. Contains hydrophobic, possible
FT                   membrane-spanning region"
FT                   /db_xref="UniProtKB/TrEMBL:Q935G5"
FT                   /protein_id="CAD09856.1"
FT                   /translation="MMLLNIALILYVAVCLYLCLRNKKALYRFQGGGRQFTQSSKSGAN
FT                   TGESGFFLISGYSDTGVGGDSGDAGGGCGGGGD"
FT   RBS             complement(212781..212785)
FT                   /note="possible RBS"
FT   CDS             complement(213149..213385)
FT                   /transl_table=11
FT                   /gene="HCM1.279bc"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.279bc, hypothetical protein, len: 78 aa;
FT                   similar to hypothetical proteins e.g. SW:YKFF_ECOLI
FT                   (EMBL:AE000133), ykfF, Escherichia coli hypothetical
FT                   protein (79 aa), fasta scores; E(): 1.3e-07, 37.3% identity
FT                   in 67 aa overlap"
FT                   /db_xref="InterPro:IPR009253"
FT                   /db_xref="UniProtKB/Swiss-Prot:Q9L5N1"
FT                   /protein_id="CAD09857.1"
FT                   /translation="MSDLFSSESPVTLAQARTVAAGYQNVFIENLQPAGHFQIVIRDHR
FT                   DHDSQLVWRNWNYESGANDALNSYLQSHGLKAS"
FT   RBS             complement(213393..213397)
FT                   /note="possible RBS"
FT   CDS             complement(213431..213976)
FT                   /transl_table=11
FT                   /gene="HCM1.280c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.280c, hypothetical protein, len: 181 aa:
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5N2"
FT                   /protein_id="CAD09858.1"
FT                   /translation="MKTLNIQVNDIAAISALGGSMLADIIAAQYKVIDDTKDASEMAMP
FT                   CIAYGQIPANIGPGVFINRVYSMDSQSLSASQRYELFNGLATQAFTFFFQSGWYGAFRV
FT                   VSFRDNGPAGLLNIGIVHDKVLNEFCDDFPRANVSETGFNCGMTFDQIRMFISDLAYQM
FT                   PLYNNQDHFVKLAKHLAA"
FT   CDS             complement(214057..214494)
FT                   /transl_table=11
FT                   /gene="HCM1.281c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.281c, hypothetical protein, len: 145 aa:
FT                   unknown function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5N3"
FT                   /protein_id="CAD09859.1"
FT                   /translation="MYKYDRNRQTFNLINALQPVYRNNGGGLFEFDRRKQHETADLIFE
FT                   ALTFSPTPELELAKFVRLKSVRRIAQFDDGEVRYGVHVELDEAVNINSFRIFKDDNTGG
FT                   FDFYLFSVLGNNAELVQINLDASNIHLQDIFERSTGLCLSY"
FT   RBS             complement(214504..214507)
FT                   /note="possible RBS"
FT   CDS             214547..214870
FT                   /transl_table=11
FT                   /gene="HCM1.282"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.282, hypothetical protein, len: 107 aa: unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5N4"
FT                   /protein_id="CAD09860.1"
FT                   /translation="MPVGDQLFALQRGETLLGQYRQYGNVGYTVVTPCVKQHLPGASVV
FT                   TAHFHFLFRSMAGGNSLLIETFILGSRALLQCRINKGVKRVRTIRCISQIGFHNTSYVF
FT                   GII"
FT   CDS             complement(214976..215161)
FT                   /transl_table=11
FT                   /gene="HCM1.283c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.283c, hypothetical protein, len: 61 aa: unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q935G4"
FT                   /protein_id="CAD09861.1"
FT                   /translation="MNTERSNGTTLWIEHGFIILKDSVLALIMLKRLISASECVATRIC
FT                   WSGKKLPNNAPPMEAS"
FT   CDS             complement(215158..215439)
FT                   /transl_table=11
FT                   /gene="HCM1.284c"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.284c, hypothetical protein, len: 93 aa: unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5N7"
FT                   /protein_id="CAD09862.1"
FT                   /translation="MKNTAINISTKKPLQTVKDPVTRVSIHCTAKDEKGADVEVNILDL
FT                   EQHHTTNEIKLTFGGSPSQALTMLSRVMVVLQQQAAEELQRNSCSRLQ"
FT   RBS             complement(215450..215455)
FT                   /note="possible RBS"
FT   CDS             complement(215505..216710)
FT                   /transl_table=11
FT                   /gene="HCM1.286c"
FT                   /product="putative DNA-binding protein"
FT                   /note="HCM1.286c, possible DNA-binding protein, len: 401
FT                   aa: unknown function, contains probable helix-turn-helix
FT                   motif at aa 169-190 (Score 1483, +4.24 SD). Similar to
FT                   HCM1.58c, possible DNA-binding protein (385 aa), fasta
FT                   scores; E(): 3e-21, 31.6% identity in 297 aa overlap and
FT                   HCM.63c, hypothetical protein (358 aa), fasta scores; E():
FT                   7.1e-13, 31.9% identity in 191 aa overlap"
FT                   /db_xref="GOA:Q935G3"
FT                   /db_xref="UniProtKB/TrEMBL:Q935G3"
FT                   /protein_id="CAD09863.1"
FT                   /translation="MSTVENDVKTANNDISLRTYLERTGNGARKSNGLVINPAVVEEEE
FT                   GFNTRTAGIGESYYSLPDVVAHLNSLKESYKIDPLSVQAIVVQILNGRPVLRQGACRIR
FT                   AVAMANIELADEGRELITLIRCEEFRGSRASAEQFTLDGNSNLALSVVAEALSIKRMVE
FT                   DAEEPKTFAELAKRRGKTEQHLRQMVRVLDLPEALQAMLVKGEVSMYVALDEYLYSGDE
FT                   AVNNITKAIDVYGKATAKTLKFVKAGNIDAAMKPKAAIVPDANATPPETTVTEQTSGEG
FT                   TNDETTPPQLVDGSAGTNPEPTPERTPAPQMKDPVKTPEPKAVSVSSVLNKKTVTTIAD
FT                   TAIPLFSRIAEEAKQRAAKNLSDDTYTLVLTNDEMNAICEAHGDLTQYLRKHAEKQNKG
FT                   QA"
FT   RBS             complement(216718..216722)
FT                   /note="possible RBS"
FT   CDS             complement(216827..217223)
FT                   /pseudo
FT                   /transl_table=11
FT                   /gene="HCM1.287c"
FT                   /product="hypothetical protein (pseudogene)"
FT                   /note="HCM1.287c, possible pseudogene, len: 397 bp; unknown
FT                   function, may change frame (from frame 5 to frame 6) at
FT                   {g}8, suggesting that this CDS is subject to slipped-strand
FT                   mispairing"
FT   repeat_region   complement(216982..216989)
FT                   /note="(g)8"
FT   CDS             217313..217504
FT                   /transl_table=11
FT                   /gene="HCM1.288"
FT                   /product="hypothetical protein"
FT                   /note="HCM1.288 hypothetical protein, len: 63 aa: unknown
FT                   function"
FT                   /db_xref="UniProtKB/TrEMBL:Q9L5P0"
FT                   /protein_id="CAD09865.1"
FT                   /translation="MSSTDRYSLHGQPGTEIAPCRRKAENLKFDKAAGSYFLHVQTNKG
FT                   LADDRKEKRVSPTGETLF"
FT   CDS             complement(217566..217724)
FT                   /transl_table=11
FT                   /gene="HCM1.290c"
FT                   /product="putative stable plasmid inheritance protein"
FT                   /note="HCM1.290c, probable stable plasmid inheritance
FT                   protein, len: 52 aa; similar to many proteins implicated in
FT                   killing of plasmid-free cells e.g. SW:HOK_ECOLI
FT                   (EMBL:X05813), hok, Escherichia coli HoK protein from
FT                   plasmid IncFII R1 (52 aa), fasta scores; E(): 5e-13, 73.1%
FT                   identity in 52 aa overlap. Contains Pfam match to entry
FT                   PF01848 HOK_GEF, Hok/gef family and PS00556 Hok/gef family
FT                   cell toxic proteins signature. Contains hydrophobic,
FT                   possible membrane-spanning region"
FT                   /db_xref="GOA:Q935G2"
FT                   /db_xref="InterPro:IPR000021"
FT                   /db_xref="InterPro:IPR018084"
FT                   /db_xref="UniProtKB/TrEMBL:Q935G2"
FT                   /protein_id="CAD09866.1"
FT                   /translation="MKLPNQPVVLCVLIVCLTLLIFTWLTRNSLCELRLKDGTREVSAV
FT                   MDYESGK"
FT   misc_feature    complement(217569..217718)
FT                   /note="Pfam match to entry PF01848 HOK_GEF, Hok/gef family,
FT                   score 89.60, E-value 6.2e-23"
FT   misc_feature    complement(217632..217691)
FT                   /note="PS00556 Hok/gef family cell toxic proteins
FT                   signature"
FT   RBS             complement(217734..217739)
FT                   /note="possible RBS"
XX
SQ   Sequence 218160 BP; 57942 A; 50902 C; 52901 G; 56415 T; 0 other;
     ggcgattttc tccagttcct catcgaggcg ggtatacgtc agcctcctga ttttcaagat        60
     ttccttgtga agccagcgtt tgataaaggg attgccggaa agcagtacca ggtctgcatc       120
     ctccacttca tcaaaaagcc agacgggttt tgccggagta aggcggtaga gccaggggcg       180
     ggaaaactcc cccgttgcaa tcagaaacca gacaaccatg ccaagtgcga actcgatgac       240
     cagcatcagg gtaaactgaa tatcccggac gtcaggctct ccggtaaagc tcattaggcg       300
     gtcgccagtt gccagacgct gaataataca gaccagcatc agcagagcca gtaacagcgc       360
     catgagcagc ccgccgttca cttcaaaagt agctttctgg acgcgatcag gcggcacctg       420
     cttacggtag cggccgacca catcaccaat cattaccctg atggctatgc gttcttcatc       480
     gaccgttgtt tcggtaaatc cggacgggcc cgtttctgtt tgattcatgt accctctcct       540
     ctctctgaaa aataatggta agacgcaagc tgatcatacc aggtgagcag gagtggtttt       600
     gtcggttaaa ggctggaaaa aaacggttaa aaaaagaggg aaatgacagc aagaaggtgg       660
     gatgcagtaa gcggctttgg ttccctccgg ttctgtgggg aggaaacggc cagaacagca       720
     gaccgatacg atgggcgggc gctattttgt atccagaatt cgtgcctttt cttcccgcgt       780
     cgccagtcgg gcacttccgg aacggtcgcg gatcagcagt ggcttttcct ttttccaacc       840
     agtgatagcc gtttccccga aacgacgcgg tgcattgcca ttccagctgg caatcacgtg       900
     attatcgtgt acttccttga tgacgacaga atgaagagtc accgtcttaa tggtggtgtt       960
     tcccattttg gtccgggaga gtgaccagac ggtcatcccc acctccagct gactgagttt      1020
     catctttact ccggtaatat cgggatacat cattaaacga cgtggagacg taggttagca      1080
     taagcactca cagcggatac tgccgccaga taacagggtg aggtatccgc catgagcagt      1140
     ctttacggct ggcgttattc ggccagggcg cgggtaatag acgcacgctg acgctggcgc      1200
     tcagccttac gctggctgcg gcgatatagc ggcttcgcgg cagcgtagcg acaatcttcc      1260
     gggtggtacc agcaacagcc gcagggctca ggctggggtt ttccggcaag tccgaatggt      1320
     ttcataatgt caccttttaa atggaataat gttcaggtcc cgtccatcag gccacgggtt      1380
     cattaatgaa gcggcgttgc ataaacaggt acagataacc ctctggcgag aacatacaaa      1440
     gattctcggt aatacaggca tcgaggtact tcgtgtcgcc aaggagtcgc ttaatgacag      1500
     ccagctggtt agccgcagac tgaatcagcg gatagccatt cacggcacga tgaatacctg      1560
     agtggaataa cgaacgagcc tttccaatct tttcccgggt tgcgtccatt tccatatcga      1620
     taacagactg acgcgcaaca ttaatagcat tgccggataa ctccgcgaag ctaaccagag      1680
     gcttattcat aaaaaactcc ttccaggtat gtgagcttat tatatcaata cggactttgc      1740
     cccaaacaac ccgactcgaa atattttgga aattactcta ataactaaaa atggcacccg      1800
     gaaaatagaa tgaatttatt ttaagcttgc cgaacatggc tggcggcgga attaaatttg      1860
     ggtaatgact ccaacttatt gatagtgttt tatgttcaga taatgcccga tgactttgtc      1920
     atgcagctcc accgattttg agaacgacag cgacttccgt cccagccgtg ccaggtgctg      1980
     cctcagattc aggttatgcc gctcaattcg ctgcgtatat cgcttgctga ttacgtgcag      2040
     ctttcccttc aggcgggatt catacagcgg ccagccatcc gtcatccata tcaccacgtc      2100
     aaagggtgac agcaggctca taagacgccc cagcgtcgcc atcgtgcgtt caccgaatac      2160
     gtgcgcaaca accgtcttcc ggagcctgtc atacgcgtaa aacagccagc gctggcgcga      2220
     tttagcgcag acgatgacgt cactgcccgg ctgtatgcgc gaggttaccg actgcggcct      2280
     gagtttttta aatgacgtaa aatcgtgttg aggccaacgc ccataatgcg ggcggttgcc      2340
     cggcatccaa cgccattcat ggccatatca atgattttct ggtgcgtacc gggttgagaa      2400
     gcggtgtaag tgaactgcag ttgccatgtt ttacggcagt gagagcagag atagcgctga      2460
     tgtccggcgg tgcttttgcc gttacgcacc accccgtcag tagctgaaca ggagggacag      2520
     ctgatagaaa cagaagccac tggagcacct caaaaacacc atcatacact aaatcagtaa      2580
     gttggcagca tcaccgaaaa taaaatagag agagttttca atccgcatga ctttaaaaaa      2640
     gacaattttt agaaataagc cggataaaaa aatagcttta tccggcactc atattacaac      2700
     cagttcttcc gcttaaagta cagatacggt gccaggcccg cgaggatcat aaagataatc      2760
     gcggcagggt agccgaacct ccacttcagt tctggcataa actcaaagtt catgccatag      2820
     ctggaagcaa cgagcgtcgg cggcaggaat accacggata ccaccgagaa gattttgatg      2880
     atgcggttct gctcgatgtt gataaaaccc attgccgcct gcatcaggaa gttcaccttc      2940
     tggaacaggg attcgttatg cggcagcagg gattcgatat ctcgcaggat ttcacgcgcc      3000
     tgctccagtt gcccacccgg taaacgcgct ttacgcacca ggaagttgag cgcgcgctgg      3060
     gtatccatca gacacaggcg aactttccag ccgatatctt ccagttccgc cagagtggag      3120
     agcgcctcgt cgtactcatc gccctgatgc ccttccataa tcacccggct caactgctcc      3180
     aggtcgctat agatattttc aatttcatct gccaactgtt cgattttggt ttcgaacaga      3240
     tccagcagca actcgtaggc gttaccgtct accatcgact ggctacgggc acgcatacga      3300
     tacagacgaa aagcgggcag ttcacgctca cgcagagtaa acagacgacc atcacggatg      3360
     gtaaatgcca cagtggagtt accggcgtga tcttccgcat cttcaaagaa gaagaaggag      3420
     tgaatatgca ggccgtcgtc gtcttcaaag aaacgtgccg atgcttcgat gtcttccagt      3480
     tccgggcggg ttgccaggct ctggccaagt tcagattgta agcgcagtcg ctcgtcgtcg      3540
     tccggttcga caagatcaat ccatactgca tttacaaggg gttgtgactc ttcgacttcc      3600
     agccgggtca gtcggttatt ttccagttga aatgcgctca gcatgaccgg gactcccaat      3660
     gcttaaaata tcggacagtt cggtgggcac acagaaacaa attgggtttc agaccattaa      3720
     acagcctgac tcagcgcgac gggaaaaatt gaggtcgctg acaaccgcta aggctatcag      3780
     caaaaaggga tagccttagg agttgatcct ggatgacagg atagtgagcc agtatctact      3840
     gggtgtgtcc aaggcgaatg tcctcttaga gtgatcgtgc gcgcatgtta cgccagcaaa      3900
     attttgccgt caacacgcaa cagaacacca cagaacaata gttgaacttc gcgctttttg      3960
     gtactcgtca aggtcgctaa caggataaaa aaatcccaca tccaggacct ataatggcgc      4020
     atcagctact cattggtaaa ggaatgatca ccttgaatct caaacggatt tttctcgccc      4080
     tcaccttact tcccttgttt gctgttgccg ctgatgattg cgcactctca gatccgacgc      4140
     tgaccgtaca ggcgtatacc gttaatcctc aaacagagcg ggtgaaaatg tactggcaaa      4200
     aagccaatgg cgaagcgtgg ggaacgttac atgctctgct ggcggatatt aatagtcagg      4260
     gtcaggtgca gatggcgatg aacggcggca tcttaaattt gacggttttt gatataaaat      4320
     atagaaagaa ggaggttttc tgaatacctc cttcactggc gctcagttcg agaatacgtt      4380
     aacgctgtac cgtttaccga gcacctcggc agtggtatcg acaattttct gaatatcatc      4440
     ggcaatcgcg ggtttactga atgcgacggt gtgcagttca ccagcctgtt ccgccgtcgc      4500
     accatcatga aagcggctgg catcgtaaag ctggacccgg agtgtccggg tataatcgac      4560
     atggcccatt attcctctcc tgttcagtca ggcgctatac gcgttaataa tcactttctt      4620
     ccggttgcgg ctgggtgaca aactggtact tcaccccatt agggacgcca acggcttttg      4680
     ctacagattc acacagcagc gacaggtcat tcagagtcat cggatattcg atatcgacgg      4740
     aatataaggc cccggcgttc tcggcctctt cgatattttt atactgggca ctgaaaatgg      4800
     ctatggtaga gatttcaagg ttatgcatga gtcagtcctt gttaataaaa aagaagccac      4860
     cgtaaggtgg ctgaataaag gttaatggac ctggctggcc tttttttccg cgttcttgtt      4920
     gtaatcaacg cgggcaataa cgacggcagc ggccaggagt gcagcgagac cgccgtagaa      4980
     tactggtcgg gagatatcga cgaacatatc gctcaggtta tcaacgccga ggagaaatac      5040
     gcagataatg acgataaagc gaacaggttt gctgtagaac aatttcatca ggagctatcc      5100
     ttctggggtg aaatgacacc agcattacac catatcagat gccaattttt tttcggtaac      5160
     gggcctattt tgacaagaaa aaagacacat cagggaggca atgacgagag tattttcgag      5220
     gtgcctatgg cctgtcactt cctgaactca ggaaaagaac gatgctgtag aacacaatcg      5280
     aaatatagaa aagtaacttt tccaccgacg atatgtccgg cggcaagtta ttcttatgca      5340
     gggcacaaat cagtgaattg ggttccgcgc gggaaagtca aaaaaacttg catgtcgttc      5400
     cggatgccag gcgacgtagc acatagattt gggcctgtgt aagcggggag ctgggacgtt      5460
     ttgtgtctgc cataatgttc cttttataac gagggctgtc cggctgacag attagcggac      5520
     agacctgaaa ataacgtgca tatccagcac ctggctgaat ccctgagcga ggcaaatgcc      5580
     tttactcttc cccctccgac aacaacaaaa atgcgttgag cttcctcttc ggcctgttca      5640
     tcagtcatgc ttttctcgcg gatgtgcgaa gtaaacaggc tccagtttgc agcgataaaa      5700
     tcacgtactt gatgcatttc cgaattctca gcgtcaataa ccatttttag tgtcctgtgt      5760
     cttaaataag gtccgccctg ttaatagatc agggacggac tgtttaagcg agatagccag      5820
     cctgtgccgt ggttatccat tcaccagagt gatttttgtg ggggatactt tgatactaaa      5880
     agcattaaat ttctttttaa gagcgagttc aaaccacgcc accgggatag agaccgaact      5940
     atcatcgccg cccaatgcct cctctgcctc gtcataccat tcatcatcaa cagacggatt      6000
     catcccacgg gcatagacaa ccgtatcacg ggaaacaggg gttccatcca gagatgcatt      6060
     ggtaatcaga tagacgccat gatcttttac cagaaggatc tgtggagtca ggcgggccgg      6120
     gtcaatgtgt ttggatgatg gccagaaaat tccccccgtc tggttcattt ccacttctgt      6180
     tttgccctct tcgttgagag gagtaccgcc ggggtaattt gacggttcaa aaagctgttc      6240
     aatggttgca ttgaaccgtt ccgccgagcg gagttcttcg aggagctttt ttaccccagc      6300
     aatttcgaat gttaatgtgg tcataaactt attctccatc cgtagtcagc atcagatatc      6360
     gggtggccag tagcaactct ttgacgtcag cagttgaaac ctcccctttg ccttctaccg      6420
     cgtcctgcaa acgctgacgc gtcgcctgaa tcgtctctga cgacagtgac gccagtttgc      6480
     tcaatacagc gttagctttt tccacagcgg gatacaggga ctctgaggtg gtattgtcta      6540
     catcgttatc gaaaaacagg tcagactcca tattaatatt gtcttcgagc cagctggtaa      6600
     gaatatcaag taaagacata actttattaa tctgcatttt tctcgccctc ggttgatgta      6660
     attcaaatat aacaaactgt ctcgtctggc taataaccca gaatgaaaaa ataagcgatt      6720
     tattagatag gactgaatta aatttaaatg gagtgcagcc ggactcagtt taaaaacact      6780
     ccgcgctaaa ggcagaaaaa agccttccga aagggaaggc ttatgcacta catcaggaaa      6840
     agaactatcg ctgcttctgg agcgcgatat acgctgcgaa aacagctacc aacaccgtca      6900
     tgaagtaaac tagatatgaa ccagattgcc agacattaac gccaaaaaac gaaattaatt      6960
     ttccgtccgg gataacagaa aaaatcaggt tccagaatcc aaccagaacg acctgagaga      7020
     taatcatttt accaagcgat cccagttcat gagccgcata cattgcagcc atgacaaatg      7080
     tcagagctac cacaagcagc gcagacaaag ccacaaccga aatgctcagg ccgacggatg      7140
     taaacagaat ggcatcttta aaagtcagac ctgtaaaacc ccagatcaga atggctaaaa      7200
     tgaaaaacat aaggataaat ttcactagaa ttgcgtccct ctttcggtgg cagagtgtcg      7260
     gtcaggatgc ctgtggcgag gcaactacag acagaattta acacaaaaaa tttaattaca      7320
     aatccgttca caggcctgtt tcaatgattc tttggtatgg ctatgtgcgg cctgatttaa      7380
     caatgcccgg atgtgtagtt catcatgacc gtcagctaca aagagattga ttttactttc      7440
     aaggcggctc atggcttcgt agagttttgc ctctttattg ttcttcataa agcgaagaat      7500
     gtaatccgca ataatatgct ctggtggcgt tttaatttca cggcagcgat tgcttgtcat      7560
     gagtttttcc tcaagtttgt ggcaaaatgg caccatctca tttaagccac ccttttccgg      7620
     ttgtataatt aatttgacct gctttacaca gcgccagcaa acggcgatca agaatatgcg      7680
     acggttgcgg attgctttcc ccggctgcaa tccggtgaca ctctgctttg atctctccgg      7740
     caaataatgt cgagaacggc gtaggaactg gggtaagaat ttcgttgagt gccctgtcca      7800
     gcgccagata cttatccata ttcatgtcct tgcaggtaat tgaatggatg gggtttaaat      7860
     ttattatact gaatcgagtt actaaactaa tatccttcag gatgaagaaa ggaatcatcc      7920
     accttcagta tgtattcgac atataggaca cgtctctaaa atttttcgcg ttttcgcgat      7980
     ttacaccgac aggcctacca gtcaccacct tcgatatgaa gttgcgtcgc agaaacagcc      8040
     accatttcct gcattggctg gtcatgcttg ttatgactac tcccaagcag taggctcacc      8100
     ttgccgttag cggaataaaa catagcatca ggaaaatgct ctctgacttc ccccagcaat      8160
     gtgtgcatcg actgagtcag tcggtagaat cgacgtgcgg cagtcggcat tgcatcatca      8220
     aggagatctc cggcgtcgcc gtccccgctg tttatgaaac tcagtacctt atcttcgtcc      8280
     attcgaacct ctttttcagt catgtcatat atatccattg agatatctgt cagcctgagc      8340
     aacgacatca ggctgacctt cgctcacccg gtaataacga tggcctgttc caattgtggc      8400
     tggcgatccc cccgcagcgc taccgactcc tggaggcgtg cggaaggcat cgtcattgcc      8460
     ttaaacccct catcccgcga acgcaccagc atcccccacg aatgggtttc acagacatcg      8520
     ttctcgaaat tgggttcggt cgacagcagt gattccatct tcggttcgat gtgtaccggc      8580
     gcaatgtttt tataaacagg gtgaacacga cactgttcag acgcttgtgc tcggtagctc      8640
     ccttgcgcca gcagcacgtc atgggaaacc aggtcataat ctgtatcttc gacaaaagtc      8700
     ttcagggtgt gcgttatttt gccgaatcct tcgatattcc agacggacac catcgtaaac      8760
     tcttcaaacg cacggggact tttgaccaaa aatccattca gcgccctacg ccccttcagc      8820
     atccccacca ggtattgctt gttgggataa gggcgcatcg caacaaggtc attaccagtc      8880
     aggcgtagcg acagttccgg gacgcttacg gaatccagcg tgcaaagatt tcccatcgga      8940
     tgcaggattt ttggtacaag gtgcaaaaac atcggtattc tcctcgttta ttaagccttc      9000
     aattattgtg ccgtcgcctg atgtatttcg aaccagaaga caaccggctt ttccgtgact      9060
     tcaattaacc caaatcgctc tgcggttctg aagttgacgc tgtatgccct ggcgcgttct      9120
     acctggcggc ttatttcttt cctcatgcct tcaacactta atgcaccttt aaagagattg      9180
     cagggggcgc aagccggaaa aagattttcg attgcatgca gttcagggtg catgacctta      9240
     ccggtacttc gagcccggtg tgtcactcga cttccagcgg gggctctgac catttcaaaa      9300
     tcccgcctca ccggttcaac atgatcggca tgccagcctt tttccggcaa aggacagccg      9360
     cagtaggcac accgaccgcc aaatttcaaa cgcagttcgg ctcgttgctc tttggatatt      9420
     ttattttttg gttttgaaaa tcgcccatca tcagattcaa ccttcgggag gagttctgaa      9480
     aaattgggta attcgattac tgcgcctttg ttatttagaa ctttcaccgg acctcccaac      9540
     catattaaga cgatttttta tttattttcc tgaattagtt ttcgaatttt aatcaggtgt      9600
     ggtcggctta atttgcatag ctgttcggtc gcggcatcca gagtgggaaa tacatgggcc      9660
     tcattaatat ccagtgtcca gtatttcgct ttaccttctc ccagatcaga ttcaaagtaa      9720
     ttccgcttta ccccaatctg ctttggtctt ccattaattc tgacgatttc atgccgctcg      9780
     tcgaagataa aaccctctcc gaccaacgtc aggaggacaa aagggccctc ggccttttgc      9840
     gtacccagcg aactcatctc attattcata cgacctcccc ggtaatacgc ttaaagttga      9900
     cgacccagac ccacgggttg gcctgccaac tgtcctcgcc gtacgtgttt ttccagaggc      9960
     tgcggaagcc aagaaagtgc ttatcgccaa gaacacaaca ttctgttggt gcgccttcag     10020
     ctttggcatc ttcctcgctg atggtattta accgctctac ccgcaaatcg gtaatttcca     10080
     gtgcaatacg gctggcccag cgaggcatat ggattgaagg tgtccacgca ccttcgaact     10140
     tcatattttc ggtacgaggc ttccagtcgg cctcatcagg gatcgaccac agcccataat     10200
     cccccgaccg ctgttcgcag ctcgcccggt aaatgcgggc tgcttcagtc ctgtccatca     10260
     cgatgttgtc attccagtcc accgcgcacg catcttcatt cccgagcaat gaaaacgcct     10320
     cacggaccgt aatgcggtcg ccaactacgc cgtacggaca aggccgaagc gccgagtatg     10380
     gctgggtccc tgttggaagc caccagtcat gcgtgtgccc gcgatgtcgc ggtgtttgcg     10440
     caggccttat agaccattca tccgaactat attgaggctt tataatccgc cgcgtctgtg     10500
     ttttctgatc tgccagaatt gcccggacca tttcatcatt aaaaagcatt ccacgtgtct     10560
     tcactgtgct gactcctttc acacatggtt cacacattga gaggcctatc cctctttatc     10620
     agccaggcat accgaaactg tcggtagttt tacgggaacg ggcaactgcc cccctacctg     10680
     ataaagtggt gttctccccc aaaattaatc gtattcccca tccactaccg gctcagtcgt     10740
     aatttcatat ttcactccgc cgggtacatc caacgcttta gcgacggact cacacagcaa     10800
     tgacaaatca ttcagggtca ttgggtattc aacttccagg ctgtgcagtg cattggcgct     10860
     ggcagcagca gccttgtcag catgacaggc attaaaaacg aaaacggtgg ttttttcttg     10920
     aataggcata gtgcaatcct ctgaataatt agccctgtga tcagggcggt ttttgattaa     10980
     atttaaatgt tcgttttcaa taattagtga atctgttaat cgggttgtga cttatcattt     11040
     tctccaaccg aagtgctgtc gagaaatgac cattcttgtt tggggctttt atataatgca     11100
     ctagcctcag tactcatcca tgactcacag gctttataag tcatgccttc ctctctaacg     11160
     cggtccttaa aatacgccca ggcttgcaga tcaagcggct gatactcttt cagcgactgg     11220
     tcaagccttt ccttccagat tttcttccga tgagtaaaat gaggaaaagc caggaatgca     11280
     taactacctg caacaaaaaa aaagaacagg agtccgcccc atagagaatg tttgaaaaac     11340
     accagtcctg ggaaaatcca tgccacaatg gcaacaaata aaagaaggtg ctccttccca     11400
     gtaggtttat taaaatgcca ggaaattgca atacacttta atttactaaa gtgattttgt     11460
     ttctccttaa tatcggtcat atatcagtcc ttacttataa aaaaatggtt attattagtc     11520
     tgatgtaaaa gttacttttc aaaacagtcc ctttaacgaa ttccgcacct gcgctcatta     11580
     caacacacac cattcggcgc tttttccgtt aacggggcta ttttcacgtt ttttgcacgt     11640
     atgtctgatt ttgctggtgg gctcacgcca gcaggcggac catacgtttc aacagaggcc     11700
     ttaacaacgc cgccgtcctc tcccggcatt catccacatg ccggaacccc gtctttttcg     11760
     aagactgggg gccggataac atccgcagct cccagatgac ttcccgtaag gttccttcgc     11820
     gctccggcga aatacacccg gctaatgtct ccagaaagcg ttttcttacg gcccggtaat     11880
     acagacgttc ttccggttgc tgtgacgaaa tccgcaggtt acagagggtc aggacagcgt     11940
     caagagtcct tgccttcagt tcgtctcccg tccgggccag atgtagctgt tgttctgtct     12000
     ccagttgcgt cgttatccac ccccccagag gggttttgtt gtaggtgtgc agtgccacac     12060
     aggccgcaac acagcaccag aagcgcagtt tctgccgctg cccccgcagt ttgcgggcta     12120
     cgagcaagcg ataatcgctg tcggtcagga tcttgaaacg gcggctggcg agcagagacg     12180
     gcagcggcgt ctggtcgtta atgccaagac gtgaataggc ctgcccgcgt tgagcgagtc     12240
     gatggtacac cgcacctttc ccccgcgaaa ttcggacggc gccgtatcta agcaggtact     12300
     gtgccgccgc cacaggggta aactcaccgt cagacacacg ctggcgtaat ccgtcatatt     12360
     catgccagat aatccaggat gccgtgtctt catcgaccgt cagctcatcc tcttcttcga     12420
     atgcaacgat gttcaggcct tccccgctac tcatcagact gcgggaagct cgctcatcct     12480
     cccgaccgtc aaaataggct atttcggatg acggatcgga cagcccgtca aatgacgtcc     12540
     cgatacggcc ttccggcaac ttcatccagc gtggtgctgg catcggcgtg cggggtactg     12600
     gttgcatagc tggctcatcg tcgagaagat ccagtgcccc cccttcccac acctggcggt     12660
     aaagttcaat ggcacgaaat gggcgcgggt taaagcaatg cagtgaccag agaaagtcga     12720
     tatgcagcac gttagcctcc tgcaccagtc gaaactgcgg ctccgacatg cggcggttat     12780
     gcgcggtatc ttcgatctcg cctgaaagta acttttcatg caccgctgcg gcccgctgag     12840
     cctccacgta atcgaggctg caacagatat ggaacagtct ttcggtcagg gacgacgaga     12900
     acacattggg ctgaagacgc acatacccgc cctcaaacac tttgcgtccg atataatccc     12960
     gaaggctcca gtcgtactga attttggtca ggaaacgctg aaggcggttg agaccagcct     13020
     ggtagccgta cttctcaggg tcagtgcgga gtaaggtttc catcgagtga tcaatgccga     13080
     cggcgcagca tagcgagcat ccatagcgag cgccgcaggc agaagaccgg acagtggatt     13140
     tctccggcgt ccagatacat tccccggtcg cgtctttgta aagcgtggcg aggctgaagt     13200
     tgtccggcaa aaagcttggc agcggaaatc gcgccagaga accacaggcc atcagaaatg     13260
     accagatatc ctgtgcccgc cactctttca ccgggtacag ttcgccgccg tgctccgtga     13320
     gcgagacgct gtccgcctgc ccgcccattc ttaggatgtt gtctgcccga cgggcgctct     13380
     catcatcgcg ggaacccagc atcaggcaca ctttgttgcg gacagaagca ggtgcatttt     13440
     tcagataacg ggctttggcc tggcgcagtg gagaacgctt tagatctgta gcgcattgac     13500
     gcgtagaaga atttgtccag gttggaagtc cacgcccggt cagaatgcgt ccgacccagc     13560
     tctgggtcat ggacgggcgg gccacaagga cggtcaaagg cagttcttgt tcggcaataa     13620
     aggctctgag ctggctgaga acctgcgtgg cctgatgatg catctcaggg ttttcaatca     13680
     gggtgtcaga catctgaatg aagtggtgct ggctgacgtt cgacccgttt cgtactgcac     13740
     ggatcaaggc cataaggaac aagtgcagta gcgagtgaga gtctttcccg ccgctgtagc     13800
     cgacgcacat ggtccagcct tcggtaatcg catgataaat ggcactggtt gccgtcgtca     13860
     cgcgcgaagc gagactgacc ggctcaccgg catcagtata attcagatcc gcatcggtct     13920
     tcagtgtctg ccagacatcg ccccatttat cctgcgtcag aatggcagcg ttagccgcct     13980
     cagaaaattg aatttctgag ggtaattcaa ggaatgtttc tttcatttcg atatacatat     14040
     tatttcctga atttggcttt cgctgtattg tcgcgatatt tattaaatcc atttaatatc     14100
     ttcagcgcaa tatgtgaagc taaaaatagt taaattgaaa tcatgccaat ttaattaaat     14160
     aacactgaac aaataaaatt acgcggcaat aaatatatta tattctccac gctctcacga     14220
     atactgctgg gtaattaaaa ccgtcgcatt tgattccagc tctgccaacg gaattagggg     14280
     cgtattgagc atcatgtcat cgccgcaatg acggggtaca gccgtcagat gaaatgattc     14340
     tttcatgacc cggatggaag ttgtttccgt gcggcaggag ggcattacgt cccggagcat     14400
     cgtttcctgt ccgctgctgt cactttcaat aaacgcagcc tgcgacatga gaacctcaat     14460
     gtcctcttcc aatgtttcgg accagtggca gtcatagaag aaaaactcgg cggcgtacaa     14520
     atcattttct ttcacgtatg ccgccagttc acggatacgc ttagccagcg acgtatcaat     14580
     ggaaaagaag acgctttgcg ggacatcact cgcaaattca ttgatgcagc tagcggacaa     14640
     aatcaggatt ttattggtca ttttcagctc tccatgccac cggctgttcc ggtggcaatc     14700
     agggattatc aggcagtcac ggggcacaat tcgtcaagtg aaggcagtaa tttgctcagg     14760
     ctttcgtaca cgacgggcat caattcagtg acgctgtgaa gcgccatgct ggtattgtct     14820
     tcttcgctga gaatgataac tccatcctca ccaggattgt cgggcgtgct ctcgtcagag     14880
     gccaggcggt ggcgtgcaac gtcataagcc gattctgatt ttttgcagct catcagatag     14940
     cattgagtgt atgtgtattc gtggttgtac tggttcactt tcaccaacgc atactgaaca     15000
     ccggcatcat gagcttcgtt catcaggcga gaaaaattaa agccttcttc gtagtggtgt     15060
     gtatctttag tcaccacaat agtcgcaccg ccgaactcgt tttcgcgtgg tcggtcgcag     15120
     acgaaagcgg cattgattgt gaccatctca ggcaggttaa acaccgacaa cacggcagtt     15180
     gttaccgcga tagcgtggtc gaggttaatg ctttcatcat ggcagattgc caggccttta     15240
     ccggtgattt ccgctttgag ttccagctcg taattgtttt ctggtgactc cgactgacca     15300
     aaagtcggct caaacggatc gcactccggg tggttctgaa taatacccag gacaagcaat     15360
     tcagtgaggg aacactctga aaccggttta gacagcaagt gttcaccttc cgccacatcc     15420
     gtgtctgtaa catacgcaat cgcgtccagt gccatctgtg cctgttcctg tgaacagaga     15480
     attgtgaagg atgcctgagt gtaattgttc gccattgcat aactccttat ttaattaaat     15540
     gtgattgctg tctgtgaata gataatatca aaacagatac ctgcacctaa taaccaataa     15600
     tgaaatatgt tcgaaatttt tatagagcag acagcgccat atttaataat ccaactttta     15660
     ttctggatac ggtgtaaaat aaatatacgg gaaaacaaaa aaccgccaca agggcggaat     15720
     ttattagacg ggaaagattt ggttatacgg tatgtgtcag ggaggaagca atgagcctgt     15780
     ctggtaacag tgattgtagg gacgcagacg aaataacaag cacctgatcc aagtgcgcta     15840
     caccttcgtc gatatgttgc tggaatgccg cttcagcttc accgcaggag tccgcttcga     15900
     ccagcatcac ctcttcctca tcatcaaaca tcatgcggcc tgagataata tacagtcggc     15960
     ttaagtctgg ggtatttaca gcgatgccct gttagttaat catcattttt ctccgccttc     16020
     aatttttaaa tttgtcagtt ctgctacgtg taaaaaacag catcagccct gtaaacccgg     16080
     acaggtatca acgtagctca ttggtttgcc gatcgcggcg ctcaggcgaa ggatttcgcc     16140
     gatggagacg taccgaagca tttccgaacg cccgtgtttc tggtattcat ccaccgacat     16200
     agtgcgccag tccttgtgcg gtgcggtttt gcacaactgc cagttgttgg cagtggtcgg     16260
     gcgacgcagg acatatacac ccagcgaagg cgtgaggcca ctgccgaatg cctgctccac     16320
     cacaatacgt acttcagagc cgtcggggcg tttcagtgtc tgagtaattt tagtaatgag     16380
     ctgttcggat tccatactat taacctcgac cgtcagttgg gttgctgtag ggatatttta     16440
     ccaaagtcgg ctctctggct aataagtaag aagtgatttt ttttcattca ttgaagtttc     16500
     tttcatatgg aatgaatatt aattatttaa actgactcgg cctattttaa ttattattaa     16560
     tcagggtatt taatgtgcaa attggcaggg cgctgaatta ccgggcatcc attgcccgga     16620
     cagtttatta aaaaaactga taatgccccg ccggagaatt acgccaattc ctgtgaaggc     16680
     atggtctggc tgaaaagtta cttttcccgg ttgccctgcc ttgatcccgt atcgtttata     16740
     ccggtctgct cttacatcct acctgggcag cagctggcta cggtgatcgg gtattaaaat     16800
     agaaccggtc tgttttaccg cagattcaac gccccgcacc tagcgtaaaa tcgcctttcc     16860
     cggatgccct ccttagtcgt ccggcacgat ggcgctactc ccagcgataa ggggtaaaat     16920
     agtcctcgtt aacagcaaga aattcggtca gggaatgcat cgccttcgtg tcatatgccg     16980
     tcacaataaa acggtatccg tccaccgttt cgatgtagct gatcccccgt ggcgtgcaac     17040
     tggatttcac aacttccgcc gtcatcataa actgcccttg cggaaattcc ggtgacaggt     17100
     agataaagcc agtggtggct gatgacgggt tggcattcat cagcacgccg ttaaattgct     17160
     ttccgtgccg cgccggaatc aacgcgctcc ccgctgtcgc ctgagtcatc aactggcgga     17220
     tcagggtttc ctctttatct gagctgtagg cgcgaacatc attttcagcc ccggagcgtg     17280
     agtagacgcc gacatgagca agacgtcggt actcgttacg catataggca tgacaggatg     17340
     caccggctcg cccctgaaga gtgacgccaa agtcttcaca taacatcagt acctggcgca     17400
     ggtttttgtc atagaccgtg gcagagagcg ccaggttata gctgatgaat gtcagctcaa     17460
     aaacccgggt atgtgcgtca ctaaggtgtg cctccatgcg gatcactggt ttctccgtca     17520
     ttggaaacgg cgtaccggcc aagcagtacg aggtaacatc gctaaaacac tcgtcgatca     17580
     cactggcaat gaccgtatcg gcgtcaatga cagccggagc tggaacataa atctgaaact     17640
     gtccttcagt gcccggttgg atcaggacgg ggtatagacg cggggaattg agttgttcgc     17700
     agtcggcatt gatcagttct gtccaaccgg gttttccggt gggagcatca aggcgaagac     17760
     ccaggttatc gcagaagtcg acgatctggc gggagtgctc caccatcact gccccggaga     17820
     gtgtcagacc gtgcgtaacc atctgcatct cactcgtccg ggtctgggag ttctgggacc     17880
     agggctgtaa tgaaagcgtc gtccgactta aggagggaat gatggtttca ttcagaggtt     17940
     caataagctg gcaatgcgca tacagccggg tggcgaggaa gtcaaatatg aagcttgcct     18000
     gttgttttgt gctggcctga atataaaaca tcgcatccat gcctgaatcc cgggatgaaa     18060
     taccgaaaag tttcattttt taccttaatg gatgagcgat ttataatcat gcgccgacag     18120
     gtggacgtta tgtacgccat cgttccactc aaagaatagc cgatattttg aattaactcg     18180
     aatggaagaa taccggtttg cggtcattct taagcgttcg taccgcaaac taccagataa     18240
     caattcgcgt tcgtttttaa cattatttaa cgtttccagt ctgcatgaaa tcgcattaat     18300
     cagttcagca ggaatgcctg ccgtggattt tccattacgg aaaaactttt ccaatcgcct     18360
     gtctttaaat gaatggatca tattttcctc cgtaacgaaa tgagtttaaa taaataagaa     18420
     ttaaaaaagc ctgaatctaa tttattacat cccgaggatt ctggctgcga ccgtcagttg     18480
     tttatcactt aatggaaatt tgcgtgataa cgtcgacttc aggctgttca aaaaactgtt     18540
     ctcgccgtct tgctgcgtga tggcgtccac cagttcttgg tggttctgac accagaggtt     18600
     gaacgcggaa gtctttgatt gaacagcacg ttgacgctct gctgcctgag cggctgagat     18660
     cttgcgagca gcttctgggt atatgcgata cagtgcagtc agggtgtaac aggtacgggt     18720
     agtgaccagg ctatagccag tggcattaca ggcaatacag cggctcttat aaaagtgatt     18780
     gcgttcgcca cgtccattgc atttattgca agtaacacgg taaatatatt ccccggtgcc     18840
     ttttactgaa tcaatacact taatcttagc gttatcgatt gccattccgc tacggtcaaa     18900
     gtatttatcc atttttgatt cctcaggttt ggtctgaagt aataatgaca gattggcctc     18960
     gctggctaat aacctgaacg aacgtttttt gaaaataaat caggaaggat gattgagatg     19020
     atttatatat gcaggattca attttaatgg agggtatttt cagaattatc tgtttacaaa     19080
     aaacgaaaca aatcctaatg aggcatttat tgcatcacaa taaaagtgat tgcttttcac     19140
     tcatttgagt agcgatgctt aagtatttat ccgttttaag gtataacagc agcgtgatac     19200
     ggctcaggga atgcctgtcc gtcaccttaa tgatgcttta cttccggttg ccgaaacagt     19260
     ccatatggct gacatgtata acacgcacgg tctaacgcag ttccgggggg tggcacagcg     19320
     gcgtgatgcc gctttaatct ggaaaacgca ggcatctact ggtgcctcag gatcgcggca     19380
     ctcgcaagct gaaacaccag agcctgttcg tcttccggct gtatcgctcg tccccgtcta     19440
     caaaacccgt ctcatccgca ggtatcgctg gcgcactccc agacggttag aggctttcgg     19500
     gaactgcctg ggtcaaagaa caccggcgtt caggtagctg ttgaaatgga catctacacg     19560
     tttttgttca agtgattcag ttgtggtgag ggcataacgg gtaatgccct cccgtgaagc     19620
     cctgagaaaa gttacttttc caggattaat gcagtcttgc ttttaatata aattcagggg     19680
     atattttttt aaaaaaatac ctgtcgtcaa cttattagaa aagtaagtca aaatgctaga     19740
     gtgttctcat tcaaaaagag gagaactaac catgccaaaa tatttgttac ctgccgagct     19800
     tgcggaaatt gtttgtggat tactggtgca accagcatta ttgaatgaat taaaaacacc     19860
     agccacgcat aaagcattta tgcaggacat cggcgagctg gtggcgaaac attgcggcgg     19920
     tcaaattgac ggcgtgatca tgcctgaggt acgcgatgaa gacagccagg ccgattacct     19980
     gacatctcca gatgaaaccc cttatattgt tgtctctcct ggccaggaca tgcactccct     20040
     cacagataac gtctggcgtc atcatgcccg ggatggctgg cttgaccata tcaaaggcag     20100
     tgtcgaagaa agccctgatg aactgccgac ccacaaagag tgcgctgtac gccgctacac     20160
     cctccagcgt ctgctccttc aggaagaaac cagccatgct aatctgccag tacaggtggt     20220
     acggatgtgt gagtacagca ccgacgatgt tgagcagacc gattcttcag cagagtttaa     20280
     cgtcacaatg gcgctcggtg gtcatgccat gctggcagta aaagatacag attcccgtct     20340
     ggtgatggcc ctgacactct tgattgaaaa tggagttccc tctgtccacg ttaatgcggg     20400
     tgacactgat ccttcagttc tgcacatccg ggcagctcac ggtggtctgg ttctttcaac     20460
     cgactccctt aatcatgatt tcagtatttc gccctctgac cagtatacct acggacgccc     20520
     tggattatta ttgaaagccg cctactgatt tattaattca aaatccgtca ttattattta     20580
     cccccatttt tcgcccctaa cttatggggc gagtatattt taaaaaactt tctttcaggt     20640
     tattagccag caaactagaa ctggtagaat taattcatca gagaaaaggg gactatcatg     20700
     gctaaattaa tttcgacgcg tgaactggca acaattatta ctgcattact ggtaaaacca     20760
     gaattactgg gcgagctgga ttccccagaa aaacatcgcg ccctgatgga agatctgggg     20820
     cgtgttgtgg cagagcattg tggcggtaat gtcactgaaa tcgcactacc ggagaccgat     20880
     ggtacggctg ctgaaggcgc gttgcagaat ggccagcccg tccgctatct ggaaaccaaa     20940
     gaaagctctc cgtatctcat cgtacaccct gacgcctcac tgccgtcggt gacgcaaaac     21000
     gtctggatgc acgctgatca tgatggctgg gaagagcatt tcaacggaga gaccgatgcc     21060
     ctgactccag agatgagcga gcagttccgc cagcaggttt atgcactgct gacgccggaa     21120
     tcccatacca cctcttcaga aatgagactg actttgcagg actggcaact gggtgaagcc     21180
     gagatcccag aagaagactg tcagccctac caggtgaagg tgttagcaga aaataaaaac     21240
     gttcagtgcg aagtgacgaa tgaaaccggc accacgtgtt tcggcctcat tttggagatc     21300
     gaccgtggtg taccgacgct gcacattgat acgggcagtg attcactgct gcacattcac     21360
     gcggcacatg acggcctggt tctgacaccg gatgcaccga gccacagatt tgaagatgct     21420
     cctgtagatc gcttttctta taacagcccg tccctgttgg tgcctggggt gtaaccaggc     21480
     aaactgccca gcggtatttt ggccccgggt aaaattattc agaacaggag tcaggcagat     21540
     gggcgatgtt gccacactac caccgaaaat taacgatggc gtacttcgac gctggaatgc     21600
     tcgcggtaaa gcggataaag aggcgctggc cgactatggc gttagcgtga aggaggagtg     21660
     aattgcgcga attacttgga atggcaggtg cagaacatca agcctccgta atgtatcaaa     21720
     cgttcggaca cctcgacgcg aagctaggcg aaaagcataa aggtcacttc gtttttatca     21780
     acggccagca cggcgatctg tgcgttgtgc atagtgaatt ttcatccttt gacgaaggtc     21840
     caggctattt cagtgaccgt gccgacttca tctgggaatt agttaaaaac gacggcccat     21900
     gctctaaggt cgggatttac cgatttgacg gcgaatacgc gcttcctaag cgccggaatg     21960
     ggagaagatt ttcaggaagc gtaacgtgcc tgcaagcatt ctaattccgt gctgcatgag     22020
     cgccgacagg tcttccgtac aacgggaggc ggcacagttc gcgtgcaacc atccccacac     22080
     aataactcga ctgagtacat aataatgacg aacgctaacg caaatgacgg gaagaccagc     22140
     ccggtattac ccactctcga acaggtctat gctctgctca aggccaacta taaacccgca     22200
     cgatttgctg atcgggatgg ggaaatctgg gggcatgagt attcatggaa cttggcaaga     22260
     tccagtttgc aagacctgga gaaatacggg aaatcatatg tatccaagca ttccgaccgg     22320
     atgggcgatg gattcagttt tggtcctgac ctggtcatta ttcgctgaca tacgcacgga     22380
     agtgagtaag atggctggct gcgccggaga actagagtaa tgaagggtaa aaatatcgtg     22440
     gctcgtgtcg tgcgggaagc ggcctataag tgggaaactc gccaccaatt gcagcaggcg     22500
     tacaattcag cgagtgacgt gggaaaagtt cccagacatt ccggttccgc atctgattta     22560
     cgccagacgc tgtcattttt aattctttgt agggcatgac gatgaaaaac acagtaatac     22620
     cgacggtgac tgaaaacgag atgggagagg tgatcacccg ccactcggct tacggactgg     22680
     tatcagtaag ccgcacgtcc acgacgggac agcgccttta tgcctccgac ctcagtcata     22740
     aagaggtagt cacgatgacc ttcagtgaat cagagcagat tgaacgcgac ggtgtgatcc     22800
     gtcatcgact ggcggaaggc cgacgccgct caccgctcct gcaagtcagt ctgtctccgg     22860
     cgcagtgggc cacgatgatc acatcgttcg gaatgagtga cggcgtgccg tgtaccatta     22920
     acagcctgat tcgcggcgat tatgagcggc agccggagat tggctatatt gagtcgacac     22980
     gcgaacgata cgaacggcag atccgggaag ccgctgagcg tgaaatggcg aaattgcatg     23040
     aaaagctgga agtgctgcgt ttgctggcgg taaaaggcaa ggctggaaag cgtgagcttg     23100
     acgaagccta tcagtcgctg ttaagcgtaa tcaataactt gccggtcaat ctggccttca     23160
     ccaaccaact cattcaggaa tccatggtga atatcgtctc acacggcaag gccgaactcg     23220
     aagccaccgc catgggcgta gccgctcgtc tgggtatgaa agaaatgagc agccttgcct     23280
     cgctggaaga gaagaagtaa ccggtgcgcc cgcccgtaaa tcatgaaatg cactaacgtc     23340
     catacctgct gcacacatac gcggcacaca gatcaacggc cagcgcatac cgcgttgaca     23400
     taaaccgtaa acactgaagt gcgtcgtcct gtcggggaca ttctacgtgg ttttctacgc     23460
     cccccccttc tctcttctgc ggctcacaga acttcaggaa ttgctggtgg gcagtctcca     23520
     ggacgttttc cagtaaccgg ctgtggtcag cgtcatatcc cttcagcagg cgttccagtt     23580
     ctgccatagc gagtgcaggt ggtaaccaga tgacgccaag cagcaaaaac tggctctgca     23640
     ttcgaatttc atggcgatct ggcttcagac cctctgcccg ggaagcgcaa taataaatcc     23700
     tctccagggg agctacacgc gtgataagag gtttctcagc aagttctgac atgcgactaa     23760
     atcagcctgt ttcgtttctt tctgattacg ttaagacact atgaaaaagc cccgtaatac     23820
     ggggccggtt cggaggcagt tactggattt gcggcagctc gatcatgaag cttgattcac     23880
     cgacattgcc gctggtggcc gggaagatgg ggatcaggac gccatcaccc tgcccgaaat     23940
     ctatcgtgat gtctttcgaa tccccgggta cgacggccac cccattcata ctaaccgcaa     24000
     aggccgcatc tttgcggacc gtcagcgtgc cggtttgtgc tccagtgatc agcgaaccat     24060
     cttttttccg gatgctattg gtacgcagat acgccagcgg ctggttatct gatgtcttca     24120
     gccccatacc cacggccagc gttttgagag tgttaaattc aatcaggttg ttcggtacat     24180
     aacggaaccg gctgaccttt gtcgtggtat taccggcttc atctaccgca accgcagtaa     24240
     gctggtagga atccgcatca tctgtcgcgg ggaagatacg cgggtagttc agcccgtatt     24300
     tatcagttcc ctggctgtac cagcccacac tgactttgtc agaagtgggt ccgccgctca     24360
     gcgtgatgct tttcagggaa gcttttgtca tatcgtcggc cagtgtgatc accagatttt     24420
     ccagcccttt gaccagtgct ccgtcagcct gctttccctc aaaactgata tcgacaacag     24480
     gcggcgtgac gtcatgcagg atggtattcg atagcgtcag ttctgccgtg ttgttgtagg     24540
     tgtccgtcgc ggcacccgtt gcagtgtatt tcccggaggg taacgcgctg taatcaaacg     24600
     tcacttgttt cagctggtag ttcaggaccg taacgttttt cggcgacaag gtagagactt     24660
     tattactggt gtccttcagt gtgaggttaa agatattggt ggcccacata taattggtcc     24720
     agtcgttagt tacgtcactg tccgtcacca gcattaccac cgttttatcc agtgggctgg     24780
     agacgatact gttgataacc ggggcgttca tatcccagta ggtgtagaaa tgcgactgta     24840
     gtccgccgag atttgcgtat gaaccggtcc ctctgatatg aatttggtac ggaacatagc     24900
     ctttcccgct cgtcttacag taattcatgc tgacctggca actgctctca cccactgaaa     24960
     cattgcaact gccaatgccg acgatagtag cagtttgcac ataagagcgc ggttcaacgt     25020
     ttacacgacc caaatctacg caatccggcc cggtaaacct gacgatgtca ctcgaagtcc     25080
     atgtattagc atctctgaaa tggtactgcc ctgacaaata gcggggggct tcagccacgc     25140
     cgttacccgg agtaaatttc agcgttttgt actggaggtt gacgttaagg cccgctttag     25200
     tatgaagctc gtagtacata taggtttccg ggtagctcac cgtggcttca gtataaaaat     25260
     aggtattgtc ggagttggta atctgatcga cccagccgaa gtctgtcccg ttaaaattgg     25320
     ttgagtccga tttaaggcgt ttgtacctga atttgactgg gttctcgaaa atagtcatgc     25380
     caggaacata atcttcccag acgcctgttt tcgcattccg cacctgatgt tgaatgtagc     25440
     tgggtattgt acgatcaata ccagagcgat gtgatgtttc tgtccagttc ccggctttgt     25500
     cataaacccg aaaacctacg gtgtaatatg ccggactgac gggcgcaacc gtgcttcctg     25560
     ccgccaccgc cgccagtgcc tggaccaccc ccgtgagtgc attcagctga gcatttacag     25620
     tccggcggac accgctgctg tcaatagcaa accactccgc tttatccagt cctgacctcg     25680
     catcagagac gttcgataac gaaatggcct gggttgcggt cctgtcgccg aaaatatcca     25740
     gacttccgta ctgaaaacca gccctgatcc actgcatcgg atctggtaga acgggaggag     25800
     tgatatcgat gctgaaagag tagctggttg tcgccacgac attcgactta ttgtcgagtg     25860
     tttcggattt aagagaaaaa gtaccctcgc ccagtaccgg cagtgtcatg gacttgccgt     25920
     agtactcact accatcagcg gcagtgatcc tgtcggccac tgtcaccagg ccggtgacac     25980
     tctggaacat ctgcacatta tcggatgaac gtgtcacggt aacgcgctcg tagcggtcga     26040
     gaccagatat cagattcagc gtaattgcgc tgcccgggtt gagatactct ctggtgggtt     26100
     cagcattcac tttcgtgccg cgtgtgtcgg tatacgaata gttgtaaagc tgagcctggc     26160
     tgtaaagcgg gaacagcagt gccgtataga cggcgacaat caacggacgt cggcaaaatt     26220
     tcatttcggt tctcctggtt ggccagaaaa ttttacctga atcgttttct tcgcccgggc     26280
     gctaagaggg gtaattgttc agtaaaacat cgtccgtttg tgtgcttttt gccagattta     26340
     atcggcaggc ctgcgggaaa taccccatcc caatgtccgt tttaggctga ttaattcccc     26400
     agaaatcccc cccttaacgg aaaaatccgc agggcagacg tttaaaatag caacaactaa     26460
     aaggggaata ctgaatgaaa aatcaggcta tagctttggc tatggctatg ctcggagtct     26520
     cagttccggc atctgctcaa atttatgaat ccatcttcac agataccaat ggtattgaag     26580
     ttcacgcccc ctcaacccgg ctgttgctga atccggcctc accggtaacc ctgacgctca     26640
     ttgccggtct tgaccgttat gtgaatgtca aaatcaccag cgccaccggc acgcaactgc     26700
     tgaacaccac tactacgcgc accagcgtat ccgaccgtct gaaggccgga gatggcagcg     26760
     aattttacgg aaaaaaagta actttaccgg tgcttggcga aggcaggtcg gttgtgcagg     26820
     tcagtattct ggatctgaat cagtccgttg tagccaccta cagctacaac tggctggtag     26880
     acaccacacc gctgtctggt aatgccctca caggcaacgc cgcctatgga tcaactgcgg     26940
     gtagcgtctg gaaaatgggg ctggaggcca cggggcagtt tgattttacc tcaaccaatg     27000
     tcacggacgt aaatggcatc gagaaaggta tgttttatgt ctatcacagt aacggcagtc     27060
     tgttcagtac gacgtgactg gtcagaagat gtatcacact tactcaaaaa actcggtcaa     27120
     aggcgcgggt attcccgaca gcaatctgga tgaagatttc acggccaagg tagtcattta     27180
     tgacaacgca ggaaacaccc gaacccttcc gttgcagctc tttcgatatg ataactatct     27240
     gggcggtccg agatccgcaa agctccgcca gcgtggtgcc aggggtttcc ggatatccgg     27300
     cctattcagc tgggatgacc gttaatgaga atccgattca tcttgtatat cgcgtgccaa     27360
     agtccaacta ccggtcatat gccgagggcg gcctgctatt ctataacctg tattcttccc     27420
     cgaccgagat tgcgacggac agcacctata cctacgttga aatgatcctg ccctagtacg     27480
     gtggtatacg ggctggagaa tatccgtata gctctggcgg ataacctgac aacaccccgg     27540
     atcacccgtc ttcagataac cggagggcca acggcagata acgttgagct cacgtggtca     27600
     cctgctggca cgaacgttta tgcgccagaa tatccaaggc tgttcccctc attcgagcct     27660
     tccgaaaact atgcgcttag cgtgacggtc tccgacagtc agtcgaacag caaaacttat     27720
     acccagaaat tcagctacct cccgaataac ctagtgcagt tgcataacct gcgaacctta     27780
     tccgtcagtt cagcactcaa aacgtcgtta aatgagcctc ttgcttatct gtcaaccaac     27840
     gtgttgcgta agtccaacgg tgagattgca aaaacgtcca gagtgcgacg ctaacggtac     27900
     gtaaagacgc tgccttcggt attaagttca acggcgtgca ggccgcgctt ggtgaatctg     27960
     tagaggtgaa aattgatatg gggctcggtg ataacctttt agtacctata taccctgctg     28020
     aaaacggcaa agtgggtaca tccgagttca tgatccagat cgatgagctg aagtaatgag     28080
     aatgggccgt cggtagtact ggcggcttaa cgaaagtaac tttttctgta agggttgaag     28140
     tgtgcttctg atgtttttag aacggatcgg aatttactca cattttgatc gtgatgattc     28200
     aatacgtgac agagcatagt tatcaacagg atagaataat aataaagatc aatagaggat     28260
     caatagcaga tcaaaaagga ataacgatcc tcgcagccca gtgatatcgg gcctctcagc     28320
     ggatcagcat ccactgtaca gggggagaaa tacactatgt cgggtaatcc atccactgta     28380
     ccgggcgcat aatccactat accgggtaga ttcgatacac tatagcgggt aggatgtaga     28440
     tcttatgcac aaaacggatc tcccaatatg tcaagtaata acaacaagtt atctctcgtc     28500
     attgaagagt ccctaaaaga ttcaggggaa gttatacaac tctttcccac attaaaacag     28560
     accattcaac cgaaagtttt actccgccta ggtgtgtttg tgccgacttt gaaatctacg     28620
     gacaaggggg ggaggaagag ccatcatatc gatgccactg agccgctatc aaggttatct     28680
     attgtagagg gtgaaggtta cagccagatc caaatctacg ggccgcgtct cgatatggat     28740
     accgatttca aatcatggtg tgggatcgtt tatgcgttgt ctaaccggcc gcttgattca     28800
     gaaggtcagc tggagctgaa ttttccggag tttgcaaaat tttgtgggtt tgataccaag     28860
     cgcattgata aacaactgaa agagcgcttt gatgcttcgc tgacgcgtat agcccggacc     28920
     aacatttcat ttattaagaa aatacccggt acagatgatc agataacgat aaacatgcac     28980
     ctggtggaat cgacgtatta cgacagttcc acgggaaaaa tcatcatcaa gccaaattcg     29040
     aagctcaata cgctgtatcg cgtcgacggt aaaacccgac tctacctgaa gacattgcaa     29100
     aaactggccc gtaaggagtc cgcacaggcc ctgtacctgt atctggctga gctgccgagc     29160
     accttttacc gcatcggatt cgatcggctt cgtggacgac tccaactgtc atcacacctc     29220
     ggtaaccaga atgccacggt taaaaaggcg ctgggccagc ttaaagagat cggttttctg     29280
     gaatactcca tagacaaaga aaacggcgat tacgtactga atattctaaa gagaaacatg     29340
     aagccatgac cgatgccgga taatgcacct gcctgccgcg tgggtggctg cgttacccgg     29400
     tatagtggac attcttctcc tttccactct gctttacccg gtacaatgga tctccactac     29460
     accgggtagt gtcaggccta aaattacgat gcagcccctc ctcttcagcc ttacactgaa     29520
     tatttagtgt gttttttcac caaaaatgtg atctataccc ggtacagtgg agtcacagaa     29580
     atgtgatccg tacccggtat agtggatgag aactactgct aatcggttac cgggaatgtg     29640
     gtggtactgg gtggaaaggt ttacccggta tagtggatcg tggcagtgtc atctttccgg     29700
     atagcatgac gtcacggtta ggaaaccgta cccggtatag tggatagcga atggtgtaca     29760
     accctgttaa cgtgatgatg ctgaagtgaa agtttaaccc ggtttagtgg agcgacttaa     29820
     agcgcgtacc agtagctgat gggggagcag cacccggtac agtggagggg cggatatcgt     29880
     cgtaaaggtc ttaactaaaa gatgaccatt cagtcgcagc attaaagaaa tatatcatcg     29940
     agtctcaggg gttttaagcc ggtagacacc cttccaccag gagtcgaaag acaagctatc     30000
     atcgcagcgc ataaatatgc cgttatgctt ggtgacaacg ctaagatagc ctttattttt     30060
     cccgcagatc ttctcaaaag actctgttgc tttaataaaa ttttcaccat ccgtgatggc     30120
     cggagaatcc agttccttcg ccagccatgc cggatagctg tccgcattaa cccatacaag     30180
     gcgttcaaca actgaaaaga agacgccgac aaggccaatc gtccaaagcg taataaccag     30240
     taaacgcaaa attcgtaagg ctataaattt tgagtgctgt agaggcgaaa cgataaaagg     30300
     cagtgagatc atgactgtga gtgagactga tgccgccagc aaggtgtata acaatgacca     30360
     tgatttaaca taggcggaaa aagcgatcat taaacaaatc agaatgatga gcggtgcatt     30420
     gcttttcatc atgcccgtgc taattttcat tcttttgggg ctccattttg tacgagtttt     30480
     gagagactgc gtttgtaatc atccgctgcc ttagaaaagt taccgtcatt ctgtaccggc     30540
     gtaaagcgaa tgccaaaaaa cgcctcaatg acggaggaaa gcgtcactat cggtcctgac     30600
     gaggcatggg cttttcgctc ccgagcctca cgctccgcaa agtggatcac cggtccccta     30660
     gaaaatgaga gtgagtcatg ggaagaccag tctgtttata gccacagtag ttaaacgcac     30720
     cccgccagtc cgtcgctgtt tgacatcatg gccgcgaatt aggttaacgt cgcccggtat     30780
     agtgtaatcc caggctgaac ctgtgtttgc agctggtggc cctgcatcca tcaccatgac     30840
     aggcgctggc cgcaggaatc gcgtgccgga tgaagggtat ccactatacc gggtgaatga     30900
     tatgttgatc cacgctgacg ggtagtttta tgagcaaacc cgcagcgagt ggcaggcctg     30960
     tgtcattcgc agttttactg atgggacgga aggttatcca caaaaacggt gaataaccct     31020
     gtgaccggaa tctggataat catcattgcg gcgacaacaa cagaaagaag tggcccggac     31080
     ttggccaccc taccctgctt ttacttcagt tcctctatat tcagcataaa ttcagaagtt     31140
     ccaacgacgc cggaagtcga aggaaaaata gggaagctgc ggctgtcacc cagacccaga     31200
     tccaactgaa catttttgct ctccccagga gctgcggaaa ccccattcac cgtgacgccg     31260
     aaggctgcat ccttacgcac cgtcagtatc gcgtcctgtt tcccggttgc gatagacccg     31320
     tccttcttac gcagctggct ggcataaaga accgccagcg gtgtgtcatc ggacgttttc     31380
     agcgcggtac taacggagat ggtcttaagg ttttccagac gaaccaggtt gttcggcaag     31440
     taactaaatt cgacggcgct ttctttaacg ttgttcatct cgtctttggc ctgcacggta     31500
     agcgtgtaag tttcgccgtc gttaagtgaa ggaaagatct tcgggtaatt cggggcataa     31560
     agattatttc cgaggtttac ccacgacaac tcaacagcat cagataccgg gccaccgcga     31620
     agcgtcattc gcgttaaaga gggcttggtc agggtatctg cgagctgaat acgaatgttc     31680
     tccagtccat acaccgttac actgctggtg ataggtttgg tttcgtagct gatactgatg     31740
     gacggcggcg tgttatcgac cgtcacagtc ttatagtcca gactacccgt attgttgaac     31800
     gaatcctggg cgttgagctg cacgttatag ctgccctccg ggattagttt caggttgaac     31860
     tcgtatgtat aattcccggt tgctgtgtta cgccccgtta gtgttccggt cacattgata     31920
     tccgcgttat tgcgggattt gtcggacagc cacacccggc tcagtttaac ggtatcgaaa     31980
     tacgatccgt ctcccggctg gttgatgtaa acctgaagga tgttggtcgt atcattgtag     32040
     tcatagccag tgaccgaagg ccccagcgta tgccagacga cgttttccca gataggcatg     32100
     aagaaggtgg attctgttgt ggaacgtacc tcataaccac tatgcagata gccggtggtg     32160
     ccgtttgtaa tcgcctgtgt cagggcgacg gtacacgacg ttgacccggc agggatgttg     32220
     caggtggcac cgccagtaat tttttggtcg tagggccttg cctgcacatt gaaacggatc     32280
     tgggtcaggt tcaccggcat atctgaagcc ttgaagtatt tccaattgac gctgttaaac     32340
     caggtaccat cggacatctg tcgctcaatc gccggactcc cccatgcagg actttttacc     32400
     gaagccgggt cccagttcag ccaggaggcg tattgagtca gatcgcctcc ggaccattgg     32460
     tacgtgttca ctgggcgata gtagtttata tccagagcgc cctggggaag cttcacctcg     32520
     acgtacacat aggtcgtgtc ttctgaaata accttagcac cgccataatt gttaagaatg     32580
     gtgatgccgc cgttacggta tggcttccag ttggttcggg ggatacggat gaccatacgg     32640
     tatgggtttt cgagtacaga tagcccccga acaaacggga cgtaccctga agagatcccc     32700
     gggaccacac tcgtactgac gcgtgagtca tgaaccgcaa agggggtgta ttcacctatc     32760
     tggtcatcaa ataaaaagcg ctgcggcgga atattcagcg tgtttccggc tttatctgtg     32820
     atgataaaat tgaaggtaaa ttcttcattg agatcgctgg tgggcatacc gggttgagtg     32880
     accgagtcct tgatccaggg gtaaaaggca cgttttgccg ccgtatcgta actgagtgtg     32940
     ttgtcggaca cgactgtgcc atttccgcgc ttgatgacca gacggatctt gtctatgcca     33000
     ttcgcatcat caactccatc agcaaagatg gaaaactggc cagatcctcc gcgcccaagc     33060
     ccccaaactg ggccactcag gaccatttca tagcctgcgt tctggctcgg gtagatgctg     33120
     gtatactttg gcgctgtagt gtcgattgtg aaatgatacg ttgaagagct gacgacagcc     33180
     tgctggagat ccagagtatc gttgatgacg gtgaaggccc cttcaccgag tgcgggtaac     33240
     gccaagtcct ttccgtaata ttccgtgccg tctgcggcaa caatgcgatc tgcgacgctt     33300
     atctttcctg tcactgcgga atacatgacc tttttgtcac tgtccctggt cacactcact     33360
     cgttcgtatc ggtcaaggcc ggagatcaga ttcagggtca ttgtgcttgc cggattaagg     33420
     tagctctgcg tggcaggctt aagcgtcttt gccagctgat tggtgtcagt atacgaatag     33480
     ctgaaaatct gagccgccgc cggataaact gaagctatgg ccgtggcaat gatacagcct     33540
     gtcagaattt tacgcatgtg atactcccgg gatgtatttg cccctatttt acgaaatctt     33600
     ttcacctggg cttgctggtt agccggggta tttcacggca taaaactttt aaatgttgcc     33660
     gtgatagcaa tgttgtcggg tcagaacaaa acgaaagtta aggcaacttc aacagggctg     33720
     attacggtgg aagaaaagta acttttctct tgagaagaaa taggaaaagc agaaattagg     33780
     acgattaaat gaggtgaaat gtcagcaaca ggcgatgatt gtccatcatc gtaagggagg     33840
     gtacagggtg ccgctgcctt actggcatca tgttgatgtc cagctcttca tacccgtttg     33900
     taccttagcc ggaactgttg ttcagtacag gtaaaagttg taataactcc ccgctcactg     33960
     ccggggagtc attttaaatc agcacggcgc catcagaata gattagcttt caaaccaggg     34020
     cgaatcggca gagttcgcag attcttcact ttgctgtgac tctcccagaa attgcacttc     34080
     acgtactggt ttacttttcc ccaggctccg ctggaaatca tccatcacaa actcaatatc     34140
     atcacggtcc tcaggcaaga caggcgaact tttggacata gtctttcctt cagttaaaag     34200
     cgttctgcat acagaacgcg gacggagacg gcagtgttgt caaactcatt atcgaaggta     34260
     tccatccact cggtcctgaa cccctcgccc agcaggttat cgatcccctg aagggacaga     34320
     ggcaggacgg cagctaaacg cccgccggga accagatgag acgcagcggc cagcagatgc     34380
     agcttagccc ggttgtcagc aaaaggaggg ttcatcacca cgcaatcaaa tttctgaatc     34440
     tgattcgccg ccgaccaggc cagaaaatcg gcttccgtgg tctcgtaacc tttagcccgg     34500
     gagaccagac aattcagtgt atccagttcg atgccggtta cgttgacact tttcgggaaa     34560
     cattgaagca aatccccgtg cccaatattg ggctccagca gccgttcccc ctccccggcc     34620
     gcaataatgg atgcgacgta ttcactgagt cgcgccgacg acggataaaa ctggtgggat     34680
     ttaatatcag gcatggcgcc catatgtccg atgaagcgca tcacttcggt cgggtcataa     34740
     tcaaacgtca catggtagct tgtcactcgg gcaccgagaa atcgcagaac atccgcgttc     34800
     acctgccgcg ttttatcagc gttctcaccg gcatagccga gcgatgtcca gctggaccat     34860
     tccttttcat tctgggtaaa atccagctct gcaagctgca tccgtgaatg aaaatcgatg     34920
     cagcgtttca gtgccgggaa ctcctgcaac gtcgctttgg tatgggccac gcgttcagca     34980
     ggcagagcca gagggacgat ggcagcaaga atgttgttaa gccgttcggc gatatcagga     35040
     tgcacatcaa tgtgcatcga tccgtttttg tagacccgaa aacgaatact gttgccatcc     35100
     aggctgatcc agtttctgaa tccaacatga ccaaccatat tctcaaccat ttttttcgtg     35160
     tcatagaccg gtttaactgt ttcgccccgg aaataagaac agatcacccg caactccgaa     35220
     agtggcatga ggccggattc tttaaactca accttcagtt ttacccattt gtctttcacg     35280
     ccttcacata cgccggaggt gatcatgcga gtagagaagc caaatgcttt attggttttg     35340
     tgttgacggc ttaatgactg aaagacggca tagacacgat ctttaatgaa ctgatgccgg     35400
     tcattgagca acgcgacaac cgtggtaaca acagcatcga gtgtaaaatc agggatctcc     35460
     tgaggaggaa ggtggtaacg gtcagcagta aactgcttat cccattcttt cttcttttcg     35520
     tcagacatca cagacagtac atcggtcagg gccatgaccc tcttccagta ttctgaacgc     35580
     agcgcgtttt ctgcgtagct ggcatccgct tctgaaatga gatgattgta tccggagagg     35640
     tatgaataga gcttctgatt cccgcatttc aggaactgag cggacatgga cctcagtaag     35700
     ctaagctcat cgttatatga ttcgacctgc ctgttaatga catcgagctc ttcccgcatt     35760
     tcgggcagga agttatcgtc gttaataagg aggccagtat gaggcatata agcaaccaga     35820
     gaactcccag gggcacccat tggcagggaa tcagattcaa cagcagacat agcaccagtc     35880
     ctttttgaag ggtttatctg ataccaggat aacaaccttg aacaaaaagc taataggttg     35940
     gctgacatga aaatggagaa attaacactg cggaaagtca gaaagacaga tgtggtttta     36000
     atcagaagaa acgggccgga gacaggacaa aaaaacccct acatagtagg ggcaacgggg     36060
     ggagagcctg ggtggctcgc tctaaaatat cgtacttctt attgtagtct tctcacactc     36120
     tgaaataatt catttaagcc tgtgctgggg gtgtttcgga ttgcggttct ccgccatttt     36180
     tatcgttttt cttggttttg taagtcactt tttccccttt caatcgggct tgccgatttt     36240
     cggcccggcg aagctgcttg ttttctgatt ccgtaatctc actttgcagg ttcttgagca     36300
     tctccagcat gctccggttc agcgtaaagg taatttcttc atcttcgctg gagtcggtca     36360
     cctccggcaa ctcgatatca ccgagtttct gcaatagact cgtcgtaatg agtttgaccc     36420
     cttcgacggc ttttgtagcg agaactggtg gaacacgtgc gggtttaaaa tcggaaggga     36480
     caacacggat ctgcccgcgt ggcgttttct taatctggat accgcttgaa tcagcctttt     36540
     caaggtctgc gatcatcttt tcgatccgcg caacagcttc cgtttcaccg aactcatcga     36600
     taagggacag gactgctaca taggaaatgg catcggcatg gatcagtttt ttgagataga     36660
     cacagcagcc ggttaaacga ataagagcag caattgtggt attacttttt ccctcacgtt     36720
     cggcaatacg gtcaagcgac catccaccca gcgcctgaag acgtcggtag gattcaccca     36780
     aagccacagg agaaagagcc aggccacggt ttccgtcaat cgttgtcaat tcgcagctga     36840
     tctcatcggc tttcatctcg atgcaaagaa tggtgaggtt agaatgccct tctgccacag     36900
     ccatcaaagc agcctttaaa cggcaatgtc cctggcgaac gtacggaatg ccgtctttga     36960
     tcagaacgcg gatagggtct acgtaatcac cccggatgta cgcattcttg atgttattga     37020
     gatgatcggc gacttctggc aactggtaat aagcttcccc cattcccatc tcacgggagt     37080
     tgaatccttc cgtgatttga accacggttg ggctgatagc ccatgctttc tgttcagtga     37140
     cttcattaca aaggtcaggg ttcgcgtcgc ggaactgctt cataccactg acgaatcggc     37200
     cggaaccggt cactgttgaa aaagacacga gtggggattt aaagacccgt gagttagttt     37260
     gctgttggga atcagtcatc agatcactca tagatactcc gttgaattct tttttgtcat     37320
     acctttcatc tgtgcgtgaa tactaccgga aaaaaaaatc tcactttttc gttaaaaagg     37380
     tactttttgg gtctattccg aattgaacga ggaaaattgt tctggcgatc agaacaaaaa     37440
     gaaaaaataa ctcaaataaa acagatggtt atggttaatt cgtaaaggat aaactttttt     37500
     ctgagaagtg aaaaaaaatt aaaaaatgtg tcgaaatgac aatctcgtta acaaaagcca     37560
     cgttttttcc tgctcatacc ttattggtag caatccgcct ttcggtacca taagtgtggc     37620
     ataccgataa agctgaacgg agaagactcg ttgcgaaaac atacaccaat catcaaatgg     37680
     gcggggggta aaaccaaact gatgccgttc ctcagtaagc acttcccaca tgataagagc     37740
     cgacgctggg ttgaaccgtt tatcggcggt ggcgccgtgt ttctgaacat gtttgccacc     37800
     gaggctctcc tagcagacag caacccggac ctaatcaatc tgtaccgcaa catacagcga     37860
     aataaaccgg cattcatcag agaagtgcag ctgctggcgg aaaggcattt tgaagaagag     37920
     gattactacg tgctgcgtaa tacctttaac agcaccagtt ttgatgatgc cccgctacaa     37980
     cgagcagcca ttttctacgc gatgaatcga ctcggatata acggtctgtg tcgttacaac     38040
     ctgaagcgaa agttctcagt tccatgggga aagcgatacc agttcagtct ggatatccag     38100
     aaggttgatt acctctcatt caggctttcg agcgttgaat tgaaaaccgc agattttggt     38160
     cagacgctgg agtttgcagg tggtggtgac caaatatatt gcgatccgcc atatgacaaa     38220
     atcagtaaaa ccagctttgt aagctatgat ggtataccgt tcgataagag cgcacatgtt     38280
     aaactggcgg atatgctggt ggatgctaat cgtaaagggg cctcagtggc catatccaac     38340
     agcatgactc cctttacgct ggagctctat gaagaacgcg gttttgatat tcatactcac     38400
     aacgcttatc ggtctgtcgg cagtcaatca aagtcgcgta agaaggaaat agaaattctg     38460
     gccgtccttc gttgagcggc gatcagtagt tagtcgatcg ggcttatcca ttcctcgaag     38520
     ctcagcactt cggaatggtc acggctggca tagggaataa actgaagctc ttcaattgat     38580
     cgctcccctc tcttaccttc gcatataaac gatatgaacc cctgatctgc aagttgggta     38640
     aggacattca tgattcgtac gttcactgta tgcaactgaa gatcattcac gatatcggta     38700
     attttgtgtg aatggcgccg ggactttcgc aaataatcaa agatgacaaa ctgggcattc     38760
     cgtcgcttca ataatttttc cgtcataaat tcctgaatta atccccccag caacatcagg     38820
     aacggacgaa gtaccccagg gaacgttaac gtataagact gcgatgtttt gaccagagtg     38880
     aaggacgtca ggaagctgaa gtttagtcgc ttctttgaat acgggacata aacagccaat     38940
     gtcgtagaca agtaagtaag caattcttcc agatgagcgc gtgtgatcat gaccgtctta     39000
     tcgctattac gaagaccgtg ataatcaata aatgccactc tggcacgact cagccactcg     39060
     tgaatgctta tggatacagt gaacggtgcg ttttcatcgg cagaaatgac gccgtgctca     39120
     gcgagttggt tatggataag catagacagc tggtaaaatg gaaaacggca ggatggatga     39180
     cactgtaggc cagttagcgt tagctttgca ttatccaagt catcgagcgg aaaagtaact     39240
     tttcgggaaa taatttttgc tgacgttctt gctgacttgc ggatgaaccc aagtccaaga     39300
     tcattttgca tatatcactc cgttttaaca aaatctcctt aacctatatg ttaagaagag     39360
     acaaaaaatt aaaaaatata attaataaga ttatcatttt taatttaaaa gattagttaa     39420
     taacgggtgt tgaatttaaa ataaatcggc ttattttcgg agtgtaaaac cgggtaaaaa     39480
     cccgatgcgt gagcaacaga tttgacgtga gtgagtcggc acgacagtgc agaaagccgg     39540
     tggctaatgt aaaaacggcc tgtatttggg agttccggtc actagacacc aggctatgct     39600
     gttaatttaa acacagtcag taatgcgtag ggcactgagt caaagtagtg gatctttctc     39660
     acttttcccg aaagatgata gctatgcccc aataaaacgt gatcctgaac attaccagtc     39720
     aacgcgaatc catcattctg ctttttgcct gtaaaagtaa aaaaatagct atgagaacct     39780
     tttgaaaacg cagctcgcac ttctgtaaaa ataatatcaa aactaactac atcaccaatg     39840
     ttgaaagaat gttcaattgg aaaaccggcg ttttctgaaa aagcttcaga aacaggctgg     39900
     tatgtcgagt agaaagactc caactgacgg actgttaaaa agagattgtt gtttaactgc     39960
     tgtgcaatgc ttgctgcaaa cttagaattg tcagcttgca gcaatgctaa ctgctcgctg     40020
     tgcctacgtt tccaggcttc aagatcggga ttgcagcgaa gttccgggat agtttcaagg     40080
     aattcaatgc actctttcag taccagcttt tcctctgtgg ctggagacgt tttggagcca     40140
     ttgcatgtca cacagacggc gttcgcaatc tttccagtcc ctccgcattc aaagcactca     40200
     cgggtgataa cggcgtaata gtgtccatct ttaccgtaga taggctttac ggatgatggc     40260
     agtaaataac catcctgagt aaaaaaaaga gaatgtttca ttttttaagg ttctccagtc     40320
     gagcctccac gagctgtaaa gcgtcagtta ccttctgtac gtattgatcg tgcccttctt     40380
     caaaatgatc aaaacgcttt ccagccttga tctcttcaat gttgcgatcg agtgtgcctt     40440
     ttgtaataag tagatcgtta taagtattaa ttacagtaaa ctgtgcaatc ttgtccataa     40500
     acggtcctta gcattctact cacttgttaa caggtcacga atttcatgca gttctgtaac     40560
     cttagatttt ggaatgatga tagcagtatt ttcatcattc agaaggctta ataaaagctg     40620
     gagttttgct tcatctagag tgatctttac actttccgtt gtctttgtga tggaagtgct     40680
     gctgatgttc gtaaataaat tggaatgttg tccgtcgaaa attaattcgg tgagtttatt     40740
     actgtcgttt agtgctggcc gtacagtatc aatcagcccg ataaattcag tttttaagcg     40800
     ttcagttttt ttatgagaaa gccgtttaat acccaatgaa ctgcgagtga tggattttgt     40860
     tttaacttcc ttaggaataa catgaacagg gagtgtttcc gggttatcta gtttctcatc     40920
     gtttgatgat gtttgaacgc ttgatgtctt agataaaaca ggttctggtt cagttgatgg     40980
     tactaaaaga gaacacgatt ccaaatgtgc aaggactttt gcatggtcat tggaatactt     41040
     caacatgatc tcaatcgcga gtgttttttt aatcaggttt agactgatta aacgttgtag     41100
     ttctaaaggc atatcaagga ttttaagctg gttacgaata gcagtgctag accgttgata     41160
     gcgcatagca agggattcaa cggtagagcc aagcttcagc gcctctgcca gtgcataagc     41220
     taaggctacg ggattaagac cgttattcct attcccatca aggttctcca ggtattcttc     41280
     acttttattc ttatagttca taacaactac tgaaatgagc tgaatatcag ctccttccgc     41340
     aagagcaaga gatagtgctc tgtaacggca atgcccctgc cttacaacgt aattggagtc     41400
     tttcttaaca accttaatta aatcgactcg tctgccctct ttataggctt gtttaataga     41460
     aacaatggtc gattttactg gttcctgttc ataacaaagt tcaccaatta ccgcttcacg     41520
     tggattgaat ccagattcga taaaaagtgc tttaggactg atctcaataa tctgatagtc     41580
     gcagtgattc atataacctc ctttttatta catgatacat taattgactc agtttcaaat     41640
     aacccaaaag caaaaaacaa ttaattcggt gcttgactgt aattttagtt atgaaggaat     41700
     taggccattt taatttgaaa tttttaaatc tgaatggttt gaaattaata tatcttaaaa     41760
     gcttaagatt gattgatact tcttccggct gcattcccta cttggctaga gtccgaacct     41820
     gaacttttta ggtcagagtt ggttaacaga cggaatttat ccacgttttc cacaagttag     41880
     atcaattctt tagatcaaga gagatcaaga gagtacaaaa aagatcacag gttccgtaaa     41940
     tgactgattt tattatggaa taagcatgat caggcattca ggtgcatgta aaaagcattt     42000
     gattgaataa gaaaagcatt tacttgaatt gaaaaggcat ttagtttaat gcgagaaaag     42060
     catttgcacg aataatctat tcacatctaa atgtatcaag ggataaacca tggtgggtaa     42120
     atttaaatga gtgataacaa tgaggtaaca catccttttg atgtgaccaa cacggagaca     42180
     gggaagactt atcaactgag tccaaactct tcgaaatcgg tccaacccat tgctttactg     42240
     cgcttaagtg tttttacccc ggtgggaact aaagagaagc gatacagaaa ttttgaggtt     42300
     gacgcttctg atgagttgtc gagcatggag ctggcccgtt cagaaggata cgatgacatt     42360
     cggatcactg gtcttaagct ttcgatgtca accgatttta agtgttggct cggttgcata     42420
     atggcgttca gcaaatatgg tttcgcttcc gataaaatca cattgtcatt caatgagttt     42480
     gcaaaaatgt gtggtatcag ttctacaaac ataaacaagc gaactcgctc acgatttcag     42540
     gaggcgctag caaacctagc ttccgttgtg atttctttcc gtgattcaaa aactgaacgt     42600
     tttactgtca cgcaccttgt gcagaaagca gtgattgatc ctaagaagga caccgtagag     42660
     ttggtgggcg atccctcaat gtgggagctt taccggtatg atcataaaac cttacttagt     42720
     ttgcaggtgc tttcggttct cgctaaaaaa gaggcagcac aaagcctgta catatatttt     42780
     gaggcgatgc ctgccggtac gttattcgta agcatgaagc gtttgcgtga gcgacttctg     42840
     ttgacgactc ctgtacgaac tcaaaaccag atcatcagga aggcgatgct ggagttaaaa     42900
     tcaataggat atcttgaata tcaagaggtt aagaaaggta gagatatcca gttccagatt     42960
     tttaaaagaa gtccaaaact tgctctggca aaacacagtt gatgctccgg gtatagtacg     43020
     cacaaaagtt actttggatg taatgaggag tatgggcatt catccaaatg ctttttaatg     43080
     tttctccgga tttgaacacc cttccctgtt tccaaacttc ctatcatttc tgatacccgg     43140
     gttcttctgg tattcgttcg aatgcttttc agaaaaaatc atgcttgcta gttgagacaa     43200
     cgtaacctat tcattttgct agtttaataa gactcattca tacatatgcc tttaactaca     43260
     ctaccctcca tcgtgttgta ttgggcttta aacgcaaatc cctatactcc ttgtgccact     43320
     cggcgtattt acagttcctt aacgcctgca aacgactggg atatgagcct ggtcgacggc     43380
     attttatgaa tatgcaggcc aatgaaggac ctagagaaat aacataacat tctgataata     43440
     aatgaaaatt actcaaattg gatatcaagg agatgaaagg catttgtttc aatggagagc     43500
     aaaaaagtgc cttttgtata aaagcatttg ctccaatggc ggcagaaaag tgccttttgt     43560
     ataaaagcat ttgcttcaat ggcggcagaa aagtgccttt tgaaaaaagc atttgtatga     43620
     atgctgcggt gaaagttgct tttggtcggg aagcagggct cgcaagggac agtgtaaggt     43680
     gcctttgttc gaaaagcatt tgcacgaata ggagaatgca agttgccttt ggtcggaaag     43740
     catttgaatg aatggggaag tgtaagttgc ctttggttgg aaagcatttg catgaatgag     43800
     tccctgatag gtgtctttgt ttgaaaagca tttgcatgaa tggattcaga agaagtgact     43860
     tttacgataa gcatttgaat gaatgggcac cgcagacgcg cattccccaa tcagcatttg     43920
     aatgaatgag ctccgcagtt ttgctttcat cgaacagcat tcgtatgaat gtgctccgca     43980
     gaggtggctt tcattgaaaa gcatttgtat gaatggggga tacataatcc ttgtgggtga     44040
     aaagcactcg catcaatggg ggaaaagtga cttttggaat gtcatcctta ccgtgtcctt     44100
     tgttaaatat ctggctggat gaatgccata aaaatggtaa aggggcagac gatgcccctc     44160
     ttccctattt ggcatgttaa ttaaacgcac cttctttaat ccgattacat gcgggattct     44220
     tttctgacat tcgatggcta aaaaaacacc aagcgcaatt aagtcaaaaa aaaggtggtt     44280
     aacagaaaaa tgaaagaaaa ataaaaagta ttatgccaat gcgttttcgt gaattcaaat     44340
     caacacggag taattatgga actgacattg aatactaacg ttgaaagagg aaaaactaac     44400
     gcttttgcat ttttgaagtc caaacatgca aaagtgcctt tgtttattct cttggtttta     44460
     gcaaattgca gttttgcgta cgcgggttcc gatgatggag ccttcggcga tatctgggcc     44520
     tacatgagcg aagccttgac tggtgcgccg ggtaaaatca tcgcgtgcgg catgttgttc     44580
     tcggtggctt atttcggcgt tgtaaaacct aaccttggtt tggcgctggt atcagcatta     44640
     atgatgctgg ttatggcaaa cggtgaaaaa attatcagct cgttcctgga tgctggtatt     44700
     cctctgtgat ttgttagaac aataacaatg agggggatat tccccctctc tggagttttt     44760
     atgacaagcc agtacgagat accgccacat acatatcgct ttccatacag aataaatatg     44820
     ccgttactaa ttctattctg ggatgcaaag caattgggta taacattcgt gactatcgcg     44880
     agcggtaata tttttgattt ctttataact tcggtagttg tggcggtggt gttctggttt     44940
     gcatataaga aagcagcaga ggaagggatt agaggaaaac taaaacacaa actgtggtgg     45000
     tacggctttt ttcctggaaa atcggtgttt agtagtcgtt actttaccga tccatttatc     45060
     agaaacctct attcttgatg gagctaagaa tgaaacttct cagcaggtta aaaattccat     45120
     tcattaaaaa ttccagtaat ggcgattttg ataacaagga tgagacttcg caaaaaggag     45180
     gtgaagaagt aaaaggaagt tttctggatt caaaagcacg ctttagtaaa gaaattgaag     45240
     gttctgaaat tggaattaca tatagtgcat tgattaaacg cgacgaaaaa ctcctacgtg     45300
     tgaatacagt tgcaatgatc attattgggg ttctggttgt aaaaaatcaa tttctcactg     45360
     atcctgtgac tatagtgcta ccgccaaata tgacggaaga agtcaaagtt gttggaaata     45420
     aagcctcaga atcatataaa acgcagtggg ccttattctt tagtactttg attggaaaca     45480
     taaacccaac aaacatcggt tttgttacaa caactatatt ggatgcgctt tctccggatt     45540
     tacaggcaaa gacccgggaa tcactacagc agcaaaccaa tataatgcag gctcgtggtg     45600
     tagagcagtc atttaagccg atcgatatgt attacgacac caaaaatgac atggtctatg     45660
     tctggggaac aaagtcaact cgtttgatta atgttccgga caaaactgaa tcatccaaat     45720
     ggacgtttga atgggtcctg ggaatgaaaa atggacgacc gcgcatagcc tatgtgaacc     45780
     agtattcagg tacaccaaat attaagaaaa ttacaatcaa cggcaaagaa caactggcaa     45840
     cactcgataa tccgccgccg tcaataggta actaattatg acttcaaaaa aggtttttca     45900
     ctgcaccgcg attacagcag tgattttgct ggcaacttcg aatgtggtat ttgctgaaga     45960
     ctatcagtta ccggcgacag taaataatcc ggtagttatg cctgtcgggg ccgatgaatt     46020
     tcagaacggt gtgaaaaatg cgataattaa agacactggc actacgactg agaccgtaca     46080
     agcaacaaaa ccgacaactg ctctgccaag tctttcacct gcaagcagtg cttctcccgc     46140
     agtcaatgaa ataaccgggg cgttgtcaaa taaccctact ctagctggtt accagcaaca     46200
     ggttaaatca ggaaattttg atagttacgg aagaccagca gggaaagaac ctcaacaaaa     46260
     tgcacaaagt accgggtccc cttcaaaggc agatgaactt tatgttgaag cacgtaatcg     46320
     ctataaagaa gtacaacgag taaacgttcc gcctggtggc aatattgtac tcccggtttc     46380
     tcgggggctg caaaacagaa tttcgacttc atttaaaaat gcatctgtaa gtacttcaac     46440
     gccagctgat gaagccagta ttttcgttaa tggcggggat gtttttattt caacaaatac     46500
     agataagcct ataggaatta tgctttcaga agattcagtt cctgaatcta cttataacct     46560
     gacactggtt ccactggatg taccaggggc catgatttca gtaacaactt ctttgagccc     46620
     gacaatgcag gcaaaacgag aaacttctct tgataaacaa aattatgatg agatgctggc     46680
     acgctcacaa tcagaagagt tgactccttc agaccctcgg caggatgacc ataaacagcg     46740
     gatcattgat ttgttgactc cggttgcact gggtgaggtt ccttctggtt tcagtttaca     46800
     agaagaccgc ttgtcacgca taccaagctc agagcagtcc ccatgtaatt tcaatatgta     46860
     cgccaagtta ggtcaaagac tggtgggatc tcgggaattg atagatgtcg ttcttgttaa     46920
     gaatgataag ccttacggac aggtagtggc tgatcagcaa tgtataactg aaggcgtggt     46980
     tgcaagcgct ctattcgata aagcattcct tcagcccggg gaagagaccg aactttatat     47040
     tgtgcgggat aaattattta aagagcgtca gactcgtgtt actacgcgcc caagcctgat     47100
     taaaagataa tatgagaaaa gctacttttc ttacagtgat ctcgtttggt ttagttgtct     47160
     ttttgggtac cagttattac taccaaacta agtatatccc gaaaggcacc gtgaatatat     47220
     ttcctgatgt ccaccgacag ggtgagatcg ttgatgatgc ctttgagaaa agcacgattg     47280
     ttataagcga cccaacgctt gcggataaat ttgttggaag ttcaaccgag tctgtcggtc     47340
     ggcatgaagt taatgtaata aaagaattgg gcacgcaaaa taatggttcg aaatttattc     47400
     atgatgagtc tgataaatca ggtttgacgg ttggagataa atggcctagg gctggtgaac     47460
     cttatatcgt gcctcagatg acagaatacg agcggaattt gaaagttaag cgattccagc     47520
     aaccaaagaa tggagttaat aatggacatt aaaaaggcct gggaaaataa aactgtcaga     47580
     atctcagtaa ttggtgctgc attgatggta ttgattgttg tcatcagtca atcaatcttt     47640
     accacaccag ttaaaaaaga gaagaaaacc cagaaaaaag atatgcaaac tggattcctt     47700
     attgatgatt cacaaatgaa caagctgagt aatgaggaaa gccagaagac ttataacgaa     47760
     atggtaaggc agaaccgtat tgaccagaac gctgccaagg ctgaccgtga caaagctgaa     47820
     aaggctcagc aagaaaacaa agcacagata gccagtcttg cttcgcaagt tcagcaactc     47880
     actacgcagt tgactgaaat gcagacctca agaaatggta atcgcaatct cgatgcaggc     47940
     ggaccacgca acaacgtcaa tgaacaagcc ccagcaaagc cataccagct taatccaaat     48000
     gcagcggtga acggggttag ttctggatac gcacctatat ctccgacccg aaacagtcca     48060
     atgcggacaa taacacagag ttcaattaag acaaacggca ctgatggtgt cattcaggtg     48120
     atgccgatat cagagaaccg gatcagagag gggcgcgagg ttgttgcggg aagtgaaaag     48180
     gccccaacgc gaactattcg cggcgatggg actgcacctg ttgatagtaa agctcgtcat     48240
     gcggcccgta aggatgaaat gtttcttcca gcgacgtcaa ttattactgg ggtgctaatt     48300
     accgggctgg aagctccaac gagtttgtcc tctaaagcag aaccgatgcc ggttaccatg     48360
     cgcattaaaa aagacatcat catgcctaac aattacacga tggatttgcg tgattgtaat     48420
     ttattgggtt ctgctgtggg ggatctggca tctcagcgtg cgtacattag ggcaacctcc     48480
     atatcgtgtg tcaactcgaa aggaaaagca ttcgacgtaa tagtggaagc ttatgcggtt     48540
     agtgaaaatg acgggaaaaa tggcattcgt gggaatctga taagcagaaa tggaaatgcg     48600
     attgcaggtt ctgcgtttgc aggagggctg tcagcattgg cggggagtct gagtccatca     48660
     aaggtgtctt cgcttaatat agatccaaac tctacggcac aataccaatc gccaaacata     48720
     ggtgcattag gagcgctggc cggagccggt gcagctcagg ggggtctaaa ccgtcttgtg     48780
     gactactata cgtcaatagc tgagcagcag tggccaattg tagaaattag cccagggcgc     48840
     ccaattactt ttgtcgttca aaaaggggcg acaataccta caaacctgac aagccgctga     48900
     gaataattat ggaaaataac aacgacaatg aatcaccaaa aaagagtgag tctgctgata     48960
     gcttaaatat cgacgcggct aaaccggttg ggggtatacg tactaccaaa aaagtaactt     49020
     tagagatcga tatcgagaaa actcttaagt atctgatggt cgcaggcctg gcagttctta     49080
     tcgtgatcta tggatacaag ggtggacgtt ttgtatatga caacttcaaa gcaatgtcgc     49140
     aaccggccta ccagattgcc gtgctggata tgcaaacttt aagaaaagta tttaataagc     49200
     aaaatccggt gttggattcg cagcaatcca aaactaactt tgaaaattat tttaaggcat     49260
     taatgaaggt ttaccgtgaa cgtggctatt tggttattga tgcatccttg gcagtaacta     49320
     ttccagagaa tgttgaaata gtctcttata tcgaccttgg tggaagtttt ggtgaggtac     49380
     aatctcttcc aggcgaacct aaagaaagtg agattcgata attgaaaaag ttacttttgt     49440
     ctctgctgat ttccattacc tcagcgtgcc cgccgcttac tctggctgtt gaaaatgtat     49500
     taaacaatcg tgatgccgct gcgttaatgg aaaaggcaaa agaaggtgga gtatcaacga     49560
     aacctttaga cggtgtattg gcgaaaatga aaagctataa gcctaaagat gctatttaca     49620
     tccctactgg cggtctttat ttgttccagg atgaacgttc tcagttgatg gcggtgacca     49680
     ctgacggacg gtatacaatc acggggggga gcgtcatgga cattcttcag agaaagtcag     49740
     tgttatcagt agaggatata cgaaagtcgt tctttattaa tttagacgac gcccctttcc     49800
     ctcttgaaac tgtggcatcg atacctttag gaaacccaaa actcaaacgt caagcggcaa     49860
     tatttattac gcttgattgt gacggttgtc aggatttaat aaagaaattc tatgatgaac     49920
     gcgaaaagta tcgggtcgat atagttttaa tcccctcccc cggcgagcca aagcaggaat     49980
     tgcgtcaatt atggtgcagt aaagaaaaag gcaaagtgaa tgatcttgat atcttgcgtt     50040
     ggcttatggg taataaggcc gatatagaaa aacgactcct gacgaaagaa gaggcagaag     50100
     catgtccggc tgaaccgtta gtcgcgtcat taatgctggc tggcatttat aaattacagg     50160
     gagtcccctc agttgtaaga caggatggac tcgctggtaa tggcataccg aaagattttg     50220
     attactggtt aaaacaaagt gtcgaaccct tactcaaaaa cccatttgat actaattaag     50280
     gtaatgaaat gaacattaaa aaagttattt tcagcgctct ggttgttggt tcatcttcat     50340
     acctggcggg ttgtactatt ggcagcgcag aatctgaatg cccgggaatt gaaaaaggag     50400
     ttatttgtaa aggcccgcgt gaagttatgg aactgacgaa caatcgtgat gatctctccg     50460
     gccttgggga ggaagaggct aattcgggaa aggggaaatc ggctgtcaat gacagccagt     50520
     accctgccca actaacgccg cctggcgcag tgcagtaccc caagtcgtct gtacttgtta     50580
     ataagccagt gacatacaca acgacggaag taaaaccggt tggacagctc ccggtgatgt     50640
     atgatcagac attaaaaatg ggggcgccaa cttcaacaat tggaccacgg ccaatcagcg     50700
     ggaatcctgt taattctaat gtacggatga caacgagtta caactcaaat gggtcatccg     50760
     ttaacccctt tttgcatccg tctgctgaag tcgtgaaaaa aacaactcag gttgttactc     50820
     ccgcgcctgc accgcgctat gtagcaccaa attctgatat caatgcaagt aaagaccttt     50880
     attccattaa caatggacag ccagtaaacc ctacgctcag ctctgggcag gtacagcaat     50940
     accgtacaca aggctacaaa caggcagtcg ttgcaccaga gcctcttgct gtgcttcagc     51000
     aaggccgcgt catgagaatc acctttgcac catatacgga tgataatgac gcgctaaatc     51060
     tgcctggctt tgtttatgtg aatgtcaaac cgcaaacttg gattgcgggc aaaaattcaa     51120
     catcaaatcc ggcacgaatt gttcctttgg aagtccagga tgcggctcgt gaaaatatgc     51180
     aacagcaaca gcgagcaacg aaagcagttt cgtcaaacgg tattgtgaga caactctgag     51240
     gtcacgaatg agatcagcta acgtctataa taaagaatta agccgtcatc agttaggtgg     51300
     atttattccc gtgtatgatc agattccggg tacacattat tttctacttg acggaaaccg     51360
     actcggtttt atgtttatct gtagtccgtc gcccggtgtc tttgataatc agcaggatgt     51420
     gttaactgaa ttatttaaaa tggacttccc aactgacacc atctgtcaga cctcattaac     51480
     tgcgctgcca gacttgatct tgcacttaag tgcctggtct gccgttcgtg gtggtcgaat     51540
     ggaaggtcat gataagctta agggggattt actcactgca tatcaactgg attattatga     51600
     ccgaagcctg aatgaacctt tgaagccgga ccacgataaa ttgatgcttc gagattttca     51660
     ggtctggatt tccttttcaa ttccattgaa gtcagcactt ccttctgaaa tagaaaagag     51720
     tcgcattgat gcgctttact ctgacttaat cagtaagttg aatacagtag gccttttccc     51780
     acacaaagtt ggtgctgaaa attggcttta ttgcatggat aagttattgc atccgggaaa     51840
     aacatcgcgt tggtctgaag gtcatgttga agctagcacc atgagacgcc taaacgagca     51900
     gatcaatgta ccgggtcgaa aatatacagt gacagagaat catttctcat ctacaacgca     51960
     gagcaatgat atttctgagc atcgttattt caaacaatta tcagtagtga agtttccaga     52020
     atttgtaaac tttggctgca tgtatgaact tgtagttaat tggttgaatg gacgtaaaac     52080
     gatctttagc cctttcatga taacccagac tgtccatttc gccgatcctt taaaattatc     52140
     aagagaaaac gtcagatata aggcaattac taacaaacaa gccagtattc caacagtttt     52200
     gacgttttgt ccaagattaa aggatatgga taatgattac atgacgataa cacgcgaact     52260
     ggaagatggg gctcgcctcc tacacagtta tctgacattt actgtaatgg ggaattcagc     52320
     agttgatgtt cagtctgccg cagaccagtt aaaatcattt tatctggaaa gtcgtgttaa     52380
     tgttgctgat gactcgtaca tagtatttcc ctcatttgtt tcaagcctgc cgatgtgtaa     52440
     tgacccaaag acaatactag aactggatcg ttttgaggtc gtgagtaata ctggtgctgc     52500
     gcacatgacc cccatatttg gtccttggaa aggtaatacg gacagacccg tacttaacct     52560
     tgtctcacga gaaggacagc tgttggggct ggatatcttc aagacttctg ccagctataa     52620
     catggtcgtt ggtgcaacgt ctggtgctgg taaatcattc tgggtcgcat acatcattaa     52680
     taattatcta ggcgcaggtc cgcgttctaa taatctgatc cattatcgag atacttttga     52740
     gggattcaaa aacaattctt atgatgcatt tgaccctgat ggagcccaga ttttcgtagt     52800
     tgatgtcgga cgctcatacc aaggtatttc ggaacaatat actaatagtc agtttataga     52860
     ctttgggaaa aagcctgatt ttacgctaaa tccattcgca tttttgactg atgtgactgt     52920
     tggagagcgt gtttttgatg aagcacctgt ctttaatgac gattcaaata atcatgatga     52980
     tgataaggat aaagtagccc agaccattat ggttctaaac cagttaaaaa taatggcatc     53040
     tgaaaaagga aatattgacg attttcaaca atcggtcatg ctgcaactga ttagtgaaga     53100
     atataacgaa tcacgcaaag ttggacgtac aggctctatt actggatttg cgcgacgctg     53160
     ttctaaccat gaagataagc gtattaaaga tatcggtgac cagttggggc aatggtgtga     53220
     aggagggatt tatgggaatc gctttacaga aaatctcccg ccaataaatt ttgatagccg     53280
     gtttattgtt ctggaacttg aagaattgaa ggggacccca caccttcaga ctgtcgttct     53340
     gatgtcgatt attcaggccg ctcagcatgc aatgtttatc aagaaagacg gacgccgccg     53400
     gttgttcata cttgatgagg catgggagta tatccgtccg gacaatgctt caggttccag     53460
     taatcattca aatcaatttt tctcctcttt ccttgaggcc gcttggcgcc gattcaggaa     53520
     aacgaactgt gccggtattt gtattactca atcctttgaa gattacttca cctcatcggt     53580
     tggtcgcgca ctaacggcta actcgccgtg gaagatcatc atgaagcagg aaaaggaaag     53640
     tattgaagcc atgaaggtga acaactactt ctccacaact gatgcggaat atgagcgtat     53700
     gaaaaatatt cgaacggtaa agcgtgcatt ttccgagatg ctcgtacgat tcgaaaattt     53760
     ccaggagata tgtcgcctct atgtagatag aaaaatggag ctttgcttta cgactgacag     53820
     caccgatcgt ggaaaactat gggaaatcca aagccgactt gattgctctt acggcgaagc     53880
     aattgagatt ctgtacgaac aggaagttgc gagcaaatca gctgcctgac gttttaagtt     53940
     actggttacc tcattttgtt ttgactgagg tatccagtac gtctttgaag taaatagttg     54000
     ttagctgtca ttgcctgccc tcccccgaaa taatagcccg ggttaagaat atctagctcg     54060
     gattaagtcc tctcaaaccg tcatacatga aattcgatgc ctttgtcatt cttcttttga     54120
     aggtgaatga atatgatgaa atttactcca gaattattct ccctaccagg cttttgctgt     54180
     gaagttaatc agagcaggta ttatgttttg ggtacaagaa ccaaccaagg gggtgtggtt     54240
     tttgtatggc agatacaaac atcattttta cggttataat aaataaccat tatatagatg     54300
     aatttgtcgt tttttctttt aagtccttga aataattgga tctaatatct agatgatggt     54360
     tgtataaact atacgttaat tagatttgag aatgcaactg ttatgcgatg cgtagatatt     54420
     attaaggtga atggtttgtt aaaacaacca aaaaacaagt aagatcaggt cttatctcca     54480
     taataactta accatctaac tttctggttg gaataagaaa ccattttaag cttattcaat     54540
     aacgaaattt aaccacttga atcgactgac catggtagaa agttggtagg gtaccgtggc     54600
     attgagcccc cttaatcgcc agaccatgga gggaagctgg ttgcgtaccg tggcatttaa     54660
     cccccttaat cgccagacca tggaggaaag ctgggcgtgt cccatggaat ttaaccccct     54720
     taatcgccag accatggagg aaagctggtc gtgtcccgtg gcatttaacc cccttaatcg     54780
     ccagaccatg gaggaaagct ggttgcgtac cgtggcattt aaccccctta atcgccagac     54840
     catggaggaa agctggtcgt gtcccgtggt atttaacccc cttaatcgcc agaccatggg     54900
     gggaagctgg tcgggtactg tggcatttaa ccccttaatc ggcagaccat ggagggatta     54960
     ttgccgggta ccaggccatt taaccactta ctcgtctgta cacgatggga tgctggttgc     55020
     gtagcgcgga attgctcccc tattcaccag ttctttgcta aaggaaagcc agtctaaaag     55080
     gttttccggc caaaactttt tttgtttcac tacagttatt cgcccttccg ttcagcgtga     55140
     taaaatatac aaaaacgtag aggtaaccca taaaagtaaa agagcttata gaccagctta     55200
     aaaggctcga cccggatgcg tatgtagtag ttgctggatt tgaaaaccag tgtactggac     55260
     acgtggctga agcagatacc attaaagaat gcatgacaat tcctgtacga gcggacagca     55320
     tgtcaggtga ccgtacgctt gcaaaagatg gatcaccttc agtctagttg agggggggag     55380
     atgactaccg cacggaatac ttcgttagtg caatagacga cacggatgaa ttggcctaat     55440
     tatacgaatt gccaaaaaac tctcttattg tcaattgtgg gtatgggcaa ttcatattga     55500
     ttgccaaata ttttttgggt attcgggatg tcttaacaac aggatttgcc gaatacccta     55560
     tttttttgcc aaatatttcg tcattctaag tcgagatcca ggccgaatat cttttaatct     55620
     aatccactca atagacagat tctggtggga tacttattgt gtaccgtcgt attaaaccca     55680
     cttaaccgct agggcgtcac gttgtcctgt ctgcaagccg aggcaatttc ccctttagcc     55740
     aatgaccacg gtgcctgctg gtcgggtacc gtgggattta acccccataa tcgccagacc     55800
     atggaggcaa gctggtcggg taccgtggca tttaaccccc ttaatcgcca ggccatgggg     55860
     aggctggtcg cgtagcgtgg catttaaccc tttaatcgcc aggacatggg gtcattctgg     55920
     tcaggtaccg tggtatttaa ctcccttatt cgccagacca tggggaatgc tggtcgcgta     55980
     tcctggcatt taaccccctt aatcgccaga gcatggcggg aagctggccg ggtaccgtgg     56040
     gatttaaccc ccttaatcgc cagaccatgg aggaaagctg ggcgtgtccc atggaattta     56100
     acccccttaa tcgccagacc atggaggaaa gctggtcgtg tcccgtggca tttaaccccc     56160
     ttaatcgcca ggccatgggg aggctggtcg cgtagcgtgg catttaatcc tttaatcgcc     56220
     aggctatggg gaagctggtc tcgtagcgtg gcatttaacc cccttaatcg ccagactatg     56280
     gggaagcagg tcgcgtagtg tggcatttaa cccccttaat cgccaggcca tggagaagca     56340
     ggtcgcgtag cgtggcattt aacctcctta atcgccaggc catggaggaa tgctggtctc     56400
     gtaccatggc atttaacccc cttaatcgcc aggctatggg gtaatgctgg tcgggtaccg     56460
     tgggatttac cccccttatt gccacatcta tggagtgatc ctgctatgtc ggaagattgg     56520
     tattgttgat acttaagagg cttttggaag acttcaatga actgccaatt gaaattcaat     56580
     aatgcagata ttccaaaatc taagaaaaga atacagaacg ttagcgtaat aatagaatta     56640
     aggttactat taaacgcata acgctaaagt atacgcatta tgcgtaaagt ttacgtatat     56700
     acgtttaatt tcactattta ggtaaaaggg atcggaagag aatgaatcta attgataaga     56760
     tcgcccttgt cggtcaacgc atgaagagcg agcagatctc tctgaaagag tcattattgg     56820
     tctcttcgag ggtttcggta tcggatgata gtgtagacgg tgttgatcgc ctaatctata     56880
     accactgctt gaataaaaaa aatctgtcag atttttttgg taaatctcgc gtaactttta     56940
     acaaaatctt agcggatctt gaagaaaaag aactggttgg tgctcctatc taccagaaca     57000
     aaaaccatct ctatacccgc tgggatgtcc agaaaataat ggatgctctg aactatcctc     57060
     gatatagcga ctactactgt agccgtacaa tcgtaacgca gaaccataag ggtggtacgg     57120
     ggaagagtac aacttcaggc gttcttgcag ttgcggcagc acttgatttg catctaaacg     57180
     cgcggatact gttgatcgaa tgggacccac aagggtctat tggaagcggg atgatccaga     57240
     gcgtagcgga agatgatgtt ttcctgactg ctattgacgc catcttaggg gtttacgaag     57300
     aagactcaga ttacagaaaa tatcttgatt tagggtactc ggaagaacaa attattgaag     57360
     gtatgccttt ttcaacacac cttccgaatc ttgatgttat taccgcattc cctacagatg     57420
     cacgtttcaa agataaatac tggcagtgtt ccagagaaga acgaactgag ttattactac     57480
     gttttaaaga ggtaatcctg ccggtcttga agagcaagta cgacctgatc attatcgata     57540
     ctccaccaga agattcgcca atcacatggg cagcggatga agctgctgat ggcattttgg     57600
     ttgccgtttc acctcgtgag tatgattatg cctcaacaac tgatttcatg ttgacgatca     57660
     gtgagcgatt caaacaatcg ccgagcaagg gcgaaaatct aagctggttc aaagtgttgg     57720