LOCUS       KJ778797                7184 bp    DNA     linear   BCT 29-MAR-2016
DEFINITION  Escherichia coli strain 745-54 serotype O170:K-:H1 O-antigen gene
            cluster, complete sequence.
ACCESSION   KJ778797
VERSION     KJ778797.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 7184)
  AUTHORS   DebRoy,C., Fratamico,P.M., Yan,X., Baranzoni,G., Liu,Y.,
            Needleman,D.S., Tebbs,R., O'Connell,C.D., Allred,A., Swimley,M.,
            Mwangi,M., Kapur,V., Raygoza Garay,J.A., Roberts,E.L. and Katani,R.
  TITLE     Comparison of O-Antigen Gene Clusters of All O-Serogroups of
            Escherichia coli and Proposal for Adopting a New Nomenclature for
            O-Typing
  JOURNAL   PLoS ONE 11 (1), E0147434 (2016)
   PUBMED   26824864
  REMARK    Publication Status: Online-Only
REFERENCE   2  (bases 1 to 7184)
  AUTHORS   Yan,X., Fratamico,P.M., Tebbs,R.S., O'Connell,C.D., Swimley,M.,
            Baranzoni,G.M., Debroy,C. and Liu,Y.
  TITLE     Direct Submission
  JOURNAL   Submitted (30-APR-2014) Molecular Characterization of Foodborne
            Pathogens Research Unit, USDA-ARS, 600 East Mermaid Lane, Wyndmoor,
            PA 19038, USA
COMMENT     ##Assembly-Data-START##
            Assembly Method       :: CLC Genomics Workbench v. 7.0
            Coverage              :: >50X
            Sequencing Technology :: IonTorrent
            ##Assembly-Data-END##
FEATURES             Location/Qualifiers
     source          1..7184
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /strain="745-54"
                     /serotype="O170:K-:H1"
                     /db_xref="taxon:562"
     misc_feature    1..7184
                     /note="O-antigen gene cluster"
     gene            69..1316
                     /gene="wzx"
     CDS             69..1316
                     /gene="wzx"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen flippase"
                     /protein_id="AIG62729.1"
                     /translation="MKLNTTLNKNILYLAVVQGSSYILPLITFPYLVRVLGPELFGVL
                     GFCQASMQYLVLLTDYGFNWTATQQVAKNKKDIEKLTRIFWSVFFAKIFLASLAFIFL
                     AACCFLIEKYKELWVVLFSFSPLVLGNVIYPVWFFQGMEKMKWITICTITARCLVIPL
                     TFIFVKNGQDVWVAALIQGAVNLLAGLMGLCLIRKKRWVDKIIVDYNDIKQCLKDGWH
                     VFISTSAISLYTTSTTVILGFVSGPIAVGYFNVANTIRNAAQGLLNPITQAIYPRINA
                     MYDSDYPQAILLIKKTLRYVGALALLGSIFLYMLAPTIINIGVGYDYEQAISILRWMS
                     FLPFIIVLSNIFGVQTMLVHNFKKEFSRILVISGVTNLIIIYPLIRLFSGDGAAISLL
                     ITELMVSTLMYLFLRSKKIHLIY"
     gene            1328..2434
                     /gene="glf"
     CDS             1328..2434
                     /gene="glf"
                     /codon_start=1
                     /transl_table=11
                     /product="UDP-galactopyranose mutase"
                     /protein_id="AIG62730.1"
                     /translation="MYDYLIVGAGLFGAVCAHELNKKGKKTLVIDRRDHIAGNAYTEN
                     NDGIQVHKYGAHIFHTNDKQIWEYVNSFVEFNRFTNSPLASYKNKLYNLPFNMNTFYQ
                     LWGVKTPTDAIDIINEQRKVLNGKVPGNLEEKAISLVGYDIYEKLIKGYTEKQWGRKA
                     TDLPAFIINRLPVRFTFDNNYFSDRYQGIPIGGYTNLVAKMLEGVEVNLGLDFLKDKE
                     YYSKLAKKIIFTGPIDEFFDYCFGMLEYRSLRFETETLDIDNFQGNAVINYTESTVPY
                     TRIIEHKHFDPVETLHTVITKEYPAEWCKGDEPYYPVNDVKNMSLFKKYKELADKSNV
                     IFGGRLGEYKYYDMHQVIRSALNCSNALIESDAK"
     CDS             2431..3363
                     /codon_start=1
                     /transl_table=11
                     /product="N-glycosyltransferase"
                     /protein_id="AIG62731.1"
                     /translation="MIKKKVIAIIVTFNRKNYLLRTINSLYQQTYKVDEIICVDNCST
                     DGTQKYLLDNDIIGRKNFHYYNTGANLGGAGGFKYGIDCLKDFEYEHVWLMDDDVELE
                     SNCLEILISSDHSSKGIVQPTRYYEDGEFFSYDYKYFNFKNPLREFKLGRVTSEDIEN
                     NDSIKIAAVPFEGPLIASDVINAIGNVNDEYFIIADDTDYSIRASRAGFYCFLIPEAK
                     LKRLIKPCSGQDPSWKVFFFHRNVTLVDKYYAPKYVLYIRACVRVMRYVITVSKRKKT
                     ISNFVAMIHGILAAMKNDITNNITDIQKKYADKK"
     CDS             3347..4153
                     /codon_start=1
                     /transl_table=11
                     /product="glycosyl transferase family 2"
                     /protein_id="AIG62732.1"
                     /translation="MQIKNNINDLTIAISTYGERIVNAKKIALEFSRNGFRVDIIHQA
                     DNPDIIEEEIIDNKQIRYFYQNSKGVTKSRNYAIDVCTTKYIWFMDDDITFDYDNIHQ
                     LYGVLKKINCDNVSVCLTRIKDENGQPRKKYPQSGKIYNKRKIISVGTIEIIADATFL
                     KRNDIKFDENFGAGAAYPVGDEALFLNDVLDSNGSIYHFDLYFLFHPKDSSGIYRSKL
                     HFYSKGIVFRRLYGVIGLFYILYLILFRFNFFKEVSSLYLLKGYLVGGRR"
     gene            4153..5325
                     /gene="wzy"
     CDS             4153..5325
                     /gene="wzy"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen polymerase"
                     /protein_id="AIG62733.1"
                     /translation="MRNILNSTIGIFIVFTIFFPLSPFVFSSGNAGALTTICSIIIIF
                     LLLQQKINVTNNLYMLLFPVLLSFIISALYWQEIMLLNYPKYLIFSIIIVSLLQKNIV
                     YIIGKYSTFVIVFALCCAVIGFIYAAIGGSAIYTITNPNGREFYFYLTTFTVTNYSGF
                     IRPSAFFDEPGALSFYICFVVMLREILWPRKRALNFALLAFGIVTLSLAHIVFTILYI
                     IYCLITKPTTKLIVGLVIILILSFVFLAVLPNKDVVFEYLISRSSSDTDGQGRSALLQ
                     AAIDTLQNAGVGLYIFGIDSNCLVNYDEACRYIYPRMGENILSPVVFGGLLTSWLFYF
                     SYIYVGYKSLRKFIPNFIIFSFLLLYLQRPYIYLLSYSFMFMIALRLSIGFFDKEK"
     gene            5327..6163
                     /gene="epsH"
     CDS             5327..6163
                     /gene="epsH"
                     /codon_start=1
                     /transl_table=11
                     /product="glycosyl transferase"
                     /protein_id="AIG62734.1"
                     /translation="MSSRPLIDVVITSYNRLNLLLLALESVLFQKAHVNTIIIVDDNS
                     SFTKDDFFDKAKKIIENDNTEIIFHKNDKNYGACYCRNLGANLSKAELIAFLDDDDSW
                     DPNHLNSLVDCFHEHVVLAYSGKNIINYQTGKIRRSLSKIQDDNQYEQMLRKNYPGST
                     SSILVKKSALMAVNGFDVSLPAIQDYDFYLRICRLGLLKSSGMYTLNYRNDTPLKITN
                     QLQKARAAYNIIIQKYHGRERMILNRTIYKQNIIKCIRYFDFIYLFKFTRDFINFIVE
                     WR"
     gene            6165..7016
                     /gene="glfT1"
     CDS             6165..7016
                     /gene="glfT1"
                     /codon_start=1
                     /transl_table=11
                     /product="galactofuranosyl transferase"
                     /protein_id="AIG62735.1"
                     /translation="MNERANVVAIVVTFKRKEFLCKILDSLIRQTFPINKIIVIDNNS
                     LDGTKELVEDFCRINTEVNRKIKYYDTGENLGGAGGFKCGFEIARNFDYSHLWLMDDD
                     LLPEDNCLEILLKCNIEGIVQPIRMNMDGTCAELSPINYDLKNPFRLRAKTKTVADIY
                     IKDKTPYLFDIHSVPFEGPLITKSVVEKIGFPNEKFFIFNDDLDYSLRARQKKFRICC
                     SSQAKATRLLKNNIKNDLSSWKGYYMLRNYFYIMRKYGDNFMVRLKPHWAIWIFIFYF
                     FLTGKKI"
ORIGIN      
        1 ctggtagctg taaagccagg ggcggtagcg tgtgtaaaaa cacattaaca ttattttgat
       61 ggatacgtgt gaaattaaat acgactttaa ataaaaatat tttatattta gctgttgtcc
      121 aaggaagttc atatattctg ccattaatta cttttcctta tttagtgaga gtgttagggc
      181 ccgagttatt tggggtgcta ggtttttgtc aggcatcaat gcaataccta gtgttattaa
      241 ctgattatgg atttaattgg acggcaactc agcaagtagc taaaaataaa aaagatattg
      301 aaaaattaac tagaattttt tggtctgttt tttttgcaaa aatattcttg gcaagtcttg
      361 cgtttatatt tttagctgca tgttgttttc ttattgaaaa atataaggaa ctgtgggttg
      421 tattattttc atttagtccc ttggtattgg ggaatgtgat ttatcctgta tggtttttcc
      481 aaggtatgga aaaaatgaaa tggataacta tatgtactat tacggctcga tgcttagtga
      541 tacctttaac attcatcttt gttaaaaatg gacaagacgt atgggttgct gcccttatcc
      601 aaggggcggt taacttatta gcaggcctaa tgggattatg tttgattagg aaaaaaagat
      661 gggttgataa gattattgtt gattataatg atattaaaca gtgcttaaag gatggttggc
      721 atgtatttat ttcaacatca gctataagtc tttatacaac aagcactact gtgattctcg
      781 gatttgtctc gggtccaata gctgttggtt attttaatgt ggctaatacg atacgtaatg
      841 ctgctcaggg gttacttaac ccaattactc aagctatata tcctcgcatt aatgctatgt
      901 atgatagtga ctatccccag gcgattctat taataaaaaa aacgctacgt tatgtaggtg
      961 cattggcctt gttgggttca atttttttat atatgttagc cccaacgata attaatatag
     1021 gtgttggata tgattatgaa caagctatat ctatactgcg ctggatgtct tttttaccat
     1081 ttattattgt tttaagtaat atttttggtg tgcaaacaat gcttgttcat aattttaaaa
     1141 aagaatttag cagaatattg gtaattagtg gggtgacaaa tcttataatt atttacccat
     1201 taattcgttt attttctggt gatggtgcgg ctatttcact attaataacg gaattaatgg
     1261 tatcgacgtt aatgtattta tttttacgct cgaaaaaaat tcatttaatt tactaacagg
     1321 agagcaaatg tacgactatc ttatcgttgg agctggttta tttggggcgg tttgtgctca
     1381 cgaacttaat aaaaaaggga aaaaaacgct tgttattgat agaagagacc atattgcagg
     1441 taatgcatat accgaaaata atgatggcat tcaggtacat aagtatggtg ctcatatttt
     1501 ccataccaat gataaacaaa tatgggaata tgtaaattca tttgtcgagt ttaatcggtt
     1561 tactaactct cctctcgcga gttataaaaa taaactttat aatttgccat ttaatatgaa
     1621 tacattctat caactttggg gtgttaaaac accaacagac gccatagata ttatcaatga
     1681 gcaacgtaaa gttttaaatg gtaaagttcc tggtaatctt gaagaaaagg caatatctct
     1741 agtcggttat gatatttatg aaaaattgat aaaaggctat actgaaaaac agtggggcag
     1801 aaaagcaaca gaccttcctg catttattat taatcgattg ccagtccgct ttacttttga
     1861 taataattat ttctctgatc gttaccaagg tattcctatt ggggggtata ctaatctggt
     1921 agcaaaaatg cttgaaggag tggaagttaa tttaggtttg gattttttaa aagataaaga
     1981 atattattca aaactagcca agaaaataat attcacagga ccgattgatg agttttttga
     2041 ttattgcttt ggtatgttag aatatagatc acttcgattt gaaactgaaa cattagatat
     2101 agataatttt caaggtaacg ccgttataaa ttatacagag tcaacggttc catatacaag
     2161 aataattgag cataaacatt ttgatccagt agaaacttta cacactgtga taacaaaaga
     2221 atatccagca gaatggtgta aaggtgatga gccttattat ccagttaatg atgttaaaaa
     2281 tatgagttta ttcaaaaaat acaaggagtt agcagataaa agtaatgtga tttttggggg
     2341 gcgtttaggc gaatataaat attatgatat gcaccaggtt attcgctcgg ctttaaattg
     2401 ttctaatgca ttaatagaaa gtgacgcaaa atgataaaga aaaaagtaat agctattatt
     2461 gtcacattca acaggaagaa ttatttatta aggacaatta actcattata tcagcagact
     2521 tataaagtcg atgagattat ttgtgtggat aattgtagta cagatgggac gcaaaaatat
     2581 cttctggata atgatattat tggaagaaaa aatttccatt attacaatac aggagcaaat
     2641 cttggtgggg caggaggatt taaatatgga atagactgtc tcaaagactt cgaatatgaa
     2701 catgtgtggc tcatggatga cgatgtcgaa ctcgaatcta actgtttaga aattttaatt
     2761 agtagtgacc attccagtaa aggaatagta cagccaacta gatattatga ggacggtgag
     2821 tttttttcct atgattataa atattttaac tttaagaacc cattgaggga gtttaagtta
     2881 ggaagggtca cctctgaaga tatagaaaat aatgacagca ttaaaattgc agctgttcct
     2941 tttgaaggtc ctttaattgc ttcagatgtt attaatgcta taggtaatgt gaatgatgaa
     3001 tactttatca tagctgatga tacagattat tctataagag ctagccgagc tggattttat
     3061 tgtttcctga tccctgaggc aaaattgaag aggttaataa aaccttgttc aggtcaagat
     3121 ccaagctgga aagtattttt ttttcaccga aatgtaactt tagtcgacaa atattatgca
     3181 cctaaatatg tgctatatat tagggcttgt gttagggtta tgagatatgt tattacggtt
     3241 tctaaaagga agaaaacgat aagcaatttt gtggctatga tacatgggat tctagcagca
     3301 atgaaaaatg atattacaaa caacataact gacatacaaa aaaaatatgc agataaaaaa
     3361 taatattaac gacttgacta tagctatatc gacgtatggc gaaagaatag ttaatgcgaa
     3421 gaaaattgct ttggaattta gtcggaatgg tttcagagtt gatattatac atcaggctga
     3481 taacccagat atcattgagg aagagataat agataataaa caaataaggt atttttatca
     3541 gaacagtaaa ggtgtaacaa aaagtagaaa ttatgctata gatgtttgta caaccaaata
     3601 tatttggttt atggatgatg atattacttt tgattatgat aatattcatc agttgtatgg
     3661 agttttaaaa aaaattaatt gtgataatgt ttccgtgtgt ttaacaagaa ttaaagatga
     3721 aaatggtcaa cctcggaaaa aataccctca aagcggcaaa atatataata aaagaaaaat
     3781 tatatcggtt ggtactatag agataattgc agatgcaacc tttctcaaga ggaatgatat
     3841 aaaatttgat gaaaattttg gcgctggagc tgcttatcca gtgggagatg aagcgttgtt
     3901 tttaaatgat gtattagata gcaatggttc aatttatcat tttgatttat actttctttt
     3961 tcatcctaag gattctagtg gaatatatag aagtaaactt catttttaca gcaaaggtat
     4021 agtttttaga cgactgtatg gtgttatagg attattctat atattgtatt tgattttgtt
     4081 ccgatttaat ttttttaaag aggtgtcgtc tttatattta cttaaaggat acttagttgg
     4141 tggaaggcga taatgagaaa tatcttaaac tcaaccattg gtatatttat tgtttttact
     4201 atattctttc cattaagtcc gtttgttttt tcgagtggta atgcaggtgc tttgacaaca
     4261 atttgctcaa taataataat ttttttatta ttacaacaga aaataaatgt gactaataat
     4321 ctatatatgc ttttatttcc tgttttgtta tcatttataa tctcagcctt atattggcaa
     4381 gagattatgt tgttaaatta tcctaagtat ttaatatttt ccataataat tgtttcttta
     4441 ttacaaaaaa acatcgtata tattattggt aaatattcaa catttgttat agtattcgct
     4501 ttgtgttgcg ctgttattgg atttatatat gcagcaatcg gcgggagtgc gatttataca
     4561 ataacaaatc ccaatggacg tgagttttat ttttatctaa caacatttac ggttactaat
     4621 tattctggat tcattagacc gtcagcattt tttgatgagc ctggggcctt atcattctat
     4681 atatgctttg tagtgatgct tcgtgaaata ttgtggccaa gaaagagagc attaaatttt
     4741 gctttacttg cgttcggaat tgttactcta agtctggcac atatagtgtt tacaattctg
     4801 tatattatct attgtcttat taccaaacca actacgaaat taatagttgg tcttgtaata
     4861 attctaatat tatcatttgt ttttttggca gtactaccaa ataaagatgt tgtattcgag
     4921 tatttaattt ctcgttcatc tagtgataca gatggacagg ggcgatcagc acttcttcaa
     4981 gccgcaattg acaccttgca aaatgcgggt gttggattat acatttttgg aattgattct
     5041 aactgcttag taaattatga tgaagcatgt cgctatattt atccaagaat gggagagaac
     5101 attttatctc cagttgtttt tgggggctta ttaacatcat ggctgttcta tttttcttat
     5161 atatatgtag gttacaaaag tttaagaaag ttcattccta attttataat tttttctttt
     5221 ttattattgt atttgcaacg accatatatt tacttattat catattcatt catgtttatg
     5281 atcgcattgc gactaagtat aggttttttt gataaggaaa aataaaatga gctctaggcc
     5341 attaatagat gttgtcatta ctagttataa tagattgaat ctattgctat tagctttaga
     5401 atcagtcctt tttcaaaaag ctcatgttaa tacaatcatc attgtggatg acaattcatc
     5461 atttacaaaa gatgattttt ttgataaagc aaaaaaaatt attgaaaatg ataatactga
     5521 aataattttc cataaaaatg ataaaaacta tggtgcatgt tattgcagaa accttggtgc
     5581 taatttatcc aaggccgaat taatagcgtt tctggatgat gatgatagct gggatcctaa
     5641 tcatttaaat tcacttgttg actgttttca tgaacatgtt gtacttgcat atagcggaaa
     5701 aaatataatt aattaccaaa cagggaaaat aagacgatct ttgtcaaaga tccaggatga
     5761 taatcaatac gaacaaatgc ttagaaaaaa ttatccgggt tcgacttcgt ctattcttgt
     5821 taagaaaagt gcattaatgg cagtaaatgg ttttgatgtg tcattaccag caatccagga
     5881 ttatgatttt tatcttagaa tatgccgtct tggactacta aaaagtagcg gcatgtatac
     5941 cctcaattat aggaatgata ctccgcttaa aataactaat caattacaaa aagctagagc
     6001 agcatataat ataataatcc aaaaatatca tggtcgtgaa agaatgattt taaatcgcac
     6061 aatttataag caaaatataa ttaagtgcat cagatatttt gattttatat atttgtttaa
     6121 atttacgcgt gattttatta attttatagt tgaatggagg taacgtgaac gaaagggcaa
     6181 atgtagttgc aatagttgtc acatttaaac gtaaagaatt tttgtgcaaa atacttgatt
     6241 cgttgattag acaaacattt cctataaata agataattgt tattgataat aatagcttgg
     6301 atggtactaa agagttagtc gaagattttt gtcgaattaa tacggaagtt aacagaaaaa
     6361 taaaatacta tgatactgga gaaaatttgg ggggggcagg agggtttaaa tgtggttttg
     6421 aaattgctag aaattttgat tattcgcatc tctggcttat ggatgacgat ttgttaccgg
     6481 aagataattg tcttgaaatt ctactcaaat gtaatatcga gggcatagtc cagccaatta
     6541 gaatgaatat ggatgggact tgcgctgaac tttctccaat taattatgat cttaaaaatc
     6601 cgtttcgtct acgagcaaag acgaagacag tagcggatat ttacattaaa gacaaaactc
     6661 catacttgtt tgatatacac agtgtacctt ttgaaggccc attaattact aaaagcgttg
     6721 tcgagaaaat tggtttcccg aacgaaaaat tctttatatt taatgatgac ttggattatt
     6781 cattaagagc acgtcaaaag aagtttagga tttgttgttc ttctcaagcc aaagcaacgc
     6841 gtttactgaa aaataatatc aaaaacgatc tttcctcatg gaaaggatat tatatgctaa
     6901 ggaattattt ctatataatg agaaagtatg gggataattt catggtcaga ttaaaacctc
     6961 attgggcgat atggatattt attttttatt tctttttgac tggaaaaaaa atataaacag
     7021 aatattttca gcttatttgg attctaaaga gttaactaac tctaaaaaat tccgccctta
     7081 ataggttagg taagggtata atataattca tgtttatata caccccctga caggagtaaa
     7141 caatgtcaaa gcaacagatc ggcgtcgtcg gtatggcagt gatg
//