LOCUS       KP710590                6089 bp    DNA     linear   BCT 29-MAR-2016
DEFINITION  Escherichia coli strain K 1a serotype O28ab:K-:H- O antigen gene
            cluster, complete sequence.
ACCESSION   KP710590
VERSION     KP710590.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 6089)
  AUTHORS   DebRoy,C., Fratamico,P.M., Yan,X., Baranzoni,G., Liu,Y.,
            Needleman,D.S., Tebbs,R., O'Connell,C.D., Allred,A., Swimley,M.,
            Mwangi,M., Kapur,V., Raygoza Garay,J.A., Roberts,E.L. and Katani,R.
  TITLE     Comparison of O-Antigen Gene Clusters of All O-Serogroups of
            Escherichia coli and Proposal for Adopting a New Nomenclature for
            O-Typing
  JOURNAL   PLoS ONE 11 (1), E0147434 (2016)
   PUBMED   26824864
  REMARK    Publication Status: Online-Only
REFERENCE   2  (bases 1 to 6089)
  AUTHORS   Baranzoni,G.M., Yan,X., Fratamico,P.M., Debroy,C., Tebbs,R.S.,
            Liu,Y., O'Connell,C.D., Swimley,M. and Matheny,S.
  TITLE     Direct Submission
  JOURNAL   Submitted (22-JAN-2015) Molecular Characterization of Foodborne
            Pathogens, United States Department of Agriculture, 600 E Mermaid
            LANE, WYNDMOOR, PA 19038, USA
COMMENT     ##Assembly-Data-START##
            Assembly Method       :: CLC Genomics Workbench v. 7.0
            Coverage              :: >50X
            Sequencing Technology :: IonTorrent
            ##Assembly-Data-END##
FEATURES             Location/Qualifiers
     source          1..6089
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /strain="K 1a"
                     /serotype="O28ab:K-:H-"
                     /db_xref="taxon:562"
     misc_feature    104..5902
                     /note="O antigen gene cluster"
     gene            104..916
                     /gene="wbbD"
     CDS             104..916
                     /gene="wbbD"
                     /codon_start=1
                     /transl_table=11
                     /product="UDP-Gal:alpha-D-GlcNAc-diphosphoundecaprenol
                     beta-1,3-galactosyltransferase"
                     /protein_id="AJR19368.1"
                     /translation="MFSLGVIFTVYQKTDLSKFVKAIESVVNQTKLPQSIIIVCDGCN
                     SDLFKKAISGVVPHSIKLFFYSYSVNSGPGFARDFGIRKAEEDLIAVMDSDDVSVADR
                     FALQLAFFESNENISVCGGFIEEFDNLSGQRKLRRVPLQHSDIQNAIKIKSPVNNVTA
                     MFKRSDYLSSGGYPALRSSEDYSLWARFISSGYKIHNLDSVLVQVEFDIDAIQRRNGL
                     LHFKNDFITQREMLKNGLIDKFEFVRNITKYCIFRFLPVGVKKMLYQHVLRK"
     gene            939..1331
                     /gene="tagD"
     CDS             939..1331
                     /gene="tagD"
                     /codon_start=1
                     /transl_table=11
                     /product="glycerol-3-phosphate cytidylyltransferase"
                     /protein_id="AJR19369.1"
                     /translation="MNRVITFGTFDVFHVGHINILERAASYGEELIVGVSSDALNFSK
                     KQRYPIYSESDRMKIISSLKFVTSVFLEESLELKLDYIKKYKASTLVMGDDWEGRFDW
                     VKSECDVIYLPRTPSISTTEIIEVVRKL"
     gene            1350..2609
                     /gene="wzx"
     CDS             1350..2609
                     /gene="wzx"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen flippase"
                     /protein_id="AJR19370.1"
                     /translation="MIGLKKNIIFMLIYQIVNYLVPLALTPYLVRILGPSSYGELNYS
                     ISIVLYICLFVDFGFTLSATKRITKYIGNSDKISKLFYTVTVAKTFLLITGITILILS
                     ISTLDTINSVKTIIVISAIQIIATVISPLWLFNGLQLTAVFAVFNIIFKVASIPLVFF
                     LVKTPTDVGYAAFFQTAPLFFSSILALIYLYKKKILIYTNYTPRFKLIIRTLNSSLFY
                     YIGTMSVSLYTMSTPIILGLVSTSEQVGFYSASDKIRAAVVGVYVVIGNVIYPRVQRF
                     YHEDDNLGFQYVKKIIIAVIPLCTIASIMLFYISPFITKYFLGEEFGESELILKIMSP
                     MMFLIPLSIILSNYILLGMGHKKIFSRIPMITATIHIIVATILSLKFGSIGASIAILI
                     SEIVSFILLFITCCKLGYIKKLCVLKI"
     gene            2591..3514
                     /gene="epsJ"
     CDS             2591..3514
                     /gene="epsJ"
                     /codon_start=1
                     /transl_table=11
                     /product="glycosyl transferase"
                     /protein_id="AJR19371.1"
                     /translation="MCTEDLISIIIPVFNAQETIDQCLNSIICCKYQNLEIIVINDGS
                     TDASSEIINDFSRRDERIKIITCENNGVSSARNIGIRHATGIWCCFIDSDDFISADYF
                     DILINDDACNYDIIQMKNIVFSPKQNNMNFFKRKQIFPMSGSAALKEKYAIYVWGKLY
                     KSSILKNTSFSRELSIGEDYYYNCQVFKNASIYYSNEGVYYYSLSPGSLSRGDSTGSK
                     IWERFKSANKIFYYLRDNDEKLALQIFTTFGFIGTLRAYSSFKWILYLIKEIDVEQIK
                     KIKFSAVWTSSCNLKAKILSTLVLCSMMVIK"
     gene            3490..4731
                     /gene="wzy"
     CDS             3490..4731
                     /gene="wzy"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen polymerase"
                     /protein_id="AJR19372.1"
                     /translation="MFDDGDKMSIGILVLVFYVIVNFVMGIVFFNDGFLGGDFYGEKI
                     DNKDLFLWVLGGELLLLITFYAIAVLIVKFTFNKRYPEDYYTVSELALKRFNIFLIVL
                     QTSFILFIFATGFGRISLLMDENSSAANINSPIKYIFVILLPDFLFIVYFLVQKNNKK
                     TIVNLSLYLISNIVRGWVSGPVLLIMAIFLVKKFSFKKIKIKTIISLVTCFIIFVPLV
                     TSLKFGVRFQNDEISAVDLVQDSIENNVSYYLRTLNRFQHISEAYSFMDSMTFIRKDY
                     ADNRIALPFFTNDFINITSKIFSFEPQNLLTYGSKVLLDRPFGNIQSGILPWLSIDYF
                     FSISYILTFFIFTILLSRFCKMLTLGYPVSKNIVIWFTIYYYAHGWLFSYMNLLIAMM
                     IFIIFSKVFGGKILNKDNNYA"
     gene            4724..5902
                     /gene="tagF"
     CDS             4724..5902
                     /gene="tagF"
                     /codon_start=1
                     /transl_table=11
                     /product="CDP-glycerol:poly(glycerophosphate)
                     glycerophosphotransferase"
                     /protein_id="AJR19373.1"
                     /translation="MHKFQTLFWSVIFNILSLLFFLFPLKRNRVIFNSAENKNFNYNS
                     RYLFEFLKNYNNEYEIYFVINDADLRAKLSIEHGGKYFITTYSLKSCFLIMRSKFWII
                     STFESPYVCFVRHHRRIVFHLGHGIPLKAIGQLAKFPTKLKLKLQKILRIRPITHALC
                     YSEEYKTNMSAIFNSDFIEYVPLGQPRNDSIVLKDSVETGKLIKESILNVPSFDKAIL
                     YSPTWRPYDKARFFPFADLEANELNSILSQTKTMLFLRGHPFFESFCPDSFENLSNIH
                     WLNNDVIDDITSHLPFFDKIITDYSSIFIDYLCVNKPIGFLQYDYQQYDDMVGFATDD
                     REIFCGVKIESSDDFISFIIDQDDSWMPERLKIARLLNIKNSGNSLENKMFLDSLRKK
                     "
ORIGIN      
        1 attggtagct gtaagccaag ggcggtagcg tttctattca gttttccttg aacaattttt
       61 tgagtttagc ttattgtaac aaataataat gacgagaata tttatgttta gccttggcgt
      121 aatatttaca gtatatcaaa agacagatct ttcgaaattc gttaaagcta ttgaatctgt
      181 tgtcaatcaa acaaagttgc cacaaagtat tataatcgtt tgtgacggtt gcaactcaga
      241 tttatttaaa aaagctatat caggggttgt ccctcatagc atcaaattgt tcttttactc
      301 atattcagtt aactctggac caggatttgc gcgtgatttt ggcatcagaa aggcagaaga
      361 agatttaatt gctgttatgg attctgacga tgtatcggta gctgaccgat ttgcattgca
      421 actcgctttc ttcgaaagta atgaaaacat atctgtttgt ggtggtttta ttgaagagtt
      481 tgataatctc tcgggtcaaa gaaaattgag acgagtgcca ctgcaacatt cagatattca
      541 aaatgctatt aaaataaagt cacctgtaaa taatgttaca gctatgttca agcgatctga
      601 ttatttatct tcgggtggtt acccagcatt acgaagttca gaagattatt cattatgggc
      661 ccgttttatt tcctcaggat ataaaataca caatttagac tctgttttgg ttcaagtcga
      721 atttgatatc gatgcaattc aaagaagaaa tggattattg cattttaaaa atgactttat
      781 tacacaaaga gaaatgctta aaaatggatt gattgataag tttgagtttg taagaaatat
      841 tactaaatat tgtattttta gatttttacc agttggtgta aaaaaaatgt tataccagca
      901 tgtattaaga aaatgaaatt taaatttgga gttgttgtat gaacagggta attacatttg
      961 gaactttcga tgtgtttcat gttgggcata taaatatctt agagagagcg gctagttatg
     1021 gtgaggagct aattgtaggg gtatcttctg atgccttaaa ttttagcaaa aaacaaagat
     1081 atccgattta ctctgagtcc gatcgtatga aaatcattag ttctttgaaa tttgtcacct
     1141 cagtttttct tgaagaatca ttagagttga aacttgatta cataaaaaaa tataaggctt
     1201 ctactcttgt aatgggggat gactgggaag gtcgttttga ctgggtgaaa tcagaatgtg
     1261 atgtgatata tttacctcgt acgccttcaa tttctacaac agaaataatc gaagtcgtga
     1321 gaaaattata acttaaacta gatataataa tgattgggct aaagaaaaac attatcttca
     1381 tgttaatata ccagatagtt aactatctgg ttccacttgc attgactcca tatttagtta
     1441 gaattttggg gcctagtagc tatggggaat taaattattc aatatcaata gttttatata
     1501 tttgtttatt tgttgatttt gggtttacac ttagtgcgac taagcgaatt acgaaatata
     1561 ttgggaactc tgacaaaata tcgaaattgt tttacactgt aactgtcgct aaaacctttt
     1621 tattaataac tggtattacg atcctcatac ttagtatttc gacacttgac actataaact
     1681 cagtaaaaac tataattgtt atatcggcta tccagataat cgcaacagtg atctctccat
     1741 tatggctatt taatggacta cagctaacgg ccgtttttgc agtttttaat attatattta
     1801 aagtcgcatc tatacccctt gttttttttc ttgtaaaaac accgacagat gttggttatg
     1861 ccgcattttt ccaaacggca cctttatttt ttagctctat tttagctttg atttatctgt
     1921 ataagaaaaa aatactgatt tatacgaatt atacaccccg ttttaaatta attatacgca
     1981 ccttaaattc atcacttttt tattatattg ggactatgtc agtaagtctt tatacgatga
     2041 gcactcctat tatacttgga ttagtgtcga ccagtgagca ggtaggtttt tatagtgcaa
     2101 gtgataagat tagggctgca gttgtcggtg tttatgttgt tataggtaac gtcatttacc
     2161 ccagagttca gcgtttttat catgaagatg ataatttggg ctttcaatat gttaaaaaaa
     2221 tcattatcgc tgtaattcct ttgtgcacaa ttgcatcaat aatgttgttt tatatttctc
     2281 catttattac gaaatatttt cttggtgagg aatttggcga atcggaatta atacttaaaa
     2341 taatgtctcc aatgatgttc ctaataccac tatctatcat tttgtcgaac tatatattac
     2401 tggggatggg gcataaaaaa atattttcac gtataccgat gattacagca actattcata
     2461 taattgtagc aacgattcta agtcttaaat tcggttctat tggagcatca attgcaatac
     2521 ttattagcga aatagttagt tttattttgc tttttataac ttgttgtaag ttaggatata
     2581 ttaaaaaatt atgtgtactg aagatttaat atcaataatt attccagttt ttaatgcaca
     2641 agaaacgatc gatcaatgtc tcaatagtat tatatgctgt aaatatcaga acttagaaat
     2701 aattgttatc aatgatggaa gcacagacgc gagtagcgag attataaatg attttagcag
     2761 aagagatgag cggataaaaa ttataacttg cgaaaacaat ggagttagct cagctagaaa
     2821 tataggaatt aggcatgcta caggtatttg gtgttgtttc attgattccg atgattttat
     2881 ttctgcagac tattttgaca tacttattaa tgacgatgct tgtaattatg atattatcca
     2941 aatgaaaaat attgtatttt ctccaaaaca aaataatatg aattttttta agagaaaaca
     3001 aatttttccg atgtctggct ctgcagcatt gaaagaaaaa tatgcgatct atgtctgggg
     3061 gaaattatat aaaagttcaa ttttaaagaa tacatctttc tcgagagaat tatcgatagg
     3121 tgaggattat tattacaact gccaagtctt taaaaatgct tctatatatt attctaatga
     3181 aggtgtttat tactattcgt taagtcctgg ttcgctttca agaggtgatt caacagggag
     3241 taaaatttgg gaaaggttta agagcgcgaa taaaatattt tattacttga gagacaatga
     3301 tgaaaaatta gcattacaga tttttaccac tttcggattt attggaacat tacgagctta
     3361 ttcttctttt aagtggatct tgtatcttat taaggagata gatgtggaac aaattaaaaa
     3421 aataaaattt tccgcagtgt ggacatctag ttgtaatctt aaagcaaaaa tcctatcgac
     3481 attggtacta tgttcgatga tggtgataaa atgagtattg gtatattggt tcttgtattc
     3541 tatgttatcg taaatttcgt tatgggaatc gtctttttta atgatggttt cttaggaggc
     3601 gatttctacg gcgaaaaaat cgataataaa gatctgtttt tatgggtgtt aggtggggaa
     3661 ttattattat taattacatt ttacgctatt gcagtattaa ttgttaagtt cacttttaac
     3721 aaacgctatc ccgaagatta ctatactgta agtgagttgg ctttaaaaag gtttaatatt
     3781 ttcttaattg tacttcaaac aagttttatt ctgtttattt ttgcgactgg ttttggaaga
     3841 atttcactgc ttatggatga gaattcatct gcagcaaaca ttaattcacc aataaaatat
     3901 atttttgtaa ttctactacc tgattttcta ttcattgttt attttttagt acaaaaaaac
     3961 aacaaaaaga caattgttaa cttatccctt tatctgatta gtaatattgt aagaggatgg
     4021 gtgtctggac ctgtcctgct aatcatggct atttttttag taaagaaatt ttcatttaaa
     4081 aaaataaaaa taaaaactat tatctcttta gttacatgtt ttataatttt tgtacctttg
     4141 gtgacgtcat tgaaatttgg tgttagattt caaaatgatg aaataagcgc agtggatctc
     4201 gttcaagatt ctattgaaaa caatgttagc tattatctta gaactctaaa tagatttcag
     4261 catatatctg aagcgtatag ttttatggat tccatgacat ttattcgtaa agactatgct
     4321 gataacagaa tagcactccc attctttact aatgacttta tcaatattac ttcaaagatt
     4381 ttttcttttg agcctcaaaa tctattgacc tatggtagta aagttctgct tgatagacca
     4441 ttcggtaata tacaatctgg cattcttcct tggctctcta ttgattattt cttttcaatc
     4501 tcttatattt taacattttt tatatttaca attttgcttt cccgtttttg taaaatgcta
     4561 actcttggct atccggtttc aaaaaatata gttatttggt tcactatata ttactatgcg
     4621 catgggtggt tgttttcgta tatgaactta ctaatagcaa tgatgatttt tattattttt
     4681 tccaaggtct ttggaggtaa gattttaaat aaggataata attatgcata aattccaaac
     4741 attgttttgg tctgttattt ttaacatact atctcttctt ttttttcttt ttccattgaa
     4801 aagaaataga gttattttta attcagctga gaataagaat tttaattata actctagata
     4861 cctttttgag tttctaaaaa actataataa tgagtacgaa atatacttcg tcattaatga
     4921 tgctgactta agggcgaaat tatcaattga gcatggcgga aaatacttca taaccacgta
     4981 ttcattaaaa tcatgttttc taattatgcg ttcgaagttc tggatcattt caacatttga
     5041 aagtccctat gtttgttttg tccgccatca tagacgtata gtatttcatt tggggcatgg
     5101 gattccactt aaggctattg gacaattagc taagtttcca acaaaattga aacttaagct
     5161 gcaaaaaatt ttaagaattc gccccattac acacgcttta tgctactctg aagaatacaa
     5221 aacaaatatg agtgccattt ttaattcgga cttcatagaa tatgttcctt tggggcagcc
     5281 acgtaatgac tcgattgttc tcaaagattc agtagaaact ggcaagttaa taaaagaatc
     5341 cattctcaat gtacctagtt ttgataaagc catattgtac tctcctacat ggcgtccata
     5401 tgataaggca aggtttttcc catttgccga tttagaagcg aatgaattga atagtattct
     5461 aagtcaaaca aagacaatgc tatttttaag agggcatcct ttttttgaat ctttttgccc
     5521 agatagcttt gaaaatttat ccaatataca ttggcttaat aatgatgtca ttgatgacat
     5581 tacttcacat ttgccttttt ttgataagat tatcactgat tattcaagta tatttattga
     5641 ttatttatgt gttaataaac caattggttt tttgcaatac gattatcaac agtatgatga
     5701 tatggtcggg ttcgcaactg atgatagaga gattttttgt ggcgtaaaaa ttgaatcttc
     5761 cgatgatttc atttccttca taattgacca agatgattct tggatgccag agcgtttaaa
     5821 aatcgcacgg ttactgaata taaaaaatag tggtaatagc ttagaaaata agatgttcct
     5881 agatagttta cggaaaaaat aaaagagact tattaggttt tttcctttcg tgccaattaa
     5941 ataaattatc taaaacaaaa gctattcaca ataatatgtt ttaagataga attcttagtg
     6001 ttttctaatc tgcgcaaatg cgcggtgacc acacctgaca ggagtatgta atgtccaagc
     6061 aacagatcgg cgtcgtcggt atggcagtg
//