LOCUS       EU296410                7286 bp    DNA     linear   BCT 26-AUG-2008
DEFINITION  Escherichia coli serogroup O32 O-antigen gene cluster, complete
            sequence.
ACCESSION   EU296410
VERSION     EU296410.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 7286)
  AUTHORS   Liu,B., Knirel,Y.A., Feng,L., Perepelov,A.V., Senchenkova,S.N.,
            Wang,Q., Reeves,P.R. and Wang,L.
  TITLE     Structure and genetics of Shigella O antigens
  JOURNAL   FEMS Microbiol. Rev. 32 (4), 627-653 (2008)
   PUBMED   18422615
REFERENCE   2  (bases 1 to 7286)
  AUTHORS   Liu,B., Knirel,Y.A., Feng,L., Perepelov,A.V., Senchenkova,S.N.,
            Wang,Q., Reeves,P.R. and Wang,L.
  TITLE     Direct Submission
  JOURNAL   Submitted (24-NOV-2007) TEDA School of Biological Sciences and
            Biotechnology, Nankai University, 23# HongDa Street, Tianjin
            300457, P. R. China
FEATURES             Location/Qualifiers
     source          1..7286
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:562"
                     /note="serogroup: O32"
     misc_feature    359..7053
                     /note="O-antigen gene cluster"
     gene            359..1816
                     /gene="wzx"
     CDS             359..1816
                     /gene="wzx"
                     /note="O-antigen flippase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzx"
                     /protein_id="ACD37057.1"
                     /translation="MKKLSAFNNAKWVGLSQITKIFVQVVALVGFSRILQPGEYGIMA
                     MAAVISNFAIIFRDLGTGSAIIQKKKIDDGFLSSLFWMNMIVGGGIMIIIMIISPLVA
                     VFFHESQLTYVLILLSISFPLASLGIIHQSYLERNNKFSQVCFVEMISAIFALGIGIA
                     TALLGGGVYSLVIMTVIQTLISSVGFWFVSNWTPSFSFDKKDINDVLNFSGNLTLFNL
                     VNYFSRNSDNMIIGHYFSTSILGAYSLAYRIMLFPLQSLTSVASRSLYPVISRMKNNN
                     EGNVTDLYLRTLSFISIFTLPLMAGLWLLSDSFVSVVFGEKWILVSSILFWLAPTGFI
                     QSLVSTTGTIYMAYGKVGLLFKLGVFSSFLQIFAFIVGAQYNVIVLAKLYFISNLINF
                     FVAMYFTLKLLSGNLMQLLIKLLPTMFCTIVMLFVVAVIKCVLKHYNYNDITLLISGV
                     CSGSIIYLLLFIVFFRKMLINDLPSALSNKITRMR"
     gene            1820..3031
                     /gene="wzy"
     CDS             1820..3031
                     /gene="wzy"
                     /note="O-antigen polymerase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzy"
                     /protein_id="ACD37058.1"
                     /translation="MIYIMQSIMIFAFLTKIPLTSIIVVSASVISLILSSVSHDVISI
                     KKVRIKLCILILFLFILLIRILANLALFDNLSQSDLDYIITISLAMVIYITFLVRPNP
                     VALKYGILSAVIFTIVLALIEYILHVNTGSSRFEDPTNMFYLSDNRVPTAFYYNENDM
                     LYFIILFIPFVCQTIKNNILSKAIFISAFLLALIITSKAAIITMCIYFLWNIYNEPKG
                     KSIFIAYISLAFLFLIILLLSWNYLSSTGLAEKVLYRFSGLIDFLSGTGGDNSSNERF
                     EIYTSVFSFLANNIDMIFFGFGSFSYYESVFLREYSLRIADFHNMHLELLTLFGSFVY
                     VFILIFILRRYIELKSIYINGRRVFNFMIVSFCSIMSIISSSIVKYPSFYVFLLLLVF
                     ARKYMDKKNEF"
     gene            2970..3908
                     /gene="wfeA"
     CDS             2970..3908
                     /gene="wfeA"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WfeA"
                     /protein_id="ACD37059.1"
                     /translation="MCFFYYWFLLENIWIKKMNFKVSVIIPTYGRPDNLKRAIDSVIE
                     QTYKNIEIIVIDDNGINSKKGHETSTLVRHYPHIIYIKLEKNSGGGMARNKGIERASG
                     DYITFLDDDDYYYPEKIQKQLKFMIENSYDISLCDMEIANPLSKKFKHRKKYSEANGF
                     NLKDFLIAGVAFTPMIMVKKEVLLEVNGFLDTPRFQDHTLMLKMLTVTENVGHLAEQL
                     FVHCSDYTARISNSPRSRKGFLIRHALEKKIVIDNKLCLPKLRFNQCAQISPYVKEKF
                     GKYKYICFMLWSLKFSRSCHSVFLTGYRIMRLCLKK"
     gene            3893..4621
                     /gene="wfeB"
     CDS             3893..4621
                     /gene="wfeB"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WfeB"
                     /protein_id="ACD37060.1"
                     /translation="MFKKIMNFFRLTKLSLSTINLSITNSIPVKKYSLGAVYRIKNAE
                     STIELAIRSIIDILDEVVIVDNASSDNTKKIILKLKSEYGEKIKIFQYENELCRAGVG
                     YQECLKKNKDGSLADYYNFSFSKSTTDYILKCDANYIYTKAGKYSIVNALNSGYDVIC
                     FPGVEIFGHHHSYEPFLFKRDSKWIFIDDDMWESIKFNKKVLTHHIILPCFIHVKRLN
                     YIKFYGEAISGVEGLYAKCSKKNH"
     gene            4560..5144
                     /gene="wfeC"
     CDS             4560..5144
                     /gene="wfeC"
                     /codon_start=1
                     /transl_table=11
                     /product="WfeC"
                     /protein_id="ACD37061.1"
                     /translation="MEKLSVVLKAYMQNALKKIIKRIILALFFCRKENNIYFNKSSEP
                     HNCSREYIDNFVQGKLISTAPIRNINIINTEDDYLFDITLSSWAPIANSITLTGYDSF
                     DSVNKAYENIKKVIEIRRGGAQSSYQNISVPLGVVLIPKVYDDITSRDFDYIWGVSLD
                     GQVLQLMLKTGELKKSSIKLSREECFFIYMKEIK"
     gene            5141..5854
                     /gene="wfeD"
     CDS             5141..5854
                     /gene="wfeD"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WfeD"
                     /protein_id="ACD37062.1"
                     /translation="MIDNLIKRTPEINRLLENKRVTGVVTFVNPYSYYKIKEYNKISQ
                     LDYIYIDGILLLKLFNFVNGTKIKRHSFDYSSIAKTVFNYSIQNKMKIGLIGSKDYEI
                     EQAVKNIRKKHPGIDISYFHSGYFSSLEEKSSVIDSVIKKSDIIICGLGTPAQEELAL
                     DIKIKSNEHLIFTCGGFFTQTASRADFYYPWIKRYNLMWLQRIVLYKHVRKRFFIDYP
                     KFIVRFISENLMKIFTRSN"
     gene            5857..7053
                     /gene="wfeE"
     CDS             5857..7053
                     /gene="wfeE"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WfeE"
                     /protein_id="ACD37063.1"
                     /translation="MKVLYIVNQFPCLSETFVYNQIKGLSNLGHDVKVLAVYKGAKGE
                     EVGVNYRCCATEKLSRLEQLCLLLKSFSIAILKFDPIIIEFIRLLLSFNLSGLVSLSL
                     LRKQIYNYYDTECIIAHFGDCGYYAAMLKKFNIKSVKTIAIYHGYDVSVKKILEKWLP
                     SYKRSFEILDFLLPISELWKNKLLSLGALPEKIIVQHMGININDFNFTSRSLHNLEIK
                     YKTTRILSTGRFVEKKGFKYIVSAMQYLPECSLEIIGDGPLFTDIMRFIDDNNIKNVK
                     CVGALKHNDVKNKLQECDIFCLPSVTGGNGDMEGIPVVLMEAMACGKIVVSTRHSGIP
                     ELIEDGVTGFLCEEKNVEELVEKIKFINSLGTRKKNIAVEARKKVVNDFNNEIIYADL
                     DKIIKC"
ORIGIN      
        1 ataggttaca tgaaggcgtt tgttcaatat gggctacgca atctgaaaga aggtgctaag
       61 ttccgtagag ggattgaaaa attgttatct cattgaactc gaagcaaggt tagcgattct
      121 gtaatgtgaa agtatcactt aacgtttata ggatttaact catgattaat ctattcttat
      181 gattaggatg aataattaat gcctataaaa taacgttaag cttttataat ttgattgttc
      241 taattactca ctatgtgagt agctaaatta taaatattaa aattttataa tttactttat
      301 cagcaatcag gtagctgttg agcttggggc ggtagcgtgg ttattaaaaa ttaggggaat
      361 gaaaaaattg tctgcgttta ataatgcaaa atgggttggg ttatcacaga ttacaaaaat
      421 ttttgtccaa gttgtagctc tcgtgggttt tagcagaata ttacagcctg gagaatatgg
      481 gattatggca atggctgctg taatatcaaa ttttgctatt atattccgtg atcttggtac
      541 tggttctgca attatacaaa agaaaaagat tgatgatggt tttctttctt cccttttttg
      601 gatgaatatg atagttggcg gtgggattat gatcattatt atgattatct caccactcgt
      661 tgctgttttc tttcatgaga gccaattaac atatgtgttg atcttgttat cgatttcttt
      721 tccgttagca agtttaggaa taatacacca atcttattta gaaagaaata ataaattttc
      781 tcaagtttgt tttgttgaaa tgatttccgc tattttcgct ttaggtattg gtattgctac
      841 agcgttattg ggaggcggag tttatagttt agttattatg acggtaattc aaacattgat
      901 atcaagtgta ggtttttggt ttgtgtcaaa ttggactcct tcttttagtt ttgataaaaa
      961 agatataaac gatgttttaa attttagtgg aaatttgacc ctctttaatt tagttaatta
     1021 tttttcgcgc aatagtgaca atatgataat aggtcattat ttttcaacct ctatattagg
     1081 ggcatattca ttagcctata gaataatgct tttcccacta caaagtctca catctgtagc
     1141 atcacgctca ttatatccag tcataagtag aatgaaaaat aataatgaag gtaatgtgac
     1201 cgatttgtat ctgcgcactt tatcttttat ctctatattt actttgccat tgatggcagg
     1261 tctttggctc ctaagtgatt catttgtaag tgttgttttt ggagagaaat ggatattagt
     1321 atcttcaatt ctcttttggc ttgcaccaac cggttttatt caatcattgg tcagcactac
     1381 cggcacaata tatatggcat atgggaaagt tggtttatta tttaaattag gtgtgtttag
     1441 ttcattttta caaatatttg cttttatagt cggtgctcaa tataatgtaa tcgtattagc
     1501 aaaactatat tttatttcaa atttaataaa tttttttgtt gcaatgtatt ttactttaaa
     1561 actattatcg ggaaatttga tgcaactttt aataaaatta ctgccaacca tgttttgtac
     1621 aatagttatg ttatttgtgg tagcggttat taaatgtgta ttgaaacatt ataattataa
     1681 tgacatcacc ttacttattt caggtgtttg tagtggaagt attatatatt tattgttatt
     1741 tattgttttt tttagaaaga tgttgattaa tgatcttcct tctgcgttat caaataaaat
     1801 aacaaggatg cgttaattta tgatatatat tatgcaatct atcatgattt ttgcgtttct
     1861 gactaaaata ccgctaacca gcataattgt tgtaagtgca tctgtaatat cattaatcct
     1921 tagtagtgta tctcatgatg ttataagtat aaaaaaagta aggattaaac tctgcattct
     1981 tatactattt ttgtttatat tacttatacg tatacttgca aatctagctc tttttgataa
     2041 tttatcgcag tccgatttgg attatataat aactatttcg ttggcaatgg tgatttatat
     2101 aacattttta gttcgtccca accctgttgc tttaaaatat ggtatcctat cagcggtgat
     2161 ctttacaatt gtattggcgc ttatagagta cattttacat gttaatacag ggtcttctcg
     2221 gtttgaggat cctacaaata tgttctacct ctcagataat cgtgtgccga ctgcttttta
     2281 ttataatgaa aatgatatgt tatattttat cattcttttc attccctttg tatgccaaac
     2341 tataaaaaac aatatattgt cgaaagcaat tttcatatca gcttttcttt tagctttaat
     2401 cattacctca aaagcagcga ttataacaat gtgcatttat tttctatgga atatatataa
     2461 tgaacctaaa ggtaaaagta tatttatagc atatatttca cttgcatttt tatttttaat
     2521 tatactattg ctgagttgga attatctttc ctctactggt ctggctgaga aggtattata
     2581 tagattttca ggattaattg atttcttatc aggaacagga ggagataaca gttcaaatga
     2641 acgttttgaa atttatacat cagtgttttc ttttctggct aataatattg atatgatatt
     2701 ttttgggttt ggtagtttta gttattatga gagtgttttc ttaagagaat attctctaag
     2761 aattgctgat ttccataata tgcatttaga attacttact ttgtttggga gttttgtata
     2821 tgtattcatc ttgatattca tccttagaag atatatcgaa ttaaaaagta tttacattaa
     2881 tggaagaaga gtgtttaact ttatgattgt ttctttctgt tctattatgt ctataatttc
     2941 tagttctatt gtgaaatatc catcttttta tgtgtttctt ttattactgg tttttgctag
     3001 aaaatatatg gataaaaaaa atgaatttta aagttagtgt tattattccg acttacggaa
     3061 ggcctgataa tttaaaacgt gcgattgaca gtgtcatcga gcagacatat aaaaatatag
     3121 aaattatagt tatcgatgat aatggtatta atagtaaaaa aggacatgaa acatcaacgt
     3181 tggttagaca ttatccccat attatctata ttaagttaga aaaaaactca ggtgggggga
     3241 tggcaagaaa taaaggaatt gaacgagcat ctggggatta tattaccttt ttagatgatg
     3301 atgattatta ttatcctgaa aaaatacaaa agcaattgaa gttcatgatt gaaaatagct
     3361 atgatatttc tctatgtgat atggaaatag caaatccctt aagtaaaaaa tttaagcata
     3421 gaaaaaaata ctctgaagca aatggcttca atttaaagga ttttttaata gcaggtgtgg
     3481 catttactcc tatgattatg gtaaaaaagg aagtattact tgaggttaac ggctttttgg
     3541 atactccccg ttttcaagat catactttga tgctaaagat gttgactgtt acagaaaatg
     3601 ttggccattt ggctgagcaa ctatttgttc attgttctga ctataccgct agaatcagta
     3661 actccccaag atctaggaaa ggttttttaa ttaggcatgc ccttgaaaaa aaaatagtaa
     3721 tagacaataa actttgcttg cctaaattaa ggtttaatca gtgtgctcaa atttcccctt
     3781 atgtaaaaga aaaatttgga aaatacaagt atatttgctt tatgttatgg tctcttaaat
     3841 tctctcgaag ctgccatagc gtatttttaa ctggatatag gattatgaga ttatgtttaa
     3901 aaaaataatg aatttttttc gattgaccaa acttagtctt tcaacaataa accttagtat
     3961 aactaactct attccagtca aaaaatattc actaggtgca gtttatcgga ttaaaaatgc
     4021 cgaatcgaca attgaattgg ctataagatc cattattgat attttggatg aagtagttat
     4081 tgtagataat gcatcttctg ataatacaaa aaaaattata ttaaaattaa agagtgaata
     4141 tggagaaaaa ataaagatct ttcaatatga gaatgaattg tgtagagcgg gggtgggata
     4201 tcaggaatgt ttgaaaaaaa ataaagatgg tagtcttgca gattattaca atttttcttt
     4261 ttcaaaatca acaaccgatt atattttaaa gtgtgatgct aattatattt acacaaaagc
     4321 tgggaaatat tcgattgtta atgcattaaa cagtggctat gacgtaattt gttttcctgg
     4381 tgtagaaata tttgggcatc atcactccta tgaacctttt ttatttaagc gagattcaaa
     4441 gtggatattt atagatgacg acatgtggga aagtattaag tttaacaaga aggtgcttac
     4501 gcatcatata attttacctt gtttcattca tgtgaaaaga ttaaattata ttaaatttta
     4561 tggagaagct atcagtggtg ttgaaggctt atatgcaaaa tgctctaaaa aaaatcatta
     4621 aacgaattat tttagcgctt tttttttgta gaaaagaaaa taatatttat ttcaataaat
     4681 ccagtgaacc acataattgt tctcgagaat atattgataa ttttgttcaa ggaaaactaa
     4741 taagcacagc acctattcgt aacatcaata taataaatac tgaggatgat tatttattcg
     4801 acattacatt gtcttcatgg gctccaatag ctaatagtat taccttaact ggctatgact
     4861 ctttcgacag tgttaataaa gcttatgaga acataaaaaa agttattgag attagaagag
     4921 ggggggctca atcttcatat cagaatataa gtgtcccttt aggagttgta ttgataccta
     4981 aagtttatga tgatattacg tcacgcgatt ttgactatat ttggggtgtt tctcttgatg
     5041 gtcaagtgct gcaattaatg ttaaaaacag gcgagttaaa aaaaagtagc ataaaactct
     5101 ccagagaaga atgttttttt atttatatga aggaaattaa gtgatcgata atctcataaa
     5161 aagaacccct gaaattaata ggttgttaga aaataaaaga gttacagggg ttgttacatt
     5221 tgttaatcct tactcatatt ataaaataaa ggaatataat aagatatcac aactcgatta
     5281 catatatata gatggcattc tattattgaa gctatttaat ttcgttaatg ggacgaaaat
     5341 taaacggcat agttttgatt atagttcgat agctaaaact gtttttaatt attctataca
     5401 aaataaaatg aaaataggat taatcggttc taaggattat gaaatagagc aagctgtaaa
     5461 gaatattaga aaaaaacatc cgggaattga tatatcttat tttcattccg gatatttttc
     5521 ctcattagag gaaaaaagct ctgttataga ttctgttatt aaaaaaagtg atattataat
     5581 ttgtggttta ggaacccctg cgcaggaaga attggcgctt gatataaaaa taaaatctaa
     5641 tgaacattta atttttacat gtggtggttt tttcacacag acggcttcga gagcagactt
     5701 ctactaccca tggattaaga gatataatct tatgtggctg caacggattg ttttatataa
     5761 acatgttagg aaaagatttt ttatcgatta cccgaagttt atagttagat ttatatctga
     5821 aaatttaatg aaaatattca cgagaagtaa ttgataatga aggttttata tattgttaat
     5881 cagttccctt gtctttcgga aacatttgtt tacaatcaaa ttaagggatt aagtaattta
     5941 ggtcatgatg ttaaggtgct agccgtttat aaaggtgcta agggagagga agttggtgtc
     6001 aattataggt gttgtgcaac tgagaaatta tctagacttg agcaactatg tttgctctta
     6061 aaatcattct caattgccat tttaaaattt gatccaataa ttattgagtt tattcgccta
     6121 ttgttgagct tcaatttgtc aggactagtt agcctttctt tattaagaaa gcagatttat
     6181 aattactatg atactgaatg cataattgcc catttcggtg attgtggata ttatgcagca
     6241 atgctcaaaa aattcaacat taaaagtgtg aagacaatag ctatatatca tgggtatgat
     6301 gtaagtgtga aaaaaattct tgaaaaatgg cttccctcat ataagagaag ttttgagatt
     6361 ttagatttct tattgccaat tagtgaacta tggaaaaata aattactttc cctcggagca
     6421 ttaccagaaa aaataattgt gcaacatatg gggataaata ttaatgattt caactttact
     6481 tcaaggtcat tgcataattt agaaataaaa tataaaacaa ctaggatact gtctacggga
     6541 cgttttgttg aaaaaaaagg atttaaatat attgtttctg ctatgcaata tcttcctgag
     6601 tgttcgttgg agattattgg agatggccct ttatttactg atataatgcg atttattgat
     6661 gataataata taaaaaacgt aaaatgtgtt ggtgccttga agcataatga cgtcaaaaat
     6721 aaattacagg agtgtgatat tttttgtcta ccatcagtaa ctggcggtaa tggagatatg
     6781 gaaggtatac cagttgtatt aatggaggca atggcctgtg gtaaaatagt tgtatccaca
     6841 aggcatagtg gaatccctga attgatagag gatggcgtaa caggatttct ctgtgaagaa
     6901 aaaaatgttg aagaactcgt tgaaaaaatc aagtttatta actcgctggg aacgcgtaag
     6961 aaaaatattg ctgttgaggc gagaaaaaaa gtagttaatg atttcaataa cgagataatc
     7021 tatgctgatt tagataaaat aattaagtgc taatgtaata gttattttag acaattttat
     7081 tgaacgaatt gcatagaaaa ctatcttctc ttagtctttt gactgagtca tttttcagaa
     7141 acaatcaagc cgcaaataac tcgcggtaac ccctgacagg agtaaacaat gtcaaagcaa
     7201 cagatcggcg tcgtcggtat ggcagtgatg ggacgcaacc ttgcgctcaa tatcgaaagc
     7261 cgtggttata ccgtctctat tttcaa
//