LOCUS       EU694098                8041 bp    DNA     linear   BCT 22-SEP-2008
DEFINITION  Escherichia coli serogroup O21 O antigen gene cluster, complete
            sequence.
ACCESSION   EU694098
VERSION     EU694098.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 8041)
  AUTHORS   Ren,Y., Liu,B., Cheng,J., Liu,F., Feng,L. and Wang,L.
  TITLE     Characterization of Escherichia coli O3 and O21 O antigen gene
            clusters and development of serogroup-specific PCR assays
  JOURNAL   J. Microbiol. Methods 75 (2), 329-334 (2008)
   PUBMED   18700154
REFERENCE   2  (bases 1 to 8041)
  AUTHORS   Ren,Y., Liu,B., Cheng,J., Liu,F., Feng,L. and Wang,L.
  TITLE     Direct Submission
  JOURNAL   Submitted (04-MAY-2008) TEDA School of Biological Sciences and
            Biotechnology, Nankai University, 23 Hongda Street, Tianjin 300457,
            P. R. China
FEATURES             Location/Qualifiers
     source          1..8041
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:562"
                     /note="serogroup: O21"
     misc_feature    1..8041
                     /note="contains O antigen gene cluster; also contains galF
                     and gnd"
     gene            1082..2317
                     /gene="wzx"
     CDS             1082..2317
                     /gene="wzx"
                     /note="O unit flippase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzx"
                     /protein_id="ACH97158.1"
                     /translation="MFTIKTVFVLRIFGAILALSTSVMISRTLNMSEAGGVFFLLSVT
                     GIISSLSSLGQNNLILKKCASVKYALKARGVFFLRCIKRSVISSIILSIILIPVIHYF
                     SPQLLLRNTWCLAILLIISSSVNILLYSFLQSQGLVTFSVVLQYIFQPLLFIFFVLLI
                     VLIKNESVLLVSLSYFFSIILIGGGGGVYSYYKFRDDFNQLETESIPFRLKELSEYFI
                     GNSLGMLIVQSYVVLSGLLLPAADVAIIAVSDRISLVINLFAMSISTILAPKVASLYS
                     QSKMNEIKELTKKAMFFIMIPCVLMALLFPFFSGLILSIFGVQYSNASEVLIILVMTQ
                     IINAIFCPVYVFLNMSDRQGFISKLHIYMLIPSLVITFYLTNIFGVVGIAVSKLIVVS
                     LINIIPLIYCILLSNRVIK"
     gene            2317..3108
                     /gene="wclN"
     CDS             2317..3108
                     /gene="wclN"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WclN"
                     /protein_id="ACH97159.1"
                     /translation="MSLYSILKKLILSFHYYLFTISFLSAKNDKKYSNRLDFDDYVAA
                     KLRKQNEYKRKIPSVSVIYRVKNGSEYIEASILSISGLASQIIVVDNNSTDNTRDIVE
                     RLSNQLADVCSIQLYSYDKNLAIAGEGYKDQVTKGDGSLAEFYNFSFSLGDCDYLMKV
                     DAHYIFSAYGVDILQKQIAKNYDGVVFRGLEFFGKWMSNELFLYKRSLGLKYCDGELY
                     EQLMWDKSTVRVKTIIKPLYLHVKRLSYVKNLYNTKKAIYVKYNK"
     gene            3117..3926
                     /gene="wclO"
     CDS             3117..3926
                     /gene="wclO"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WclO"
                     /protein_id="ACH97160.1"
                     /translation="MNNKRISIIIPTYNSSIILEENIKIISSYKQCKIFVIDDGSVSD
                     EARKNKIICNNYGCNYTYTLNQGPSHARYVGLLDSDTEFCFFLDTDDYIAEFALDWGV
                     NYLLENNEVDAIVFRSDYVEEFNCKNETGNIFTIKKYNRGLIQECIECLGYPKQFTLG
                     WNQSNTLYRRNKIIDAYKIRYLTWGEDIPLKLKLISVMSLISVRTLGGSQIKISYGRG
                     YKYTPKQIVELALEVYRTSLNNAFCLAFITVIRYMLSYFYKRLKQLSSKRK"
     gene            3929..4609
                     /gene="wclP"
     CDS             3929..4609
                     /gene="wclP"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WclP"
                     /protein_id="ACH97161.1"
                     /translation="MKRKLVDFCIISLPQHNERRDKLKNEMAKYDIECRVSHAIDGRK
                     LLAEKYFSLFKIRSSKMFGRGFLTPSELGCFLSHKKALTEFLASGRKWLVVLEDDVLP
                     KENVKYLDEMINSFCSSSVYILGGQDGLKSFSRVIMGRKSICGVRKVILGTHRWLYRT
                     CCYCVDIKGAERILRLMEENSFFCDDWSYIVRNAKLDNVFYGQYFSHPVNLNSSSIEA
                     ERLFIAEK"
     gene            4606..5688
                     /gene="wzy"
     CDS             4606..5688
                     /gene="wzy"
                     /note="O antigen polymerase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzy"
                     /protein_id="ACH97162.1"
                     /translation="MIYIIINTIVLFYMFLFNAYNRIPYGKLIIGGICVFFMTLLPAF
                     QYGVGTDYFSYQNIYNNANELDTFYQNKEYLFYGYMRLYQLTGWGFKGFIALTALLQS
                     LLVFVIVFQLWKNYGYSLVLVFFLFWVVTNLFHTQMNIIRASFSIYLFAISILYKFRG
                     KLLLSFILMVAALGFHRSALIGFCFLVIPDKMYFFACKHAFKIYVLTFLLFLFSYLQQ
                     IIYYIVQNLFPYYSHYLSSFDESSVSIMNVLTKMYWIPFNLLFLILLRLKVFVIKDNE
                     RKLIGMWALTVNVYLLMLSFDFISRVNYYFVIFYIIPIIYVIKYTVKNRYFVCLYLSL
                     LYCFIPYLLKVILFPIAEFYYKSYLF"
     gene            5698..6453
                     /gene="wclQ"
     CDS             5698..6453
                     /gene="wclQ"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WclQ"
                     /protein_id="ACH97163.1"
                     /translation="MMGLFMGNETVSIIMPAYNAEETIKDSILSILKQTYEDFKLYII
                     NDNSSDSTEHIIKSIIDERIVYLLNRNGKGVSSARNVGIAACNGRYIAFCDSDDVWFE
                     TKLEEQLKILSAGNYKVVCSNYEVFYADTNVIKERRFKEVITYNNMLQSNHIGNLTGI
                     YDSTQIGKVYQQEIGHEDYLMWLTIVKKAKLVYCIQKNLARYYIHNTGLSSNKFTAAM
                     WQWNIYRRVLSFSLFKSLVLFFIYSVRALAKRL"
ORIGIN      
        1 attgtggctg cagggatcaa agaaatcctc ttggtaactc acgcgtccaa gaacgcggtc
       61 gaaaaccact tcgacacctc ttatgaatta gaatctcttc ttgaacagcg cgtgaagcgt
      121 caactactgg cggaagttca atccatctgc ccgccgggtg tgaccattat gaacgtgcgt
      181 cagggcgaac ctttaggtct gggccactcc attttgtgtg cgcgaccggt cattggtgac
      241 aacccatttg tcgtggtatt gccggacgtt gttatcgatg acgccagcgc cgacccgctg
      301 cgctacaatc ttgccgctat gattgcgcgc ttcaatgaaa cgggacgcag ccaggtgctg
      361 gcaaaacgta tgccgggcga tctctctgaa tactccgtca ttcagaccaa agaaccgctg
      421 gatcgcgaag gtaaagtcag ccgcattgtt gaatttatcg aaaaaccgga tcagccgcag
      481 acgctggact cagatatcat ggccgtaggt cgttatgtgc tttctgccga tatttggccg
      541 gaactggaac gtactcagcc tggtgcatgg ggacgtattc aactgactga tgccattgcc
      601 gaactggcga aaaaacatgc tgtggatgca atgctgatga ctggcgacag ttacgactgc
      661 ggcaaaaaaa tgggctatat gcaggcgttt gtgaagtatg gtttgagaaa cattatgcta
      721 ggcacaaaat tccgtggtaa aatagaagaa ataattataa atgattttta atgaagataa
      781 aaggcgggag aaaatagtaa tatgaaagtc gtcaaccgat tatctaagct aatgtttaaa
      841 atatcagatg atgtttagat cttttatggt gattttttgc ttcatgtgat ttagaaaacg
      901 gtctcttgtt ttattatcaa tgaatttatt aagattgcca tgttataagt ttgtgttagt
      961 gaactggtag ctgttaagcc aggggcggta gcgttgtttt ttgcgtcttg cggggtagta
     1021 tctataccct cccccctatt atttgttgca aagaggtctt tgggtaaata acgagaagtt
     1081 aatgtttaca attaaaactg tatttgtgtt gaggatattc ggcgctatac ttgcgctgtc
     1141 aacgagtgtg atgatatcaa gaacgctcaa tatgagtgag gctggtgggg ttttcttcct
     1201 attatcagta actggaataa tatcgtccct atcctcttta ggacaaaata atttaatttt
     1261 gaaaaaatgt gcctcagtta aatatgcatt aaaagcacga ggcgtttttt ttcttagatg
     1321 cataaaacgg agtgttatat ccagtattat cttatctatc attttaatac ctgtaattca
     1381 ttatttttcg ccacaattat tattacgaaa tacatggtgt ttggcgattc tgttgataat
     1441 atcatcgtca gtaaatatat tgttatattc ctttttacag tctcaaggtc ttgtcacttt
     1501 tagtgttgtt ctgcagtata tatttcaacc cttattgttt attttttttg tattacttat
     1561 tgttctgatt aaaaatgaaa gtgttttact ggtgtcttta tcatacttct tctcaattat
     1621 tcttattgga ggaggggggg gggtatactc gtattataaa tttagggacg atttcaatca
     1681 gttagaaaca gagtcaatac cgtttagact gaaagaatta tcagagtatt tcattggtaa
     1741 ctcattagga atgctgattg ttcaatctta tgttgtactt tccggtttgt tgctcccagc
     1801 tgctgatgtc gctattattg ctgtgtctga tagaatatcc ttggttataa atttatttgc
     1861 aatgtcaatt agcacaattc tggcacctaa ggtcgccagt ttatacagcc aaagtaaaat
     1921 gaatgaaata aaagagctaa ctaaaaaagc tatgttcttc ataatgatac catgtgtttt
     1981 aatggctctt ctgtttccct ttttttcagg gctgatatta tctatatttg gtgttcaata
     2041 cagtaatgct agcgaagtgt taattatttt agttatgacg cagattatta atgcaatatt
     2101 ttgccctgta tatgtttttt taaatatgag tgatcggcaa ggttttataa gtaaattgca
     2161 tatatatatg cttataccgt ctcttgttat aacattttat ctgactaaca tatttggtgt
     2221 tgttggaata gctgtgtcta agttaattgt cgtgtcattg attaatataa tcccattgat
     2281 ttactgtatt ttattgtcta atcgagtgat aaagtgatga gtttatattc tattttaaaa
     2341 aagttaattt tatcttttca ttactatctt tttactattt cctttttatc tgcgaaaaac
     2401 gataagaagt actccaatcg gttagatttt gatgattatg ttgcagctaa gctaagaaaa
     2461 cagaatgaat ataagaggaa aataccaagt gtctctgtta tatatagagt caaaaacgga
     2521 tctgaatata tagaggcatc tatattgtct atttcggggt tagcatcaca aataattgtt
     2581 gtagataata attctacaga taatacaaga gatattgtag aaagattatc gaatcaatta
     2641 gctgatgttt gctctataca actttactct tatgataaaa atctcgctat tgctggagaa
     2701 gggtataaag atcaggtgac aaagggagat ggttcactgg ccgaatttta taattttagt
     2761 ttttctttag gtgattgtga ttatttaatg aaagtcgatg cccattatat tttttcggca
     2821 tacggtgttg atattttgca aaagcagata gcaaaaaatt atgatggtgt cgtttttcga
     2881 gggttagagt tttttgggaa gtggatgagc aatgagctgt ttttatataa acgttcactg
     2941 ggtctgaaat attgtgatgg cgaattatat gaacagttaa tgtgggataa atcaaccgtc
     3001 agggtaaaaa ctatcattaa acccctttac ttgcatgtta aacggttatc ctatgttaaa
     3061 aacctttata acacaaagaa agccatatac gtaaaataca ataaataggc aatagaatga
     3121 ataataaaag aatatcaata ataataccaa cttataattc gagcataata ttagaggaaa
     3181 atattaaaat aatcagtagc tataagcagt gtaagatttt tgtaattgat gatggttcag
     3241 tttctgatga agcgcgcaaa aataaaatta tttgtaataa ttacgggtgt aattacacct
     3301 atactcttaa tcaaggccct tctcacgcaa gatatgtagg cttattggat tcagatacag
     3361 aattttgttt ttttcttgat actgatgatt atattgctga atttgctctt gattggggtg
     3421 ttaattattt attagaaaat aatgaggttg atgccatcgt ctttagaagt gattatgtgg
     3481 aagagtttaa ttgtaaaaac gagacaggta atattttcac aataaaaaaa tataacagag
     3541 gattaataca agaatgtata gagtgtttag ggtatccaaa gcaatttact cttggttgga
     3601 atcaatctaa tacgttgtat cgtagaaata aaatcattga tgcttataaa ataagatatt
     3661 tgacttgggg ggaagatata ccattaaaac taaaactaat ttctgttatg tcgctaattt
     3721 ctgtgagaac tctgggaggg tctcaaatta aaatatccta tggacgggga tataaatata
     3781 caccaaaaca aatagttgag cttgctctgg aggtttacag aacgtcccta aataatgcat
     3841 tttgtcttgc attcataaca gttataagat atatgctttc atatttttat aaaagattaa
     3901 aacaactgtc cagtaaaagg aagtgagaat gaaaagaaaa cttgttgact tttgtataat
     3961 atcattacct caacataatg aaaggagaga taaattaaaa aatgaaatgg cgaagtatga
     4021 catagaatgt cgtgtttctc atgctattga tggacggaaa ttattggcag aaaaatactt
     4081 ttctttattt aaaattaggt cctcaaagat gtttggaaga ggttttttaa ctccgtcgga
     4141 attgggatgt ttcttgagtc ataaaaaagc tttaacggaa tttttggcga gtggaaggaa
     4201 atggttggtg gttttggaag atgacgtttt gcccaaggaa aatgttaaat atttggacga
     4261 aatgattaat tcattctgct catcaagtgt ctatattttg ggtggacagg atggtctaaa
     4321 aagctttagt cgtgtcataa tggggagaaa atcaatatgt ggggtgcgaa aagtaatatt
     4381 aggtacacat cgttggttat ataggacatg ctgttattgt gtggatatta aaggcgctga
     4441 gagaattctg aggttaatgg aagaaaatag tttcttttgt gatgactgga gttacattgt
     4501 aagaaatgcg aaactggata atgtatttta tggtcaatac ttttctcatc ctgtaaattt
     4561 aaactctagt tctatcgaag ctgaacgtct ttttattgca gaaaaatgat atatattata
     4621 attaatacta ttgtgctttt ttatatgttt ttgtttaatg catataatcg tattccttat
     4681 gggaaattaa ttatcggggg catatgcgtt ttttttatga ctctgttgcc agcatttcaa
     4741 tacggtgttg gaacagatta ttttagctat caaaatatat ataataatgc taatgaactc
     4801 gatacctttt atcaaaataa ggaatatctc ttttatggat atatgaggct atatcaactg
     4861 actggatggg gattcaaagg ttttattgcg ttaactgctt tattacaatc tttattggtg
     4921 tttgttattg tttttcagtt atggaaaaac tatggttatt ctcttgtttt ggtttttttt
     4981 cttttttggg ttgttactaa tttatttcat acccagatga atataataag agcatcattt
     5041 tcaatttatt tgtttgcaat atcaattctc tataagttta gagggaaatt attgttatct
     5101 ttcatattaa tggttgctgc tttaggtttt catcgctctg ctttgattgg tttctgtttt
     5161 ctcgtaattc cagataagat gtattttttt gcgtgtaaac atgcttttaa aatttatgtg
     5221 ttgacttttt tattgtttct tttctcttat cttcagcaaa ttatttatta tatagtgcaa
     5281 aatttattcc cctattactc acattattta tcctcattcg atgaaagttc tgtgagtata
     5341 atgaatgtac taactaaaat gtattggatt ccatttaatt tgctattcct tatcttatta
     5401 agactaaagg tttttgttat aaaagataat gagcgaaagt taattggtat gtgggcttta
     5461 acggtgaatg tttatttgtt aatgctcagt tttgatttta tttcaagggt taactactat
     5521 tttgtgatat tttatataat cccgataatt tatgttatta aatacactgt taagaataga
     5581 tacttcgttt gtttgtatct ctcattatta tactgtttta ttccgtatct attaaaggtt
     5641 attctgtttc ctatcgcaga attttattat aaatcatact tgttctaatt ttgaataatg
     5701 atggggcttt ttatgggtaa tgaaacagta tcaataatta tgccagctta taatgctgaa
     5761 gaaactatta aagatagtat tttgtcaatt ttaaaacaaa cgtatgagga ttttaaatta
     5821 tatataatca atgataattc gtcggattca acagaacata ttattaagtc tattatcgat
     5881 gaacgtattg tttatttact aaatcgaaat ggtaagggag tatcttcggc tagaaatgtt
     5941 gggattgctg cttgtaatgg tagatatatt gcattttgtg atagtgatga tgtttggttt
     6001 gagactaaac tcgaagaaca actgaaaata ttgagtgctg gaaattataa agttgtttgt
     6061 tcaaactatg aggtttttta tgctgataca aatgtaataa aagaaagaag gtttaaggaa
     6121 gttattacat ataataatat gctgcaatct aatcatattg gtaacttaac tggtatttat
     6181 gactcaactc agatagggaa agtatatcaa caggaaattg gtcatgaaga ttacctaatg
     6241 tggttaacaa tagtaaaaaa agcaaagctg gtttattgca tacagaaaaa tcttgccaga
     6301 tattatatac ataatacggg gttgtcctca aataagttca ctgcagctat gtggcaatgg
     6361 aatatttata gaagagtatt gtctttttca ttattcaagt cattagttct tttttttatt
     6421 tattcagtaa gagctcttgc taagagactt taattagaat ggttttatta ggttttgata
     6481 ttataaaatg tatgtctttt agatctgata gtcgatgtat ccaaaaggtt tagtttttgg
     6541 gacatagaga gataagcctt tcctaaatat attagaagta aacccgttac tcatattcag
     6601 ccgcttattt gcagcggtga gcacctcaga caggagtaaa caatgtcaaa gcaacagatt
     6661 ggcgtcgtcg gtatggcagt gatggggcgc aaccttgcgc tcaacatcga aagccgtggt
     6721 tataccgtct ctattttcaa ccgttcccgt gaaaagacgg aagaagttat tgccgaaaat
     6781 ccaggcaaga aactggttcc ttactatacg gtgaaagagt ttgttgaatc tctggaaacg
     6841 cctcgtcgca tcctgttaat ggtgaaagca ggtgcaggca cggatgctgc tattgattcc
     6901 ctcaagccat acctcgataa aggtgacatc atcattgatg gtggtaacac cttcttccag
     6961 gacaccattc gtcgtaaccg tgagctttct gcagaaggct ttaactttat cggtaccggt
     7021 gtttccggtg gtgaagaagg tgcgctgaaa ggtccttcca ttatgcctgg cggacagaaa
     7081 gaagcctata aactggttgc accgatcctg accaaaatcg ccgcagtggc tgaagacggg
     7141 gagccatgcg ttacctatat tggtgccgat ggcgcaggtc actatgttaa gatggttcac
     7201 aacggtattg aatacggtga tatgcagctg attgctgaag cctattctct gcttaaaggc
     7261 ggcctgaatc tctctaacga agaactggca cagaccttta ccgagtggaa taacggtgaa
     7321 ctgagcagct acctgatcga catcaccaaa gacatcttca ctaaaaaaga tgaagacggt
     7381 aactacctgg ttgatgtgat cctggatgaa gcggctaaca aaggtaccgg taaatggacc
     7441 agccagagcg cgctggatct cggagaaccg ctgtcgctga ttaccgagtc tgtgtttgca
     7501 cgttatatct cttctctgaa agatcagcgc gttgccgcat ctaaagttct ctctggtccg
     7561 caagcgcagc cagctagcga caaggctgag ttcatcgaaa aagttcgtcg tgcgctgtat
     7621 ctgggcaaaa tcgtttctta cgctcagggc ttctctcagc tgcgtgctgc gtctgaagag
     7681 tacaactggg atctgaacta cggcgaaatc gcgaagattt tccgtgctgg ctgcatcatc
     7741 cgtgcgcagt tcctgcagaa aatcaccgat gcatatgccg aaaatccgca gatcgctaac
     7801 ctgctgctgg ccccgtactt caagcaaatt gccgatgact accagcaggc gctgcgcgat
     7861 gtcgtcgctt atgcggtaca gaacggtatc ccggttccga ccttcgccgc tgcggttgcc
     7921 tattacgata gctaccgtgc cgctgttctg cctgcgaact taatccaggc acagcgcgac
     7981 atcagcagct gggagcaaca aaccggaaag tacaacataa gattgaacaa tcagcattcc
     8041 t
//