LOCUS       DQ008592                5660 bp    DNA     linear   BCT 07-OCT-2005
DEFINITION  Escherichia coli serogroup O174 O antigen gene cluster, partial
            sequence.
ACCESSION   DQ008592
VERSION     DQ008592.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 5660)
  AUTHORS   Beutin,L., Kong,Q., Feng,L., Wang,Q., Krause,G., Leomil,L., Jin,Q.
            and Wang,L.
  TITLE     Development of PCR assays targeting the genes involved in synthesis
            and assembly of the new Escherichia coli O 174 and O 177 O antigens
  JOURNAL   J. Clin. Microbiol. 43 (10), 5143-5149 (2005)
   PUBMED   16207976
REFERENCE   2  (bases 1 to 5660)
  AUTHORS   Beutin,L., Kong,Q., Feng,L., Wang,Q., Krause,G., Leomil,L., Jin,Q.
            and Wang,L.
  TITLE     Direct Submission
  JOURNAL   Submitted (14-APR-2005) TEDA School of Biological Sciences and
            Biotechnology, Nankai University, 23# HongDa Street, Tianjin
            300457, P.R. China
FEATURES             Location/Qualifiers
     source          1..5660
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:562"
                     /note="serogroup: O174"
     misc_feature    <1..>5660
                     /note="O antigen gene cluster"
     gene            51..794
                     /gene="wbcX"
     CDS             51..794
                     /gene="wbcX"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WbcX"
                     /protein_id="AAY28247.1"
                     /translation="MSTVTLVITSCGRFELLEKTISSLVNRYPFTEKIIIEDSGNVKV
                     INKIKEKYDRDFTILINEKNIGQIKSIDKAYSLVTTEYIFHCEDDWHFYRDGFIEDSL
                     DILKEYRHISMVSLRDWLNDVSINCHMERSTLLQTGNGTRFFMLKPKNGDGWGGYSFN
                     PGLRRLQDYKEIIGQFSKVGHEKNISLYFLEKGMNMALLESSAVEHIGWNHHILSKNN
                     PQERFYLLKKYLPKEVTNVLKIIYRKIAG"
     gene            797..2068
                     /gene="wzx"
     CDS             797..2068
                     /gene="wzx"
                     /note="O unit flippase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzx"
                     /protein_id="AAY28248.1"
                     /translation="MKYLFIWSLTPKLYELSLNLSIGIALINYLGPVEQGKIGFLINL
                     CTLMSFLTTLGIGPVYSNFVSRSNNERLISNKFKENVTLRFLGYILFLLVSLLFLFFF
                     KRGLIYLSIPFLIGKLFFSFDIYYNLIEGKAGFKNYAISKFISLTCINVFRLYCIYAQ
                     LDIYWVAFSFFLTDFLTFFVYFLLFDKFKYFGFKFDYKKSLIIFKINYKLALSTIVVS
                     LFTQLDIVMIGTMLGDKAAGEYYASTRLATPLVFISTIIISTFFSKLSRNWVVNKKEY
                     YELLAFISGSIIFSYSAIVLIIFIFGNDIFFLFFSSEYKASYDLFLIHIVGLIFVLLG
                     PLTGKHLIIKKDYGAELSKTLLAAIVNIALTSIAVLKYENLNLVAVSTLISYMIANFG
                     YFIVKKDWLLIKAILNGVNPLFLVRYAKKIL"
     gene            2049..3188
                     /gene="wzy"
     CDS             2049..3188
                     /gene="wzy"
                     /note="O unit polymerase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzy"
                     /protein_id="AAY28249.1"
                     /translation="MLKRYSNLIFSFVIAFSFFSYVMNPSLKFIYKSPVINFIPFLLC
                     CLITIIFLTEKKIKLNYYELFSILYVGFFFILQYTYFIQSTDSIETLLRLMSVNFSFL
                     FGLLLGWCFKRESIEKLFILWVLLLSIANICGVINYSDGVEFNHLNFTLPLGTVVTWL
                     IFKAFMKDTDRYIFTLSVILFLFFNIIFAGSRTAIFLPILVSLFIMVIFRKYVSIKKT
                     VISFIILITITIISLPYILSNLNAYFLSKVQNMADISEDSRYNLYLKCFNMLLEHPLG
                     IGYGNYKYFITEPYPHNILLEIGLNSGVLGCFVFITYVMITTIVIIKKTKSCYNEKNL
                     FVLTIFLYSLFSWMFSNDFASSSVVFFLLGVLGHIASSNNEKEIK"
     gene            3191..4075
                     /gene="wbcY"
     CDS             3191..4075
                     /gene="wbcY"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WbcY"
                     /protein_id="AAY28250.1"
                     /translation="MFSIVITTKDRAYYLKRAVDSILKSTISPKDIVIINDGGKAICE
                     NDFPPMKHITLSIVNNRFSMGANYSRNQGIDKALTNYVFLLDDDDAFTPTTFENRINI
                     IKSSVDIGVVFTGINIVSSKNLDKVIRKSKNINDQITTHQLLTEGNVIGSTSRALIRK
                     DLFCEAGRFDPQLSCLQDYDLWIRMSLVSRIVNDHKYGVYYTIHDNGRQISTNYEKYM
                     QVGKLLINKYDSLLNKNTINAFKSNIYLRVAISASASSNKARLKYSFMSLKYRLNIKA
                     LALFLFPSSVLKRFYNYV"
     gene            4661..5482
                     /gene="wbcZ"
     CDS             4661..5482
                     /gene="wbcZ"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WbcZ"
                     /protein_id="AAY28251.1"
                     /translation="MKGFSVLMSVYKGEKENYLDECFKSLHEQTIKANEIILVIDGPV
                     SKELYQVIDKWGEVLPIIKVKLDKNVGLGQALNIGLKHCNFELVARMDTDDYCVKDRF
                     LLQMKFFEEHNDIMVLGGEIEEYDQSLSIPLGKRTTALSHEEIIELAKKRNPLNHMTV
                     MYKKSFILSVGGYQHHLYMEDYNLWLRVLASGGCICNLPKVLVHVRAGEEMIKRRKGW
                     IYIKSEIQLARLKSKLNITCFWNNYYTMTLRILARLMPTPLLKFVYSKLRTSKLA"
ORIGIN      
        1 attggtagct gtaagccaag ggcggtagcg taaacatttg agaggaatta atgagtacag
       61 ttacactcgt tataactagt tgcggtagat ttgaattatt agaaaaaaca atatcttctc
      121 ttgtaaatag gtacccattt acagagaaga tcataattga ggattctggt aatgtaaaag
      181 ttataaacaa aataaaagaa aaatatgata gggattttac aatcttaata aatgaaaaaa
      241 acattggaca aattaaaagc atcgataagg catatagttt agtcactacc gaatatatat
      301 tccattgtga agatgattgg catttctata gagacggatt catagaagat tcattagata
      361 tattgaaaga gtatagacac atttcaatgg tatcacttag agattggcta aatgatgtat
      421 cgatcaattg tcatatggaa agatccacgc tcttacaaac gggaaatgga acaagatttt
      481 tcatgttaaa acccaaaaat ggtgatggct ggggagggta ttcgttcaac ccggggctga
      541 gacgacttca agattataaa gaaataatcg gacaattttc aaaagtaggg catgaaaaaa
      601 atataagttt atatttttta gaaaaaggaa tgaatatggc gctattagaa tcttcagctg
      661 ttgagcacat aggttggaat caccatatat tgagtaaaaa taatcctcaa gaaagatttt
      721 atttgcttaa aaaatattta ccaaaggaag taactaatgt gctcaagata atttatagaa
      781 aaattgctgg gtgattatga aatatctttt tatttggtct cttactccca aattatatga
      841 attaagcctt aatctttcta tcgggatagc tcttataaat tatctaggac ctgtagaaca
      901 aggtaaaata ggttttttaa ttaatttatg cacattaatg agttttctta ccacgcttgg
      961 aattgggcct gtatattcta attttgttag tcgttcaaat aatgaaagat taatatccaa
     1021 taaatttaag gagaatgtta cattaaggtt tttaggttat attttgtttc ttctggtttc
     1081 acttttattt ctattcttct ttaaaagggg gttgatatat ttatcaatac catttttaat
     1141 agggaaatta tttttcagtt ttgatatata ttataacctc attgaaggta aggctggatt
     1201 taaaaattat gcaatttcaa aatttatatc tttgacatgt ataaatgtat ttcggttata
     1261 ttgtatatat gcacaattag atatatattg ggttgcgttt tcattctttt tgactgattt
     1321 cttgacattt tttgtgtatt ttttgttatt tgacaaattt aagtatttcg gttttaaatt
     1381 tgattacaaa aaatcattaa ttatatttaa gataaactat aagttagcat tatctacaat
     1441 agttgtaagt ctctttactc agctggatat agtaatgatc ggaactatgc ttggagataa
     1501 agctgcaggt gagtattatg catcaactag actcgctact cctttagttt ttatatcaac
     1561 aattattata agcacttttt tttcaaaact ttctagaaac tgggttgtta ataaaaaaga
     1621 atattatgaa cttttagctt tcattagtgg aagtataatt ttttcgtatt cagcaattgt
     1681 actcattatt tttatatttg gaaacgatat atttttcttg tttttcagtt cagaatataa
     1741 agcctcttat gatttattct taatccatat tgtaggtttg atttttgtac ttttaggccc
     1801 gcttactggg aagcatttaa taattaaaaa agattatggg gcagaactta gcaaaacctt
     1861 attggcagca attgttaata tagccttaac ttccattgca gtgttaaaat atgaaaatct
     1921 taacttagtg gccgttagta cattaataag ttatatgatt gctaattttg gttactttat
     1981 agtaaaaaaa gattggctat taatcaaagc tatattgaat ggtgttaatc cccttttttt
     2041 ggtgagatat gctaaaaaga tactctaacc ttatattttc ttttgttatt gcgttttcct
     2101 ttttttcata cgtaatgaat cccagtttaa aatttatata taaatcacca gtaataaatt
     2161 ttatcccttt tttgttatgt tgtttgataa caatcatttt tcttacagag aaaaaaatca
     2221 agcttaacta ttatgaatta ttttcaattc tttatgttgg gttctttttt atacttcaat
     2281 atacctattt tatacaatcg acagattcaa tagaaacttt actacgatta atgtcggtaa
     2341 atttttcatt cttatttgga ttactattag gctggtgttt taaaagggag tcaattgaga
     2401 agctttttat actatgggtc ctattacttt ctattgctaa tatctgcggt gtaatcaatt
     2461 attctgatgg ggtggaattt aatcatttga actttacatt acctctaggg actgttgtta
     2521 catggttaat ttttaaagca tttatgaaag atactgatag gtacatattc acattatctg
     2581 ttatattatt tttatttttt aatataatat ttgccggaag tcggactgct atttttctac
     2641 caatcttagt aagtttattt attatggtga tatttagaaa atatgtgtct ataaagaaaa
     2701 cagtgatctc attcattata ttgataacaa taactataat atcattgcct tatattttaa
     2761 gtaacttgaa tgcttatttt ttaagcaagg ttcaaaatat ggctgatatc agtgaggata
     2821 gtcgttataa tttatatttg aaatgtttta atatgctttt agagcatcct cttggaatag
     2881 ggtatggcaa ttataaatat tttatcactg aaccttatcc tcataatatt cttttagaaa
     2941 ttgggctgaa tagtggggtt ttaggatgtt ttgtgtttat aacctatgtg atgatcacca
     3001 caatagtcat aataaagaaa acaaaatcct gctataatga aaaaaatcta tttgttttga
     3061 ctatattttt atattcactt tttagctgga tgttttcaaa cgattttgca agtagcagtg
     3121 ttgttttttt cttattgggt gtgctaggtc acatagcctc tagtaataat gaaaaagaga
     3181 ttaaataaat atgttttcta tagtaattac aactaaagac cgggcttatt atttgaaaag
     3241 agcagttgac agcatattaa aatcaactat ttctccaaaa gatatcgtaa taattaatga
     3301 tggtgggaag gctatatgtg aaaatgattt tccacctatg aaacatatta cattaagtat
     3361 agttaataat cgtttttcaa tgggagctaa ctattcaaga aatcaaggaa ttgataaagc
     3421 cttaactaat tatgtatttt tacttgatga tgatgatgcc tttactccaa ctacctttga
     3481 aaatagaatt aatataatta aatcttcagt ggatattggg gtcgttttta ctggaattaa
     3541 tatagtatca tccaaaaatt tggataaagt aattagaaaa tcaaaaaaca tcaatgacca
     3601 aatcactacg catcagcttc taacagaagg caatgttatc ggatctacat cacgtgcatt
     3661 aattcgtaaa gatttattct gtgaagcggg aagatttgat cctcaattaa gctgtcttca
     3721 ggattatgat ttatggatta gaatgtcatt ggtatcaaga attgtcaatg atcacaaata
     3781 cggagtttat tatacaatac acgacaatgg gcgacaaatt agtactaatt atgaaaaata
     3841 tatgcaagta ggaaaattgt taataaataa atatgattct cttcttaata aaaatacaat
     3901 taatgctttt aagtctaata tttacttaag agttgcaata tctgcctctg cttcatcaaa
     3961 taaagcaaga ttaaaatatt cttttatgtc attaaaatat aggcttaata ttaaagcttt
     4021 agctttgttc ctattcccta gctctgttct taaaagattt tataattatg tataagtttg
     4081 aatgagtaat tgcaatatta ttacgttttc tgtatttaaa ctcaagattt tttcttttca
     4141 cctttctttt tgctaggcac ttgttgaata gtagatggat gtgtaataca ataatggaag
     4201 atgtcttagt gatttataca tttcaataaa ctttcaaaaa aagttaatta taacgcatat
     4261 atttaaatga tttatattta atgtttgtta gtcagataaa tattttattg tctctatagc
     4321 tataggcttt tgttactttt aaataaagaa gatatgtgaa aaataaacaa ttttaatgaa
     4381 gagtggagcc atgtgattca tgtgttctaa tttttatctt aataacaatg atgtacaatg
     4441 gcatggttac aatactattt aatatggtag gggtagtatc tttgaagtag tttatattaa
     4501 aaactatgtt cgtaaattat atatgttccg acaatatata aagattttag atagagggat
     4561 tatctagtaa tacaatgcgt tagataaaat aaatccgtat ctctattact aaaacaatta
     4621 aatgttttat taaagacaag gatattaaga gggcatatta atgaaaggtt tttcggtact
     4681 tatgtctgtt tataaaggtg aaaaggaaaa ctatcttgat gagtgtttta aaagcctgca
     4741 tgaacagaca attaaagcta atgaaatcat tttggttatt gacggcccag tttccaaaga
     4801 attatatcag gttatagata aatgggggga ggttctgccc attataaaag ttaaacttga
     4861 taaaaatgta gggcttggac aagctttaaa tataggcctt aagcactgta attttgagtt
     4921 ggttgcacga atggatactg atgattattg tgtaaaggat agatttttat tacagatgaa
     4981 attcttcgaa gaacacaatg atataatggt cttggggggc gagatagagg aatacgacca
     5041 atccttgagt attccattag gcaaaagaac aacagcatta tctcacgaag aaataattga
     5101 acttgcaaaa aaaagaaatc ctctcaacca tatgacagtc atgtataaaa aaagctttat
     5161 cttaagtgtt ggaggttatc aacatcattt atatatggaa gattataatc tttggttgag
     5221 agtattagct tctggtggtt gtatttgcaa cttacctaag gtattagtgc atgtaagagc
     5281 tggggaagaa atgatcaaaa gacgaaaagg ctggatatat atcaagagtg aaatacagct
     5341 agcacgttta aaaagtaagt taaatataac ctgtttctgg aataactact atacaatgac
     5401 acttaggatc cttgccagac taatgccgac gccacttcta aaattcgtat attctaaact
     5461 tagaacgtct aaattagctt gatgttgaca tttcatttgt ggggagggtg aattaattca
     5521 tttaaaatga taaaacattg cgccaaatgc caataaaaag ttatattttt acacggaatc
     5581 tgaagtaacc tttatagttc atcccctgac aggagtaaac aatgtccaag caacagatcg
     5641 gcgtcgtcgg tatggcagtg
//