LOCUS       AY654590               16573 bp    DNA     linear   BCT 05-JUL-2005
DEFINITION  Escherichia coli O59 O-antigen gene cluster, complete sequence.
ACCESSION   AY654590
VERSION     AY654590.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 16573)
  AUTHORS   Guo,H., Kong,Q., Cheng,J., Wang,L. and Feng,L.
  TITLE     Characterization of the Escherichia coli O59 and O155 O-antigen
            gene clusters: the atypical wzx genes are evolutionary related
  JOURNAL   FEMS Microbiol. Lett. 248 (2), 153-161 (2005)
   PUBMED   15990253
REFERENCE   2  (bases 1 to 16573)
  AUTHORS   Guo,H., Kong,Q., Cheng,J., Wang,L. and Feng,L.
  TITLE     Direct Submission
  JOURNAL   Submitted (15-JUN-2004) TEDA School of Biological Sciences and
            Biotechnology, Nankai University, Hongda 23, Tianjin 300457, China
FEATURES             Location/Qualifiers
     source          1..16573
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:562"
                     /note="serogroup: O59"
     CDS             1354..2565
                     /codon_start=1
                     /transl_table=11
                     /product="glycosyltransferase"
                     /protein_id="AAV74375.1"
                     /translation="MKILIVNTFFYPNEIGGAEFSCKVLAEALAERGHDVSVLSTTNG
                     ESRQTRLGKLKLYYLKLSNVFWHGKSKKQGAIKGIIWHAMDSFNPIMFFKLLKLFKEI
                     RPDVIHTNNIVGFSCSLWFAALVLNIPVVHTLRDYYLKCYRSCMRKNNKNCDSQCVAC
                     KLLTTPRKIISSNVNAVIGNSQYMINSHLKNNYFSNTPMKKVIFNAWNPSTDLQKHQN
                     LLWQRVEHARFGFIGRITEEKGIELLLRSFKNIKNQPFSNKISLIVAGEGDDNYIKKL
                     SDEYSDTDGILFVGKVEPEDFYKRIDFTIVPSLWEEPLARVVFESFFFSLPVLTTARG
                     GNAEVVKHGQNGFIFSETVESLSATMQMALNVNYIEMSKAAFYSRLKFTNENLVSSYE
                     NIYRRIKHEEK"
     gene            2552..3721
                     /gene="wzy"
     CDS             2552..3721
                     /gene="wzy"
                     /note="O-antigen polymerase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzy"
                     /protein_id="AAV74376.1"
                     /translation="MKKSEFQAEKLIILFYFIINLCTFIIITSSSIYIGDPAGEYYTV
                     PLDIAIILFISNTAIYYLLYLIYRCCVSHIAFHNEVIIKRIETLLFLGVTIALLGFFW
                     IDYGRAEYQSTSPFGFVFRLIPYSVIWLLYVSINSKWNAKSIFLIVYYVAAKIIMGWS
                     GILLALFWVLFIKYYSAKKRSFLFMCMCMTLLVILYFSAPIVYYLKYYIRYAGQFEFN
                     YPVLLSKLTARLSTIQNVLYIYQNTNVFTNLYNKYLFDGFYFIEPITSILPRALLGIS
                     ATNFETIYVNIVTGEFNPGVIFYLGLFGKLLAYFNTGIYNFGNFFIVTFVLLGGLFIL
                     LKLNFKKAANPFIFYTIIQFALSGSIEELSYTLYGICLVLIFCKIRFGIHNENRY"
     CDS             3705..4781
                     /codon_start=1
                     /transl_table=11
                     /product="mannosyltransferase"
                     /protein_id="AAV74377.1"
                     /translation="MKIGIDSTALVKNRTGVGNYIYSILNELVKNTEHQFILYSNKEI
                     FYPDLPNVRKVIHSSTYKGPVWQNTSLIYSLFKDRPDVFWGGNGYLPMLVPKKTKLIL
                     TVHDLVYKYAGRTMPTISRLSRRFFQPLSVNKADAIVAVSHATADEVYKEYGVRPDCV
                     VHPQISPLFSLQEKSNLAKIKEKYQLNEYILTIGTLEPRKNMVALIQAYLNVVSLGYK
                     LPVLAIAGGKGWMQGELDKLVEKGVAKGIIRKLGYVSDPDLAVLYSGAQLFVLASIYE
                     GFGMPILEAQASGCPVLISRIKSMIEAAGDICCTFEPDIQSIENSLINLSKGNQPLIC
                     RLPYTIENKIDIAAKKYEKLMRLS"
     CDS             4919..5962
                     /codon_start=1
                     /transl_table=11
                     /product="glycosyltransferase"
                     /protein_id="AAV74378.1"
                     /translation="MTYPIPDDGVYTSVYRCHHPRIISYFSCLLALPTNIPLQVAYYY
                     SPKFKKIINKLVPEHDLLLPHLIRVAGYVKKNSTPKILEMTDAISMNYERVCKLKNST
                     GIKGLIYKIERNRLNQYEKSIAKYFDQTIFVSQHDKNYLFRNLPDLYHKSLVCTNGVD
                     VANFKNTLFKRSYKLIFIGNMFSVQNFDAAFWFCESVLPILRQYGPFTFHVIGKISLE
                     NSKKLSAYEGVFVTGAVDNVMDYANNSLAGICSVRLAAGVQNKILEYMAMGIPAITTS
                     IGLEGLFAVDGESIVVANTPHEFVSTILKLFNDPSFGKTISKNGLGYVQQNHSWSEKL
                     QPLIQVINNLIEE"
     gene            5966..7363
                     /gene="manC"
     CDS             5966..7363
                     /gene="manC"
                     /note="mannose-1-phosphate guanyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="ManC"
                     /protein_id="AAV74379.1"
                     /translation="MSSIIPVIMAGGSGSRLWPLSRELRPKQFLKLDGELTMLQATIN
                     RLKNFVTTQPLVICNEDHRFLVAEQLRYLGKLENNIILEPFGRNTAPAIALAAFTALQ
                     SSSLKEDPILLVLAADHVIRDEESFKRSVQQAVPYAKSGKLVTFGIVPTHAETGYGYI
                     QRGKELNDAYSVKQFVEKPELETAQQYFNSGEYYWNSGMFLFRASRYLDELALFRPDI
                     YTACGKAIGAIDPDHDFVRIDKDAFNSCPSDSIDYAVMEKTSDAVVVPMDAGWSDVGS
                     WLSLWELSKKDSMGNSFHGDVIQHSSKNNFVFTESCLVSLVGVEKLVVVQTKDAILVA
                     DQNKVQDVKNIVEKLKNSCRTEHRIHREVFRPWGKHDLIDDGDVYRVKRISVKPGERL
                     SLQMHHHRAEHWIVVSGIAKVTNGDNIYLLKENESTFIPSGTIHALENPGEIMLELIE
                     VQSGVCLDENDIIRL"
     gene            7485..8915
                     /gene="manB"
     CDS             7485..8915
                     /gene="manB"
                     /note="phosphomannomutase"
                     /codon_start=1
                     /transl_table=11
                     /product="ManB"
                     /protein_id="AAV74380.1"
                     /translation="MTKYNSSSLIANSNVNFGTSGARGLVVDFTHNVCAAFTHAFLSV
                     IEKHFKFDTVAVAIDNRPSSFNIAQACVFAIKQHGYGIEYHGVIPTPALAHYSMQKNI
                     PCIMVTGSHIPFDRNGLKFYRPDGEITKEDELAIVNSEYTFSPVGVLPHLETSSQGAD
                     CYLERYVSLFYSDILKGKRIGVYEHSSAGRDLYASLFNQLGAEVISLGRSDEFVPIDT
                     EAVSDEDRVLAREWSKKYNLDAIFSTDGDGDRPLVADENGEWLRGDILGLLTAIELNI
                     KALAIPVSCNTAIEESNKFASIQRTKIGSPYVIAAFADLAKQFDSVAGFEANGGFLLA
                     SDLQINDKELKSLPTRDAVLPALMLLIASRNSTISQLINNLPQRFTWSDRVKNFPSDS
                     SQQIIKNAISSPNNFFNSLGYESLSCSSIDETDGARFTLNNGDIIHLRPSGNAPELRC
                     YAEASDENQAKQYVTNVLGNITSLIS"
     gene            9112..10518
                     /gene="gnd"
     CDS             9112..10518
                     /gene="gnd"
                     /note="6-phosphogluconate dehydrogenase"
                     /codon_start=1
                     /transl_table=11
                     /product="Gnd"
                     /protein_id="AAV74381.1"
                     /translation="MSKQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIA
                     ENPGKKLVPYYTVKEFVESLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGN
                     TFFQDTIRRNRELSAEGFNFIGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIA
                     AVAEDCEPCVTYIGADGAGHYVKMVHNGIEYGDMQLIAEAYSLLKGGLNLSNEELAQT
                     FTEWNNGELSSYLIDITKDIFTKKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEP
                     LSLITESVFARYISSLKDQRVAASKVLSGPQAQPAGDKAEFIEKVRRALYLGKIVSYA
                     QGFSQLRAASEDYNWDLNYGEIAKIFRAGCIIRAQFLQKITDAYAENPKIANLLLAPY
                     FKQIADDYQQALRDVVAYAVQNGIPVPTFSTAVAYYDSYRAAVLPANLIQAQRDYFGA
                     HTYKRIDKEGVFHTEWLD"
     gene            10638..11921
                     /gene="wzx"
     CDS             10638..11921
                     /gene="wzx"
                     /note="O-antigen flippase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzx"
                     /protein_id="AAV74382.1"
                     /translation="MSNYIKNAGWIFFEKFVRIAISFMLFAFVSRVLNPNDFGVLSYY
                     QTITTMLLALTNLGFDNVLINEFNQNEKHNKIFATAFWSRIIVSTVVILLFAVGVCFY
                     DLPMVNKIVLLLCLSSLVFQTQNTYVSYFQSQLQASIITKISFLSLLLSALVKVYLLM
                     TDKNIIWFAFSYSFDFAVSFLFFAVFSYKRNYVSISLRYFDLNVLKGLLRSSWPIIAS
                     AVIVVLYTRLDQLMIMNMLGSDSVAIFSVAIKISEAYLFVPAALVTSYYPLISKSPSN
                     DNIRFYFDVVFATSIIMAVGVAIISFFLIPIMFGEYYACSYTILIVLLLGSLFSILGS
                     ACTNLMIVYGLSYLRLIRAIFGLLVNFSLNLIFIPKYGVIGAAYASVVSQIFAAWVSN
                     AFSKKTIECFKLQTITVLTCGVLGGRQLCQILFKK"
     CDS             12001..12399
                     /codon_start=1
                     /transl_table=11
                     /product="acetyltransferase"
                     /protein_id="AAV74383.1"
                     /translation="MFLEYYYSYRYYRLFKIPIANHLTIGLKKLGEKNTIFPHPVGIV
                     IGKKVSIGNNCTIYQNVTIGVSNNKTEDYPIIGDNVIIYAGAIIIGSVSIGNNVIIGA
                     GCIVTKDVPEDKIAVGSPMKIIDKKANVLY"
     gene            12506..13672
                     /gene="ugd"
     CDS             12506..13672
                     /gene="ugd"
                     /note="UDP-Glc-6-dehydrogenase"
                     /codon_start=1
                     /transl_table=11
                     /product="Ugd"
                     /protein_id="AAV74384.1"
                     /translation="MKITISGTGYVGLSNGILIAQNHEVVALDIVQAKVDMLNKKQSP
                     IVDKEIEEYLATKDLNFRATTDKYDAYKNADYVIIATPTDYDPKTNYFNTSSVEAVIR
                     DVTEINPNAVMIIKSTIPVGFTESIKERFGIENVIFSPEFLREGKALYDNLHPSRIVI
                     GEQSERAERFAALLQEGAIKQDIPTLFTDSTEAEAIKLFANTYLAMRVAYFNELDSYA
                     ESLGLNSRQIIEGVCLDPRIGNHYNNPSFGYGGYCLPKDTKQLLANYQSVPNNLISAI
                     VDANRTRKDFIADSILARKPKVVGVYRLIMKSGSDNFRASSIQGIMKRIKAKGVPVIV
                     YEPAMKEDDFFRSRVVRDLDAFKQEADVIISNRMSADLADVADKVYTRDLFGND"
     gene            complement(13738..14742)
                     /gene="gla"
     CDS             complement(13738..14742)
                     /gene="gla"
                     /note="GlcA epimerase"
                     /codon_start=1
                     /transl_table=11
                     /product="Gla"
                     /protein_id="AAV74385.1"
                     /translation="MKFLVTGAAGFIGFYVSKRLLAAGHQVVGIDNLNDYYDVNLKQA
                     RLDLLKHDNFSFYKIDLADREKMAALFADERFDRVINLAAQAGVRYSLENPNAYADAN
                     LIGFLNILEGCRYNNVQHLLYASSSSVYGMNLKMPFSTDDSVDHPVSLYAATKKANEL
                     MAHTYSHLYGLPTTGLRFFTVYGPWGRPDMALFKFTKAMLEGKSIDVYNFGKMKRDFT
                     YIDDIAEAIIRLQDVIPEKDPQWAVETGSPATSSAPYRVYNIGNSSPVELMDYINALE
                     EALGIEANKNMMPLQPGDVLETSADTKALYDVIGFKPETSVKEGVKNFVEWYRNFYKV
                     "
     gene            15094..16128
                     /gene="wzz"
     CDS             15094..16128
                     /gene="wzz"
                     /note="O-antigen chain length determinant"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzz"
                     /protein_id="AAV74386.1"
                     /translation="MAIIAKLWRLKIISSVRVMMRVENNNVSGQNHDPEQIDLIDLLV
                     QLWRGKMTIIISVIVAIALAIGYLVVAKEKWTSTAIVTQPDVGQIAGYTNAMNVIYGP
                     AVPKVSDIQTSLIGRYSTAFSALAETLDNQEEPEKLTIEPTVKNQSLPLAVSYVGETA
                     EGAQKQLAQYIQQVDDQVNEELEKDLKDNIALRMKNLQDSLKTQEVVAQEQKDLRIRQ
                     IQEALQYANQAQVTKPQVQQTEDVTQDTLFLLGSEALESMIKHEATRPLVFSPNYYQT
                     RQNLLDIESLKVDDLDIHAYRYVMKPTLPIRRDSPKKAITLILAVLLGGMVGAGIVLG
                     RNALRNYNAK"
ORIGIN      
        1 attgtggctg cagggatcaa agaaatcctc ctggtaactc acgcgtccaa gaacgcggtc
       61 gaaaaccact tcgacacctc ttatgaatta gaatctctcc ttgagcagcg cgtgaagcgt
      121 caactactgg cggaagtaca gtccatttgc ccgccgggag tgaccattat gaacgtgcgt
      181 cagggcgaac ctttaggttt gggccactcc attttatgtg cacgacccgc cattggtgac
      241 aacccatttg tcgtggtgct gccagacgtt gtgatcgatg acgccagcgc cgacccgctg
      301 cgctacaacc ttgcggccat gattgcgcgc ttcaacgaaa cgggccgcag ccaggtgctg
      361 gcaaaacgta tgccaggtga cctctctgaa tactccgtca ttcagaccaa agagccgctg
      421 gaccgcgaag gtaaagtcag ccgcattgtt gaattcatcg aaaaaccgga tcagccgcaa
      481 acgctggact cagatattat ggccgtgggc cgttatgtgc tttctgccga tatttggccg
      541 gaacttgaac gcactcagcc tggtgcatgg gggcgtattc agctgactga tgctattgcc
      601 gaactggcga aaaaacagtc tgttgatgca atgctgatga ctggtgacag ttacgactgc
      661 ggcaaaaaaa tgggctatat gcaggcgttt gtgaagtatg gactacgcaa cctgaaagaa
      721 ggggcgaagt tccgcaaagg gattgagaag ctgttaagcg aataatgaaa atctgaccgg
      781 atgtaacggt tgataagaaa attataacgg cagtgaagat tcgtggcgaa agtaatttgt
      841 tgcgaatatt cctgccgttg ttttatataa acaatcagaa taacaacgag ttagcaatag
      901 gattttagtc aaagttttcc aggattttcc ttgtttccag agctgattgg taagacaatt
      961 agcgtttgaa tttatgaggg ctttgcgggg ttagatgcag agttcgtgac atccattgag
     1021 aatctacgca gtgcactggt agctgttaag ccaggggcgg tagcgtgggt gaaacgttta
     1081 ataatgagat ataagttatg attatttcta aacttagccg gcataaaatt gcttgtgctg
     1141 agtcagagtt agaacttgta aattatagta tataaattaa actgtgaaat attattgcgg
     1201 taatcttacc aaaaagctgt atgaatttac cataaaacaa atattgattg tgttcttggt
     1261 tttttattaa gcagatcaat agttgttatc tattgccttg ttgggtaata aggcatctat
     1321 aaatcttgat ggttaatatt taagtcccaa taaatgaaaa ttttgattgt aaatactttt
     1381 ttttatccaa atgaaattgg tggtgctgag ttttcatgta aggtattagc agaagctctt
     1441 gcggaacggg ggcatgatgt gtctgtttta tctacaacaa atggggaatc aagacaaact
     1501 aggttaggta aattgaagtt gtattattta aaattaagta atgtgttctg gcatggtaaa
     1561 tcaaaaaaac aaggagcaat aaaagggatt atatggcatg ctatggattc atttaacccg
     1621 attatgttct ttaaattatt aaaattattt aaagaaatca ggcctgatgt tatacataca
     1681 aataatatag ttggctttag ttgctcatta tggtttgctg ctttagtttt aaatattcct
     1741 gttgtccaca cgttacgtga ttattattta aaatgttatc gttcatgcat gcggaaaaat
     1801 aataaaaatt gtgattctca atgtgttgca tgtaagttat taacaacacc aagaaaaatt
     1861 atttcatcga atgtaaatgc tgttattggc aatagccagt atatgattaa ctctcatttg
     1921 aaaaataatt atttttcaaa tacaccgatg aaaaaagtaa tatttaatgc atggaaccca
     1981 tcaacagacc ttcaaaaaca tcaaaattta ctttggcaac gagtagaaca tgcacgattc
     2041 ggttttattg gaagaatcac agaggaaaaa ggaattgaac tattgttaag gtcgttcaaa
     2101 aatataaaga accaaccttt tagcaataaa atcagcttaa tagttgcggg ggaaggagat
     2161 gacaattata taaagaaatt atctgatgaa tattcagata cagatggcat attattcgtt
     2221 gggaaagtag aacccgaaga tttctataag cggattgatt ttactattgt tccgtcttta
     2281 tgggaagagc cattagcaag agttgttttt gagtcatttt tcttttcatt gcctgttttg
     2341 acaacagctc gaggaggaaa tgccgaagtt gtgaagcatg ggcagaatgg gtttattttc
     2401 tccgaaacag tagagtcttt gtcggcaaca atgcagatgg cactgaatgt aaattatatt
     2461 gagatgtcta aggctgcttt ttatagtcga ttaaaattta cgaatgaaaa tctggtttca
     2521 tcctatgaaa atatatatcg aagaataaaa catgaagaaa agtgaatttc aagcagaaaa
     2581 actaataatt ttgttttatt ttataataaa tctttgcacc tttataatta ttacatcgtc
     2641 atcgatatat ataggtgatc cagcgggtga atattatact gtgccgcttg atatagctat
     2701 aatattattt attagtaata ctgctatata ttatctttta tacttgatct atcgttgttg
     2761 tgtatcacat attgcattcc acaatgaagt tatcataaaa agaattgaaa ctttattgtt
     2821 tttaggtgtt acaattgcat tattaggctt tttttggatt gattatggac gagctgaata
     2881 tcaaagtaca tctccatttg gttttgtctt taggttaata ccttattccg tcatttggct
     2941 tctctatgtt tcaattaatt caaaatggaa tgcaaaaagt atattcctta ttgtttacta
     3001 tgttgccgct aaaataataa tgggatggag tggtatatta ttagcactct tctgggtttt
     3061 gtttataaaa tattacagtg cgaagaaacg tagtttttta tttatgtgta tgtgcatgac
     3121 tctgctagtc atattgtatt tttcggctcc tatagtttat tatttgaaat attacataag
     3181 atatgctggt cagtttgaat ttaattatcc tgtgctatta tcgaagctta cggcaagatt
     3241 atctactatt cagaatgtgt tgtatattta tcaaaatact aatgtattca caaacttata
     3301 taataagtat ttatttgatg gtttttattt tatcgaacca ataacatcta tcttgcctag
     3361 agctctttta ggtataagtg caactaactt tgaaactata tatgtaaaca tcgtaactgg
     3421 agagttcaac ccaggtgtca tattttattt gggattgttt ggtaaactat tagcttactt
     3481 taatacaggg atatataatt ttggcaactt tttcattgta acctttgttc ttcttggggg
     3541 gctatttata ttactcaaat taaactttaa aaaagcagcc aaccctttta ttttttatac
     3601 aatcatacaa tttgctctta gtggctcgat agaggaacta tcatatacac tatacggtat
     3661 ttgtcttgtt ttaatatttt gtaaaatacg gtttggtatt cataatgaaa ataggtattg
     3721 attcaactgc acttgtaaaa aatagaactg gagtaggtaa ttatatatat tcaattttaa
     3781 acgaattagt taaaaataca gaacatcaat ttattttata ttctaacaaa gaaatatttt
     3841 atcctgattt gccaaatgtt agaaaagtta ttcattcatc gacttataaa gggccagtat
     3901 ggcaaaatac aagtttgatt tattccctct tcaaagatag acctgatgtt ttttgggggg
     3961 ggaatgggta tttaccaatg ttagttccga agaaaacaaa gctgatttta acagttcatg
     4021 atcttgtata taaatatgct ggtcgtacaa tgcctaccat cagtagatta tctcgtaggt
     4081 tttttcagcc attatctgta aataaagctg atgcaatagt tgcagtcagt catgcaactg
     4141 cagatgaggt atataaagaa tatggtgtcc gacctgattg tgtggtccat cctcagatat
     4201 ctccgttatt ttcattacaa gaaaaatcta acttagcgaa aattaaagaa aaataccagc
     4261 ttaatgagta tatattgaca attggaaccc ttgaaccacg aaaaaatatg gtggctttaa
     4321 tccaggcata tctaaacgta gtatcattgg gttataaatt acctgtactg gcaattgctg
     4381 gaggtaaagg ctggatgcag ggagagttag ataaattagt agagaagggg gtggcaaaag
     4441 gtattatcag aaaattaggt tatgtatctg atccggattt agcggttctt tattcaggag
     4501 ctcaactttt tgttttagca tctatttatg aaggttttgg tatgccgatt ctggaggctc
     4561 aagccagcgg gtgtcctgtg cttatatcca gaataaaatc tatgatagag gccgcaggtg
     4621 atatttgctg tacttttgag ccagatatac agtctattga gaactctctt ataaatctat
     4681 caaaagggaa tcagcctctt atttgtcggc taccatatac tattgaaaat aaaattgata
     4741 ttgcagctaa aaaatatgaa aaattgatga ggttatcttg aagaaaatat tggtaattac
     4801 cccaagattt ccatatccag tgatcggagg agatagatta cgtatttatg aaatatgtaa
     4861 agagctgtct cgtaaatact cattgactct ggttagtttg tgtgagtcga atgaagaaat
     4921 gacatatcct atccctgatg atggtgttta tacatcagta tatagatgtc atcatccacg
     4981 aatcatatcg tatttttcat gcttactagc actgcctact aacataccac tgcaagttgc
     5041 ttattactat tctcccaaat ttaaaaaaat aattaataag ttagttcctg aacatgattt
     5101 attattacct catttaattc gtgttgctgg gtatgtaaaa aaaaactcaa ctcctaaaat
     5161 attagaaatg actgatgcta tttctatgaa ttatgagaga gtatgtaaat taaaaaatag
     5221 tacaggaatt aaaggtctta tatataaaat tgagcgtaac cgtctaaatc aatatgaaaa
     5281 atcaatagca aaatactttg atcagacaat ttttgtatct caacatgata agaactacct
     5341 ttttagaaat ttaccagact tatatcataa gtcattagtt tgtacaaatg gagttgatgt
     5401 tgctaacttt aaaaatacat tgtttaaaag aagctacaaa cttattttta ttggcaacat
     5461 gttttctgtt caaaattttg atgcggcttt ttggttttgt gaatctgtat tacctatact
     5521 tcgtcaatat ggaccattta cctttcatgt tataggtaaa atatcgttag aaaactcaaa
     5581 aaaactttca gcatatgagg gggttttcgt tactggggct gtagataatg ttatggacta
     5641 tgcaaataat tctttggcgg gcatatgttc agtaagatta gctgcgggtg tacagaataa
     5701 aattttagag tacatggcta tgggaatacc ggcaataaca acatcgattg gtttggaggg
     5761 gttattcgct gttgacggcg aaagtatagt tgtggctaat acacctcatg agtttgtatc
     5821 aacaatattg aaattgttta atgatccaag ttttggaaaa accatttcaa aaaatggatt
     5881 aggttatgtt caacaaaatc attcgtggtc tgagaaatta caacccctaa ttcaagtaat
     5941 taataattta atcgaagagt agtttatgtc tagtataatt cctgttatta tggctggcgg
     6001 ttctggtagt cgtttatggc ctctttcgcg cgaacttcgt ccaaagcaat tccttaagct
     6061 tgatggtgag ctaacaatgc tgcaagcgac tatcaatcgt ttaaaaaatt tcgttacgac
     6121 gcaaccattg gttatttgta atgaagatca ccgattttta gttgctgaac agttacgtta
     6181 tttaggtaaa cttgaaaata atatcatctt agagccattt ggacgtaata ctgcgccagc
     6241 aatagctttg gctgcattca cagctttaca gagctcttct cttaaggaag atcctatatt
     6301 gttagtatta gcggcagatc atgttatccg agatgaagag tcatttaaaa gatcagttca
     6361 acaagcagtt ccttatgcta aatctggaaa acttgttact tttggcattg tacctaccca
     6421 tgcggaaacc ggatatggat atatacaacg aggaaaggaa ttaaatgatg cttattcagt
     6481 taaacaattt gtcgaaaagc ccgagcttga aaccgcacaa caatatttta atagcggaga
     6541 atattattgg aatagtggta tgttcttgtt tcgtgctagc cgctatcttg atgaactggc
     6601 attattccga ccagatattt atactgcttg tggtaaagca ataggggcta ttgacccaga
     6661 tcatgacttt gttcgtattg ataaagatgc attcaattct tgtccaagtg attctattga
     6721 ttatgctgta atggaaaaaa cttcagatgc agtagtcgtt ccgatggatg ctggttggtc
     6781 tgatgttgga tcttggctat cgttatggga gctttcaaaa aaagattcta tggggaattc
     6841 atttcatggt gatgtgattc aacatagtag taaaaataat tttgttttta cagagagctg
     6901 tttggttagt ttggttggtg ttgaaaaact tgtagtcgta caaacaaaag atgcaatatt
     6961 agttgctgat cagaataaag ttcaagatgt aaaaaatata gttgagaaac taaaaaatag
     7021 ctgccgtaca gaacatcgta tacaccggga agtttttcgc ccttggggaa agcatgattt
     7081 aattgacgat ggagatgtat atcgagtcaa aaggataagt gttaaaccgg gtgagaggct
     7141 ttcattgcaa atgcatcatc atagagctga acactggata gttgtatctg gtatagctaa
     7201 agttacgaat ggtgacaata tatatctttt aaaagaaaat gaatcaacat tcataccttc
     7261 aggtacgatt catgccttag aaaatccagg agaaataatg ctggagctta ttgaggtgca
     7321 atcgggagta tgcttggatg aaaatgatat tatccgttta taaggtcact tataattgaa
     7381 gttaaagagt ttctattaaa ataggctatt tggagctttg acagttgttt agtatttaat
     7441 cgcaaaaatg atatctttat ttataatgtt aaaggtagtg tcctatgact aagtataata
     7501 gttcttcatt aatagccaat agtaatgtga attttggtac tagtggtgct cgtggattag
     7561 tcgttgattt tactcacaat gtttgtgctg cttttactca tgcatttctt tcggttatcg
     7621 aaaaacactt taagtttgac acagtggctg tagcaataga taacagacct agtagtttta
     7681 atatagcaca agcatgtgtt ttcgctataa aacagcatgg atatggcatc gaatatcatg
     7741 gtgtcattcc gactcctgca ttagctcatt attcgatgca gaaaaatatt ccctgtataa
     7801 tggtcactgg gagtcatata ccttttgatc gtaatggttt aaaattctac cgaccagatg
     7861 gtgaaatcac aaaagaggat gagctcgcaa ttgtaaatag tgaatataca ttttctcctg
     7921 taggtgtatt acctcatctt gaaacaagct ctcaaggtgc ggactgctac ttggaacgtt
     7981 atgtttctct tttttattct gatattttaa aggggaaaag aataggggta tatgaacatt
     8041 ctagtgcggg gcgcgattta tatgcttctc tttttaatca attgggtgca gaggtcattt
     8101 ccctaggcag aagtgatgag ttcgttccga ttgatacgga agcagtaagt gatgaagatc
     8161 gtgtacttgc aagagagtgg tctaaaaaat ataatcttga tgctattttc tcaacagatg
     8221 gcgatggtga tcgtccttta gttgccgatg aaaatggtga atggttaaga ggcgatattc
     8281 tgggactact tactgctatt gaacttaata tcaaggcgtt ggctattcca gtgagttgta
     8341 atacagcaat tgaagagtct aataaatttg caagtataca acgaacgaaa ataggttctc
     8401 cttatgtaat tgcagcattt gcagatcttg ctaagcaatt tgattcagtc gctggttttg
     8461 aagctaatgg tggttttctc cttgcctccg atttacaaat taatgacaag gaattaaaat
     8521 cgttgcctac acgagatgct gtgttaccag cattaatgct cttaatagct tctcgcaata
     8581 gtactatttc tcaactgatt aataatcttc ctcagcgatt cacttggtca gatagagtta
     8641 aaaacttccc ttcagattca agtcaacaaa ttataaagaa tgccatatcg tcacccaata
     8701 atttctttaa tagtttaggt tatgaatcat tatcctgttc ctctattgat gaaacggatg
     8761 gtgcaagatt tactttaaat aatggtgata ttatacatct ccgtccttcc ggtaatgctc
     8821 cagaactccg ttgttatgct gaggccagtg atgaaaatca ggctaagcaa tatgttacga
     8881 atgtgctggg aaatattacc tctttgattt cttgatgtta taggtttatc tacgcttata
     8941 tgtgtgcgta ggtttgatta cacgtagatg ctggtataca gaattgaaga acggtatttg
     9001 ttgcattaat gaaattcagc actacacaca ttcgtgcaac ttgagataac atctcaatca
     9061 tattcaagtc gcgcatacat cgcggtgaac accccctgac aggagtaaac aatgtcaaag
     9121 caacagatcg gcgtcgtcgg tatggcagtg atggggcgca accttgcgct caacatcgaa
     9181 agccgtggtt ataccgtctc tattttcaac cgttcccgtg agaaaacgga agaagtgatt
     9241 gccgaaaatc caggcaagaa actggttcct tactatacgg tgaaagagtt tgttgaatct
     9301 ctggaaacgc ctcgtcgcat cctgttaatg gtgaaagcag gtgcaggcac ggatgctgct
     9361 attgattccc tcaagccata cctcgataaa ggtgacatca ttattgatgg tggtaatacc
     9421 ttcttccagg acaccattcg tcgtaaccgt gagctttctg ccgaaggttt taacttcatc
     9481 ggtaccggtg tttccggcgg tgaagaaggt gcgctgaaag gtccttccat tatgcctggt
     9541 gggcagaaag aagcctatga actggttgca ccgatcctga ccaaaatcgc cgcagtggct
     9601 gaagactgtg agccatgcgt tacctatatt ggtgccgatg gtgcaggtca ctatgtgaag
     9661 atggttcaca acggtattga atacggcgat atgcagctga ttgctgaagc ctattctctg
     9721 cttaaaggtg gcttgaacct ttccaacgaa gaactggcgc agacctttac cgagtggaat
     9781 aacggtgaac tgagcagcta cctgattgac atcactaaag acatcttcac taaaaaagat
     9841 gaagacggta actacctggt tgatgtgatt ctggatgaag cggcgaacaa aggtaccggt
     9901 aaatggacca gccagagcgc gctggatctc ggcgaaccgc tgtcgctgat taccgagtct
     9961 gtgtttgcac gttatatctc ttctctgaaa gatcagcgtg ttgccgcatc taaagttctc
    10021 tctggcccgc aagcacagcc agcaggcgac aaagctgagt ttatcgagaa agttcgccgt
    10081 gcgctgtatc tgggcaaaat cgtttcttac gctcagggct tctctcagct acgcgccgcg
    10141 tcggaagatt acaattggga tctgaactac ggcgaaatcg cgaagatttt ccgtgctggt
    10201 tgcatcatcc gtgcgcagtt cctgcagaaa atcaccgatg cgtatgccga aaatcccaaa
    10261 atcgctaacc tgctgttggc tccgtacttt aagcaaatcg ccgacgacta ccagcaggca
    10321 ctgcgtgatg tcgtcgctta tgcagtgcaa aacggtattc cggttccaac cttctctacg
    10381 gcggttgcct attacgatag ctaccgtgcc gcggtgctgc ctgcgaacct gatccaggca
    10441 caacgtgact atttcggtgc gcatacttat aaacgcattg ataaagaagg tgtgttccat
    10501 accgaatggt tggattaaaa acgatttgag tttttgaatt aagagcctac gatgtgttag
    10561 gctctttaaa atattatatt catggtatta tttaaaattt gaatatcttc taaggtcaaa
    10621 atgtaatgag ataatagatg tcaaattata ttaaaaatgc aggttggatt ttttttgaaa
    10681 aatttgtgcg aatagctatc agctttatgc tcttcgcgtt tgtttcaaga gtcttgaacc
    10741 ctaatgattt tggagtgctg tcgtattatc aaacaattac aactatgcta ctggccttaa
    10801 ctaacttggg ttttgataac gttcttatta atgagtttaa tcaaaatgag aaacataata
    10861 aaatctttgc aacagcattt tggtcgagaa tcatagtttc aactgttgtg atattattat
    10921 ttgcagttgg ggtttgtttt tatgatcttc ctatggttaa taaaattgtt ttgttgctgt
    10981 gtttgtctag tttagtcttt caaactcaaa acacttatgt atcatatttt caatcacaat
    11041 tgcaagcctc tattattaca aaaataagtt ttctttcact tcttctatct gctttagtga
    11101 aagtgtattt attaatgaca gataaaaata tcatatggtt tgcattttca tatagtttcg
    11161 attttgctgt ttccttttta ttttttgctg tgttttccta taagcgaaat tatgtttcaa
    11221 ttagtttaag atattttgat ttgaatgtgt tgaaaggctt gcttcgtagt tcttggccaa
    11281 ttatagcttc cgctgtaata gttgtgcttt acactagatt agatcaacta atgatcatga
    11341 atatgttagg ttctgactcc gtagcaatat ttagtgtagc aataaaaatc tcagaggcat
    11401 atttatttgt acctgcagca ttagttacat catattatcc attgatttct aaatccccta
    11461 gtaatgacaa tattcgattt tattttgatg tagtgtttgc cacttccatt attatggcag
    11521 ttggagttgc aataatatca ttttttttga ttccgataat gtttggtgaa tattatgctt
    11581 gttcatatac aatattaatt gtattattgt taggatcatt gttttcaatt ttaggttcag
    11641 catgcaccaa tttaatgata gtttatggtt tatcttattt gagattaatt agagcaatat
    11701 ttggattgct agtgaatttt tctcttaatt taatatttat tccgaagtat ggggttattg
    11761 gtgctgcata tgcttcagtg gtaagccaga tatttgctgc ttgggtaagt aatgctttta
    11821 gtaaaaaaac tatagagtgt ttcaagctac aaactatcac tgtattaaca tgtggtgtgt
    11881 tgggagggcg gcagctatgt cagattcttt tcaaaaagtg agtgccaaaa tgatcagtaa
    11941 aaacacaaaa aaaaatggaa tattaagaga cttttctttc atttaaatgt aagatggcgt
    12001 gtgtttcttg agtattatta tagctataga tattatcgtc tatttaagat accaattgct
    12061 aatcatctca cgattggctt aaaaaaatta ggagagaaaa atactatttt tcctcatcct
    12121 gtaggtatag tgattggaaa aaaagtcagt ataggaaata attgtactat ctatcaaaat
    12181 gtgacgattg gtgtgagtaa caataaaact gaggattatc ctattatcgg agacaatgtt
    12241 attatttatg ctggtgctat cataataggt agtgttagca tagggaataa tgtgataatt
    12301 ggtgccggat gtattgtaac aaaagacgtt cctgaggata agattgctgt tggctcaccg
    12361 atgaaaataa tagataagaa ggctaatgtt ctctattgat aattaggcca tcatttccga
    12421 tggccgatat attgtcttga ctctaatatg aatttcatgc tagtactata attactgtaa
    12481 tttttcgata attaagaatt taagtatgaa aataacaatt tcaggaacag gttatgttgg
    12541 tctttcaaat ggtattctga ttgcgcaaaa tcacgaagtg gttgctttag atatcgttca
    12601 ggccaaagtg gacatgctta acaagaagca gtcaccgatt gttgataagg agattgaaga
    12661 gtatctggcg actaaagatc tcaatttccg cgctacgaca gataagtatg acgcgtataa
    12721 aaatgccgat tacgttatta ttgccacacc taccgattat gatccgaaaa cgaattattt
    12781 taatacctca agcgtggaag cggtcattcg cgatgtgaca gaaattaatc ccaacgcggt
    12841 aatgattata aaatcaacta tccctgttgg ttttacagag tccattaaag aacgttttgg
    12901 tattgaaaat gtgatctttt cgcctgagtt tttgcgtgaa ggtaaagcac tttatgataa
    12961 cttacaccca tcacgcattg tgattggcga gcagtctgaa cgcgctgaac gttttgctgc
    13021 gttattacag gaaggcgcca ttaagcaaga cataccaaca ttgtttactg actcaaccga
    13081 agctgaggcg attaaacttt ttgccaacac ttatctggct atgcgtgtag cgtatttcaa
    13141 tgaacttgat agttatgctg aaagcctggg gcttaattca cgccagatta ttgagggcgt
    13201 atgccttgac ccgcgtatcg gtaatcacta caacaacccg tcattcggtt atggtggtta
    13261 ttgtctgccg aaagatacta agcagttact ggcaaattac cagtctgtgc cgaataacct
    13321 gatctcggca attgttgacg ccaaccgcac gcgcaaagat tttattgccg attctatcct
    13381 tgcacgtaaa ccgaaagttg ttggcgtcta tcgtttgatt atgaagagtg gttcagacaa
    13441 tttccgtgct tcctcgattc agggtattat gaagcgaatc aaggcgaaag gcgtgcctgt
    13501 aatcgtttat gagccagcga tgaaagagga cgattttttc cggtcgcgcg tggtacgtga
    13561 tctggatgcg ttcaaacaag aagctgatgt tattatttct aaccgtatgt ctgccgatct
    13621 ggctgatgta gcagataagg tttatacgcg cgacttgttt ggcaatgatt aattattttg
    13681 ttttattcta agaaaaggcc ctaatatatt agggcctttt cttatggttt tgtaaaatca
    13741 aactttatag aagttacgat accattctac aaagttcttt actccctctt taactgacgt
    13801 ttcaggtttg aatcctatta cgtcatacag tgcttttgta tcagcactgg tttccagtac
    13861 atcaccgggt tggagaggca tcatattctt gttggcttca atacccagag cctcttctaa
    13921 ggcattgata tagtccatca actccacagg cgaactatta ccaatgttat agacacgata
    13981 tggtgctgaa cttgttgctg gcgaacctgt ttctacagcc cactgtggat ctttttctgg
    14041 aataacatcc tgtaaccgaa taatagcttc ggcaatatca tcaatataag taaagtcacg
    14101 cttcattttg ccgaagttgt aaacatcaat gcttttacct tccagcatgg ctttagtgaa
    14161 tttaaataat gccatatccg gacgtcccca tggaccataa accgtaaaga aacgcagccc
    14221 tgtggtcggt aagccataca aatgagaata cgtatgggcc atgagttcat tcgctttttt
    14281 agttgctgca taaagcgaaa caggatgatc tacagagtca tctgtagaga aaggcatctt
    14341 gaggttcatg ccataaacag aactggagga agcgtaaagt agatgctgaa cattattata
    14401 gcggcatcct tccagtatgt tcaggaatcc aatcaggttt gcatctgcat atgcattggg
    14461 attttcaagg gagtaacgta cacctgcttg cgcagcgagg tttattacgc gatcgaaccg
    14521 ctcgtctgca aacagtgccg ccattttctc gcgatcggcc aggtcaattt tataaaaact
    14581 gaaattgtcg tgcttgagta aatcaagtcg tgcttgtttg aggttgacat cgtaataatc
    14641 atttaagttg tcaatcccta caacctgatg accagctgca agaagccgtt tacttacata
    14701 gaaaccgata aagccagcag ctcccgtaac cagaaatttc atttataatc ctcgctcagg
    14761 ctagaatata gccaattttc atctggcata actgaaagtt aaatcatacc gttagacaag
    14821 aaaaaaagat aatcggtatc agttctaaac ctggctgttt tttctggtaa cgtgctcatt
    14881 ttacaatcaa agctgttcta agctgactat acaagccgac gtcattatct ccaaccgtat
    14941 ggcagaagag cttaaggatg tggcagataa ggtctatacc cgcgatctct ttggcagcga
    15001 ctaacatcct gttatcaggg cgattttcgc cctgattctc ttatgttccc tttgtaataa
    15061 ttcattattt ttatcattta tcctatagca ttcatggcga ttatcgctaa actatggcga
    15121 cttaaaatta tttcgtccgt tagggtaatg atgagagtag aaaataataa tgtttctggg
    15181 caaaaccatg acccggaaca gattgatttg attgatttac tggtgcagtt gtggcgtggc
    15241 aagatgacaa ttatcatctc tgtcattgtt gctattgccc tggctatagg gtatctggtc
    15301 gttgccaaag aaaagtggac ttcaacagct atcgttactc aacctgatgt ggggcaaatc
    15361 gctggttata ccaacgcgat gaatgtgatt tacggtccgg ctgtaccgaa agtctccgac
    15421 attcagactt cacttatcgg acgttacagc actgcattct cagcattagc ggaaacgttg
    15481 gataatcagg aagaacctga aaaactgacc attgagccta ctgttaaaaa tcagtcctta
    15541 cctttagcgg tgtcttatgt tggtgaaaca gctgaaggtg cgcagaaaca gctggcgcaa
    15601 tatatccagc aagttgacga ccaggtaaac gaagaactgg aaaaagacct gaaagacaac
    15661 atcgcgctgc gtatgaaaaa cttgcaggat tcgctgaaaa cccaggaagt agtcgcgcag
    15721 gagcagaaag atctgcgtat ccgtcagatt caggaagcgt tgcagtatgc gaatcaggcg
    15781 caggtgacaa agccacaggt tcagcagact gaagatgtga cacaagatac gttgttcctt
    15841 ttggggagcg aagcgctgga gtcgatgatt aagcatgagg cgacccgtcc gttggtgttc
    15901 tcaccaaact actatcagac tcgtcaaaac ctgctggata tcgaaagctt aaaagttgat
    15961 gatcttgata ttcatgctta ccgttatgta atgaaaccga cgttacctat tcgtcgcgat
    16021 agcccgaaaa aggcaatcac cttgattctg gcagtgctgc taggcggtat ggtgggcgcg
    16081 gggattgtgt tggggcgtaa cgctctgcgt aattacaacg cgaagtaatc tttgcagctt
    16141 taaagaaaac gggcagggtg gtgacacctt gcccgttttt ttttgccgga tgcgacaaca
    16201 acatcgcatc cgcttacccc gcaactcact gatgccgttt acgcaggttc tcaattaccg
    16261 tcgttaaatc cagatcctga tcctgcaaca gcaccagcag gtgatacatc aagtcagatg
    16321 cctcgttggt cagctcaaag cggtcatgta ccgttgctgc cagtgcggtt tccacgcctt
    16381 cttcacccac tttctgcgca atgcgcttgg tgccgctggc atacagtttg gcggtgtagg
    16441 aggtttccgg gtcggcagat ttgcgttcgg cgagcagttg ttccagttga tacaggaaca
    16501 gccactggtg agcggtgtcg ccgaagcagc tgctggtgcc tttgtggcag gtcgggccga
    16561 taggattcgc cag
//