LOCUS       AB811618               16901 bp    DNA     linear   BCT 13-MAY-2015
DEFINITION  Escherichia coli DNA, O-antigen biosynthetic locus, strain: P11a.
ACCESSION   AB811618
VERSION     AB811618.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1
  AUTHORS   Iguchi,A., Iyoda,S., Kikuchi,T., Ogura,Y., Katsura,K., Ohnishi,M.,
            Hayashi,T. and Thomson,N.R.
  TITLE     A complete view of the genetic diversity of the Escherichia coli
            O-antigen biosynthesis gene cluster
  JOURNAL   DNA Res. 22 (1), 101-107 (2015)
   PUBMED   25428893
  REMARK    DOI:10.1093/dnares/dsu043
REFERENCE   2  (bases 1 to 16901)
  AUTHORS   Iguchi,A., Iyoda,S. and Ohnishi,M.
  TITLE     Direct Submission
  JOURNAL   Submitted (29-MAR-2013) Contact:Atsushi Iguchi University of
            Miyazaki, Faculty of Agriculture; Gakuen-kibanadai-nishi 1-1,
            Miyazaki, Miyazaki 889-2192, Japan
FEATURES             Location/Qualifiers
     source          1..16901
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /strain="P11a"
                     /db_xref="taxon:562"
                     /note="serogroup:O42"
     gene            557..1948
                     /gene="wcaM"
     CDS             557..1948
                     /gene="wcaM"
                     /codon_start=1
                     /transl_table=11
                     /product="colanic acid biosynthesis protein"
                     /protein_id="BAQ00906.1"
                     /translation="MDKKFSRRRFLSAGATLAAIPLLHSPAVRALGRNDAVDIRNYLV
                     GNDWIRAFRQAFDDADIIDVPKGVICDNINTGIIMPPGKTLQVNGSLKGNGRGRFALQ
                     DGCKVVGEGSLNNITLDVRGSDCTIEGLAMSGFGPVAQIYIGGKQKRTMRNLTITRIN
                     ISQANYGILRQGFHNQLDGVKITHSKFSYLQGDAIEWNVAINDKNILISDHVIDHIDC
                     TNGKTNWGIGIGLAGSTYDNNYPEHQAVKNFVVANITGSHCRQLVHVENGKHFIIRNI
                     KARNITPEYSKKAGIDNATVAIYGCDNFVIDGVDMVNSAGMLIGYGVIKGKYLSIPQN
                     FRINNVRMDNRQLTLKLRGIQISSGNAPSFVALTNLDLNHASLEIHNKPQYIFMRNIK
                     VIQPAARGPALQLHFDLRKDVRGKFMAKQETLLSMSNIHAVNENGQRSVDIDRIDQHV
                     VNVDALNFTLPKR"
     gene            2083..2988
                     /gene="galF"
     CDS             2083..2988
                     /gene="galF"
                     /note="O042_01"
                     /codon_start=1
                     /transl_table=11
                     /product="UTP-glucose-1-phosphate uridylyltransferase"
                     /protein_id="BAQ00907.1"
                     /translation="MDTIMVNLKAVIPVAGLGMHMLPATKAIPKEMLPIVDKPMIQYI
                     VDEVVAAGIKEIVLVTHASKNAVENHFDTSYELEALLEQRVKRQLLAEVQSICPPGVT
                     IMNVRQAQPLGLGHSILCARPIVGDNPFVVVLPDIILDGASADPLRYNLAAMVARYNE
                     TGRSQVLAKRMPGDLSEYSVIQTKEPLTVEGKVSRIVEFIEKPDQPQTLDSDLMAVGR
                     YVLSADIWAELEKTAPGAWGRIQLTDAIAELAKKQSVDAMLMSGDSYDCGKKMGYMQA
                     LVQYGLRNLKEGAKFRKGIEKLLSE"
     CDS             3316..3711
                     /note="O042_02"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycerol-3-phosphate
                     cytidyltransferase"
                     /protein_id="BAQ00908.1"
                     /translation="MKKIITFGTFDVFHVGHVNILERAASLGDYLIVGVSSDELNYSK
                     KQRYPIYSQEDRTKIISSLKFVNEVFIEESLEKKLEYIKTYNADILVMGDDWAGRFDW
                     VKSDCEVIYLPRTPSISTTEIIEVVKSIR"
     gene            3722..4951
                     /gene="wzx"
     CDS             3722..4951
                     /gene="wzx"
                     /note="O042_03"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen flippase"
                     /protein_id="BAQ00909.1"
                     /translation="MKLKQNVLFGNIAALAILQLATYITPLLIVPYLTRVLGPGGYGT
                     VAICLSIIQMSLILTDFGFNLSSTEYIARNCQSKDKINKHIGAVFQIKILLIFLCVIF
                     LYFLVNDQLQQFKIEFFFYSCIAIIGQTFQSLWFFQGVEKMKRITLFLTISKFSYVIL
                     TFVIVKKPEQGRFVILAYALSQVIGALLSQYYMRKEGYKYTPANLSSMLGVLRTSALF
                     FWSRLAVSTYTTASTLVVGAAGHVQAGYYAASEQLYKAGQNITTPVSQALYPYMTRAK
                     NWALFFKMMSILTVVMITASLTAIWLSQWLIALIFGPEYIVSQNVFIVFMLALIVTFV
                     STNFGYPVFSALGKVKVANYTVIFGALTHVVILGVLFCLGEISAYNVVRAVLFTEIVI
                     LILRMFFFVKLYRREVK"
     CDS             4948..6126
                     /note="O042_04"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycerophosphotransferase"
                     /protein_id="BAQ00910.1"
                     /translation="MIIKKVISKLFGLFFCALDYVWKKQDINIFGAGRGSRYFDNSKT
                     LFEYYISQGDRAYWFYTGKKPDVVGISPDAFVQANSLYGMLIALRAKKAFACYGSLDF
                     WLYRFSRKTVSVQLWHGIPIKKVFFGEKNLTQRKKLQYLFEISAFQYFIVSSKLEQYI
                     ISAQTGMHLDRVKVLGYPRNDNLFKSANEVIIPEVVALNSNFKKVVLFAPTFRNNDYS
                     VFSSFNDDEWNVFFDFLKTENFLCIFRAHAVEFLQNNDDNAKRLSKYSSNVIFLGQDK
                     YQDAQDLMVYSDILISDYSGMIPDYLLLDKPIIRFIFDEQQYDNERGVNFLQKNLPIG
                     SAAYNMPTLIEALRQCVESTEESVAVNAFAKKMYHDNLCGKYSEKIYNYFNSLSQGKV
                     "
     gene            6123..7502
                     /gene="wzy"
     CDS             6123..7502
                     /gene="wzy"
                     /note="O042_05"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen polymerase"
                     /protein_id="BAQ00911.1"
                     /translation="MKQARIKPFSYLSLSFFVLFLIFLNISAVSFDEYLTDLQYSYAY
                     VLFAISLVAVYYAQGESYTSLGFLFNTCLFLFIGGRFIATTFGIDSESVFTLDFMTTY
                     IPTSDEKLEIYTRVVSFQIFLNLGYLFLRKEDSLLNLNKNDNSLPGRLLFLIVIVLFL
                     LCLVEQYSMLSKAMSEGYLARYGDQAESYDAGAAFKYTLLFVFTGLLFATCKKKYIII
                     NFMIYMTLATIIILIGARGAFVSTILMGVWLYGLNKKISLKKLSIIFLSLAGILLIIM
                     NFSARGNYYSNELIDSLLRFLYDQGNTLAVVGYVRTITDYPVFAYISTFLPGSSFFAS
                     MFHGGSDLNSYMLSFPAYANYVANPNMYFAGYGLGWSIISSVEMFSADILFIFCIFSV
                     LIGMFLKFANEQAKRNSFWFGAVACLCAKILFTARADIKTIIPLFMYYAIMYLIISTA
                     MRILRQRYG"
     CDS             7495..8505
                     /note="O042_06"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyltransferase"
                     /protein_id="BAQ00912.1"
                     /translation="MDNRDVMFSVIVPCYNVVSHINETVASLNKAIDSACTTVEVIFV
                     NDGSTDKTLDVLNEICSNKPSYRVIDQENGGVSNARNTGIRESTGKYILFLDSDDTYK
                     NNIFSILSNISFSDDIVFFSYEKIDQSGNTRVYTIPNSYMAENSITVLKDLFSKKIYL
                     NICALAVNRDCIFQNNIFFDESIQHCEDLQFIIKMITYSKSFQFINEPLFTYNYTPGS
                     AVNSKVDEKHYSKFIAFENMRDVFIKNDKYKELIPAYDFYVATVYLLLLKTIVSNGVV
                     NNKQLSKFVEYSFILKRKMELPPNTMGAFVLIFNIINYIFPMKVKFLMMSFILRMNKG
                     LR"
     CDS             8502..9419
                     /note="O042_07"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyltransferase"
                     /protein_id="BAQ00913.1"
                     /translation="MSITNKTIALVIVTYNRCNLLMEMLSSIENMSVKPDIVYVIDNN
                     SSDNTSSVVTECDSRKNINIKYHNTGYNAGGAGGFYIGSKMAYEDGWDRIWLADDDIV
                     LDKECLNNAMEYDDGRTILQPMRYNMDGSCAEISAIQYDLSNPFYLRPKRKTVQNIFN
                     KNILSYDIQSIPFEGPIIPREVFNVIGFPDERFFIFNDDLDFAIRAQRAGFSIKCITN
                     AKIVRKIPFVQSVALKTWKGYFMFRNYFRVQKVYGSSPLIYLRILLVFCLALGHSLVR
                     MDINSIKMLCGALKDGLSQEFKLTEKYKP"
     CDS             9416..10486
                     /note="O042_08"
                     /codon_start=1
                     /transl_table=11
                     /product="putative acetyltransferase"
                     /protein_id="BAQ00914.1"
                     /translation="MSTTDSPNIKTSNNNFDIVRLILALVVVFSHIRDLNNINSRFFS
                     IFSGDFAVECFFVISGYLIIRSFKNNQNIRKYIFSRGMRILPMYYVSIVSFFVILFFI
                     SHLSVVEYLKEGGIRYLVFNGVFLNFIQPSLPGVFVDNPRISAVNGALWTIKVEILFY
                     IFVPFFVLFIKKINRHIIPIFIILILSSIVFKWIVTDYHQILHIPEQLVNQLPSVLSY
                     FLLGGLVNYLDLSKISKKTVFWFFIVSAFYLLLSSKTSLDLLVRPFVIAGFILPICLQ
                     RKFLISVPEKMGDLSYGIYVTHFPLVQLLIAVGLYNSFWLGFCLTFTSLFILSFISWH
                     LIEKPALRFAKSAGKNKVVRGV"
     gene            10483..11628
                     /gene="glf"
     CDS             10483..11628
                     /gene="glf"
                     /note="O042_09"
                     /codon_start=1
                     /transl_table=11
                     /product="UDP-galactopyranose mutase"
                     /protein_id="BAQ00915.1"
                     /translation="MRIAIVGAGFSGAVIARELAEHGHSVDIFEKRDHVAGNCYSKRD
                     PDTNVMVHVYGPHIFHTDDKEVWEYINKFGMFEPYVNRVKAITKGAVYSLPINLHTIN
                     QFFHKTLNPAEAKDFINSLCELFEFEPITFEQQALSFIGRDLYEAFFRTYTIKQWGLE
                     PSELPASILKRLPVRFNYNDNYFSHRYQGMPRDGYTNIISAILDHASIAVKLNTDFKK
                     NVGNEYDHVFYSGTIDGYFDYSHGRLPYRTLDFVTERHKGDYQGTAVINYCDDSEKFT
                     RITEHKYFSPWEEHSNTIIYKEYSRTCTETDSPYYPIRQVQEKELLRKYVDLANQTNN
                     VSFIGRLGTYRYLDMDVTIREALNAVKLFMKIKKENEKVPAFFTEIL"
     gene            11807..13213
                     /gene="gnd"
     CDS             11807..13213
                     /gene="gnd"
                     /note="O042_10"
                     /codon_start=1
                     /transl_table=11
                     /product="6-phosphogluconate dehydrogenase"
                     /protein_id="BAQ00916.1"
                     /translation="MSKQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVVA
                     ENPGKKLVPHYTVKEFVESLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGN
                     TFFQDTIRRNRELSAEGFNFIGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIA
                     AVAEDGEPCVTYIGADGAGHYVKMVHNGIEYGDMQLIAEAYSLLKGGLNLSNDELATI
                     FTEWNEGELSSYLIDITKDIFTKKDEDGNYLVDVILDEAANKGTGKWTSQSSLDLGEP
                     LSLITESVFARYISSLKDQRVAASKVLSGPKAELAGDKAAFVEKVRRALYLGKIVSYA
                     QGFSQLRAASDEYNWDLNYGEIAKIFRAGCIIRAQFLQKITDAYAENSGIANLLLAPY
                     FKNIADEYQQALRDVVAYAVQNGIPVPTFGAAVAYYDSYRSAVLPANLIQAQRDYFGA
                     HTYKRTDKEGVFHTEWLD"
     gene            13447..14613
                     /gene="ugd"
     CDS             13447..14613
                     /gene="ugd"
                     /note="O042_11"
                     /codon_start=1
                     /transl_table=11
                     /product="UDP-glucose 6-dehydrogenase"
                     /protein_id="BAQ00917.1"
                     /translation="MKVTISGTGYVGLSNGLLIAQHHDVVALDIIPSRVDMLNARVSP
                     IVDKEIQQYLSSGELRFSATTDKYLAYQNADYVIIATPTDYDPKTNYFNTSSVESVIQ
                     DVIEINPQAVMIIKSTVPVGFTDSVKKKYATDNIIFSPEFLREGKALYDNLHPSRIVI
                     GERSERAERFARMLQQGAIKQDIPTLFTDSTEAEAIKLFANTYLAMRVAYFNELDSYA
                     ETLGLNSRQIIEGVCLDPRIGAHYNNPSFGYGGYCLPKDTKQLLANYQSVPNNIISAI
                     VDANRTRKDFIAEAILARKPKVVGIYRLIMKSGSDNFRASSVQGIMKRLKAKGITVIV
                     YEPVMKEDEFFSSRVVRDLDAFKQEADVIVSNRMAEELTDVAEKIYTRDLFGND"
     gene            14759..15757
                     /gene="wzz"
     CDS             14759..15757
                     /gene="wzz"
                     /note="O042_12"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen chain length determinant protein"
                     /protein_id="BAQ00918.1"
                     /translation="MDVTKVYMIQDNNNGRSGYEREPEQIDLIDLLMQLWRGKLTIIV
                     CVIVAIALAVAYVFLAKEKWTSTATITRPDAAQIATYHNAINTLDSSINLSDVQNQVI
                     NRFNSAFIALTEALDNQQEPEKLTIEPSVKGQNLPLTVTYVSDTAQSAQRGVAEYIQK
                     IDEQIADELVLDLNDTIKLRVMNIKDDLENQETVAQEQKDLRIKQITESLKYAQKSNV
                     TKPQLQQTQDVTQETMFLLGTEALGAMVANEASRPLTFGAGYYGLKKNLLDIEKLKVD
                     PKTIHVYRYVMKPTLPIRRDSPKRGLTLVLAVLLGGMIGAGVVLGRNALRNYKPKA"
     gene            complement(15817..16416)
                     /gene="hisI"
     CDS             complement(15817..16416)
                     /gene="hisI"
                     /codon_start=1
                     /transl_table=11
                     /product="phosphoribosyl-AMP cyclohydrolase"
                     /protein_id="BAQ00919.1"
                     /translation="MLTEQLDWDKTDGLMPAIVQHAVSGEVLMLGYMNKEALAQTESS
                     GKVTFYSRTKERLWTKGETSGNFLNVVSITPDCDNDTLLVLVNPIGPTCHKGTSSCFG
                     DASHQWLFLYQLEQLLAERKTADPESSYTARLYASGTKRIAQKVGEEGVETALAATVK
                     DRFELTNEASDLMYHLLVLLQDQDLDLTTVIENLRKRHQ"
ORIGIN      
        1 ctcagtggcc cgcctgacgg agaaaaaagg tctgcatgta gcgattgaag cctgccgtca
       61 gttgaaagag cgcggtgtgg cgtttcacta tcgcattctc ggcatcggcc cgtgggaacg
      121 ccgcctgcgc acattgatcg aacagtatca actggaaggg tacgtggaga tgccgggctt
      181 taagcccagc catgaggtaa aagcgatgct cgatgaggcg gatgtctttc tgctgccgtc
      241 gattaccggc gcagatggcg atatggaagg cattcctgtg gcactgatgg aagcgatggc
      301 agtgggcatt ccggtgcttt cgaccgagca tagcggtatt ccggaactga tagacgccaa
      361 cgcctccggc tggctggtgg cggagaacga cgctccggcg ctggcgggca aactcagcga
      421 actgcgccat cttgatgagc cgacgctgcg cccggtgcta caacgcgccc gccaaaaagt
      481 tgaaaccgag ttcaatcagc aggtgattaa ccgccagctc gcgagcctgc tgcaaaccct
      541 ttgctattga ggttgcatgg ataaaaaatt ttcccgacgt cgcttcctgt cggcaggcgc
      601 tacgcttgcc gccatcccac tgctacacag ccccgctgta cgcgcgctgg ggcgtaatga
      661 tgccgttgat atccgcaact atctggtcgg taatgactgg atccgtgcat ttcgtcaggc
      721 gtttgacgat gccgatatta tcgacgtccc caaaggcgtg atttgcgaca atattaatac
      781 cggcatcatc atgccaccgg gtaaaacgct gcaggtaaac ggcagcctga aaggcaatgg
      841 tcgtgggcgt tttgcgttgc aggatgggtg taaagtggtg ggggagggga gtctcaataa
      901 tattactctc gacgtgcgcg gatctgactg caccatcgaa ggtctggcga tgagcggctt
      961 tggcccggtg gcgcaaatct acatcggcgg caaacaaaaa aggacgatgc gcaatctcac
     1021 catcacgcgg attaatatca gccaggctaa ctacggtatt ttacgccagg gtttccataa
     1081 tcaactcgac ggcgtaaaaa tcacccacag taaatttagc tacctgcagg gtgatgccat
     1141 tgaatggaac gtcgcgatta acgacaagaa tatcctcatc tccgatcatg tgattgacca
     1201 tatcgattgc accaatggca agaccaactg gggtattggc attgggcttg cgggcagcac
     1261 ctacgataac aattacccgg agcaccaggc ggtgaaaaac tttgtcgtcg ccaatatcac
     1321 cggcagccac tgccgacagt tggttcacgt cgaaaacggt aaacacttta ttatccgtaa
     1381 tattaaggca cgaaatatca ccccggaata cagtaagaaa gccggaattg ataacgctac
     1441 ggtagcaata tatggatgtg ataatttcgt tatcgatggt gtggatatgg ttaatagcgc
     1501 gggcatgcta attggctatg gtgttatcaa agggaaatat ctgtcgatac cgcagaattt
     1561 caggataaat aatgtgcgga tggataatcg acaattaacg ctaaagctgc ggggaataca
     1621 gatttcatcg ggcaatgcgc cctcgtttgt tgcgcttacc aacctcgatc tgaaccatgc
     1681 gtcgctggag atccacaaca agccgcaata catatttatg cgtaatatca aggtgataca
     1741 gcctgcggcg cgcgggcccg cactacagct ccacttcgac ttacgcaagg atgttcgcgg
     1801 gaagtttatg gccaaacagg agacgctgct ctcgatgtca aatattcatg cggtcaatga
     1861 aaacggccag cggtctgtgg atattgaccg tattgatcag cacgttgtca atgtcgatgc
     1921 gctgaatttt accctgccta aacgctgaat ttttagccga acccacctct tcagacgcat
     1981 tctcggattg tatccagaga tttagcggta tttacccgat actatgagaa aacatagtgg
     2041 atcaaacaac gttaatagct ataattcatc aaccgtatat aggtggacac gataatggtt
     2101 aatttgaaag cagtcattcc ggtagccggg ctgggcatgc atatgctccc tgccaccaag
     2161 gccattccta aagagatgct accgatcgtt gacaagccga tgatccaata catcgtcgac
     2221 gaagttgttg ctgcagggat caaagaaatc gtcctggtca cccacgcctc caaaaatgcc
     2281 gtggaaaacc acttcgacac ctcctatgaa ctggaagctc tgctggagca acgcgttaag
     2341 cgtcagctgc tggcggaagt tcagtccatt tgcccgccgg gcgtaaccat catgaacgtg
     2401 cgacaggcgc agccgctggg cctgggccac tccattttgt gcgcgcgtcc gatcgttggc
     2461 gataacccgt ttgtggttgt tctgcctgat atcattctcg atggcgcatc cgctgaccca
     2521 ttgcgttata acctcgctgc gatggtggca cgttataacg aaacaggccg cagccaggtg
     2581 ctggcgaaac gtatgccggg cgatctttct gagtactcgg ttattcagac taaagagccg
     2641 ctgaccgtag aaggtaaagt gagccgtatc gttgagttca tcgaaaaacc agaccaaccg
     2701 caaacgctgg attccgacct gatggccgta gggcgctatg tgctttccgc cgacatctgg
     2761 gccgaactgg aaaaaaccgc gccgggtgcc tggggacgta ttcagttgac ggatgctatc
     2821 gccgagctgg cgaagaaaca gtccgttgac gcgatgctga tgagcggcga cagctatgac
     2881 tgcggtaaga aaatgggtta catgcaggcg ttagtccagt atgggctgcg caacctgaaa
     2941 gaaggggcga agttccggaa agggattgag aaactgcttt cagaataaga cactacgcaa
     3001 caacacggaa tgttggtgat gtaacagaac ggcagatgat tgtggttgag gaactctcat
     3061 ttcacagcag ttgccgtttt tgcttttaaa aacaacaact aaaattagtg attgcgcggt
     3121 gttttttgat aaaaaatgcc ggatttctcc ttgtcttaca cagggattgc gcccaaaata
     3181 gtgggctaaa ttggtgggcg agattcgatg caaacgtgaa ggtttgtggg ggctggtcca
     3241 cgacatactg aattttgtgc agtgcactgg tagctgttga gccaggggcg gtagcgtgaa
     3301 tattatgaga gagctatgaa gaaaattata acctttggga cttttgacgt tttccatgtt
     3361 gggcatgtga atattcttga aagggctgcc agtcttggcg actatctaat agttggcgtc
     3421 tcttctgatg agttgaatta ttcaaaaaaa caacgctatc ctatttattc tcaagaagat
     3481 cgaaccaaaa ttatttcatc actaaagttt gtcaatgaag ttttcataga agaatccctt
     3541 gagaaaaagc tcgagtacat taaaacatat aacgcggata ttcttgttat gggggatgat
     3601 tgggctggga gattcgattg ggtgaaaagt gattgtgaag ttatttatct gcctcgaaca
     3661 ccatctatat cgactactga aattatagaa gtcgtcaagt ctattaggta gggcaggtag
     3721 attgaaactt aagcagaatg tattgtttgg taatattgcg gcgctggcga tattacaatt
     3781 agctacatat atcacgcctt tgttaattgt cccttatctt actcgagtgt taggtccggg
     3841 aggctatggc actgttgcaa tttgtttgtc aataattcag atgtcactaa tattgactga
     3901 ctttggtttt aatcttagtt ctacagaata tatagcaaga aattgtcaat ctaaagataa
     3961 aataaataaa catattggtg cagtttttca aattaaaata ttattgattt ttctgtgtgt
     4021 gatttttctt tattttttag taaatgacca attgcaacaa tttaaaatag agtttttctt
     4081 ttattcatgc attgctatta ttgggcaaac atttcaatcc ctatggtttt tccaaggggt
     4141 agaaaagatg aagcggatta cacttttttt aactatatca aagttttcat atgttatcct
     4201 gacttttgta attgtaaaaa aaccagagca aggacgattt gtcattcttg cttatgcatt
     4261 atctcaagtc attggcgcat tattatctca atattacatg cgtaaagaag gttataaata
     4321 tacccctgca aatttatcca gcatgttggg ggttttacgt accagtgcat tattcttttg
     4381 gtcccgactt gctgtctcca catatacaac tgcgagcaca ttggtcgtag gagctgcagg
     4441 acatgtgcaa gctggttatt atgctgccag cgaacaactg tataaggcag gtcaaaatat
     4501 aacgacccca gtcagccagg cattatatcc ttatatgaca cgggcaaaaa attgggccct
     4561 gttttttaaa atgatgtcta ttcttacggt tgtgatgatt accgctagcc taactgctat
     4621 ttggttaagt cagtggctga ttgctttaat ctttggtcca gaatatatag ttagccagaa
     4681 tgtattcata gttttcatgc ttgccctaat agtcacattt gtaagtacaa attttgggta
     4741 ccctgtattt tccgcgcttg ggaaagttaa agttgcaaat tacactgtta ttttcggtgc
     4801 tttaacgcat gtagttattc tgggtgtttt gttttgtttg ggtgaaataa gtgcctataa
     4861 cgtagttagg gctgtattat ttacagaaat agtcatattg atattgcgaa tgttcttctt
     4921 tgtgaagtta tacaggcgag aagtaaaatg ataattaaaa aagttatatc caaattattt
     4981 ggcttgtttt tttgtgcgct ggattacgtt tggaaaaaac aagatataaa tatatttgga
     5041 gcaggtagag gctctcgtta ttttgataac tcgaaaacac tctttgagta ttatatatct
     5101 caaggtgatc gagcctactg gttctacaca ggaaagaagc cagatgttgt tggaatctct
     5161 cctgatgcat ttgtacaggc taacagtttg tatggaatgt tgattgcatt acgtgcaaaa
     5221 aaagcattcg catgttacgg ttctttagat ttttggctat ataggttttc tcgtaaaaca
     5281 gtatccgttc aattatggca tggcataccc atcaaaaagg ttttctttgg tgagaaaaat
     5341 ttaacgcagc gtaaaaaact tcagtattta tttgagattt cagcttttca gtatttcata
     5401 gtatcctcaa aacttgaaca gtatattatt tcagctcaaa ccgggatgca tctggatcga
     5461 gttaaggtct taggttatcc caggaatgat aatttattta aatcagcaaa tgaagtgatt
     5521 atccctgaag tagttgcatt gaacagtaat ttcaaaaaag ttgttttatt cgcaccaaca
     5581 tttaggaata acgattattc tgtatttagt tcatttaatg atgatgaatg gaatgttttt
     5641 ttcgatttct taaaaacaga gaattttctt tgtatctttc gagcgcatgc tgttgagttt
     5701 ctccaaaata atgatgataa cgctaaaaga ttgtctaaat actcaagtaa tgtcattttt
     5761 cttgggcaag acaaatatca ggatgcacag gatttaatgg tttacagcga tattctgatt
     5821 agtgactatt ccggtatgat tccagattac ttgctactgg ataaacctat catcagattt
     5881 atttttgatg agcagcagta tgataacgag cgtggcgtta actttttgca aaaaaatctg
     5941 cctataggct cggccgcgta caatatgccg acattaatag aagcattgag acaatgtgta
     6001 gaaagcacag aagagtcggt ggcagtaaat gcgtttgcaa aaaaaatgta tcacgataat
     6061 ttatgtggga aatattcaga aaaaatatat aactatttta attctttatc acaggggaag
     6121 gtatgaaaca agcaagaata aagcctttct catatttatc attatctttt tttgtgttgt
     6181 tcttaatttt tttaaatatt tcagcagttt cattcgatga gtatctgaca gaccttcaat
     6241 attcatacgc ctatgtgctg tttgctatat ctcttgtggc ggtctactac gctcaaggtg
     6301 agtcttatac gagtcttggt ttcttgttta atacctgttt atttttgttc ataggcggtc
     6361 gttttattgc gacaacgttt ggaatagaca gtgagtcggt gtttacttta gatttcatga
     6421 ctacatatat accaacatcg gatgagaaat tagaaatata cacaagagta gtatcatttc
     6481 aaatattttt aaatttgggc tatttgtttt tacgtaagga agatagttta ttaaatctga
     6541 ataaaaatga caattcactt ccgggtcgtc ttttattttt aattgttata gtgctgtttt
     6601 tattatgcct tgtggaacaa tactcaatgc tgtcgaaagc tatgtctgag gggtacctgg
     6661 ccagatatgg cgatcaagcc gaaagttatg atgcaggggc tgcatttaaa tatacgctgc
     6721 tttttgtttt tacaggctta ttatttgcta catgtaaaaa gaagtacatt attataaatt
     6781 tcatgattta tatgaccctg gctactatca ttatactaat tggtgcacgg ggagcatttg
     6841 tatcaaccat actaatgggg gtatggttat acggtttaaa taagaaaata agtttaaaga
     6901 aactttccat tattttcttg tcgttggccg gaatactttt aattatcatg aatttttctg
     6961 cacgtggcaa ttattattca aatgaactca tcgattcttt attgcgtttc ctctatgatc
     7021 agggtaatac acttgctgtg gtgggttatg taagaaccat taccgattat ccagtgttcg
     7081 catatatttc aacatttttg cctggaagtt cattctttgc atcaatgttt catggtggaa
     7141 gtgatttaaa tagctacatg ctaagttttc ccgcttatgc aaactatgtt gctaatccaa
     7201 atatgtattt tgctggatac ggcctgggat ggtcaatcat cagttctgtg gaaatgttct
     7261 ccgccgatat cttattcatt ttttgcattt tttcggtcct tattggtatg tttttaaagt
     7321 ttgctaatga acaggcaaaa aggaatagtt tctggtttgg ggctgttgcg tgtttgtgtg
     7381 cgaaaatttt atttacagct cgtgctgata tcaaaacgat aattccacta tttatgtatt
     7441 atgcaataat gtatctaatt ataagcactg ctatgcgaat tttgaggcaa agatatggat
     7501 aatagggatg taatgttttc ggttatagtt ccatgctata acgtggtttc gcatataaat
     7561 gagactgtag cttcacttaa taaagctatc gattcggcct gtaccacggt cgaagtcatt
     7621 tttgttaatg atggctctac agataaaaca ttggatgttt taaacgaaat ctgcagtaac
     7681 aaaccatcat atcgtgttat tgatcaggaa aatggtggtg tctcaaacgc aaggaataca
     7741 ggaataagag agtctacagg gaaatatatt ctctttctgg attcagatga tacatacaaa
     7801 aataatatat tttcgatttt atcgaacata tcattttcag atgatattgt tttctttagc
     7861 tatgaaaaga tagaccagag cggtaatacg agggtttata ctattccaaa ctcttatatg
     7921 gccgagaatt caattactgt attaaaagat ctttttagta aaaaaatcta tttaaatatt
     7981 tgtgcgctag ctgtaaatag ggattgtata tttcagaata atattttttt cgatgaaagt
     8041 attcaacatt gtgaggatct tcaattcatc attaaaatga ttacttattc aaaatcattc
     8101 caattcataa atgaaccttt atttacctat aattacactc ccggttctgc tgttaatagc
     8161 aaggtagatg agaaacatta ttcaaaattt attgcctttg agaacatgcg cgatgttttt
     8221 ataaaaaatg ataaatataa agagttaatc ccggcgtacg atttttacgt tgcaacagta
     8281 tacttattac tacttaaaac gattgtctca aatggtgtgg ttaacaacaa acaactaagt
     8341 aagttcgttg aatattcttt tatcctcaag agaaaaatgg aattaccacc aaatacaatg
     8401 ggtgcttttg ttttgatatt taacataatt aattatattt ttcctatgaa agtaaaattt
     8461 ttaatgatgt catttatctt acggatgaat aaaggtttaa gatgagtatt acaaataaaa
     8521 caattgcgct ggtcattgta acatataata gatgtaacct tttgatggaa atgctttcct
     8581 ctatcgaaaa catgagtgtt aagcctgata ttgtctatgt tatagacaat aacagtagtg
     8641 ataatacttc atcggttgtc acagagtgtg attcaagaaa aaatattaat ataaaatatc
     8701 acaacactgg atataacgct ggaggtgctg gcggctttta tatcggcagt aaaatggctt
     8761 atgaagatgg ttgggataga atttggcttg cggatgatga cattgttttg gataaggagt
     8821 gtcttaataa cgcaatggag tatgatgatg gacgcactat cttacaacct atgcgttata
     8881 atatggacgg atcctgtgcc gaaatttcag ctatccagta cgatttaagt aatccttttt
     8941 atttacgtcc aaaacgcaag acggttcaga atattttcaa caaaaatatt ctgtcatatg
     9001 atatccaatc cattccgttt gaaggaccga ttattcccag ggaagtattt aatgtcatag
     9061 gttttccaga tgaacgtttc tttatattta atgacgattt agattttgcg attagagctc
     9121 agagagctgg cttcagcata aaatgtatta ctaacgcaaa aatcgtacgt aaaattccct
     9181 ttgtacagtc ggtagcatta aaaacatgga agggctattt catgtttaga aattattttc
     9241 gggttcagaa agtttatggt tcaagcccac ttatttatct gagaattttg ctcgtgttct
     9301 gccttgcact gggacattca ctcgtgcgta tggatatcaa ttcaattaag atgctgtgcg
     9361 gtgcgttgaa agatggtctc tctcaagaat ttaagctgac tgagaaatac aaaccatgag
     9421 tactaccgat agccctaata taaaaacatc aaataacaat tttgatatag taaggctcat
     9481 tcttgcgtta gttgttgttt tctcacatat aagagattta aataatatta attcccggtt
     9541 cttctccatt ttctcaggtg actttgccgt agaatgcttt ttcgtaatta gcggttattt
     9601 gatcattaga agctttaaaa ataatcaaaa tatcagaaaa tatatttttt cgagggggat
     9661 gagaattctc cctatgtact acgtttctat agtatccttt ttcgttatat tattttttat
     9721 ctctcacctt tccgttgttg aatatttaaa ggaaggcgga attcgatatt tagtatttaa
     9781 tggagtattc ctcaatttca tccagccttc gctgccggga gtgttcgttg ataatcctcg
     9841 aatctctgcg gttaatgggg ctctttggac tataaaagtt gagatcctat tctatatatt
     9901 tgttccattc tttgtcctgt tcattaaaaa aatcaatcga catattattc ctatatttat
     9961 aattcttatt ttatcgtcta ttgtattcaa gtggattgtt acagactatc atcaaatttt
    10021 acatattcct gagcaactgg ttaatcagtt accgtcggtg ctaagttatt ttctattagg
    10081 cggcttggtt aattatctgg atctatctaa gatatcaaaa aaaacagtat tttggttttt
    10141 tatagtatca gctttttatc ttttactaag tagtaaaacg tcattggatt tacttgttcg
    10201 cccatttgtt attgcagggt tcatactgcc gatatgtttg cagcgtaaat ttttaataag
    10261 tgtgcctgaa aaaatgggtg acctttcgta tggtatatat gtaacacatt tccctcttgt
    10321 tcaattacta attgcagtag ggttgtataa ttcattttgg ttaggttttt gtttaacatt
    10381 tactagtctt tttattttgt cttttattag ttggcatctt attgagaagc cagctcttcg
    10441 ttttgctaaa tctgcaggaa aaaataaagt tgtgaggggt gtatgagaat tgctattgtt
    10501 ggtgctggat ttagtggtgc agttatagcc agggaattgg ctgaacatgg tcactcagta
    10561 gatatctttg agaaaagaga ccatgttgct ggtaattgtt atagtaaaag agacccagac
    10621 acaaatgtta tggttcatgt ttatggcccg catattttcc atacggatga taaagaagta
    10681 tgggaatata tcaataaatt cggaatgttc gagccatatg ttaatagagt caaggccata
    10741 actaaaggcg cggtttattc cctgccaatc aatctccata caattaacca gtttttccac
    10801 aaaactctga accctgctga agcgaaagac ttcataaatt ctttgtgtga actattcgaa
    10861 tttgagccga ttacattcga gcagcaggct ttatcattta ttggtcgaga cttgtacgag
    10921 gcatttttta gaacgtatac cattaaacaa tggggtcttg aaccttcaga gcttcctgcc
    10981 agtattttga aacggctacc agttagattt aattataacg ataactattt cagccatcgt
    11041 tatcagggta tgccacgtga tggatatact aatataatta gtgccatttt ggaccatgca
    11101 agtatcgctg tgaaattaaa cactgatttc aaaaaaaatg tcggcaatga atatgatcac
    11161 gtgttttata gcggcacgat tgacggttat tttgactact cccatggccg ccttccttac
    11221 aggactctag attttgtcac ggaaagacat aaaggtgatt atcaaggaac cgctgtaatt
    11281 aactattgtg atgatagtga gaaatttact cgtattactg aacacaaata tttttcccct
    11341 tgggaagagc acagcaatac aataatctat aaagaataca gccggacatg tactgagact
    11401 gattctccct actatccaat tcggcaggtt caggaaaaag aattactaag aaagtatgtt
    11461 gatttagcaa atcaaacaaa caatgtttca tttattgggc gtttaggtac gtacagatat
    11521 cttgacatgg atgtaactat tcgtgaggca ctaaatgctg taaaactctt tatgaaaata
    11581 aaaaaggaga acgaaaaagt tccagcattt ttcacggaaa tactgtgaag atataatttc
    11641 tgctccgaga tacataatgt cgatagtatt agtaatggtg agcattgtta tttattgtca
    11701 gtttgacagc actcttggct atccagattt gttggatatg agttaatatc acaccacatt
    11761 caagccgcgc atatctcgcg gtgaccacac ctgacaggag tatgtaatgt ctaagcaaca
    11821 gatcggcgta gtcggtatgg cagtgatggg gcgcaacctg gcgctcaaca tcgaaagccg
    11881 tggttatacc gtctccatct tcaaccgctc ccgtgaaaag acagaagaag ttgttgccga
    11941 aaatccaggc aagaaactgg ttcctcatta cacggtaaaa gaattcgtcg aatctcttga
    12001 aaccccgcgt cgtatcctgt tgatggtgaa agccggtgcg ggtaccgatg ccgctattga
    12061 ttctctgaaa ccgtatctgg ataaaggtga catcatcatt gatggtggta atactttctt
    12121 ccaggacacc attcgtcgta atcgcgagct gtcggctgaa ggctttaact tcatcggtac
    12181 cggtgtttcc ggcggtgaag agggcgcgct gaaaggccca tctatcatgc ctggtggtca
    12241 gaaagaagcc tatgagctgg ttgccccaat cctgaccaaa atcgctgctg ttgcggaaga
    12301 tggcgaaccg tgcgtgacct atattggtgc cgatggtgcg ggtcactatg tgaaaatggt
    12361 tcacaacggt atcgaatacg gcgacatgca gctgatcgca gaagcgtact ctctgctgaa
    12421 aggtggcctg aacctctcta acgacgagct ggcgactatc ttcaccgagt ggaacgaagg
    12481 cgaactgagc agctatctga tcgacatcac caaagacatc ttcaccaaga aagatgaaga
    12541 cggtaattat ctggttgatg tgattctgga tgaagccgct aacaaaggta ccggtaaatg
    12601 gaccagccag agctccctgg atctcggcga gccactgtcc ctgatcaccg agtctgtatt
    12661 cgcgcgttat atctcctctc tgaaagatca gcgtgttgca gcgtctaaag tgctttctgg
    12721 cccgaaagcg gaactggctg gcgacaaagc ggctttcgtt gagaaagttc gccgcgcgct
    12781 gtatctcggt aaaatcgttt cttacgcgca gggcttctct cagctgcgtg ccgcgtctga
    12841 cgaatacaac tgggatctga actacggtga aatcgcgaag atcttccgtg cgggctgtat
    12901 tattcgtgca cagttcctgc agaagatcac cgatgcctat gctgaaaata gcggtatcgc
    12961 aaacctgctg ctggcaccgt acttcaagaa tatcgctgat gagtatcagc aggcgctgcg
    13021 tgacgtggtt gcctacgctg tacagaacgg tattccggtt ccgaccttcg gcgctgcggt
    13081 tgcctactat gacagctacc gttcagcggt actgccggct aacctgattc aggctcagcg
    13141 tgactacttc ggtgcacata cctataaacg tactgataaa gaaggcgtat tccataccga
    13201 atggttggac taatcctaaa taaataatgg aagcccggcg atgccgggct tttttttgcg
    13261 ctcaattctt attgcattat ggtcctgtct taatattaac ttaatatcga tggtttattc
    13321 tctctgaaga aagtccgaat tgtttgtaat tctattgcag tgaatgcgct tacgagttaa
    13381 aaaaatttta aacgtattga tgtgatatca cattataaat aattaagttt attctgagag
    13441 agtacaatga aagttaccat ctctggtaca ggctatgtcg gcctctcgaa cggcctgctg
    13501 atcgcgcaac accacgacgt cgtggcgttg gacatcattc cttcacgtgt ggatatgctc
    13561 aacgcgcgtg tatcacccat tgttgacaaa gagatccaac agtacctgag ctcaggcgag
    13621 ttgcgtttct ccgcaactac tgacaaatac ctggcttatc agaatgctga ttacgttatt
    13681 atcgcgacgc caacggatta cgaccctaaa actaactatt ttaatacgtc cagcgttgag
    13741 tcggttattc aggatgtcat tgagattaat ccgcaggccg ttatgattat caaatcaacg
    13801 gtgccggttg gttttacgga ttcggtgaag aaaaaatatg ccactgataa tattattttc
    13861 tcgccagagt ttttgcgtga aggtaaagcg ttgtacgaca accttcaccc ctcgcggatc
    13921 gtgattggtg agcgttcaga gcgcgcagaa cgttttgccc gaatgctcca gcagggcgct
    13981 attaagcaag acatacctac gctgtttacc gattcgacgg aagcagaggc gattaaactc
    14041 tttgccaaca cctatctggc aatgcgtgtt gcttacttta acgagctgga tagctacgcg
    14101 gaaacgttgg ggctcaattc ccgccaaatc atcgaaggtg tctgtctgga tcctcgcatc
    14161 ggtgctcact acaacaaccc ttcctttggt tatggtggct attgcctgcc gaaggatact
    14221 aagcaactgc tggcgaacta ccagtcggtg cctaacaaca ttatctctgc cattgtcgat
    14281 gcgaaccgga cgcgcaaaga ttttatcgct gaggcgattc tggcgcgtaa gccgaaagtg
    14341 gtcggtatct atcgcctgat tatgaaaagc ggctccgata atttccgtgc atcctccgtg
    14401 cagggcatca tgaaacgcct gaaagcgaag gggataacgg tgattgtgta cgaaccggtg
    14461 atgaaagagg atgaattctt cagctcacgt gtcgttcgcg atctggatgc cttcaagcaa
    14521 gaagcggatg ttatcgtttc taaccgtatg gccgaggagt taaccgacgt agcagaaaaa
    14581 atctacacgc gcgatctttt tggcaacgac taatctaaat ttttgacaag ctgaatgcct
    14641 gacaagacgg gcgttcagcc ttttttctga ttcttttcag gtttctctgt ttttggtgaa
    14701 aatcctatag aaattcggat tggtccaggt aaactgatgc cctcgtgggt atttcagttt
    14761 ggatgtcact aaggtttata tgattcaaga taacaataat gggcgcagcg ggtatgagcg
    14821 tgagccggag cagatcgacc ttatcgattt gttgatgcaa ctctggcgtg gcaagttgac
    14881 catcatcgta tgcgtcatcg tcgcgattgc gctcgctgtg gcttatgtct ttttagcgaa
    14941 agagaaatgg acctctaccg cgaccatcac tcgcccggat gcggcgcaga ttgcgaccta
    15001 ccataacgcc ataaatactc tggattcatc gattaacttg tccgacgttc aaaaccaggt
    15061 gattaaccgc tttaactctg catttatcgc attgacggaa gcgttggata atcagcaaga
    15121 gcctgagaaa ctgactattg agccctctgt taagggccag aatctacccc taactgtgac
    15181 ttacgtgagt gatacagcac aatccgccca gcgcggtgta gctgaataca tccagaaaat
    15241 cgacgaacaa atcgctgatg agctggtact tgaccttaat gacaccatca aattacgtgt
    15301 gatgaacatt aaggacgacc tggaaaacca ggaaaccgta gctcaggaac aaaaagacct
    15361 gcgtatcaag cagatcactg aatccctgaa atacgcgcag aaaagtaacg tcaccaaacc
    15421 gcagcttcag cagacccaag acgtaactca ggaaaccatg ttcctgttgg gcacagaggc
    15481 tctgggcgca atggttgcca acgaagccag ccgtccgctg acctttggtg cgggctacta
    15541 cggtttgaag aaaaacctgc ttgatatcga aaaactgaaa gtcgatccga aaaccattca
    15601 cgtctatcgc tacgtgatga agccgacgct gccaatccgt cgcgacagcc cgaagcgtgg
    15661 tctgacgctg gtgctggcgg tgctgctggg cgggatgatt ggtgccggtg ttgtgttggg
    15721 ccgcaacgcg ttgcgtaact acaaaccgaa agcataacgc ttacgtcaga tagcaaaaaa
    15781 ccgggctcgc ccggtttttt tacgcctgtt gaaaatttac tgatgacgtt ttcgcaggtt
    15841 ctcaatcacg gtcgttaaat cgagatcctg atcctgcagc agcaccagca ggtggtacat
    15901 caagtccgac gcttcattgg tcagctcaaa gcggtctttc accgttgctg ccagtgcggt
    15961 ttctacgcct tcttcaccca ctttctgcgc gatacgcttg gtgccgctgg catacaggcg
    16021 cgcggtgtag gagctttccg ggtctgcggt tttacgctcg gccagcagtt gttccagttg
    16081 atacaggaac aaccattggt ggctggcgtc gccgaagcaa ctggaagtgc ctttgtggca
    16141 agttggccca atcgggttga ccagtaccag cagggtgtcg ttgtcgcagt cgggcgtgat
    16201 gctgacaacg ttcaggaaat tgccggaggt ttcacctttg gtccacaggc gttctttggt
    16261 gcgcgaataa aacgtcactt tgccggacga ctctgtctgg gccagcgcct ctttattcat
    16321 atagcccagc attaatactt cgccggaaac cgcgtgttgt acgatggcgg gcatcagtcc
    16381 gtcggtttta tcccaatcca gttgttcagt taacataccc gtatctccac gccctgtgcg
    16441 gccaggtacg cttttaattc accaatatta ataatttgct tgtggaatac cgaggcggcc
    16501 agcgcgccat cgacatccgc atcgcggaag gcttcgagga agtgttccat ggtacccgca
    16561 ccgcccgagg caatcagcgg tacgtggcag acgtcacgca cttttttcag ttgcgccagg
    16621 tcgtagccat tacgcacgcc gtcctggttc atcatgttga ggacgatctc gcccgcgccg
    16681 cgtttctgta cttcctgcac ccagtcgagg gtttcccatt gggtgacgcg ggtgcggctt
    16741 tcatcgccgg tgtattgatt gacgtgatat ttgccgctgt cggcgtcaaa ccaggtgtcg
    16801 atcccgacca cgatgcactg cacgccaaaa cgatccgcca ggcgggtgat cagctccggg
    16861 tcggccagcg ccggggagtt gatggaaatt ttatctgcac c
//