LOCUS       AB811605               16391 bp    DNA     linear   BCT 13-MAY-2015
DEFINITION  Escherichia coli DNA, O-antigen biosynthetic locus, strain: P7a.
ACCESSION   AB811605
VERSION     AB811605.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1
  AUTHORS   Iguchi,A., Iyoda,S., Kikuchi,T., Ogura,Y., Katsura,K., Ohnishi,M.,
            Hayashi,T. and Thomson,N.R.
  TITLE     A complete view of the genetic diversity of the Escherichia coli
            O-antigen biosynthesis gene cluster
  JOURNAL   DNA Res. 22 (1), 101-107 (2015)
   PUBMED   25428893
  REMARK    DOI:10.1093/dnares/dsu043
REFERENCE   2  (bases 1 to 16391)
  AUTHORS   Iguchi,A., Iyoda,S. and Ohnishi,M.
  TITLE     Direct Submission
  JOURNAL   Submitted (29-MAR-2013) Contact:Atsushi Iguchi University of
            Miyazaki, Faculty of Agriculture; Gakuen-kibanadai-nishi 1-1,
            Miyazaki, Miyazaki 889-2192, Japan
FEATURES             Location/Qualifiers
     source          1..16391
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /strain="P7a"
                     /db_xref="taxon:562"
                     /note="serogroup:O20"
     gene            <1..905
                     /gene="wcaM"
     CDS             <1..905
                     /gene="wcaM"
                     /codon_start=3
                     /transl_table=11
                     /protein_id="BAQ00714.1"
                     /translation="YAILRQGFHNQIIGANITNCKFSDLQGDAIEWNVAINDSDILIS
                     DHIIERINCTNGKINWGIGIGLAGSTYDNNYPEDQAVKNFVVANITGSDCRQLIHVEN
                     GKHFVIRNIKARNITPDFSKKAGIDNATVAIYGCDNFVIDNIEMINSAGMLIGYGVIK
                     GKYLSIPQNFRVNNIQLDNTHLAYKLRGIQISAGNAVSFVALTNIEMKRASLELHNKP
                     QHLFMRNIKVMQESSVGPALSMNFDMRKDVRGVFMAKKETLLSLANVHAVNERGQSSV
                     DIDRINHHIVNVEKINFRLPERRE"
     gene            1068..1973
                     /gene="galF"
     CDS             1068..1973
                     /gene="galF"
                     /note="O020_01"
                     /codon_start=1
                     /transl_table=11
                     /product="UTP-glucose-1-phosphate uridylyltransferase"
                     /protein_id="BAQ00715.1"
                     /translation="MDEIMTNLKAVIPVAGLGMHMLPATKAIPKEMLPIVDKPMIQYI
                     VDEIVAAGIKEILLVTHASKNAVENHFDTSYELESLLEQRVKRQLLAEVQSICPPGVT
                     IMNVRQGEPLGLGHSILCARPAIGDNPFVVVLPDVVIDDASADPLRYNLAAMIARFNE
                     TGRSQVLAKRMPGDLSEYSVIQTKEPLDREGKVSRIVEFIEKPDQPQTLDSDIMAVGR
                     YVLSADIWPELERTQPGAWGRIQLTDAIAELAKKQSVDAMLMTGDSYDCGKKMGYMQA
                     FVKYGLRNLKEGAKFRKGIEKLLSE"
     CDS             2307..2678
                     /note="O020_02"
                     /codon_start=1
                     /transl_table=11
                     /product="putative phosphatase"
                     /protein_id="BAQ00716.1"
                     /translation="MNKIIVDLDGTLTEEDTNDYTKVKPKLKVVKKLYEFKKMGFSIV
                     IMTARNMRTFDGNIGKINIHTLPVIIDWLNENNIPYDEVIVGKPWCGNKGFYVDDRAL
                     RPSEFARLNLQEINELFDKDK"
     CDS             2678..4267
                     /note="O020_03"
                     /codon_start=1
                     /transl_table=11
                     /product="putative phosphotransferase"
                     /protein_id="BAQ00717.1"
                     /translation="MLLILSSAYIDIDLQSEFGRLPPSMLPLGNKRLVQHQKKLLNTN
                     ELMIITLPKSYKISEWDRKWLDNNNIKIVFVNDGGALGESVLYAIEYIKTLNISEHLR
                     ILYGDTLILSNIKDDSNVIAVSNSEDNYNWARVENQNAYIKISTENDVDILGGDILCG
                     YFSFSDIDLLRECLISNNYNFIEAIKSYHAKSFLFVRKIDEWLDFGHVNTYYKSKMKY
                     TTQRAFNELYINSDWVCKSSQDYEKILAEANWFEKIPLELKKYIPQYLGKESKNNKSA
                     SYKLEYLCHTALNELYVFSELPLTVWKSILEKCLDFVRESKSYIPSDKERFSTINELL
                     IDKTNARLVSFCSEKQFSINDKWDFKGKRISVSDILDVAAKYIPNDNNPSLMHGDLCF
                     SNILFDFRAGRIKLIDPRGLSVDRNYTIYGSYYYDLAKLSHSILGMYDWIVAGYCDAN
                     ICERKIELSFVNDKKIENIKSIFIDMITAQFDITLNELYAMQIYLFLSMLPLHSDDVQ
                     RQKALFANVFRLYELLQEIEK"
     CDS             4264..5019
                     /note="O020_04"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="BAQ00718.1"
                     /translation="MIVIPMAGMSSRFRNAGYKKPKYMLKAHGITLFSHSVSSFKSYF
                     NNEVFIFIVKDIDGSEFVKTEVKKLGILHYHIILLEQTTRGQAESVYNGLKQLQEKIM
                     ISPTESLTIFNIDTIRCNFMYPKLHERGDGYLEVFSGEGDNWSFVKPVNNESTLVIET
                     AEKKPISKLCCTGLYYFSRLQYFFEAYDLYILTPKDSWDKGELYVAPLYNILIAQKKE
                     IHYHKINVSDVFFAGVPKEYEDFCKIDYESFVG"
     gene            5025..6251
                     /gene="wzy"
     CDS             5025..6251
                     /gene="wzy"
                     /note="O020_05"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen polymerase"
                     /protein_id="BAQ00719.1"
                     /translation="MNWKIKKNVELLILFLVLNQLVIDTFNGYFIFSSQGGGNISVIY
                     KIIIFFLFLFYELVSRDRFIVAFSIVTWGVFLTFFHLLSNNYTEVVMDLSEYIKLATT
                     FIVFLGVSKFSYINPLAFIKYLSVYSFCIILFNILLSAFGVGETSYSDFGYKGFFYAA
                     NALSGVFCIVACYLMYITLKKSLTYYIICAGVLALCSFAIGTKTGIVFVAISLVTIPL
                     LMEGKKAKIRVSLLSLVGFLCALVIYADKIYTSNLVLRIVHFYEVGGWSKMLFSDRDL
                     FLKYNIDQFLNSDPVSLLIGIGYAGINAFPKPLTEIDIADITIIYGMLTTSAYISFYI
                     GILFYSNGYLKKNCPRDIIAISRYICLVLMIVSSIAGHILFNGMVTLYLGIAMALPWW
                     MANYRTRHIKGLKINV"
     gene            6244..7626
                     /gene="wzx"
     CDS             6244..7626
                     /gene="wzx"
                     /note="O020_06"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen flippase"
                     /protein_id="BAQ00720.1"
                     /translation="MFKSVGVGFLSRIISVLSNIIIIPIILKHLTPEQFSLWMLFVSF
                     YSLVIIFDFGFSATISRYVSYVLSGATLQQLQNGYYENVWLGNGGGIDYKALNELSRI
                     NKIIFYYLVLIASVFLLCIYLYYCNFVGINISKDDRIAWGLFSISILIQLASIRYNGF
                     LHGSGNVAKIYRNTICSNFVFLLFFIFFIYLQWSLVGICIARLLSSLMVFILNAISSS
                     KLTCVYPRLRCNEVKGHDNKRLFKRIRDKSFHLGIGGLGNFICNRMTIMVMTATVAIQ
                     NIAGVSFIINLSITILSISLILINNAMPELVRFRVEGAYDKLFNSFKRICFISIVFFI
                     SSYVVMVISTPYIIKITHSKVILPSNSIVLLCFCIFFIELIQSLSISFISTSNNTDFA
                     KYQIITGLSFLLICFVFSYFKWTSLVNILLVQLIVQCIYNGWKWPFVIFCEYNKVRHL
                     IRKKNDVAAK"
     CDS             7610..8668
                     /note="O020_07"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyltransferase"
                     /protein_id="BAQ00721.1"
                     /translation="MLLLSRNSLPVLKEYRGLEIKCLKNYIVDMDFFAYKDSMHIYEE
                     STVNEYISNKGWVSKRAKNHPDLGFCYNKASIDKNGSILYSKQKYVTRNNDCDFFLFD
                     YSWGHNYQHWLISSLGRLFVYCELKKYNPKLKLLIGDKMPKYKSEAITLLGISDDDLI
                     CHREVTKYRKIYTCNFNSGSGLRVSHLSYYYYEKMANLINFTDDFGRKIYIARDDSRG
                     KRPLINRSELNALMTKRGFNVVFLEELSFYEKIALFKSADIIIGDFSSGWGHIVFCKK
                     FTKLILLEHDIYKFQGFYKEIANSKCLDLKVVETKNIFRLMYLKFLKLIWTLLKDVDK
                     RANSLSWKVNIKELMDFL"
     CDS             8665..9411
                     /note="O020_08"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyltransferase"
                     /protein_id="BAQ00722.1"
                     /translation="MIKIYTINLFTENARREKILSLAKKLELPIKIENAIIGSNLSKE
                     YLDNLTNESIDKIGRNLSPGEVGCYLSHIKCLKNFLSSGDEFAIILEDDVTLDYRIKD
                     FISTIEFKETTLFFDVMLLGYRNGYGSYWGKKKWNSHKLLRFPDCGYGAHAYLVTRKG
                     AEKIVYNNAIPIWPYDYVTGGRADKTIRVYGVEKKIVDLDFYNSSCSSLEAERNYLGA
                     YSSEYKVKTPFVLYVLKKLIKGLKPIRVYK"
     CDS             9408..10463
                     /note="O020_09"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyltransferase"
                     /protein_id="BAQ00723.1"
                     /translation="MKVLIVSNMYPSIENPSLGVFVKNTEEMLVNANIDVDRAVIDRI
                     YSNSFEKVFGYFIFYLKVIYKILFCKCDIVYAHYVSHVAIPIFFVNLFKHIVVFSHVH
                     GGDVKQLKGTSAVFFKIKQALSKKIMDISKVIFSPSASYKRHIIELYSQDESKIIIFP
                     SGGIDTTLFSFGSGRKKNILGYAGRLEDSKNVDLIIKSLIDNKYNLEIVGDGKKKGQL
                     QELVSKYNLSERVIFHSSKTQKELSEWYKRVSILIYPSSSESLGLVPLEALACGTDVL
                     LSPIDAFFEFRDIGLQFEFLSELTPQAINVGIEKIISTRCFRNNMSNNIIINSVYARN
                     VVCKEFIDVFKQKCHCF"
     CDS             10432..10914
                     /note="O020_10"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyltransferase"
                     /protein_id="BAQ00724.1"
                     /translation="MYSNKNAIVFSYGAGGHSAQANRLAALLIPRLDSFYIISISDDC
                     ITPKWSHIHFVTGEVRKKNSYFDTLTNMGPIKIIQTLLKIKKYNVRCVISNGPGISVI
                     TALFFKVFGAKIIHVETWSRFVSKSLTGMAMYYIADVFYVQNKELCKIYKNAIYSGRL
                     "
     CDS             10911..11369
                     /note="O020_11"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyltransferase"
                     /protein_id="BAQ00725.1"
                     /translation="MKIFTTVGTTSFDLLIKSVDEFAATNKDNDFIFQIANGQFHPRN
                     GCYFRFENDIVHYYEWADVVITHAGAGTIYKLLEQRKKVIIVPNLVRIDKHQRDIAQY
                     MCDHHYSLVLWDLSSLSSIMKDIEKFSPAVYKKTPFFRSDEIVNFINNIR"
     gene            11406..12812
                     /gene="gnd"
     CDS             11406..12812
                     /gene="gnd"
                     /note="O020_12"
                     /codon_start=1
                     /transl_table=11
                     /product="6-phosphogluconate dehydrogenase"
                     /protein_id="BAQ00726.1"
                     /translation="MSKQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIA
                     ENPGKKLVPYYTVKEFVESLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGN
                     TFFQDTIRRNRELSAEGFNFIGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIA
                     AVAEDGEPCVTYIGADGAGHYVKMVHNGIEYGDMQLIAEAYSLLKGGLNLTNEELAQT
                     FTEWNNGELSSYLIDITKDIFTKKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEP
                     LSLITESVFARYISSLKDQRVAASKVLSGPQAQPAGDKAEFIEKVRRALYLGKIVSYA
                     QGFSQLRAASEEYNWDLNYGEIAKIFRAGCIIRAQFLQKITDAYAENPQIANLLLAPY
                     FKQIADDYQQALRDVVAYAVQNGIPVPTFAAAVAYYDSYRAAVLPANLIQAQRDYFGA
                     HTYKRIDKEGVFHTEWLD"
     gene            13061..14227
                     /gene="ugd"
     CDS             13061..14227
                     /gene="ugd"
                     /note="O020_13"
                     /codon_start=1
                     /transl_table=11
                     /product="UDP-glucose 6-dehydrogenase"
                     /protein_id="BAQ00727.1"
                     /translation="MKITISGTGYVGLSNGILIAQNHEVVALDIVQAKVDMLNKKQSP
                     IVDKEIEEYLATKDLNFRATIDKYDAYKNADYVIIATPTDYDPKTNYFNTSSVEAVIR
                     DVTEINPNAVMVIKSTIPVGFTKSIKERLGIDNLIFSPEFLREGKALYDNLHPSRIVI
                     GERSERAERFAALLQEGAIKQNIPTLFTDSTEAEAIKLFANTYLAMRVAYFNELDSYA
                     ESLGLNTRQIIEGVCLDPRIGNHYNNPSFGYGGYCLPKDTKQLLANYQSVPNNLISAI
                     VDANRTRKDFIADAILSRKPQVVGIYRLIMKSGSDNFRASSIQGIMKRIKAKGVEVII
                     YEPVMKEDSFFNSRLERDLATFKQQADVIISNRMAEELKDVADKVYTRDLFGSD"
     gene            14317..15354
                     /gene="wzz"
     CDS             14317..15354
                     /gene="wzz"
                     /note="O020_14"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen chain length determinant protein"
                     /protein_id="BAQ00728.1"
                     /translation="MAIIAKLWRLKIISSVRVMMRVENNNVSGQNHDPEQIDLIDLLV
                     QLWRGKMTIIISVIVAIALAIGYLAVAKEKWTSTAIVTQPDVGQIAGYTNAMNVIYGP
                     AVPKVSDIQASLIGRYSTAFSALAETLDNQEEAEKLTIEPTVKNQSLPLAVSYVGETP
                     EGAQKQLAKYIQQVDDQVNVELEKDLKDNIALRMKNLQDSLRTQEVVAQEQKDLRIRQ
                     IQEALQYANQAQVTKPQIQQTGEDITQDTLFLLGSEALESMIKHEATRPLVFSPNYYQ
                     TRQNLLDIESLKVNDLDIHAYRYVMKPTLPIRRDSPKKAITLILAVLLGGMVGAGIVL
                     GRNALRNYNAK"
     gene            complement(15451..16062)
                     /gene="hisI"
     CDS             complement(15451..16062)
                     /gene="hisI"
                     /codon_start=1
                     /transl_table=11
                     /product="phosphoribosyl-AMP cyclohydrolase"
                     /protein_id="BAQ00729.1"
                     /translation="MLTEQQRRELDWEKTDGLMPVIVQHAVSGEVLMLGYMNPEALDK
                     TIESGKVTFFSRTKQRLWTKGETSGNFLNVVNITPDCDNDTLLLLANPIGPTCHKGTS
                     SCFGDTAHQWLFLYQLEQLLAERKSADPETSYTAKLYASGTKRIAQKVGEEGVETALA
                     ATVHDRFELTNEASDLMYHLLVLLQDQGLDLTTVIENLRKRHQ"
ORIGIN      
        1 attacgccat cttacgccag ggatttcata accagattat cggtgccaac atcaccaact
       61 gtaagttcag cgacttacaa ggcgacgcca ttgaatggaa cgtggcaatt aacgacagtg
      121 atattttgat ctccgaccac atcatcgagc gcatcaactg tactaacggc aaaatcaact
      181 ggggcattgg cataggtctt gcgggaagca cttatgataa taattacccg gaagaccagg
      241 cagtgaaaaa ctttgtcgtg gcgaatatca cgggatcgga ttgtcggcag ttgatccatg
      301 ttgaaaatgg taaacatttt gttatccgta atatcaaagc ccgcaatatc acgccggatt
      361 tcagtaagaa agcaggtatt gataacgcga cagtcgctat ttacggttgt gataatttcg
      421 tgattgataa tattgaaatg attaatagtg ccgggatgtt aatcggctat ggggtaatta
      481 aaggcaaata tctctcgata ccacaaaatt tccgagtgaa taatattcag ctggataaca
      541 ctcaccttgc ttataaattg cgcggcatcc aaatctccgc cgggaatgcc gtctcctttg
      601 tggcgctgac taacattgag atgaagcgtg cctcgctgga gctacacaac aagccgcaac
      661 atctttttat gcgaaatatc aaagtgatgc aggaatcctc agttggacca gcattgagca
      721 tgaacttcga catgcgcaaa gacgttcgcg gcgtctttat ggcgaaaaaa gaaacactgc
      781 tatctcttgc aaatgttcat gcggtgaatg aaagaggaca aagctccgtc gatatcgaca
      841 ggattaatca ccatattgtt aatgtggaaa agattaactt tagattgccg gaacggaggg
      901 agtagatttg cgaccattcc tggaaaaatg gagccatact taggaacaat gctactgcaa
      961 tccacaacga agcggcgtaa catcacaagt aattcagtaa tcaattcagg gtaattgatg
     1021 ctggcgaaaa aaatcgaaca agctataatt cagcaaccat tttacaggtg gatgaaataa
     1081 tgacgaattt aaaagcagtt attcctgtag cgggtcttgg gatgcatatg ttgcctgcca
     1141 ctaaggcgat tcccaaagag atgctaccga tcgtcgacaa gccaatgatt cagtacattg
     1201 ttgacgagat tgtggctgca gggatcaaag aaatcctcct ggtaactcac gcgtccaaga
     1261 acgcggtcga aaaccacttc gacacctctt atgaattaga gtctctcctt gaacagcgcg
     1321 tgaagcgtca actactggcg gaagtacagt ccatttgccc gccgggcgtg accattatga
     1381 acgtgcgtca gggcgaacct ttaggtttag gccactccat tttgtgtgcg cgacctgcca
     1441 ttggtgacaa cccatttgtc gtggtactgc cagacgttgt gatcgacgac gccagcgccg
     1501 acccgctgcg ctacaacctt gctgccatga ttgcgcgctt caacgaaacg ggccgcagcc
     1561 aggtgctggc aaaacgtatg ccgggtgacc tctctgaata ctccgtcatc cagaccaaag
     1621 aaccgctgga tcgtgaaggt aaagtcagcc gcattgttga atttatcgaa aaaccggatc
     1681 agccgcagac gttggactca gacatcatgg ccgttggtcg ctatgtgctt tctgccgata
     1741 tttggccgga acttgaacgc acgcagcctg gtgcgtgggg acgtattcag ctgactgatg
     1801 ctattgccga actggcgaaa aaacaatctg ttgatgcaat gctgatgaca ggtgacagct
     1861 acgactgcgg taaaaaaatg ggttatatgc aggcgtttgt gaagtatgga ctacgcaacc
     1921 tgaaagaagg ggcgaagttc cgtaaaggca ttgagaagct gttaagcgaa taatgaaaat
     1981 ctgaccggat gtaacggttg ataagaaaat tataacggcg gtgaagattc gtggcgaaag
     2041 taatttgttg cgaattttcc tgccgttgtt ttatataaac aatcagaata acagcgagtt
     2101 agcaatagga ttttagtcaa agttttccag gattttcctt gtttccagag cggattggta
     2161 agacaattag cgtttgaatt tttcgggttt agcgcgagtg ggtaacgctc gtcacatcgt
     2221 aggcatgcat gcagtgctct ggtagctgta aagccagggg cggtagcgta tttgcttatt
     2281 tttatcgtgt aatcaaagtg attgttatga ataagataat agttgatctt gacggtactt
     2341 taactgagga agatacaaat gattatacta aagttaaacc aaaactaaaa gttgttaaaa
     2401 aattgtatga atttaaaaaa atgggattca gtattgtaat aatgacagca aggaatatgc
     2461 gaacatttga tggtaatatt ggaaagatta atatacatac acttcctgta atcattgact
     2521 ggcttaatga aaataatatc ccgtacgatg aagttattgt ggggaagcca tggtgcggta
     2581 ataagggatt ttatgttgat gatcgggcac taaggccttc tgaatttgca agattaaatc
     2641 ttcaagagat aaacgaatta tttgataagg ataaataatg cttttaatac tatcgtctgc
     2701 gtatattgat attgatttac agtctgaatt tggtcggttg ccaccgagca tgttaccgct
     2761 aggaaataaa cgattagttc aacatcaaaa aaaacttctt aacacgaatg agttgatgat
     2821 aatcacttta cctaaatcat ataaaatatc agaatgggac aggaagtggt tagataataa
     2881 taatataaaa atagtctttg ttaatgatgg tggggcgctt ggtgaatcgg tattatatgc
     2941 tattgaatat attaaaacat taaacatttc tgaacatctc aggattttgt atggagatac
     3001 tttgattctt tcaaatataa aagatgactc aaatgtaatc gctgtatcta actctgagga
     3061 taattataac tgggctagag tcgaaaatca gaatgcatat ataaaaatat ccaccgaaaa
     3121 tgatgtggac attttaggag gagatatact ttgtggctat ttttcattta gtgatataga
     3181 tcttcttcgg gagtgtttga tttctaataa ttataacttt attgaagcca taaaaagtta
     3241 ccatgcaaaa agttttctat ttgttagaaa aattgatgaa tggttggatt ttggtcatgt
     3301 gaatacttat tacaagtcaa agatgaaata tacaacgcaa agagcattca atgagttata
     3361 tattaactca gattgggtat gcaaatctag tcaggattat gagaagattt tagctgaggc
     3421 gaactggttt gaaaaaatac cactggaatt aaaaaaatat ataccacagt acttaggtaa
     3481 agagtctaaa aataataaga gtgcaagtta taaactagaa tatttgtgtc atactgcact
     3541 aaatgaatta tatgtcttta gtgaattacc gctaactgta tggaaatcaa tattggaaaa
     3601 atgccttgac ttcgttcgag agagtaaaag ttatatacca tctgataaag aacgattctc
     3661 aacaattaat gagttattga ttgacaagac caatgctagg cttgtatctt tctgttcaga
     3721 aaaacaattt tctattaatg ataaatggga ctttaagggg aaaaggatta gtgtctctga
     3781 tatacttgat gtagcggcta aatatatccc taatgataat aatccatctt tgatgcacgg
     3841 agacttatgc tttagtaata tattatttga ttttagagca ggtagaatta aattaattga
     3901 tcctcgagga ttatctgttg atagaaatta tacaatttat ggttcatact attatgattt
     3961 agctaaactt agtcattcaa tattgggaat gtatgattgg atagtggcag gctattgtga
     4021 tgcgaacatc tgtgaacgaa aaatagaatt gagttttgtt aatgataaaa aaatcgaaaa
     4081 tataaaaagt atttttattg acatgattac tgcacaattc gatattactc taaatgaatt
     4141 gtacgcaatg caaatttatc tattcttatc aatgttacca ctccattcag atgatgtgca
     4201 acggcaaaaa gcattgttcg caaatgtctt tagattatat gaacttttac aggagattga
     4261 aaaatgatcg ttataccaat ggctggtatg agttctcgat ttcggaatgc aggctataaa
     4321 aagccgaaat atatgctaaa agctcatggt atcactctgt tctctcattc tgtttctagc
     4381 tttaaaagtt attttaataa tgaggttttt atctttattg taaaagatat tgacggaagt
     4441 gaatttgtta agactgaagt gaaaaaactc ggaattttgc attatcatat tattttgtta
     4501 gagcagacaa ctcgaggtca agctgaatca gtatataatg gattgaaaca actccaagaa
     4561 aaaataatga tcagtccaac cgagtcttta actattttta atattgatac tataagatgt
     4621 aattttatgt atccaaaact tcatgaaaga ggtgatggtt atcttgaggt tttttcagga
     4681 gaaggggata attggtcatt tgtgaaacct gttaataatg agtcaacatt agtaatagaa
     4741 acagctgaaa aaaaaccaat atcaaaatta tgctgtactg ggttgtatta tttctctaga
     4801 ctccagtatt ttttcgaagc ttatgattta tatattttaa cacccaaaga tagttgggat
     4861 aaaggggagc tttatgtagc tccgttatat aatattctga tcgcccaaaa gaaagaaata
     4921 cactaccaca aaataaatgt aagtgatgtg ttttttgctg gtgttcccaa ggaatatgaa
     4981 gatttctgta agatagatta tgaatctttt gttgggtagg ttagatgaat tggaagatta
     5041 agaaaaacgt tgagctgtta attttattct tagtgcttaa ccagttggtt attgatactt
     5101 tcaatggtta ctttattttt agttctcaag ggggggggaa tatatcagtt atttataaaa
     5161 taattatatt ttttctcttt ttgttttatg agttagtgag tagggatagg tttattgttg
     5221 cattttctat cgttacttgg ggagttttct taactttttt tcatttatta agcaacaatt
     5281 atacagaagt tgtaatggac ttgtcagaat atataaagct ggcaacaaca tttattgttt
     5341 ttttaggggt ttctaaattt tcatatataa atccactggc ttttataaag tatttgagtg
     5401 tttattcgtt ttgtataatt ttatttaata ttttattgag tgcatttggt gttggtgaaa
     5461 cttcatatag tgattttggc tataaaggtt ttttctacgc agctaatgct ctttctggtg
     5521 ttttttgcat agttgcttgt tatttaatgt atataacgct gaaaaaaagt ttgacatatt
     5581 atataatatg tgcgggcgtt ttagcgttat gctcgtttgc tataggaacg aagacaggca
     5641 tcgtatttgt ggctatatca ttagtgacta ttcctttact gatggagggt aaaaaagcaa
     5701 aaatacgagt atctttatta tcattagttg gttttttatg tgccttggtt atctatgctg
     5761 ataaaattta tacatctaat ttagttttaa gaattgttca tttctatgaa gtcggtggtt
     5821 ggagtaagat gcttttttcg gatcgggacc tttttcttaa gtataatatt gatcaattct
     5881 taaacagtga tccagtgtca ttacttatag ggataggcta tgctggtatt aatgcattcc
     5941 caaagcctct tacagagatc gatattgctg atataacaat aatttatggg atgttaacta
     6001 cctctgctta catttctttt tatattggca ttttgttcta tagcaatgga tatcttaaaa
     6061 aaaattgccc aagagatata atagcaatat ctcgttatat atgcttggtt ttgatgattg
     6121 tgtcgtccat tgctgggcat attcttttta atggaatggt tactctttat ttaggtattg
     6181 caatggcgtt accttggtgg atggctaact atcgaactcg acatataaaa gggttgaaaa
     6241 taaatgttta agtcggtagg tgttggtttt ttatctagaa ttatatctgt attatctaat
     6301 attataatca ttcctattat attaaagcat ttaacgccag agcaattttc gttatggatg
     6361 ttatttgttt cattttatag tttggttata atatttgatt ttggatttag tgctacaatt
     6421 agtagatatg ttagttatgt tttaagtggt gcgaccttac agcaattaca aaatggttat
     6481 tatgaaaatg tttggctagg gaatgggggc ggtattgatt ataaagccct gaatgaatta
     6541 agtagaataa ataaaataat tttttattat cttgtcttaa ttgcttcagt ttttctactt
     6601 tgtatatatt tatattattg caactttgtc ggaatcaata tttctaagga tgatagaatt
     6661 gcatggggac ttttttctat atcgatattg attcagttgg cgagtattag atataacgga
     6721 ttcttacacg gttcaggtaa tgttgcaaaa atttatagaa atacaatatg ctcgaatttt
     6781 gtatttctgt tgtttttcat tttttttatt tacttgcagt ggtcattagt tggtatttgt
     6841 attgctagac ttctttcatc gttgatggtg tttattttaa atgccatatc ttcatcgaaa
     6901 ctgacttgcg tgtatccgag actaagatgc aatgaagtta agggccatga taataaacgt
     6961 ttgtttaaac ggattcgaga taagtctttt catcttggta taggtggttt gggaaacttt
     7021 atatgtaatc gtatgacaat tatggttatg acggcaacag tcgcaattca aaatattgca
     7081 ggtgtttcct tcatcatcaa tttgagtatt actattcttt caatttcatt gatactgatt
     7141 aataatgcaa tgcctgaact ggttcgtttt cgtgtcgagg gggcgtatga taaactcttt
     7201 aattccttca aacgaatatg tttcataagc attgtttttt ttatatcctc atatgtcgta
     7261 atggttataa gcacaccgta tattattaaa atcacacatt ctaaagtaat tcttccttct
     7321 aactcgattg tactgttgtg tttctgcatt ttttttatag agttgatcca gagtttatcc
     7381 atatcattta tttcgacaag taataacact gattttgcta aataccaaat tataacagga
     7441 ctttcatttt tgttaatatg cttcgttttc agttatttta aatggacttc attagttaat
     7501 attttacttg tacaattaat agttcagtgt atatacaatg gctggaaatg gccatttgtg
     7561 atcttttgtg aatataataa agttagacac cttattagga aaaaaaatga tgttgctgct
     7621 aagtagaaat tcgctgcctg tacttaaaga atatcgagga ctagagatta aatgtctcaa
     7681 gaactatatt gttgatatgg atttttttgc ctataaagat agcatgcata tttacgaaga
     7741 gtcgacagta aatgagtata tctccaataa ggggtgggtc tcaaaaagag ctaaaaatca
     7801 cccagatttg gggttttgtt ataataaggc aagtattgac aaaaatggta gtattttata
     7861 ttcaaaacaa aaatatgtaa caagaaataa tgattgtgat tttttcttat ttgattattc
     7921 gtgggggcat aattaccaac attggttaat atcttcattg gggcgcttgt ttgtttactg
     7981 tgagctgaaa aaatacaacc caaagttgaa gttattaatt ggtgataaaa tgcctaaata
     8041 taagagtgaa gctatcactt tattaggtat tagtgatgat gatttaatat gtcatcggga
     8101 ggttacaaaa tatagaaaaa tatacacgtg taatttcaat agtggctctg ggcttagagt
     8161 cagtcattta tcatactatt actatgaaaa gatggctaat ctaattaatt ttaccgatga
     8221 ttttggacgt aaaatatata tagcgaggga tgactctcgt ggtaaaagac ctttaataaa
     8281 tagaagtgag ttaaatgcat taatgactaa acggggattt aatgttgtct ttttggaaga
     8341 attgagcttt tatgaaaaaa ttgctctttt taaaagtgca gatattatta ttggcgactt
     8401 tagttctggt tgggggcata ttgtattttg taagaaattt acaaagttaa ttcttcttga
     8461 acatgatata tataaatttc aaggttttta taaagaaata gctaactcaa aatgtttaga
     8521 tcttaaggtt gtagaaacaa aaaatatttt tcggctcatg tatttgaagt ttttaaaatt
     8581 aatttggacc ttgttaaagg atgttgacaa gcgtgctaac tctctgtcat ggaaagtaaa
     8641 tattaaagaa ctaatggatt ttctatgatt aagatttata ctattaactt atttactgaa
     8701 aatgctcgca gagagaaaat attgtctttg gcaaaaaaat tggaactacc gataaaaata
     8761 gaaaatgcaa taataggttc gaatctatct aaagaatatt tggataatct taccaatgaa
     8821 tccatagata aaataggtag aaatttaagt ccaggagaag ttggttgcta tttgtcacat
     8881 attaaatgct tgaaaaattt tctatcatca ggagatgagt ttgctataat tttagaagat
     8941 gatgttactt tagattatcg aataaaagat tttatcagta ccatagaatt taaagagaca
     9001 acactttttt ttgatgttat gttgcttggt tatcgtaatg gatatggttc ttattggggg
     9061 aaaaaaaaat ggaattctca taaattactt cgctttcctg attgtggtta tggagctcat
     9121 gcctacttgg ttaccaggaa aggtgcagaa aaaatagtat ataataacgc aattcctatt
     9181 tggccgtatg attatgtcac tggaggtagg gcggataaaa caattcgagt ttatggtgtt
     9241 gagaaaaaaa ttgttgattt agatttttac aatagctctt gttcatcgtt agaggcagag
     9301 agaaattatc ttggtgcata ttcttctgaa tataaagtga aaacaccttt tgttctatat
     9361 gtattaaaaa aattgatcaa aggattaaaa ccaataaggg tatacaaatg aaggttctta
     9421 tagtttctaa tatgtatcca agtattgaaa atccttctct gggtgtcttt gtaaagaata
     9481 ccgaagaaat gttagtcaat gccaatatag acgttgatag agctgtcata gacagaatat
     9541 attcaaattc atttgagaaa gtatttggct attttatttt ttatttaaaa gtcatctata
     9601 aaattttatt ttgtaaatgt gatattgttt atgcacatta tgtatcgcat gtagcaatac
     9661 caattttttt tgttaattta tttaaacaca tagttgtttt ctcgcatgtg catgggggag
     9721 atgtaaaaca gctgaaagga acgtcagctg tattctttaa aataaaacaa gcattatcaa
     9781 aaaagattat ggatatatca aaggtgattt tttccccatc agcttcatac aaaaggcata
     9841 taattgaact ttattcgcaa gacgagagca agattattat ttttccttcc ggagggattg
     9901 atacgacact attttctttt ggttcaggga gaaagaaaaa tatattgggg tatgcaggtc
     9961 gattagagga cagtaagaat gttgatttaa ttataaaatc tcttattgat aataaataca
    10021 atcttgagat tgtaggagat gggaaaaaaa aaggtcaatt acaagaattg gtctctaaat
    10081 ataacttatc tgaaagagtt atatttcata gcagcaaaac tcaaaaagag ttgtcagaat
    10141 ggtataaacg agtgtctatt ttgatttacc cgtcttcaag tgaaagttta ggtttggttc
    10201 ctttagaagc tcttgcatgt ggtacggatg ttcttttatc gccaattgat gcattttttg
    10261 aatttagaga tattgggttg caatttgagt ttttaagtga gttaacccct caagcaatta
    10321 atgtagggat tgaaaaaatc atttccacta gatgttttcg caataatatg agtaataaca
    10381 ttattattaa ctctgtatat gctagaaatg ttgtttgcaa ggaatttatt gatgtattca
    10441 aacaaaaatg ccattgtttt tagttatggt gcaggcgggc actcggcaca agcaaacaga
    10501 ctggctgcgc ttcttatacc taggttagat agtttttata taatatcaat atccgatgat
    10561 tgtattacac ctaagtggtc tcatatacat tttgttaccg gagaggttag aaaaaaaaat
    10621 agttatttcg atactcttac aaatatgggg ccaataaaaa taattcaaac attgttaaaa
    10681 ataaaaaaat ataatgtgag atgtgttatt tcaaatggtc caggtatatc tgtaatcact
    10741 gctttattct ttaaagtatt tggggcgaaa ataattcatg ttgaaacatg gtctcggttc
    10801 gtgtcaaaat ccttaacagg aatggctatg tattatattg ccgacgtgtt ctatgttcaa
    10861 aacaaagaat tatgtaaaat atataaaaat gcaatttatt caggtcgact atgaaaatat
    10921 ttactacagt tggaacaaca agttttgatc ttttaattaa gtcagttgat gaattcgccg
    10981 ctacaaataa agataatgat tttatcttcc agatagcgaa tggacaattt caccctagaa
    11041 atggttgtta ctttcgattt gaaaatgata ttgtgcatta ttatgagtgg gcagatgttg
    11101 tcataactca tgcaggcgca ggcactatat ataaactcct ggagcaaaga aaaaaagtaa
    11161 tcattgttcc aaatcttgtg cgtattgata aacatcaacg cgatattgca caatatatgt
    11221 gtgaccatca ttattccttg gtattgtggg acctatcatc tttatcttcg ataatgaaag
    11281 atattgaaaa attttctcca gcggtatata agaaaactcc tttttttaga agtgatgaga
    11341 tagttaattt tattaacaat ataagataat ttatacaaat tgtatttttc tgacaggagt
    11401 aaacaatgtc aaagcaacag attggcgtag tcggtatggc agtgatgggg cgcaaccttg
    11461 cgctcaacat cgaaagccgt ggttataccg tctctatttt caaccgttcc cgtgaaaaga
    11521 ccgaagaagt gattgccgaa aatccaggca aaaaactggt tccttactat acggtgaaag
    11581 agtttgttga atctctggaa acgcctcgtc gcatcctgtt aatggtgaaa gcaggtgcag
    11641 gcacggatgc tgctattgat tccctcaagc catacctcga taaaggtgac atcatcattg
    11701 atggtggtaa taccttcttc caggacacca ttcgtcgtaa tcgtgagctt tctgcagaag
    11761 gctttaactt cattggtacc ggtgtttccg gcggtgaaga aggcgcgctg aaaggtcctt
    11821 ccattatgcc tggtggccag aaagaagcct atgaactggt tgcaccgatc ctgaccaaaa
    11881 tcgccgcagt ggctgaagac ggtgagccat gcgttaccta tattggtgcc gatggtgcag
    11941 gtcactatgt gaagatggtt cacaacggta ttgaatacgg tgatatgcag ctgattgctg
    12001 aagcctattc tctgctaaaa ggtggcctga acctcaccaa cgaagaactg gcgcagacct
    12061 ttaccgagtg gaataacggt gaactgagca gctatctgat cgacatcacc aaagatatct
    12121 tcaccaaaaa agatgaagac ggtaactacc tggttgatgt gattctggat gaagcggcta
    12181 acaaaggtac cggtaaatgg accagccaga gcgcgctgga tctcggcgaa ccgctgtcgc
    12241 tgattaccga gtctgtgttt gcacgttata tctcttctct gaaagatcag cgcgttgccg
    12301 cttctaaagt tctctctggc ccgcaagcgc agccagcagg cgacaaggct gagttcatcg
    12361 aaaaagttcg tcgtgcgctg tatctgggca aaatcgtttc ttacgctcag ggcttctctc
    12421 agttgcgtgc tgcgtctgaa gaatacaact gggatctgaa ctacggcgaa atcgcgaaga
    12481 ttttccgtgc tggctgcatt atccgtgcgc agttcctgca gaaaatcacc gatgcctatg
    12541 ccgaaaatcc gcagatcgct aacctgctgc tggctccgta cttcaagcaa attgccgatg
    12601 actatcagca ggcgcttcgc gatgtcgttg cttatgcagt acagaacggt atcccggttc
    12661 ctaccttcgc tgctgcggtt gcctattacg acagctaccg cgccgctgtt ctgcctgcga
    12721 acctgatcca ggcacagcgt gactatttcg gtgcgcatac ttataagcgc attgataaag
    12781 aaggtgtgtt ccataccgaa tggctggatt aatctgattt aaatcaatta atcaaagcaa
    12841 ggcccggaga aaccctccgg gcttttttat tatacaaagc ggcaggttat ggcctttttt
    12901 tataatttat ggttaaaaaa gcgatataat acagagccgc acagcaggat cgctgccttg
    12961 acagttcatc tacatcagcg ttaaaaatcc cgcagtagat gaagctgtgg tggtggatta
    13021 atgaccactc taaatgttta accggaagaa gtcagagcta atgaaaataa caatttcagg
    13081 aacaggttat gttggtcttt caaatggtat tctgattgcg caaaaccacg aagtggttgc
    13141 actggatatc gttcaggcca aagtggacat gcttaacaag aagcagtcac cgattgttga
    13201 taaggagatt gaagagtatc tggcgactaa agatctcaat ttccgcgcta cgatagataa
    13261 gtatgacgcg tataaaaatg ccgattacgt tattattgcc acacctaccg attatgatcc
    13321 gaaaacaaat tattttaata cctcaagcgt ggaagcggtc attcgcgatg tgacagaaat
    13381 taatcctaat gctgtcatgg tgattaaatc tacaattccg gtaggtttca ccaaatcaat
    13441 taaagaacgt ctgggtatcg ataaccttat tttctctccg gaatttctcc gtgaaggtaa
    13501 agccctttac gataatcttc atccttcacg tattgtcatt ggtgagcgtt cagaacgcgc
    13561 agaacgtttt gcggcgttat tacaggaagg cgcgattaag caaaatatcc caaccctgtt
    13621 taccgactcc actgaagcag aagcgattaa acttttcgct aatacctatc tggcgatgcg
    13681 cgtagcatac tttaatgaac tggatagcta tgcagaaagt ttagggctga atactcgcca
    13741 gattatcgaa ggcgtttgtc tcgatccgcg tattggcaac cattacaaca acccgtcgtt
    13801 tggctatggt ggttattgtc tgccgaaaga taccaagcag ttactggcca actaccagtc
    13861 tgtgccgaat aacctgattt cggcaattgt cgatgctaac cgcacacgta aagactttat
    13921 tgccgatgcc attttgtcac gcaagccgca agtggtgggt atttatcgtc tgattatgaa
    13981 gagcgggtca gataacttcc gtgcgtcttc cattcagggg attatgaaac gtatcaaggc
    14041 gaaaggcgtt gaagtgatca tctacgaacc ggtgatgaaa gaagattcat tcttcaactc
    14101 tcgcctggaa cgtgatctcg ccaccttcaa acaacaagcc gacgtcatta tttccaaccg
    14161 tatggcagaa gagcttaagg atgtggcaga caaagtctac acccgcgatc tctttggcag
    14221 tgactaacat cctgttatca gggcgatttt cgccctgatt ctcttatgtt ccctttgtaa
    14281 taattcatta tttttatcat ttatcctata gcattcatgg cgattatcgc gaaactatgg
    14341 cgacttaaaa ttatttcgtc cgttagggta atgatgagag tagaaaataa taatgtttct
    14401 gggcaaaacc atgacccgga acagattgat ttgattgatt tactggtgca gttgtggcgc
    14461 ggcaagatga ctatcatcat ttctgtcatt gttgctattg ccctggctat agggtatctg
    14521 gccgttgcca aagaaaagtg gacttccact gctatcgtta ctcaacctga tgtggggcaa
    14581 atcgctggtt ataccaacgc gatgaatgtg atttacggtc cggctgtacc gaaagtctcc
    14641 gacattcagg cttcacttat cggacgttac agcactgcat tctcagcatt agcggaaacg
    14701 ctggataacc aggaagaagc agaaaagctg accattgagc ctaccgttaa aaatcagtca
    14761 ttacctttag cggtgtctta tgttggtgaa acacctgaag gtgctcagaa gcagctggcg
    14821 aagtatatcc agcaagttga cgaccaggta aacgtagagc tggaaaaaga cttgaaagac
    14881 aacatcgcgc tgcgtatgaa aaacttgcag gactctttaa gaactcagga agtagtcgcg
    14941 caagagcaga aagatctgcg tatccgtcag attcaggaag cgttgcagta tgcgaatcag
    15001 gcgcaggtga caaaaccgca aattcaacag actggcgaag atatcacgca agatacgttg
    15061 ttccttttgg ggagcgaagc gctggagtcg atgattaagc acgaggcgac ccgtccgttg
    15121 gtgttctcac caaactacta tcagacacgt caaaacctgc tggatatcga aagcttaaaa
    15181 gttaatgatc ttgatattca tgcttaccgc tatgtaatga aaccgacgtt acctattcgt
    15241 cgcgatagtc cgaaaaaggc aattaccttg attctggcgg tgctgctggg cggcatggtt
    15301 ggcgcgggga ttgtgctggg gcgtaacgct ctgcgtaatt acaacgcgaa gtaatctttt
    15361 cggttttaaa gaaaaagggc agggtggtga caccttgccc gttttttttg ccggatgcga
    15421 caacaatatc gcatccgctt accccgcaac tcactgatgc cgtttacgca ggttctcaat
    15481 taccgtcgtt aaatccagcc cctgatcctg caacagcacc aacaggtgat acatcaaatc
    15541 agatgcctcg ttggtcagct caaagcggtc atgtacagtc gcggccagtg cggtttccac
    15601 gccttcttcg cccactttct gcgcaatgcg tttggtgccg ctggcataca gtttggcagt
    15661 gtaagaggtt tccgggtcgg cagatttgcg ttcggcgagc agttgttcca gttgataaag
    15721 gaacagccac tggtgagcgg tgtcgccgaa gcagctgctg gtgcctttgt ggcaggtcgg
    15781 gccgatggga ttcgccagca acagtaacgt gtcgttgtcg cagtccggcg taatatttac
    15841 tacgttgagg aaattgcccg acgtttcgcc tttggtccac agtcgctgtt tagtgcgcga
    15901 gaagaaggtg actttgccgc tttcgatggt tttatctaag gcttccgggt tcatatagcc
    15961 cagcattaac acttcaccgg ataccgcgtg ttgcacaatc accggcataa gtccgtcggt
    16021 tttttcccag tccagttcgc gacgttgttg ttctgttaac atatcctgat ctccacgccc
    16081 tgtgttgcca ggtacgcttt taattcacca atattgatta tttgtttgtg gaatacggaa
    16141 gccgccagcg cgccgtcaac gtcggcatcg cggaaggctt cgaggaagtg ttccatggtg
    16201 cccgcgccac cggaggcaat cagcggaacg tggcagactt cacgcacttt tttcagttgt
    16261 tcgaggtcgt aaccgttacg cacgccgtcc tgattcatca tgttgaggac gatttctccg
    16321 gcaccgcgtt tttgcacttc ctgtacccag tcgagcgttt cccattgagt gacgcgggtg
    16381 cggctttcat c
//