LOCUS       AB811620               15423 bp    DNA     linear   BCT 13-MAY-2015
DEFINITION  Escherichia coli DNA, O-antigen biosynthetic locus, strain: H702c.
ACCESSION   AB811620
VERSION     AB811620.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1
  AUTHORS   Iguchi,A., Iyoda,S., Kikuchi,T., Ogura,Y., Katsura,K., Ohnishi,M.,
            Hayashi,T. and Thomson,N.R.
  TITLE     A complete view of the genetic diversity of the Escherichia coli
            O-antigen biosynthesis gene cluster
  JOURNAL   DNA Res. 22 (1), 101-107 (2015)
   PUBMED   25428893
  REMARK    DOI:10.1093/dnares/dsu043
REFERENCE   2  (bases 1 to 15423)
  AUTHORS   Iguchi,A., Iyoda,S. and Ohnishi,M.
  TITLE     Direct Submission
  JOURNAL   Submitted (29-MAR-2013) Contact:Atsushi Iguchi University of
            Miyazaki, Faculty of Agriculture; Gakuen-kibanadai-nishi 1-1,
            Miyazaki, Miyazaki 889-2192, Japan
FEATURES             Location/Qualifiers
     source          1..15423
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /strain="H702c"
                     /db_xref="taxon:562"
                     /note="serogroup:O44"
     gene            <1..906
                     /gene="wcaM"
     CDS             <1..906
                     /gene="wcaM"
                     /codon_start=1
                     /transl_table=11
                     /protein_id="BAQ00939.1"
                     /translation="NYAILRQGFHNQIIGANITNCKFSDLQGDAIEWNVAINDSDILI
                     SDHIIERINCTNGKINWGIGIGLAGSTYDNNYPEDQAVKNFVVANITGSDCRQLIHVE
                     NGKHFVIRNIKARNITPDFSKKAGIDNATVAIYGCDNFVIDNIEMINSAGMLIGYGVI
                     KGKYLSIPQNFRVNNIQLDNTHLAYKLRGIQISAGNAVSFVALTNIEMKRASLELHNK
                     PQHLFIRNIKVMQESSVGPALSMNFDMRKDVRGVFMAKKETLLSLANVHAVNERGQSS
                     VDIDRVNHHIVNVEKINFRLPERRE"
     gene            1069..1974
                     /gene="galF"
     CDS             1069..1974
                     /gene="galF"
                     /note="O044_01"
                     /codon_start=1
                     /transl_table=11
                     /product="UTP-glucose-1-phosphate uridylyltransferase"
                     /protein_id="BAQ00940.1"
                     /translation="MDEIMTNLKAVIPVAGLGMHMLPATKAIPKEMLPIVDKPMIQYI
                     VDEIVAAGIKEILLVTHASKNAVENHFDTSYELESLLEQRVKRQLLAEVQSICPPGVT
                     IMNVRQGEPLGLGHSILCARPAIGDNPFVVVLPDVVIDDASADPLRYNLAAMIARFNE
                     TGRSQVLAKRMPGDLSEYSVIQTKEPLDREGKVSRIVEFIEKPDQPQTLDSDIMAVGR
                     YVLSADIWPELERTQPGAWGRIQLTDAIAELAKKQSVDAMLMTGDSYDCGKKMGYMQA
                     FVKYGLRNLKEGPKFRKSIEKLLGE"
     CDS             2368..3372
                     /note="O044_02"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyltransferase"
                     /protein_id="BAQ00941.1"
                     /translation="MKVIVNNFFDGILKRGIPIYTSELVQKLRDNNVQVIYVACPKAF
                     HKLPSWFLNVLFIIVEQLLIPIMGIFYRTKYNIYPYNSSSIIDLLLGKAIVIIHDFIS
                     LKKNKRNLAAIYVKVCIYFSSFLAKKVIFISQSTQRVSKRISLFKCIESILLPNPFFS
                     FEKIANVTEIKDLGYLLLVSGLGDNKDLGTALDYYFSIPREERIPLKILGCGNGISKV
                     NDLIDGRDTDKEIEIIGFVSLEEVVKLYCNSKIVWAHSLAEGYGRTLAEAKLTCKNVI
                     CTRISAFREQKDSNIFFYTYYSEYYEVYSYLVDNSPSVERKALHEHILFENELRKIYE
                     "
     CDS             3365..4567
                     /note="O044_03"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyltransferase"
                     /protein_id="BAQ00942.1"
                     /translation="MSNIDINKKQILVLTPRFPFPVIGGDRLRIYKICKELSKHYDLT
                     LLSLCDKREELNYEYDREVFSSVHRVYLSKKKSILNVIFSLFSNTPLQIGYYKSKEFE
                     DKLKQLLPEHSATLSHLIRVGDYVKENKDINFLEMTDAISLNYKRVKEKASLLSLKTF
                     VYSFEQKRLERYERTINNKFSLTTLVSQVDSDYLYPDRPNNVLVCGNGVDAVSLPFSE
                     RKIAKDKKITLVFIGNLYSLQNMDGVRWFTKEVLPFLNKHGNFEFKVIGRITDKDKSW
                     LESQPGVVVTGEVDSITYAAADGHIGVCPIRLGAGIQNKVLEYMALGLPCISSTVGFE
                     GLGAEEGKEIYVANTKEEYLRVLNYFITNLDKYTETALVAKKFIGENFSWEAKLSPYI
                     QKIKESVK"
     gene            4569..5984
                     /gene="manC"
     CDS             4569..5984
                     /gene="manC"
                     /note="O044_04"
                     /codon_start=1
                     /transl_table=11
                     /product="mannose-1-phosphate guanylyltransferase"
                     /protein_id="BAQ00943.1"
                     /translation="MIIPIIMAGGSGTRLWPLSRSLYPKQFLSLINENSLLQETLKRL
                     DGLNCLPPVIVSNNEHRFIVAEQLRQFGVDDFQIILEPVGRNTAPAVALAALKSLELH
                     GDHHMLVLAADHAIQDIEAFHAAVLAAEQESVDNKLVTFGIVPTKPETGYGYIKKGEQ
                     VKNSVFKVNSFVEKPDLETAKNYLEQKCYLWNSGMFMFKASVYLDELKKFRPDILAAC
                     KESLSSASTDLDFIRLNSDVFAECPDESIDYAVMEKTQDCVVIPLDADWSDIGSWTSL
                     WEISEKDEHENVSHGDVINYDSRNNYIYSEGSLISTVGVNNLIIVQTKDALLVAQQDN
                     VQDIKKIVEILKKQKRSEHISHREVYRPWGRYDSVERGDRYQVKRITVKPGECLSTQM
                     HHHRAEHWVVVAGTAKVTCGERTFFVTENESTFIPIGTVHTLENPGKIPLEVIEIQSG
                     VYLGDDDIVRLSDKYGRVEDK"
     gene            5989..7410
                     /gene="manB"
     CDS             5989..7410
                     /gene="manB"
                     /note="O044_05"
                     /codon_start=1
                     /transl_table=11
                     /product="phosphomannomutase"
                     /protein_id="BAQ00944.1"
                     /translation="MNITNDVIKNSGIAFGTSGARGLVKDFTPNVCAAFTYAFIDVMM
                     KDFSFKEVALAIDNRPSSYAMAQACAAALLECSIKPIYYGVIPTPALANQAIADGIPA
                     IMVTGSHIPFDRNGLKFYRPDGEISKENENSIIHAEKEYPDVTVLPELQCSKRAADTY
                     IERNTSIFSNIFKGKRIGIYEHSSAGRDLYSEIFSKLGAEVVSIGRSDEFVPIDTEAV
                     SKEDEEKALHWSSEYDLDMIFSTDGDGDRPLVADENGVWLRGDILGLFCSKAMNIEAV
                     AVPVSCNTVIQTCGWFNHVTLTKIGSPYVISAFDSLNNSFDRVAGFEANGGYLLGSDV
                     NYNSGMIKALPTRDAVLPALMVLALAIKNNVTISKLLAELPPRFTYSNRVQNFATSKS
                     KSIIASAQENPQEFIERIGFVDLHVQSVDTIDGLRLTLSDGSIIHLRPSGNAPELRCY
                     AEADNIIKAEKLVLEVLHKVTLL"
     gene            7594..8925
                     /gene="wzy"
     CDS             7594..8925
                     /gene="wzy"
                     /note="O044_06"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen polymerase"
                     /protein_id="BAQ00945.1"
                     /translation="MHKQYYSLLCNKIQFKHLAIYFSVFLSLSSCFLWGGADTFVSQV
                     YIDILATISTALLVVLMFYYYINRVRYLSLTLLFAFVFSLIIGLPSIYLYYFKNANHG
                     FEIICIWGMLINSILYLQTTETVIKEEKRYLTSLFYILFSIVALCQLYKILIYLMFIL
                     NSGEGHLAIYTESEELLSQVPFFIRAISGFAVVMSLSTFYFKTPTYIKVIAFVLLASD
                     LAIGIRNKFFFSVICIFILYMYSNEYRVRNLFKQLSKPIFLIAGFLCFSMVSYFREGY
                     QIDFMIYIGIVLDSLSSTLGGMQNLFDMQSSGWDQLHPAVVFTQVLPLSGLGFLDDQQ
                     IAKDFSIIVLGDVSSGIALSSSGLLESSLLSLNLGVIIYLLYLSGVMLFIKWGLNNQR
                     IIINFVAISMISGFFYAVRGELILPLAFLLKSLPIVLISPLLVKNKIYHGQ"
     gene            8967..10202
                     /gene="wzx"
     CDS             8967..10202
                     /gene="wzx"
                     /note="O044_07"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen flippase"
                     /protein_id="BAQ00946.1"
                     /translation="MIKEIFSDGIFSLFNKICYFGFKTLAIILITRSLGEDVGGEFIF
                     LVGFLEVLRVVTDFGVDLFVIKKYNDSTDKIKLLNVTFAQKILSGVIVLLLFCLYSFV
                     QGYQYNVYIPIVLALPVALFFNFSNSYFQSLNSNKSLTVPIAIASIATCTIFAIQYFL
                     NVKFNAWDYLCVELLFVSLVTLKLFVSVKFRFIRTSAFDVLMSILSLYKYTLSIGLTA
                     VVVIIYSRIDNFYLKTFAPGDLAAYGQIFRMVDPLVMVSSVFSTVAYARFCRINLQEK
                     NAFTKVFQFLLCIVAYGVLSSLVYFFIIKYLGHFVLISNVNNDFLIMMFLIVACVKCI
                     NGGTTAIIQSQGFYKVGLYVSYVCILTSIPTMYFLIMKYGVKGAAMTILLVECISFIL
                     LLCSFFMIKKMRPKKTFEM"
     gene            10355..11761
                     /gene="gnd"
     CDS             10355..11761
                     /gene="gnd"
                     /note="O044_08"
                     /codon_start=1
                     /transl_table=11
                     /product="6-phosphogluconate dehydrogenase"
                     /protein_id="BAQ00947.1"
                     /translation="MSKQQIGVVGMAVMGRNLALNIESRGYTVSVFNRSREKTEEVVA
                     ENPGKKLVPYYTVKEFVESLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGN
                     TFFQDTIRRNRELSAEGFNFIGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIA
                     AVAEDGEPCVTYIGADGAGHYVKMVHNGIEYGDMQLIAEAYSLLKGGLNLTNEELAQT
                     FTEWNNGELSSYLIDITKDIFTKKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEP
                     LSLITESVFARYISSLKDQRVAASKVLSGPQAQPAGDKAEFIEKVRRALYLGKIVSYA
                     QGFSQLRAASEEYNWDLNYGEIAKIFRAGCIIRAQFLQKITDAYAEDPQIANLLLAPY
                     FKQIADDYQQALRDVVAYAVQNGIPVPTFAAAVAYYDSYRAAVLPANLIQAQRDYFGA
                     HTYKRIDKEGVFHTEWLD"
     gene            12011..13177
                     /gene="ugd"
     CDS             12011..13177
                     /gene="ugd"
                     /note="O044_09"
                     /codon_start=1
                     /transl_table=11
                     /product="UDP-glucose 6-dehydrogenase"
                     /protein_id="BAQ00948.1"
                     /translation="MKITISGTGYVGLSNGLLIAQNHEVVALDILPSRVAMLNDRISP
                     IVDKEIQQFLQSDKIHFNATLDKNEAYRDADYVIIATPTDYDPKTNYFNTSSVESVIK
                     DVVEINPYAVMVIKSTVPVGFTAAMHKKYRTENIIFSPEFLREGKALYDNLHPSRIVI
                     GERSERAERFAALLQEGAIKQNIPTLFTDSTEAEAIKLFANTYLAMRVAYFNELDSYA
                     ESLGLNTRQIIEGVCLDPRIGNHYNNPSFGYGGYCLPKDTKQLLANYQSVPNNLISAI
                     VDANRTRKDFIADAILSRKPQVVGVYRLIMKSGSDNFRASSIQGIMKRIKAKGVEVII
                     YEPVMKEDSFFNSRLERDLATFKQQADVIISNRMAEELKDVADKVYTRDLFGSD"
     gene            13287..14300
                     /gene="wzz"
     CDS             13287..14300
                     /gene="wzz"
                     /note="O044_10"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen chain length determinant protein"
                     /protein_id="BAQ00949.1"
                     /translation="MRTWKFPSVRVMMRVENNNVSGQNHDPEQIDLIDLLMQLWRGKM
                     TIIISVIVAIALAIGYLAVAKEKWTSTAIVTQPDVGQIAGYNNAMNVIYGQAAPKVSD
                     LQETLIGRFSSAFSALAETLDNQEEPEKLTIEPSVKNQQLPLTVSYVGQTAEGAQMKL
                     AQYIQQVDDKVNQELEKDLKDNIALGRKNLQDSLRTQEVVAQEQKDLRIRQIQEALQY
                     ANQAQVTKPQVQQTEDVTQDTLFLLGSEALESMIKHEATRPLVFSPNYYQTRQNLLDI
                     ESLKVDDLDIHAYRYVMKPTLPIRRDSPKKAITLILAVLLGGMVGAGIVLGRNALRNY
                     NAK"
     gene            complement(14483..15094)
                     /gene="hisI"
     CDS             complement(14483..15094)
                     /gene="hisI"
                     /codon_start=1
                     /transl_table=11
                     /product="phosphoribosyl-AMP cyclohydrolase"
                     /protein_id="BAQ00950.1"
                     /translation="MLTEQQRHELDWEKTDGLMPVIVQHAVSGEVLMLGYMNPEALDK
                     TIESGKVTFFSRTKQRLWTKGETSGNFLNVVSIASDCDNDTLLVLANPIGPTCHKGTS
                     SCFGNTAHQWLFLYQLEQLLAERKSADPETSYTAKLYASGTKRIAQKVGEEGVETALA
                     ATVHDRFELTNEASDLMYHLLVLLQDQGLDLTTVIENLRKRHQ"
ORIGIN      
        1 aattacgcca tcttacgtca gggatttcat aaccagatta tcggtgccaa catcaccaat
       61 tgtaagttca gcgacttaca gggggacgcc attgaatgga acgtggcgat taacgacagt
      121 gatattttga tctccgacca catcatcgag cgcatcaact gtaccaacgg caaaatcaac
      181 tggggaatcg gcataggcct tgcggggagt acttatgata ataactaccc ggaagaccag
      241 gcagtgaaaa actttgtcgt ggcgaatatc acgggatcgg attgtcgaca actgatccat
      301 gttgaaaatg gtaaacattt tgttattcgt aatatcaaag cccgcaatat cacgccggat
      361 ttcagtaaga aagcaggtat tgataacgcc acggtcgcta tttacggttg tgacaatttc
      421 gtgattgata atattgaaat gattaatagc gccgggatgt taatcggtta tggggtaatt
      481 aaaggcaaat atctctcgat accgcaaaat ttccgagtga ataatattca gctggataac
      541 acccaccttg cttacaaatt gcgcggtatc caaatctctg ccgggaatgc tgtctccttt
      601 gttgcactga ctaacattga gatgaagcgt gcctcgttgg agttacacaa caaaccgcaa
      661 catcttttta tacgaaatat caaagtgatg caggaatcct ctgttggacc cgcattgagc
      721 atgaacttcg acatgcgcaa agacgttcgc ggcgtcttta tggcgaaaaa agaaacactg
      781 ctgtctcttg caaatgttca tgcggtgaat gaaagagggc aaagctccgt cgatatcgac
      841 agggttaatc accatattgt taatgtggaa aagattaact ttagattgcc agaacggaga
      901 gagtagattt gcgaccattc ctggaaaaat ggagccatac ttaggaacaa tgctactgca
      961 atccacaacg aagcggcgta acatcacaag taattcagta atcaattcag ggtaattgat
     1021 gctggcgaaa aaaatcgaac aagctataat tcagcaacca ttttacaggt ggatgaaata
     1081 atgacgaatt taaaagcagt tattcctgta gcgggtcttg ggatgcatat gttgcctgcc
     1141 actaaggcga ttcccaaaga gatgctaccg atcgtcgaca agccaatgat tcagtacatt
     1201 gttgacgaga ttgtggctgc agggatcaaa gaaatcctcc tggtaactca cgcgtccaag
     1261 aacgcggtcg aaaaccactt cgacacctct tatgaattag aatctctcct tgaacagcgc
     1321 gtgaagcgtc aactactggc ggaagtgcag tccatctgtc cgccgggcgt gaccattatg
     1381 aacgtgcgtc agggcgaacc tttaggtttg ggccactcca ttttatgtgc acgacctgcc
     1441 attggtgaca acccatttgt cgtggtactg ccagacgttg ttatcgatga cgccagcgcc
     1501 gatccgctac gctataacct tgctgccatg attgcgcgct tcaacgaaac gggccgcagc
     1561 caggtgctgg caaaacgtat gccgggtgac ctctctgaat actccgtcat tcagaccaaa
     1621 gaaccactgg atcgtgaagg taaagtcagc cgcatcgtcg aatttatcga aaaaccggat
     1681 cagccgcaga cgctggactc agacatcatg gccgttggtc gctatgtgct ttctgccgat
     1741 atttggccgg aacttgaacg cacgcaacct ggtgcatggg ggcgtattca gctgactgat
     1801 gctattgccg aactggcgaa aaaacagtcc gttgatgcca tgctgatgac cggcgacagc
     1861 tacgactgcg gtaaaaaaat gggctatatg caggcgtttg tgaagtatgg actgcgcaac
     1921 ctgaaggaag ggccaaagtt ccgtaagagc attgagaagt tgctcgggga atagatccca
     1981 agccaatgta acaataattt agataaatag cggcagctaa catcccggcg tctatgcttt
     2041 aaacaaagga atgttactgt cgtttttctt tttaaaacaa agaataacaa cgagttaacc
     2101 tactaagttt aatctatttt ttgttggatt tatccttgtt tctgacagca tttggtaaga
     2161 caattggcgt ttgaatttaa gatagctttg cgatagctag cggggcgggg tacatctttg
     2221 gcattttgct agtgcactgg tagctgttaa gccaggggcg gtagcgtggt aagattgtgt
     2281 ttatatgatg cgttctcaaa ataagaaata ataatcctga ctatttttat actattgata
     2341 atatctgaaa taaacttaag agcaaacatg aaagtaattg taaataattt ttttgatggt
     2401 attttgaaaa gaggaatacc gatctatact tctgaacttg tgcaaaagtt aagagacaat
     2461 aatgttcagg ttatttatgt tgcatgtcca aaagcattcc ataagctgcc ttcatggttt
     2521 ctgaatgttc tttttataat agtagagcag cttttaatac caattatggg tatattttat
     2581 agaactaagt ataatatata tccctataat agtagttcca tcattgactt gttattaggt
     2641 aaggcaattg ttataattca tgacttcatt agtcttaaga aaaataaacg aaatcttgct
     2701 gccatttatg tgaaagtctg tatttatttt tcatcttttt tagcaaagaa agtaatattt
     2761 atttctcaaa gcactcagcg agtatctaag agaatatcgc tatttaagtg tatagaatct
     2821 atcctgctcc caaatccatt tttctcattt gagaaaattg ctaatgttac cgaaataaaa
     2881 gatcttggat atttacttct agtttcaggt ttaggggata ataaggatct aggcacagct
     2941 ctggactatt atttttcaat cccaagggaa gaaagaatac cattaaaaat attaggttgt
     3001 gggaatggta ttagcaaggt taacgactta attgatgggc gggatacaga taaagaaatt
     3061 gaaattattg gttttgtttc tttagaggaa gtcgtcaaac tatattgtaa ttctaaaatt
     3121 gtttgggctc attcgcttgc cgaggggtat ggaaggactt tagctgaagc aaaactcaca
     3181 tgcaaaaatg ttatatgcac acggatctct gctttccgcg aacaaaagga ttcgaatatt
     3241 ttcttttata cttactattc tgagtattat gaagtctatt catacttggt agataattca
     3301 cccagtgtcg aaaggaaagc tctgcatgaa catattttat ttgaaaatga attgagaaag
     3361 atttatgagt aatattgata taaataagaa acagatatta gttttgactc cacggttccc
     3421 gtttcctgtc attggtgggg atcgattacg tatctataag atctgtaaag aactgtctaa
     3481 gcattatgat cttacgttgc tgagtctgtg tgataaacgc gaagagctca actatgaata
     3541 tgatcgtgaa gtttttagta gtgttcacag agtatatctt tcaaagaaaa aatctatttt
     3601 aaatgtcata ttctctttgt tttcaaatac tcccctacag attgggtatt ataaatctaa
     3661 agaatttgaa gataaactta agcagttatt acctgaacat tctgcaactc tttcacattt
     3721 gataagggtt ggtgattatg tgaaagagaa taaagatata aattttttag agatgaccga
     3781 tgccatttca cttaattata aacgagtaaa ggaaaaagca tctttattga gtttaaaaac
     3841 atttgtatat tcttttgaac aaaaaagact cgaacgatat gagcgaacta taaataacaa
     3901 gttcagcttg actactttgg tatcacaggt tgactccgat tatttatatc cagaccgtcc
     3961 gaataatgta ttagtctgtg gaaatggtgt tgatgccgtt agcttacctt tttcagaacg
     4021 aaaaatagct aaagataaaa agataaccct tgtatttata ggtaatttat attctttgca
     4081 aaatatggat ggtgtgagat ggttcaccaa ggaagtttta ccatttctta acaagcatgg
     4141 taattttgaa tttaaggtca tcggacgtat tacagataaa gataagagtt ggttagaaag
     4201 ccagcctggc gttgttgtca caggtgaagt tgatagcata acttatgcag cagctgatgg
     4261 gcatattggt gtatgtccta ttagattagg ggcaggtatc caaaataagg tacttgaata
     4321 tatggcgttg ggattacctt gtatctcttc tactgtaggc tttgaaggct tgggagcaga
     4381 ggagggtaag gagatttatg ttgccaatac aaaagaagaa tatttacgtg tattaaatta
     4441 ttttataaca aatctggata aatataccga aacagcatta gttgcgaaaa agtttatcgg
     4501 tgagaatttt tcatgggaag ctaaattgag cccatatatc cagaaaatta aggagtctgt
     4561 taaataaaat gattatccca attattatgg ccggtggttc tggtactcgc ttatggcctc
     4621 tttcgcgttc gttatacccg aaacaatttt tatcattgat taatgaaaat agtttgctcc
     4681 aggaaacgtt gaagagactt gatggattaa attgtttgcc tcctgtcatt gttagcaata
     4741 atgagcatag atttattgtt gctgaacaat tgcgacagtt cggtgtggat gacttccaga
     4801 ttattctaga acctgtaggt agaaatactg cgcccgccgt tgcgctggct gctctaaagt
     4861 ctctagaact ccatggcgat catcatatgc tggttcttgc tgctgaccat gctattcagg
     4921 atattgaagc cttccatgca gctgttttag ctgcagaaca agagtccgtt gacaataagt
     4981 tagtgacttt tggcatcgtc ccgaccaaac ctgaaactgg gtatggctat attaaaaagg
     5041 gcgaacaagt taaaaactct gtatttaaag taaattcttt cgtcgaaaaa cctgatttag
     5101 aaacggctaa aaattatctc gaacaaaaat gctatttgtg gaatagtggt atgttcatgt
     5161 tcaaggcgag cgtatattta gatgaattga aaaaatttcg ccctgatatt ttagcagcgt
     5221 gtaaagagtc gctttccagt gctagtactg atctagattt tatcagatta aattctgatg
     5281 tctttgcaga atgtcccgat gagtcaattg attatgcggt aatggaaaaa actcaggatt
     5341 gtgtagttat tccacttgat gctgactgga gtgacatcgg ttcatggaca tcactttggg
     5401 aaatatcaga gaaagatgaa catgaaaacg tatcgcatgg cgatgtaatt aactatgaca
     5461 gcaggaacaa ctacatttac tctgaaggtt cactgatcag cactgtagga gttaataacc
     5521 ttattatagt tcaaactaaa gatgcgctcc tggtagcaca gcaagacaac gtacaagaca
     5581 taaagaagat tgtcgaaatt cttaaaaagc aaaaacgtag cgaacatata tcccatcgcg
     5641 aagtctatcg tccttgggga cgttatgatt ctgtagaacg tggcgaccgt tatcaggtaa
     5701 agcgtattac cgttaagcct ggtgaatgtc tctcaacaca aatgcatcat catcgagctg
     5761 agcattgggt ggttgtcgct ggtactgcaa aggtgacttg cggcgaacgc acttttttcg
     5821 tcactgaaaa tgagtcaact ttcataccaa ttggcacagt tcataccttg gaaaatccag
     5881 gaaagatacc attagaagta attgagattc agtcgggtgt atatctaggt gatgatgata
     5941 ttgtgcgcct aagtgataaa tatggtcgtg ttgaggataa ataattatat gaatattacc
     6001 aatgatgtaa ttaaaaatag cggaattgca tttggtacaa gtggtgctcg tggattagtg
     6061 aaagatttta cacccaacgt gtgtgctgca ttcacttatg cttttatcga tgtaatgatg
     6121 aaggattttt cttttaaaga ggttgcgctc gcaatagata atcgcccaag cagctatgct
     6181 atggcacaag cttgcgcagc agcattgttg gaatgtagta ttaaacctat ttactacggt
     6241 gtaattccaa ctccagcttt ggcaaatcaa gcgattgccg atgggattcc tgcaataatg
     6301 gttactggaa gtcatattcc atttgataga aatggtttga aattctatcg tccagacggg
     6361 gaaatttcaa aagaaaatga gaacagcatt atacatgctg aaaaagagta tcctgatgta
     6421 actgtattgc cagaattaca atgttcaaag cgtgccgctg atacttatat cgagagaaac
     6481 acttcaattt tttcaaatat atttaaaggt aaacgtatcg ggatttatga acattcaagt
     6541 gcgggacggg atctttattc agaaatattc agtaagcttg gtgctgaagt tgtaagtatt
     6601 ggtagaagtg atgagtttgt gcctattgat actgaagcag tatcaaaaga agatgaagaa
     6661 aaagctttac actggtcatc tgagtatgac ctcgatatga ttttttctac cgatggtgat
     6721 ggcgatcgtc ctttggttgc tgacgaaaat ggcgtttggt tacggggtga tatattagga
     6781 ctattttgct caaaggcaat gaatattgaa gcggtagctg tacctgtaag ttgtaatacg
     6841 gttattcaga cttgcgggtg gtttaatcat gtaacgctga ctaaaattgg ttcaccatac
     6901 gtcatttcag cgtttgattc tctgaataat agttttgata gggttgcagg gtttgaggct
     6961 aacggtgggt atcttttagg tagcgatgta aattataaca gcggtatgat taaagcgctt
     7021 ccaacaagag atgctgtttt gcctgcttta atggtactgg cactggctat aaaaaataat
     7081 gtgactattt caaaactctt ggcggagttg ccaccacgat ttacctactc aaatagagtt
     7141 caaaattttg caacaagcaa aagcaaaagc attatcgcgt cagctcaaga aaatcctcaa
     7201 gaatttatcg aaagaatagg ctttgtcgat cttcatgtac aatcggtgga tacaattgac
     7261 gggttaagat tgacactaag tgatggttca ataatccatt tgcgaccgtc aggcaacgca
     7321 cctgaattgc gatgctatgc agaagcagat aacataataa aagctgaaaa attagtgtta
     7381 gaagttttgc ataaagttac tcttttgtaa aaaaatataa acttttttct actcttgagc
     7441 ggtttgtcat ttaaccgctc agtaatagat tgtttataaa ttgtttatat ttagcattgg
     7501 tgtttttatt tgcgttcatc ccgaataaga gattgtaaaa ttaactgttt cttatttttc
     7561 aaatgagtta cttcactagt aaagctaatt actatgcata agcaatatta ttcattattg
     7621 tgcaataaaa tacagtttaa acatctggct atatattttt ctgtatttct ttcactatcc
     7681 tcatgtttct tgtggggagg ggcggataca tttgtatcgc aagtgtatat tgatatttta
     7741 gccactatat ctacagcgct attagttgtt ttgatgttct attattatat taatagagtt
     7801 cgctatttat cactaacctt actttttgca ttcgtttttt ctttgattat tggtttgcca
     7861 tcgatttatc tttactattt taaaaacgca aatcatgggt ttgaaataat ttgtatctgg
     7921 gggatgttga tcaattccat cctttacttg caaacaacag agactgtcat aaaagaagaa
     7981 aaaagatatt taactagttt attttatatt ttgttttcta ttgttgcact gtgtcaatta
     8041 tacaaaatat taatttatct tatgtttata ttgaattcag gagaagggca tttagcaatt
     8101 tatactgaaa gcgaagaatt gctatcccaa gttccatttt ttattcgtgc tattagtggt
     8161 tttgcagttg taatgtcatt gtccactttt tattttaaaa caccgaccta cattaaagtt
     8221 attgcatttg ttttacttgc atctgattta gctattggaa tacgtaataa gtttttcttt
     8281 tcagtgattt gtatttttat actatatatg tactctaatg agtatagagt aagaaattta
     8341 tttaagcaac tctcaaaacc aatatttctc atcgccggtt ttttatgctt ctcgatggta
     8401 tcgtatttcc gtgaagggta ccaaatcgat tttatgattt atattggcat tgttttagat
     8461 tcgctatcct ctactcttgg ggggatgcag aatttgtttg atatgcaatc atcaggatgg
     8521 gatcaacttc atcccgctgt ggtattcaca caagtattac cgctaagcgg tcttggtttt
     8581 cttgatgatc aacaaatcgc aaaagatttt tcaataattg ttttaggtga tgtatcctct
     8641 ggtattgcgt tgtcatcttc aggattgtta gagtcatcgt tgctgagtct aaacttggga
     8701 gtgattattt atttactgta tttatcaggg gtgatgcttt ttattaaatg gggactaaat
     8761 aatcaacgga taataataaa ctttgttgcc atctccatga tatctggatt tttttatgct
     8821 gttcgtggtg aactgatttt gccattggct tttcttctaa aatcattgcc gattgttctt
     8881 atatctccat tacttgttaa aaataaaatt tatcatggtc agtaagtggt ttatttttcg
     8941 accaggatct caccagtagg catgacatga tcaaagaaat tttctccgat ggcatttttt
     9001 cgctatttaa taaaatatgt tacttcggtt ttaaaacact tgcaataatt ctgattactc
     9061 gttccttagg agaagatgta ggcggagagt tcattttttt agttggtttt ctcgaagtcc
     9121 ttcgggtggt tactgatttt ggtgtggatc tgtttgttat aaaaaaatat aatgattcta
     9181 cagataaaat aaaactatta aatgtaacgt ttgcacaaaa aattctttct ggagtaattg
     9241 ttttactact gttttgtttg tattcttttg ttcagggtta tcaatataat gtctatattc
     9301 ctattgtgtt agccttacct gttgctttat tttttaattt ctcaaatagc tattttcaat
     9361 ctctcaattc caataaatct ctcacggttc cgatcgcaat tgcatctatt gcaacgtgta
     9421 cgatcttcgc tattcagtat tttttaaacg ttaaatttaa cgcatgggat tacctgtgtg
     9481 ttgaactatt attcgtatcg ctggttacac taaaactatt cgttagtgtc aagtttaggt
     9541 ttattagaac gtcagctttt gatgtgctaa tgtcaattct ttctttatat aaatatacat
     9601 taagtatagg tcttacagct gttgttgtaa ttatttatag ccgtatagat aatttttatc
     9661 tcaagacatt tgccccaggg gatcttgcag catatggcca gatatttagg atggttgatc
     9721 cactggttat ggtttcttct gtattttcta cagttgccta tgcaagattt tgccgaatta
     9781 acttacaaga aaaaaatgct tttactaagg tgtttcagtt cctgttatgt attgtggcat
     9841 atggcgtgct gagttcatta gtttatttct ttataataaa atacctgggt cattttgtat
     9901 tgatttctaa tgttaataat gatttcttga taatgatgtt cttgattgtt gcatgtgtga
     9961 aatgtatcaa tggtggtaca actgcaataa ttcagtcaca ggggttttat aaagtgggtt
    10021 tgtatgtttc gtatgtttgc attttgacat cgataccaac tatgtatttc ttaataatga
    10081 agtacggtgt taaaggtgct gctatgacga ttctgcttgt agagtgtatt agtttcatat
    10141 tacttctctg cagctttttt atgataaaaa agatgcgtcc taaaaaaaca ttcgaaatgt
    10201 aatcaatgag tcctctttga atagaattag tttgttctat ttatgaacac ttagcttgag
    10261 taagttctaa catagattac taattgtttg atactatctg ctttacaagc ataaccgcgt
    10321 atgtcgcggt gaccacacct gacaggagta tgtaatgtcc aagcaacaga tcggcgtcgt
    10381 cggtatggca gtgatggggc gcaacctggc gctcaacatc gaaagccgtg gttataccgt
    10441 ctccgtcttc aaccgctccc gcgaaaaaac tgaagaagtt gttgccgaga acccgggtaa
    10501 gaaactggtt ccttattaca cggtgaaaga gtttgtcgag tctcttgaaa cccctcgtcg
    10561 catcctgtta atggtgaaag caggtgcagg cacggatgct gctattgatt ccctcaaacc
    10621 atatctcgat aaaggtgaca tcatcattga tggtggtaac accttcttcc aggacactat
    10681 tcgtcgtaat cgtgagcttt cagcagaggg ctttaacttc atcggtaccg gtgtttccgg
    10741 cggtgaagag ggggcgttga aaggaccttc catcatgcct ggtgggcaga aagaagccta
    10801 tgaactggtt gcaccgatcc tgaccaaaat cgccgcagta gctgaagacg gtgagccatg
    10861 cgttacctat attggtgccg atggcgcagg tcactatgtg aagatggttc acaacggtat
    10921 tgaatacggc gatatgcagc tgattgctga agcctattct ctgctaaaag gtggcctgaa
    10981 cctcaccaac gaagaactgg cgcagacttt taccgagtgg aataacggtg aactgagcag
    11041 ctacctgatc gacatcacca aagatatctt caccaaaaaa gatgaagacg gtaactacct
    11101 ggttgatgtg attctggatg aagcagcaaa caaaggtacg ggcaaatgga ccagccagag
    11161 tgcgctggat ctcggcgaac cgctgtcgct gataaccgag tctgtgtttg cacgttatat
    11221 ctcttctctg aaagatcagc gcgttgccgc gtctaaagtt ctctctggcc cgcaagcgca
    11281 gccagcaggc gacaaggctg agttcatcga aaaagttcgc cgtgcgctgt atctgggcaa
    11341 aatcgtttct tacgctcagg gcttctctca gctacgcgcc gcgtctgaag agtacaactg
    11401 ggatctgaac tacggcgaaa tcgcgaagat tttccgtgct ggctgcatca tccgtgcgca
    11461 gttcctgcag aaaatcaccg atgcttatgc cgaagatccg cagatcgcta acctgctgct
    11521 ggctccgtac ttcaagcaaa ttgctgatga ctaccagcag gcgctgcgtg atgtcgttgc
    11581 ttatgcagta caaaacggta tcccggttcc gaccttcgcc gctgcggttg cctattacga
    11641 tagctaccgt gccgctgttc tgcctgcgaa cctgatccag gcacagcgtg actatttcgg
    11701 tgcacatact tataagcgca ttgataaaga aggtgtgttc catactgaat ggctggatta
    11761 atctgattta accaacaata aaattgaggc ccggcgtata ttgcaccggg cttttttttt
    11821 gccaattatc ttatagacta aatttcactg cttaatatta acttaataaa tatcagctat
    11881 tcttataaag aaattctgaa ttgtttttcg ttgcgttgac catcttacaa cgtagcgtta
    11941 aaacttttaa ctcttatcag gatgctaaaa acatcatgat tcacagttaa gttaattctg
    12001 agagcatgaa atgaaaatta ccatttccgg tactggctat gtaggcttgt caaacgggct
    12061 tctaatcgca caaaatcatg aggttgtggc attagatatt ttaccgtcac gcgttgctat
    12121 gctgaatgat cggatatctc ctattgttga taaggaaatt cagcagtttt tgcaatcaga
    12181 taaaatacac tttaatgcca cattagataa aaatgaagcc taccgggatg ctgattatgt
    12241 catcatcgcc actccaaccg actatgatcc taaaactaat tatttcaata catccagtgt
    12301 agaatcagta attaaagacg tagttgagat aaatccttat gcggttatgg tcatcaaatc
    12361 aacggttccc gttggtttta ccgcagcgat gcataagaaa tatcgtactg aaaatattat
    12421 tttctctccg gaatttctcc gtgaaggtaa agccctttac gataatctcc atccttcacg
    12481 tattgtcata ggtgagcgtt cagaacgcgc tgaacgtttt gctgcgttgt tacaggaagg
    12541 ggcgattaag caaaatatcc cgaccctgtt taccgactcc actgaagcag aagcgataaa
    12601 acttttcgct aatacctatc tggcgatgcg cgtagcgtac tttaatgaac tggatagcta
    12661 tgcagaaagt ttaggtctga atactcgcca gattatcgaa ggcgtttgtc tcgatccgcg
    12721 tattggcaac cattacaaca atccgtcgtt tggttatggt ggttattgtt tgccgaaaga
    12781 taccaaacag ttactggcga attatcagtc tgtgccgaat aacctgattt cggcaattgt
    12841 cgatgctaac cgcacgcgta aagattttat tgccgatgcc attttgtcac gcaagccgca
    12901 agtggtgggt gtttatcgtc tgattatgaa gagcggttca gacaacttcc gcgcgtcttc
    12961 cattcagggg attatgaaac gtatcaaggc gaaaggcgtt gaagtcatca tttacgaacc
    13021 ggtgatgaaa gaagactcat tcttcaactc tcgcctggaa cgagatctcg ccactttcaa
    13081 acaacaagct gacgtcatta tctccaatcg tatggcagaa gagcttaagg atgtggcaga
    13141 taaggtatac acccgcgatc tctttggcag cgactaacat cttgttatca gggctattta
    13201 cgccctgatt gtcttttgtt acttcctcaa taattcatta tttttatcac ttatcctata
    13261 gcattcacga ggattatcgc taaactatgc ggacttggaa atttccgtca gttagggtaa
    13321 tgatgagagt agaaaataat aatgtttctg ggcaaaacca tgacccggaa cagattgatt
    13381 tgattgattt actaatgcag ttgtggcgtg gcaagatgac aatcatcatc tctgtcattg
    13441 ttgctattgc cctggctata gggtatctgg ccgttgccaa agaaaagtgg acttccacag
    13501 ctatcgttac tcaacctgat gtggggcaaa tcgctggcta taacaatgcc atgaatgtta
    13561 tctatggtca ggctgcaccg aaagtgtcag atttgcagga gacgttgatt ggtcgcttca
    13621 gttctgcctt ctctgcatta gcagaaacgc tggataatca ggaagaacca gaaaaactta
    13681 ccatcgaacc ttctgttaag aaccagcaat taccattgac tgtttcttat gttgggcaaa
    13741 ctgcagaggg cgcacaaatg aagttggccc aatacattca gcaagttgac gataaagtga
    13801 atcaagagct agaaaaggat ctcaaagaca acattgctct gggacggaaa aacttgcagg
    13861 actctttaag aacgcaggaa gtggtcgcgc aggagcagaa agatctgcgt atccgtcaga
    13921 ttcaggaagc attgcagtat gcgaatcagg cgcaggtgac aaaaccacag gttcagcaga
    13981 ctgaagatgt gacgcaagat acgttgttcc ttcttgggag cgaagcactg gagtcgatga
    14041 ttaagcatga ggcgacccgt ccgttggtgt tctcaccaaa ctactatcag actcgtcaaa
    14101 acctgctgga tatcgaaagc ttaaaggttg atgatcttga tattcatgct taccgttatg
    14161 tgatgaaacc gacgttacct attcgtcgcg atagcccgaa aaaggcaatt accttgattc
    14221 tggcagtgct actgggtggc atggttggcg cggggattgt gctggggcgt aacgctctac
    14281 gcaattacaa cgcgaaataa tctttgcagt tttaaagaaa atgggcaggg tggtgacacc
    14341 ttgcccgttt tttttgccgg atgcgatgct ggcgcatctt atccagccaa aatgtgcaga
    14401 gcgaatagta ggcccgataa gcttgcgcat cgggcaatgg ctacggatgc gactacaaca
    14461 tcgcatccgg tcagtccgca actcactgat gccgtttgcg caggttctca atcaccgtcg
    14521 ttaaatccag cccctgatcc tgcaacagca ccagcaggtg atacatcaag tcagatgcct
    14581 cgttggtcag ctcaaagcgg tcatgtaccg ttgctgccag cgcagtttcc accccttctt
    14641 cgcccacttt ctgcgcgatg cgtttggtgc cgctggcata cagtttggct gtgtaagagg
    14701 tttccgggtc ggcagattta cgttcggcga gcagttgttc cagttgatac aggaacagcc
    14761 actggtgagc ggtgttgccg aagcaactgc tggtgccttt gtggcaggtc gggccgatgg
    14821 gattcgccag cactaataaa gtgtcgttgt cgcagtccga cgcaatactc actacgttga
    14881 ggaaattacc cgacgtttcg cctttggtcc acagtcgctg tttagtgcgc gagaagaagg
    14941 taactttgcc actttcgatg gttttgtcca gagcttccgg gttcatatag cccagcatta
    15001 acacttcgcc agataccgcg tgttgtacaa tcaccggcat cagtccgtcg gttttttccc
    15061 agtccagttc gtgacgttgt tgttctgtta acatatcctg atctccacgc cctgtgatgc
    15121 caggtacgct tttaattcac taatattgat tatttgtttg tggaatacag aagctgccag
    15181 cgcgccgtca acgtcggcat cgcggaaggc ttcgaggaag tgttccatgg tgcccgcgcc
    15241 accggaggca atcagcggga cgtggcaaac ttcacgcact tttttcagtt gatcgaggtc
    15301 gtaaccgttt cgtacgccgt cctgattcat catgttgagg acgatttctc cggctccacg
    15361 tttttgcact tcctctaccc agtcgagtgt ttcccactga gtgacgcggg tgcggctttc
    15421 atc
//