LOCUS       EU294176               13749 bp    DNA     linear   BCT 26-AUG-2008
DEFINITION  Escherichia coli serogroup O159 O antigen gene cluster, complete
            sequence.
ACCESSION   EU294176
VERSION     EU294176.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 13749)
  AUTHORS   Liu,B., Knirel,Y.A., Feng,L., Perepelov,A.V., Senchenkova,S.N.,
            Wang,Q., Reeves,P.R. and Wang,L.
  TITLE     Structure and genetics of Shigella O antigens
  JOURNAL   FEMS Microbiol. Rev. 32 (4), 627-653 (2008)
   PUBMED   18422615
REFERENCE   2  (bases 1 to 13749)
  AUTHORS   Liu,B., Knirel,Y.A., Feng,L., Perepelov,A.V., Senchenkova,S.N.,
            Wang,Q., Reeves,P.R. and Wang,L.
  TITLE     Direct Submission
  JOURNAL   Submitted (23-NOV-2007) TEDA School of Biological Sciences and
            Biotechnology, Nankai University, 23# HongDa Street, Tianjin
            300457, P. R. China
FEATURES             Location/Qualifiers
     source          1..13749
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:562"
                     /note="serogroup: O159"
     misc_feature    1021..12213
                     /note="O antigen gene cluster"
     gene            1021..2400
                     /gene="wzx"
     CDS             1021..2400
                     /gene="wzx"
                     /note="O antigen flippase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzx"
                     /protein_id="ACA24887.1"
                     /translation="MQCSGSCKARGGSVENIENVCMVIKSSNGFGRIRINILLGFFSK
                     FGSFILSYISLPIALSYLGVNYYGVWIVIFSVVAWIYNFDIGIGLGLKNSLNDALVKK
                     NYKLANELIATAYIFLIAVSILLLLISFLLVFSINLDSIFSMSNIRESEIRTTLLVSV
                     FFTIANFILLLYKQLFFAVNLSGFAAVTTILYQILVIVFLLVAKYFIEPSLLIVAIIY
                     GVSNLFVGVFFTLYFFKRNDVLKFSFSNYKRNHIKSIGGVGIKFFIIQMCMLMIFTCD
                     NIIISKYLGPEYVTSYSLILKTYQAFIMISYIILTPYWTLFAEAYYQKNTEWILKQYK
                     KLYTLFLLMIIAVIAYSLYIQPLLKIWLHTELKFNKYMIYGFCIFVIIRVFIDLHAVF
                     LNGIGKINVQLVLYLFAAIINIPLAIILIKHFNMGSEAVIFSASIAIAPMAIILPLQS
                     LVLFRNIAK"
     gene            2397..3134
                     /gene="wfgP"
     CDS             2397..3134
                     /gene="wfgP"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WfgP"
                     /protein_id="ACA24888.1"
                     /translation="MKLTVITVVYNSIEMFKKTYFCLSQQTCQNFTWIIKDGCSDDGL
                     ELFINEIKGEFKELVYINKTDNGIYNAMNQALDTDQLEEGLVTFLNAGDIYSSNLTLE
                     KVLSLYNKSAGVIAIPVSVAGKEIQQTLITGYIVNNICHQATFYNISCAIVTNTLKFD
                     ERYLLCADFALLIKLSLSTDIHYLTQVPPVIYETSGISSIRIYKRLYEKAVIIYSSDL
                     LLINKLFSLLAILKGGVLHVFNRNSIK"
     gene            3106..3942
                     /gene="wfgQ"
     CDS             3106..3942
                     /gene="wfgQ"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WfgQ"
                     /protein_id="ACA24889.1"
                     /translation="MFLIATLSSKENEIDECKESVVKQTIDKKQIIFEGFDNITAHKK
                     VYSLFNEAEKKYKYLWKGDADMRFCDQDVLRDIAFFFDGHPRVDHIILPVRDHFAGKH
                     ILGAHFFRNGVRWIENNETIFVDPNPALCNKRVILYRWKNRIEHCFNPHDQQSFMFGV
                     HRISKLLAAGEKEDYSQFVSQLYVLNNLKKEYVKKKKRMHLLAMNGVMAVANGSANFY
                     DYSHKIKNNTSIKYDSIDYSLDDYGNYICLQFKKLTPKGKAKYFYRKLILILKAVIYG
                     YS"
     gene            3929..4942
                     /gene="wzy"
     CDS             3929..4942
                     /gene="wzy"
                     /note="O antigen polymerase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzy"
                     /protein_id="ACA24890.1"
                     /translation="MVILKSRLIFLFFFVFLVLMVFYKIEANYFTPDEIFYLFSDSML
                     TDVTVASRYKFVAYIFRFIYEYGEYISLLIVNITIVWFVINKLSKSSNNNDVNYLIYG
                     FLFPSVVFYASLFLRDFYVFILAMLFVYVRRGKHKLFFQWCIILAIGFLKIELAAIFM
                     CAMFISRIKISPFVIVYMFIICVLTWFLALHNQTLMGIYLNTLERFEPTVFSEYNTLF
                     FGLQQMEPTPLNGAINIFFSYINLLSPFLISWPSNTGNIFNVIMTVDSILFLGCIIIG
                     VLGFNTKKYYSDDLYRLSIFVLLLSIIYGYFMVTPMTSLRMHIHFVPLQYYFLWDLGL
                     KYV"
     gene            4935..6080
                     /gene="wfgR"
     CDS             4935..6080
                     /gene="wfgR"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WfgR"
                     /protein_id="ACA24891.1"
                     /translation="MCKKILIIGACPPPYTGQSISLEKLKNTLENDSDFEVRHINLAP
                     KFGHTTGKFNIIRCSQTIYILLSYIWNLLLFKPNTIYMTKGSSKWGFVRDYAFQLLMK
                     MFSSNTKFVVHLKGGNYDSFYESSTELLKKCIVNFLKNCDSIIVLGPSLIKMYDFCPD
                     IKSKIRVVFNALPQDTVNNYVKENTNTVNVVFLSNLIISKGYLDVLQASLEVSKFNIH
                     FHFAGDFMLSPDDEDDKGDLKKGKEEFNNFIINNGLENNITYHGVLVGNKKNDLLKLG
                     DIFILPTYYHVEGQPISIIEAMSFRNAIISTNYRSIPDIVYEGRNAIFVKPKKPEDIV
                     NAITYLYENRNVLIAYQNNSYEYYHKKHIWSKHYSAMKEIFISEKAK"
     gene            6077..7195
                     /gene="gmd"
     CDS             6077..7195
                     /gene="gmd"
                     /note="GDP-mannose-4,6-dehydratase"
                     /codon_start=1
                     /transl_table=11
                     /product="Gmd"
                     /protein_id="ACA24892.1"
                     /translation="MKKAFITGITGQDGSYLAEFLLDKGYEVHGIKRRASSFNTERVD
                     HIYQDRHNQNPNFFLHYGDLTDTSNLVRLIKEIQPDEVYNLGAQSHVAVSFESPEYTA
                     DVDAMGTLRLLEAIRICGLEKKTRFYQASTSELFGLVQEIPQRETTPFYPRSPYAVAK
                     MYAYWITVNYRESYGMYACNGILFNHESPRRGETFVTRKITRAIANISQGIEKCLYLG
                     NMDSPRDWGHAKDYVRMQWMMLQQDHPEDFVIATGKQISVREFVRMSAKEVGLELEFS
                     GQGVDEIATVVNKTSDCAIGVSIGDVIVRVDPRYFRPAEVETRLGDPAKAKKVLGWEP
                     EITVEEMCAEMVASDLAKAKQHALLKSHGYDVAVSLER"
     gene            7199..8164
                     /gene="fcl"
     CDS             7199..8164
                     /gene="fcl"
                     /note="GDP-L-fucose synthetase"
                     /codon_start=1
                     /transl_table=11
                     /product="Fcl"
                     /protein_id="ACA24893.1"
                     /translation="MTKKRIYVAGHRGMVGSAICRQLSLRDDIELVVKTHKELDLTVQ
                     KDVDAFFEQEKIDQVYLAAAKVGGIYANNTFPAEFIYQNLMIESNIIHSAHKAGIQKL
                     LFLGSSCIYPKFAKQPMNESALLTGILEPTNEPYAIAKIAGIKLCESYNRQYGRDYRS
                     IMPTNLYGINDNFHPENSHVIPALMRRFHEAKESGAPEVIVWGTGTPMREFLYVDDMA
                     AASVHVMELDEAIYQQNTQPMLSHINVGTGVDCSIREMAETMASVVGYQGKIVFDVTK
                     PDGTPRKLMDVTRLKNLGWQYRYNLHEGLSLTYKWFIENINSFRG"
     gene            8167..8628
                     /gene="gmm"
     CDS             8167..8628
                     /gene="gmm"
                     /note="GDP-mannose mannosyl hydrolase"
                     /codon_start=1
                     /transl_table=11
                     /product="Gmm"
                     /protein_id="ACA24894.1"
                     /translation="MNKRLERELFKKIVEHTPLISIDLIIRNDKGEALLGQRLNRPAQ
                     NYWFVPGGRIYKDESFEIAFKRITFEEVGVQISLNDALFLGVYEHFYNDNFSEAEFST
                     HYVVHGYEIQLKPQQLHLPTVQHNSYKWFDVVTLLNSTTVHQYTKNYFIPR"
     gene            8634..10037
                     /gene="manC"
     CDS             8634..10037
                     /gene="manC"
                     /note="GDP-mannose pyrophosphorylase"
                     /codon_start=1
                     /transl_table=11
                     /product="ManC"
                     /protein_id="ACA24895.1"
                     /translation="MLLPVVMAGGSGTRLWPLSRTLYPKQFLSLNSRLTMLQETLRRL
                     DKVEHKPALVICNESHRFIVAEQLRKEGLKHSGILLEPVGRNTAPAVALAALQAMVTG
                     DDPILLVLAADHEIQNEDNFIAAVLAAKNFAEQGKLVTFGIVPTSPETGYGYIKSGEY
                     LDGKGYKVAAFVEKPELHVAQRYISDGGYLWNSGMFMFRASVFIDELKKFRPDILASC
                     QSSLSSSTQDLDFIRLDNSSFSCCPEESIDYAVMEKTAEAVVVPLNAQWSDVGSWSAL
                     WEISSKDQSGNAIRGDVLVEDATDSYLYSQHRLIGAVGVKDLVVVETKDAVLVAHKDK
                     VQQVKNIVAQLKKNNRTEYLQHREIFRPWGSHDTIAEGARFQVKHVIVLPGHITAKQI
                     HYHRTEHWIVVSWTAKVHLEDNAYLVSDMNQHIYLLVFHMLLKILSDPLEIVDVRSGV
                     YLEEDDVIRVSSSGVGY"
     gene            10037..10783
                     /gene="wfgS"
     CDS             10037..10783
                     /gene="wfgS"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WfgS"
                     /protein_id="ACA24896.1"
                     /translation="MRISIITATYSSEKTLFDTLLSLEKQTHPDIEYIVVDGASKDNT
                     IKLIKSNSTKVSKIICEPDKGIYDALNKGIQAASGDVIGFLHSDDLLAYDDAIADIAK
                     TFESTGCDAIYGDLEYVAQNDTTKRIRLWKSGSFSRFKMKVGWMPPHPSFYMKRECYS
                     QFGSFSLDYRISADYDSLLRYILKQRISIAYLPKVLVKMRVGGISNRSVSSMVKKSME
                     DIRVMKHNGIIWPIALVYKNISKLPQFIKK"
     gene            10789..12213
                     /gene="manB"
     CDS             10789..12213
                     /gene="manB"
                     /note="phosphomannomutase"
                     /codon_start=1
                     /transl_table=11
                     /product="ManB"
                     /protein_id="ACA24897.1"
                     /translation="MLNVKKIINDSNIAFGTSGARGLVIDFSHDVCAAFTHAFLSVID
                     DKYNFNKVALAIDNRPSSYEIAQACAYAIKQHGFEVEYHGVIPTPALAHYSMQKNIPC
                     IMVTGSHIPFDRNGLKFYRPDGEITKEDELAIINSEYTFSPVGVLPHLETSTQGADYY
                     LERYVSLFNPEILKGKRIGVYEHSSAGRDLYAPLFNQLGAEVISLGRSDEFVPIDTEA
                     VSDEDRILAREWSKKYNLDAIFSTDGDGDRPLVADENGEWLRGDILGLLTAIELNIKA
                     LAIPVSCNTAIEESNKFASIQRTKIGSPYVIAAFADLAKQFDSVAGFEANGGFLLASD
                     LQINGKELKSLPTRDAVLPALMLLIASRNSTISQLINNLPQRFTWSDRVKNFPSDSSQ
                     QIIKNAISSPNNFFNSLGYESLSCSAIDETDGARFTLNNGDIIHLRPSGNAPELRCYA
                     EASDENQAKQYVTNVLGNITSLIS"
ORIGIN      
        1 attgtggctg cagggatcaa agaaatcctc ctggtaactc acgcgtccaa gaacgcggtc
       61 gaaaaccact tcgacacctc atatgaatta gaatctctcc ttgagcagcg cgtgaagcgt
      121 caactgcttg cggaagtgca gtccatctgt ccaccgggcg tgaccattat gaacgtgcgt
      181 cagggcgaac ctttaggttt aggccactcc attttgtgtg cacgacccgc cattggtgac
      241 aacccatttg tcgtggtgct gccagacgtt gtgatcgacg acgccagtgc cgatccgctg
      301 cgttacaacc ttgctgccat gattgcgcgc ttcaacgaaa cgggccgcag ccaggtgctg
      361 gcaaaacgta tgccgggtga cctctctgaa tactccgtca ttcagaccaa agaaccgctg
      421 gatcgcgaag gcaaagtcag ccgcattgtt gaatttatcg aaaaaccgga tcagccgcag
      481 acgctggact cagacatcat ggccgtcggt cgctatgtgc tttctgcaga tatttggccg
      541 gaacttgaac gcactcagcc aggtgcatgg ggacgtattc agctgactga tgccattgcc
      601 aaactggcga aaaaacagtc tgttgatgcc atgctgatga caggtgacag ctatgactgc
      661 ggtaaaaaaa tgggttatat gcaggcattt gtgaagtatg gactacgcaa cctgaaagaa
      721 ggggcgaagt tccgtaaagg gattgagaag ctgttaagcg aataatgaaa atctgaccgg
      781 atgtaacggt tgataaggaa attataacgg cagtgaagat tcgtggcgaa agtaatttgt
      841 tgcgaatatt cctgccgttg ttttatataa acaatcagaa taacaacgag ttagcaatag
      901 gattttagtc aaagttttcc aggattttcc ttgtttccag agcggattgg taagacaatt
      961 agcgtttgaa tttttcgagt taagcgcgag tgggtaacgc tcgtcacatc gtagacatgc
     1021 atgcagtgct ctggtagctg taaagccagg ggcggtagcg tggaaaatat tgagaatgtt
     1081 tgcatggtca ttaaaagcag taatggattt gggcgtatta gaataaatat attactaggt
     1141 tttttttcga agtttggtag ttttatatta agttatatat cattacctat agcactgagc
     1201 tatttgggtg ttaattatta tggtgtatgg atagtaattt tctcagtagt agcatggatt
     1261 tataattttg atattggtat aggtctaggt ttaaaaaata gtttaaatga tgcgctggta
     1321 aaaaaaaatt ataagttagc aaatgaattg attgctactg cgtatatatt tctgatagca
     1381 gtaagtatat tattgctatt gatatcattt ttattggttt tttctattaa cctagattct
     1441 atttttagta tgtctaatat tagagagagt gaaataagaa ctacattact tgttagtgtt
     1501 ttttttacaa ttgctaattt tattttgctt ttatataaac aattgttttt tgccgtaaat
     1561 ttatcggggt tcgctgcggt aaccacaata ttgtatcaaa ttttggtaat cgtttttctt
     1621 ttagttgcaa agtattttat agaaccttca ttgttaatag tggcaattat atatggcgtg
     1681 tcaaatttat ttgtaggagt gttctttaca ttgtatttct ttaagagaaa tgatgtatta
     1741 aagtttagtt tttctaatta caaaaggaat catataaaat ccattggtgg agtaggaatt
     1801 aaatttttta tcattcagat gtgtatgctt atgattttta cgtgtgataa tattatcata
     1861 tcaaaatatc tcggtcctga atatgttaca agctatagtc ttatcttaaa aacgtatcag
     1921 gcttttatta tgataagtta tataattctt actccttatt ggaccttatt tgcggaagct
     1981 tattatcaaa aaaacacgga atggatatta aaacaatata agaaattata tactctgttt
     2041 ttacttatga ttatagcagt cattgcttat tcattatata ttcaaccttt gcttaagata
     2101 tggctccata ctgaattgaa attcaataag tatatgattt atggattttg tatatttgta
     2161 ataattagag ttttcattga tctgcatgct gtttttttga atgggattgg gaaaataaat
     2221 gtccagttag tgttatatct tttcgcggct attataaata tcccgttggc aattatatta
     2281 ataaaacatt tcaacatggg tagtgaggca gtaatatttt ccgcatcaat agcgattgca
     2341 ccgatggcaa taatattgcc acttcaaagt ttagtattat ttaggaatat tgccaagtga
     2401 agctaacagt aattaccgtt gtttataatt ctattgaaat gtttaaaaaa acatattttt
     2461 gcttatctca acaaacctgt cagaatttta catggataat aaaagatggc tgttcagatg
     2521 atggtttaga gttgtttata aatgaaatta aaggtgagtt taaggaactt gtttatatta
     2581 acaaaacaga taatggtatc tataatgcta tgaatcaagc gttggacacg gaccagcttg
     2641 aagaaggatt agttactttt ttaaatgctg gagatattta ctcatctaat ctaaccttag
     2701 agaaggtctt atctctttat aataaatccg ctggggtaat tgcaattcct gtttcagttg
     2761 caggcaaaga aatacaacag acgttaatta caggatatat agttaacaat atttgtcatc
     2821 aagcaacctt ttataatata tcgtgcgcga ttgtaaccaa tacattgaag tttgacgagc
     2881 gatatttatt atgcgcagat ttcgctttgt tgattaaatt atctttatcc accgatatac
     2941 attatttaac acaagtacca cctgtaattt atgaaacgtc aggcatttct tctattagaa
     3001 tatataaaag gttatacgaa aaagcagtaa taatttacag ttcagattta ttattaataa
     3061 ataagctttt ttctttgttg gccattttaa aaggaggtgt attgcatgtt tttaatcgca
     3121 actctatcaa gtaaagaaaa tgaaatagat gaatgtaaag aaagcgttgt taaacaaact
     3181 attgataaga agcaaatcat ttttgagggt tttgataata taaccgctca taagaaagtt
     3241 tattcacttt ttaatgaagc tgaaaaaaaa tataaatact tgtggaaggg ggatgctgat
     3301 atgcgatttt gtgatcagga tgtgctaaga gacattgctt tctttttcga tggtcatcca
     3361 agagttgatc atattatctt acctgttaga gatcactttg cgggtaagca tatattaggt
     3421 gcccattttt ttagaaatgg agtaagatgg attgaaaata atgaaactat atttgtagac
     3481 ccaaatccag ctttatgtaa taaacgcgtt atactttata gatggaaaaa tagaatcgaa
     3541 cattgcttta atcctcatga tcaacaatcc ttcatgtttg gagttcacag aatatcaaaa
     3601 ctcttagctg caggagaaaa ggaagattac agtcaatttg ttagccagtt atacgtatta
     3661 aataatttaa agaaagaata cgtaaaaaaa aaaaagcgaa tgcatttatt agcaatgaat
     3721 ggtgttatgg ctgtagcgaa tggaagtgca aatttttatg attattcaca taaaattaaa
     3781 aataacacaa gtataaaata tgattctatt gattattcac tagatgatta tggtaattat
     3841 atttgcttgc agtttaaaaa actaacgcca aaaggtaagg cgaaatactt ttaccgcaaa
     3901 ctcatattaa tattaaaggc ggtgatatat ggttattctt aaatcaagat taatatttct
     3961 attctttttt gtttttttag tactaatggt tttctataaa atagaggcaa attactttac
     4021 gccagatgag atcttctatt tatttagcga ctcaatgtta acagatgtta cagtagctag
     4081 tcgctataag tttgtagcgt atatatttag atttatttat gaatatggtg aatatatctc
     4141 tctactgatt gtaaatataa caatagtatg gtttgtaata aataaacttt caaagtcatc
     4201 aaataacaat gatgttaatt atttaattta tggttttttg tttccatccg ttgtttttta
     4261 tgcgtctctt ttcctccgtg acttttatgt ttttattttg gcaatgcttt ttgtgtatgt
     4321 taggcggggt aaacataagt tattttttca atggtgtatc attttagcaa tcggatttct
     4381 taaaatagaa ttagcagcaa tatttatgtg tgcaatgttt atatcaagga ttaaaattag
     4441 tccttttgta attgtttaca tgtttatcat atgcgttctc acatggttct tggctttgca
     4501 caaccaaaca ttgatgggaa tatatcttaa tacattagaa cgattcgaac caactgtttt
     4561 ttctgaatac aatactttat tttttggatt gcaacaaatg gaaccgactc cgttgaatgg
     4621 tgcaataaat atttttttta gttatattaa tttgctttct ccttttctaa tatcctggcc
     4681 atcgaataca ggaaatatat ttaatgttat aatgacagta gattcaatcc ttttcttggg
     4741 ttgcattatt attggtgttt tgggatttaa taccaaaaaa tattattcag atgatcttta
     4801 caggttatct atatttgttt tgctactgtc aattatttac ggttatttta tggtaacgcc
     4861 aatgacttca ttgcggatgc atatccattt cgtacctttg caatactatt ttttatggga
     4921 tctaggttta aaatatgtgt aagaagatat taattattgg cgcttgccct ccaccttata
     4981 caggtcaaag tatttcttta gaaaagttga aaaatacttt agagaatgat tctgattttg
     5041 aagtcagaca tatcaacctt gcgccaaaat ttggtcatac gactgggaaa tttaatataa
     5101 tacgctgttc acagaccatt tatatattgc tttcgtatat atggaatctg cttttattta
     5161 aaccaaatac tatatatatg accaaaggaa gttcaaaatg gggatttgta agggattatg
     5221 cattccaact attaatgaaa atgttttctt caaatacgaa atttgttgtt catttaaaag
     5281 gtggaaatta tgattcattt tatgaaagtt caacagaact tttaaaaaaa tgtatagtta
     5341 attttttaaa aaattgcgat agtataatag tattaggtcc ctcattaata aaaatgtatg
     5401 atttctgtcc tgatattaag agcaaaatac gtgttgtatt taatgcattg ccacaagaca
     5461 ctgtaaacaa ttatgttaaa gaaaatacaa atacagttaa tgttgtattt ttatctaatt
     5521 tgataatttc taagggatat ttagatgtat tgcaagcaag tttggaggta agtaagttta
     5581 atatccactt tcatttcgct ggtgatttta tgctaagccc tgatgatgaa gatgataaag
     5641 gggatttaaa aaaaggaaaa gaagaattta ataattttat aattaataat ggactagaaa
     5701 ataatataac atatcatggt gtgttggtag gtaataaaaa aaatgactta cttaaattag
     5761 gtgatatatt tattctacct acttattatc atgtcgaagg acaacctata tccatcattg
     5821 aagcaatgtc atttagaaat gcaataattt caacaaatta cagatctata cctgatatag
     5881 tgtatgaggg gaggaatgca atatttgtta agcccaaaaa accggaagat attgtcaatg
     5941 ctattacgta cttgtatgaa aataggaatg tattgatagc gtatcaaaat aactcttatg
     6001 agtattatca caaaaaacat atatggtcaa agcattatag tgcaatgaaa gaaatcttta
     6061 taagcgagaa agcgaaatga aaaaagcatt tattacaggc attactggtc aggatggctc
     6121 ttacttggct gaattccttc ttgataaagg gtatgaagtg catggcatta aacgtcgagc
     6181 atcttcattt aatacagagc gtgttgatca catttatcaa gatcgccaca atcaaaatcc
     6241 aaatttcttt cttcattacg gtgatttgac agatacttca aacttagttc gcctcattaa
     6301 agaaatccaa ccggacgaag tttataacct tggcgctcaa tctcatgtag cggtttcatt
     6361 cgaatcacct gaatatactg ctgacgttga tgcgatgggg actttacgtc tgttggaagc
     6421 gattcgtatt tgtgggctag agaaaaaaac acgtttttat caggcatcta cttctgaact
     6481 cttcggctta gttcaggaaa tcccacagcg agaaacaaca ccattctacc ctcgttcgcc
     6541 ttatgctgtt gcgaagatgt atgcatactg gattactgta aactatcgtg aatcctatgg
     6601 aatgtacgcc tgtaacggaa ttctcttcaa tcatgaatcc ccgcgtcgtg gtgaaacatt
     6661 cgtaacacgt aaaatcacgc gtgctattgc aaatatttcg cagggaatcg aaaaatgtct
     6721 ctatcttggc aatatggatt caccgcgcga ctgggggcat gcgaaagatt acgtgcgtat
     6781 gcagtggatg atgttgcaac aagatcaccc agaggatttt gtaattgcaa caggcaaaca
     6841 aatttccgta cgtgaatttg ttcgtatgtc agctaaagaa gtcggtctgg agttagaatt
     6901 ctccggacaa ggtgttgatg aaatagcaac tgttgtcaat aaaacatctg actgtgctat
     6961 tggtgttagt attggggatg tgatcgttcg tgttgatcct cgttatttcc gtcctgcaga
     7021 agttgaaact cgtcttggtg acccagcaaa agcgaaaaaa gtattgggtt gggaaccaga
     7081 gattacagtt gaagagatgt gtgccgaaat ggttgccagt gatctggcga aagcaaaaca
     7141 gcatgcacta ctgaaaagcc atggttacga tgttgcagtt tctctggagc ggtaaggtat
     7201 gacaaaaaaa cgtatctacg ttgctggtca ccgaggtatg gttggctctg ctatttgccg
     7261 tcaattatca ctgcgtgatg atatcgaatt agttgtcaaa acacataaag aactcgatct
     7321 aaccgtacag aaggatgttg atgcattttt tgagcaagag aaaattgatc aggtttatct
     7381 tgctgcggct aaagttggtg gcatttatgc caacaataca tttccggcag aattcatcta
     7441 tcagaatctc atgattgaga gtaatattat tcattcagct cacaaggccg gaattcaaaa
     7501 attacttttt ttaggctcaa gctgtattta tcctaaattc gcaaagcagc cgatgaacga
     7561 gtctgcgctt ttaacgggca tacttgagcc aactaatgag ccatacgcaa ttgctaaaat
     7621 tgcgggcata aaattatgtg aatcttataa ccgtcaatat ggccgtgatt atcgcagtat
     7681 aatgcctact aatctttatg gcataaatga taatttccac cctgaaaact ctcatgttat
     7741 tccggcactc atgcgtaggt tccatgaggc aaaagagagt ggcgcaccag aagttattgt
     7801 ctgggggacc ggaacaccga tgcgtgagtt tttatatgtt gatgatatgg ctgccgcatc
     7861 tgttcatgta atggaacttg acgaagcaat ttatcaacaa aatacacagc ctatgttatc
     7921 tcatattaat gttggtacgg gtgtagattg ttccatacgt gaaatggctg aaacaatggc
     7981 ctctgtggtg ggttatcaag gtaaaattgt ttttgatgtt actaaacctg atggcactcc
     8041 gcgtaaactt atggacgtta cccggctcaa aaacttgggc tggcaatatc gctataattt
     8101 acatgaaggc ttatcattaa catataaatg gtttattgag aatattaatt cttttcgggg
     8161 atagttatga ataagagatt ggaacgtgag ctatttaaaa aaatagttga gcatactcct
     8221 ctaatctcga ttgatctcat aattagaaac gataaaggag aggcgctgct ggggcagcgc
     8281 cttaatcgcc cagcacaaaa ttattggttt gtgccaggag ggcgaattta taaggatgag
     8341 tcattcgaga ttgcatttaa gcggataaca tttgaagaag tgggcgttca aattagtctt
     8401 aatgatgcct tatttctagg ggtgtatgaa catttttaca atgataattt ttctgaagca
     8461 gaattttcta cacactatgt agtgcatgga tatgaaatcc aacttaaacc tcagcaactt
     8521 cacctaccaa cggtccagca taattcctac aagtggtttg atgtagtaac gttgcttaat
     8581 agcactacag ttcatcaata taccaaaaat tattttatac caaggtaata gatatgctac
     8641 ttcccgttgt catggccggt ggttctggta ccagattatg gcctctttca cgtacacttt
     8701 atccgaaaca atttctgtct ttgaatagtc gtttaaccat gttgcaagag acattgcggc
     8761 ggcttgacaa ggtcgaacat aaacctgctt tggtcatttg taacgaatca catcgcttta
     8821 tcgttgctga acaattgcgt aaagagggtt taaagcatag cggtattttg cttgagcctg
     8881 ttggtcgtaa tactgcgcct gctgtagcac ttgcagcact tcaggctatg gtaactggag
     8941 atgatcctat tctgttggtt cttgctgctg atcatgaaat ccagaatgag gataatttca
     9001 ttgctgcagt tcttgcagcc aagaattttg cagagcaggg taaacttgtt acgtttggta
     9061 tcgttccaac atccccagag actggctatg gttacattaa gtcaggtgaa tatctggatg
     9121 gaaaaggtta taaagttgcg gcttttgttg aaaaaccaga gcttcacgta gctcagcggt
     9181 atatatcaga tggcggttat ctttggaata gtgggatgtt tatgttcaga gcatctgtat
     9241 ttatcgatga actgaaaaaa ttccgaccag atattttagc cagttgccaa agctccctgt
     9301 cctcttcgac acaagattta gattttatcc gtctggataa ctcttcattt tcttgctgtc
     9361 ctgaagagtc tattgactat gcagttatgg aaaaaacagc cgaagctgtc gttgttccat
     9421 taaatgcgca atggagtgat gttggatcat ggtctgcatt gtgggaaata agttcaaaag
     9481 accaaagcgg caatgccatt cgtggtgatg tattggttga agatgctaca gatagttatc
     9541 tttattcgca gcatagactt attggtgccg tgggcgtaaa ggatttggtt gttgttgaaa
     9601 cgaaagatgc agtattagtt gctcataaag ataaagttca gcaagttaaa aatattgtcg
     9661 ctcaacttaa aaagaataat cgaacagaat atttacagca tcgggaaatt tttcggccct
     9721 ggggcagtca tgacactata gccgaagggg cgcgctttca ggtgaaacat gtgattgtat
     9781 tacctggtca cattactgct aagcagattc attaccatcg tactgaacat tggattgtcg
     9841 tctcatggac agctaaagtt catcttgaag ataacgctta ccttgtttct gatatgaatc
     9901 aacatatata cctgttggtg ttccacatgc tattgaaaat cctgtcagat ccgctcgaaa
     9961 tagttgatgt tagatcagga gtctacctgg aagaggatga tgttataaga gtttcttctt
    10021 ctggagtagg atactaatgc gaatttctat tatcacagct acttatagta gtgaaaaaac
    10081 tctctttgat acattacttt ctctagaaaa gcaaacgcat ccagatattg aatatatagt
    10141 tgtagatgga gcatcaaaag ataatactat taagctgatt aagagtaata gtacaaaagt
    10201 ttcaaaaatc atttgcgaac ccgataaggg catttatgat gctctgaata aaggtattca
    10261 agcagcttcg ggtgatgtta ttggtttttt acattctgat gatttactag cttatgatga
    10321 tgctattgca gatatagcaa aaacatttga aagtacaggg tgtgatgcta tttatggcga
    10381 tttggagtat gttgcccaaa atgatacgac taaacgtatt agattatgga aaagtggttc
    10441 atttagtcgt ttcaagatga aagtgggttg gatgccgcca cacccatcat tttatatgaa
    10501 acgcgaatgt tatagtcagt ttggtagttt ttctttagat tatcgaatat ctgctgatta
    10561 tgattcatta ttacgatata ttttaaagca acgtatttca atagcatatt taccaaaagt
    10621 cttagtgaag atgcgtgttg gtggaattag caatcgttca gtatcttcaa tggtcaagaa
    10681 gtcaatggaa gacattcgtg ttatgaaaca taatggtatt atctggccaa tagctttagt
    10741 gtataaaaat atatccaaac ttcctcaatt tattaaaaag taatcatcat gttaaatgtt
    10801 aaaaaaatca ttaacgatag taatattgcg ttcggtacta gtggtgctcg cggtttagtg
    10861 atcgattttt cccatgatgt ttgtgctgcg ttcactcatg cgtttctttc tgttattgat
    10921 gacaaataca attttaataa agttgcctta gccattgata accgcccaag tagttacgaa
    10981 attgctcagg catgcgcgta tgctataaaa caacatggat tcgaggttga atatcatggt
    11041 gtaattccga ctcctgcatt agctcattat tcgatgcaga aaaacattcc ctgcataatg
    11101 gtcacaggga gtcatatccc ttttgatcgt aatggcttaa aattctacag acctgatggt
    11161 gaaatcacta aagaggatga gctcgcaatt ataaatagtg agtatacatt ttcgcctgta
    11221 ggtgtattac ctcatcttga aacaagcact caaggtgcag actactacct cgagcgttat
    11281 gtttctcttt ttaatcccga gattttaaag gggaaaagaa taggggtata tgaacattct
    11341 agtgcaggac gcgatttata tgctcctctt tttaatcaat tgggtgcaga ggtcatttcc
    11401 ctcggtagaa gtgatgagtt cgttccgatt gatacggaag cagtaagcga tgaagatcgt
    11461 atacttgcaa gagagtggtc taaaaaatat aatcttgatg ctattttctc aacagatggc
    11521 gatggtgatc gtcctttagt tgccgatgaa aatggtgaat ggttaagagg cgatattctg
    11581 ggactactta ctgctattga acttaatatc aaggcgttgg ctattccagt gagttgtaat
    11641 acagcaattg aagagtctaa taaatttgca agtatacaac gaacgaaaat aggttctcct
    11701 tatgtaattg cagcatttgc agatcttgct aagcaatttg attcagtcgc aggttttgaa
    11761 gctaatggtg gttttctcct tgcctccgat ttacaaatta atggcaagga attaaaatcg
    11821 ttgcctacac gagatgctgt gttaccagca ttaatgctct taatagcttc tcgcaatagt
    11881 actatttctc aactgattaa taatcttcct cagcgattca cttggtcaga tagagttaaa
    11941 aacttccctt cagattcaag tcaacaaatt ataaaaaatg ccatatcgtc acccaataat
    12001 ttctttaata gtttaggtta tgaatcatta tcctgttccg ctattgatga aacggatggt
    12061 gcaagattta ctttaaataa tggtgatatt atacatctcc gtccttccgg taatgctcca
    12121 gaactccgtt gttatgctga ggccagtgat gaaaatcaag ctaagcaata tgttacgaat
    12181 gtgctgggaa atattacctc tttgatttct tgatgttata ggtttatcta cgcttatatg
    12241 tgtgcgtagg tttgattaca cgtagatgcc ggtatacaga attgaagaac ggtatttgtt
    12301 gcattaatga aattcagcac tacacacatt cgtgcaactt gagataacat ctcaatcata
    12361 ttcaagtcgc gcatacatcg cggtgaacac cccctgacag gagtaaacaa tgtcaaagca
    12421 acagatcggc gtcgtcggta tggcagtgat ggggcgcaac cttgcgctca acatcgaaag
    12481 ccgtggttat accgtctcta ttttcaaccg ttcccgtgag aagacggaag aagtgattgc
    12541 cgaaaatcca ggcaagaaac tggttcctta ctatacggtg aaagagtttg ttgaatctct
    12601 ggaaacgcct cgtcgcatcc tgttaatggt gaaagcaggt gcaggcacgg atgctgcaat
    12661 tgattccctc aaaccatatc tcgataaagg tgatatcatc attgatggcg gtaacacctt
    12721 cttccaggac accattcgtc gtaaccgtga gctttctgcc gaaggcttta acttcattgg
    12781 taccggtgtc tccggtggtg aagaaggtgc gctgaaaggt ccttccatta tgcctggtgg
    12841 gcagaaagaa gcctatgaac tggttgcacc gatcctgacc aaaatcgccg cagtggctga
    12901 agacggtgag ccatgcgtta cctatattgg tgccgatggt gcaggtcact atgtgaagat
    12961 ggttcacaac ggtattgaat acggcgatat gcagctgatt gctgaagcct attctctgct
    13021 taaaggtggc ttgaaccttt ccaacgaaga actggcgcag acctttaccg agtggaataa
    13081 cggtgaactg agcagctacc tgatcgacat caccaaagat atcttcacca aaaaagatga
    13141 agagggtaac tacctggttg atgtgattct ggatgaagcg gctaacaaag gtaccggtaa
    13201 atggaccagc cagagtgcgc tggatctcgg cgaaccgctg tcgctgatta ccgagtctgt
    13261 gtttgcacga tacatctctt ctctgaaaga tcagcgcgtt gccgcatcta aagttctctc
    13321 tggtccgcaa gctcagtcag caggcgacaa ggctgagttc atcgaaaaag ttcgccgtgc
    13381 actgtatctg ggcaaaatcg tttcttacgc ccagggcttc tctcagctac gcgctgcgtc
    13441 tgaagagtac aactgggatc tgaactacgg tgaaatcgcg aagattttcc gtgctggctg
    13501 catcattcgt gcgcagttcc tgcagaaaat caccgatgct tatgccgaaa atccgcagat
    13561 cgctaacctg ctgctggctc cgtacttcaa gcaaattgcc gatgactacc agcaggcgct
    13621 gcgtgatgtc gtcgcttatg cggtacagaa cggtatcccg gttccgacct tcgccgctgc
    13681 ggttgcctat tatgacagct accgttctgc tgttctgcct gcgaacttaa tccaggcgca
    13741 gcgcgacta
//