LOCUS       EU294173               14249 bp    DNA     linear   BCT 26-AUG-2008
DEFINITION  Escherichia coli serogroup O29 O antigen gene cluster, complete
            sequence.
ACCESSION   EU294173
VERSION     EU294173.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 14249)
  AUTHORS   Liu,B., Knirel,Y.A., Feng,L., Perepelov,A.V., Senchenkova,S.N.,
            Wang,Q., Reeves,P.R. and Wang,L.
  TITLE     Structure and genetics of Shigella O antigens
  JOURNAL   FEMS Microbiol. Rev. 32 (4), 627-653 (2008)
   PUBMED   18422615
REFERENCE   2  (bases 1 to 14249)
  AUTHORS   Liu,B., Knirel,Y.A., Feng,L., Perepelov,A.V., Senchenkova,S.N.,
            Wang,Q., Reeves,P.R. and Wang,L.
  TITLE     Direct Submission
  JOURNAL   Submitted (23-NOV-2007) TEDA School of Biological Sciences and
            Biotechnology, Nankai University, 23# HongDa Street, Tianjin
            300457, P. R. China
FEATURES             Location/Qualifiers
     source          1..14249
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:562"
                     /note="serogroup: O29"
     misc_feature    1086..13333
                     /note="O antigen gene cluster"
     gene            1086..1481
                     /gene="wffW"
     CDS             1086..1481
                     /gene="wffW"
                     /note="glycerol-3-phosphate cytidyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WffW"
                     /protein_id="ACA24847.1"
                     /translation="MKRIITFGTFDVFHVGHVNILERTASLGDYLIVGVSSDKLNFNK
                     KGRYPIYNQEDRCRIINSLRVVNDVFIEESLEQKKEYIIQYEADILVMGDDWAGRFDW
                     VNDICDVIYLPRTPSVSTTEIIEVVKTLR"
     gene            1478..2638
                     /gene="wffX"
     CDS             1478..2638
                     /gene="wffX"
                     /note="glycerophosphotransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WffX"
                     /protein_id="ACA24848.1"
                     /translation="MTNFKKIARKIISKSISLLNYFIPKKKNRIFFKSKPDYSGNCKA
                     LSDYIIEKKLPYHIVWSVKKEINQKGITVVRAGSLKEFFYYFTSKYVITTHNEMIGPI
                     ATNQKYISLWHGMPFKKICYLGENDHQGMIDYSAIRIATSEVMRSIISASFREKANNV
                     YITGQPRNDFLFKPISLTDIGIKSIKNKKIVMFAPTFRMNNEDIRYSDGAEIIDNNFL
                     RVNDFCMEEIDYYLEQSNLHLILKLHPYEEEYFRGIATLSSNITIISSDELTQKNIDL
                     NQLLSLVDILITDYSSIYLDYLILNKPLIFLVPDVDAYSSARGGFTLEPFDFWTPGDK
                     VSCQRSLLNSINKIITGNDEYAEKRNQINLIINKYSDANNSQRVIELMKSLS"
     gene            2635..3735
                     /gene="wffY"
     CDS             2635..3735
                     /gene="wffY"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WffY"
                     /protein_id="ACA24849.1"
                     /translation="MKIYIFLGDLSSKGGIERVSVALANGLAKFYDVTIISLYRATRN
                     LSFVPDEKVNVIYLYDEFEKSMYNRNLGAIIGLKFDFLYIIKKLKQLKRLNLELNKND
                     VLISSDIKMSLLLFFYAKKSKIIAIEHFEHDVGNLVLRKIRSALYPKLSAVVSQTGED
                     QIKYLQWLPRKKHKIIPNIISFEATDIPQNKIEQKNVLAVGRLTHQKGFDLLLQAWAD
                     ANTHDWRLKIIGDGEELNHLNSLITELNISNAEIIPFQKDIQRHYSSAGIFVLSSRFE
                     GLGMVLLEALSSGLACISFDCPAGPKSIISSDNGVLVPTGDTIKLSQAISFLINNEEE
                     RKRLQNKAAASVEKFKESNVIAKWRELLNEIS"
     gene            3722..4777
                     /gene="wffZ"
     CDS             3722..4777
                     /gene="wffZ"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WffZ"
                     /protein_id="ACA24850.1"
                     /translation="MKFHRKQYDAVFLTNVPAFYKVNLFNEIQKNKDIFVIFVSDKSK
                     IRNEDFYSYDFAFDHFFLNEENFEERSKIKTLFNLLRVLRTISYKKIIYSGWEVKEVT
                     LAALFNKREKNAIVIESSIIETKKTGLTWLLKKIAIGRMSLAYPSGLLQKAILETFSF
                     KGKTVITHGVGISNLKETSFHNKKTCTRNNPLRFIYVGRISSEKNIDFMVKVFKTLPY
                     ELILIGDGPLKKQFDDKTYSNIRFLGYIDNKKLSKELLKSDCFILPSLSEPWGLVVEE
                     ALTLGLPVIVSNHVGCHSDLVNDRNGIIFDVNDTQSFIDALSKMEKNYERFARGASEF
                     HASEIAKAQIDAYVGSI"
     gene            4777..6177
                     /gene="wzx"
     CDS             4777..6177
                     /gene="wzx"
                     /note="O antigen flippase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzx"
                     /protein_id="ACA24851.1"
                     /translation="MSNKNKTFKDFINYFLGDLFVKGFMFISLPLLSRIMSPEDYGRM
                     SLINAAVMILYVFISLNLQNAVINAYMKNEVDFPVYLGSVLWGLTAAQVLLVALSIYF
                     AVPLGMLLSISKYDVYWVVAICILLSYIYIYTSYLQGARLSSSFVKLNIFSKISEVVV
                     IFVFAWFLTQDKYLAKVYAQLVISFILLTYVLKKLKKIAVFKFNVRYFISALAFSSPL
                     IIHVLSNALLSQVDRLFIAKMLGEGQAGIYSFAYNIGMCILVVVMAWNSSWQPKLYKL
                     IDSKDNGKIIRIVDVSSLLLLIVSFLSILFSKQMVEVLADNRYRESISVVPVILIGNS
                     LIHIYLSYVNFTFYKKKTIYVSIGTLLAVAINIALNYILIPIYGIHGAAWATVIAYFM
                     LAFFHYLIATIMLKANPLSLFLLLWYSALLLASYFLVIYLDSLSLWISLSIKAMIIFI
                     ILIILMKTKIYNELKE"
     gene            6174..7337
                     /gene="wzy"
     CDS             6174..7337
                     /gene="wzy"
                     /note="O antigen polymerase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzy"
                     /protein_id="ACA24852.1"
                     /translation="MTVSIYLLLLAFVFLLAMSDFFIIADARNRFLLYIILFSLLVTF
                     IGLRYQTGLDWLFYNNLFNGEGFSLAIEPGYYFFSYVSSFLMGYWIYQALITAVLIIC
                     LKTFFEKNTKNYLFCIGFFFLYQFIFVTEAIRQIIALSIILVAYKKFYDGKKLQFHML
                     TILACSFHISAVIVFILIPFLKRRNIYILKILTIVGLVLAIFSVYPVDYLIQLLSLLP
                     AGGYIEKIRWYSQDDYAGSVLTFSLVFKVFVVLLFDYRFKSIKSHGQSLINARAYDFI
                     YTSVYLMIFMDVYLGRFGTISTRLDVYFIPCFLIALNHLINEHKQGVSRFIFFFVVMV
                     YFTINYLSIMNGYYFEKFYSPYQNYITEFLNPGSYSDRGWDVRYYFSNKELLQ"
     gene            7334..8443
                     /gene="wfgA"
     CDS             7334..8443
                     /gene="wfgA"
                     /note="glycosyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WfgA"
                     /protein_id="ACA24853.1"
                     /translation="MNLLINASNLYVGGGVQVAISVLEELSDSSFSFIAVVSPVVYSQ
                     LSDDAASCCIVIESSPSKLLNFKVRRQLDDIVKKNDISVVFTIFGPSYWSPKNVKHAI
                     GFALPWLIYDIEYIFKKLTLKAKLKFCILKLLQPYYFKKNADLIFTETDDVNLRVTKL
                     LNFEKEQVYTVSNTLNGLLKNSNCYDYSILDRLPTKEPNDIWLVTISHNYPHKNLEVI
                     KELVTVLPPCYKFILTVSSDFLQLVPKEHRERVITIGNATLSQCAPLYEVCDGLFMPT
                     LLECFSASYLEAMYMKKIIFTSDLPFAHTVCKDAAFYFAPHDVENIRSTLVNGFQNKE
                     ILNHKLNEGSKIYESFPSAKARALQYIDIIKSNLV"
     gene            8468..9502
                     /gene="fnlA"
     CDS             8468..9502
                     /gene="fnlA"
                     /note="4,6-dehydratase, 3- and 5-epimerase"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlA"
                     /protein_id="ACA24854.1"
                     /translation="MFKDKVLLITGGTGSFGNAVLNRFLETDIKEIRIFSRDEKKQDD
                     MRKKYNNSKLKFYIGDVRDYSSILSAARGVDFIYHAAALKQVPSCEFHPLEAVKTNVL
                     GTENVLEAAIANQVKRVVCLSTDKAVYPINAMGISKAMMEKVMVAKSRNVNSDKTVIC
                     GTRYGNVMASRGSVIPLFVDLIKAGKALTITDPNMTRFMMTLEDAVDLVLYAFEHGNN
                     GDIFVQKAPAATIETLAIALKELLNVEQHPVNVIGTRHGEKLYEALLSREEMIAAIDM
                     GDYYRVPPDLRDLNYGKYVEQGDSRISAVEDYNSHNTQRLDVEGMKTLLLKLPFIRAL
                     RAGEHYDLDA"
     gene            9495..10607
                     /gene="fnlB"
     CDS             9495..10607
                     /gene="fnlB"
                     /note="reductase"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlB"
                     /protein_id="ACA24855.1"
                     /translation="MPNMKILITGADGFIGRNLCLRLQEAGYCDLVKIDRGSSAADLE
                     TGLQDADFVYHLAGINRPKNVDEFAEGNSNLTQQIVDYLLAKHKSIPIMISSSIQAEL
                     VNAYGQSKAAAEKHIERYAAESGAAYFIYRYPNVFGKWCKPNYNSFVATFCHNIANNI
                     DITINDSFAPVNLVYIDDVCSDAIKLLSGKVESGYKTVKPVYSTTVGEVAELLYRFKE
                     SRSTLVTEAVGTGFIRALYSTWLSYLPADMFAYSVPSYGDARGVFCEMLKTPSAGQFS
                     FFTAHPGITRGGHYHHTKNEKFLVIRGQACFRFEHVITGERYEMNVSSDEFKIVETVP
                     GWTHDVTNIGADELIVMLWANEIFSRDEPDTIARPL"
     gene            10607..11737
                     /gene="fnlC"
     CDS             10607..11737
                     /gene="fnlC"
                     /note="C-2 epimerase"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlC"
                     /protein_id="ACA24856.1"
                     /translation="MKKLKIMSVVGTRPEIIRLSRVLAKLDEHCEHILVHTGQNYDYE
                     LNEVFFNDLGVRKPDYFLNAAGKNAAETIGQVIIKVDEVLESEKPEAMLVLGDTNSCI
                     SAIPAKRRKVPIFHMEAGNRCFDQRVPEETNRRIVDHTADINMTYSDIAREYLLAEGL
                     PADRIIKTGSPMFEVLTYYMPQIDNSDVLSRLNLRSGEFFVVSAHREENVDSPKQLVK
                     LATILNTIAEKYDLPVIVSTHPRTRNRINEQGIEFHPNINLLKPLGFHDYNHLQKNSR
                     AVLSDSGTITEESSIMNFPAVNIREAHERPEGFEEASVMMVGLDCERVLQALDILATQ
                     PRGETRLLRQVSDYSMPNVSDKVVRIVHSYTDYVKRVVWKEY"
     gene            11737..12948
                     /gene="wbuB"
     CDS             11737..12948
                     /gene="wbuB"
                     /note="L-fucosamine transferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WbuB"
                     /protein_id="ACA24857.1"
                     /translation="MKLALIIDDYLPNSTRVGAKMFHELAQEFIRRGHDVTVITPDIC
                     LQDDVSFSTFQGVKTWRFKSGPLKDVSKIQRAINETLLSYRAWNSIKSQIKKETFDGV
                     VYYSPSIFWGHLVKKIKSRCQCPAYLILRDMFPQWVIDAGMLKAGSLIERYFRVFERS
                     SYRQANRIGLMSDKNLEVFRVNNKGYPCEVLRNWASLTPTVPPQGYIPLRQRLGLDDK
                     VIFFYGGNIGHAQDMGNLMRLARKMAEHPQAHFLFIGQGDEVELINSLAAEWSLPNFT
                     YLASVNQDEFKFILSEMDIGLFSLSARHSSHNFPGKLLGYMVQSLPILGSVNAGNDLL
                     DVVNQNNAGLIHINGEDDKLHESALLMLKDVAARRQFGLGANALLREQFSVESAAQTI
                     EMRLEACNATH"
     gene            12935..13333
                     /gene="wbuC"
     CDS             12935..13333
                     /gene="wbuC"
                     /note="unknown"
                     /codon_start=1
                     /transl_table=11
                     /product="WbuC"
                     /protein_id="ACA24858.1"
                     /translation="MRLIDTHQLEALYEQAGKSARLRAHLLLHNSHREKVQRLLIALV
                     QGSYVDPHFHELPHQWEMFVVMQGQVQVCLYGKDGEIINQFVAGENTAISVVEFSPGD
                     IHSVECLSPRALMMEVKEGPFDPSFAKAFI"
ORIGIN      
        1 attgtggctg cagggatcaa agaaattgtt ctggttacgc actcgtccaa gaatgcggtc
       61 gaaaaccact tcgacacctc ttacgaactc gaagcgctgc tggagcagcg tgttaaacgt
      121 caactgctgg cggaagtgca gtccatttgt cctcctggcg tgaccatcat gaacgtgcgt
      181 caggcgcagc cgctgggcct gggccactcc atcctgtgtg ctcgccctgt cgtgggcgac
      241 aacccgttta tcgtggtcct gccggatatc atcatcgata ccgcttctgc ggatccgctg
      301 cgctataacc tggcggcgat ggtggcgcgt ttcaacgaaa caggccgcag ccaggtgctg
      361 gcgaaacgca tgaaaggcga tctgtccgag tactctatta tccagactaa agaagcgctg
      421 gagacagaag ggcaggtgag ccgcatcgtt gagttcatcg aaaaaccgga tcagccgcag
      481 acgctggatt ctgacctgat ggcggttggt cgttatgtcc tgaacgcgga tatctgggcc
      541 gagctggaaa aaaccgagcc aggcgcctgg gatcgtatcc agttaaccga tgcgatcgcc
      601 gagctggcga aaaagcagtc tgttgacgcg atgctgatga ccggtgagag ctacgactgc
      661 ggtaagaagc tgggctacat gcaggcgttt gtgaactatg ggctgcggaa cctgaaggaa
      721 ggggcgaagt tcagaagccg gattgagaag ttgttagcta acgactgatt ttatcttagt
      781 tgatttgcac aagcggcaat catcatttgg ggatgttgaa acataaccaa aatggtagct
      841 gccgtttttt gttattaatt ctaatgataa catggattta tctgatttaa atctggtcag
      901 atttgtaacg atttgtgctt gtttctgagg tcgtttagga cgacaattag cagagttgta
      961 atgcagttgt ctagtggcag ttagtgtccg atgacagaca acagaaaatg aaagaatcat
     1021 gcatcattca gtgcactggt agctgttgag ccaggggcgg tagcatattt aattgtgaga
     1081 gaacaatgaa gagaattatt acgtttggta catttgatgt ttttcatgtt ggtcatgtta
     1141 atatccttga gcgaactgct tcacttggcg actatcttat tgtaggtgta agttcagata
     1201 aattgaattt caataaaaaa ggtcgttacc ccatttataa tcaagaagac cgctgtcgta
     1261 taataaattc tcttagagtt gtgaatgatg tatttattga agaatcttta gagcaaaaaa
     1321 aagagtatat aatccaatac gaagctgata ttttagttat gggtgatgat tgggctggcc
     1381 gatttgattg ggtaaatgac atttgtgatg ttatttattt accaagaaca ccatcagtat
     1441 ctaccacaga aattattgaa gttgtgaaga ccctcagatg acgaatttca aaaaaatagc
     1501 aagaaaaata attagtaaaa gcatttcatt gttaaattat tttatcccca agaaaaaaaa
     1561 tagaattttt ttcaaaagca aacctgacta ctcaggtaat tgtaaggcac taagcgatta
     1621 tattatagag aaaaaacttc catatcatat cgtttggtct gttaaaaaag aaattaatca
     1681 aaaaggaatt actgtagtaa gagctggttc attgaaagaa tttttctatt actttacaag
     1741 taaatatgtt attactacgc ataatgaaat gataggtcca attgcaacaa atcaaaaata
     1801 cataagcttg tggcatggaa tgccttttaa gaaaatttgt tatcttggag agaatgatca
     1861 tcaaggaatg atagattatt cagccattag gattgccact tccgaagtaa tgcgttctat
     1921 aatttcagca agctttcgtg aaaaagccaa taatgtatat attacaggcc agcctcgtaa
     1981 tgattttttg ttcaaaccaa ttagtctgac agatattggt attaaatcta taaagaacaa
     2041 aaaaattgta atgtttgctc caacatttcg tatgaataat gaagatataa gatattctga
     2101 tggagcggaa attattgata ataattttct tcgagtaaat gatttctgca tggaagagat
     2161 agattattat cttgaacaaa gcaatttaca tttgatatta aaattgcatc catacgagga
     2221 ggaatatttc cgcgggatcg caacactaag ttcgaatata actattataa gttctgatga
     2281 actcacgcaa aaaaatatcg atttgaatca gttgctttcc ttggtcgata ttttaataac
     2341 agattactca tcaatttatt tagattactt aattctaaat aaacctctaa tttttttagt
     2401 tcctgatgta gatgcttata gttctgcacg cggtgggttt actttagaac cttttgattt
     2461 ttggacgcca ggagataagg ttagctgtca aaggtcatta ttgaattcaa taaataaaat
     2521 aatcactgga aatgatgagt atgctgaaaa acgtaaccaa ataaatctca taataaataa
     2581 atactctgat gctaataata gccagagagt cattgaattg atgaagagtt tatcatgaaa
     2641 atatacattt tcttaggaga tttaagttcg aaaggtggta ttgagcgtgt ttcagtagca
     2701 ttagccaatg gattggctaa attttatgat gtcactatca ttagcttata tcgtgcaact
     2761 agaaatttat catttgtccc ggatgaaaag gtcaatgtga tctatttgta cgatgaattt
     2821 gaaaagagta tgtataatcg taatctggga gctatcatag ggttaaagtt tgatttctta
     2881 tatattataa aaaagttgaa gcaacttaaa agattaaatt tagaactaaa taaaaatgat
     2941 gtgcttattt caagcgatat taaaatgtct ctgctattat ttttctatgc aaaaaaaagc
     3001 aaaattatag ctattgagca ttttgaacat gatgttggta atttagtgtt gagaaaaatt
     3061 agaagcgcac tatatcctaa attatcagca gttgtatcgc aaactggcga agatcaaatt
     3121 aagtatttgc aatggttacc tagaaagaaa cataaaatca ttccaaatat tattagcttc
     3181 gaagcgaccg atataccgca aaataaaata gaacaaaaaa atgtacttgc tgtgggacga
     3241 ttaactcatc aaaagggttt tgatttactt ctacaagctt gggcagacgc aaatactcat
     3301 gattggcgct taaagatcat tggagacgga gaagagctga accatttaaa ttctctaatt
     3361 accgagttaa atatctctaa cgctgaaatt atcccttttc aaaaggatat tcaaaggcat
     3421 tattcttctg caggaatatt cgtactttct tctcgctttg agggtttggg tatggtgctt
     3481 ttagaagctc ttagcagcgg cttggcgtgt attagttttg attgtccagc tggtcctaaa
     3541 agtataatct caagtgataa tggggtgtta gttccaactg gtgacactat aaaattatca
     3601 caagctattt ctttcttgat aaataacgaa gaagaaagaa aacggttaca aaacaaagct
     3661 gctgcttctg ttgaaaaatt caaagaatca aacgtaattg caaaatggcg agagttattg
     3721 aatgaaattt catagaaaac aatatgatgc agtatttctt acaaacgtac ctgctttcta
     3781 taaagtaaat ttgttcaacg aaattcaaaa aaataaagat atttttgtta tattcgtttc
     3841 agataagtcg aaaattagga atgaagattt ttattcatac gactttgcgt ttgaccactt
     3901 ttttcttaat gaagagaact ttgaagaacg aagtaaaata aaaacactat tcaatttact
     3961 tagagtgtta cgaacgattt cgtacaaaaa aattatatat tcaggatggg aagttaaaga
     4021 agtaactcta gctgcattat ttaataagcg ggaaaaaaat gcaatagtga tcgaaagtag
     4081 cattattgaa acgaagaaaa ctggtttgac atggcttcta aaaaaaatag ctatcggtcg
     4141 tatgtcgctt gcttacccat cagggctatt gcaaaaagca atattggaga cattctcttt
     4201 taaaggaaaa actgttatta cccatggcgt tggtatctct aatttaaaag agaccagttt
     4261 tcataataaa aaaacatgta caaggaataa tcctcttcgt ttcatctatg ttggaaggat
     4321 ttcatcggaa aaaaatatag attttatggt gaaagtattt aaaactcttc cttacgaatt
     4381 gatactaatt ggagatggtc cattaaaaaa acagtttgac gataaaacct atagcaatat
     4441 cagattttta ggctatattg acaataaaaa attatcaaaa gaactactta aaagtgattg
     4501 ttttattctt ccgtcattat ctgaaccgtg gggattagta gtagaggagg ctttgacatt
     4561 agggcttccg gttatagtca gtaaccatgt gggctgtcat agtgatttag tcaatgatag
     4621 aaatggcatt atattcgatg tgaacgatac acaatccttt attgacgcat tgtcgaaaat
     4681 ggaaaaaaat tatgaacgct ttgcccgtgg tgccagcgaa ttccatgcta gtgaaatagc
     4741 aaaagcacag atcgatgctt atgtaggtag catctgatga gcaacaaaaa caaaacattt
     4801 aaagatttta taaattattt tttaggcgat ctttttgtca aaggatttat gtttatctcg
     4861 ctacctctac tttcgagaat aatgtcgcca gaagattatg ggcggatgtc ccttataaat
     4921 gcagctgtta tgattttata tgtttttata agtttaaatc tccaaaatgc tgttatcaac
     4981 gcttacatga aaaatgaagt tgattttcca gtatatctag gtagtgtatt atggggattg
     5041 accgccgcgc aagtattgtt agtcgcttta agtatatatt ttgctgttcc gcttggaatg
     5101 ttattgagta ttagcaaata tgatgtttat tgggttgtcg ccatttgtat tttgctaagc
     5161 tatatatata tatatactag ctatctacag ggtgcacggc tcagttctag ctttgtcaaa
     5221 ctgaatatat ttagtaagat atcagaagtt gttgtcattt ttgtctttgc ttggttttta
     5281 actcaagata aataccttgc taaggtatat gctcagttag tgattagctt tattttactg
     5341 acatatgtgt tgaagaaact aaaaaagata gctgtattca aatttaatgt acgatatttt
     5401 atatcagcac ttgcatttag ttctccatta attatacatg ttctttcaaa tgctttgctt
     5461 tcacaagttg accgattgtt tatcgcaaag atgttgggag aggggcaggc tggtatatat
     5521 tctttcgcat ataatatcgg aatgtgtata ttagtggttg ttatggcctg gaactcttcg
     5581 tggcaaccta aattatataa gcttattgat tcgaaggata atggtaaaat aattcgaatt
     5641 gtcgatgtaa gttccttatt attattaata gtatcatttt tatctattct tttttcaaaa
     5701 cagatggttg aagtccttgc ggacaatcgc tatagggaaa gtatatccgt cgttcctgtc
     5761 atattgattg gtaactctct gattcatatt tatttaagct atgttaactt tactttctat
     5821 aagaaaaaaa caatatatgt ttcaattggt acattgcttg cggtagcgat aaatattgct
     5881 ttgaattata tactcatacc aatatacggt atccacggag cagcatgggc tacagtaata
     5941 gcttatttta tgctggcatt tttccattat ctcatagcaa caataatgtt aaaggcaaac
     6001 ccactctcat tgtttctgtt attatggtat tcagctttgt tattggcttc gtatttctta
     6061 gtaatatacc ttgactcttt gtctctttgg atctctttat caataaaggc aatgatcatt
     6121 tttattatcc tcatcatcct tatgaaaaca aaaatctata atgaattaaa ggaatgacag
     6181 tgtcgatata tcttctgctt ctagctttcg tatttctgct tgcaatgtca gattttttta
     6241 tcattgctga tgccagaaat cgttttttac tttatataat actattttcg ctattagtaa
     6301 cctttatagg tttaagatat caaactggac ttgattggtt attttataac aatctattta
     6361 atggagaggg tttttcatta gccattgagc ctggatatta ttttttctcg tatgtttcat
     6421 cttttttaat ggggtattgg atttatcagg cattaataac cgccgttcta ataatatgtt
     6481 taaaaacatt ctttgaaaaa aacactaaaa actatctgtt ttgcataggt tttttcttct
     6541 tatatcaatt tattttcgtg acggaagcaa tacggcaaat aatcgctctg tcaattattt
     6601 tggttgcata taaaaagttt tatgatggta agaaattgca atttcacatg cttaccattt
     6661 tggcttgttc attccatatt tctgctgtaa ttgtctttat tttgattccg tttttaaaac
     6721 gcagaaatat atatatatta aaaatactga caatcgttgg tttagttttg gcaattttta
     6781 gtgtttatcc tgttgactac ttaatacagt tactgtcatt gctccctgct ggtggttata
     6841 tagaaaagat aagatggtat agtcaggatg attatgctgg atcagtactt acgttttcat
     6901 tagtattcaa agtttttgtt gtgcttttat tcgattacag atttaaatca ataaaatcac
     6961 atggtcaaag tcttattaat gcgagggcat atgattttat ttatacttcg gtttatttaa
     7021 tgatattcat ggacgtttat cttggtaggt ttggtactat tagcaccagg cttgacgtat
     7081 actttatacc atgtttttta atagctctta atcatttaat aaatgaacac aaacaaggtg
     7141 tgagtcgttt catattcttc ttcgttgtca tggtttactt tactataaat tatctcagta
     7201 ttatgaacgg atattacttc gagaaatttt acagtcctta tcaaaattat ataactgaat
     7261 ttttaaatcc gggcagttat agtgatagag ggtgggatgt tagatattat ttcagcaata
     7321 aggaattatt gcagtgaatc ttttgattaa tgctagtaat ctgtatgttg gtggaggagt
     7381 ccaggtagca atttctgtac tggaagagtt atctgattca tcattttctt ttattgcggt
     7441 tgtttcacca gttgtttatt cgcagttaag cgatgatgca gcatcatgtt gtatagtgat
     7501 tgaatcttct ccatcaaaat tgttgaattt taaagttaga aggcaactcg acgatatagt
     7561 taaaaaaaat gatatttctg tagttttcac aatcttcggt cctagctatt ggtctccgaa
     7621 aaatgttaaa catgctattg gttttgcgct cccttggttg atttatgata ttgaatatat
     7681 atttaaaaaa ttgactttaa aagctaaatt gaaattttgc attttaaaat tattacagcc
     7741 atattacttc aagaaaaatg ccgacttaat ttttactgaa acagatgatg tcaacttgcg
     7801 ggtaacaaaa cttcttaact ttgaaaaaga acaagtctat actgtttcaa acacacttaa
     7861 tggtttatta aaaaattcaa actgttatga ttacagcatt ttggatagat tacctacgaa
     7921 agaaccaaat gatatttggt tggtaactat ttctcataat taccctcata agaacttaga
     7981 agtcattaaa gaattagtaa cagtattgcc accttgttat aagtttattt taacagtttc
     8041 aagtgatttt ttgcagctag tcccaaaaga gcatagagag cgagtcatca ccataggtaa
     8101 tgcaacactt agtcaatgtg ctccgttgta tgaagtttgt gatggattat tcatgccaac
     8161 acttttagaa tgctttagtg cttcttactt agaagcaatg tacatgaaaa aaataatctt
     8221 cacttctgat ctgccttttg ctcacactgt ttgcaaagat gcagcatttt actttgctcc
     8281 tcatgatgtt gaaaatatta ggagtacact tgttaatggc tttcaaaaca aagaaattct
     8341 taaccataaa ttaaatgaag gttcgaaaat ttatgaaagt tttccttctg cgaaagctcg
     8401 agcattgcag tatatagata taataaaatc caacttggta taaattgtag attttgaggt
     8461 gttaaaaatg tttaaagata aggttttact tattactggc ggaacagggt ctttcggtaa
     8521 cgctgtactt aatcgttttc ttgaaactga tattaaagaa ataaggattt tttctcgcga
     8581 tgaaaaaaaa caagacgata tgcggaaaaa atataataat tctaagttaa aattctacat
     8641 tggggatgta agggattatt ccagcattct aagcgccgca cgtggcgtcg actttatata
     8701 ccatgctgct gcattaaaac aagttccgtc atgtgaattt catcctctgg aagcagtgaa
     8761 aactaacgta ttaggtacag agaatgtgct tgaagcagca attgcaaacc aggttaaacg
     8821 tgtcgtttgc ttaagcacgg ataaggcagt atatccgatt aatgccatgg gtatttccaa
     8881 agcaatgatg gaaaaagtga tggtcgcaaa atcacgtaat gttaatagcg acaaaactgt
     8941 gatttgcggt actcgctacg gcaacgtgat ggcttcacgt ggttccgtta ttcccttatt
     9001 cgttgatctg atcaaagcgg gcaaagcgct gacgatcact gacccaaata tgacccgttt
     9061 tatgatgacg cttgaagatg ctgtcgatct ggtcctatat gcgtttgaac atggtaataa
     9121 tggcgatata tttgtccaaa aagcgcctgc tgcaacgatt gaaacattag ccattgctct
     9181 caaagaactt cttaatgttg agcaacatcc tgttaatgtt atcggaacgc gccatggtga
     9241 gaaactttat gaagcgctgc ttagccgtga agagatgatt gccgccattg acatggggga
     9301 ttactaccgt gttccaccag acctgcgcga tcttaactat ggaaaatacg tagaacaagg
     9361 tgatagccga atctcagcag tagaggatta taactctcac aatacacagc gactggatgt
     9421 tgaagggatg aaaacgcttc ttttgaaatt accttttatt cgtgcactgc gtgcgggtga
     9481 acattacgat ctggatgcct aatatgaaaa tcctgattac tggagctgat ggttttattg
     9541 gacgtaacct gtgcttacgc cttcaggaag caggctactg tgaccttgtt aagattgacc
     9601 gcggttcaag tgcggctgat ctggaaactg gccttcaaga tgctgatttt gtctatcatc
     9661 tcgcaggtat caatcgacct aaaaacgttg atgaatttgc cgaggggaat agcaatctga
     9721 ctcaacagat tgttgattat cttttagcca agcataaaag catacctatt atgatcagtt
     9781 cttccattca ggctgaactg gttaatgctt atggtcaaag taaagctgca gcagaaaaac
     9841 atattgaacg ctatgcagct gaaagcggtg cagcttattt tatttatcgt tatccgaatg
     9901 tttttggtaa gtggtgtaag cctaattata attcgttcgt ggcgaccttt tgccataata
     9961 ttgccaacaa tatcgatatc acgatcaatg actccttcgc gcctgttaat cttgtttata
    10021 ttgatgatgt ctgttctgat gcgataaagc tcttgtctgg aaaggttgaa agcgggtaca
    10081 aaactgttaa gccagtatat tcgacgacag taggtgaggt ggcggaatta ctttatcgct
    10141 tcaaagaaag ccgttccact cttgtcaccg aggctgtagg aacagggttc atccgcgcgc
    10201 tgtattcgac gtggttaagt tatctcccag ccgatatgtt tgcgtattca gttccctctt
    10261 acggagacgc ccgaggggtt ttttgtgaaa tgttaaaaac cccttcagcg gggcagtttt
    10321 cattttttac agcgcatccc ggcattacac gtgggggtca ttatcatcac accaaaaatg
    10381 agaagttcct ggtcattcgc ggccaggcat gctttaggtt tgaacatgtg attaccggtg
    10441 agcgatatga gatgaatgtt tcctcagatg agttcaaaat cgttgagaca gtccccggct
    10501 ggacacatga tgttacaaat attggagcgg atgaattgat agtcatgctg tgggcaaacg
    10561 aaattttcag tcgcgatgag cctgatacta ttgcgagacc tctgtaatga aaaaactaaa
    10621 aattatgtct gttgttggta cgcgtcccga gattatccgt ctgtcacgcg ttctcgctaa
    10681 gcttgatgaa cactgcgagc atattcttgt ccatactggt caaaactatg attatgagtt
    10741 aaacgaagta ttctttaatg accttggtgt acgaaaaccc gattactttt taaatgctgc
    10801 tgggaaaaat gctgcagaaa ccatcggtca ggttatcatc aaagttgatg aggtacttga
    10861 atccgaaaag cctgaagcaa tgttggtgct gggtgataca aactcctgta tttctgcaat
    10921 tccagccaaa cgccgtaaag tgcctatctt ccatatggaa gctggcaatc gttgtttcga
    10981 tcagcgcgtc ccggaagaga ccaatcggcg cattgtagac cataccgctg acatcaatat
    11041 gacctacagc gatattgcac gtgaatacct tcttgctgaa ggcctcccag cggaccgaat
    11101 tattaaaacc ggtagcccaa tgtttgaggt acttacgtat tatatgcctc aaatcgataa
    11161 ttcggatgta ctgtcgcgtc tgaacctgcg ttcaggcgaa tttttcgtcg tcagcgcgca
    11221 tcgtgaagag aatgttgatt ctcccaaaca gctagtcaag cttgcgacta ttctcaatac
    11281 tattgctgaa aaatatgatt tgccggttat tgtatccact catccgcgga cacgtaatcg
    11341 tattaacgag caagggattg aattccatcc aaatattaat ctactgaaac cgttaggttt
    11401 ccatgattac aaccatttgc agaaaaattc acgtgctgtg ctgtctgaca gcggtacgat
    11461 aactgaagaa tcttccatta tgaatttccc ggcggtaaat attcgggaag cacatgagcg
    11521 tccagagggc tttgaagaag cctctgtcat gatggtgggc ctggattgtg aacgtgttct
    11581 acaggcactg gatattctgg caacacagcc ccgcggcgaa acccgtcttt tacgacaagt
    11641 aagtgactac agcatgccta atgtgtcaga taaagtcgtc agaatcgttc attcttatac
    11701 tgattatgtc aagcgagtcg tctggaaaga atactgatga aacttgcttt aatcatagat
    11761 gattacctgc ccaatagtac gcgagttggt gcaaaaatgt ttcatgaatt ggctcaggaa
    11821 tttattcgcc gtgggcatga tgttacggta attacacctg acatctgtct tcaggatgat
    11881 gtgtccttta gcaccttcca gggggtcaag acatggcgtt tcaaaagtgg gcctctcaag
    11941 gatgtgagca aaattcaacg agccatcaat gaaacacttc tatcctatcg tgcctggaat
    12001 tccattaaaa gccagataaa aaaagagact tttgatgggg tagtttatta ctcaccctcc
    12061 attttctggg ggcacttagt caagaaaatt aaatctcgtt gccagtgtcc ggcttacctg
    12121 attttgaggg atatgttccc gcaatgggtg atagacgctg gcatgttaaa agccggttcc
    12181 ctcatcgaac gctatttccg tgttttcgaa agatcatctt atcgccaggc aaaccgtatc
    12241 gggctgatgt cagataagaa tcttgaggtc tttcgggtta acaacaaagg ttatccttgt
    12301 gaggttttgc gtaactgggc ttctctcacg ccgacggtac caccccaggg ttatatccca
    12361 ttgcgtcagc gtcttggcct tgatgataaa gttattttct tctatggagg gaatatcggt
    12421 catgcgcagg atatggggaa tctgatgcgt cttgctcgaa aaatggctga gcatccgcaa
    12481 gcccattttt tatttatcgg gcagggggat gaagttgaat taatcaattc tttggctgcc
    12541 gagtggtcat tgcccaactt tacgtatttg gcctctgtca atcaggatga atttaaattt
    12601 atcctctcgg aaatggatat aggcttgttt tcactttccg ccagacattc ttcgcataat
    12661 ttcccgggta aattgctagg gtatatggtt cagtccttac ctatactagg cagtgtgaat
    12721 gctggtaacg atttgcttga tgtcgtcaat caaaataatg ccggattaat tcatatcaat
    12781 ggtgaggatg acaagcttca tgagtccgca ctgttaatgc ttaaggatgt tgctgcgcga
    12841 cgtcaattcg gcttaggcgc gaatgcatta ttgagagaac agttctccgt tgagtctgcg
    12901 gcacagacta tagaaatgag gttagaggca tgtaatgcga ctcattgata ctcaccaact
    12961 tgaagcttta tacgaacaag ccggaaaatc tgcacgcttg cgcgctcatc tcttattgca
    13021 caattcgcac cgagagaaag tgcaacgtct gctcattgcc ttggttcagg gcagctatgt
    13081 cgatccgcat ttccatgaac ttcctcatca atgggagatg tttgtcgtta tgcaggggca
    13141 ggttcaagtc tgtttgtacg gcaaagatgg cgaaatcatt aatcaatttg tcgctggaga
    13201 gaatactgca ataagcgtag tcgagttttc tccgggtgat atacacagtg tcgaatgtct
    13261 ctctccgaga gcattaatga tggaagtgaa agaagggcct tttgatcctt cctttgccaa
    13321 ggcgttcatc taacgcccct ctgaatcgca tcttccgcta tctactcagg ctcatcctga
    13381 gttaacatct aagccacatt tcaagccgcg cacagtcgcg gcgaccacac ctgacaggag
    13441 tatgtaatgt ccaagcaaca gatcggcgtt gtcggtatgg cagtgatggg gcgcaacctg
    13501 gcgctcaaca tcgaaagccg tggttatacc gtctccgttt tcaaccgctc ccgtgataag
    13561 accgaagaag tcatcgctga gaatccgggt aagaaactgg ttcctttcta tacggttaaa
    13621 gagtttgttg aatctctgga aaggcctcgt cgtatcctgt taatggtgaa agcgggcgca
    13681 ggtaccgatg cagccatcga ttccctgaaa ccttatctgg acaaaggcga catcatcatt
    13741 gatggtggta acaccttctt ccaggacacc attcgtcgta accgtgaact ctctgctgaa
    13801 ggtttcaact tcatcggtac cggtgtttcc ggtggtgaag agggcgcgct gaaaggccca
    13861 tctatcatgc ctggcggcca gaaagaagcg tacgagcttg ttgcgccaat cctgaccaaa
    13921 atcgctgcgg ttgcggaaga tggtgagccg tgtgtgacct atatcggtcc ggacggtgca
    13981 ggccactatg ttaagatggt tcacaacggc atcgaatacg gcgatatgca gctgattgct
    14041 gaagcctact ctctgctgaa ggggggcctg aacctttcca acgaagaact agcagagacc
    14101 ttcactgagt ggaacaaagg cgagctgaac agctatctga tcgacatcac caaatatatc
    14161 ttcacgaaga gagatgaaga gggtaaatac ctgggtcgat gtgattcctt gacgaagccg
    14221 ccgaacaagg gtaccggcaa atgggacca
//