LOCUS       GU014554               17547 bp    DNA     linear   BCT 08-JUN-2010
DEFINITION  Escherichia coli strain E47a O-antigen gene cluster, complete
            sequence.
ACCESSION   GU014554
VERSION     GU014554.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 17547)
  AUTHORS   Wang,Q., Wang,S., Beutin,L., Cao,B., Feng,L. and Wang,L.
  TITLE     Development of a DNA microarray for detection and serotyping of
            enterotoxigenic Escherichia coli
  JOURNAL   J. Clin. Microbiol. 48 (6), 2066-2074 (2010)
   PUBMED   20351209
REFERENCE   2  (bases 1 to 17547)
  AUTHORS   Wang,Q., Wang,S., Beutin,L., Cao,B., Feng,L. and Wang,L.
  TITLE     Direct Submission
  JOURNAL   Submitted (28-SEP-2009) TEDA School of Biological Sciences and
            Biotechnology, Nankai University, 23 Hongda Street, Tianjin 300457,
            P. R. China
FEATURES             Location/Qualifiers
     source          1..17547
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /strain="E47a"
                     /db_xref="taxon:562"
                     /note="serogroup: O25"
     misc_feature    1..17547
                     /note="O-antigen gene cluster"
     gene            1137..2222
                     /gene="rmlB"
     CDS             1137..2222
                     /gene="rmlB"
                     /note="dTDP-D-glucose 4,6-dehydratase"
                     /codon_start=1
                     /transl_table=11
                     /product="RmlB"
                     /protein_id="ADI43256.1"
                     /translation="MKILVTGGAGFIGSAVVRHIINNTQDSVVNVDKLTYAGNLESLA
                     DVSDSERYVFEHADICDAAAMARIFAQHQPDAVMHLAAESHVDRSITGPAAFIETNIV
                     GTYVLLEAARNYWSALDSDKKNSFRFHHISTDEVYGDLPHPDEVNNKEKLPLFIETTA
                     YAPSSPYSASKASSDHLVRAWKRTYGLPTIVTNCSNNYGPYHFPEKLIPLVILNALEG
                     KALPIYGKGDQIRDWLYVEDHARALYTVVTEGKAGETYNIGGHNEKKNIDVVLTICNL
                     LDEIVPKEKSYREQITYVADRPGHDRRYAIDAEKIGRELGWKPQETFESGIRKTVEWY
                     LSNTKWVDNVKSGAYQSWIEQNYEGRQ"
     gene            2222..3121
                     /gene="rmlD"
     CDS             2222..3121
                     /gene="rmlD"
                     /note="dTDP-6-deoxy-L-mannose-dehydrogenase"
                     /codon_start=1
                     /transl_table=11
                     /product="RmlD"
                     /protein_id="ADI43257.1"
                     /translation="MNILLFGKTGQVGWELQRALAPLGNLIALDVHSTDYCGDFSNPE
                     GVAETVRSIRPDIIVNAAAHTAVDKAESEPEFAQLLNATSVEAIAKAANEVGAWVIHY
                     STDYVFPGSGDRPWLETDATAPLNVYGETKLAGEKALQEHCAKHLIFRTSWVYAGKGN
                     NFAKTMLRLAKEREELAVINDQFGAPTGAELLADCTAHAIRVALNKPDVAGLYHLVAS
                     GTTTWYDYAALVFEEARKADIPLALNKLNAVPTTAYPTPACRPHNSRLNTEKFQQNFA
                     LVLPDWQVGVKRMLNELFTTTAI"
     gene            3179..4057
                     /gene="rmlA"
     CDS             3179..4057
                     /gene="rmlA"
                     /note="glucose-1-phosphate thymidylyltransferase"
                     /codon_start=1
                     /transl_table=11
                     /product="RmlA"
                     /protein_id="ADI43258.1"
                     /translation="MKTRKGIILAGGSGTRLYPVTMAVSKQLLPIYDKPMIYYPLSTL
                     MLAGIRDILIISTPQDTPRFQQLLGDGSQWGLNLQYKVQLTPDGLAQAFIIGEEFIGG
                     DDCALILGDNIFYGHDLPRLMDAAVNKESGATVFAYHVNDPERYGVVEFDKNGTAISL
                     EEKPLQPKSNYAVTGLYFYDNDVVEMAKNLKPSARGELEITDINRVYMEQGRLSVAMM
                     GRGYAWLDTGTHQSLIEASNFIATIEERQGLKVSCPEEIAYRKGFIDAEQVNVLAEPL
                     KKNAYGQYLLKMIKGY"
     gene            4060..4602
                     /gene="rmlC"
     CDS             4060..4602
                     /gene="rmlC"
                     /note="dTDP-6-deoxy-D-glucose-3,5 epimerase"
                     /codon_start=1
                     /transl_table=11
                     /product="RmlC"
                     /protein_id="ADI43259.1"
                     /translation="MNVIKTEIPDVLILEPEVFGDERGFFMESFNQKVFEEAVGRKVE
                     FVQDNHSKSIKGVLRGLHYQLEPYAQGKLVRCVVGEVFDVAVDIRKSSGTFGKWVGVN
                     LSAENKRQLWIPEGFAHGFLVLSDLAEVLYKTNQYYAPSHERNIIWNDPLLNIKWPRT
                     ALITLSDKDANGEKLELSEY"
     gene            4604..5863
                     /gene="wzx"
     CDS             4604..5863
                     /gene="wzx"
                     /note="O-antigen flippase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzx"
                     /protein_id="ADI43260.1"
                     /translation="MSLLKHSIWNVAGYFIPTLIAIPAFGLIAREIGVELFGLYTLSM
                     IFIGYASIFDAGLTRAVVREIALLKNRLDDCNTIIVTSIIAVVFLGGIGGGGVFLLKD
                     HIIELLNMSPIYYVDAIKSLILLSSLIPVFLVTQILLAELEGREYFGILNIQKSLGNS
                     LIAGLPALFVLINQTLFSAIIGVAIARVICLWLSYIMSRKRITIDISFFSITVLKRLF
                     RYGGWVTISNIISPILASMDRFILSHIQGASKISFYTVPNELVTRLGIVPGSLGKAVF
                     PKLSHASSFTASYAEQKKAYILMTVIVLPLVLFIYYYAKFILTLWMGAEYAGISVEIL
                     RIMLIGYIFNCYSQISFANIQAFGKAKYTAYIHMMEFIPYLIMLYIISKECGVIGVAW
                     LWTIRVIIDFLMLFYMSYRCNNLMKKG"
     gene            5868..6833
                     /gene="wekA"
     CDS             5868..6833
                     /gene="wekA"
                     /note="glycosyl transferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WekA"
                     /protein_id="ADI43261.1"
                     /translation="MIYIVVLNWNGAIDTINCVKSLMNLNYDDYKIIVVDNCSTDNSY
                     DSIKENLNALYITGKSFIEVKYEDRSKYQTLENDKIILIQSPKNNGYASGNNIGIELA
                     LNQEDMKYVWVLNNDTEVDKEALTHLISKCDSDKNIGICGSRLVYFTDREMQQGLGGV
                     HNRWLCTTKNYEMGRLVSKKYDDEVISNNIDYIIGASMFFSRECLETVGLMNEEYFLY
                     YEELDICLRAKAKNFKLGICSDSLVYHKIGASTDGGKSMIADLCSIKNRLAITEKFYP
                     QYYWTVWLSLFVVAFNRARRGEFNKMKRCLNVMFNFKRNKGSKCH"
     gene            6900..8048
                     /gene="wekB"
     CDS             6900..8048
                     /gene="wekB"
                     /note="glycosyl transferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WekB"
                     /protein_id="ADI43262.1"
                     /translation="MKVAFLSAYDPLSTSSWSGTPYYMLKALSKRNISIEILGPVNSY
                     MVYMLKAYKLILRCFGKEYDYSRSKLLSKYYGRIFERKLKKIDGLDFIIAPAGSSQIA
                     FLETNIPIIYLSDTTYDQLKNYYPNLNKKTIINDEDASLIERKAIEKATVVSFPSKWA
                     MDFCKDYYRLDSDKLVEIPWGANLFEDIHFANKTIIQKISYTCLFLGVDWERKGGKTA
                     LKAIEYVRELYGIDVRLKICGCTPNQEILPAWVELIDKINKNNVEEYQKFIDVLSNAD
                     ILLLPTIAECYGMVFCEAAAYGLPVVATDTGGISSIVINERTGILIKDSSDYKHFGNA
                     IHKIISSVETYQNYSQNARVRYNKILHWDNWAKKIIEIMYEHKNRRTK"
     gene            8020..9081
                     /gene="wzy"
     CDS             8020..9081
                     /gene="wzy"
                     /note="O-antigen polymerase"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzy"
                     /protein_id="ADI43263.1"
                     /translation="MSIRIEEPNSTKRIIFLFLLFLVFPDFLFYTLGIDNFSISTIIS
                     IILLFVFLRAKNTCKDNLLIIVVLFILLCFNCLLSMLFNIEQVLSFKIVLSMYSILIM
                     AYVSSCYAQTLWLCSEEILKRSVFYLFAFLCLIGIISILLQKTEIIHDKSMILFPEPS
                     AFALVFIPIFSFCLYYTRGGGVLLLYILSLGIALGIQNLTMLVGIVISVFVMKKITIR
                     QTIVIFLGAWIFSMILSDLDISYYTSRLDFKNTTNLSVLVYLSGIERAFLNFITSYGL
                     GIGFQQMGVNGEVGVYQQILADLDAPMLNIYDGSFISSKLISEFGFIGAIMCIFYLFI
                     FFDFICVSKKIRDIHRSIF"
     gene            10108..11211
                     /gene="wekC"
     CDS             10108..11211
                     /gene="wekC"
                     /note="glycosyl transferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WekC"
                     /protein_id="ADI43264.1"
                     /translation="MFDLSKSYIVVSATALASGGALTILKQFIKHASQNSNDYIMFVS
                     AGLELPVCDNIIYIENTPKGWLKRIYWDWFGCRKFISEHKINVKKVISLQNSSLNVPY
                     EQIIYLHQPIPFSKVDSFLNDITFDNVKLFLYKNFYSYFIFKYVNANTTIVVQTNWMK
                     KGVLDQCDKISSERVLVIKPDIKTFNNTKFDVDKDVSVKTLLYPATPLTYKNHLVILK
                     ALVILKQKYFIDDLKFQVTFEKNRYKNFDKFVQLNNLSKNIDYLGVLSYSKLQKKYMA
                     ASFIVFPSYIESYGLPLIEAASLGKKIISSDLPYARDVLKNYSGVDFVIYNDEDGWAR
                     ALFNVLNGNSKLNFRPYEKDSRSSWPQFFSILK"
     gene            11220..12254
                     /gene="fnlA"
     CDS             11220..12254
                     /gene="fnlA"
                     /note="FucNAc synthetase"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlA"
                     /protein_id="ADI43265.1"
                     /translation="MFNGKILLITGGTGSFGNAVLRRFLDTDIKEIRIFSRDEKKQDD
                     MRKKYNNQKLKFYIGDVRDYSSILNASRGVDFIYHAAALKQVPSCEFHPMEAVKTNIL
                     GTENVLEAAIANRVRRIVCLSTDKAVYPINAMGISKAMMEKVIVAKSRNLDSSKTVIC
                     GTRYGNVMASRGSVIPLFVDLIKSGKPLTITDPNMTRFMMTLEDAVDLVLYAFEHGNN
                     GDIFVQKAPAATIQTLAIALKELLNAHEHPINIIGTRHGEKLYEALLSREEMIAAEDM
                     GDYYRVPPDLRDLNYGKYVEHGDRRISEVEDYNSHNTERLDVEGMKKLLLKLPFIRAI
                     RSGEDYELDS"
     gene            12238..13362
                     /gene="fnlB"
     CDS             12238..13362
                     /gene="fnlB"
                     /note="FucNAc synthetase"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlB"
                     /protein_id="ADI43266.1"
                     /translation="MSWIHNMKILVTGASGFIGRNLVFRLKEAGYNELITIDRNSSLA
                     DLEQGLKQADFIFHLAGVNRPVKESEFGEGNSNVTQQIVDVLKKNNKNTPIMLSSSIQ
                     AECDNAYGKSKATAEKIIQQYGETTNAKYYIYRLPNVFGKWCRPNYNSFIATFCHRIA
                     NDETITINDPSAVVDLVYIDDFCSDILKLLEGANETGYRTFGPIYSVTVGEVAQLIYR
                     FKESRQTLITEDVGNGFTRALYSTWLSYLSPEQFAYTVPSYSDDRGVFCEVLKTKNAG
                     QFSFFTAHPGITRGGHYHHSKNEKFIVIRGSACFKFENIVTGERYEFNVSSDDFKIVE
                     TVPGWTHDITNNGSDELVVMLWANEIFNRSEPDTIARVLS"
     gene            13377..14489
                     /gene="fnlC"
     CDS             13377..14489
                     /gene="fnlC"
                     /note="FucNAc synthetase"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlC"
                     /protein_id="ADI43267.1"
                     /translation="MSVVGTRPEIIRLSRVLAKLDEYCDHLIIHTGQNYDYELNEVFF
                     KDLGVRKPDYFLNAAGKNAAETIGQVIIKVDDVLEQEKPEAMLVLGDTNSCISAIPAK
                     RRKIPIFHMEAGNRCFDQRVPEETNRKIVDHTADINMTYSDIAREYLLAEGVPADRII
                     KTGSPMFEVLTHYMPQIDGSDVLSRLNLTPGNFFVVSAHREENVDTPKQLAKLANILN
                     TVAEKYDVPVVVSTHPRTRNRINENGIQFHKNILLLKPLGFHDYNHLQKNARAVLSDS
                     GTITEESSIMNFPALNIREAHERPEGFEEGAVMMVGLESERVLQALEIIATQPRGEVR
                     LLRQVSDYSMPNVSDKVVRIIHSYTDYVKRVVWKQY"
     gene            14489..15697
                     /gene="wbuB"
     CDS             14489..15697
                     /gene="wbuB"
                     /note="putative L-fucosamine transferase"
                     /codon_start=1
                     /transl_table=11
                     /product="WbuB"
                     /protein_id="ADI43268.1"
                     /translation="MKLALIIDDYLPHSTRVGAKMFHELGLELLSRGHDVTVITPDIT
                     LQAIYSVSMIDGIKVWRFKSGPLKDIGKAKRAINETLLSFRAWRALKHLIQHDTFDGI
                     VYYSPSIFWGDLVKKIKQRCQCPSYLVLRDMFPQWVIDAGMLKAGSPIEKYFRYFEKK
                     SYQQADRIGVMSDKNLEIFRQTNKGYPCEVLRNWASMTPVSASDDYHSLRQKYDLKDK
                     VIFFYGGNIGHAQDMANLMRLARNMMRYHDAHFLFIGQGDEVDLIKSLAAEWNLTNFT
                     HLPSVNQEEFKLILSEVDVGLFSLSSRHSSHNFPGKLLGYMVQSIPILGSVNGGNDLM
                     DVINKHRAGFIHVNGEDDKLFESAQLLLADSALRKQLGQNANVLLKSQFSVESAAHTI
                     EVRLEAGECV"
     gene            15688..16095
                     /gene="wbuC"
     CDS             15688..16095
                     /gene="wbuC"
                     /codon_start=1
                     /transl_table=11
                     /product="WbuC"
                     /protein_id="ADI43269.1"
                     /translation="MRLVDDNILDELFRTAVNSERLRAHYLLHASHQEKVQRLLIAFV
                     RDSYVEPHWHELPHQWEMFVVMQGQLEVCLYEKNGEIQKQFIVGDGTGISVMEFSPGD
                     IHSVKCLSPNALMLEIKEGPFDPLKAKAFSKWL"
ORIGIN      
        1 attgtggctg cagggatcaa agaaatcctc ctggtaactc acgcgtccaa gaacgcggtc
       61 gaaaaccact tcgacacctc ttatgaatta gaatctctcc ttgaacagcg cgtgaagcgt
      121 caactgctgg cggaagtgca atctatctgc ccgccgggcg tgactattat gaacgtgcgt
      181 cagggcgaac ctttaggttt aggccactcc attttgtgtg cgcgacctgc cattggtgac
      241 aacccgtttg tcgtggtact gccagacgtt gtgatcgacg atgccagcgc cgacccgcta
      301 cgttacaacc ttgctgccat gattgcgcgc ttcaacgaaa cgggccgcag ccaggtgctg
      361 gcaaaacgta tgccgggtga cctctctgaa tactcggtca tccagaccaa agaaccgctg
      421 gatcgcgaag gtaaagtcag ccgcattgtt gaatttatcg aaaaaccgga tcagccgcag
      481 acgctggact cagacatcat ggccgttggt cgctatgtgc tttctgccga tatttggccg
      541 gaacttgaac gcacgcagcc tggtgcatgg ggacgtattc agctgactga tgccattgct
      601 gaactggcga aaaaacagtc cgttgatgcc atgctgatga ccggcgacag ctacgactgc
      661 ggtaaaaaaa tgggctatat gcaggcgttt gtgaagtatg gactgcgtaa cctaaaagaa
      721 ggggcgaagt tccgtaaagg gattgagaag ctgttaagcg aataatgaaa atctgaccgg
      781 atgtaacggt tgataagaaa attataacgg cagtgaagat tcgtggcgaa agtaatttgc
      841 tgcgaatatt cctgccgttg ttttatataa acaatcagaa taacaacgag ttagcaatag
      901 gattttagtc aaagttttcc aggattttcc ttgtttccag agcggattgg taagacaatt
      961 agcgtttgaa tttttcgggt ttagcgcgag tgggtaacgc tcgtcacatc gtagacatgc
     1021 atgcagtgct ctggtagctg taaagccagg ggcggtagcg tgcgttaata cctctattaa
     1081 tcaaactaag agccgctaat ttcacagcat gctctgaagt aatatggaat aaaaaagtga
     1141 agatacttgt tactggtggc gcaggattta ttggttctgc tgtagttcgt cacattataa
     1201 ataatacgca ggatagtgtt gttaatgtcg ataaattaac gtacgccgga aacctggaat
     1261 cacttgctga tgtttctgat tctgaacgct atgtttttga acatgcggat atttgcgatg
     1321 ctgctgcaat ggcgcggatt tttgctcagc atcagccgga tgcagtgatg cacctggctg
     1381 ctgaaagcca tgtggatcgt tctatcactg gccctgcggc atttattgaa accaatattg
     1441 ttggtactta tgtcctttta gaagccgctc gcaattactg gtctgctctt gatagcgaca
     1501 agaaaaatag cttccgtttt catcatattt ctactgacga agtctatggt gatttgcctc
     1561 atcctgacga agtaaataat aaagaaaaat tacccttatt tattgagaca acagcttacg
     1621 caccaagcag cccttattcc gcatccaaag catccagcga tcatttagtc cgcgcgtgga
     1681 aacgtaccta tggtttaccg accattgtga ctaactgttc gaataactac ggtccttatc
     1741 actttccgga aaaattgatt ccactagtaa ttcttaatgc tctggaaggt aaggcattac
     1801 ctatttatgg caaaggggat caaattcgtg attggctgta tgttgaagat catgcgcgtg
     1861 cattatatac cgtcgtaacc gaaggtaaag cgggtgaaac ttataacatt ggtgggcaca
     1921 acgaaaagaa aaacattgat gtagtgctca ctatttgtaa tttgctggat gagattgtac
     1981 cgaaagagaa atcttatcgt gagcaaatca cttatgtcgc cgatcgtccg ggacacgatc
     2041 gccgttatgc cattgatgct gagaagattg gtcgcgaatt gggatggaaa ccacaggaaa
     2101 cgtttgagag cgggattcgg aagacagtgg aatggtacct gtccaataca aaatgggttg
     2161 ataatgtaaa aagtggtgcc tatcaatcgt ggattgaaca gaactatgag ggccgccagt
     2221 aatgaatatc ctcctttttg gcaaaacagg gcaggtaggt tgggaactac agcgtgctct
     2281 ggcacctttg ggtaatttga ttgctcttga tgttcactcc actgattact gtggtgattt
     2341 tagtaatcct gaaggtgtag ctgaaaccgt aagaagcatt cggcctgata ttattgtcaa
     2401 cgcagccgct cacaccgcag tagacaaagc agaatcagaa ccggagtttg cacaattact
     2461 taacgcaaca agtgtcgaag cgattgcgaa agcagcaaat gaagttggag cttgggttat
     2521 acactactcc accgattatg ttttccctgg cagtggtgac aggccatggc tggaaacgga
     2581 tgcaacagcg ccgctaaatg tttacggtga aactaagcta gctggggaaa aagcgttaca
     2641 agaacattgc gcaaagcatc ttattttccg taccagctgg gtatacgctg gtaaaggaaa
     2701 taattttgcc aaaacgatgt tgcgtctggc aaaagaacgc gaagagttgg ctgtgataaa
     2761 cgatcaattt ggcgcaccaa cgggtgctga gcttctggcc gattgtacag cacatgccat
     2821 tcgtgtcgca ctgaataaac cggatgtcgc aggcttgtac catctggtag ctagtggtac
     2881 cacgacctgg tacgattatg ctgcgctggt ttttgaagag gcgcgcaaag cagatattcc
     2941 cctcgcactc aacaaactca atgcggtacc aacgacagcc tatcctacac cagcttgtcg
     3001 tccacataac tctcgactta atacagaaaa atttcagcag aattttgcgc ttgtcttgcc
     3061 tgactggcag gttggtgtga aacgcatgct caacgaatta tttacgacta cagcaattta
     3121 atagtttttg catcttgttc gtgatgatgg agcaagatga attaaaagga atgatgaaat
     3181 gaaaacgcgt aagggtatta ttttagcggg tggttctggt actcgtcttt atcctgtgac
     3241 tatggcagtc agtaaacagc tattaccgat ttatgataaa ccgatgatct attacccgct
     3301 ctctacactg atgttggcgg gtattcgcga tattttgatt attagtacgc cacaggatac
     3361 tcctcgtttt caacaactgc tgggtgacgg tagccagtgg gggctaaatc ttcagtacaa
     3421 agtgcaactg actccagatg ggcttgcgca ggcatttatt atcggtgaag agtttattgg
     3481 tggtgatgat tgtgctttga ttcttggtga taatatcttt tacggtcacg atctgccgag
     3541 gttaatggat gccgctgtta acaaagaaag tggtgcaacg gtatttgcct atcacgtaaa
     3601 tgatcctgaa cgctatggtg tcgttgagtt tgataaaaac ggtactgcaa tcagcttgga
     3661 agaaaaaccg ttacaaccaa aaagtaatta tgcggtaacc gggctttatt tctatgataa
     3721 cgacgttgtg gaaatggcga aaaaccttaa gccttctgcc cgtggtgaac tggaaattac
     3781 cgatattaac cgtgtctata tggaacaggg gcgtttatct gttgccatga tgggccgtgg
     3841 ttatgcatgg ttagacacgg ggacacatca aagtctgatt gaagcaagta acttcattgc
     3901 aacaattgaa gagcgacaag gtttaaaggt atcttgcccg gaagaaattg cttatcgtaa
     3961 aggctttatt gacgctgagc aggttaatgt attagcagaa ccactaaaga aaaatgctta
     4021 tggtcagtat ctgctaaaaa tgattaaagg ttactaaaaa tgaatgtaat taaaactgaa
     4081 attcctgatg tattaatttt ggaaccggaa gtttttggtg atgagcgcgg tttttttatg
     4141 gaaagcttta atcagaaagt tttcgaagag gctgtagggc gtaaggttga atttgttcag
     4201 gataaccatt ctaaatcaat taagggtgta ttacgcggat tgcactatca gctggaacct
     4261 tatgctcaag gtaaattagt tcgttgtgtg gtcggtgagg tttttgatgt agcagttgat
     4321 attcgtaaat cgtcaggtac atttgggaaa tgggttgggg tgaatttgtc tgctgagaac
     4381 aagcgtcagt tgtggatacc tgaaggattt gctcatggat ttttggtact tagtgattta
     4441 gcagaagttt tatataaaac gaatcaatat tatgctccat cacatgaacg aaatattatc
     4501 tggaatgacc ccttgcttaa tattaaatgg ccaaggacag cactgattac tctgtctgat
     4561 aaggatgcaa atggggaaaa attagaacta agtgagtatt gaaatgtctc tcttaaaaca
     4621 tagtatatgg aatgttgcgg gctactttat accaacatta attgcaatcc cagcgtttgg
     4681 attaattgca agggaaattg gtgtagaact atttggtttg tatactttat caatgatttt
     4741 tatagggtat gctagtatat ttgatgctgg gttaacaaga gctgtagtac gcgaaatagc
     4801 attactaaaa aacagactgg acgattgtaa tacgataata gtaacttcta ttattgctgt
     4861 ggtattttta gggggtatcg gaggcggggg agtgtttctg cttaaagacc atattattga
     4921 actgttaaat atgtcaccaa tatactacgt cgatgcgata aagtctctaa tattattatc
     4981 atctctgata cctgtattct tagtcacgca aatactatta gcagagcttg aggggcggga
     5041 atattttgga atcctaaata tacaaaaaag tttagggaat tctttaattg cagggttgcc
     5101 tgcattattt gttttaatta atcaaacact tttttctgca attattggtg tagctattgc
     5161 aagagttata tgcttgtggt taagctacat tatgagcagg aaaagaataa ctatcgatat
     5221 ttcatttttt tcaataactg ttttaaaacg gttatttaga tatggcgggt gggtaactat
     5281 aagtaacata atatctccta tattagcgag tatggataga tttattctat ctcatatcca
     5341 gggagcatca aaaatatcat tctatacagt ccctaatgag ctggtaacta ggcttggaat
     5401 agttccaggc tctcttggga aagctgtttt tccaaaatta agccatgcaa gtagttttac
     5461 agcgtcatat gcagaacaaa aaaaagcgta tatattaatg actgtcattg tattgccttt
     5521 ggttttattt atatattact acgcaaagtt tattttaaca ttgtggatgg gggctgagta
     5581 tgcagggatt tcagtcgaaa tattacggat tatgcttata gggtatatct ttaactgtta
     5641 ttcacaaatc tcttttgcca atatacaggc atttggaaaa gcaaaataca ctgcatacat
     5701 ccatatgatg gaatttattc cttatttgat aatgttatat ataatttcaa aggaatgtgg
     5761 ggttattggt gtggcgtggt tatggacaat tcgagtgata attgattttt tgatgctttt
     5821 ttatatgagt tatcgttgta ataatcttat gaaaaaaggg tagcctgatg atatatattg
     5881 tagtgttaaa ttggaatggg gctatagata ccattaattg tgttaaaagt ttaatgaatt
     5941 taaattatga tgattataaa attatcgttg ttgataactg ttctacggat aactcatatg
     6001 attctataaa agaaaatctt aatgcattat atattactgg taaaagtttc attgaggtga
     6061 agtatgagga tagaagtaaa tatcaaacat tagaaaacga taaaatcata ttaatacaat
     6121 ctccgaaaaa taatgggtac gcaagtggta ataacattgg aatagagctc gcacttaatc
     6181 aggaggatat gaaatacgtc tgggttctga ataatgatac tgaagtggat aaagaggctt
     6241 taactcattt aattagtaaa tgtgattcag ataaaaatat agggatttgc ggttctcgtt
     6301 tagtctattt taccgataga gagatgcagc aaggactggg tggggtacat aacagatggt
     6361 tatgcactac aaaaaattat gagatgggaa gattagtttc caaaaaatat gatgatgaag
     6421 tcattagcaa taatatagat tatataattg gcgcatcaat gtttttctct agagaatgtt
     6481 tggaaacagt tggattgatg aatgaagaat attttttata ctatgaagag ttagatattt
     6541 gcctcagagc aaaagcaaag aactttaaat taggtatttg ctcagatagt ttggtttatc
     6601 ataagatagg tgcaagtact gatgggggaa agagtatgat agctgacctt tgttcaataa
     6661 aaaataggct ggccattaca gaaaagtttt atccacaata ttattggacg gtatggttgt
     6721 cactctttgt tgtagcattt aaccgtgcta gaagaggtga gtttaataag atgaaaagat
     6781 gtttgaatgt tatgtttaac ttcaaacgaa ataaaggtag caaatgccat tagaatatgc
     6841 atttaatgat ggtgttatta aataaatgta tagtttgata tgttattaaa gggtatttaa
     6901 tgaaagtggc ttttttatct gcttatgatc cactatctac atccagttgg tcgggcacac
     6961 cttattatat gctaaaggca ttatcgaaga gaaatatttc cattgaaata ttaggaccgg
     7021 taaatagcta tatggtatac atgttaaaag catataaatt aatattaagg tgtttcggaa
     7081 aggaatatga ttatagtcgt tcgaagttgc tttccaagta ttacggtaga atatttgaga
     7141 gaaaattaaa aaaaattgat ggtttggatt ttattattgc acctgcaggt tcttcacaaa
     7201 ttgctttttt agaaacaaat ataccaataa tatatctatc ggatacaaca tatgatcaat
     7261 taaaaaacta ttatccgaat ttaaataaaa aaacaattat aaatgatgag gatgcaagtt
     7321 taatcgaacg caaggctatt gaaaaagcaa cagtcgtatc tttcccatct aaatgggcaa
     7381 tggatttttg caaggactat tacagattgg attctgataa attagttgaa ataccatggg
     7441 gggctaattt atttgaagat attcattttg ctaataaaac tataattcaa aagattagtt
     7501 atacttgtct tttcttgggg gtcgattggg aaagaaaagg tggtaaaaca gcattgaaag
     7561 caattgaata tgtaagagag ttatatggga tcgatgttag actaaaaatt tgtggatgta
     7621 ctccgaatca agagatttta cctgcttggg ttgaattaat tgataaaata aataaaaata
     7681 acgttgaaga atatcagaaa ttcatcgatg tgttatctaa cgctgatata cttcttttac
     7741 caaccattgc tgaatgttac ggaatggtat tttgtgaagc tgcagcttat ggattgccag
     7801 ttgtcgccac agatacaggt ggaattagtt ctatagttat caacgaaagg acggggatat
     7861 taattaaaga ctcgtcagac tataagcact ttggaaatgc aattcataaa ataattagct
     7921 ccgtagagac ttatcaaaac tactcccaaa acgcaagagt tagatataat aaaatattgc
     7981 attgggacaa ttgggcaaaa aagataattg agattatgta tgagcataag aatagaagaa
     8041 ccaaatagca caaaaagaat tatattttta tttttacttt tccttgtttt tcctgatttt
     8101 ttgttttata cattagggat tgataatttt agcatttcaa cgataatctc cattatattg
     8161 ctttttgttt ttttaagggc taaaaacact tgcaaagata atttgctaat aatagtagta
     8221 ttattcatat tgttgtgttt taactgtctg ttaagtatgc tatttaatat tgaacaggtt
     8281 ttatcattta aaattgtact ttcaatgtat agcatcttaa taatggcata cgtctcctct
     8341 tgttatgcac agactttgtg gttatgttct gaagaaatac ttaagagatc cgtcttttat
     8401 ttgttcgcat ttctttgcct tattggcatt ataagtattc ttttacagaa aactgagatt
     8461 atacatgata aaagtatgat tctttttcct gaaccatcag catttgcatt ggttttcata
     8521 cctatctttt cattttgttt atactataca aggggggggg gggtactatt gctctatata
     8581 ttatctttgg gtattgcgtt aggtatccag aacttaacga tgttagtagg cattgtgatt
     8641 agtgtttttg tgatgaaaaa aataacaata aggcaaacta ttgttatatt tttaggggca
     8701 tggatttttt ccatgatatt aagtgattta gacatttctt actatacatc gcggcttgat
     8761 tttaaaaata ctacgaactt atcagtgctt gtatatcttt caggaattga aagagctttc
     8821 ttgaatttta ttacaagtta tggtcttggt attggttttc aacaaatggg cgtgaatggg
     8881 gaggtaggag tgtatcaaca aattttagct gatcttgatg cccctatgtt aaatatatac
     8941 gatggctcat ttatttcttc gaagttaata tctgagtttg ggtttattgg tgcaataatg
     9001 tgcattttct atctttttat ttttttcgat tttatctgcg tttcaaaaaa aataagagat
     9061 atccaccgca gtatatttta gcatatagtt tctatatgtg tttcttcatc ccccttttta
     9121 tacgtggtgc tggctatata aatccctatg tgtttatgtt attttcatca atatttttat
     9181 gcaaatatca tgctaaaatt atcttgatga aatctaatgt caaaatggct atataatagt
     9241 agattatgtt atcattaata cgtaaataac atatattcta accagggcat aaataatgtg
     9301 cataaaaaaa ttaagttaat taaacgatat ggcctttatg gtggtcttag gcttcttaaa
     9361 gattattctt aacaaaagtt ttattttgtt caaatgttag ggttattaga ttttcatgtt
     9421 atcttagaaa agatggaagt gttagttttg gaaaagggtt tacatcaggt gtagtattag
     9481 gaggtgatac atttatggat gctatagtgt ctattggaga aaatgttcaa attaatgatt
     9541 atgttccaca tcgcggctat taataatgcc attattggta gagatacatt aatagcaagt
     9601 aaagtattta ttagtgatca taatcatggt attttttcta aatctgatat ccatagttca
     9661 ccaactatta ttccttcatc taggtctctt gaatctgcac ctgtgtatat tgaagagcgt
     9721 gtgtggattg gtgaaaacgt gacaatatta ccaggtgcgt gtataggtaa tggtgtagtt
     9781 attggcgcaa atagtgttgt tcgtggtgag attcttaata atgtgatctg agttgacccc
     9841 cgaaaacacc agacagtaga tgtatcttaa aataagaggt aggcttggac atatatctaa
     9901 cttaagatac aatccctgtc tggaaataag agggcaagaa cagaaaatgt ttcgatttgg
     9961 gaaagatagg atatggcttc ttatgtagta tataatatcc tgcattcatt cggataactt
    10021 cctatggaag tgtactttgc tctgtctgtt ttcatttgtt gaaaatttat gttaataaga
    10081 agctttagat aaccacttag gaactgtatg tttgatttgt ccaaaagtta tattgttgta
    10141 agtgcgacgg cgctggcctc cggaggtgca ttaactatat taaagcaatt tataaaacat
    10201 gcatcacaaa attcaaatga ctatattatg tttgtatctg cgggattaga gttgccggtc
    10261 tgtgataaca tcatttacat agaaaacaca ccaaaaggat ggttgaaaag aatatattgg
    10321 gattggttcg gttgtcgaaa gtttatctct gaacataaga ttaacgttaa gaaagtaatt
    10381 tctctacaaa attccagttt gaatgttcct tatgagcaga ttatttactt gcaccagcca
    10441 attcctttca gtaaagttga ttctttttta aatgatatca cgttcgataa cgtaaaactt
    10501 tttttatata aaaattttta ttcctatttt atatttaaat atgtgaatgc aaatacaacc
    10561 atcgtagtgc aaacgaattg gatgaaaaaa ggagtgttgg atcaatgtga taagattagt
    10621 tccgaaaggg tccttgttat aaaacctgat atcaaaacat ttaataatac taaatttgat
    10681 gtagataagg atgtatctgt taaaacactc ttatatccag cgacaccact tacctataaa
    10741 aatcatttgg tcattctgaa ggcgttggtt attttaaagc aaaagtattt tatagatgat
    10801 ctgaaattcc aagtgacttt tgaaaagaat aggtacaaaa attttgataa gtttgtgcaa
    10861 ttaaataacc taagcaaaaa cattgattat ctcggtgttc tttcatactc gaaattgcaa
    10921 aaaaaatata tggcggcatc ttttattgtt tttcctagct atatagaatc atatgggtta
    10981 ccactcatcg aagctgctag tttaggaaaa aaaatcatta gtagtgatct tccttatgcc
    11041 cgtgatgttt taaagaatta tagcggcgta gattttgtaa tttacaatga tgaagatggc
    11101 tgggctaggg cgttgtttaa tgttttaaat ggcaattcga agctcaattt taggccttat
    11161 gaaaaagata gtcgttcatc ttggccacag ttcttctcta ttttaaaata aggtgtatta
    11221 tgtttaatgg taaaatattg ttaattactg gtggtacggg gtctttcggt aatgctgttc
    11281 taagacgttt tcttgataca gatatcaaag aaatacgtat tttttcccgg gatgaaaaaa
    11341 aacaagatga catgaggaaa aaatataata atcagaagct taagttctat ataggtgatg
    11401 ttcgcgatta ttcgagtatt ctcaatgctt ctcgaggtgt tgattttatt tatcatgctg
    11461 cagccctgaa gcaagtgcct tcctgcgaat tccaccccat ggaagctgta aaaacgaata
    11521 ttttaggtac tgaaaacgtt ctagaagctg caatagctaa tcgcgttagg cgaattgtat
    11581 gtctgagtac agataaagcc gtatatccta ttaatgcaat gggcatatct aaagcaatga
    11641 tggaaaaagt cattgttgca aaatcacgta atcttgatag ttcaaaaaca gttatctgcg
    11701 gaacacgtta tgggaatgta atggcttcac gtggatcggt catcccattg tttgttgatc
    11761 taatcaaatc tggtaaacca ttgaccatta ccgatcccaa tatgactcgt ttcatgatga
    11821 cgcttgagga tgctgttgat ctggtccttt atgccttcga gcatggaaat aacggtgata
    11881 ttttcgttca gaaagctcct gcggcaacaa ttcaaacatt agccattgca cttaaggaat
    11941 tgctaaatgc ccatgaacat ccaatcaata ttattggaac tcgacacggg gaaaaacttt
    12001 acgaagcgtt attgagccga gaggaaatga tagcagcgga agatatgggt gattattatc
    12061 gtgttccacc agatctccgc gatttgaact atggtaaata tgtggaacat ggtgaccgtc
    12121 gtatctcgga agtggaagat tataactctc ataatactga gagattagat gttgagggta
    12181 tgaaaaaatt actgctaaaa cttcctttta tccgggcaat tcgttctggt gaagattatg
    12241 agttggattc ataatatgaa aattttagtt actggtgctt cagggtttat cggccgtaat
    12301 ttggttttcc gccttaagga ggctggttat aacgaactta ttacgataga tcgtaactct
    12361 tctttggcgg atttagagca gggacttaag caggcagatt tcatttttca ccttgcagga
    12421 gtaaatcgtc ctgtgaagga gagtgaattt ggagagggaa atagcaacgt aactcaacag
    12481 attgttgatg ttctgaaaaa aaataataaa aatactccta tcatgctgag ttcttccatc
    12541 caggctgaat gtgataacgc ttatggaaag agtaaagcga ctgcggagaa aatcattcag
    12601 cagtatgggg aaacgacaaa tgccaaatat tatatttatc gcttgccgaa tgtattcggt
    12661 aagtggtgtc gcccaaatta taactccttt atagcaactt tctgccatcg cattgcaaat
    12721 gatgaaacta ttacaattaa tgatccttca gcagttgttg atctggtgta tatagatgac
    12781 ttttgttctg acatattaaa gctattggaa ggagcgaacg aaactggtta caggacattc
    12841 ggtccaattt attctgttac tgttggtgaa gtggcgcaat taatttaccg atttaaagaa
    12901 agtcgccaaa cattaatcac cgaagatgta ggtaatggat ttacacgtgc attgtactca
    12961 acatggttaa gttatctgtc tcctgaacag tttgcgtata cggttccttc ttatagtgat
    13021 gatagagggg tattctgtga agtattgaaa acgaaaaacg cgggccagtt ttcgttcttt
    13081 actgcgcatc caggaattac tcggggggga cattatcatc attccaaaaa tgagaaattt
    13141 attgtcatcc gaggaagtgc ttgtttcaaa tttgaaaata ttgtcacggg tgagcgatat
    13201 gaatttaatg tctcctcaga tgattttaaa attgttgaaa cagttccggg gtggacgcat
    13261 gacatcacta ataatggctc ggatgagcta gttgttatgc tttgggcaaa tgaaatattt
    13321 aatcgttctg aaccagatac tatagcgaga gttttatcgt gaaaaaattg aaagtcatgt
    13381 cggttgttgg gactcgtcca gaaattattc gactctcgcg tgtccttgca aaattagatg
    13441 aatattgtga ccaccttatt attcatactg gccaaaacta cgattatgaa ttgaatgaag
    13501 tttttttcaa agatttgggt gttcgcaaac cagattattt tcttaatgcc gcaggtaaaa
    13561 atgcagcaga gactattgga caagttatca ttaaagttga tgatgtcctt gaacaggaaa
    13621 aaccagaagc tatgttagtt cttggcgata ctaactcctg tatttcagca ataccagcaa
    13681 agcgtcgaaa aattccgatc ttccatatgg aagcggggaa tcgttgtttt gaccaacgcg
    13741 taccggaaga aactaacaga aaaatagttg accacactgc tgatatcaat atgacatata
    13801 gcgatatcgc tcgtgaatat cttctggctg aaggtgtacc agccgataga attattaaaa
    13861 ccggtagccc aatgtttgaa gtactcactc attatatgcc gcagattgat ggttccgatg
    13921 tactttctcg cctgaattta acacctggga atttctttgt ggtaagtgcc cacagagaag
    13981 aaaatgttga tacccctaaa cagcttgcga aactggcgaa tatacttaat accgtggctg
    14041 aaaaatatga tgtcccggta gttgtttcta ctcatcctcg cactcgtaac cgcatcaatg
    14101 aaaacggtat tcaattccat aaaaatatct tgcttcttaa gccattagga tttcacgatt
    14161 acaaccatct gcaaaaaaat gcacgtgctg ttttatcgga tagtgggact attacagaag
    14221 agtcctccat tatgaacttc cctgcactca atatacgaga agcgcacgaa cgcccggaag
    14281 gcttcgaaga aggggcagta atgatggtcg gtcttgaatc tgagcgcgtt ttacaggcat
    14341 tagaaattat tgcaacacag cctcgtggag aagtacgctt acttcgtcag gtcagtgact
    14401 atagcatgcc caatgtttca gataaagttg tgcgtattat ccattcatat actgactacg
    14461 ttaaacgggt tgtctggaaa caatactaat gaaacttgca ttaatcattg atgattattt
    14521 gccccatagc acacgtgttg gggctaaaat gtttcatgag ttaggccttg aattgttgag
    14581 cagaggccat gatgtaactg taattacgcc tgacatcaca ttacaagcaa tctattctgt
    14641 tagtatgatt gatggtataa aggtttggcg tttcaaaagt ggacctttaa aggatatagg
    14701 taaggctaag cgtgccataa atgaaactct tttatctttt cgtgcatggc gtgcattaaa
    14761 gcacctcatt caacatgata catttgatgg tatcgtttat tattccccct ctattttttg
    14821 gggagacttg gttaaaaaaa taaaacagcg atgccagtgc ccaagctacc tggtcctaag
    14881 ggatatgttt ccacagtggg tcattgatgc aggtatgttg aaagccggtt cgccaattga
    14941 aaaatatttc aggtattttg aaaaaaaatc atatcagcag gctgaccgga taggggtaat
    15001 gtctgataag aatcttgaga tatttcgtca gaccaataaa ggttatccgt gtgaagtttt
    15061 acgtaattgg gcctcaatga ctcctgtgtc tgccagcgat gattatcatt cacttcgtca
    15121 aaaatacgat ctaaaagata aagtcatttt tttctatggc ggtaatattg ggcatgctca
    15181 ggatatggcg aacttaatgc gccttgcgcg taatatgatg cgttatcatg atgctcattt
    15241 cctgtttata gggcagggtg atgaagttga cctgataaaa tctcttgctg cagaatggaa
    15301 tttaactaat ttcactcacc taccttcagt gaaccaggaa gagtttaaat taattttatc
    15361 tgaagttgat gtcggcctgt tctccctttc atctcgccat tcttcacata atttccctgg
    15421 gaaattacta gggtatatgg ttcaatcaat cccgatcctt gggagtgtga atggcggcaa
    15481 tgatttaatg gatgtaatta ataagcacag ggccggtttc attcatgtta atggtgaaga
    15541 tgataaactg ttcgaatctg cacaattgct tcttgcagat tcggctttaa gaaagcagtt
    15601 aggtcagaac gctaatgtgt tgttaaaatc tcaattttcg gttgaatcgg cggcacatac
    15661 tatcgaagtc cgactggagg caggagaatg cgtttagttg atgacaatat tctggatgag
    15721 ctttttcgca cagcagtaaa ttctgaacgt ttgcgcgctc attatttatt gcacgcatct
    15781 catcaggaga aggttcaacg tttacttatt gcatttgtac gcgacagcta tgttgagccc
    15841 cattggcatg agttaccgca tcagtgggaa atgtttgtcg tcatgcaagg gcaattagaa
    15901 gtttgtttgt atgagaaaaa tggtgagata caaaaacagt ttattgttgg agacggtact
    15961 ggaataagcg tcatggaatt ttccccaggt gatatacata gtgtcaaatg cctgtcaccg
    16021 aatgccctta tgttggagat aaaggaagga ccatttgacc cactgaaagc taaggctttt
    16081 tctaagtggt tatagggcga tacaccaccc tttattcttc tatcttattc tatacatgct
    16141 gggttaccat cttagcttct tcaagccgcg caaccccgcg gtgaacaccc cctgacagga
    16201 gtaaacaatg tcaaagcaac agatcggcgt cgtcggtatg gcagtgatgg ggcgcaacct
    16261 tgcgctcaac atcgaaagcc gtggttatac cgtctctatt ttcaaccgtt cccgtgaaaa
    16321 gacggaagaa gtgattgccg aaaatccagg caagaaactg gttccttact atacggtgaa
    16381 agagtttgtt gaatctctgg aaacgcctcg tcgcatcctg ttaatggtga aagcaggtgc
    16441 aggcacggat gctgctattg attctctcaa gccatacctc gataaaggtg acatcatcat
    16501 tgatggtggt aacaccttct tccaggacac aattcgtcgt aaccgtgagc tgtctgcaga
    16561 aggttttaac tttatcggta ccggtgtttc cggtggtgaa gaaggtgcgc tgaaaggacc
    16621 ttccatcatg cctggtgggc agaaagaagc ctatgaactg gtcgctccga tcctgaccaa
    16681 aatcgccgcc gttgctgaag atggcgaacc gtgcgttacc tatattggtg ccgatggcgc
    16741 aggtcactat gtgaagatgg ttcacaacgg tattgaatac ggtgatatgc agctgattgc
    16801 tgaagcctat tctctgctta aaggtggcat gaatctctct aacgaagaac tggcgcagac
    16861 gtttaccgag tggaataacg gtgaactaag cagctacctg atcgacatca ccaaagacat
    16921 cttcactaaa aaagatgaag acggtaacta cctggttgat gtgatcctgg atgaagcggc
    16981 taacaaaggt accggtaaat ggaccagcca gagcgcgctg gatctcggcg aaccgctgtc
    17041 gctgattacc gagtctgtgt ttgcacgtta tatctcttct ctgaaagagc agcgtgttgc
    17101 cgcatctaaa gttctctctg gcccgcaagc gcagccagct ggcgacaaag gtgagttcat
    17161 cgaaaaagtt cgccgtgcgc tgtatcttgg caaaatcgtt tcttacgctc agggcttctc
    17221 tcagctgcgt gcagcgtctg aagagtacaa ctgggatctg aactacggcg aaatcgcgaa
    17281 gattttccgt gctggttgca tcattcgtgc gcagttcttg cagaaaatca ccgatgctta
    17341 tgccgaaaat ccgcagatcg ctaacctgct gctggctccg tacttcaagc aaattgccga
    17401 tgactaccag caggcgctgc gtgatgtcgt tgcttatgca gtacagaacg gtatcccggt
    17461 tccgaccttc gctgctgcgg ttgcctatta cgatagctac cgtgccgctg ttctgcctgc
    17521 gaacataatc caggcgcagc gtgacta
//