LOCUS       AY545992               12850 bp    DNA     linear   BCT 08-JUN-2004
DEFINITION  Escherichia coli strain O172, O-antigen gene cluster, complete
            sequence.
ACCESSION   AY545992
VERSION     AY545992.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 12850)
  AUTHORS   Guo,H., Feng,L., Tao,J., Zhang,C. and Wang,L.
  TITLE     Identification of Escherichia coli O172 O-antigen gene cluster and
            development of a serogroup-specific PCR assay
  JOURNAL   J. Appl. Microbiol. 97 (1), 181-190 (2004)
   PUBMED   15186455
REFERENCE   2  (bases 1 to 12850)
  AUTHORS   Guo,H., Feng,L., Tao,J., Zhang,C. and Wang,L.
  TITLE     Direct Submission
  JOURNAL   Submitted (10-FEB-2004) Center for Functional Genomics Research;
            College of Life Sciences, Nankai University, 23 Hongda Street,
            TEDA, Tianjin 300457, P.R. China
FEATURES             Location/Qualifiers
     source          1..12850
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /strain="O172"
                     /db_xref="taxon:562"
                     /clone="G1092"
     gene            1087..2388
                     /gene="wzx"
     CDS             1087..2388
                     /gene="wzx"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzx"
                     /protein_id="AAT28921.1"
                     /translation="MNNKTNELIGGMLFKGLYIFITSLNALLMVKILSPKDLGVWYVF
                     MTLQTLIFTLNNAIIPNIARQYTLGSLSKELNFNCYIFHRSTQKTFIYLILLILIICA
                     IATFTYLSSVLAILESQNKIVLVSWLIIVFSLCLEVYYSSYDCAFNGMGKFKNVNKIN
                     FISRACLFLISIGMIAYDIDGRNALLYFCIGYFISNLIKRFFIYRLFISNYHNLCFNS
                     ESDTESFYKKNEKIILNLSCMSFISSIGGMLIVRGGMLILPYYVSIEEVGKYGLTYQL
                     FEIAFNLLFTASAIKTPSWIFLYKENKCELKKSYLKIKYVSLIVMAIGGGVISFYGGQ
                     ILSLFGLHATLLTTNLCLLLTLIFILQLNHSISGQLLTIQNKIPYAYASLYTGIGVVL
                     LSMIFIPITGFKGALVAIFISQLAYNNWKWPLEARKKIINV"
     gene            2381..3556
                     /gene="wzy"
     CDS             2381..3556
                     /gene="wzy"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzy"
                     /protein_id="AAT28922.1"
                     /translation="MYNMSVNKKITKMFVFCEFLCGLYILFYGEYVSDYLNVETNVKH
                     IYIICFLICIVFFHYLFLYSWCILSVLFFRKSKLTTSVNINSIFLLLVIIYFIFLLKT
                     GSGKVYADGGSIGELSSFDKLLFFPIIILKLNFLIYIYAAGCKKKDNIYYLVLFIFLI
                     CELYRGVSFSILLIALIEIEKIKRCFRIKCLLISLPLFVLFVNIVYNIKFMVRLGEHY
                     DYLDIFQTLIMLLGRLSIISNVLYNYEHYYSVSNFVEGFGYSAINEFLEKLTPMPSLF
                     GITEKTTEIGKLIFYHSYGRWDSAIAISVLGILSIVPGQLLEICAILIISFVFIQLII
                     NMLDNTEQQNTVAFFFIILTLYQGFWGLLANYVYALFIYLIIIASCNLMMSKSKGRL"
     CDS             3553..4335
                     /note="Orf3"
                     /codon_start=1
                     /transl_table=11
                     /product="unknown"
                     /protein_id="AAT28923.1"
                     /translation="MNNLEIRVLSLPDAYARRTKFQERFSLVSKLKFQFFDGVYGKNI
                     PDEILKSIYDDKKAKLKINRSMTVGEIGATYSHYLIYKDAYEKKLDYLIVLEDDSFVD
                     ENFDDVINRLLVKITPDDDAIIFIQKHTLDSKVIFSRKKDILKNGFELVKMLGSSQYF
                     VGSYGYILTKKSINKIIQNYLPIYCVCDHWFFIKKDSKIESFYCVSPSLVYTNDEDIR
                     LVDSFINEERKNVLKNRGVSRIGRIKIIIKRVVLRLLNKDWE"
     CDS             4335..5423
                     /note="Orf4"
                     /codon_start=1
                     /transl_table=11
                     /product="unknown"
                     /protein_id="AAT28924.1"
                     /translation="MFYICKVITVLIKVIISFLVFPLCKPFSNKNKKVVVIGTRNGNQ
                     GNDNGEVFYSYLNDNNDNDDLLVYLIRRSKNKEKYKNILIKNSIRANIKILSADILYI
                     THSESDLIDFWWRFVTYKKIVFIQHGVIGIKRLPEYEKKKFSLFVSSNNYEYEILIKY
                     YNICSERIVKSGIPRFDNYTILNEAPQKIKKCLVMFTWRKFYKDEQSIRLKRVISTII
                     RNEPSIKIYVASHELSDYSLSEFEFYNINYVESIGIQNAIKECDLLITDYSSIAWDFL
                     YQNKLICFIQTDYLEYVFNEGVYFHCDDFFGYIIRDLSDINDAFISEILRVNKLNNQE
                     FLKRYPFYINYKKKHSELLFLETMEYNR"
     CDS             5420..6499
                     /note="Orf5"
                     /codon_start=1
                     /transl_table=11
                     /product="unknown"
                     /protein_id="AAT28925.1"
                     /translation="MKIIIYATAAVDGGALSLLNDLLEYANDDIDNEYTVCVNEKLNN
                     EVSVYNNLTFLFVDTKAWHKRVYFDFIGFKKNFDNKDYCLVINLQNIPVRTQLKQILY
                     LHQPLPFSDIKLNILEKRNRKLIFYKYLYGLIIKFNSCFIDHCLVQTEWMRKAVIDKL
                     NLSEKKISIIRPVIDIDLNKILKNENENENTFIYPAASYSYKNHIILVESLNMIGVDF
                     LFQNKITVIFTLDRDENSKLFDRIKKYNLQEIIKFTGNIPRYDVLNYIYNAKALLFPS
                     RLETFGIPLIEAVKFNSNIIVSDLPYAHDVLDGYENVKYCNPDSPEDWSEAIKFAINL
                     KENKLNQGFELNSGWRELSSIISTL"
     gene            6526..7560
                     /gene="fnlA"
     CDS             6526..7560
                     /gene="fnlA"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlA"
                     /protein_id="AAT28926.1"
                     /translation="MFKDKVLLITGGTGSFGNAVLRRFLDTDIKEIRVFSRDEKKQDD
                     MRKKYNNDKLKFYIGDVRDYRSILNATRGVDYIYHAAALKQVPSCEFHPMEAVKTNVL
                     GTENVLEAAISNGVKRVVCLSTDKAVYPINVMGISKAMMEKVIVAKSRNLDSSKTVIC
                     GTRYGNVMASRGSVIPLFVDLIKAGKPLTVTNPDMTRFMMTLEDAVDLVLYAFEHGNN
                     GDIFVQKAPAATIETLAIALKELLGANEHPVKIIGTRHGEKLYEALLSREEMIAAIDM
                     GEYYCVPPDLRDLNYSKYVEHGDCRISEIEDYNSHNTVRLDVKGMKELLLKLPFVRAL
                     IAGEAFELDS"
     gene            7562..8668
                     /gene="fnlB"
     CDS             7562..8668
                     /gene="fnlB"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlB"
                     /protein_id="AAT28927.1"
                     /translation="MKILITGSKGFIARNLIYRLQEAGFKDLITIDRESPLQELEQGL
                     KIADFIYHLAGVNRPKEEHEFQEGNTDLTKLIVDYLLCNAKKTPIMLSSSIQAECDNA
                     YGKSKASAEKIIQHYGHVSGAEYYIYRLPNVFGKWCRPNYNSFVATFCHRIANDQDII
                     IHDPTAEVELVYIDDFCTDAINLLNNKYASGFKNIKPTYSITVGEVANLIYKFKESRH
                     TLITENVGQGFSRALYSTWLSYLQPEQFVYAVPSYSDERGVFCEVLKTHSSGQFSFFT
                     ALPGVTRGGHYHHTKNEKFIVIRGTACFRFKNVLTGERYEINVASDEYKIVETVPGWS
                     HDITNTGHDELIVMLWANEIFNRDQPDTIASVLS"
     gene            8683..9795
                     /gene="fnlC"
     CDS             8683..9795
                     /gene="fnlC"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlC"
                     /protein_id="AAT28928.1"
                     /translation="MSVVGTRPEIIRLSRVLAKLDEYCDHLIVHTGQNYDYELNEVFF
                     KDLGVRKPDYFLNAAGKNAAETIGQVIIKVDEVLEQEKPEAMLVLGDTNSCISAIPAK
                     RRRIPIFHMEAGNRCFDQRVPEETNRKIVDHTADINMTYSDIAREYLLAEGVPADRII
                     KTGSPMFEVLTHYMPQIDGSDVLSRLNLTPGNFFVVSAHREENVDTPKQLAKLANILN
                     TVAEKYDVPVVVSTHPRTRNRINENGIQFHKNILLLKPLGFHDYNHLQKNARAVLSDS
                     GTITEESSIMNFPALNIREAHERPEGFEEGAVMMVGLESERVLQALEIIATQPRGEVR
                     LLRQVSDYSMPNVSDKVVRIIHSYTDYVKRVVWKQY"
     gene            9795..11003
                     /gene="wbuB"
     CDS             9795..11003
                     /gene="wbuB"
                     /codon_start=1
                     /transl_table=11
                     /product="WbuB"
                     /protein_id="AAT28929.1"
                     /translation="MKLALIIDDYLPHSTRVGAKMFHELGLELLSRGHDVTVITPDIT
                     LQVIYSVSMIDGIKVWRFKSGPLKDVGKAKRAINETLLSFRAWRAFKHLIQHDTFDGI
                     VYYSPSIFWGDLVKKIKQRCQCPSYLVLRDMFPQWVIDAGMLKAGSPIEKYFRYFEKK
                     SYQQADRIGLMSDKNLEIFRQANKNYPCEVLRNWASMTPVSASDDYHSLRQKYDLKDK
                     VIFFYGGNIGHAQDMANLMRLARDMMRYHDAHFLFIGQGDEVDLIKSLAVEWNLTNFI
                     HLPSVTQEEFKLILSEVDVGLFSLSSRHSSHNFPGKLLGYMVHSIPILGSVNDGNDLM
                     DIINKHRAGFIHVNGEDDKLFESAQLLLSDSVLRKQLGQNANVLLKSQFSVESAAHTI
                     EVRLEAGECI"
     gene            10994..11401
                     /gene="wbuC"
     CDS             10994..11401
                     /gene="wbuC"
                     /codon_start=1
                     /transl_table=11
                     /product="WbuC"
                     /protein_id="AAT28930.1"
                     /translation="MHLVDDNILDELFRTAVNSERLRAHYLLHASHQEKVQRLLIAFV
                     RDSYVEPHWHELPHQWEMFVVMQGQLEVCLYEQNGEIQKKFVVGDGTGISVVEFSPGD
                     IHSVKCLSPKALMLEIKEGPFDPLKAKVFSKWL"
ORIGIN      
        1 attgtggctg cagggaatca aagaaatcct cctggtaact cacgcgtcca agaacgcggt
       61 cgaaaaccac ttcgacacct cttatgaatt agaatctctc cttgaacagc gcgtgaagcg
      121 tcagctgctg gcggaagtgc agtccatctg tccgccgggc gtgaccatta tgaacgtgcg
      181 tcagggcgaa cctttaggtt tgggccactc cattttatgt gcacgacccg ccattggtga
      241 caacccattt gtcgtggtgc tgccagacgt tgtgatcgat gacgccagcg ccgacccgct
      301 gcgctacaac cttgctgcca tgattgcgcg cttcaacgaa acgggtcgta gccaggtgct
      361 ggcaaaacgt atgccgggcg atctctctga atactccgtc attcagacca aagagccgct
      421 ggaccgtgaa ggcaaagtca gccgcattgt tgaatttatc gaaaaaccgg atcagccgca
      481 gacgctggac tcagacatca tggccgttgg tcgctatgtg ctttctgcag atatttggcc
      541 ggaacttgaa cgcactcagc ctggtgcatg ggggcgtatt cagctgactg atgccatcgc
      601 tgaactggcg aaaaaacagt ccgttgacgc catgctgatg actggagaca gctacgactg
      661 tggtaaaaaa atgggctata tgcaagcgtt cgtgaagtat gggctgcgca acctgaaaga
      721 aggggcgaag ttccgtaaag gcattgagaa gctgttaagc gaataatgaa aatctgaccg
      781 gatgtaacgg ttgataagaa aattataacg gcagtgaaga ttcgtggcga aagtaatttg
      841 ttgcgaatat tcctgccgtt gttttatata aacaatcaga ataacaacga gttagcaata
      901 ggattttagt caaagttttc caggattttc cttgtttcca gagcggattg gtaagacaat
      961 tagcgtttga atttttcggg tttagcgcga gtgggtaacg ctcgtcacat cgtaggcatg
     1021 catgcagtgc tctggtagct gtaaagccag gggcggtagc gtacctttta tatagagctt
     1081 acaattgtga ataataaaac gaatgagcta ataggtggaa tgttattcaa agggttatac
     1141 atctttataa cctcactgaa cgccctgttg atggttaaaa tactatcacc gaaagatctg
     1201 ggggtgtggt atgtttttat gactcttcaa actttaatat ttacacttaa taatgcgata
     1261 atacctaaca ttgctcggca atatacattg ggtagcctca gtaaagaatt aaactttaat
     1321 tgttatattt ttcatcgctc aactcaaaag acatttatat atcttatatt attgatatta
     1381 atcatatgtg caattgcaac atttacatat ttgagctctg ttttagcgat cttggaatca
     1441 caaaataaaa tagtcttagt ttcttggctt ataatcgtat tctctttgtg tttggaagtt
     1501 tattattctt catatgactg tgcttttaat gggatgggca aatttaaaaa tgtaaataaa
     1561 attaatttta tatcgcgggc atgtttgttt ttgataagta ttggcatgat agcatatgat
     1621 attgatggta gaaatgcatt attatatttt tgcattggtt attttattag taatttaata
     1681 aaaagatttt ttatatacag gctatttata tccaattatc ataatctatg ttttaatagt
     1741 gaatctgata ctgaatcttt ttataaaaaa aatgaaaaaa taatactcaa tttgtcatgt
     1801 atgtccttta tatcatcaat tggcgggatg ttaattgtga gaggtgggat gcttattcta
     1861 ccttattatg tatctatcga agaagttggt aaatatggtc taacttatca attgtttgag
     1921 attgctttta atttgctatt cactgcgtca gcaataaaaa cgcctagttg gatttttttg
     1981 tataaagaaa ataagtgtga gctaaaaaaa tcatatttaa aaataaaata tgtaagttta
     2041 attgtgatgg caataggggg gggggtgatc agtttttatg gggggcagat actgtcactg
     2101 tttggactgc atgcaacatt attaactaca aatttgtgtt tacttctgac attaattttt
     2161 attttacaat tgaatcatag tatatcaggg cagttgttaa ctattcagaa taaaatacct
     2221 tatgcatatg cttctcttta tacaggaatt ggggttgttt tactgtcgat gatttttata
     2281 ccgataacag gattcaaggg agcattggtt gcgattttta tttcccaatt agcatataat
     2341 aactggaaat ggccgttaga ggctaggaag aaaataataa atgtataata tgagcgttaa
     2401 taaaaaaatc acaaagatgt ttgtcttttg tgagttttta tgtggattgt atattttatt
     2461 ttatggtgaa tatgtctctg actatctcaa tgttgaaaca aatgttaagc atatttacat
     2521 aatatgtttt cttatttgta tcgtattttt tcattatttg tttttatata gttggtgtat
     2581 attaagtgtt ttgtttttcc gcaaaagcaa actaacaaca tcagtaaata ttaattctat
     2641 atttttgttg ttagttataa tatactttat ttttcttctc aaaaccggaa gtggaaaagt
     2701 atatgcggac ggcggtagca taggtgaatt aagtagtttt gataagttgt tatttttccc
     2761 aataataatt cttaaactta attttctaat atacatatat gcagcgggtt gtaaaaaaaa
     2821 ggataatata tattatcttg tgctatttat atttttaatt tgtgaacttt atagaggtgt
     2881 ttcattttca atattactga tcgctctaat tgaaattgag aaaataaaaa ggtgttttag
     2941 gattaaatgt ttgttaatat cactgcctct ttttgtctta tttgttaata tagtatataa
     3001 tattaaattt atggtaaggt taggggagca ttatgattat cttgatatat tccaaacctt
     3061 aataatgtta cttggtaggt taagtataat ttcaaatgtt ttgtataatt atgagcatta
     3121 ttactcagtt agcaactttg tagaaggttt tggttatagt gcgataaatg agtttttaga
     3181 aaaattgacg ccaatgccgt cattatttgg aataactgaa aaaacgacag aaatagggaa
     3241 gttgatattt tatcattcat atggaagatg ggatagtgca attgcaatct ctgtgttagg
     3301 tatattaagt attgtgcctg gacaactatt agagatatgt gcaattttaa ttattagttt
     3361 tgtttttatt caattaatta taaatatgct tgacaatact gagcagcaaa atacggttgc
     3421 atttttcttc attatattaa ctctttatca ggggttttgg gggttgctgg ctaattatgt
     3481 ctatgcgcta ttcatttatt taattattat agcatcttgt aatttaatga tgtctaaaag
     3541 taaaggacgg ttatgaataa tctagaaatt cgagtgttgt ctttgcctga cgcgtatgcg
     3601 cgaaggacga aatttcagga aagattttct ttagtctcca aattgaaatt tcaatttttc
     3661 gatggcgtgt atgggaagaa tattccagac gagattttga aaagtatata tgatgataaa
     3721 aaggctaagt tgaagattaa ccgaagtatg acagtaggtg aaattggggc aacatattca
     3781 cattacttaa tatataaaga cgcatatgaa aaaaaacttg attatctaat tgtactcgag
     3841 gatgactctt ttgtagatga aaattttgat gatgtaatta ataggttact tgtaaaaata
     3901 acaccagatg atgatgctat tatatttata caaaagcata cccttgactc taaagtgatt
     3961 tttagtcgaa aaaaagatat attgaaaaac ggttttgagt tggtaaaaat gttaggaagt
     4021 tcacaatatt ttgttgggtc atatggctat attctaacta aaaaatcaat taacaaaata
     4081 atacagaact atttgccaat atattgtgtt tgcgaccatt ggttctttat taaaaaagat
     4141 agtaagatag agtcatttta ttgtgtgagc ccaagtttag tatatactaa tgatgaagat
     4201 attagactgg ttgatagttt tatcaatgaa gaaaggaaaa atgttctgaa aaatcgaggt
     4261 gtatcacgta ttgggagaat aaaaataatt ataaaacgtg tagtgctgag attgttaaat
     4321 aaggattggg aatagtgttt tatatttgta aggtaatcac cgttttaatc aaggttataa
     4381 tttcattctt ggtgtttcca ttgtgtaagc catttagtaa taaaaataaa aaagtggttg
     4441 taataggaac tcgaaatgga aatcaaggta atgataatgg tgaggttttt tattcatatt
     4501 taaatgacaa taatgacaat gacgatcttc tggtttattt aatacggaga agtaagaata
     4561 aggagaaata taaaaatatc ctaataaaaa actccatcag agctaacatt aagattttaa
     4621 gtgcggacat attatatata acacattcag aatcagattt aattgacttc tggtggcgat
     4681 tcgttactta taaaaaaata gtttttattc agcatggtgt tataggaata aaaagacttc
     4741 ctgagtacga aaagaaaaaa ttctctcttt ttgtttcaag caacaattat gaatatgaga
     4801 ttttgattaa atattataat atatgtagcg aaagaatagt taaatcagga atacctaggt
     4861 ttgataatta tactatattg aacgaagccc cacagaaaat aaaaaaatgc ctagtcatgt
     4921 ttacatggcg aaaattttat aaagatgaac aatcaatcag attgaagcgt gttattagta
     4981 caataattag aaatgagcct tcaataaaga tatacgttgc atcgcacgaa ttatctgatt
     5041 attcactgtc agaatttgaa ttttataata tcaattatgt ggaatcaata ggtatacaga
     5101 atgcaattaa agagtgtgat ctattaataa ctgattattc aagtattgct tgggattttt
     5161 tatatcaaaa taaattgatt tgctttatac aaactgatta tttagaatat gttttcaatg
     5221 agggtgtcta tttccattgt gatgattttt ttggttatat tatcagggat ctaagtgata
     5281 ttaatgatgc ctttatttcg gaaattttaa gagttaataa gttaaataat caagaattct
     5341 taaaaagata ccctttttat ataaactata agaaaaagca ctctgagtta ttatttctag
     5401 agacaatgga atataatcga tgaaaattat tatatatgcg acagcagcag ttgatggtgg
     5461 cgctctttcg cttttaaatg atttgctgga atatgcgaat gatgatattg ataatgaata
     5521 tactgtttgc gttaatgaaa aattaaataa cgaagtgtct gtttacaata atttgacatt
     5581 tttatttgtt gatactaaag cttggcataa aagggtttat tttgacttta tagggtttaa
     5641 aaaaaacttt gataataaag attattgctt ggtaataaat ttgcaaaata taccagttcg
     5701 gacacaatta aaacaaatat tgtacttgca tcagcctttg cctttttcgg atattaagtt
     5761 aaatattttg gagaagcgta atagaaaatt gatattctat aaatacttat atggattaat
     5821 aataaaattt aattcatgtt ttattgatca ttgcttagtg caaactgagt ggatgagaaa
     5881 agctgttatt gataaactaa acctgtctga gaaaaaaata agtataatta gaccagtaat
     5941 agatattgat ttgaacaaaa ttttaaaaaa tgaaaatgaa aatgaaaata cattcatcta
     6001 tcccgcagca tcttatagtt ataaaaatca tataatattg gttgaatcat taaatatgat
     6061 tggtgtggat tttttgtttc agaataagat aactgttata tttacattag atcgtgatga
     6121 aaattcgaag ttgtttgatc ggataaaaaa atataatctt caagagatta ttaaatttac
     6181 aggaaatatc ccaagatatg atgttttaaa ttacatttat aatgctaaag ccttactgtt
     6241 tccatcaaga ctagaaacat ttggtatacc attgatagaa gctgtaaaat ttaattctaa
     6301 cataattgta agtgatctac cttatgcgca cgacgtattg gatggttatg aaaatgtcaa
     6361 atactgtaat cctgattctc cagaggattg gtctgaagca atcaaatttg ctatcaatct
     6421 aaaagagaat aaattaaatc agggctttga attaaattca gggtggagag agttgagttc
     6481 gattatttca actctttaat taggctagat ataaaaaggt gtggtatgtt taaagataaa
     6541 gttttattaa taaccggtgg gactggttct tttggaaatg ctgtattgcg gcgatttctt
     6601 gacacagata ttaaagaaat tcgtgttttt tcgcgtgatg aaaagaaaca agatgatatg
     6661 cgaaaaaaat acaataatga taaattgaaa ttctatattg gtgatgtcag agattataga
     6721 agtattttaa atgctacacg aggtgttgat tatatttatc atgcagctgc attaaaacaa
     6781 gttccttcgt gtgaattcca tcctatggag gcagttaaga ccaacgtgtt aggtactgag
     6841 aatgtgttgg aggctgcaat ttctaatgga gttaaacgag tagtttgttt gagtactgat
     6901 aaagccgtgt accccattaa tgtaatgggg atttccaaag caatgatgga aaaagtaatt
     6961 gtagcgaaat cgcgtaattt ggatagttct aaaactgtca tttgtggaac tcgctatggc
     7021 aacgttatgg catcgcgtgg ctcagttatt cctctgtttg tggatttgat taaagcagga
     7081 aaaccgctaa cagtgacgaa ccctgatatg acaaggttta tgatgacgct tgaagatgcg
     7141 gtagacctag ttctttatgc atttgaacat ggtaataatg gcgatatttt cgtacaaaaa
     7201 gcaccagcag ctaccattga aactttagca attgcactca aggaactatt gggtgctaat
     7261 gaacatccgg tcaaaattat aggtaccaga cacggcgaaa aattatatga ggcgttattg
     7321 agtcgtgaag agatgatcgc agcaatcgat atgggagaat attactgtgt tccgccagac
     7381 ttgcgtgacc ttaactatag taaatatgtt gagcatggtg attgtcgaat ttcagaaatt
     7441 gaagactata attcacacaa tacagtaagg ctggatgtta aaggaatgaa ggaattattg
     7501 cttaaactac cgtttgttcg agctttgata gctggtgaag cttttgaatt ggattcataa
     7561 tatgaaaata ctaattactg gttctaaagg ttttattgct cgtaatttaa tctatcgcct
     7621 gcaggaagca ggctttaaag atttaattac gatcgaccgt gaatcacctt tgcaagagtt
     7681 agaacaggga ctcaaaattg ctgattttat ttatcatctt gctggtgtaa ataggccaaa
     7741 ggaagaacat gagtttcagg agggaaatac tgatcttaca aaattaattg ttgactatct
     7801 gctttgtaat gcaaaaaaga ctcctattat gcttagttcc tccattcagg ctgaatgtga
     7861 taacgcgtat ggaaaaagca aggcatcggc ggaaaaaatc attcaacatt atggtcatgt
     7921 tagtggcgca gaatattata tctatcgatt accaaatgtg ttcggtaagt ggtgtcgacc
     7981 aaattacaac tcctttgttg caactttttg tcataggata gcaaacgatc aagatattat
     8041 cattcatgac ccgacagcag aggtcgagct tgtttatatt gatgattttt gtactgatgc
     8101 tatcaactta ttaaataaca agtacgcgtc aggttttaaa aatataaagc cgacgtattc
     8161 aataacagtg ggtgaggtag caaatctaat ttataaattt aaagaaagta gacatactct
     8221 tattacggaa aatgttggtc agggtttttc acgagcgtta tattcaactt ggcttagtta
     8281 cttgcaacca gagcagttcg tgtatgcagt gccttcctat agtgatgaaa gaggagtgtt
     8341 ctgcgaggtc ttaaaaaccc attcctctgg acaattttca ttttttaccg cacttccagg
     8401 agtaacgcgt ggagggcact atcatcatac aaagaatgaa aaatttatcg ttattcgtgg
     8461 aacagcatgt tttaggttta aaaatgtttt aacaggagaa cgatatgaga ttaatgttgc
     8521 gtcagatgaa tataaaattg tagaaactgt gccaggttgg tcccatgata ttactaatac
     8581 cggtcatgat gaattaatcg taatgttgtg ggcgaatgaa atatttaatc gtgatcaacc
     8641 tgatactata gcgagcgttt tatcatgaaa aaattgaaag tcatgtcggt tgttgggact
     8701 cgtccagaaa ttattcgact ttcgcgtgtc cttgcaaaat tagatgaata ttgtgaccac
     8761 cttattgttc atactggaca aaactacgat tatgaattga atgaagtttt tttcaaagat
     8821 ttgggtgttc gcaaacctga ttattttctt aatgccgcag gtaaaaatgc agcagagact
     8881 attggacaag ttattattaa agttgatgag gtccttgaac aggaaaaacc agaagccatg
     8941 ttagttcttg gtgatactaa ctcctgtatt tcagcaatac cagcaaagcg tcgaagaatt
     9001 ccgatcttcc atatggaggc tgggaatcgt tgttttgacc aacgcgtacc ggaagaaact
     9061 aacagaaaaa tagttgacca taccgctgat atcaatatga catatagtga tatcgcgcgt
     9121 gaatatcttc tggctgaagg tgtaccagcc gatagaatta ttaaaactgg tagcccaatg
     9181 tttgaagtac tcacgcatta tatgccgcag attgatggtt ccgatgtact ttctcgcctg
     9241 aatttaacac ctgggaattt ctttgtggta agtgcccaca gagaagaaaa tgttgatacc
     9301 cctaaacagc ttgcgaaact ggcgaatata cttaataccg tagctgaaaa atatgatgtc
     9361 ccggtagtcg tttctactca tcctcgcact cgtaaccgca tcaacgaaaa cggtattcaa
     9421 ttccataaaa atatcttgct tcttaagcca ttaggatttc acgattacaa ccatctgcaa
     9481 aaaaatgcgc gtgctgtttt atcggatagt gggactatta cagaagagtc ctccattatg
     9541 aacttccctg cactcaatat acgagaagcg cacgaacgcc cggaaggctt cgaagaaggg
     9601 gcagtaatga tggtcggcct tgaatctgag cgcgttttac aggcattaga aattatcgca
     9661 acacagcctc gtggagaagt acgcttactc cgtcaggtca gtgactatag catgccaaat
     9721 gtttcagata aagttgtgcg tattatccat tcatacactg actacgttaa acgggttgtc
     9781 tggaagcaat actaatgaaa cttgcattaa tcattgatga ttatttgccc catagcacac
     9841 gtgttggggc taaaatgttt catgagttag gccttgaatt gctgagcaga ggccatgatg
     9901 taactgtaat tacgcctgac atcacattac aagtaatcta ttctgttagt atgattgatg
     9961 gtataaaggt ttggcgtttc aaaagtggcc ctttaaagga tgtaggtaag gctaaacgtg
    10021 ccataaatga aactctttta tcttttcgtg catggcgcgc atttaagcac ctcattcagc
    10081 atgatacatt tgatggtatt gtttattatt ccccctctat tttttgggga gacttggtta
    10141 aaaaaataaa acagcgatgc cagtgcccaa gctatctggt cctgagggat atgtttccac
    10201 agtgggttat tgatgcaggt atgttgaaag ccggttcacc aattgaaaaa tatttcaggt
    10261 attttgaaaa aaaatcatat cagcaggctg accggatagg gttaatgtct gataagaatc
    10321 ttgagatatt tcgtcaggcc aataaaaatt atccgtgtga agttttacgt aattgggcct
    10381 caatgactcc tgtgtctgcc agcgatgatt atcattcact tcgtcaaaaa tacgatctaa
    10441 aagataaagt tatttttttc tatggcggaa atattgggca tgctcaagat atggcaaact
    10501 taatgcgcct tgcgcgtgat atgatgcgtt atcatgatgc tcatttcctg tttatagggc
    10561 agggtgatga agttgacctg ataaaatctc ttgctgtaga atggaattta actaatttca
    10621 ttcatctacc ttcagtgacc caagaagagt tcaaattaat tttatctgaa gttgatgtcg
    10681 gcctattctc cctttcatct cgccattctt cacataattt ccccgggaaa ttactcgggt
    10741 atatggttca ttcaatcccg attcttggga gtgtgaatga cggcaatgat ttgatggata
    10801 taattaacaa gcacagggcc ggttttattc atgttaatgg tgaagatgat aaactgtttg
    10861 aatctgcaca attgcttctt agtgattcag ttttaagaaa acagttaggt cagaacgcta
    10921 atgtgttgtt aaagtctcaa ttttcggttg aatcggcggc acatactatc gaagtccgac
    10981 tggaggcagg agaatgcatt tagttgatga caatattctg gatgaacttt ttcgcactgc
    11041 agtaaattct gaacgtttgc gcgctcatta tttattgcac gcatctcatc aggagaaagt
    11101 tcaacgttta cttattgcat ttgtacgcga cagctatgtt gaaccccatt ggcatgagtt
    11161 accgcatcag tgggaaatgt ttgtcgtcat gcaagggcaa ttagaagttt gtttgtatga
    11221 gcaaaatggt gagatccaaa aaaagtttgt tgttggagac ggtacgggaa taagcgtcgt
    11281 ggaattttcc ccaggagata tacatagtgt caaatgcctg tcaccaaaag cccttatgtt
    11341 agagataaag gaggggccat ttgacccact gaaagctaag gttttttcta agtggttata
    11401 gggcgataca tcaccgttta ttcttctatc ttattctata catgctgggt taccatctta
    11461 gcttcttcaa gccgcacacc cgcagcgaac acccctgaca ggagtaaaca atgtcaaagc
    11521 aacagatcgg cgtcgtcggt atggcagtaa tggggcgcaa ccttgcgctc aacatcgaaa
    11581 gccgtggtta taccgtctct attttcaacc gttcccgtga gaagacggaa gaagtgattg
    11641 ccgaaaatcc gggcaagaaa ctggttcctt actatacggt gaaagagttt gttgaatctc
    11701 tggaaacgcc tcgtcgcatc ctgttaatgg tgaaagcagg tgcaggcacg gatgctgcta
    11761 ttgattctct caagccatac ctcgataaag gcgacatcat cattgatggt ggtaacacct
    11821 tcttccagga caccatccgt cgtaaccgtg agctttctgc agaaggcttt aacttcatcg
    11881 gtaccggtgt ctccggcggt gaagaaggtg cgctgaaagg tccttccatt atgcctggtg
    11941 ggcagaaaga agcctatgaa ctggttgcgc cgatcctgac caaaatcgcc gcagtggctg
    12001 aagatggcga accgtgcgtt acctatattg gtgccgatgg tgcaggtcat tatgtgaaga
    12061 tggttcacaa cggtattgaa tacggtgata tgcagctgat tgccgaagcc tattctctgc
    12121 taaaaggtgg cctgaacctt accaacgaag aactgtcaca gacctttacc gaatggaata
    12181 acggtgaact gagcagctac ctgatcgaca tcaccaaaga tatcttcacc aaaaaagatg
    12241 aagacggtaa ctacctggtt gatgtgattc tggatgaagc agcaaacaaa ggtacgggta
    12301 aatggaccag ccagagtgcg ctggatctcg gtgaaccgct gtcgctaatt accgagtctg
    12361 tgtttgcacg ttatgtctct tctctgaaag atcagcgtgt tgccgcatct aaagttctct
    12421 ctggcccgca agcgcagcca gctggcgaca aggctgagtt catcgaaaaa gttcgtcgtg
    12481 cgctgtatct gggcaaaatc gtttcttacg cccagggctt ctctcagctg cgtgctgcgt
    12541 ctgaagagta caactgggat ctgaactacg gcgaaatcgc gaagattttc cgtgctggct
    12601 gcatcatccg tgcgcagttc ctgcagaaaa tcaccgatgc ttatgccgaa aatccacaga
    12661 tcactaacct gctgctggct ccgtacttca agcaaattgc cgatgactac cagcaggcgc
    12721 tgcgcgatgt cgtcgcatat gcagtacaga acggtatccc ggttccgacc ttcgccgctg
    12781 cggttgccta ttatgacagc taccgtgccg ctgttctgcc tgcgaacctg atccaggcac
    12841 agcgcgacta
//