LOCUS       KJ778789               12349 bp    DNA     linear   BCT 29-MAR-2016
DEFINITION  Escherichia coli strain Bi 7455-41 serotype O43:K-:H2 O-antigen
            gene cluster, complete sequence.
ACCESSION   KJ778789
VERSION     KJ778789.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 12349)
  AUTHORS   DebRoy,C., Fratamico,P.M., Yan,X., Baranzoni,G., Liu,Y.,
            Needleman,D.S., Tebbs,R., O'Connell,C.D., Allred,A., Swimley,M.,
            Mwangi,M., Kapur,V., Raygoza Garay,J.A., Roberts,E.L. and Katani,R.
  TITLE     Comparison of O-Antigen Gene Clusters of All O-Serogroups of
            Escherichia coli and Proposal for Adopting a New Nomenclature for
            O-Typing
  JOURNAL   PLoS ONE 11 (1), E0147434 (2016)
   PUBMED   26824864
  REMARK    Publication Status: Online-Only
REFERENCE   2  (bases 1 to 12349)
  AUTHORS   Yan,X., Fratamico,P.M., Tebbs,R.S., O'Connell,C.D., Swimley,M.,
            Baranzoni,G.M., Debroy,C. and Liu,Y.
  TITLE     Direct Submission
  JOURNAL   Submitted (30-APR-2014) Molecular Characterization of Foodborne
            Pathogens Research Unit, USDA-ARS, 600 East Mermaid Lane, Wyndmoor,
            PA 19038, USA
COMMENT     ##Assembly-Data-START##
            Assembly Method       :: CLC Genomics Workbench v. 7.0
            Coverage              :: >50X
            Sequencing Technology :: IonTorrent
            ##Assembly-Data-END##
FEATURES             Location/Qualifiers
     source          1..12349
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /strain="Bi 7455-41"
                     /serotype="O43:K-:H2"
                     /db_xref="taxon:562"
     misc_feature    1..12349
                     /note="O-antigen gene cluster"
     gene            76..1389
                     /gene="wzx"
     CDS             76..1389
                     /gene="wzx"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen flippase"
                     /protein_id="AIG62642.1"
                     /translation="MSLVKIIPKHLWVAASSWGARGISACVQIVSVHYLVSLLGEDKY
                     SAFILLGGLITWCNLSDFGIGNSILNYIAERRAQDKNYEYFILVGSVIVFILFFIVAV
                     FLCFLSMTVAEQYLKIYSDAIINNKIILFYISTLIFCGTALAGIIYKIWYAEQIGWLS
                     NLFPAVCALIGLLNIIVVRKIDGNFSDLLIVFVLFYLPALIIPIYLLLKRYRFEIRKT
                     KLNRRLFAGASLKIIERARPFFIFAVMGAIVLQTDLIVLSQKGDASEIILYGVLLKIF
                     NVIYFIYSAVLQAWWPVCTELRIKKQWVELKKSIRLSVGLGALAITTLIFLVYCLQDV
                     VFKLLGLGGIEKGSFILYCLFCLYFIIRAWCDTYAVLLQTMNSMKPLFIIVPIQALIN
                     FILQWYFISILSLTGILIGSIISFLCTVAIYLPYKFNQQIKKQTH"
     gene            1405..2148
                     /gene="epsH"
     CDS             1405..2148
                     /gene="epsH"
                     /codon_start=1
                     /transl_table=11
                     /product="glycosyl transferase"
                     /protein_id="AIG62641.1"
                     /translation="MRKKLSIVTVVYNGERFIENAINSVISQKNEQVEYIIVDGGSTD
                     STLNIIEKYKNKIDIFISEKDKGIYDAMNKGWSKATGEYVAFLNSDDFYQPGLLNSVL
                     NETNKNPDMIVTNTLIQDGEGKRKLFNRVTRKEDYKLHLRLPFMHPSVFIKKCIISKH
                     NGFSLNYKIASDCDLLLKVLNESISIEYVNAYIVMRLGGVSDVNYKLGRKEYRDIYFN
                     HFNRKIKANIGYVESLLSHYCYKAIRILK"
     CDS             2145..2666
                     /codon_start=1
                     /transl_table=11
                     /product="acetyltransferase"
                     /protein_id="AIG62640.1"
                     /translation="MKSLKIYLWELFFSKIPCNFIRRIFFSKVLNNKINNNISLLRNI
                     HLTSTDGISIDEKTTINKNVYIDGRGGVTIGSNVSISPYVRIITASHDVNCPNFSLIL
                     KPVIIKDYVWICTSSIILPGVTLGYGAIVAAGAVVTKNIPDYAIVAGNPAKVIGYRSE
                     TLHYNPLWRPTFQ"
     gene            2663..3733
                     /gene="wffZ"
     CDS             2663..3733
                     /gene="wffZ"
                     /codon_start=1
                     /transl_table=11
                     /product="glycosyl transferases group 1"
                     /protein_id="AIG62639.1"
                     /translation="MRKYYICRDFSEACGISKYGYVFFSTILKEYGFEKIHLKDVNDV
                     SQVLSKINCDDKVWIEIGLGTYLETLLYKKLIRKNNQNVIITLHDAPFIEYPILKFKN
                     QPFNLLSKINQYVFLRWPFTSFFYSYLHKTKRIYTLNPKGTESLLNRYRLHNVVTIPH
                     VLHNIEEVDNKKSGILQFLYFGFIGKNKGLEYALSLHEKINTLVKTPITMKIIGKTLD
                     EKSEKYFQKIKRRYNENVEYLGYVEDKELDILMQQDNIILLPTKNYKVIKPTSGSVLN
                     SLKYLNIVFTTKVNANECLISDKENGFFLQGDINSDTFNILSIINNSDLRNKIRLNIY
                     NDLMMKYIPIKVINEIKVDDYR"
     gene            3720..4931
                     /gene="wzy"
     CDS             3720..4931
                     /gene="wzy"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen polymerase"
                     /protein_id="AIG62638.1"
                     /translation="MTIAKKKQLNLINFIRRFSILFFLIIFLSLSPNYIFIFYPELKF
                     VIAILGAILALLGICDVRKIFKTYSSLFLFLFYGVLFFTSIISYIIYGNLNGVYFSLS
                     ILFKFLIVIIFVMSLKDIDILFLIKILINIMAVVCLFSLIGEFLYILNIIAVTNSFEF
                     QTYLYHVISYWGAFTVSFDIYGMKIIRNQSFFQEPGFFAFYIFITMIFISIVQKLYSK
                     NHFFILYGLFFLTMLSTLSLTGIALSAILSVYIFRGVVINSIASIISMSILTYILISD
                     NPYVNKIGSLDERLYGLINGANVFYSNPMVFLLGAGYESEPLFMFDGKFNNLFFEILL
                     YSGIFNLFIYMGFIIYIFRKCYGIKFKYFLVIIYCMTTPLFWSPIMIIFNVVLLRYNG
                     VKQSLLRLNEK"
     CDS             4928..5974
                     /codon_start=1
                     /transl_table=11
                     /product="mannosyl transferase-like protein"
                     /protein_id="AIG62637.1"
                     /translation="MILLDGIIFSLQMSGGISVYFYELIKHLDSQRKKHEIILYKNNN
                     DLIKNYATNAEFRFSINIERFLRCRNFCSEATIFHSSYYRLPERQFRGKIITTVHDFT
                     DEIYPRNAYAKILSYQKKKTILNSDGIICISDNTKRDLLNFIPEAKGIPIKVIYNGVG
                     DFSYNPDCVRNIASFKQPYALFVGGRKKYKNFNVCVQTLSQYKNINLVIVGGGDLDFQ
                     ELKMLNRYLKGRYYKKGYVDDQQLNNLYTCALFLFYPSQYEGFGIPVLEAMKSGCPVI
                     ATDCSSVREIASGYALLAKEATVEQFSKCINLLLDESFREKMIYNGLYAKKFTWDKCF
                     SDTVSFYDEVRYLK"
     gene            5971..7089
                     /gene="gmd"
     CDS             5971..7089
                     /gene="gmd"
                     /codon_start=1
                     /transl_table=11
                     /product="GDP-mannose 4,6-dehydratase"
                     /protein_id="AIG62636.1"
                     /translation="MKVALITGITGQDGSYLAEFLLEKGYEVHGIKRRASSFNTDRVD
                     HIYQDPHISNPKFHLHYGDLTDTSNLTRILSEVRPDEVYNLGAMSHVAVSFECPEYTA
                     DVDAIGTLRLLESIRFLGLENKTRFYQASTSELYGLVQEVPQKETTPFYPRSPYAVAK
                     LYAYWITVNYRESYGMFACNGILFNHESPRRGETFVTRKITRAIANISQGIEKCLYLG
                     NLDSLRDWGHAKDYVRMQWMMLQQDKPEDFVIATGKQISVREFVRMSAKEVGLELEFT
                     GKGVDEIATVVNKTSDCAVGVNIGDVIVRVDPRYFRPAEVDTLLGDPTKAKEVLGWEP
                     EITIEKMCSEMVASDLEKAKQHAFLKSHGYDVAVSLER"
     gene            7093..8058
                     /gene="fcl"
     CDS             7093..8058
                     /gene="fcl"
                     /codon_start=1
                     /transl_table=11
                     /product="GDP-L-fucose synthase"
                     /protein_id="AIG62635.1"
                     /translation="MTKKRIYVAGHRGMVGSAICRHLSEFHDVELVVKTHKELDLTNQ
                     QDVETFFEQEKIDEVYLAAAKVGGIHANNTYPAEFIYQNLMIESNIINSAHRAGINKL
                     LFLGSSCIYPKFAEQPMKESSLLTGVLETTNEPYAIAKIAGIKLCESYNRQYGCDYRS
                     VMPTNLYGTNDNFHPNNSHVIPALMRRFHEAKELGLNEVVVWGTGTPKREFLYVDDMA
                     AASVYVMELDDEVYKKNTQPMLSHINVGTGVDCSIREMAETMALVVGYEGKIVFDRTK
                     PDGAPRKLMDVTRLEKLGWKYRYNLKEGLELTYKWFINNLDSFRR"
     gene            8061..8516
                     /gene="nudD"
     CDS             8061..8516
                     /gene="nudD"
                     /codon_start=1
                     /transl_table=11
                     /product="GDP-mannose mannosyl hydrolase"
                     /protein_id="AIG62634.1"
                     /translation="MNKRLAPELFKSIVEHTPLISIDLIIRNEEGKALLGQRLNRPAQ
                     NYWFVPGGRILKDESFENAFKRVTLEELGVQISINEAKFLGAYEHFYSDNFSGTNFST
                     HYIVLGYEINTMSHQINYPTLQHSTYNWFDIAELLADSSVHQYTKNYFK"
     gene            8528..9931
                     /gene="manC"
     CDS             8528..9931
                     /gene="manC"
                     /codon_start=1
                     /transl_table=11
                     /product="mannose-1-phosphate guanylyltransferase 1"
                     /protein_id="AIG62633.1"
                     /translation="MLLPVVMAGGSGTRLWPLSRTLYPKQFLSLTSRLTMLQETLRRL
                     EGVEHRPALVICNEVHRFIVAEQMRNEHLANSGILLEPKGRNTAPAVALAALKAVSSG
                     EDPILLVLAADHDIQDQERFISSILAAKEFAEEGKLVTFGIVPTKPETGYGYIKTGEN
                     LNEYGFKVSAFVEKPELDVAKKYLEDGGYLWNSGIFMFRASVFIDELNKFRPDILKIC
                     QQALKSSTQDLDFIRIDNDSFSCCPEESIDYAVMEKTTEAVVVPLNAHWSDVGSWSAL
                     WEISSKDKSGNAIRGDVLIHDSSDSYLYSQHRLIGVVGVKDLVVVETKDAILVAHKDK
                     VQKVKNIVEQLKVNNRAEYQQHREIFRPWGSHDSIAEGSRFQVKHVVIHPGHKTAKQI
                     HYHRTEHWIVVSGTAKVHYEDEIFLVSENESTYIPIGVPHFIENPGKIPLEIIEVRSG
                     VYLDEDDVVRILNDDGY"
     CDS             9997..10743
                     /codon_start=1
                     /transl_table=11
                     /product="PGL/p-HBAD biosynthesis
                     glycosyltransferase/MT3031"
                     /protein_id="AIG62632.1"
                     /translation="MKVSIITVTYNSEKTLRNTLESIELQTYSDIEYIIIDGGSTDNT
                     LKIINEVSTRVTRCLSESDKGIYDALNKGINLSTGDIIGFVHSDDVLARPDIIETIVG
                     RFHETKADVVYGDLVFFEKNQIDIIKRYWRSGPFKRSKLSLGWAPPHPSFYMRRELYK
                     DDGYFDLSYRIAADYDQMVRVLKRDDIKVSYVPQVFVKMRLGGESTRIDNAISSTKEI
                     VAVMKNHNVNWKFAIIIRKISKLMQLFAHK"
     gene            10768..12138
                     /gene="manB"
     CDS             10768..12138
                     /gene="manB"
                     /codon_start=1
                     /transl_table=11
                     /product="phosphomannomutase"
                     /protein_id="AIG62631.1"
                     /translation="MKKLTCFKAYDIRGKLGEELNEDIAWRIGRAYGEFLKPKTIVLG
                     GDVRLTSETLKLALAKGLQDAGVDVLDIGMSGTEEIYFATFHLGVDGGIEVPASHNPM
                     DYNGMKLVREGARPISGDTGLRDVQRLAEANDFPPVDETKRGRYQQINLRDAYVDHLF
                     GYINVKNLTPLKLVINSGNGAAGPVVDAIEARFKALGAPVELIKVHNTPDGNFPNGIP
                     NPLLPECRDDTRNAVIKHGADMGIAFDGDFDRCFLFDEKGQFIEGYYIVGLLAEAFLE
                     KNPGAKIIHDPRLSWNTVDVVTAAGGTPVMSKTGHAFIKERMRKEDAIYGGEMSAHHY
                     FRDFAYCDSGMIPWLLVAELVCLKGKTLGELVRDRMAAFPASGEINSKLAQPVEAINR
                     VEQHFSREALAVDRTDGISMTFADWRFNLRSSNTEPVVRLNVESRGDVPLMEEKTKLI
                     LELLSK"
ORIGIN      
        1 ttggtatata tgcagtatgg tggtagctgt agagccaggg gcggtagcgt ggataattta
       61 aaggattagg ggtgaatgag cttagttaaa ataattccaa aacatttatg ggtcgccgct
      121 tcatcttggg gagctagagg gattagcgct tgtgtacaaa ttgtaagtgt gcattattta
      181 gtctctttac tcggagagga taaatattct gcttttattt tactgggggg gttaattaca
      241 tggtgtaatt tatctgactt cggtatcgga aatagtatat taaattatat cgcagaaaga
      301 agggcacaag acaaaaatta cgaatatttt atattagtag gatctgttat cgtttttata
      361 ttatttttta ttgtagcagt gtttctttgt tttttatcaa tgacagtggc agaacaatat
      421 ctaaaaatat actcagatgc tattattaat aataaaatta ttttgtttta tatatcaaca
      481 ttgatttttt gtggtactgc gcttgctggg attatttaca aaatatggta tgctgagcaa
      541 attggttggt tatcaaactt atttccggca gtctgcgcat taattgggct tttaaatatt
      601 attgttgttc gtaaaattga cggtaacttt agtgatttgc tgattgtttt tgttttattt
      661 tatttgccgg ctttgattat acctatttat cttttgttga aaagatatcg atttgaaata
      721 agaaaaacaa aattgaatcg aaggcttttt gctggtgcaa gtcttaagat tattgaaagg
      781 gctcgaccat tttttatttt tgcagtcatg ggggcgattg tccttcaaac tgatttaata
      841 gtactatctc aaaaaggaga tgcaagtgaa atcatattat atggagtgtt attaaagata
      901 tttaatgtga tatattttat ttatagcgca gttctccagg cgtggtggcc agtttgtacc
      961 gaattacgca taaaaaaaca atgggtggaa cttaaaaaaa gtataaggct atctgtaggg
     1021 ttaggtgcat tagcaataac cacgttaatt tttcttgttt attgtttaca agatgttgta
     1081 tttaaattgc taggtttagg gggaatagaa aaaggttcat ttatattata ttgtttgttt
     1141 tgtttgtatt ttatcattcg tgcatggtgt gatacctatg cagttttgtt acaaacaatg
     1201 aatagtatga agccgctgtt tattattgta ccgatccaag cgttgattaa ttttatattg
     1261 cagtggtatt ttatatcaat tctatcactg acaggtatat taattggttc aataatatca
     1321 ttcttgtgta ctgtcgcaat atatttaccc tacaaattca atcaacaaat aaaaaaacaa
     1381 acacactgat agagggagtg gttgatgcgg aaaaaattat caatagtgac tgtcgtatat
     1441 aatggggaga ggttcattga aaatgcaatc aatagtgtta tatcccaaaa aaatgagcaa
     1501 gttgaatata ttatagtaga tggggggtct acagattcaa cgttaaatat tatagaaaaa
     1561 tataaaaata aaatagatat ttttatttca gaaaaagata aaggtatata tgatgcaatg
     1621 aataaaggat ggagcaaagc tactggagaa tatgtggctt tcttgaatag tgatgatttt
     1681 tatcagcctg gattgctaaa ttccgtttta aatgaaacta ataaaaatcc ggatatgata
     1741 gtaactaata cgttgattca ggatggcgag ggaaaaagaa aattatttaa tagagtgact
     1801 agaaaagaag attataaatt acatttacga ctgccgttta tgcatccatc cgtgtttata
     1861 aaaaaatgta ttatatccaa acataatgga tttagtttaa attataaaat agcatcagat
     1921 tgtgatcttt tgcttaaagt gctaaacgaa tcaatttcaa ttgaatatgt caatgcttat
     1981 attgttatgc ggttaggtgg tgtaagtgat gtcaattata aattgggcag aaaagaatat
     2041 agagatatat attttaatca ttttaataga aaaataaaag ctaatatagg ttatgttgag
     2101 agtttattat cgcattattg ttataaagct ataaggattc taaaatgaaa tcgttaaaga
     2161 tttatttatg ggagttgttt ttttcaaaaa taccatgtaa ttttattcgg cgaatatttt
     2221 tctctaaggt tttaaataac aaaattaata ataatatatc attattgaga aatattcatc
     2281 taacttcaac tgatggtata tcaattgatg aaaaaacgac cataaataaa aatgtttata
     2341 tcgatggaag aggaggggtg acaattggtt ctaatgttag tatctcccct tatgtcagga
     2401 ttattaccgc gagtcacgat gtaaattgtc ctaatttttc tttaatactg aagcctgtga
     2461 taattaaaga ttatgtctgg atatgcacat cttctattat tttaccaggc gtaaccttgg
     2521 gctatggagc cattgtcgca gcaggagcag ttgttacaaa aaatattcct gattatgcta
     2581 ttgtcgctgg caaccctgcg aaggtaattg ggtatcgtag tgaaaccctg cactataatc
     2641 cattatggag acccacgttt caatgagaaa atattatatt tgtagagatt tttccgaagc
     2701 ctgtggaatt tcaaaatatg gatatgtatt ctttagtaca atactaaaag aatatggttt
     2761 cgaaaagatc catttaaaag atgtaaatga tgttagtcaa gtattatcga agatcaattg
     2821 tgatgataaa gtttggattg aaattgggtt gggaacatat ttagaaactc tattgtacaa
     2881 gaaattaatt aggaaaaata atcaaaatgt aataattaca ttacatgatg caccgtttat
     2941 tgaatatcct attttaaaat ttaaaaatca acctttcaat ttattatcca aaataaatca
     3001 atatgttttt ttgagatggc catttacgtc atttttttat agttatttac ataaaacaaa
     3061 gcgtatatat acactaaacc ctaaaggtac agaatcactt cttaaccgtt atcgtttgca
     3121 taatgtagtt actattccac atgttttaca taatatagaa gaagtagata ataagaaaag
     3181 tggtatacta cagttcttat actttggttt tataggtaaa aataaaggat tagaatatgc
     3241 gctcagttta catgagaaaa taaatacatt agttaaaacc cccattacaa tgaaaattat
     3301 tggaaaaaca ctagatgaaa aatctgagaa gtactttcaa aaaataaaaa gaagatataa
     3361 tgagaatgtt gaatatttag ggtatgttga agacaaagaa cttgatatat taatgcaaca
     3421 agataatatt attcttttac caacaaaaaa ttataaagtt ataaaaccta ccagtggaag
     3481 tgttcttaat tcgttaaaat atcttaatat tgtatttaca acaaaagtta atgctaatga
     3541 atgtctaata agtgataaag aaaatggctt ttttttacaa ggagatataa atagcgatac
     3601 atttaatatt ttaagcatta ttaacaattc tgatttaaga aataaaataa gattaaatat
     3661 atataatgat ttgatgatga agtatatacc aatcaaagtt attaatgaga tcaaagttga
     3721 tgactatcgc taaaaaaaaa caattgaact taataaattt tattcgcagg ttctctatac
     3781 tgtttttttt aattattttt ttatctttat ctccgaatta catatttatt ttttatcctg
     3841 aactaaaatt tgtaattgct attttgggtg caatacttgc attacttggc atatgtgatg
     3901 ttagaaaaat atttaaaaca tattcgtctc tattcttatt ccttttttat ggagtccttt
     3961 tttttacttc gataattagt tatattatat atggtaactt gaatggagtg tatttttcct
     4021 tatctatttt atttaagttt ctgatagtta tcatattcgt aatgtcttta aaagatattg
     4081 atattctatt tctgataaag atattaataa atattatggc tgttgtatgt ttgttttctt
     4141 taattggaga gtttttatac attctaaata ttatagcagt aacaaacagt tttgaatttc
     4201 aaacatattt atatcatgtt atttcttatt ggggagcttt tacagtttca tttgatatat
     4261 atggcatgaa gataattaga aatcaatctt ttttccaaga gccgggtttt tttgcatttt
     4321 acatttttat cacaatgatt tttatttcaa tagtgcagaa gctatatagc aaaaaccatt
     4381 ttttcatact atatggtttg ttcttcttga ctatgctatc tacgctttct cttacaggaa
     4441 ttgcgttatc agccatatta agtgtgtaca tatttagggg ggttgttatt aattcaatcg
     4501 caagcattat cagcatgtca attttgactt acatattgat ctctgataac ccctatgtta
     4561 ataaaatagg ttctttagac gaacgtttgt acggattaat taatggggct aatgtatttt
     4621 attcaaaccc catggttttt cttttaggtg ccggttatga gtcggaaccg ctatttatgt
     4681 ttgatgggaa attcaataat ttatttttcg aaatactatt atactctggt atttttaatt
     4741 tgtttattta tatgggtttt attatttata tcttcaggaa atgttatggg attaagttta
     4801 aatattttct tgtcattata tattgtatga caacaccact attttggtcg cctattatga
     4861 taatttttaa cgttgtttta cttcgctaca atggggtaaa gcagagtctg ttaaggttaa
     4921 atgaaaaatg attttattag atggaataat tttttcgttg caaatgtcgg gtggaatatc
     4981 agtttatttt tatgagctaa ttaaacatct cgatagccaa agaaaaaagc atgaaatcat
     5041 tttgtataaa aataataatg atttaattaa aaattatgcg acgaatgcag agtttcgatt
     5101 ttctataaat atagaaagat ttctgagatg tcgtaatttt tgttcagaag caacaatatt
     5161 tcattcaagt tattatcgtt tgccagagag gcagtttaga ggaaaaataa taactacagt
     5221 tcatgatttt acggatgaga tatatcccag aaatgcttat gctaagatac ttagttacca
     5281 aaaaaagaaa actattttaa atagcgatgg aattatttgc atctctgata ataccaaaag
     5341 ggatctattg aattttattc ctgaagcaaa aggaattcct ataaaagtta tatataatgg
     5401 agttggagat ttctcttata atccagattg tgtaagaaac attgcttcat ttaaacagcc
     5461 atatgcatta ttcgttggag gacgaaaaaa atacaagaac tttaatgtct gtgtccaaac
     5521 actcagtcaa tataaaaata ttaatcttgt gattgttggt ggaggtgatc tggattttca
     5581 agaattaaaa atgttaaata gatatttaaa aggacgttat tataaaaaag gttatgtaga
     5641 tgaccagcaa ttaaataatc tttacacctg cgctttattt ttattttatc catcccaata
     5701 tgaagggttt ggtattcctg tgttagaagc aatgaagtct gggtgtcctg taattgcaac
     5761 tgattgttct tctgtaagag agatagcatc aggatatgct ctgctagcca aagaggcaac
     5821 tgttgaacaa ttttctaagt gtattaattt attattagat gaaagtttta gagagaaaat
     5881 gatatataat ggtctttatg ccaagaaatt cacttgggat aaatgctttt ctgatactgt
     5941 tagtttttat gatgaggtga gatatttaaa atgaaagtag ctctgattac gggtattact
     6001 ggacaagacg gttcttattt ggctgaattt ttattagaaa agggatacga agttcacggt
     6061 atcaaacgtc gagcatcttc gttcaacact gatcgagttg atcatattta tcaggatcca
     6121 catattagta atccaaaatt ccatcttcat tatggtgatc taactgatac ttctaactta
     6181 acacgtatac tttcagaagt taggccagat gaagtatata atttaggagc tatgagtcat
     6241 gttgcagttt cctttgaatg tccagaatat accgctgatg ttgatgcaat tggaacgtta
     6301 agattgttgg agtctattcg ttttttagga ttagaaaata agacaagatt ttatcaagca
     6361 tcaacatctg agttgtatgg attggttcaa gaagttccac aaaaagaaac aacgcctttt
     6421 tatccaagat caccatatgc agttgccaag ctttatgcct attggataac tgttaactat
     6481 cgtgaatcat atggtatgtt tgcttgtaat ggcattttgt tcaatcatga atccccacgc
     6541 cgtggagaaa cattcgtaac gcgtaaaatt acacgtgcta tagctaacat ttctcaaggt
     6601 attgaaaaat gcctatatct cggtaatctg gattcgcttc gtgattgggg acatgctaaa
     6661 gattatgttc gtatgcaatg gatgatgctc caacaagaca aaccagagga tttcgttata
     6721 gcaacaggta aacaaatatc tgtgcgtgaa tttgttcgta tgtcagctaa agaagttggt
     6781 ctggaattag aattcactgg taaaggtgta gatgaaatag caaccgttgt taataaaaca
     6841 tctgactgtg ctgttggggt aaacattgga gatgttattg ttcgcgtaga ccctcgctat
     6901 ttccgtcccg cagaggttga tacgctgttg ggggatccaa ctaaagcgaa agaagtgtta
     6961 ggatgggaac cagaaattac tattgaaaag atgtgttcag aaatggttgc tagtgattta
     7021 gaaaaagcaa aacagcatgc atttcttaaa agccatggtt atgacgtagc agtatctctg
     7081 gagcgttgag taatgacaaa gaagcgtatt tatgttgcgg ggcatcgtgg tatggttggt
     7141 tctgctatat gccgacactt atcagaattt catgatgtcg agttagttgt aaaaactcat
     7201 aaagaactcg atttgactaa tcaacaagat gtcgagactt tttttgaaca agagaaaata
     7261 gatgaagtat atcttgccgc tgcaaaagta ggtggaattc acgctaataa tacatatccg
     7321 gcagaattta tttatcagaa tcttatgata gaaagtaata taatcaattc ggctcataga
     7381 gcaggtatta ataaattact ttttttaggt tcaagttgta tttatcctaa gtttgcagag
     7441 cagccaatga aagaatcttc acttttaaca ggtgtactcg aaactacaaa tgagccatat
     7501 gcaatagcta aaattgcagg tataaaattg tgtgagtctt acaatcgtca atatggatgt
     7561 gattatcgca gtgtaatgcc tactaatttg tatggtacga atgataattt tcatcctaat
     7621 aactcacatg taattccagc gctcatgagg cgttttcatg aagcaaagga gttggggtta
     7681 aatgaagtag ttgtctgggg gactggaaca ccaaaacgtg agtttttata tgttgatgat
     7741 atggcagctg cgtcagtata tgtgatggag cttgatgatg aagtttacaa aaaaaatacg
     7801 caaccaatgt tatctcatat taacgtaggt actggtgttg attgttctat acgcgaaatg
     7861 gcagaaacaa tggctttagt tgttggctat gaaggaaaaa ttgtttttga tagaactaaa
     7921 ccggatggcg caccgcgtaa acttatggat gttactcgtc ttgaaaaact gggctggaaa
     7981 tatcgttata atttaaagga aggactagaa ttaacttata agtggtttat aaataacctt
     8041 gactcattta ggagataata ttgaataaga gattagcacc tgagttattt aaatcaatag
     8101 tcgaacatac tccactaatc tcgatagatc ttattataag aaacgaagaa ggtaaggcgc
     8161 tgcttggcca gcgcctcaat cgtccagcac aaaattattg gtttgtgccg ggggggcgaa
     8221 ttcttaaaga tgagtctttc gagaacgcat tcaaaagagt tacacttgaa gaactaggtg
     8281 ttcaaattag tattaatgaa gcaaaatttc ttggtgcata tgaacatttc tacagcgaca
     8341 acttttcagg aactaatttt tcaacgcatt atatagtact tgggtatgag attaatacga
     8401 tgtcacatca aattaactat ccaacactgc aacatagcac ttacaattgg ttcgatatag
     8461 ccgaattgtt agctgattct tcagttcatc agtacacaaa aaattatttt aagtgaaggt
     8521 tatttatatg ctacttcctg ttgtaatggc cggtggttct ggaactagat tgtggccact
     8581 ttctcgaaca ctatatccga aacaattcct atcgttaact agtcgtttga ctatgctaca
     8641 agagacctta agaaggcttg agggggttga acatcgtcct gctctggtta tttgtaatga
     8701 agttcatcgt tttatcgttg cagaacagat gcgtaatgaa catttagcga atagtggcat
     8761 tttacttgag ccgaaaggtc gtaatacagc tcctgcagtt gctcttgctg ctcttaaagc
     8821 agtttcatca ggcgaggatc ctatactgct tgtattagca gccgatcatg atatacaaga
     8881 ccaagagcgc tttatatcgt cgatattggc tgcaaaagaa tttgcagagg aaggtaagct
     8941 ggttactttt ggtattgtgc caaccaaacc cgaaactgga tatggctaca taaaaaccgg
     9001 agagaattta aatgaatatg gctttaaagt ttctgctttt gttgaaaaac ctgagctaga
     9061 tgtggccaaa aaatatctcg aagatggagg ttatctttgg aatagtggaa tattcatgtt
     9121 cagggcctct gtgtttattg atgagttaaa taaatttaga ccagacatac taaaaatatg
     9181 ccaacaagca ttgaagtcct ctacacaaga tcttgatttt atccgtatag ataatgactc
     9241 atttagttgt tgccctgaag aatctattga ttatgctgtt atggagaaaa caacagaggc
     9301 tgtggtagtt ccattaaatg cccactggag cgatgttggt tcttggtctg cattatggga
     9361 aattagcagc aaagataaaa gtggaaatgc aattagagga gatgtattaa ttcatgattc
     9421 ttcggatagt tatctttact cacaacatag attaattggt gtagtaggag ttaaagattt
     9481 agtagttgtt gaaactaaag atgctattct cgttgcgcat aaagataaag ttcagaaggt
     9541 aaaaaatatt gttgaacaac ttaaagttaa taaccgtgcg gaatatcagc agcatcgtga
     9601 aatatttaga ccatggggca gtcatgactc tatagcagaa gggtctcgat ttcaggttaa
     9661 acatgttgtt attcatcctg gacataaaac tgctaaacag atccattacc atcgtactga
     9721 acattggatt gttgtttccg gaacagcaaa agtccattat gaggatgaaa tatttcttgt
     9781 ttctgaaaat gaatcaactt atataccaat aggtgtaccg cattttattg agaatcctgg
     9841 aaagatccct ttggaaatta ttgaagtacg ttcaggtgtt tacttggatg aagatgatgt
     9901 tgttagaatc ttaaatgatg atggatatta atgcaacatt ataattcgta atgctgtact
     9961 gacgttattt aattatgatt attattggat gttaaaatga aagtcagtat tattacagtg
    10021 acttataata gtgaaaagac tttaaggaat actttagagt caatagagct gcaaacctat
    10081 agcgatatag agtatataat tattgatggt ggttctaccg ataatacgtt aaaaataatt
    10141 aacgaagtat caacaagagt aacaagatgt ctatcagaaa gcgataaagg tatctatgat
    10201 gctttaaata aaggtataaa tttatctacg ggagatatta tcgggttcgt tcattctgat
    10261 gacgttttag caagacctga tattattgaa actattgtag gccgtttcca tgagacaaaa
    10321 gcggatgttg tatacggtga tttggttttt ttcgaaaaaa accaaattga tataatcaaa
    10381 cgatactggc gtagtggccc ttttaaacgt tctaagctat cattaggttg ggcaccaccg
    10441 cacccatctt tctatatgag aagggaatta tataaagacg atggatattt tgatttatcc
    10501 tataggattg ctgcagacta tgatcagatg gtcagggttt tgaaacgtga tgatattaaa
    10561 gttagttatg ttcctcaagt atttgtaaag atgagattgg gaggggaaag taccagaatt
    10621 gataacgcga tatcaagtac aaaggaaatt gtagcagtta tgaaaaacca taatgtaaat
    10681 tggaaatttg ctatcattat cagaaaaata tcaaaactaa tgcaattgtt tgcgcataaa
    10741 taattttata attggtaagg tttttatatg aaaaaattaa cctgctttaa agcctatgat
    10801 attcgcggga aattaggcga agaactgaat gaagatattg cctggcgcat tggtcgcgcc
    10861 tatggcgaat ttctcaaacc gaaaaccatt gtgttaggcg gtgatgtccg cctcaccagc
    10921 gaaaccttaa aactggcgct ggcgaaaggt ttacaggatg cgggcgtcga tgtgctggat
    10981 attggcatgt ccggcactga agagatctat ttcgccacgt tccatctcgg cgtggatggc
    11041 ggcattgaag ttcccgccag ccataatccg atggattaca atggcatgaa gctggtgcgc
    11101 gaaggggctc gcccgatcag cggtgatacc ggactgcgcg acgtccagcg cctggcagaa
    11161 gccaacgact ttcctcccgt cgatgaaacc aaacgcggtc gctatcagca aatcaatctg
    11221 cgtgacgctt acgttgatca cctgttcggt tatatcaatg tcaaaaatct cacgccgctc
    11281 aagctggtga ttaactccgg gaacggcgca gcgggtccgg tggtggacgc catcgaagcc
    11341 cgctttaaag ccctcggcgc gcccgtggaa ttaatcaaag tgcacaacac gccggacggt
    11401 aatttcccca acggtattcc taacccgcta ctgccagaat gccgcgacga cacccgcaat
    11461 gcggtcatta aacacggcgc ggatatgggc attgcttttg atggcgattt tgaccgctgc
    11521 ttcctgtttg acgaaaaagg gcagtttatt gagggctact acattgtcgg cctgctggca
    11581 gaagcgttcc tcgaaaaaaa tcctggcgcg aagatcatcc acgatccacg tctctcctgg
    11641 aacaccgttg atgtggtgac tgccgcaggt ggtacgccgg taatgtcgaa aaccggacac
    11701 gcctttatta aagaacgtat gcgcaaggaa gacgccatct acggtggcga aatgagcgcc
    11761 caccactatt tccgtgattt cgcctactgc gacagcggca tgatcccgtg gctgctggtg
    11821 gctgaactgg tgtgtctgaa aggaaaaacg ctgggcgaac tggtgcgcga ccggatggca
    11881 gcatttccgg caagcggtga gatcaacagc aaactggcgc aacccgttga ggcgattaac
    11941 cgcgtcgaac agcattttag ccgtgaggcg ctggcggtgg atcgcaccga tggcatcagc
    12001 atgacctttg ccgactggcg ctttaacctg cgctcctcca acaccgaacc ggtggtgcgg
    12061 ttgaatgtgg aatcgcgcgg tgatgtgccg ctgatggaag aaaaaacaaa acttatcctt
    12121 gagttactga gtaagtaatc cagtaatttc atataaatag gttttaaaag acggaaaaga
    12181 tgagatatac agtgtggtat agccaaggta atgctattca ccatctctat tagtgagtta
    12241 acatctatac cacatttaag ccgcacactc ggcggtgagc accccctgac aggagtaaac
    12301 aatgtcaaag caacagatcg gcgtcgtcgg tatggcagtg atggggcgc
//