LOCUS       KJ778810               15817 bp    DNA     linear   BCT 29-MAR-2016
DEFINITION  Escherichia coli strain H 320a serotype O97:K-:H- O-antigen gene
            cluster, complete sequence.
ACCESSION   KJ778810
VERSION     KJ778810.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 15817)
  AUTHORS   DebRoy,C., Fratamico,P.M., Yan,X., Baranzoni,G., Liu,Y.,
            Needleman,D.S., Tebbs,R., O'Connell,C.D., Allred,A., Swimley,M.,
            Mwangi,M., Kapur,V., Raygoza Garay,J.A., Roberts,E.L. and Katani,R.
  TITLE     Comparison of O-Antigen Gene Clusters of All O-Serogroups of
            Escherichia coli and Proposal for Adopting a New Nomenclature for
            O-Typing
  JOURNAL   PLoS ONE 11 (1), E0147434 (2016)
   PUBMED   26824864
  REMARK    Publication Status: Online-Only
REFERENCE   2  (bases 1 to 15817)
  AUTHORS   Yan,X., Fratamico,P.M., Tebbs,R.S., O'Connell,C.D., Swimley,M.,
            Baranzoni,G.M., Debroy,C. and Liu,Y.
  TITLE     Direct Submission
  JOURNAL   Submitted (30-APR-2014) Molecular Characterization of Foodborne
            Pathogens Research Unit, USDA-ARS, 600 East Mermaid Lane, Wyndmoor,
            PA 19038, USA
COMMENT     ##Assembly-Data-START##
            Assembly Method       :: CLC Genomics Workbench v. 7.0
            Coverage              :: >50X
            Sequencing Technology :: IonTorrent
            ##Assembly-Data-END##
FEATURES             Location/Qualifiers
     source          1..15817
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /strain="H 320a"
                     /serotype="O97:K-:H-"
                     /db_xref="taxon:562"
     misc_feature    1..15817
                     /note="O-antigen gene cluster"
     gene            127..1215
                     /gene="rmlB"
     CDS             127..1215
                     /gene="rmlB"
                     /codon_start=1
                     /transl_table=11
                     /product="dTDP-glucose 4,6-dehydratase"
                     /protein_id="AJE24494.1"
                     /translation="MKILVTGGAGFIGSAVIRHIINNTLDAVVNIDKLTYAGNLESLV
                     DIENSERYIFEQVDICDSEAIARIFACHQPDAVMHLAAESHVDRSITGPAAFIETNII
                     GTYVLLEETRKYWLSLDEARKAAFRFHHISTDEVYGDLPHPDKQIPGTALPLFTENTP
                     YAPSSPYSSSKASSDHLVRAWRRTYGLPTIVTNCSNNYGPYHFPEKLIPLIILNALAG
                     KQLPVYGNGEQIRDWLYVEDHARALYKVVTEGTVGETYNIGGHNERKNIEVVKTICAI
                     LDEIVTAKPKGIQRFEQLITYVADRPGHDLRYAIDASKIKRELGWVPAETFESGIRKT
                     VNWYLNNDGWWKRVIDGSYAGERLGLVD"
     gene            1229..2095
                     /gene="rmlA"
     CDS             1229..2095
                     /gene="rmlA"
                     /codon_start=1
                     /transl_table=11
                     /product="glucose-1-phosphate thymidylyltransferase 2"
                     /protein_id="AJE24495.1"
                     /translation="MKGIVLAGGSGTRLYPITQGVSKQLLPVYDKPMIFYPISVLMLA
                     GIRDILIITTPEDMPSFKRLLGNGSQFGIRLSYEVQPSPDGLAQAFIIGEEFINNEPC
                     ALVLGDNIYFGQSFGKKLETAAQLTRGAMVFGYQVLDPERFGVVEFDKSFKALSIEEK
                     PLKPKSNWAVTGLYFYDSNVVEMAKQVKPSGRGELEITTLNQMYLERGELQVELLGRG
                     FAWLDTGTHDSLVEASQFIHTIEKRQGMKVACLEEVAYRKGWLSKEQVSEQATKMAKN
                     DYGRYLRMLINE"
     gene            2118..3008
                     /gene="rmlD"
     CDS             2118..3008
                     /gene="rmlD"
                     /codon_start=1
                     /transl_table=11
                     /product="dTDP-4-dehydrorhamnose reductase"
                     /protein_id="AJE24496.1"
                     /translation="MKILLIGKNGQVGWELQRSLSTLGELVAIDYFDTGMCGDLTDPE
                     GIAETIRLVRPDVVVNAAAHTAVDKAESERKLSQLLNADSVEVIARETARLGALVIHF
                     STDYVFNGEGEHYRLEDEEPAPLNVYGETKLAGEAAIIKYNPRHFIFRTSWVFATRGA
                     NFVKTMLRLAKEKETLSIINDQHGAPTSAELIADCTAIAIRVEHNNKSLHGTYHLVAS
                     GETTWYEYAKYVFSVAHQFNEILAVKEVKAVDTSAYPTPAKRPHNSRLANSKFQNAFL
                     VTLPDWKIGVQRVVTELLGK"
     gene            3026..3571
                     /gene="rmlC"
     CDS             3026..3571
                     /gene="rmlC"
                     /codon_start=1
                     /transl_table=11
                     /product="dTDP-4-dehydrorhamnose 3,5-epimerase"
                     /protein_id="AJE24497.1"
                     /translation="MNVIKTEIQDVLILEPKVFGDERGFFFESFNQHVFEEAVGKKVS
                     FVQDNHSKSKKGVLRGLHYQLAPHSQGKLVRCTMGAVFDVAVDIRIGSETFGKWVGVE
                     LSAENKRQLWIPEGFAHGFVTLTDTAEFLYKATNYYAPCAERCIIWNDSQLSIAWPEI
                     NEISLSSKDVTGLPLKDSELN"
     gene            3578..4504
                     /gene="epsE"
     CDS             3578..4504
                     /gene="epsE"
                     /codon_start=1
                     /transl_table=11
                     /product="glycosyl transferase family 2"
                     /protein_id="AJE24498.1"
                     /translation="MKHEPKIAILLCSYNGGAYIRRQLDSIISQSYSNWVLYISDDGS
                     TDETLDIVYEYKKRLGDGRVQVFSGPGQGFAWNFISLVDKVPGDFDYYAFSDQDDEWL
                     NFKLDKAVQLLITDDSIPQLYCGRTQLVDEDNCRLGLSPLFTRKPCFRNALVQSIAGG
                     NTMIFNRASKNIILKTPSNSKIISHDWWIYILVTGCGGRVIYDKQPTILYRQHQNNII
                     GANKGISARLSRLLGVIDGRYKKWIQANLDVLEEIEINFTEDNRFVLNNFIRARKSGF
                     FKRIYIFSKIKLFRQTLVGSFAFIIAIMMNKV"
     gene            4573..5334
                     /gene="glmU"
     CDS             4573..5334
                     /gene="glmU"
                     /codon_start=1
                     /transl_table=11
                     /product="bifunctional protein"
                     /protein_id="AJE24499.1"
                     /translation="MINIVIPMAGAGSRFAKAGYADPKPLIPINGTPMIKLVINNLKP
                     AVPHRFIFICQKEHSQKYDLQQKLKSWAPGSEVIEIDGLTEGAACTVLTAKDLINNED
                     ALMIANSDQYVDIDIDDYLRYQEEENLDGLIMTMTADDPKWSFVKIDVNNLVRDVVEK
                     VVISDEATVGIYNFKHGRDFIAAAELMIKNNLRVNNEFYVAPTYNQLINDYNSKIGIY
                     NIGSEANGMYGLGIPDDLNLFLSLPVCKKALEKSK"
     CDS             5331..5963
                     /codon_start=1
                     /transl_table=11
                     /product="phosphodiesterase"
                     /protein_id="AJE24500.1"
                     /translation="MKIISHRGYWKSTEEKNKEVAFTRSFALNYGTETDVRDYLGDLV
                     ISHDIADENAITLNSFLENANKYGSEDNKITLALNIKADGLASSVSIAISKFNNLDCF
                     VFDMAVPDMRSYFEHSVPVFTRCSEVESQPVWLEKSTGIWLDAFDKEWFTSDLIITLL
                     ATGKRVCIVSSELHGRDKTRLWEMLLPLRSQPNLILCTDVPEDASEYFSR"
     CDS             5974..6591
                     /codon_start=1
                     /transl_table=11
                     /product="HAD family hydrolase"
                     /protein_id="AJE24501.1"
                     /translation="MTIKAILFDMDGVLIDAKEWHYEALNKALDLFGMKISRFDHLTT
                     FDGLPTKKKLEMLSKERHLPRELHDFINEMKQQYTMEIVHTECKPQFIHEYALSRLKS
                     EGYKIAVCSNSIRNTVTTMMDKASLTGYIDLMISNEDVTHGKPDPEMYKLAMKTLGLK
                     PDECLIVEDNENGIKAAKGAGGNLLVVRDVYDTNYTNISSRIKAL"
     CDS             6617..7354
                     /codon_start=1
                     /transl_table=11
                     /product="glycosyl transferase family 2"
                     /protein_id="AJE24502.1"
                     /translation="MAVNILILAAGPTTNDQRDGGYPLCLTETDGVSLIERIVENTKN
                     IENAKYSFALLEQDIEKYHLDRIVQLLAADCIVSKIPEGTKGSACTALLASSQLNGDN
                     ELLIISANELVDLDFTDVLSEFRNKKLDGGTLIFKSIHPRYSYVSLGLDELVIEAAQQ
                     KPISQHATAGVFWFARTSDFQDAAKNLIRKNASVNERFYVAPTFNELILRQMRVGVRA
                     LKLSDYKPLKTERQVNQFENSASYEKF"
     CDS             7341..7661
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="AJE24503.1"
                     /translation="MKNFKLDDMIKGWFVGGFSPTAFATEDCEVAVKKYKCGDKEEAH
                     YHKLATEITVIISGTVKMLDKEWHQGDIIVLSPGEITSFEAITDAINVVVKLPGALND
                     KYVV"
     gene            7804..8544
                     /gene="wzm"
     CDS             7804..8544
                     /gene="wzm"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen ABC transporter permease"
                     /protein_id="AIG62858.1"
                     /translation="MLYSSLRLAIFEIQKRSLNTYAGWTWSLMNPLSQMAILYFIMTH
                     VFKSNIENILLWLISGLNCWIVIQSALLRSCQSLISRRALLQNNNISHNLLVMSDILS
                     EVIILIPFYLFAIALAIFHGVPFSNLILVPLMLLILLVFLLGLGMILATLTPILRDLP
                     YLLGIFMQIAFWLTPIAYAKSSMKGFAASIINFNPFTYFILLSQSIFMGSPVSMKLVV
                     IPAGLAIIAVSVGFMLSNAVGKKTVINL"
     gene            8541..9266
                     /gene="wzt"
     CDS             8541..9266
                     /gene="wzt"
                     /codon_start=1
                     /transl_table=11
                     /product="O-antigen export system, ATP-binding protein"
                     /protein_id="AIG62859.1"
                     /translation="MKKSVEFKNVELLVPEADRPQSLKSLLLNFRKLNSKKKTILSIP
                     HFTAHDGDKICIVGRNGNGKTTFLKVLAGIYPVTRGIIWTEKKPTVVLAAGIGLEEEL
                     SVIENINLSLIIKNVKKSDIPALAESILEFCELKDDRYKQYKHLSTGFKSRLAFAIAV
                     SEKPDILILDEVLGGGDEFFMKKANAKLIETINVSSTAFIATHAPDQMQGICNRLVMI
                     EKGQILFDGAFEEGVNFYRNSYV"
     CDS             9288..10583
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="AIG62860.1"
                     /translation="MAISVVICGLVRSQEKLLTKLQNYFDWREQGRVDEIVYSTWIGE
                     IDSYSGLRKILETKNVKMIEVEEPRLVLKGGHQLHQMLAFYYGLSALKNQDQFVLKTR
                     VDLADNHASMLHEFEFGTSEANDFAGVGIKKRILVEYAQMLYPFLCGDAQFFGHINDL
                     KKLVNLSAEMELLYNRLAVEQTFFFNPFKELALFKQHFYWNLPHISEISDRRNEQIAD
                     VITNESIVRAIQGWWFILDNYFKIGWGPTLPDTIPFTSIQDAFKYKGHDKLIGDDFSD
                     VIVNQSFVTSLIGLFTEEEANSILEDVSNNENYNMLAIPKNVFNDYQGFLKKFSDLPA
                     AKAVCCQNNRLIISGATQHFFVKDENDSASKRYHEQITALRRENEILRKTQNINFSNS
                     LIHRVLNRHLSRKTIDFLKYKCPQLTDFYARHFMRKREK"
     CDS             10585..11613
                     /codon_start=1
                     /transl_table=11
                     /product="rhamnan synthesis protein F"
                     /protein_id="AIG62861.1"
                     /translation="MRLQGYFEILRLTIQFQEYKNKTDFIINHPWRLLLLALLKIIRR
                     FHNLLNRGAMKKLIISNKPNGVYVDDSFLRIEYNNGNYEVIIENVNDVTTPVVNNIKS
                     TALQTFSSNRKVVFVHAFYHEEAIYIFNQLSMFFDYDIIISSPHADIINRAKEKFGSE
                     RVIGLITPNHGRDVLPFLICLKFINVENYSHFVKLHTKKSKHLRDKGRWFRLNVEFLI
                     GNKSVTDKIFQLMPDNAPIILGESVLEIQDHLENNVHWLAFLLAKDPSCIDSKFIPGT
                     MFLGTGSFLRLVKSLNLHRYKIEKEAGQLDGCCVHAMERYFGYLASVHGGNCDALEAF
                     VGKEEAKL"
     CDS             11610..13262
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="AIG62862.1"
                     /translation="MKKTILINGAVRDIEEFVLIIDCLLEQRKKSEEKIEIIISTWHE
                     DINKNLQLFRWIASNDIKVVGSAGIDSGGPANIFRQWRTLEAGLSIVSSDSLILKGRT
                     DKFLLRKDVIEAFVKAEGSDPALQMAIKQDKLAVEHISLSLPFMAKDMIYIGTVTAIR
                     KIMHYSVRTKYVADHIFHGIGPECFLWLESCSSDQELMQLIQKIDFRFISNELMKNNC
                     IFEYDWSQIKPQICLLYSKWYHSFDSNFTFLSDIIKCHKSPSWVINEGLYKYQTGDRE
                     DYERLRFILESVTPTSLLNCASELCFLNSTDTFTLESNSDNSYLEWKPELPFLEDIDR
                     IRNDYSREYSDIVLLRSKLIQRMLVSQNPDPKKLTQALKWNIRQRDNETLNMVYNWMM
                     SADDNIKYVSHDDRLFVLERILDSFTFIADNVAIENTIEILKDYFKKSPQLSVRVAES
                     YFRKGKLYYSLYWFWLSYKGLPGHLGVNHGLGCTLLDLGFPRLALKYLRQANAIQPQD
                     QTASFTLIRCLARCNKKSEAKILMNNLSGHLRVEAERILNAD"
     CDS             13252..14691
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="AIG62863.1"
                     /translation="MLIKMIRKKRWLKKFDGALRAAYEASNYLNHYSYQWFSENVYSL
                     ALGLDSAIDFDEEFYLSHNADIARAVKNGGLCCGYVHFCTLGKYELRVWSSKKIYEIR
                     PGGPILGAGLAEPKNIFPLPHYTPDLSALPESSEKSLVILIPFLVDDLFFAGYTSFFN
                     DMTLIFPLFSDVKVIVSNAHYNEHLLDKYGGNIQVLPFSDISLLTVKPTLVYCFDTET
                     FFQAKQVFGELKRVVYYCQDYESGFYPYGSMYARSQSAIYLSKNIVFSTGILASSIES
                     KGLLGDDVNIYITSPKIEPFSVKNVKSKKLFFYYRPEFFNSRNMPELILRTVIDFCQK
                     HTGYEIYLVGAVGTSFSQNINGTNVVILSKLAKDEYLDLISSCDAVVALIYSDHPGVI
                     AYQAAASGIPTVTNTFEIRNADFIHSISSNLVPFDPVRDSLVDKLEFALSMPKGNCDF
                     NSAMYEQRSLLSFYDFNSKIIGNDRSYTR"
     CDS             14688..15596
                     /codon_start=1
                     /transl_table=11
                     /product="methyltransferase domain protein"
                     /protein_id="AIG62864.1"
                     /translation="MKTSDNKNDFYPSAYSLRFTPARLSKAIDWHGHLSFAAWLMELV
                     RPEILVELGVFRGDSLSTFSQASRDLNIKCEITGVDSWGGDNTTGAYGEEVYSEVKDY
                     FSSSFPNTKLYRALFDEALSEFSDDSVNVLHIDGCHHYDAVKHDYETWLPKVSTENGI
                     ILFHDTNVVAHGFGSKQFWEEINSTYPSFSFNHSNGLGVLLVGKRQPNEFIALSQDER
                     FLDKVRSIYELSGNMFIHKAKEQWWKDEADKHAAYVNHLTGDVGKQIADTINHHFVNH
                     LTAHRQTGVFSNNNYAKRLVKKIFHR"
ORIGIN      
        1 gtcgttgcac acagtgtacc tggttgctgt agagctaggg gcggtagcat gtctgaaatt
       61 tgtctcgcgc acttgtctat gtttttatac gattatcaag tcaaatagta atagtggaaa
      121 attcacgtga aaatactggt tacaggtgga gcaggattta ttgggtctgc agttattcgt
      181 catattatta ataatactct ggatgctgtg gtcaatattg ataaattaac ctatgcgggt
      241 aatcttgaat ctctggtcga tattgaaaat agtgaacgat atatttttga acaagtggac
      301 atctgtgaca gcgaggcgat agctcgtatc tttgcctgcc accaacctga tgccgtgatg
      361 catcttgctg ctgagagcca tgttgaccgt tctattaccg ggccagctgc atttattgag
      421 acgaatatca ttggtacgta tgtgctcctg gaagaaactc gcaagtactg gttatctctg
      481 gatgaggcgc gtaaagctgc gttccgcttc catcatatct caaccgatga ggtgtatggc
      541 gacttgccgc acccggataa gcaaatccca ggtactgcgt tgccgttgtt taccgaaaat
      601 acaccatatg caccaagtag cccttattcg tcgtctaaag catcaagtga ccatttagtt
      661 cgtgcctggc gacggactta tgggttgcca acgatcgtga ccaactgttc taacaactac
      721 ggcccttatc attttcctga gaagttaatc ccgctaatta ttctcaatgc gcttgcgggc
      781 aaacaactgc cggtttacgg caatggcgag caaattcgtg attggctcta tgttgaggat
      841 catgcgcggg cactgtataa agttgtgacg gagggaactg tcggggaaac gtataatatt
      901 ggtggccata atgaacgtaa aaatattgaa gttgttaaaa ctatttgcgc cattcttgat
      961 gagatagtca ctgctaaacc gaaaggtatt caacgttttg aacaacttat cacctacgtt
     1021 gccgatcgcc cggggcatga tttgcgttat gcaattgatg ccagcaaaat caaacgtgaa
     1081 ttaggctggg tgcctgctga gacatttgaa tctggtatcc gtaaaacagt taactggtat
     1141 ttgaataatg acggctggtg gaaacgtgta atagatggct cctacgcggg agaacgttta
     1201 gggctggtgg attaattaag gaataatgat gaaaggtatt gtgcttgctg ggggatctgg
     1261 aactcgccta tatccgatta cgcagggggt atccaagcag ttgctgccag tttacgacaa
     1321 gccaatgatt ttctatccga tatcggttct gatgttggct ggaattcgtg atattttaat
     1381 tataacaact cccgaagata tgccttcctt taaacgtctg ttgggtaacg gatcgcagtt
     1441 tggcattcgc ctctcctatg aagtgcagcc atctccggat ggcttggccc aggcatttat
     1501 tattggtgag gagttcatca ataacgaacc gtgcgcactg gtattggggg ataatattta
     1561 tttcggtcag agctttggta aaaagctcga aaccgcagcg caattgaccc gtggggcaat
     1621 ggtttttggt tatcaggtgt tggatcctga acgttttggt gtggttgagt ttgataagag
     1681 tttcaaagcg ctttctattg aggaaaaacc gctcaaaccg aaatctaact gggcagtaac
     1741 aggactttat ttctatgaca gtaatgttgt ggaaatggca aaacaggtta aaccttctgg
     1801 aagaggtgaa ttggagatta ctacgctgaa ccaaatgtat cttgagcgcg gtgagctgca
     1861 ggtagaattg ctaggacgtg gttttgcttg gttggataca ggtactcatg acagccttgt
     1921 agaagcatcg cagtttattc ataccattga gaagcgtcag gggatgaaag ttgcatgctt
     1981 ggaagaagtc gcttaccgta aaggatggtt gagcaaagag caagtttccg agcaggcgac
     2041 gaaaatggct aaaaacgatt atggccgcta tttgcgcatg ttaatcaatg aataactcac
     2101 cataaagaaa atcttgtatg aaaattttgc tgattggaaa aaatgggcaa gttggttggg
     2161 aacttcagcg ctctctttca acattaggcg agttagttgc aatagattat ttcgatactg
     2221 gtatgtgtgg tgatctaact gatcctgagg gtattgctga gactatacgt cttgtaaggc
     2281 ctgatgttgt tgtcaatgca gcggctcata cagcagtgga taaagctgag agtgaaagaa
     2341 aactatctca attgctaaat gccgatagcg ttgaagtaat tgctcgggag accgcaagat
     2401 taggtgcctt ggttattcat ttttctactg actacgtttt caatggggag ggggaacact
     2461 atcgtcttga agatgaagag cctgctccgt tgaatgtgta cggagaaact aaattagcgg
     2521 gggaagcagc tataatcaaa tataatcctc gtcattttat tttccgcaca agttgggtct
     2581 ttgctacacg tggtgctaat tttgttaaga caatgctgcg gcttgcaaag gaaaaagaaa
     2641 ccttgtcaat catcaacgat caacatggtg cgcctactag cgcagaactt attgccgact
     2701 gcacagcaat agccatccga gttgagcata ataataaatc attgcatggt acataccatt
     2761 tagtggcaag tggagagact acttggtatg aatatgctaa atatgtattt tctgtagctc
     2821 atcagtttaa tgaaattttg gctgttaaag aggttaaggc tgtagatacc tctgcgtatc
     2881 cgacacctgc aaaaaggcca cataattctc gccttgcaaa ttcgaagttt caaaatgctt
     2941 ttttggtaac attacctgat tggaaaattg gtgtacaaag agttgttact gaactgctgg
     3001 gaaaataagc taggagagta ctaaaatgaa tgtaatcaaa acagaaattc aagatgtatt
     3061 aattttagaa cctaaagttt ttggtgatga acgtggtttc ttctttgaaa gtttcaatca
     3121 gcatgttttc gaagaggcgg ttgggaaaaa agtttctttc gtccaggata atcattcaaa
     3181 atcaaaaaaa ggggtcttga gaggacttca ttatcaattg gcaccacatt cacagggtaa
     3241 attagttcgc tgtacaatgg gggccgtatt tgatgtggca gtagatattc gaattgggtc
     3301 tgaaacattc ggcaagtggg ttggggtaga attaagtgca gagaataagc gtcaattgtg
     3361 gattcctgaa ggcttcgctc atgggtttgt cacattaact gatacggctg aatttttgta
     3421 taaagctaca aattattatg cgccatgtgc cgagcgttgc ataatctgga acgactctca
     3481 actttctatt gcatggccag aaataaatga aatttcctta tcttctaaag atgtgactgg
     3541 cctgccatta aaagattccg agctcaatta ataaaatatg aaacatgaac caaaaatagc
     3601 aatattgtta tgtagttata atggtggcgc ttatattaga cggcaacttg attcaattat
     3661 aagtcaatct tatagtaatt gggtgctgta tatatcagat gatggttcaa ccgatgagac
     3721 tttggacatt gtctacgagt acaaaaaacg cttaggtgat ggacgtgtac aggtattttc
     3781 tggtccaggg cagggatttg catggaactt tatttcactt gtcgataaag tcccgggaga
     3841 ttttgattat tatgccttta gcgatcaaga cgatgagtgg ttgaacttta aacttgataa
     3901 agcagttcaa ctcttaatta ctgatgacag tattccacag ttatattgcg ggcgtacaca
     3961 attagttgac gaggacaatt gtagattagg gctttcgcca ctttttacga gaaaaccttg
     4021 cttccggaat gcattagtac aaagcattgc tggtggcaat acaatgatat ttaatagggc
     4081 ctcaaaaaat attattttaa aaacaccgtc aaattcaaaa attatatcgc atgactggtg
     4141 gatctatata ttagtcactg gttgtggtgg tagagttata tatgataaac aaccaacaat
     4201 tctctaccgt cagcatcaaa ataatattat tggggccaac aagggtattt cagcacggct
     4261 gagtcgtttg cttggcgtta tagacggacg ctataaaaaa tggatacaag caaatcttga
     4321 tgttctagaa gaaatagaaa taaattttac ggaagataat cgattcgttt taaataattt
     4381 tatacgtgct cgtaaatctg gtttcttcaa aagaatatac atcttttcca aaattaaatt
     4441 attccgtcaa acattggttg gcagttttgc ttttataata gcaataatga tgaacaaagt
     4501 ataattattt atatggagat ggttgtctta aatgacagtc gtcccttact tttatataac
     4561 gataggtgaa aaatgattaa tattgttatt cctatggctg gcgccggaag ccgttttgcg
     4621 aaagctggtt atgctgatcc taaaccatta atacctatca atggtacgcc aatgatcaaa
     4681 ttggttataa ataatttaaa gcccgcagtc cctcatcgat ttatttttat ctgtcaaaaa
     4741 gaacattcac aaaaatatga tttgcaacaa aaattgaagt catgggctcc tggttcggaa
     4801 gttatagaaa ttgatggttt gactgaaggt gctgcatgta ccgtacttac ggcgaaagat
     4861 ttaattaata acgaagatgc tttaatgatt gctaatagcg atcaatatgt tgatatcgat
     4921 attgatgatt acttgagata ccaggaggaa gaaaatttag atggtctgat tatgactatg
     4981 actgctgatg atcctaaatg gtctttcgta aaaatagatg ttaataattt agttcgcgat
     5041 gttgttgaaa aagtcgttat ttctgatgag gcgacagtag gtatctataa tttcaaacat
     5101 ggccgtgact ttattgctgc cgctgagttg atgattaaga ataatcttcg ggtaaacaac
     5161 gagttttatg ttgcaccaac atataatcaa ttaattaatg attataactc caagattgga
     5221 atctataata ttggctctga agctaatggt atgtatgggc ttggaattcc tgatgattta
     5281 aatttatttt tatcgctacc tgtatgcaaa aaagcattgg agaaaagtaa atgaaaatta
     5341 tttcccatag aggttattgg aaaagtacgg aagagaaaaa taaagaggta gcatttactc
     5401 gttcttttgc tctaaattat ggtacggaaa cagatgttcg tgattacctt ggggatttag
     5461 tcatttcgca tgatattgct gatgaaaatg caataacttt aaattcattt cttgaaaatg
     5521 cgaacaaata tggttcagaa gataataaaa tcacattagc tcttaatata aaagcggatg
     5581 gtctggcaag tagcgtctca atagcaatta gcaaatttaa taatctcgac tgctttgtat
     5641 ttgatatggc agtgccagat atgcgaagct actttgaaca ctcggtacca gtcttcactc
     5701 ggtgtagcga ggttgaatca caacctgtat ggctcgaaaa atctactggc atttggttag
     5761 acgctttcga taaggaatgg tttacctctg accttatcat tacgttatta gcgactggta
     5821 agcgggtatg tatcgtctca tcagagttac atgggcgtga taaaaccaga ttgtgggaaa
     5881 tgctgttacc tttaagatca caacccaatt tgattctttg cacagatgtt cctgaagacg
     5941 caagtgagta tttttcgcga taatgaggcg agtatgacta ttaaagcaat tttatttgat
     6001 atggatggtg tgcttatcga tgctaaagaa tggcattatg aagctttaaa taaagcactt
     6061 gatttgtttg gaatgaaaat atcccgtttt gaccatctaa caacttttga tggattgcct
     6121 accaaaaaaa aattagaaat gcttagtaaa gagagacatt taccgaggga gttgcatgat
     6181 tttattaatg agatgaaaca acagtataca atggaaattg ttcatactga atgtaaacct
     6241 caatttattc atgaatatgc tctttctaga cttaaatcag aaggttataa gatcgccgta
     6301 tgttctaatt ctatcagaaa tacagtgaca acaatgatgg ataaggcatc tttaactggt
     6361 tatattgatt taatgatttc gaatgaggac gtaactcatg gtaaaccaga tcctgaaatg
     6421 tataagctgg ctatgaaaac cctaggtctg aaacctgatg agtgtctcat tgttgaagat
     6481 aatgaaaacg gtatcaaagc agccaaagga gcaggtggta acttactagt tgtccgtgat
     6541 gtgtatgata caaactatac aaacatctct tcgcggataa aggcgttgta atccgattct
     6601 gattaggaga aatatcatgg cggttaatat acttattctt gctgcgggtc caacaactaa
     6661 cgatcagcgg gatggcgggt atcctctgtg tttgacagaa acagatggcg tatctttaat
     6721 tgagaggata gttgaaaata ctaagaacat tgagaatgca aaatatagtt ttgcattact
     6781 agaacaggat atagaaaaat atcatttgga tcgtattgtc caattactcg ctgcagactg
     6841 tattgtgtcg aaaattccgg agggaactaa aggatctgct tgtacagcat tattagcatc
     6901 gagccaattg aatggtgata acgaactact aatcatcagt gcgaacgaac ttgttgatct
     6961 tgattttact gatgtactca gcgaatttag aaataagaag cttgacggag ggactcttat
     7021 atttaaatca atacatcctc gctattcata tgtctcctta ggcttggatg agcttgtgat
     7081 tgaagctgcg cagcaaaaac cgattagtca gcacgcgacc gctggtgttt tttggtttgc
     7141 acgtacttct gattttcaag atgctgctaa aaatcttatc aggaaaaatg caagtgtaaa
     7201 tgaacgattt tatgttgcac caacatttaa tgaactgatt cttcgtcaga tgcgtgtagg
     7261 agttcgtgca ttaaagctta gcgattacaa gcccctcaaa actgaaagac aagttaacca
     7321 attcgaaaat agtgcttctt atgaaaaatt ttaaacttga tgatatgatt aaaggatggt
     7381 ttgtaggtgg tttttcacca acagcctttg ctactgaaga ctgtgaagtt gcagttaaga
     7441 aatacaaatg tggtgataaa gaagaagctc attatcataa gctagctact gaaattactg
     7501 taataatcag cggtactgtt aagatgttag ataaagaatg gcatcaagga gatattattg
     7561 tattgtctcc tggtgagatt acttcttttg aggcaattac tgacgctatt aatgtagtag
     7621 tgaaattacc tggtgcattg aacgataaat acgtagttta attttattat ctatttgtca
     7681 agttagcttt ctttatatta aaaagaaagt tcctatcgct gcattttaaa ttaaatgtgc
     7741 acactgtaat tggtaaagag atatcgtttg taaatatgat atcaattgct aaggtattag
     7801 ataatgttat atagtagttt gcggcttgcg atatttgaga tacaaaaaag atctctgaac
     7861 acttatgctg gttggacttg gagtctaatg aatccattat cgcaaatggc cattttgtat
     7921 tttattatga cgcatgtttt caaaagtaat atcgaaaaca ttttgctttg gctcataagt
     7981 ggacttaact gttggatcgt tattcagagt gctctattga gaagttgtca gagccttatc
     8041 tccagaagag cacttttgca aaataataat atatcacata atcttcttgt tatgtccgat
     8101 attctctcag aagttattat tttaattcct ttttacttat tcgcaatagc attagcaatt
     8161 tttcatggtg taccattctc taatctaatc ttagttccct taatgcttct aattttgctc
     8221 gtattccttt tgggtttagg aatgatactt gcaacattaa ctcctatatt acgtgattta
     8281 ccttacctac tgggaatctt catgcagata gcattttggt taacaccaat tgcttatgct
     8341 aaatcctcaa tgaaaggttt tgcagcatca attattaatt tcaatccttt tacctatttt
     8401 attcttctat cgcaatccat tttcatgggc agcccggtct caatgaaatt ggtcgttata
     8461 ccagctggcc tagctattat cgccgtttca gtcggtttta tgctttcaaa tgcagtaggt
     8521 aaaaagacgg taattaattt atgaaaaaat ctgttgaatt taaaaacgtt gaattacttg
     8581 tacccgaggc agatcgtcca cagtcactta aaagcttgtt acttaatttc agaaaactga
     8641 atagcaagaa aaaaacgatt ttatcaatac cacatttcac tgcccatgat ggcgataaaa
     8701 tttgtatcgt agggcgtaat ggtaatggta aaacaacttt cttgaaggtc ttggctggca
     8761 tttatcctgt gacgagagga attatttgga ctgaaaaaaa accgacggta gttttagccg
     8821 cggggatagg tctcgaggaa gaactgagtg tcattgaaaa tatcaaccta tcactgataa
     8881 ttaaaaatgt gaagaaatct gatattcctg ctcttgctga atcgatatta gaattttgtg
     8941 agctaaaaga tgatcgctat aagcaatata agcacttatc gactggtttt aaaagtcgat
     9001 tagcatttgc cattgcagtg agtgagaaac ctgatattct cattcttgat gaagtattag
     9061 gcgggggaga tgagtttttc atgaagaagg ctaatgcaaa gctaatagaa acaattaatg
     9121 tgtcttccac tgcatttatt gccactcatg caccagacca aatgcaaggg atttgtaatc
     9181 gtttggtcat gatcgaaaaa ggacaaattc tctttgatgg cgcttttgaa gagggcgtta
     9241 atttttatag aaatagttac gtataaatat aaatggaata aataaccatg gccatttctg
     9301 ttgttatctg cggcttagta agaagccagg aaaaattact tactaaactt caaaattatt
     9361 tcgactggcg cgaacaaggt agagttgatg agattgtcta ttctacttgg attggcgaaa
     9421 ttgatagtta ttcaggcctt agaaaaattc ttgagaccaa aaatgttaag atgatagaag
     9481 ttgaagaacc acgcttagtt cttaaaggtg gacatcaact tcaccaaatg ctggctttct
     9541 attacggttt aagcgcatta aagaatcaag atcagtttgt tttaaaaact cgagtagacc
     9601 ttgctgataa tcatgcctcg atgttgcatg agtttgaatt tggcacatct gaagcaaacg
     9661 actttgcagg tgtaggtatt aaaaaaagaa ttcttgttga atatgcgcag atgctttatc
     9721 catttttatg tggtgatgca caattttttg ggcatattaa tgatctcaaa aaactggtta
     9781 acttgtcagc tgaaatggag ttgctttata atcgtttagc agtggagcaa actttctttt
     9841 ttaacccatt taaagaatta gctctgttca aacaacattt ctattggaat ctgccacata
     9901 ttagtgaaat ttctgatcgc cgcaatgaac aaattgcaga tgttatcact aacgaaagta
     9961 tagttcgggc gattcaagga tggtggttta ttcttgataa ttacttcaag attggttggg
    10021 ggccaacact acccgacact atcccgttca catctataca ggatgcgttt aagtataaag
    10081 gccatgataa gcttattggt gatgatttca gcgatgtgat tgttaaccaa agctttgtga
    10141 cttctttgat tggtcttttt acggaagaag aagctaactc aatattagag gacgtaagca
    10201 ataatgaaaa ctacaacatg cttgctatcc caaaaaatgt ttttaatgat tatcaaggat
    10261 tcctgaaaaa gttcagtgat ctccctgcag cgaaggccgt gtgttgtcaa aataataggc
    10321 tcattatttc tggtgctacg caacatttct ttgtaaaaga tgaaaatgac tctgccagta
    10381 agcgttatca tgaacaaatt acagcattac gtcgtgaaaa cgagattcta aggaaaacac
    10441 aaaatatcaa tttcagtaac tcactcatac accgggtact taatagacat ctatcgcgta
    10501 aaacaattga ttttcttaag tataagtgtc ctcagttaac tgacttttat gcccgtcatt
    10561 tcatgaggaa gagagaaaaa taatatgcgt cttcaagggt attttgaaat attacgattg
    10621 actattcaat ttcaggaata taaaaataaa acggacttta ttattaatca tccgtggcga
    10681 ttattgctgc tcgcacttct taaaattatt agacgttttc ataacctcct aaatagaggt
    10741 gcgatgaaga agttgatcat ttcaaataaa cctaacgggg tctatgttga tgattctttt
    10801 cttcgtattg aatacaataa tgggaactat gaagttatta tagaaaatgt aaatgacgtc
    10861 acaactcctg tggtcaataa tattaaatcc acagcgttgc aaacattttc tagtaatagg
    10921 aaagtcgttt ttgttcatgc tttctatcat gaagaagcta tatatatttt taatcagctt
    10981 tcaatgttct tcgactatga tattattatt tcatcaccac atgctgatat tattaatcgc
    11041 gcaaaagaaa aatttggctc tgaacgagta attggactta taactcctaa tcatggccga
    11101 gatgttttac cttttctaat ttgtttaaag tttattaatg tagaaaatta tagccacttc
    11161 gttaagttac ataccaaaaa atccaagcat cttagagaca agggacgttg gtttagactt
    11221 aacgttgaat ttttaattgg taataaaagt gtcactgata aaatctttca gttaatgcct
    11281 gataatgccc ctataattct tggtgaatca gtattggaaa ttcaggacca tcttgaaaat
    11341 aatgttcatt ggctagcatt tttattagct aaagatccct cctgcattga tagcaaattt
    11401 attcctggaa ctatgttcct tggcactgga agttttttac gtcttgttaa atctttaaac
    11461 ttacatcgtt acaagataga gaaagaggca gggcaacttg atggatgctg tgtgcatgcc
    11521 atggaaagat atttcggcta tttagcgagt gtgcatggtg gaaattgcga tgcgcttgag
    11581 gcctttgtgg ggaaagaaga ggcgaaacta tgaaaaaaac aattttaatt aatggtgcgg
    11641 tgcgcgacat tgaagagttt gttttaataa ttgattgtct cctggaacaa aggaaaaaaa
    11701 gcgaagaaaa aatcgaaatc atcatttcta cttggcatga agatatcaat aaaaatttac
    11761 aacttttccg atggattgcg tcgaatgata ttaaagttgt tgggagcgca ggcattgatt
    11821 ctggaggacc tgctaacata tttcgccagt ggcgtacact tgaagctggc ttaagcattg
    11881 tctcatcgga ttctttgatt cttaaaggac gtactgataa atttttatta cgtaaagatg
    11941 taatcgaagc ttttgtcaaa gcagaaggaa gtgatcccgc tttgcaaatg gcaataaaac
    12001 aagataaact ggctgtagag catatttctt taagtcttcc gttcatggct aaagatatga
    12061 tctatatagg gacagtaaca gcgatcagaa aaatcatgca ctattcggta agaacaaagt
    12121 atgtcgctga ccatatattt catggaattg gtcctgaatg tttcctttgg cttgaatcat
    12181 gtagttctga ccaggagtta atgcagttaa tacaaaaaat tgactttcgg tttatctcta
    12241 atgaattaat gaaaaataat tgtatatttg agtatgattg gtctcaaatc aaaccacaga
    12301 tttgcctgct ttattcaaaa tggtatcatt cgtttgatag taattttaca tttttgtcag
    12361 atataattaa atgccacaaa tctccttctt gggtaataaa cgaaggtcta tataagtatc
    12421 agactgggga tcgtgaggat tatgaacggc tgcgctttat tcttgaaagt gttacgccga
    12481 catcgcttct taattgtgct tctgagctat gctttttaaa ttctactgac acctttaccc
    12541 ttgaaagtaa tagtgataac tcttatctgg agtggaaacc tgaattacct ttcttggaag
    12601 atattgatag aataagaaat gactattctc gggaatattc tgatatcgtc ttgctaagaa
    12661 gcaaattgat tcagagaatg ctagtgtcac agaatccaga tcctaaaaaa ctaactcaag
    12721 cccttaaatg gaatattagg cagcgtgaca atgagacttt aaatatggtc tataactgga
    12781 tgatgtctgc agacgataat ataaagtatg tatcacacga tgaccgtctt tttgttcttg
    12841 aaagaatatt ggattctttt acatttattg ctgacaatgt cgctattgaa aacacgatag
    12901 aaatattaaa ggattatttt aaaaagtctc ctcaactttc cgttcgtgtt gctgagagtt
    12961 attttagaaa gggtaagtta tattattcat tatactggtt ctggctgagt tataaaggct
    13021 tgcctggtca tttgggtgtc aatcatggtt taggctgcac actacttgat ttaggctttc
    13081 ctagacttgc cttaaaatac ttgcgtcaag ctaatgcaat tcaaccgcaa gaccaaactg
    13141 cttctttcac acttattcgc tgcttggcta gatgtaataa gaaatcagaa gcaaaaatat
    13201 taatgaataa tctttccggt catttacggg ttgaagcaga gaggatcctc aatgctgatt
    13261 aaaatgataa gaaaaaagag atggttaaaa aaattcgatg gtgctttacg tgctgcttat
    13321 gaggcttcga attatttaaa ccactattct taccaatggt tttccgaaaa tgtatattcg
    13381 ttggcactgg gccttgactc agcaatagat tttgatgagg aattttatct tagtcacaat
    13441 gctgatatcg ctcgcgcagt aaaaaatggt ggcctttgtt gtggttacgt acatttttgc
    13501 acccttggaa aatatgagtt aagggtatgg agttccaaaa aaatatatga gattagacca
    13561 ggtggtccta tattaggtgc cggtttggca gagcctaaaa atatttttcc attacctcac
    13621 tatacacctg atcttagtgc actgcctgag tcatcagaga aatctctagt cattctcatt
    13681 ccttttttag ttgacgacct tttcttcgct ggttatacga gtttctttaa tgatatgact
    13741 cttattttcc ctcttttttc tgacgttaaa gtcatagtga gtaatgctca ttataatgag
    13801 catttacttg ataaatatgg gggtaacatt caggtccttc ctttctctga tatttcactg
    13861 ttaacagtga aaccaacttt ggtatattgc ttcgatacag agaccttctt ccaggcaaag
    13921 caggtgttcg gtgagcttaa gagagtggtt tattattgtc aggattatga atccggattt
    13981 tatccatacg ggtcaatgta tgccagaagt cagtccgcta tctatttaag taaaaacatt
    14041 gttttttcga ctggtatact tgcaagttct atcgagagta aaggattgct tggagatgat
    14101 gtaaatattt atataacgtc tccaaaaata gaaccttttt cggttaaaaa tgttaagagt
    14161 aagaagcttt ttttctatta tcgacctgag tttttcaata gtagaaatat gccggagttg
    14221 atattacgaa cagttattga tttttgccaa aagcatactg gatatgaaat ttatcttgtt
    14281 ggtgctgtcg gtacatcatt ctcgcaaaat atcaacggaa ctaatgttgt tattcttagt
    14341 aaactagcca aagatgagta tcttgattta atttcatcat gtgatgctgt agttgcgctg
    14401 atatattcag accatcccgg tgttattgcg tatcaagctg ccgcctcagg aatcccgaca
    14461 gtaacaaaca catttgaaat tcgtaatgct gattttattc attcaatatc ctctaatttg
    14521 gtgccttttg accctgtcag agattcattg gtcgataaat tagagtttgc tctttcgatg
    14581 ccgaaaggaa actgtgattt taattcggcg atgtacgagc aaaggagtct attaagcttt
    14641 tatgacttca attcaaaaat tataggaaat gacaggagct atactagatg aaaacatctg
    14701 ataataaaaa tgatttctat ccctctgctt acagtttacg ttttacaccg gcacgtctca
    14761 gtaaagctat tgactggcat gggcatctat catttgctgc atggctcatg gaactcgtcc
    14821 gccctgaaat attagttgag ttaggtgtgt ttcgcggaga tagtctatcg actttctctc
    14881 aggcatcccg agatctgaat attaaatgtg agattactgg tgttgactct tggggagggg
    14941 ataacacaac tggagcttat ggcgaagaag tctattccga ggttaaagat tatttctcat
    15001 catcttttcc taatacaaaa ttgtatcgtg cattgttcga tgaggcttta tctgaatttt
    15061 ctgatgattc tgttaatgtt ctgcacattg atggttgcca tcactatgac gcggtaaagc
    15121 atgattacga gacttggctc ccgaaagtct caactgagaa tggtattatt ctatttcatg
    15181 ataccaatgt tgttgctcat gggtttggtt ctaagcaatt ttgggaagaa attaatagca
    15241 cctatccttc ctttagtttc aatcattcta atggattagg tgttctttta gtcggcaaaa
    15301 gacagcctaa tgagttcatt gcactgtctc aggatgaaag attccttgac aaagttaggt
    15361 ctatttatga attatcaggt aatatgttta ttcataaggc taaagaacaa tggtggaaag
    15421 atgaagcaga taaacatgct gcatatgtta atcatttaac aggtgatgtt gggaaacaaa
    15481 tcgctgatac gataaatcat cattttgtta accaccttac tgctcatcga caaactggtg
    15541 tattctcaaa taataattat gcaaaacggt tggtgaaaaa aatatttcac agataaccat
    15601 aaggtattaa tggcatttta ttgattatct gtgttgcttt agtattgact aatgtgtgtt
    15661 ttgttttttt acttacttta gacttttata tgtaaaaact tggaggggat aataatataa
    15721 aaaccctcca gaatgtttta tcatgagtgt tgttcacacc tgacaggagt acataatgtc
    15781 caagcaacaa atcggcgtag tcggtatggc tgtgatg
//