LOCUS       AY568960               14433 bp    DNA     linear   BCT 26-JUL-2016
DEFINITION  Escherichia coli serotype O4:K3:H5 GalF (galF) gene, partial cds;
            RmlB (rmlB), RmlD (rmlD), RmlA (rmlA), RmlC (rmlC), Wzx (wzx), WbuG
            (wbuG), Wzy (wzy), WbuH (wbuH), FnlA (fnlA), FnlB (fnlB), FnlC
            (fnlC), WbuB (wbuB), and WbuC (wbuC) genes, complete cds; and Gnd
            (gnd) gene, partial cds.
ACCESSION   AY568960
VERSION     AY568960.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 14433)
  AUTHORS   D'Souza,J.M., Samuel,G.N. and Reeves,P.R.
  TITLE     Evolutionary origins and sequence of the Escherichia coli O4
            O-antigen gene cluster
  JOURNAL   FEMS Microbiol. Lett. 244 (1), 27-32 (2005)
   PUBMED   15727817
REFERENCE   2  (bases 1 to 14433)
  AUTHORS   D'Souza,J.M., Samuel,G.N. and Reeves,P.R.
  TITLE     Direct Submission
  JOURNAL   Submitted (08-MAR-2004) School of Molecular and Microbial
            Biosciences, University of Sydney, Sydney, NSW 2006, Australia
FEATURES             Location/Qualifiers
     source          1..14433
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /serotype="O4:K3:H5"
                     /db_xref="taxon:562"
     gene            <1..781
                     /gene="galF"
     CDS             <1..781
                     /gene="galF"
                     /codon_start=2
                     /transl_table=11
                     /product="GalF"
                     /protein_id="AAT85646.1"
                     /translation="NSLVIIVAAGIKEILLVTHASKNAVENHFDTSYELESLLEQRVK
                     RQLLAEVQSICPPGVTIMNVRQGEPLGLGHSILCARPAIGDNPFVVVLPDVVIDDASA
                     DPLRYNLAAMIARFNETGRSQVLAKRMPGDLSEYSVIQTKEPLDREGKVSRIVEFIEK
                     PDQPQTLDSDIMAVGRYVLSADIWPELERTQPGAWGRIQLTDAIAELAKKQSVDAMLM
                     TGDSYDCGKKMGYMQAFVKYGLRNLKEGAKFRKGIEKLLSE"
     gene            1154..2239
                     /gene="rmlB"
     CDS             1154..2239
                     /gene="rmlB"
                     /codon_start=1
                     /transl_table=11
                     /product="RmlB"
                     /protein_id="AAT85647.1"
                     /translation="MKILVTGGAGFIGSAVVRHIINNTQDSVVNVDKLTYAGNLESLA
                     DVSDSERYVFEHADICDAAAMARIFAQHQPDAVMHLAAESHVDRSITGPAAFIETNIV
                     GTYVLLEAARNYWSALDSDKKNSFRFHHISTDEVYGDLPHPDEVNNTEELPLFTETTA
                     YAPSSPYSASKASSDHLVRAWKRTYGLPTIVTNCSNNYGPYHFPEKLIPLVILNALEG
                     KALPIYGKGDQIRDWLYVEDHARALYTVVTEGKAGETYNIGGHNEKKNIDVVLTICDL
                     LDEIVPKEKSYREQITYVADRPGHDRRYAIDAENIGRELGWKPQETFESGIRKTVEWY
                     LSNTKWVDNVKSGAYQSWIEENYEGRQ"
     gene            2239..3138
                     /gene="rmlD"
     CDS             2239..3138
                     /gene="rmlD"
                     /codon_start=1
                     /transl_table=11
                     /product="RmlD"
                     /protein_id="AAT85648.1"
                     /translation="MNILLFGKTGQVGWELQRALAPLGNLIALDVHSTDYCGDFSNPE
                     GVAETVKKIRPDVIVNVAAHTAVDKAESEPEFAQLLNATSVEAIAKAANEVGAWVIHY
                     STDYVFPGNGDMPWLETDVTAPLNVYGKTKLAGERALQEHCAKHLIFRTSWVYAGKGN
                     NFAKTMLRQAKEREELAVINDQFGAPTGAELLADCTAHAIRVALKKPEVAGLYHLVAN
                     GTTTWHDYAALVFEEARKAGIDLALNKLNAVPTTAYPTPARRPHNSRLNTEKFQQNFA
                     LVLPDWQVGVKRMLNELFTTTAI"
     gene            3197..4075
                     /gene="rmlA"
     CDS             3197..4075
                     /gene="rmlA"
                     /codon_start=1
                     /transl_table=11
                     /product="RmlA"
                     /protein_id="AAT85649.1"
                     /translation="MKTRKGIILAGGSGTRLYPVTMAVSKQLLPIYDKPMIYYPLSTL
                     MLAGIRDILIISTPQDTPRFQQLLGDGSQWGLNLQYKVQPSPDGLAQAFIIGEDFVGG
                     DDCALVLGDNIFYGHDLPKLMEAAVNKEIGATVFAYHVNDPERYGVVEFDNNGTAISL
                     EEKPLEPKSNYAVTGLYFYDNDVVEMAKNLKPSARGELEITDINRIYMEQGRLSVAMM
                     GRGYAWLDTGTHQSLIEASNFIATIEERQGLKVSCPEEIAYRKGFIDAEQVKVLAEPL
                     KKNDYGQYLLKMIKGY"
     gene            4080..4544
                     /gene="rmlC"
     CDS             4080..4544
                     /gene="rmlC"
                     /codon_start=1
                     /transl_table=11
                     /product="RmlC"
                     /protein_id="AAT85650.1"
                     /translation="MNVIKTEIPDVLIFEPKVFGDERGFFFESFNQKVFEEAAGRKVE
                     FVQDNHSKSKINVLRGMHYQLTQNTQGKLVRVISGSVYDVAVDLREKSKTFGKWVGVE
                     LSGNNKRQLWIPEGFAHGFYVLEENTEFVYKCTDTYNPAHEHTLLWNDPTTI"
     gene            4642..5880
                     /gene="wzx"
     CDS             4642..5880
                     /gene="wzx"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzx"
                     /protein_id="AAT85651.1"
                     /translation="MSLIRNSFYNIAGFAVPTLVAVPALGILARLLGPENFGLFTLAF
                     ALIGYASIFDAGISRAVIREIALYRESEKEQIQIISTASVIVLFLGVVAALLLYFSSN
                     KVVELLNVSSVYIETAVRAFSVISFIIPVYLINQIWLGYLEGLEKFANINVQRMISST
                     SLAILPVIFCYYNPSLLYAMYGLVVGRVISFLISAIICRDIILKSKLYFNVATCNRLI
                     SFGGWITVSNIISPIMAYFDRFIISHIMGASRIAFYTAPSEGVSRLINIPYALARALF
                     PKLAYSNNDDERKKLQLQSYAIISIVCLPIVVIGVIFASFIMTTWMGPDYALEAATIM
                     KILLAGFFFNSLAQIPYAYLQSIGKSKITAFVHLIELAPYLLLLYYFTMHFGIIGTAI
                     AWSLRTFCDFVILLSISRRK"
     gene            5877..6779
                     /gene="wbuG"
     CDS             5877..6779
                     /gene="wbuG"
                     /codon_start=1
                     /transl_table=11
                     /product="WbuG"
                     /protein_id="AAT85652.1"
                     /translation="MIAVDIALATYNGANFIRQQIESIQKQTYRNWRLIISDDNSSDD
                     TVDIIKDMMSNDSRIYLVGNKRQGGVIQNFNYALSQTTSEIVLLCDQDDIWPEERLEI
                     LIDKFKALQRNDFVPAMMFTDLKLVDENNCLIAESFYRTNNINPQDNLKNNNLLWRST
                     VYGCTCIMNKKLVDIALPIPTYAHMHDQWLALLAKQYGNIFYFDYASVRYRQHSTNVV
                     GGRNKTPFQKFNSIQKNLKRINLLVDRTVALIKSNNDFYPGNKMENKIDYLKFGVNEV
                     LPYLFKGNKKVFSLCVLISLALQK"
     gene            6776..7963
                     /gene="wzy"
     CDS             6776..7963
                     /gene="wzy"
                     /codon_start=1
                     /transl_table=11
                     /product="Wzy"
                     /protein_id="AAT85653.1"
                     /translation="MIYLLFFFALFMICTFLTHRRQALYVVSALVFLFLALTYPSGGD
                     WIGYFLHYDCMVNEQCNNGFIMFEPGYELIVSLFGYLGFQTIIIFIAAVNVILILNFA
                     KHFENGSFVIVAIMCMFLWSVYVEAIRQALALSIVIFGIHSLFLGRKRKFITLVLFAS
                     TFHITALICFLLMTPLFSKKLSKIISYSLLIFSSFFFAFSETILSALLAILPEGSIAS
                     EKLSFYLATEQYRPQLSIGSGTILDIILIFLICVSFKRIKKYMLANYNAANEILLIGC
                     CLYISFGIFIGKMMPVMTRIGWYGFPFVIVLLYINLGYSEYFKRYINKRGCGYSKLLI
                     AFYFLLQILRPLTYDYSYYNIMHQDTLLNRFDALDDASLRQSAKRKCFDLGKIGYGFL
                     CSI"
     gene            8076..9179
                     /gene="wbuH"
     CDS             8076..9179
                     /gene="wbuH"
                     /codon_start=1
                     /transl_table=11
                     /product="WbuH"
                     /protein_id="AAT85654.1"
                     /translation="MFDLSKNYIIVSATALASGGALTILKQFIKHASQNSNDYIMFVS
                     AGLELPVCDNIIYIENTPKGWLKRIYWDWFGCRKFISEHKINVKKVISLQNSSLNVPY
                     EQIIYLHQPIPFSKVDSFLKNITSDNVKLFLYKKFYSYFIFKYVNANTTIVVQTNWMK
                     KGVLEQCDKISTERVLVIKPDIKAFNNTNFDVDMDVSAKTLLYPATPLTYKNHLVILK
                     ALVILKKKYFIDDLKFQVTFEKNRYKNFDKFVQLNNLSKNVDYLGVLSYSNLQKKYMA
                     ASLIVFPSYIESYGLPLIEAASLGKKIISSDLPYARDVLKDYSGVDFVIYNNEDGWAK
                     ALFNVLNGNSKLNFRPYEKDSRSSWPQFFSILK"
     gene            9188..10222
                     /gene="fnlA"
     CDS             9188..10222
                     /gene="fnlA"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlA"
                     /protein_id="AAT85655.1"
                     /translation="MFNGKILLITGGTGSFGNAVLRRFLDTDIKEIRIFSRDEKKQDD
                     MRKKYNNPKLKFYIGDVRDYSSILNASRGVDFIYHAAALKQVPSCEFHPMEAVKTNVL
                     GTENVLEAAIANGVRRIVCLSTDKAVYPINAMGISKAMMEKVMVAKSRNVDCSKTVIC
                     GTRYGNVMASRGSVIPLFVDLIKSGRPMTITDPNMTRFMMTLEDAVDLVLYPFEHGNN
                     GDIFVQKAPAATIETLAIALKELLNVNHPLLNIIGTRHGEKLYEALLTREEMIAAKDM
                     GEYYRVPPDFRRLNYGKKWNHGDRRISEVEDYNPHNTDRLDVEGMKKLLLKLPFIRAL
                     RSGEDYELDS"
     gene            10206..11330
                     /gene="fnlB"
     CDS             10206..11330
                     /gene="fnlB"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlB"
                     /protein_id="AAT85656.1"
                     /translation="MSWIHNMKILVTGAAGFIGRNLVFRLKEAGYNELITIDRNSSLA
                     DLEQGLKQADFIFHLAGVNRPVKECEFEEGNSNLTQQIVDILKKNNKNTPIMLSSSIQ
                     AECDNAYGKSKAAAEKIIQQYGETTNAKYYIYRLPNVFGKWCRPNYNSFIATFCHRIA
                     NDEAITINDPSAVVNLVYMVDLQAAANSLLEGANETGYRTFGPIYSVTVGEVAQLIYR
                     FKESRQTLITEDVGNGFTRALYSTWLSYLSPEQFAYTVPSYSDDRGVFCEVLKTKNAG
                     QFSFFTAHPGITRGGHYHHSKNEKFIVIRGSACFKFENIVTSERYEPNVSSDDFKIVE
                     TVPGWTHNITNNGSDELVVMLWANEIFNRSEPDTIARVLS"
     gene            11345..12457
                     /gene="fnlC"
     CDS             11345..12457
                     /gene="fnlC"
                     /codon_start=1
                     /transl_table=11
                     /product="FnlC"
                     /protein_id="AAT85657.1"
                     /translation="MSVVGTRPEIIRLSRVLAKLDEYCDHLIVHTGQNYDYELNEVFF
                     KDLGVRKPDYFLNAAGKNAAETIGQVIIKVDEVLEQEKPEAMLVLGDTNSCISAIPAK
                     RRRIPIFHMEAGNRCFDQRVPEETNRKIVDHTADINMTYSDIAREYLLAEGVPADRII
                     KTGSPMFEVLTHYMPQIDGSDVLSRLNLTPGNFFVVSAHREENVDTPKQLVKLANILN
                     TVAEKYDVPVVVSTHPRTRNRINENGIQFHKNILLLKPLGFHDYNHLQKNARAVLSDS
                     GTITEESSIMNFPALNIREAHERPEGFEEGAVMMVGLESDRVLQALEIIATQPRGEVR
                     LLRQVSDYSMPNVSDKVLRIIHSYTDYVKRVVWKQY"
     gene            12457..13665
                     /gene="wbuB"
     CDS             12457..13665
                     /gene="wbuB"
                     /codon_start=1
                     /transl_table=11
                     /product="WbuB"
                     /protein_id="AAT85658.1"
                     /translation="MKLALIIDDYLPHSTRVGAKMFHELGLELLSRGHDVTVITPDIS
                     LQAIYSISMIDGIKVWRFKSGPLKDVGKAKRAINETLLSFRAWRAFKHLIQHDTFDGI
                     VYYSPSIFWGDLVKKIKQRCQCPSYLILRDMFPQWVIDAGMLKAGSPIEKYFRYFEKK
                     SYQQAGRIGVMSDKNLEIFRQTNKGYPCEVLRNWASMTPVSASDDYHSLRQKYDLKDK
                     VIFFYGGNIGHAQDMANLMRLARNMMRYHDAHFLFIGQGDEVELIKSLAAEWNLTNFT
                     HLPSVNQEEFKLILSEVDVGLFSLSSRHSSHNFPGKLLGYMVQSIPILGSVNGGNDLM
                     DVINKHRAGFIHVNGEDDKLFESAQLLLSDSVLRKQLGQNANVLLKSQFSVESAAHTI
                     EVRLEAGECV"
     gene            13656..14063
                     /gene="wbuC"
     CDS             13656..14063
                     /gene="wbuC"
                     /codon_start=1
                     /transl_table=11
                     /product="WbuC"
                     /protein_id="AAT85659.1"
                     /translation="MRLVDDNILDELFRTAANSERLRAHYLLHASHQEKVQRLLIAFV
                     RDSYVEPHWHELPHQWEMFVVMQGQLEVCLYEQNGEIQKQFVVGDGTGISVVEFSPGD
                     IHSVKCLSPKALMLEIKEGPFDPLKAKAFSKWL"
     gene            14175..>14433
                     /gene="gnd"
     CDS             14175..>14433
                     /gene="gnd"
                     /codon_start=1
                     /transl_table=11
                     /product="Gnd"
                     /protein_id="AAT85660.1"
                     /translation="MSKQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIA
                     ENPGKKLVPYYTVKEFVESLETPRRILLMVKAGAGTDAAIAS"
ORIGIN      
        1 gaattcacta gtgattattg tggctgcagg gatcaaagaa atcctcctgg taactcatgc
       61 gtccaagaac gcagtcgaaa accacttcga cacctcttat gaattagaat ctctccttga
      121 gcagcgcgtg aagcgtcaac tgcttgcgga agtacagtcc atttgcccgc cgggcgtgac
      181 aattatgaac gtgcgtcagg gcgaaccttt aggtttgggc cactccattt tatgtgcacg
      241 acctgccatt ggtgacaatc catttgtcgt ggtgctgcca gacgttgtga tcgacgacgc
      301 cagcgccgac ccgctgcgct acaaccttgc tgccatgatt gcgcgcttca acgaaacggg
      361 ccgcagccag gtgctggcaa aacgtatgcc gggcgatctc tctgaatact ccgtcatcca
      421 gactaaagaa ccgcttgatc gcgaaggtaa agtcagccgc attgttgaat ttatcgaaaa
      481 accggatcag ccgcagacgc tggactcaga tatcatggcc gttggccgct atgtgctttc
      541 tgccgatatt tggccggaac ttgaacgcac tcagcctggt gcatggggac gtattcaact
      601 gactgatgcc atcgctgaac tggcgaaaaa acagtccgtt gatgccatgc tgatgacagg
      661 tgacagctac gactgcggta aaaaaatggg ttatatgcag gcatttgtga agtatggact
      721 acgcaacctg aaagaagggg cgaagttccg taaagggatt gagaagctgt taagcgaata
      781 atgaaaatct gaccgaatgt aacggttgat aagaaaatta taacggcagt gaagattcgc
      841 ggcgaaagta atttgctgcg aatattcctg ccgttgtttt atataaacaa tcagaataac
      901 aacgagttag caataggatt ttagtcaaag ttttccagga ttttccttgt ttccaaagcg
      961 gaatggtaag acaattagcg tttgaatttt tcggatttgg cgcgagtggg taacgctcgc
     1021 cacatcgtag acatgcatgc agtgctctgg tagctgtaaa gccaggggcg gtagcgtgca
     1081 ttaatacctc tattaatcaa actgagagcc gcttatttca cagcatgctc tgaagtaata
     1141 tggaataaat taagtgaaaa tacttgttac tggtggcgca ggatttattg gttctgctgt
     1201 agttcgtcac attataaata atacgcagga tagtgttgtt aatgtcgata aattaacgta
     1261 cgccggaaac ctggaatcac ttgctgatgt ttctgattct gaacgctatg tttttgaaca
     1321 tgcggatatt tgcgatgcag ctgcaatggc acggattttt gctcagcatc agccggatgc
     1381 agtgatgcac ctggctgctg aaagccatgt tgaccgttca attaccggcc ctgctgcatt
     1441 tattgaaacc aatattgttg gtacttatgt ccttttggaa gccgctcgca attactggtc
     1501 tgctcttgat agcgacaaga aaaatagctt ccgttttcat catatttcta ctgacgaagt
     1561 atatggtgat ttgcctcatc ctgacgaggt aaataataca gaagaattac ccttatttac
     1621 tgagacaaca gcttacgcgc caagcagccc ttattccgca tccaaagcat ccagcgatca
     1681 tttagtccgc gcgtggaaac gtacctatgg tttaccgacc attgtgacta attgctctaa
     1741 caattatggt ccttatcatt tcccggaaaa attgattcca ttggttattc tcaatgctct
     1801 ggaaggtaaa gcattaccta tttatggtaa aggggatcaa attcgcgact ggctgtatgt
     1861 tgaagatcat gcgcgtgcgt tatataccgt cgtaaccgaa ggtaaagcgg gtgaaactta
     1921 taacattggt gggcacaacg aaaagaaaaa catagatgta gtgctcacta tttgtgattt
     1981 gctggatgag attgtaccga aagagaaatc ttatcgtgag caaatcactt atgttgccga
     2041 tcgtccggga cacgatcgcc gttatgcgat tgatgctgag aatattggtc gcgaattggg
     2101 atggaaacca caggaaacgt ttgagagcgg gattcggaag acagtggaat ggtatctgtc
     2161 caatacaaaa tgggttgata atgtgaaaag tggtgcctat caatcgtgga ttgaagagaa
     2221 ctatgagggc cgccagtaat gaatatcctc ctttttggca aaacagggca ggtaggttgg
     2281 gaactacagc gtgctctggc acctctgggt aacttgattg ctcttgatgt tcattccact
     2341 gattattgtg gcgatttcag taaccccgaa ggtgtggctg aaaccgtcaa aaaaattcgc
     2401 ccagatgtta ttgttaatgt tgctgctcat accgcggtag ataaggctga gtcagaacca
     2461 gaatttgcac aattactcaa tgcgaccagc gttgaagcaa ttgcaaaagc ggctaatgaa
     2521 gttggggctt gggtaattca ttactcaact gactacgtct tccctggaaa tggcgacatg
     2581 ccatggctcg agacggatgt aaccgctccg ctcaatgttt atggcaaaac caaattggct
     2641 ggagaaagag cattacaaga acattgcgca aagcatctta ttttccgtac cagctgggta
     2701 tatgcaggta aaggaaataa ctttgccaaa acaatgttac gtcaggcaaa agagcgcgaa
     2761 gaactggctg tgataaacga tcagtttggc gcaccaacag gtgctgaatt gctggctgat
     2821 tgcaccgctc atgccattcg cgtggcatta aaaaaaccag aagttgctgg cttgtaccat
     2881 ctggtagcaa atggcacaac aacctggcac gattacgccg cgctagtatt cgaagaagcc
     2941 cgtaaagcag ggattgacct tgcacttaac aaactcaacg ccgtaccaac aacggcttat
     3001 cctactccag cccgccgtcc tcataattct cgcctcaata ccgaaaagtt tcagcagaac
     3061 tttgcgcttg tcttgcctga ctggcaggtg ggcgtgaaac gtatgctcaa cgaattattt
     3121 acgactacgg caatttaaca aatttttgca tctcgctcat gatgccagag cgggatgaat
     3181 taaaaggaat ggtgaaatga aaacgcgtaa aggtattatt ctggctggtg gttccggcac
     3241 tcgtctttat cctgtgacga tggcagtgag taaacaactg ctgccgattt atgataagcc
     3301 gatgatttat tatccgcttt caacgcttat gttagcgggt attcgcgata ttcttattat
     3361 cagtacgcca caggatacac cgcgtttcca acaattgttg ggggacggga gtcagtgggg
     3421 gcttaatcta cagtataaag tacaaccgag tccggatggc ctggcgcaag cgtttattat
     3481 tggtgaagac tttgttggtg gtgatgattg tgcactcgta cttggcgata atatcttcta
     3541 tggacacgac ttgccgaaat taatggaagc tgctgttaac aaagaaatcg gtgcaacggt
     3601 atttgcttat cacgtcaatg atcctgaacg ttatggtgtc gtggagtttg ataataacgg
     3661 tactgcgatt agcctggaag aaaaaccgct ggaaccaaaa agtaactatg cggttactgg
     3721 gctttatttc tatgacaatg atgttgtaga aatggcgaaa aaccttaagc cttctgcccg
     3781 tggcgaactg gaaattaccg atattaaccg tatttatatg gagcagggac gtttgtctgt
     3841 cgctatgatg gggcgtggtt atgcctggtt ggatactggt acacatcaaa gtcttattga
     3901 agcaagtaac ttcattgcca ccattgaaga gcgtcaggga ttaaaggtat cttgcccgga
     3961 agagattgct taccgtaaag ggtttattga tgctgagcag gtgaaagtat tagccgaacc
     4021 gctgaagaaa aatgattatg gtcagtatct gctaaaaatg attaaaggtt attaataaaa
     4081 tgaacgtaat taaaactgaa attcctgatg tgctgatttt tgaaccaaaa gtttttggtg
     4141 atgaacgtgg cttctttttt gagagtttta accagaaagt atttgaagaa gctgcaggac
     4201 ggaaggttga atttgttcag gataaccatt ctaagtctaa aataaatgta ttgcgtggga
     4261 tgcattatca gctaacacaa aatactcaag gaaaactggt tcgggtaatt tctggttcag
     4321 tatatgatgt tgccgtagat ttaagagaaa aatcaaagac atttggcaaa tgggtgggtg
     4381 tagaattatc tgggaataat aaaagacaat tgtggatccc cgaaggtttt gcccatggtt
     4441 tttatgtgtt ggaggagaat accgaatttg tttataaatg taccgatact tataaccctg
     4501 ctcatgaaca cacattgcta tggaatgatc caactacaat ataagttggc caatcataca
     4561 aaactgcaag ccaattattt ctgaaaaaga tgctaatgga catctttttt cacataaaac
     4621 ctatttctga aatgcaatat tatgagttta attagaaaca gtttctataa tattgctggt
     4681 tttgctgtgc cgacattagt tgcagtccct gctttgggga ttcttgccag gctgcttgga
     4741 ccggagaatt ttggactttt cacactagca ttcgctttga taggatatgc aagtattttc
     4801 gacgccggga ttagtcgagc tgtaatcaga gaaatcgctc tttatcgaga aagtgaaaaa
     4861 gagcaaatac aaattatttc gacagcaagt gtaatcgtac tattcttagg ggtggttgca
     4921 gctttgttac tttattttag tagtaataaa gttgttgagt tattgaatgt tagttccgtt
     4981 tatattgaaa cagcagtgcg tgcattctct gttatttcat ttataatacc tgtgtatctg
     5041 attaaccaga tttggcttgg ttatctggaa gggctagaaa aatttgcaaa tataaatgtt
     5101 cagagaatga tttctagcac aagcttggct atattaccag tgatattttg ttattacaat
     5161 ccctcgttgc tttatgctat gtatgggttg gtggttgggc gtgtgatttc atttttgatt
     5221 agcgcaataa tttgtcgaga tattattctt aaaagtaaac tttactttaa tgtggcaact
     5281 tgcaatcgtc ttatctcttt tggtggatgg ataacagtta gtaatatcat aagcccaatc
     5341 atggcatatt tcgaccgctt tatcatctct catattatgg gggcttcgag aattgcattt
     5401 tatacagcgc cctcagaggg tgtatcaagg ttaattaata tcccatatgc tttggcaaga
     5461 gctctatttc ctaaattggc atatagcaat aatgatgatg aacgaaaaaa attacaacta
     5521 cagagctacg caattataag cattgtatgt ctacccatag ttgttattgg tgtcattttt
     5581 gcctcattca taatgacaac atggatggga cctgattatg ccttagaagc agcaactatc
     5641 atgaaaatac ttcttgctgg ttttttcttt aactctttag cgcaaatacc ttatgcatac
     5701 ttgcaatcta tcggaaagtc aaaaattacc gcatttgtgc atctcataga acttgcgcca
     5761 tacttattat tattgtatta cttcacaatg catttcggca taattggcac ggcaatcgct
     5821 tggtcactta gaacattttg tgattttgtt atactacttt cgatatcgag aagaaaatga
     5881 ttgcggttga tattgcgctt gcaacctaca atggtgctaa ttttattcgg caacagattg
     5941 aatctatcca gaaacaaact tatagaaatt ggcgtcttat aataagtgat gataactcga
     6001 gtgatgatac tgttgatatt attaaggata tgatgtctaa cgacagtcgt atctatttgg
     6061 taggaaataa aagacaagga ggggttattc agaactttaa ttatgctctt tcacaaacta
     6121 catctgaaat tgtgttacta tgtgaccagg atgacatttg gccggaggag cgtctggaaa
     6181 ttcttataga taaatttaag gccttgcagc gtaatgattt tgttccggca atgatgttta
     6241 ctgatttgaa attagtagac gaaaataatt gtttgattgc agaaagtttt tatcgaacga
     6301 ataatattaa tccacaagat aatctgaaaa ataataatct tctctggcgt tcaacggtat
     6361 atggctgtac ttgcatcatg aataagaaac ttgttgatat tgcattgcct atacctacat
     6421 atgcacatat gcatgatcaa tggttggcat tattagcgaa gcaatatggt aacatttttt
     6481 atttcgacta tgcgtctgtt cgttataggc aacattctac aaatgttgtt ggtggtagaa
     6541 ataaaacgcc atttcaaaaa tttaattcca tacaaaaaaa cctaaaaagg attaatttgc
     6601 tagtggatag aactgttgct ttaattaaat caaataacga tttctatcca gggaataaaa
     6661 tggaaaataa aattgattac ttaaaatttg gagtgaatga agtattacct tatcttttta
     6721 aaggaaacaa gaaagttttt tcactttgtg tattaattag tttggcatta caaaaatgat
     6781 atatttatta tttttttttg cactgtttat gatctgtacg tttttaacac acaggcgaca
     6841 ggcattatat gttgtatctg cgttagtatt tctttttttg gctttaacct atccatcagg
     6901 aggggactgg ataggttatt ttctccatta tgactgcatg gttaatgagc agtgtaataa
     6961 tggttttata atgtttgaac ctggatatga attaattgtt tccttatttg gatatttggg
     7021 atttcagaca attattattt ttatagccgc tgtaaatgta attctaatat taaattttgc
     7081 aaagcatttt gaaaacggaa gttttgttat tgttgcgata atgtgcatgt tcctttggag
     7141 tgtttatgtt gaggcgatta gacaggctct ggccttatct atagttatat ttgggattca
     7201 ttctcttttt ttgggtagaa aaaggaaatt tataacatta gtattatttg cgtcaacttt
     7261 ccatataact gctttgattt gttttcttct aatgactcct ctattttcaa agaaattaag
     7321 caagataata agttatagcc tattaatttt cagtagcttc tttttcgctt tttctgaaac
     7381 catattaagt gcactccttg caattttgcc agaaggatcc attgccagtg aaaaattaag
     7441 tttttactta gcaaccgagc aatacaggcc acagttatct attgggagtg gcactattct
     7501 tgacattata cttatttttc tgatatgtgt aagttttaaa cgaataaaga aatatatgct
     7561 cgctaattat aatgctgcaa atgagatatt gcttattggt tgctgtcttt atatttcttt
     7621 cggtattttt atcgggaaaa tgatgccagt tatgactcgc attggttggt atggttttcc
     7681 atttgttata gtacttcttt atattaactt gggttattca gaatatttta agaggtatat
     7741 aaataaaaga gggtgtgggt atagcaaatt attaattgct ttttattttt tgctacaaat
     7801 tttgcgacca ttaacatatg attatagcta ttataatata atgcaccagg atactttgct
     7861 gaataggttt gatgcattag atgatgcatc attaagacaa tcagcgaaga gaaaatgttt
     7921 cgatttggga aagataggat atggtttctt atgtagtata taatatcctg cattcattcg
     7981 gataatttcc tatggaagtg tcctttgctc tgtctgtcct catttgttga aattttatgt
     8041 taataagaag ctttagataa ccacttagga actgtatgtt tgatctgtcc aaaaattata
     8101 ttattgtaag tgcgacggcg ctggcttccg gaggtgcatt aactatatta aagcaattta
     8161 taaaacatgc atcacaaaat tcaaatgact atattatgtt tgtatctgcg ggattggagt
     8221 tgccggtctg tgataacatc atttacatag aaaacacacc aaaaggatgg ttgaaaagaa
     8281 tatattggga ttggttcggt tgtcggaagt ttatctcgga acataagatt aacgttaaga
     8341 aagtaatttc tctacaaaat tccagtttga atgttcctta cgaacagatt atttacttgc
     8401 accagccaat tccttttagt aaagttgatt cttttttaaa aaatatcaca tccgataacg
     8461 taaagctttt tttatataaa aagttttatt cctattttat atttaaatat gtgaatgcca
     8521 atacaaccat cgtagtgcaa acgaattgga tgaaaaaagg agtgctggag caatgtgata
     8581 aaattagtac cgaaagggtc cttgttataa aacctgatat caaagcattt aataatacta
     8641 attttgatgt agatatggat gtatctgcaa aaacactctt atatccagcg acaccactta
     8701 cctataaaaa tcatttggtc attctgaagg cgttggttat tttaaagaaa aagtatttta
     8761 tagatgatct gaaattccaa gtgacttttg aaaagaatag gtacaaaaat tttgataagt
     8821 ttgtgcaatt aaataactta agcaaaaacg ttgattatct cggcgttctt tcatactcga
     8881 acttgcaaaa aaaatatatg gcggcatctt taatcgtttt tcctagctat atcgaatcat
     8941 atgggttacc actcatcgaa gctgctagtt taggaaaaaa aatcattagt agtgatcttc
     9001 cttatgcccg ggatgtttta aaggattata gcggcgtaga ttttgtaatt tacaataatg
     9061 aagatggctg ggctaaggcg ttgtttaatg ttttaaatgg caattcgaag ctcaatttta
     9121 ggccttatga aaaagatagt cgttcatctt ggccacagtt cttctctatt ttgaaataag
     9181 gtgtattatg tttaatggta aaatattgtt aattactggt ggtacggggt ctttcggtaa
     9241 tgctgttcta agacgttttc ttgacactga tatcaaagaa atacgtattt tttcccggga
     9301 tgaaaaaaaa caagatgaca tgaggaaaaa atataataat ccgaaactta agttctatat
     9361 aggtgatgtt cgcgactatt cgagtatcct caatgcttct cgaggtgttg attttattta
     9421 tcatgctgca gctctgaagc aagtaccttc ctgcgaattc cacccaatgg aagctgtaaa
     9481 aacgaatgtt ttaggtacgg aaaacgtact ggaagcggca atagctaatg gagttaggcg
     9541 aattgtatgt ttgagtacag ataaagctgt atatcctatc aatgcaatgg gtatttccaa
     9601 agcgatgatg gaaaaagtaa tggtagcaaa atcgcgcaat gttgactgct ctaaaacggt
     9661 tatttgcggt acacgttatg gaaatgtaat ggcatctcgt ggttcagtta tcccattatt
     9721 tgtcgatctg attaaatcgg gtagaccaat gacgataaca gaccctaata tgactcgttt
     9781 catgatgact ctcgaagacg ctgttgattt ggttctttac ccatttgaac atggcaataa
     9841 tggtgatatt tttgtccaaa aggcacctgc ggctaccatc gaaacgttgg ctattgcact
     9901 caaagaattg cttaatgtaa accaccccct gttaaatata atcggaaccc gacacgggga
     9961 aaaactgtac gaagcgttat tgacccgaga ggaaatgatt gcagcgaagg atatgggtga
    10021 atattatcgt gttccaccag atttccgccg attgaactat gggaaaaagt ggaaccatgg
    10081 tgaccgtcgt atctcggaag tggaagatta taatcctcat aatactgata ggttagatgt
    10141 tgagggaatg aaaaaattac tgctaaaact tccttttatc cgggcacttc ggtctggtga
    10201 agattatgag ttggattcat aatatgaaaa ttttagttac tggcgctgca gggtttatcg
    10261 gtcgaaattt ggtattccgg cttaaggaag ctggatataa cgaactcatt acgatagatc
    10321 gtaactcttc tttggcggat ttagagcagg gacttaagca ggcagatttt atttttcacc
    10381 ttgctggggt aaatcgtccc gtgaaggagt gtgaatttga agagggaaat agtaatctaa
    10441 ctcaacagat tgttgatatc ctgaaaaaaa acaataaaaa tactcctatc atgctgagtt
    10501 cttccatcca ggctgaatgt gataacgctt atggaaagag taaagcagct gcggaaaaaa
    10561 tcattcagca gtatggggaa acgacaaacg ctaaatatta tatttatcgc ttgccgaatg
    10621 tattcggtaa gtggtgtcga ccaaattata actcctttat agcaactttc tgccatcgca
    10681 ttgcaaatga tgaagctatt acaattaatg atccttcagc agttgtaaat ctggtgtata
    10741 tggtcgacct gcaggcggcc gcgaattcac tattagaagg agcgaacgaa actggttaca
    10801 ggacatttgg tccaatttat tctgttactg ttggtgaagt ggcacaatta atttaccggt
    10861 ttaaagaaag tcgccaaaca ttaatcaccg aagatgtagg taatggattt acacgtgcat
    10921 tgtactcaac atggttaagt tacctgtctc ctgaacagtt tgcgtatacg gttccttctt
    10981 atagtgatga cagaggggta ttctgtgaag tattgaaaac gaaaaacgcg ggccagtttt
    11041 cgttctttac tgcgcatcca ggaattactc ggggtggtca ttatcatcat tccaaaaatg
    11101 agaaatttat tgtcatccga ggaagtgctt gtttcaaatt tgaaaatatt gtcacgagtg
    11161 aacgatatga acctaatgtt tcctctgatg attttaaaat tgttgaaaca gttccgggat
    11221 ggacgcataa cattactaat aatggctcgg atgagctagt tgttatgctt tgggcaaatg
    11281 aaatatttaa tcgttctgaa ccagatacta tagcgagagt tttatcgtga aaaaattgaa
    11341 agtcatgtcg gttgttggga ctcgtccaga aattattcga ctctcgcgtg tccttgcaaa
    11401 attagatgaa tattgtgacc accttattgt tcataccggg caaaactacg attatgaact
    11461 gaatgaagtt tttttcaaag atttgggtgt tcgcaaacct gattattttc ttaatgccgc
    11521 aggtaaaaat gcagcagaga ctattggaca agttatcatt aaagttgatg aggtccttga
    11581 acaggaaaaa ccagaagcca tgttagtact tggcgatact aactcctgta tttcagcaat
    11641 accagcaaag cgtcgaagaa ttccgatctt ccatatggag gctgggaatc gttgttttga
    11701 ccaacgcgta ccggaagaaa ctaacagaaa aatagttgat cataccgctg atatcaatat
    11761 gacatatagt gatatcgcgc gtgaatatct tctggctgaa ggtgtaccag ccgatagaat
    11821 tattaaaacc ggtagcccaa tgtttgaagt actcactcat tatatgccgc agattgatgg
    11881 ttccgatgta ctttctcgcc tgaatttaac acctgggaat ttctttgtgg taagtgccca
    11941 cagagaagaa aatgttgata cccctaaaca acttgtgaaa ctggcgaata tacttaatac
    12001 cgtggctgaa aaatatgatg tcccggtagt tgtttctact catcctcgca ctcgtaaccg
    12061 catcaacgaa aacggtattc aattccataa aaatatcttg cttcttaagc cattaggatt
    12121 tcacgattac aaccatctgc aaaaaaatgc acgtgctgtt ttatcggata gtgggactat
    12181 tacagaagag tcctccatta tgaacttccc tgcactcaat atacgagaag cgcacgaacg
    12241 cccggaaggc ttcgaagaag gggcagtaat gatggtcggt cttgaatctg atcgcgtttt
    12301 acaggcatta gaaattattg caacacagcc tcgtggagaa gtacgcttac ttcgtcaggt
    12361 tagtgactat agcatgccaa atgtttcaga taaagttctg cgtattatcc attcatatac
    12421 tgactacgtt aaacgggttg tctggaagca atactaatga aacttgcatt aatcattgat
    12481 gattatttgc cccatagcac acgcgttggg gctaaaatgt ttcatgagtt aggccttgaa
    12541 ttactgagca gaggccatga tgtaactgta attacgcctg acatctcatt acaagcaatt
    12601 tattctatta gtatgattga tggtataaag gtttggcgtt tcaaaagtgg acctttaaag
    12661 gatgtaggta aggctaaacg tgccataaat gaaactcttt tatcttttcg cgcatggcgc
    12721 gcatttaagc acctcattca acatgataca tttgatggta tcgtttatta ttccccctct
    12781 attttttggg gcgacttggt taaaaaaata aaacaacgat gccagtgccc aagctatctg
    12841 atcctaaggg atatgtttcc acagtgggtc attgatgcag gtatgttgaa agccggttca
    12901 ccaattgaaa aatattttag gtattttgaa aaaaagtcat atcagcaggc tggccggata
    12961 ggggtaatgt ctgataagaa tcttgagata tttcgccaga ccaataaagg ttatccgtgt
    13021 gaagttttac gtaattgggc ctcaatgact cctgtgtctg ccagcgatga ttatcattca
    13081 cttcgtcaaa aatacgatct aaaagataaa gtcatttttt tctatggcgg taatattggg
    13141 catgctcagg atatggcaaa cttaatgcgc cttgcgcgta atatgatgcg ttatcatgat
    13201 gctcatttcc tgtttatagg gcagggtgat gaagttgagc tgataaaatc tcttgctgca
    13261 gaatggaatt taactaattt cactcatcta ccttcagtga accaggaaga gtttaaatta
    13321 attttatctg aagttgatgt cggcctgttc tccctttcat ctcgccattc ttcacataat
    13381 ttccccggaa aattactagg gtatatggtt caatcaatcc cgatccttgg gagtgtgaat
    13441 ggcggcaatg atttaatgga tgtaattaat aagcacagag ccggtttcat tcatgttaat
    13501 ggtgaagatg ataaactgtt tgaatctgca caattgcttc ttagtgattc agttttaaga
    13561 aaacagctag gtcagaacgc taatgtgttg ttaaagtctc aattttcggt tgaatcggcg
    13621 gcacatacta tcgaagtccg actggaggct ggagaatgcg tttagttgat gacaatattc
    13681 tggatgaact ttttcgcact gcagcaaatt ctgaacgttt gcgcgctcat tatttattgc
    13741 acgcatctca tcaggagaag gttcaacgtt tacttattgc atttgtacgc gacagctatg
    13801 ttgaacccca ttggcatgag ttaccgcatc agtgggaaat gtttgtcgtc atgcaagggc
    13861 aattagaagt ttgtttgtat gagcaaaatg gtgagatcca aaaacagttt gttgttggag
    13921 acggtacggg aataagcgtc gtggaatttt ccccaggaga tatacatagt gtcaaatgcc
    13981 tgtcaccaaa agcccttatg ttggagataa aggaggggcc atttgaccca ctcaaagcta
    14041 aggctttttc taagtggtta tagggcgata caccaccgtt tattcttcta tcttattcta
    14101 tacatgctgg gttaccatct tagcttcttc aagccgcgca accccgcggt gaccacccct
    14161 gacaggagta aacaatgtca aagcaacaga tcggcgtcgt cggtatggca gtgatggggc
    14221 gcaaccttgc gctcaatatc gaaagccgtg gttataccgt ctctattttc aaccgttccc
    14281 gtgaaaagac cgaagaagtg attgccgaaa atccaggcaa aaaactggtt ccttactata
    14341 cggtgaaaga gtttgttgaa tctttggaaa cgcctcgtcg catcctgtta atggtgaaag
    14401 caggtgcagg cacggatgct gctattgctt ccc
//