LOCUS       FN995094               15824 bp    DNA     linear   BCT 16-JUL-2015
DEFINITION  Escherichia coli O-antigen gene cluster, isolate 1303.
ACCESSION   FN995094
VERSION     FN995094.1
KEYWORDS    .
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1
  AUTHORS   Duda,K.A., Lindner,B., Brade,H., Leimbach,A., Brzuszkiewicz,E.,
            Dobrindt,U. and Holst,O.
  TITLE     The lipopolysaccharide of the mastitis isolate Escherichia coli
            strain 1303 comprises a novel O-antigen and the rare K-12 core type
  JOURNAL   Microbiology (Reading, Engl.) 157 (PT 6), 1750-1760 (2011)
   PUBMED   21372091
REFERENCE   2  (bases 1 to 15824)
  AUTHORS   Dobrindt,U.
  TITLE     Direct Submission
  JOURNAL   Submitted (23-JUN-2010) Dobrindt U., Universitaet Wuerzburg, Inst.
            f. Molekulare Infektionsbiologie, Josef-Schneider-Str. 2 / Bau D15,
            97080 Wuerzburg, GERMANY
FEATURES             Location/Qualifiers
     source          1..15824
                     /organism="Escherichia coli"
                     /mol_type="genomic DNA"
                     /serovar="O70:H-"
                     /isolate="1303"
                     /db_xref="taxon:562"
     gene            330..1223
                     /gene="galF"
     CDS             330..1223
                     /gene="galF"
                     /codon_start=1
                     /transl_table=11
                     /product="UTP-glucose-1-phosphate uridylyltransferase"
                     /protein_id="CBN82192.1"
                     /db_xref="GOA:A9C4E3"
                     /db_xref="InterPro:IPR005774"
                     /db_xref="InterPro:IPR005835"
                     /db_xref="InterPro:IPR029044"
                     /db_xref="UniProtKB/TrEMBL:A9C4E3"
                     /translation="MTNLKAVIPVAGLGMHMLPATKAIPKEMLPIVDKPMIQYIVDEI
                     VAAGIKEILLVTHASKNAVENHFDTSYELESLLELRVKRQLLAEVQSICPPGVTIMNV
                     RQGEPLGLGHSILCARPAIGDNPFVVVLPDVVIDDASADPLRYNLAAMIARFNETGRS
                     QVLAKRMPGDLSEYSVIQTKEPLDREGKVSRIVEFIEKPDQPQTLDSDIMAVGRYVLS
                     ADIWPELERTQPGAWGRIQLTDAIAELAKKQSVDAMLMTGDSYDCGKKMGYMQAFVKY
                     GLRNLKEGAKFRKGIEKLLSE"
     gene            1491..1517
                     /gene="jumpstart sequence"
     misc_feature    1491..1517
                     /gene="jumpstart sequence"
     gene            1509..1516
                     /gene="ops element"
     misc_feature    1509..1516
                     /gene="ops element"
     gene            1595..2680
                     /gene="rmlB"
     CDS             1595..2680
                     /gene="rmlB"
                     /codon_start=1
                     /transl_table=11
                     /product="dTDP-glucose 4,6 dehydratase"
                     /protein_id="CBN82193.1"
                     /db_xref="GOA:E6ZDL5"
                     /db_xref="InterPro:IPR001509"
                     /db_xref="InterPro:IPR005888"
                     /db_xref="InterPro:IPR016040"
                     /db_xref="UniProtKB/TrEMBL:E6ZDL5"
                     /translation="MKILVTGGAGFIGSAVVRHIINNTQDSVVNVDKLTYAGNLESLA
                     DVSDSERYVFEHADICDAAAMARIFAQHQPDAVMHLAAESHVDRSITGPAAFIETNIV
                     GTYVLLEAARNYWSALDGDKKNSFRFHHISTDEVYGDLPHPDEVNNKEELPLFTETTA
                     YAPSSPYSASKASSDHLVRAWKRTYGLPTIVTNCSNNYGPYHFPEKLIPLVILNALEG
                     KALPIYGKGDQIRDWLYVEDHARALYTVLTEGKAGETYNIGGHNEKKNIDVVLTICDL
                     LDEIVPKEKSYREQITYVADRPGHDRRYAIDAEKISRELGWKPQETFESGIRKTVEWY
                     LANTKWVENVKLGAYTSYLSKQGGDNN"
     gene            2680..3549
                     /gene="rmlA"
     CDS             2680..3549
                     /gene="rmlA"
                     /codon_start=1
                     /transl_table=11
                     /product="glucose-1-phosphate thymidylyltransferase"
                     /protein_id="CBN82194.1"
                     /db_xref="GOA:E6ZDL6"
                     /db_xref="InterPro:IPR005835"
                     /db_xref="InterPro:IPR005907"
                     /db_xref="InterPro:IPR029044"
                     /db_xref="UniProtKB/TrEMBL:E6ZDL6"
                     /translation="MKGIILAGGSGTRLYPLTLGVSKQLMPIYDKPMIYYPLSVLMLA
                     GIKDILIITTQEDQASFVRLLGDGKKFGVNLSYAIQPSPDGLAQAFIIGEKFIGSESV
                     CLVLGDNIFFGQGFTPKLQIATSRTRGATVFGYQVMDPERFGVVEFDADLKVLSIEEK
                     PFKPKSNWAVTGLYFYDNDVIEIAKSIKPSPRGELEITSVNEVYLTNSSLHVELLGRG
                     FAWLDTGTHDSLIEAGSFVETVQKRQGMMVACPEEIAWRNGWLSNEELLDLGIQLSKN
                     HYGQYLIKLAKHI"
     CDS             3546..3953
                     /note="ORF 3"
                     /codon_start=1
                     /transl_table=11
                     /product="putative dTDP-6-deoxy-3,4-keto-hexulose
                     isomerase"
                     /protein_id="CBN82195.1"
                     /db_xref="GOA:E6ZDL7"
                     /db_xref="InterPro:IPR008894"
                     /db_xref="InterPro:IPR011051"
                     /db_xref="UniProtKB/TrEMBL:E6ZDL7"
                     /translation="MNIEFISLQKHGDERGALVSLEREKNIPFDIRRVYYIFDTKEGI
                     TRGFHAHRKLKQVVIAVKGSCRFILDDGVERVSVVLDNPSEGLLITSLIWREMTDFSK
                     DCVLMVLADMEYDESDYIRDYSIFKLIAQDQNT"
     CDS             4032..5135
                     /note="ORF 4"
                     /codon_start=1
                     /transl_table=11
                     /product="putative aminotransferase"
                     /protein_id="CBN82196.1"
                     /db_xref="GOA:E6ZDL8"
                     /db_xref="InterPro:IPR000653"
                     /db_xref="InterPro:IPR015421"
                     /db_xref="InterPro:IPR015422"
                     /db_xref="InterPro:IPR015424"
                     /db_xref="UniProtKB/TrEMBL:E6ZDL8"
                     /translation="MVDFLNLKKINKRQKQDLLEAVERVIDSGWYIMGSELDSFEQEF
                     AIFCQVKYCLGVANGLDALTLVLRAWKEMGKIKDGDEVIVQANTYIASVLAITENNLI
                     PVLVEPDNKSFNLSVENVCNAISDKTKVILPVHLYGQISPMKDIMRIAKERGLLVLED
                     CAQAHGAQIEGKRAGSWGDAAGFSFYPGKNLGALGDAGAITTNDEELYKVIKALRNYG
                     SEEKYLNLYKGVNSRLDEIQAAMLRVKLKMLSEDIKLRQCIAQRYLTEIKNSFLELPH
                     VENMENHVWHLFVLKTQKREALQLWLERHKIQSLIHYPIPPHKQNAYKKMNNIRLPLT
                     EDLHRKVLSIPMDPTMSDDDVKSVINALNGFMG"
     gene            5132..6382
                     /gene="wzx"
     CDS             5132..6382
                     /gene="wzx"
                     /codon_start=1
                     /transl_table=11
                     /product="putative O-antigen flippase"
                     /protein_id="CBN82197.1"
                     /db_xref="GOA:E6ZDL9"
                     /db_xref="InterPro:IPR002797"
                     /db_xref="UniProtKB/TrEMBL:E6ZDL9"
                     /translation="MSKLLKVTASTGVLTLAKMAMGFAISKIIAIYTGPSGMALLGQI
                     QGAVTVFTGIANAPVSNGIVRYTSEQSKNGIHACSRWWRASLIWVVTIYIILLPVSVL
                     FSHYLADYFFGNKNYAWIIYLIIALLPLTALGTLFLSIINGLQNFRRFVLINFVSVLM
                     SGIVMAVLIIFYNIQGAIVAASIQAALIGLIILVINLNQQWMHFRNFVGKFDYSAICD
                     IGKYVVMAMASSLIMPAALLLVRNVLVQTSGWQGAGLWQAVWKISEVYLSIITIALTT
                     YYLPRLSQLNTIDSIMDEILASVKVVMPIITVIALLVYFSRDVLISILFTDEFRSARE
                     LFAIQLCGDIIKILAWLYAFPMLSRCAVKWYLLTEMFFGIVFILLSYILIPLFQLHGA
                     NYAYLLSYSLYGVVIITNVRRFLK"
     CDS             6420..6932
                     /note="ORF 6"
                     /codon_start=1
                     /transl_table=11
                     /product="putative acetyl transferase"
                     /protein_id="CBN82198.1"
                     /db_xref="GOA:E6ZDM0"
                     /db_xref="InterPro:IPR011004"
                     /db_xref="UniProtKB/TrEMBL:E6ZDM0"
                     /translation="MFLNISLLYIISKTSKNSIIFKMPIIGKGFSLSIFNRAKLNICN
                     LVARNNLSLFVSQGQLTFKKGCFVNNNCSFNCLDSIQIGENTIFGEGVKVYDHDHIID
                     NEYYVSKNEFITSPVKIGSNCWIGTNTIILKGVSITDNVIIGANSLVNKSISEAGVYV
                     SKNGVLTKIK"
     CDS             6948..7868
                     /note="ORF 7"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyl transferase"
                     /protein_id="CBN82199.1"
                     /db_xref="GOA:E6ZDM1"
                     /db_xref="InterPro:IPR001173"
                     /db_xref="InterPro:IPR029044"
                     /db_xref="UniProtKB/TrEMBL:E6ZDM1"
                     /translation="MNKFITITVISYNSSATISDTLNSILQQTYNKKNIEVIISDDAS
                     KDNTLLIANDWKDKNKGIFNNIVIVSHSENKGVAANCNQAWKLAKGEWIKTIAADDML
                     LPNCIEENIKYVLNNSDAKIIFSDMIPFTSYGYEEPMKHDKKKINCSHSQQKKNILYQ
                     CYLLAPTAFINRKALADVGYADEAYPMIEDYPLWLRCLNNGYKFSYMEKNTVIYRQGD
                     SLSQQNTKIGNISYMQSLYSFQKEKIWPQLPKWMIFKKWDDYILYKHKNSWIKIFGNE
                     MTFFYRVFRKLVLLLRPYKMYLFAKKIIMK"
     gene            7879..9159
                     /gene="wzy"
     CDS             7879..9159
                     /gene="wzy"
                     /codon_start=1
                     /transl_table=11
                     /product="putative O antigen polymerase"
                     /protein_id="CBN82200.1"
                     /db_xref="UniProtKB/TrEMBL:E6ZDM2"
                     /translation="MVYNILILIIFIIIVLISNKRLRIFSFKPTFLGAMFLLSLFIQI
                     VPGTILVSFFDYPMSFGVDTTISNEVKIETFRYTFISISALLFIITAASVFLNFDVDL
                     IKLETRYLRAKLLTFFSLVVILVKILSVGNIPFLMVLHGDFDGAALAKAQILKNEVGF
                     GGLFIGYIFVYFPYISLVYAYCQKKKQQYGIEVFRLNLLLITIYSIYDMQKSKFIVVL
                     FILFILYLKFSKKINYWLVTGIPIVSIFLLCSFFILLHNIPMSEVFDSVFARLFIGQT
                     EGSFMIYQALTPDISRIAYGMPLAGLFGISSVDPAAEIITIFFPTAGDAWINSNSYFQ
                     AHAWSIFGDLSLILGPLFVALNIIGLYFLKELFSKVDKAYACCVYIVSILTLPIVNDF
                     SYFLFFKSWFCMIVLMLFYISTVKFIEICCNYKR"
     CDS             9237..10319
                     /note="ORF 9"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyl transferase"
                     /protein_id="CBN82201.1"
                     /db_xref="GOA:E6ZDM3"
                     /db_xref="InterPro:IPR001296"
                     /db_xref="UniProtKB/TrEMBL:E6ZDM3"
                     /translation="MIKILHIVGNKIEPSNGIGRLLPEMIEMQNKFSTNIHCTLCCIN
                     DVYITSSFQVINKNEVKHINIDDYDLFIFHGLYFWSYISFAKKILSKKKSYLIKPHSS
                     LIINAQEKSFIKKRIANLLYFKAFVKNAKAIIFTNDDEAKNSVRWNPNALFEGNGLTS
                     IQSSDIDIKQKQKPYKFVYLSRIDFTHKGTDILLDALDLLKERYNIKDLHLSIYGKGS
                     KEEENELIRRIKKLNFTNVAFYGAIYGNQKYDMFNKKDIFILTSRYEGFPMAILEALD
                     AGLPCLVTRGVNMTSIIEKYHVGWECQTTPQSVANLIVSVLGVEQDVLNEMSRQARKY
                     IIEEHNWPALAKYSESLYKQVCERKQ"
     CDS             10316..11239
                     /note="ORF 10"
                     /codon_start=1
                     /transl_table=11
                     /product="putative UDP-glucose 4-epimerase"
                     /protein_id="CBN82202.1"
                     /db_xref="GOA:E6ZDM4"
                     /db_xref="InterPro:IPR001509"
                     /db_xref="InterPro:IPR016040"
                     /db_xref="UniProtKB/TrEMBL:E6ZDM4"
                     /translation="MNKRILILGGSGFIGVNLIDHFLNCGHEVIVYGRKHPLGEFNNK
                     ITFLKAGFTDISAHKKYLKSLNIDTAIYLINNFPVNSNVPDFEMCLELNKLLINEVFD
                     IVERFIFFSSGGRVYKSSHKPHHEDERLRAVCDYGKSKIYLEQFVISCAYLKCKRFLI
                     VRPSNPYGPHQILTGNQGLIAILLGRIMNGEMIQIWGSGNEIRDYIYIQDFVQIFYKL
                     FCVENPQFNIYNIGSGIGVSTKTILSTVSQRLPNYIIQTEYIENKKTIQSNILCNKRI
                     IGEIGNYHFTDVNSGIEQFIEWLHNIDNRKL"
     CDS             11272..12081
                     /note="ORF 11"
                     /codon_start=1
                     /transl_table=11
                     /product="putative glycosyl transferase"
                     /protein_id="CBN82203.1"
                     /db_xref="GOA:E6ZDM5"
                     /db_xref="InterPro:IPR001173"
                     /db_xref="InterPro:IPR029044"
                     /db_xref="UniProtKB/TrEMBL:E6ZDM5"
                     /translation="MKLSVLLSLYIHESPNFLDDCLASLYKQSHFPDEVVIVFDGPVT
                     NELHDCVDKWSKYLPIVSIELDKNVGLGQALNVGLKKCSYNYVFRMDTDDICHPERLL
                     QQLSFFKNNPDVGLLSCAVGEFKHSVKDIYAWRRLPLKHDEIIRFSKKRNPFNHMAVA
                     FKKELVLNAGGYQNEYLYEDYSLWIRMIQNGVITANLPETLVYARTGNGMAARRSGLK
                     YAKSEYFAQVKFYKMGYLSFLELLRNLAIRLPLRLVPVSLLSLLYSTILRK"
     gene            12307..13425
                     /gene="tnp"
     CDS             12307..13425
                     /gene="tnp"
                     /codon_start=1
                     /transl_table=11
                     /product="transposase IS4 family protein"
                     /protein_id="CBN82204.1"
                     /db_xref="GOA:E6ZDM6"
                     /db_xref="InterPro:IPR002559"
                     /db_xref="UniProtKB/TrEMBL:E6ZDM6"
                     /translation="MEHISVIPDYRQAWKVEHKLSDILLLTICAVIYGVEDWEDLEDF
                     GETHLDFLNQYGDIENGIPVNDTIARVVSCISPAKFHECFINWMRDCHSSDNKDVIAT
                     DGKTLRHSYDKSRRRGAIHVISAFSTMHSLVIGQIKTDEKSNEITAIHELLNMLDIKG
                     KIITTDAMGCQKILLRIYKNREVIIFFAVKGNQGRLNKAFEEKMPLKELNNPEHDSYA
                     ISEKSHGREETRLHIVCDVPDELIDFTFEWKGLKKLCVAVSFRSIIAEQKKEPEMTVR
                     YYISSADLTAEKFAIAILNHWHVENKLHRRLDVVMNEDDCKIRRGNAAELFSGKRHIA
                     INILTNDKVFKAGLRRKMRKAAMDRNYLASVFAGSGLP"
     CDS             13482..13964
                     /note="ORF 13"
                     /codon_start=1
                     /transl_table=11
                     /product="putative acetyl transferase"
                     /protein_id="CBN82205.1"
                     /db_xref="GOA:E6ZDM7"
                     /db_xref="InterPro:IPR001451"
                     /db_xref="InterPro:IPR011004"
                     /db_xref="InterPro:IPR018357"
                     /db_xref="UniProtKB/TrEMBL:E6ZDM7"
                     /translation="MSIHLLSDVKSKKIGMGTTIWQFVVIFENAVIGENCNICAHTLI
                     ENNVVIGNNVTIKSGVYLWDGIILEDNVFVGPSVAFTNDIYPRSKMHKSSYPTTLIKQ
                     GASIGANSTILPGITIGRNSIVGAGSVVTKDVPDDVIVIGNPAKIIRSISSDYPSKIK
                     "
     gene            14309..15715
                     /gene="gnd"
     CDS             14309..15715
                     /gene="gnd"
                     /codon_start=1
                     /transl_table=11
                     /product="6-phosphogluconate dehydrogenase"
                     /protein_id="CBN82206.1"
                     /db_xref="GOA:E6ZDM8"
                     /db_xref="InterPro:IPR006113"
                     /db_xref="InterPro:IPR006114"
                     /db_xref="InterPro:IPR006115"
                     /db_xref="InterPro:IPR006183"
                     /db_xref="InterPro:IPR006184"
                     /db_xref="InterPro:IPR008927"
                     /db_xref="InterPro:IPR012284"
                     /db_xref="InterPro:IPR013328"
                     /db_xref="InterPro:IPR016040"
                     /db_xref="UniProtKB/TrEMBL:E6ZDM8"
                     /translation="MSKQQIGVVGMAVMGRNLALNIESRGYTVSIFNRSREKTEEVIA
                     ENPGKKLVPYYTVKEFVESLETPRRILLMVKAGAGTDAAIDSLKPYLDKGDIIIDGGN
                     TFFQDTIRRNRELSAEGFNFIGTGVSGGEEGALKGPSIMPGGQKEAYELVAPILTKIA
                     AVAEDGEPCVTYIGADGAGHYVKMVHNGIEYGDMQLIAEAYSLLKGGLNLSNEELAQT
                     FTEWNNGELSSYLIDITKDIFTKKDEDGNYLVDVILDEAANKGTGKWTSQSALDLGEP
                     LSLITESVFARYISSLKDQRVAASKVLSGPQAQSAGDKAEFIEKVRRALYLGKIVSYA
                     QGFSQLRAASEEYNWDLNYGEIAKIFRAGCIIRAQFLQKITDAYAENPQIANLLLAPY
                     FKQIADDYQQALRDVVAYAVQNGIPVPTFAAAVAYYDSYRAAVLPANLIQAQRDYFGA
                     HTYKRIDKDGVFHTEWLD"
ORIGIN      
        1 aataactacc cggaagacca ggcagtgaaa aactttgtcg tggcgaatat cacgggatcg
       61 gattgtcgaa cgtttgtttc tgagtaatgc agacgagtca gagaaaaaag gaccaggttg
      121 gactacgatt attcggaaag aggtactgat taaattatca gtatgtggat ttccgagtaa
      181 tccgagtaac ccagatgctg atggtgtgta gtgttatcgt aaggtttaat caaagttatg
      241 cggaactaag ctttggtata tagccataac gtttggctaa cctatggcaa taatttacgc
      301 actatcagcc acttagaggt aggaaaagaa tgacgaattt aaaagcagtt ataccggtag
      361 caggtcttgg gatgcatatg ttgcctgcca ctaaggcgat tcccaaagag atgctaccga
      421 tcgtcgacaa gccaatgatt cagtacattg ttgacgagat tgtggctgca gggatcaaag
      481 aaatcctcct ggtaactcac gcgtccaaga acgcggtcga aaaccacttc gacacctctt
      541 atgaattaga atctctcctt gaactgcgcg tgaagcgcca actgttggcg gaagtacagt
      601 ccatctgtcc gccgggcgtg acaattatga acgtgcgtca gggcgaacct ttaggtttgg
      661 gccactccat tttatgtgca cgacctgcca ttggtgataa tccatttgtc gtggtgctgc
      721 cagacgttgt gatcgacgac gccagcgccg acccgctgcg ctacaacctt gctgccatga
      781 ttgcgcgctt caacgaaacg ggccgcagcc aggtgctggc aaaacgtatg ccaggtgacc
      841 tctctgaata ctctgtcatc cagaccaaag agccgctgga tcgcgaaggt aaagtcagcc
      901 gcattgttga attcatcgaa aaaccggatc agccgcaaac gctggactca gatattatgg
      961 ccgtgggccg ttatgtgctt tctgccgata tttggccgga actggaacgt actcagcctg
     1021 gtgcatgggg acgaattcag ctgactgatg ccattgctga gctggcgaaa aaacagtccg
     1081 ttgacgccat gctgatgact ggagacagct acgactgtgg taaaaaaatg ggctatatgc
     1141 aagcgttcgt gaagtatggg ctgcgcaacc tgaaagaagg ggcgaagttc cgtaaaggca
     1201 ttgagaagct gttaagcgaa taatgaaaat ctgaccggat gtaacggttg ataagaaaat
     1261 tataacggca gtgaagattc gtggcaaaag taatttgttg cgaatattcc tgccgttgtt
     1321 ttatataaac aatcagaata acaacgagtt agcaatagga ttttagtcaa agttttccag
     1381 gattttcctt gtttccagag cggattggta agacaattag cgtttgaatt tttcgagtta
     1441 agcgcgagtg ggtaacgctc gtcacatcgt aggcatgcat gcagtgctct ggtagctgta
     1501 aagccagggg cggtagcgtg cattaatacc tctcttaatc aaactaagag ccgctaattt
     1561 cacagcatgc tctgaagtaa tatggaataa aaaagtgaag atacttgtta ctggtggcgc
     1621 aggatttatt ggttctgctg tagttcgtca cattataaat aatacgcagg atagtgttgt
     1681 taatgtcgat aaattaacgt acgccggaaa cctggaatca cttgctgatg tttctgattc
     1741 tgaacgctat gtttttgaac atgcggatat ttgcgatgct gctgcaatgg cgcggatttt
     1801 tgctcagcat cagccggatg cagtgatgca cctggctgct gaaagccatg tggatcgttc
     1861 aattacaggc cctgcggcat ttattgaaac caatattgtt ggtacttatg tccttttgga
     1921 agcagctcgc aattactggt ctgctcttga tggcgacaag aaaaatagct tccgttttca
     1981 tcatatttct actgacgaag tctatggcga tctgcctcat cctgacgaag taaataataa
     2041 agaagaatta cccctcttta ctgagacgac agcttacgcg ccaagcagcc catattctgc
     2101 ttctaaagca tccagcgatc atttagtccg cgcgtggaaa cgtacctatg gtttaccgac
     2161 cattgtgact aactgttcga ataactacgg cccttatcac tttccggaaa aattgattcc
     2221 gctggtaatt cttaatgctc tggaaggtaa ggcattacct atttatggca aaggggatca
     2281 aattcgcgat tggctgtatg ttgaagatca tgcgcgtgcg ttatataccg ttttaaccga
     2341 aggtaaagca ggtgaaactt ataacattgg tggacacaac gaaaagaaaa acattgatgt
     2401 agtgctcact atttgtgatt tgttggatga gattgtaccc aaagagaaat cttaccggga
     2461 gcaaattact tatgttgccg atcgtccggg acacgatcgc cgctatgcga ttgatgctga
     2521 gaagattagc cgcgaattgg gctggaaacc acaggaaacg tttgagagcg ggattcgtaa
     2581 aacagtggaa tggtacctgg ctaatacaaa atgggttgag aatgtgaaac taggtgcata
     2641 tacttcttac ctttccaaac aaggcggaga taataactga tgaaaggtat tatactggca
     2701 ggtggttcag gaacgaggct atatccatta actttggggg tatctaagca gttgatgccc
     2761 atatatgata aaccaatgat ttattatccc ctatcagtgt taatgttggc aggcataaaa
     2821 gatattctga ttatcactac acaggaagat caggcaagtt ttgttaggtt gttaggggat
     2881 ggaaaaaaat ttggtgttaa tttgagttat gcaattcagc caagtcctga tgggttagct
     2941 caggcattta tcattggaga aaaatttatc ggcagtgaat cggtgtgcct ggtcttaggg
     3001 gacaatatat tctttggaca aggttttacg cccaaattac aaatagcaac gagtcgaaca
     3061 agaggtgcga ctgtttttgg ttatcaagta atggaccctg aacgatttgg agttgttgag
     3121 ttcgatgcgg atctaaaagt tctaagtata gaagaaaaac cctttaaacc aaaatcaaat
     3181 tgggccgtga ctgggctata tttttatgat aatgatgtta ttgaaatagc aaaaagtata
     3241 aaaccgtctc caagaggtga attagagata acatcagtaa atgaagttta cctgactaat
     3301 agttccttac atgttgaatt gttaggccgt ggatttgcat ggcttgatac agggacacat
     3361 gatagcctga ttgaagcggg cagttttgtt gaaactgtgc aaaaacgtca aggaatgatg
     3421 gtcgcttgtc ctgaagaaat tgcttggcgt aatggatggt tgagtaatga ggaattattg
     3481 gatttaggta tccaattaag caaaaatcat tacggtcaat atctaataaa actggcaaag
     3541 catatatgaa tatagagttt atctctcttc agaaacatgg agatgagcga ggggcgctag
     3601 tttcccttga aagagaaaaa aatatccctt ttgatattcg tagagtttat tatatctttg
     3661 atactaaaga aggtataact cgaggattcc atgcccatcg taaactaaag caagttgtaa
     3721 ttgctgtaaa gggtagttgt cgctttattc tcgatgacgg ggtagagcgt gttagtgttg
     3781 tattagataa tccatcggag gggcttctta ttacatctct catctggcga gaaatgacag
     3841 atttcagtaa ggactgtgtt ttaatggttc ttgctgacat ggaatatgat gaatctgatt
     3901 acattagaga ttattctatt tttaaattaa tagcacaaga ccagaacact taaaacatat
     3961 aagatataat aattcgtatt atattgaatt atagaattcg ttgatgacaa ctaaaatcta
     4021 agggttgaga aatggttgat tttttaaatc taaaaaaaat aaataaacgt caaaaacaag
     4081 atttgctaga agcagtagaa agagtaatag attccggttg gtatataatg ggttcagaac
     4141 tggattcatt cgaacaagag tttgcaatat tttgtcaggt caaatactgt cttggggttg
     4201 caaatggtct tgatgctcta actttagttt taagagcttg gaaggaaatg gggaaaataa
     4261 aggatggtga tgaggttatt gtgcaagcaa atacctacat agcatccgta ttagcgataa
     4321 ctgaaaataa tcttattccg gtactagttg agccagataa caaatccttc aatttgtcag
     4381 ttgaaaatgt atgcaatgca atttcagata aaacaaaagt tattctgcca gtacatcttt
     4441 atggtcagat atcgccaatg aaagacatta tgagaattgc caaggaacga gggcttctcg
     4501 ttcttgaaga ttgtgcccaa gcacatggtg ctcaaatcga gggtaaacga gctggtagct
     4561 ggggggatgc tgcaggattc agtttctatc ctggaaaaaa cttgggagcg cttggcgatg
     4621 ctggtgctat caccactaat gatgaggagt tatacaaggt tattaaggcg cttagaaact
     4681 atggttcaga agagaaatat ctaaatctat ataaaggagt taatagccga cttgatgaaa
     4741 tacaggccgc aatgttacgt gtaaaactca aaatgttgag tgaagatatt aaacttagac
     4801 aatgtatagc gcaacgatat cttacagaga taaaaaattc gttcctcgaa ttacctcatg
     4861 ttgaaaatat ggagaaccat gtttggcatt tatttgtcct gaaaacgcaa aaacgagaag
     4921 cattacagtt atggcttgag agacataaga ttcagtcatt aattcactat ccaatccccc
     4981 ctcataagca aaatgcttat aagaaaatga ataatattcg tcttccactg accgaagacc
     5041 tgcacagaaa agtattatca attcctatgg acccaacaat gtcagatgat gatgttaaat
     5101 cagttataaa cgccttaaat ggttttatgg gatgagtaag ctcttaaaag taaccgcctc
     5161 gacaggagtt ttaactctag ctaaaatggc aatgggattt gccatttcga aaattattgc
     5221 gatatatacc ggtccatcag gaatggcctt gcttggccag attcaaggtg ccgtcactgt
     5281 ctttacggga atagcaaatg ctcctgtaag taacggaata gtaaggtata catcagaaca
     5341 aagtaaaaat gggattcatg catgctcacg atggtggcga gcatcattaa tctgggtggt
     5401 aacaatatat ataatattgt tacctgtatc agtgttattt tcacattact tagcggatta
     5461 tttctttggt aacaagaatt atgcatggat aatatactta atcatagcat tgcttcctct
     5521 cactgctttg ggcacccttt ttctatctat aattaatgga cttcaaaatt ttagacgatt
     5581 tgtattaata aattttgttt cagttctaat gtcgggcatt gtgatggccg tactcatcat
     5641 tttctataat atacagggag caattgtagc agcttcgatt caggctgcat taattggctt
     5701 gataatattg gtaattaatt taaaccaaca atggatgcac ttcaggaatt ttgtaggcaa
     5761 gtttgattat tctgcaattt gtgatattgg caaatatgtt gttatggcaa tggcaagttc
     5821 gcttattatg ccagcggctt tacttttagt acgaaacgtc ttggtccaaa caagtggctg
     5881 gcaaggtgca gggctttggc aggctgtttg gaaaatttca gaagtatatc taagtataat
     5941 tacaatagct ttaactacat attatttacc taggctatca cagttgaata ctatcgacag
     6001 cattatggac gaaatacttg caagtgtaaa ggttgtgatg cctattataa ctgtaatcgc
     6061 actgctagtt tatttttcgc gggatgtttt aatttccatt ctctttactg atgaatttag
     6121 atctgcgaga gaactttttg ccattcaact ttgtggagat attataaaaa tattagcatg
     6181 gctttatgcg tttcccatgt tatcaagatg tgcagttaaa tggtatcttt taacagagat
     6241 gttttttggt attgttttta ttttgttgtc ttatatttta attccacttt ttcaattaca
     6301 tggcgcgaat tatgcctatc ttctaagtta tagtttatat ggtgtagtaa ttataacaaa
     6361 tgtccgaaga tttctaaaat aaggatacta aattgttcaa atttatcaaa ttatattata
     6421 tgtttttaaa tatttccctg ctttatataa tcagcaaaac atcaaaaaat tcaataattt
     6481 tcaagatgcc tataattggt aagggattca gtttgtctat ttttaataga gcaaaactca
     6541 atatttgcaa tttagtcgca agaaacaacc tgagcctctt tgtaagccaa ggccaactta
     6601 cgtttaaaaa gggatgtttt gtaaataaca attgttcttt taattgtctg gatagtattc
     6661 aaatagggga gaatacaata tttggcgaag gtgtaaaagt atatgatcat gaccatatca
     6721 ttgacaatga gtattatgtt agcaagaacg agttcattac ttctcctgtg aaaattggct
     6781 caaattgttg gatcggaact aatacaataa ttttaaaagg agtatctata accgacaatg
     6841 taattattgg tgctaattca cttgtaaata aatcaatttc ggaagcaggg gtttatgtaa
     6901 gtaaaaacgg agttttaaca aaaataaaat aaggttatat gttgcgaatg aataaattta
     6961 ttaccattac agtcatttct tataattcta gcgccacaat atctgatacg ctaaatagta
     7021 ttctccagca gacttataat aagaaaaaca ttgaagtcat catttccgat gacgcttcaa
     7081 aagataacac cttgttaatc gctaatgact ggaaagacaa aaataaaggt atttttaata
     7141 atattgttat tgtatcccat agtgaaaata agggagtggc cgctaactgt aatcaggcat
     7201 ggaaattagc taaaggtgaa tggattaaaa ctattgctgc tgatgatatg ttgctcccta
     7261 attgcattga ggaaaatata aaatatgttt tgaataactc agatgcaaaa attattttct
     7321 cagatatgat ccctttcact agttatgggt atgaagaacc aatgaaacat gacaagaaga
     7381 aaatcaactg ttctcatagc caacaaaaaa aaaatatcct ttatcaatgt tatcttctag
     7441 ctccaactgc atttattaat agaaaagctc tcgcggatgt aggttatgcc gatgaggcgt
     7501 acccgatgat cgaagattat cctctttggt tgagatgttt gaataatgga tataaatttt
     7561 cttatatgga aaagaatact gtgatttatc gtcaaggtga ctctttatct caacagaata
     7621 ccaagatcgg taatatatcc tatatgcagt ctttatattc ttttcagaaa gaaaaaatat
     7681 ggccgcagtt gcccaaatgg atgatattta aaaaatggga tgattatata ctatataaac
     7741 ataaaaactc atggataaaa atttttggaa atgaaatgac ctttttttat cgtgtcttcc
     7801 gaaaattggt attattactt agaccgtata aaatgtatct ttttgcaaaa aaaataataa
     7861 tgaaatagag aaataaagat ggtatataac atattaatat taattatttt tataattatt
     7921 gtattgattt caaataaaag attacgcatt tttagtttca aaccaacatt tttaggggct
     7981 atgtttttat tgtctctgtt tatacaaatt gtccctggaa caattttggt ttcattcttt
     8041 gattacccaa tgtctttcgg agtggataca actataagca atgaggtaaa aattgagaca
     8101 tttagatata cttttatttc aatttcagca ttgttattta taataacagc agcctcagtt
     8161 tttttgaatt tcgatgtgga tttaattaaa ttagaaaccc gatatttgag agccaaacta
     8221 cttacctttt tttctttggt tgttatatta gtaaaaatat tatcagttgg taatattcca
     8281 tttttgatgg ttttacatgg tgatttcgat ggtgccgcct tggcaaaggc acaaatcttg
     8341 aaaaatgaag ttggatttgg tggtcttttt atcggttaca tttttgttta cttcccttat
     8401 atatcattag tatatgcata ttgtcaaaaa aagaaacaac aatatggaat agaggtgttt
     8461 agattaaatc ttcttcttat aacaatatac agtatttacg atatgcagaa gtcaaagttt
     8521 attgttgtat tatttatatt gtttattctt tatttgaagt tttcgaagaa aatcaattat
     8581 tggttagtaa caggtatacc tattgtgagc atttttctct tatgttcctt ttttattttg
     8641 ttacacaata ttccaatgag tgaagtattt gattctgttt ttgcaagatt atttattggg
     8701 cagacggaag gctcttttat gatatatcaa gcattgactc ctgatatttc gcgcatcgcg
     8761 tatggtatgc cgttagctgg tctgtttgga atatcatcgg tcgatccagc agcggaaatc
     8821 atcacgatat tttttccaac tgctggggat gcatggatca attccaatag ttatttccaa
     8881 gcccatgcgt ggtcgatttt tggtgattta tcgctaatct tagggccact gtttgttgca
     8941 ctgaatataa ttggtctata ttttttaaaa gagctcttta gtaaagttga caaagcctat
     9001 gcttgttgcg tttacatcgt atcaattctt actttaccca tagttaatga cttctcatat
     9061 tttttatttt ttaaatcatg gttttgcatg attgtattaa tgctatttta tatttcaacg
     9121 gtcaagttca ttgaaatttg ttgtaattat aaaagataaa atatgtacta atcatcatcc
     9181 tgtcactgca tttgcaacag ataacttaaa accttataaa tacaagcttg gtaattatga
     9241 taaaaatatt gcacatcgtt ggtaacaaaa tagaaccttc aaatggcata ggtcgtttat
     9301 taccagaaat gatagagatg caaaataaat ttagtacaaa catacactgt acactttgtt
     9361 gtattaatga cgtatatata acctcctcat ttcaagtaat caacaaaaat gaagtaaagc
     9421 atattaatat agatgattat gatcttttta ttttccatgg tctttatttt tggtcatata
     9481 tttcttttgc aaaaaaaata ttatctaaaa aaaagtcata tcttattaag cctcattcta
     9541 gtttgataat aaatgctcaa gaaaaatcat tcataaaaaa aagaatcgca aatttattat
     9601 attttaaggc atttgttaaa aatgcaaagg caattatatt tacaaatgac gatgaagcga
     9661 agaactccgt tcgctggaat ccgaatgctc ttttcgaagg taacggtctc acaagtatac
     9721 aatcatcaga tattgatata aaacagaaac agaaaccata taagtttgtg tatctctcac
     9781 gaatagattt tactcataaa ggtacggata tacttcttga tgctttagac ttattaaaag
     9841 aaagatataa tattaaggat cttcatctct caatctatgg gaaaggatca aaagaagaag
     9901 agaatgaact tattcgtcgt ataaaaaaac taaattttac gaatgttgca ttttatggag
     9961 caatttacgg taatcaaaaa tatgatatgt ttaataagaa agatattttc attttgactt
    10021 cacgttatga gggattcccg atggcgatac tagaagcact agatgcaggt ttgccatgtt
    10081 tagttacaag aggtgttaat atgacaagta ttattgagaa atatcatgtt ggatgggaat
    10141 gtcaaacgac tcctcaaagt gtggcaaatt tgattgtttc tgtacttggg gtagagcagg
    10201 atgttctgaa tgaaatgtct agacaggccc gtaaatatat cattgaagag cataactggc
    10261 ctgcacttgc taaatattca gaatcgctct ataaacaagt ttgtgagagg aaacagtgaa
    10321 taaacgtatt cttattttag gtggttccgg atttattggt gttaatctga ttgatcattt
    10381 tttgaattgt ggtcacgagg ttattgtata tgggagaaag caccctttag gagaatttaa
    10441 taataaaatc acttttctta aggcggggtt tactgatatt tctgcgcata agaaatattt
    10501 aaaaagctta aatattgaca cggcaatata tttaataaat aatttccctg ttaattcaaa
    10561 tgtaccagac ttcgagatgt gtctagagtt aaataaacta ttaataaatg aggtatttga
    10621 tatcgtagaa cgttttattt ttttttcttc tggcggtaga gtttataaaa gtagtcacaa
    10681 acctcaccat gaagacgaac gcctgagggc cgtatgtgat tatggaaaaa gtaaaattta
    10741 tttagagcag tttgtcattt catgtgcata tttgaaatgc aaaagattcc ttatcgttag
    10801 gccatcaaac ccttatggtc ctcatcagat attaactgga aatcaggggt tgatagccat
    10861 actactaggc cgtattatga acggagagat gatacaaata tggggaagtg ggaacgaaat
    10921 aagagattat atttatattc aagattttgt tcaaatattt tacaagttat tctgtgtgga
    10981 aaatccacaa tttaatattt ataatatcgg ttcgggtata ggagtgtcaa caaaaactat
    11041 cctaagtacg gtcagtcaaa gacttcctaa ttatattatt caaactgaat atatagagaa
    11101 taaaaaaaca atacaatcta acattctttg taataaacgc attattgggg aaataggaaa
    11161 ttaccatttt actgatgtta actctggtat tgaacaattt attgaatggt tacataatat
    11221 cgataataga aaattataat ataatttttc atttttaatg gtaagcctct catgaaatta
    11281 agcgtattac tttcattata catacatgaa tcaccaaatt ttttggatga ttgcttagca
    11341 agcttgtata agcaaagtca ttttcctgac gaagtcgtga ttgtttttga tggccctgtg
    11401 actaatgaat tgcatgactg tgttgataaa tggagtaaat atttaccaat tgtttctatt
    11461 gaattggata agaatgttgg ccttggtcaa gctttgaatg ttgggttaaa aaagtgtagc
    11521 tataattatg tcttcaggat ggataccgat gatatatgtc acccagagcg actattgcaa
    11581 caattatctt tttttaaaaa taatcccgat gttgggttat tgagttgtgc tgtaggtgag
    11641 tttaaacatt ctgtcaaaga catctatgca tggcgcaggc ttcctctcaa acatgatgaa
    11701 ataatccgtt tttcaaagaa aagaaatcct ttcaatcata tggctgtagc ctttaaaaaa
    11761 gaattagttt taaatgccgg aggttatcaa aatgaatact tatatgaaga ttattcatta
    11821 tggattcgca tgattcagaa tggtgtaatt acagccaatt taccggaaac gctcgtatat
    11881 gctagaactg gaaatggaat ggcagctaga cgttcaggct taaagtatgc taagtctgaa
    11941 tattttgcac aagtaaaatt ttacaaaatg ggatatttga gttttctgga gttgttacgt
    12001 aatctggcaa ttagattacc tctcaggctt gttccggttt cattattgtc attactttac
    12061 tcgactattt tgcgtaaata aagttaaatt aatatccttt ataaaaatca tgtgtttttt
    12121 tgttaaatcc ttaagggatg gagaatatga aaagataatc aaaagcacac ttttgcactt
    12181 aataatttgc attttatgtt caataattaa gatattcctt attacctaaa accgttttac
    12241 attgcttata catgatcaaa tactccttac ataattaagg agaacaaaat tgaactttaa
    12301 aaattgatgg aacatatttc cgttattccc gattacagac aagcctggaa agtggagcat
    12361 aaattgtcag atattctact gttgactatt tgtgccgtta tttatggtgt agaagattgg
    12421 gaagatcttg aggattttgg ggaaacacat ctcgattttt tgaatcaata tggtgatatt
    12481 gaaaatggta ttcctgttaa cgataccatt gccagagtgg tatcctgtat cagtcctgca
    12541 aaatttcacg agtgctttat taactggatg cgtgactgcc attcttcaga taataaagac
    12601 gtcatcgcaa ctgatggaaa aacactccga cattcttatg acaagagtcg ccgcagggga
    12661 gcgattcatg tcattagcgc gttctcaaca atgcacagtc tggtcatcgg acagatcaag
    12721 acggatgaga aatctaatga gattacagct atccatgaac tgcttaacat gttggatatt
    12781 aagggaaaaa taatcacaac tgatgcgatg ggttgccaaa agatattgct gagaatatac
    12841 aaaaacaggg aggtgattat ttttttcgct gtaaaaggaa accagggacg gctaaataaa
    12901 gccttcgagg aaaaaatgcc gctgaaagaa ttaaataatc cagagcatga tagttacgca
    12961 attagtgaaa agagtcacgg cagagaagaa acccgtcttc atattgtctg cgatgtccct
    13021 gatgaactta ttgatttcac gtttgaatgg aaaggactga aaaaattatg cgtggcagtc
    13081 tcctttcggt caataatagc agaacaaaag aaagagccag aaatgacggt cagatattat
    13141 atcagttctg ctgatttaac tgcagagaag ttcgccatag caatcctaaa ccactggcac
    13201 gtggagaata agctgcaccg tcgtctggac gtggtaatga atgaagacga ctgcaaaata
    13261 agaagaggaa acgcagcaga attattttca gggaaacggc acatcgctat taatatttta
    13321 acgaatgata aggtattcaa ggcagggtta agacgtaaga tgcgaaaagc agccatggac
    13381 agaaactacc tggcgtcagt ctttgcgggg agcgggcttc cgtaatcttg ccttgattac
    13441 tatattcttg aaataaataa ttaatattat tgagggttta tatgagcatc catttattga
    13501 gtgacgtaaa atcaaaaaaa ataggcatgg gtactacaat ttggcaattt gtggtaattt
    13561 tcgaaaatgc agtaattgga gaaaattgca atatttgtgc acatacttta attgaaaaca
    13621 atgtagttat aggtaataat gttacaatta aatctggtgt gtatttatgg gatggtataa
    13681 tattagagga taatgtattc gttggtcctt ctgttgcttt cacaaatgat atttatcctc
    13741 gttcaaaaat gcataaatca tcttacccta cgactttgat taaacagggt gcatcgattg
    13801 gggctaattc aactatatta ccgggtataa caataggtcg caatagtatc gttggtgctg
    13861 gctcagtcgt tactaaagat gttcctgatg atgttattgt tattggaaat ccggctaaaa
    13921 taatacgatc tatatcaagc gattatccat ctaaaataaa atgacatcgt ttttgagtga
    13981 ctgttttatt atatttttat ttgattgtgc taattttgtt gaggcgtaaa tgtagagggt
    14041 agtagcgtaa ttaaaaagtg tttggtcata atattaattg gtgttcatgc gttctaatac
    14101 ttctatatta agattcaaaa catagtgtca aatctcgatt tcttaaatta tctatgaatt
    14161 gcactctcca gtgaaaattt ttaactcctt atattgttat tctctatttc attcagtaat
    14221 tttaaaaatc cttaattttg cattaaataa aaatcacatt tacatcataa acaagccgct
    14281 ccgcggtaac ccctgacagg agtaaacaat gtcaaagcaa cagatcggcg tagtcggtat
    14341 ggcagtgatg gggcgcaacc ttgcgctcaa catcgaaagc cgtggttata ccgtctctat
    14401 tttcaaccgc tcccgtgaga agacggaaga agtgattgcc gaaaatccag gcaagaaact
    14461 ggttccttac tatacggtga aagagtttgt tgaatctctg gaaacgcctc gtcgcatcct
    14521 gttaatggtg aaagcaggtg caggcacgga tgctgctatt gattccctca agccgtacct
    14581 cgataaaggt gacatcatca ttgatggtgg taataccttc ttccaggaca ccattcgccg
    14641 taaccgtgag ctttctgccg aaggctttaa cttcatcggt accggtgttt ccggtggtga
    14701 agagggcgcg ctgaaagggc cttccattat gcctggtggc cagaaagaag cctatgaact
    14761 ggttgctccg atcctgacca aaatcgccgc agtagctgaa gacggtgagc catgcgttac
    14821 ctatattggt gccgatggcg caggtcacta tgtgaagatg gttcacaacg gtattgaata
    14881 cggtgatatg cagctgattg ctgaagccta ttctctcctg aaaggcggcc tgaatctctc
    14941 taacgaagaa ctggcacaga cctttaccga gtggaataac ggtgaactga gcagctacct
    15001 gatcgacatc accaaagaca tcttcactaa aaaagatgaa gacggtaact acctggttga
    15061 tgtgatcctg gatgaagcgg ctaacaaagg taccggtaaa tggaccagcc agagcgcgct
    15121 ggatctcgga gaaccgctgt cgctgattac cgagtctgtg tttgcacgtt atatctcttc
    15181 tctgaaagat cagcgcgttg ccgcatctaa agttctctct ggtccgcaag ctcagtcagc
    15241 aggcgacaag gctgagttca tcgaaaaagt tcgccgtgcg ctgtatctgg gcaaaatcgt
    15301 ttcttacgct cagggcttct ctcagctgcg tgctgcgtct gaagaataca actgggatct
    15361 gaactacggc gaaatcgcga agattttccg tgctggctgc atcatccgtg cgcagttcct
    15421 gcagaaaatc accgatgcat atgccgaaaa tccgcagatc gctaacctgc tgctggctcc
    15481 gtacttcaag caaattgccg atgactacca gcaggcactg cgcgatgtcg tcgcttatgc
    15541 ggtacagaac ggtatcccgg ttccgacctt cgctgctgcg gttgcctatt acgatagcta
    15601 ccgtgccgct gttctgcctg cgaacctgat ccaagcacag cgtgactatt tcggtgcgca
    15661 tacttataag cgcattgata aagatggtgt gttccatact gaatggctgg attaatctga
    15721 tttaaccaac aataaaattg aggcccggcg tatattgcac cgggcttttt tttgccaaat
    15781 atcttataga ctaaatttca ctgcttaata ttaacttaat aaat
//