LOCUS NZ_ACVX01000040 28409 bp DNA linear CON 10-NOV-2010 DEFINITION Clostridium thermocellum DSM 2360 ctg00039, whole genome shotgun sequence. ACCESSION NZ_ACVX01000040 NZ_ACVX00000000 VERSION NZ_ACVX01000040.1 GI:256005755 DBLINK Project: 55637 KEYWORDS WGS. SOURCE Clostridium thermocellum DSM 2360 ORGANISM Clostridium thermocellum DSM 2360 Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae; Clostridium. REFERENCE 1 (bases 1 to 28409) AUTHORS Lucas,S., Copeland,A., Lapidus,A., Glavina del Rio,T., Tice,H., Bruce,D., Goodwin,L., Pitluck,S., Larimer,F., Land,M.L., Hauser,L. and Hemme,C.L. CONSRTM US DOE Joint Genome Institute (JGI-PGF) TITLE The draft genome of Clostridium thermocellum DSM 2360 JOURNAL Unpublished REFERENCE 2 (bases 1 to 28409) AUTHORS Lucas,S., Copeland,A., Lapidus,A., Glavina del Rio,T., Tice,H., Bruce,D., Goodwin,L., Pitluck,S., Larimer,F., Land,M.L., Hauser,L. and Hemme,C.L. CONSRTM US DOE Joint Genome Institute (JGI-PGF) TITLE Direct Submission JOURNAL Submitted (17-JUL-2009) US DOE Joint Genome Institute, 2800 Mitchell Drive B310, Walnut Creek, CA 94598-1698, USA COMMENT PREDICTED REFSEQ: This record has not been reviewed and the function is unknown. The reference sequence was derived from ACVX01000040. URL -- http://www.jgi.doe.gov JGI Project ID: 4085028 Source DNA and Bacteria available from Christopher L. Hemme (hemmecl@ou.edu) Contacts: Christopher L. Hemme (hemmecl@ou.edu) David Bruce (microbe@cuba.jgi-psf.org) Whole genome sequencing and draft assembly at JGI-PGF Annotation by JGI-ORNL The JGI and collaborators endorse the principles for the distribution and use of large scale sequencing data adopted by the larger genome sequencing community and urge users of this data to follow them. It is our intention to publish the work of this project in a timely fashion and we welcome collaborative interaction on the project and analysis. (http://www.genome.gov/page.cfm?pageID=10506376). ##Metadata-START## Organism Display Name :: Clostridium thermocellum DSM 2360 Culture Collection ID :: DSM 2360 GOLD Stamp ID :: Gi02594 Isolation Site :: contaminant of Clostridium thermocellum strain LQ8 Isolation Country :: USA Oxygen Requirement :: Anaerobe Cell Shape :: Rod-shaped Motility :: Motile Sporulation :: Sporulating Temperature Range :: Thermophile Temperature Optimum :: 60 C Gram Staining :: gram+ Biotic Relationship :: Free living Diseases :: None Phenotypes :: Cellulose degrader, Ethanogenic, Ethanol production Energy Source :: Chemoorganotroph ##Metadata-END## FEATURES Location/Qualifiers source 1..28409 /organism="Clostridium thermocellum DSM 2360" /mol_type="genomic DNA" /strain="DSM 2360" /isolation_source="contaminant of Clostridium thermocellum strain LQ8" /db_xref="taxon:572545" gene complement(817..1671) /locus_tag="ClothDRAFT_2570" CDS complement(817..1671) /locus_tag="ClothDRAFT_2570" /inference="protein motif:PFAM:PF03773" /note="PFAM: permease; KEGG: cha:CHAB381_0335 permease" /codon_start=1 /transl_table=11 /product="permease" /protein_id="ZP_05430709.1" /db_xref="GI:256005756" /db_xref="InterPro:IPR005524" /translation="MNILAMIFGWLNDQLLKMRWLSELVRLLVEKVFGLPVSERIGGS IHFFIYDTIKIFILLSLLIFVISYIQSYFPPERTKKILGKIKGIKGNILGALLGTITP FCSCSSIPIFIGFTSAGLPLGITFSFLISSPMVDLASLMLLISFFGLKIAIAYVVVGL ILAVIGGTLIEKFRLEKYVEGYVREIENVDAEVPEMTRKERISYSKEQVRDIIKRVWL YVLIGVGIGAAIHNWIPQSFIENVVGGNNPFAVMLATVVGIPMYADIFGTLPIAEALF AKGVDVGV" misc_feature complement(823..1545) /locus_tag="ClothDRAFT_2570" /note="Predicted permease; Region: DUF318; cl00487" /db_xref="CDD:119868" gene complement(1780..2181) /locus_tag="ClothDRAFT_2571" CDS complement(1780..2181) /locus_tag="ClothDRAFT_2571" /inference="protein motif:PFAM:PF01451" /note="PFAM: Protein-tyrosine phosphatase, low molecular weight; SMART: Protein-tyrosine phosphatase, low molecular weight; KEGG: cju:C8J_1458 arsenate reductase" /codon_start=1 /transl_table=11 /product="Protein-tyrosine phosphatase, low molecular weight" /protein_id="ZP_05430710.1" /db_xref="GI:256005757" /db_xref="InterPro:IPR017867" /translation="MKKKVAFVCVHNSCRSQMAEGWAKKLGSDVLEAYSAGTEKYPEV KPLAVQVMEEAGVDMSDHHPKLLSDIPAEVDILITMGCNVECPYVPCQHIEDWGLSDP SGGPIEDYRKTRDIIKEKVEDLIQRVKNNQI" misc_feature complement(1801..2175) /locus_tag="ClothDRAFT_2571" /note="Low molecular weight phosphotyrosine protein phosphatase; Region: LMWPc; pfam01451" /db_xref="CDD:144880" misc_feature complement(1804..2175) /locus_tag="ClothDRAFT_2571" /note="Low molecular weight phosphatase family; Region: LMWPc; cd00115" /db_xref="CDD:29014" misc_feature complement(order(2134..2142,2146..2151,2155..2157)) /locus_tag="ClothDRAFT_2571" /note="active site" /db_xref="CDD:29014" gene complement(2206..3261) /locus_tag="ClothDRAFT_2572" CDS complement(2206..3261) /locus_tag="ClothDRAFT_2572" /inference="protein motif:TFAM:TIGR00832" /note="TIGRFAM: arsenical-resistance protein; PFAM: Bile acid:sodium symporter; KEGG: aeh:Mlg_2709 bile acid:sodium symporter" /codon_start=1 /transl_table=11 /product="arsenical-resistance protein" /protein_id="ZP_05430711.1" /db_xref="GI:256005758" /db_xref="InterPro:IPR002657" /db_xref="InterPro:IPR004706" /translation="MSDKETMQENKGLGFFEKYLTVWVAVCIIVGVAIGQLVPSIPET LSKFEYANVSIPVAILIWLMIYPMMLKIDFSSIVRATKKPKGLIVTCVTNWLIKPFTM YLIAAFFLKVVFSRWIGPDLATDYLAGAVLLGAAPCTAMVFVWSYLTKGDPAYTLVQV AVNDLIILFAFTPIVAFLLGVSNVTVPYDTLILSTILFVVIPLAGGYLTRRNIIKHKS IEYFENIFLKKFDNVTIVGLLLTLVIIFSFQGEIILSNPLHIILIAIPLIIQTFFIFF IAYGWAKIWKLPHDIAAPAGMIGASNFFELAVAVAISLFGLESGAALATVVGVLVEVP VMLTLVRIANSTRHWFQ" misc_feature complement(2302..3225) /locus_tag="ClothDRAFT_2572" /note="Membrane transport protein; Region: Mem_trans; cl09117" /db_xref="CDD:164125" gene complement(3397..3795) /locus_tag="ClothDRAFT_2573" CDS complement(3397..3795) /locus_tag="ClothDRAFT_2573" /inference="protein motif:PFAM:PF01022" /note="PFAM: regulatory protein ArsR; SMART: regulatory protein ArsR; KEGG: saz:Sama_0493 transcriptional regulator" /codon_start=1 /transl_table=11 /product="transcriptional regulator, ArsR family" /protein_id="ZP_05430712.1" /db_xref="GI:256005759" /db_xref="InterPro:IPR001845" /translation="MDLIEIFKALGDENRIRILNLLIRQELCVCEIETVLDMTQSNAS RHLNKLKTSGIITSEKKSQWVYYRVDNKFIEENNLLYEFIKNKMAENTQLLRDIETLK KYKNSNFTCEQLREDKSQVLKYLREQCNNN" misc_feature complement(3580..3777) /locus_tag="ClothDRAFT_2573" /note="Arsenical Resistance Operon Repressor and similar prokaryotic, metal regulated homodimeric repressors. ARSR subfamily of helix-turn-helix bacterial transcription regulatory proteins (winged helix topology). Includes several proteins that appear to...; Region: HTH_ARSR; cd00090" /db_xref="CDD:28974" misc_feature complement(order(3634..3636,3724..3726,3733..3738, 3745..3750,3757..3759,3766..3768,3772..3777)) /locus_tag="ClothDRAFT_2573" /note="dimerization interface; other site" /db_xref="CDD:28974" misc_feature complement(order(3595..3603,3616..3624,3640..3645, 3649..3654,3661..3666,3670..3681,3706..3714,3751..3759, 3769..3774)) /locus_tag="ClothDRAFT_2573" /note="putative DNA binding site; other site" /db_xref="CDD:28974" misc_feature complement(order(3703..3705,3712..3714)) /locus_tag="ClothDRAFT_2573" /note="putative Zn2+ binding site; other site" /db_xref="CDD:28974" gene complement(4567..6390) /locus_tag="ClothDRAFT_2574" CDS complement(4567..6390) /locus_tag="ClothDRAFT_2574" /inference="protein motif:TFAM:TIGR01135" /note="TIGRFAM: glucosamine/fructose-6-phosphate aminotransferase, isomerizing; PFAM: sugar isomerase (SIS); glutamine amidotransferase class-II; KEGG: pca:Pcar_2933 glucosamine--fructose-6-phosphate aminotransferase, isomerizing" /codon_start=1 /transl_table=11 /product="glucosamine/fructose-6-phosphate aminotransferase, isomerizing" /protein_id="ZP_05430713.1" /db_xref="GI:256005760" /db_xref="InterPro:IPR000583" /db_xref="InterPro:IPR001347" /db_xref="InterPro:IPR005855" /translation="MCGIVGYIGSRDAAPILLNGLKKLEYRGYDSAGVAILDNGNIKV VKCKGRLEKLEEKVNCDAPVGNIGIGHTRWATHGEPNDLNSHPHISSSGKIAVVHNGI IENYLELKEFLAAEGYEFVSDTDTEVVAHLIDYHYHGDIVQAVITSINEIEGSYALGV LCRDYPDKFVAARKDSPLIVGLGNGENFIASDIPAILEYTRDVYILEDKEIVLLSDKE VKVFNNHGLAVQKKVFKVNWDVASAEKAGYEHFMMKEMCEEPKVVRDTVNPRIKDGNI VLDNIRITAEDLKNIRKIFIVACGTAYHAGVVGKYIIEKLARIPVEVDVASEFRYRDP LISDKDLVIIISQSGETIDTLFALRESKKKGARVLSIVNVVGSSIARESDDVLYTWAG PEIAVASTKAYNTQLSALYLIALDFAYKLGRIDRDYYSKVIEELKAVPREIEKVLANR DIIQKFASQHYNAKSIFFIGRGLDYALSMEGSLKLKEISYIHSEAYAGGELKHGTIAL IEEGTLVVCPVTQDSLVEKMISNIREVKARGAVVLAIAKESNKQVCKVADVVVTIPDV DSFIAPIVAVTPLQLFAYYMALQKGCDVDKPRNLAKSVTVE" misc_feature complement(4570..6390) /locus_tag="ClothDRAFT_2574" /note="glucosamine--fructose-6-phosphate aminotransferase; Reviewed; Region: PRK00331" /db_xref="CDD:178980" misc_feature complement(5749..6387) /locus_tag="ClothDRAFT_2574" /note="Glutamine amidotransferases class-II (Gn-AT)_GFAT-type. This domain is found at the N-terminus of glucosamine-6P synthase (GlmS, or GFAT in humans). The glutaminase domain catalyzes amide nitrogen transfer from glutamine to the appropriate substrate...; Region: GFAT; cd00714" /db_xref="CDD:48478" misc_feature complement(order(6013..6018,6088..6093,6133..6135, 6160..6165,6169..6174,6310..6312,6385..6387)) /locus_tag="ClothDRAFT_2574" /note="glutaminase active site; other site" /db_xref="CDD:48478" misc_feature complement(5137..5514) /locus_tag="ClothDRAFT_2574" /note="SIS (Sugar ISomerase) domain repeat 1 found in Glucosamine 6-phosphate synthase (GlmS) and Glucosamine-6-phosphate deaminase (GlmD). The SIS domain is found in many phosphosugar isomerases and phosphosugar binding proteins. GlmS contains a N-terminal...; Region: SIS_GlmS_GlmD_1; cd05008" /db_xref="CDD:88405" misc_feature complement(order(5332..5334,5398..5400,5407..5409, 5419..5421,5425..5427,5446..5451,5458..5463,5491..5496)) /locus_tag="ClothDRAFT_2574" /note="dimer interface; other site" /db_xref="CDD:88405" misc_feature complement(order(5347..5355,5485..5490)) /locus_tag="ClothDRAFT_2574" /note="active site" /db_xref="CDD:88405" misc_feature complement(4576..5040) /locus_tag="ClothDRAFT_2574" /note="SIS (Sugar ISomerase) domain repeat 2 found in Glucosamine 6-phosphate synthase (GlmS) and Glucosamine-6-phosphate deaminase (GlmD). The SIS domain is found in many phosphosugar isomerases and phosphosugar binding proteins. GlmS contains a N-terminal...; Region: SIS_GlmS_GlmD_2; cd05009" /db_xref="CDD:88406" misc_feature complement(order(4579..4581,4594..4599,4789..4794, 4798..4800,4810..4815,4864..4875,4879..4887,4891..4893, 4903..4905,4909..4911,4915..4917,4921..4923,4933..4935, 4975..4977)) /locus_tag="ClothDRAFT_2574" /note="dimer interface; other site" /db_xref="CDD:88406" misc_feature complement(order(4930..4932,4939..4941)) /locus_tag="ClothDRAFT_2574" /note="active site" /db_xref="CDD:88406" gene complement(6852..8201) /locus_tag="ClothDRAFT_2575" CDS complement(6852..8201) /locus_tag="ClothDRAFT_2575" /EC_number="5.4.2.10" /inference="protein motif:TFAM:TIGR01455" /note="KEGG: gbm:Gbem_2635 phosphoglucosamine mutase; TIGRFAM: phosphoglucosamine mutase; PFAM: phosphoglucomutase/phosphomannomutase alpha/beta/alpha domain I; phosphoglucomutase/phosphomannomutase alpha/beta/alpha domain III; phosphoglucomutase/phosphomannomutase ; phosphoglucomutase/phosphomannomutase alpha/beta/alpha domain II" /codon_start=1 /transl_table=11 /product="phosphoglucosamine mutase" /protein_id="ZP_05430714.1" /db_xref="GI:256005761" /db_xref="InterPro:IPR005841" /db_xref="InterPro:IPR005843" /db_xref="InterPro:IPR005844" /db_xref="InterPro:IPR005845" /db_xref="InterPro:IPR005846" /db_xref="InterPro:IPR006352" /db_xref="InterPro:IPR016066" /translation="MGRLFGTDGVRGVANLELTAELAYKLGQAGAYVLTSETKHTPKI LVGMDTRISGDMLEASLVAGLCSVGAEVACLGIAPTPTVAYLTRYYNADAGVVISASH NPYEFNGIKFFNSKGYKLSDALEERIESIILDNSEKIQLPTGEKIGRKIEIESPLDDY VNFIKSTIKGDLKGLKVAIDCANGASYQVAPVTFFELGADVCVINNEPDGVNINKDCG STHIEQLQKFVIESGADVGLAFDGDADRVLAVDENGNMVDGDQIMAIIGLELKKQGKL TNNTIVATVMSNLGLDIMAKREGINIVKTKVGDRYVLENMLENGHVLGGEQSGHIIFL EHSTTGDGILTGAQLLNVVKSSGKKLSELASIMQVLPQVLMNARVSNQNKEKYLEDEV ICEMCKELENEFRDEGRVLIRPSGTEPLVRVMIEGKDRDYIEKRALELVKVIEERLG" misc_feature complement(6855..8198) /locus_tag="ClothDRAFT_2575" /note="phosphoglucosamine mutase; Provisional; Region: glmM; PRK14316" /db_xref="CDD:184616" misc_feature complement(6879..8192) /locus_tag="ClothDRAFT_2575" /note="GlmM is a bacterial phosphoglucosamine mutase (PNGM) that belongs to the alpha-D-phosphohexomutase superfamily. It is required for the interconversion of glucosamine-6-phosphate and glucosamine-1-phosphate in the biosynthetic pathway of UDP-N-...; Region: GlmM; cd05802" /db_xref="CDD:100095" misc_feature complement(order(6936..6938,6951..6959,6963..6965, 7212..7214,7218..7220,7224..7226,7275..7283,7344..7346, 7464..7469,7473..7475,7479..7481,7869..7871,7893..7901, 8169..8171,8178..8180,8184..8186)) /locus_tag="ClothDRAFT_2575" /note="active site" /db_xref="CDD:100095" misc_feature complement(order(6936..6938,6951..6959,6963..6965, 7212..7214,7218..7220,7224..7226,7275..7277,7281..7283, 7344..7346,7464..7466,7899..7901,8178..8180)) /locus_tag="ClothDRAFT_2575" /note="substrate binding site; other site" /db_xref="CDD:100095" misc_feature complement(order(7467..7469,7473..7475,7479..7481, 7899..7901)) /locus_tag="ClothDRAFT_2575" /note="metal-binding site" /db_xref="CDD:100095" gene complement(8411..9997) /locus_tag="ClothDRAFT_2576" CDS complement(8411..9997) /locus_tag="ClothDRAFT_2576" /inference="protein motif:PFAM:PF01266" /note="PFAM: FAD dependent oxidoreductase; KEGG: dar:Daro_3016 FAD dependent oxidoreductase" /codon_start=1 /transl_table=11 /product="FAD dependent oxidoreductase" /protein_id="ZP_05430715.1" /db_xref="GI:256005762" /db_xref="InterPro:IPR000759" /db_xref="InterPro:IPR006076" /db_xref="InterPro:IPR013027" /translation="MKLIVRNLKLSLDEDIDALKKLVCKKIKVSEKDFKNFRIVKESI DARKKPFINLVYSVMVEIEGKIKVRESTDISILEQETEKVLVPGSIKLKNRPVVIGSG PAGLFAGLVLAQNGYRPLILERGECVEKRTQIVNRYWTTGELDPETNVQFGEGGAGTF SDGKLTTRINDRRCSIVLEEFYKSGAHEEILYKAKPHIGSDVLKKVVSNMRNKIIEYG GEVRFNSKVTSIIVKNGSITSIVVNDKEEIPCEVAVLAIGHSARDTFKMLFDKGVEFI QKPFSIGVRIEHPQELIDRAQYGEAAGHPRLGAADYQLFQKLGDRTVYSFCMCPGGVV VASASEPGMIVTNGMSEFARDKENANSALVVSVEPGDFGSSHPLAGVDFQRKWERLAF VAGGSCNRAPVQRLGDFIEGRKSTFLGTVKPSYTGGTNLADIHSCLPTFVTDSIKKAI PYFDSKIKGFGMKDAVITGVETRTSSPVRIPRGDTLEAIGIKGLYPAGEGAGYAGGIV SAAVDGIRIAEKIISTYSYE" misc_feature complement(8414..9979) /locus_tag="ClothDRAFT_2576" /note="Uncharacterized FAD-dependent dehydrogenases [General function prediction only]; Region: COG2509" /db_xref="CDD:32579" misc_feature complement(<9623..9709) /locus_tag="ClothDRAFT_2576" /note="Pyridine nucleotide-disulphide oxidoreductase; Region: Pyr_redox; cl14644" /db_xref="CDD:187400" misc_feature complement(<9227..>9370) /locus_tag="ClothDRAFT_2576" /note="Pyridine nucleotide-disulphide oxidoreductase; Region: Pyr_redox; cl14644" /db_xref="CDD:187400" gene complement(10014..11225) /locus_tag="ClothDRAFT_2577" CDS complement(10014..11225) /locus_tag="ClothDRAFT_2577" /inference="protein motif:PFAM:PF07949" /note="PFAM: YbbR family protein; KEGG: pca:Pcar_1000 hypothetical protein" /codon_start=1 /transl_table=11 /product="YbbR family protein" /protein_id="ZP_05430716.1" /db_xref="GI:256005763" /db_xref="InterPro:IPR012505" /translation="MNELLKKDLTLKIISVFFAIFLWFIVLDSSNPVTWVELNVPLKV ENESSLKEKGIMLKNENFPRNVSVSLKGRKSAFNNIGLNDIEAIVDLSKVEDVNTQFL YVNVYTNKKGVSFQGVTPRVVEIELEKLGENPFPVNVVITGKPKEGYTVVKANAIPTT VSIEAPDEIINSIGEVRAYVDVDNLSNDIIINKECVVYNKEGEKIVELDKKISVDINI EIAKEVPIVPAVRGRPAKNYTDGIHRVVPEKAWISGPSDVIDLIDNLKTEPIDIENMS QSMTKIVNLVLPDGVRLVDTPRSVYVDVVIEELAEREFVFNKESIAFDNAVKNNSLKY EILDDEIKITLTGTRQELNKISPESLKLSVDVGGLSEGEYKRPLNVVIPDTVNLSGSY DVKISVKKTGS" misc_feature complement(10032..11225) /locus_tag="ClothDRAFT_2577" /note="Uncharacterized protein conserved in bacteria [Function unknown]; Region: COG4856" /db_xref="CDD:34465" misc_feature complement(10611..10823) /locus_tag="ClothDRAFT_2577" /note="YbbR-like protein; Region: YbbR; pfam07949" /db_xref="CDD:149173" gene complement(11222..12100) /locus_tag="ClothDRAFT_2578" CDS complement(11222..12100) /locus_tag="ClothDRAFT_2578" /inference="protein motif:PFAM:PF02457" /note="PFAM: protein of unknown function DUF147; KEGG: pca:Pcar_0999 hypothetical protein" /codon_start=1 /transl_table=11 /product="protein of unknown function DUF147" /protein_id="ZP_05430717.1" /db_xref="GI:256005764" /db_xref="InterPro:IPR003390" /db_xref="InterPro:IPR014046" /translation="MFFLVGTTNFWDIIANLSTNLDIKSPWDLIKTIIDIGIVSFVIY KLIKLIRETRAWQLIKGILVIVIAARASELIGFKTLSFILRLTIEYMAIILVVLFQPE FRRGLEQLGRSRFRNLFSFEEEDSTIKVKSLIEEIIKAVTEMSRTFTGALIVIERETK LGEIINSGINLDSNVTSELLINIFTPNTPLHDGAVVIRDNKIKAAACFLPLTENPNLS KELGTRHRAALGISEVSDAIVVVVSEESGRISVALNGGLTRNLTSDTLRKALSKNLLD KENPSKKLGIWKVKAK" misc_feature complement(11303..12028) /locus_tag="ClothDRAFT_2578" /note="Uncharacterized conserved protein [Function unknown]; Region: COG1624" /db_xref="CDD:31811" misc_feature complement(11327..11692) /locus_tag="ClothDRAFT_2578" /note="DisA bacterial checkpoint controller nucleotide-binding; Region: DisA_N; pfam02457" /db_xref="CDD:145543" gene complement(12226..13095) /locus_tag="ClothDRAFT_2579" CDS complement(12226..13095) /locus_tag="ClothDRAFT_2579" /inference="protein motif:PFAM:PF04055" /note="PFAM: Radical SAM domain protein; KEGG: gme:Gmet_1006 radical SAM family protein" /codon_start=1 /transl_table=11 /product="Radical SAM domain protein" /protein_id="ZP_05430718.1" /db_xref="GI:256005765" /db_xref="InterPro:IPR007197" /translation="MEAAKPAMFYDKGEDLKVHCRLCPHNCTISPGNLGVCRARKNID GDLYSLNYGKISSIALDPIEKKPLYRFKSGSKILSIGTFGCNLKCSFCQNWEIAHDNP RLYEVTSETVVSKAKELVSEGNIGIAYTYNEPTIWYEFVYDTAVLAKEEGLSNVLVTN GFIGREALLMLLPYIDAMNIDVKAYTASFYKNICGGVLENVKETVELAAEKCHVEVTT LVIPTLNDELKEISEIAKWLSSISRKIPLHLSRYFPNYKMLNIPPTPKDTLFRAREEA QKYLDYVYLGNVW" misc_feature complement(12229..12978) /locus_tag="ClothDRAFT_2579" /note="Pyruvate-formate lyase-activating enzyme [Posttranslational modification, protein turnover, chaperones]; Region: PflA; COG1180" /db_xref="CDD:31373" misc_feature complement(12262..12852) /locus_tag="ClothDRAFT_2579" /note="Radical SAM superfamily. Enzymes of this family generate radicals by combining a 4Fe-4S cluster and S-adenosylmethionine (SAM) in close proximity. They are characterized by a conserved CxxxCxxC motif, which coordinates the conserved iron-sulfur cluster...; Region: Radical_SAM; cd01335" /db_xref="CDD:100105" misc_feature complement(order(12340..12345,12436..12438,12559..12561, 12616..12624,12697..12702,12706..12708,12817..12825, 12829..12831,12835..12837,12841..12843)) /locus_tag="ClothDRAFT_2579" /note="FeS/SAM binding site; other site" /db_xref="CDD:100105" gene complement(13107..14495) /locus_tag="ClothDRAFT_2580" CDS complement(13107..14495) /locus_tag="ClothDRAFT_2580" /inference="protein motif:PFAM:PF01871" /note="PFAM: AMMECR1 domain protein; Extradiol ring-cleavage dioxygenase class III protein subunit B; KEGG: dal:Dalk_3956 AMMECR1 domain protein" /codon_start=1 /transl_table=11 /product="AMMECR1 domain protein" /protein_id="ZP_05430719.1" /db_xref="GI:256005766" /db_xref="InterPro:IPR002733" /db_xref="InterPro:IPR004183" /db_xref="InterPro:IPR005829" /translation="MGRIISSYIFPHPPLIVPEIGKGDEKGAIKTIEACEKAAEQIRK EKPSTIILTTSHAPLFEDYIFINDHKTLKGNFSRFGARKVELGFENNLKMVESIIEFA KKEGFDAGGISEGIGRRYGISGELDHGALVPLYYISRVYSDFKLVHVAMSTLTLEEHY KFGMCIGEAVRNSDEDVVFVASGDLAHRLTSDGPYGYNKHAPEFDELLVKSIEKDDID RILDIDDKLRDEAAECGLRSFVIMLGALDGYSVVPEVYSYEGPFGVGYMVARIGVGAM DSSRRIIENRRNKRKKSTDPYVSLAKRALEAYVTEGRVLDDYSGLPEEMLNSRAGTFV SIKKKGELRGCIGTIGPTRENIASEIVHNAISAGTSDPRFYPVKPYELDELEYSVDVL MEPEEINSMDELDVVKYGVIVRAGRRTGLLLPNLENVNTVEQQVSIALQKAGISPNEK YTMERFEVIRHK" misc_feature complement(13110..14492) /locus_tag="ClothDRAFT_2580" /note="hypothetical protein; Provisional; Region: PRK03881" /db_xref="CDD:179666" misc_feature complement(13686..14471) /locus_tag="ClothDRAFT_2580" /note="The N-terminal domain, an extradiol dioxygenase class III subunit B-like domain, of unknown proteins containing a C-terminal AMMECR1 domain; Region: ED_3B_N_AMMECR1; cd07951" /db_xref="CDD:153388" misc_feature complement(13110..13607) /locus_tag="ClothDRAFT_2580" /note="AMMECR1; Region: AMMECR1; cl00911" /db_xref="CDD:186253" gene complement(15309..16460) /locus_tag="ClothDRAFT_2581" CDS complement(15309..16460) /locus_tag="ClothDRAFT_2581" /inference="protein motif:COG:COG2367" /note="KEGG: gur:Gura_3441 beta-lactamase class A-like protein" /codon_start=1 /transl_table=11 /product="Beta-lactamase class A-like protein" /protein_id="ZP_05430720.1" /db_xref="GI:256005767" /db_xref="InterPro:IPR000871" /translation="MFIICIRKKNSVKERICKILKGKIRNYFVLVVTFFMGVAFVMYS GNLASMGMKSNEYNKGNYEAHKAYYAGTYEYGTDYDVEDDLYSLEFDDELLNDELEYL EDIGEPFYYEDLDNDFDNTLENQVEKDTYAALENKLRKYISKYNCYFGIYFVDLESGK EFGINDTEEFFAASTFKIPLNLYVYDMIRKGMLDPMTSLEYTEEDFEGGTGIIWNNES FGKTFTIKELLRLSIVYSDNVAVNMLLRCVGKANVKEYMRRLGGVVVDDGKNVSCPRD MAMYLKEVYELSENGDPWGRELVQNMINTKFYDRLPVLLPKNLKIAHKTGNYTGVVHD VGIVYAEKPYIVVVMTKNVKNGQSANKAIANISKMIYDYVVKQSGKDLD" sig_peptide complement(16311..16460) /locus_tag="ClothDRAFT_2581" /note="Signal predicted by SignalP 3.0 HMM (Signal peptide probabilty 0.774) with cleavage site probability 0.310 at residue 50" misc_feature complement(15339..16106) /locus_tag="ClothDRAFT_2581" /note="Beta-lactamase; Region: Beta-lactamase; cl01009" /db_xref="CDD:186300" gene complement(16664..17539) /locus_tag="ClothDRAFT_2582" CDS complement(16664..17539) /locus_tag="ClothDRAFT_2582" /EC_number="1.3.1.26" /inference="protein motif:TFAM:TIGR00036" /note="KEGG: buc:BU146 dihydrodipicolinate reductase; TIGRFAM: dihydrodipicolinate reductase; PFAM: dihydrodipicolinate reductase" /codon_start=1 /transl_table=11 /product="dihydrodipicolinate reductase" /protein_id="ZP_05430721.1" /db_xref="GI:256005768" /db_xref="InterPro:IPR000169" /db_xref="InterPro:IPR000846" /db_xref="InterPro:IPR011770" /translation="MIRVCLVGLGKTGKEIAKVILEQENMKLVSVVCSSKSQNLGKSL DEIIGCRNSGIIVDSEKNLEQVIFKTKPDVVVDFSTPDATIRNAKIFSKMKVNIVVGT TGFTDFALKKLFVLTRKYHNAICYAPNITLGVNVLMLLTNLAASILNNYDFQITEIHH KRKVDVPSGTAIKIAGEIKKGLDSAGVSIKEKVIPINAVRAGGVVGRHEVMIVGEDDK IEISHESFSRRAFALGAIKAIEFIHDKVGYYEMSDVLNLHKVLEDYIEKEQIKRKKKY KKCRNDVEESPVSVV" misc_feature complement(16769..17539) /locus_tag="ClothDRAFT_2582" /note="dihydrodipicolinate reductase; Provisional; Region: PRK00048" /db_xref="CDD:178822" misc_feature complement(17153..17536) /locus_tag="ClothDRAFT_2582" /note="Rossmann-fold NAD(P)(+)-binding proteins; Region: NADB_Rossmann; cl09931" /db_xref="CDD:186874" misc_feature complement(16775..17143) /locus_tag="ClothDRAFT_2582" /note="Dihydrodipicolinate reductase, C-terminus; Region: DapB_C; pfam05173" /db_xref="CDD:147385" gene complement(18138..19385) /locus_tag="ClothDRAFT_2583" CDS complement(18138..19385) /locus_tag="ClothDRAFT_2583" /inference="protein motif:PFAM:PF00768" /note="PFAM: peptidase S11 D-alanyl-D-alanine carboxypeptidase 1; KEGG: lpf:lpl1517 hypothetical protein" /codon_start=1 /transl_table=11 /product="peptidase S11 D-alanyl-D-alanine carboxypeptidase 1" /protein_id="ZP_05430722.1" /db_xref="GI:256005769" /db_xref="InterPro:IPR001967" /translation="MYRRVLIQIQCFTVAMMILFFSQSPVFAVAEPPEIKAPSAILME VQRGQILYQKNPKLKLHVSCANKIMTGLIALEKMQNQLNTNITVSKKAVSVEGAVLNL EVGGKYPVEDLIYSVLLGSANDSANVLAEYIGGDEKGFVELMNKKAQELEMKDTYFTN PTGLYDEKQYTTAYDLAVLIRYALTKSSTFNEMFSAKARPWVDGTQILINSNELFWSY DGVDGGKTGYNEIDRQTAITTATRNGQRLICIVLDSPEESMYDDSVKLLDYGFLNFRT GILVSMGQPLKKVTVGDKVIDLVSIGDYYYTYPAGENYIKNIEFKVPEKFDPPVLKSD VLGIAKYTLEDGTVIEVSLHPAVDVYSSMGLFESLINQVKEYRDIVILLCILLVIELF IAVYHIVRLIKRLFLKLVYKPGK" sig_peptide complement(19299..19385) /locus_tag="ClothDRAFT_2583" /note="Signal predicted by SignalP 3.0 HMM (Signal peptide probabilty 0.999) with cleavage site probability 0.639 at residue 29" misc_feature complement(18255..19370) /locus_tag="ClothDRAFT_2583" /note="D-alanyl-D-alanine carboxypeptidase [Cell envelope biogenesis, outer membrane]; Region: DacC; COG1686" /db_xref="CDD:31872" misc_feature complement(<18846..19322) /locus_tag="ClothDRAFT_2583" /note="Beta-lactamase; Region: Beta-lactamase; cl01009" /db_xref="CDD:186300" misc_feature complement(18309..18566) /locus_tag="ClothDRAFT_2583" /note="Penicillin-binding protein 5, C-terminal domain; Region: PBP5_C; pfam07943" /db_xref="CDD:149169" gene 19618..19761 /locus_tag="ClothDRAFT_2584" CDS 19618..19761 /locus_tag="ClothDRAFT_2584" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05430723.1" /db_xref="GI:256005770" /translation="MAKNKKKQKDVKDAKYEFANDQLGENTEPRYEEMKQDKKGGKKA GKK" gene 19953..21101 /locus_tag="ClothDRAFT_2585" CDS 19953..21101 /locus_tag="ClothDRAFT_2585" /inference="protein motif:PFAM:PF04015" /note="PFAM: protein of unknown function DUF362; 4Fe-4S ferredoxin iron-sulfur binding domain protein; KEGG: gur:Gura_4011 hypothetical protein" /codon_start=1 /transl_table=11 /product="protein of unknown function DUF362" /protein_id="ZP_05430724.1" /db_xref="GI:256005771" /db_xref="InterPro:IPR001450" /db_xref="InterPro:IPR007160" /db_xref="InterPro:IPR017900" /translation="MSKVALIRCESYDYDAVKSAVKRGLDLIGGPHRFAAPNEKILLK PNLLSADPPERCSTTHPSVFKAVAEIFMEAGITNLSYGDSPGIHKPITAARKNGIEKA ANELGIKLADFLEGKEVFFENAIQNKKFIIANGVLESDGIISLPKLKTHGFARMTGCV KNQFGCIPGPLKGEFHVRIPSIIDFSKMLVDLNVYLKPRLFVMDGIIAMEGNGPRGGT PRKINAILLSEDPIALDATVCRMINLNPEFVPTIVFGKEAGLGTYDENEIEILGDDIQ SFITYDFDVRREPVKPFKPGGAIQFFRNFIVPKPYILKNKCIKCGVCVNACPVKPKAV DWHNGNKKEPPTYIYKRCIRCYCCQELCPESAIHLKVPFIRKFFYNPK" misc_feature 19959..20837 /locus_tag="ClothDRAFT_2585" /note="Domain of unknown function (DUF362); Region: DUF362; cl00879" /db_xref="CDD:120200" misc_feature 20880..20939 /locus_tag="ClothDRAFT_2585" /note="4Fe-4S binding domain; Region: Fer4; pfam00037" /db_xref="CDD:143826" gene complement(21118..21765) /locus_tag="ClothDRAFT_2586" CDS complement(21118..21765) /locus_tag="ClothDRAFT_2586" /inference="protein motif:PFAM:PF07238" /note="PFAM: type IV pilus assembly PilZ" /codon_start=1 /transl_table=11 /product="type IV pilus assembly PilZ" /protein_id="ZP_05430725.1" /db_xref="GI:256005772" /db_xref="InterPro:IPR009875" /translation="MKVGEIASICHYSGKTWFKSVVLQVEKDLLVVKLVKEFVILNFL ENDPVVLGYEENDEVFIAGCIVKGIDPDCSYIKLKVESVRSLKEQRECERFPVSFYAK IKCDDSDKINVATIKNMSFDGLMINTAADFPLKKNIEVTIYPTFQEVKIDEDVDKTVI SLRSDIVRKEAFTRYFEYRLKITNIDAQNQNLLRLYLQSIKGLQQRFLKDLKEKL" misc_feature complement(21175..21504) /locus_tag="ClothDRAFT_2586" /note="PilZ domain; Region: PilZ; cl01260" /db_xref="CDD:163963" gene 22162..22977 /locus_tag="ClothDRAFT_2587" CDS 22162..22977 /locus_tag="ClothDRAFT_2587" /inference="protein motif:PFAM:PF02582" /note="PFAM: protein of unknown function DUF155; KEGG: gur:Gura_1501 hypothetical protein" /codon_start=1 /transl_table=11 /product="protein of unknown function DUF155" /protein_id="ZP_05430726.1" /db_xref="GI:256005773" /db_xref="InterPro:IPR003734" /translation="MVFKAYAVTNEIDLNRIAAKCNIPKKYTWEEPLILNENVLSSIF NKEIPEGQKILVFSFGSIVFINCPSEHEKLFIEYLKNEKIDIDVENYKEYSDDYELQV RENAEIELTDSYLTVPKFEFFYPELVSTVIAKSVALEKTEEHLSTILDTLETMIDKLE KGKLNVGNKEIAKTTSKIVRHEYNTIAYIMILDKPDITWTNSDAKNLYDMMSEFFELN DRYITLKEKTDILNNVLSGFSSISHSMRGLFVEWVIVILIFVEIILMLADLLK" misc_feature 22321..22839 /locus_tag="ClothDRAFT_2587" /note="Uncharacterized ACR, YagE family COG1723; Region: DUF155; cl00751" /db_xref="CDD:153973" gene 23000..23809 /locus_tag="ClothDRAFT_2588" CDS 23000..23809 /locus_tag="ClothDRAFT_2588" /inference="protein motif:PFAM:PF02582" /note="PFAM: protein of unknown function DUF155; KEGG: gur:Gura_1501 hypothetical protein" /codon_start=1 /transl_table=11 /product="protein of unknown function DUF155" /protein_id="ZP_05430727.1" /db_xref="GI:256005774" /db_xref="InterPro:IPR003734" /translation="MKTVHFISYKVAASLPLDKIAAFLKTNMKFTWDEYIVVGGEQLD TILKYHSEDKAVYLFKYGCISFVNFTDKEIYSFLKYLESITSRINYNLMPRYHESHNV TIDENLKCSLFENKSVEVDYDKNIDHILSIVLARSTQMLFFETQVNNLLDSAEKFVIL LQKGRLLTFTKKSYAIMAKILRFEFDSLSCIRIFEHPALGKHSIKLKEIYDILAEYYE FGGRFNVMQSKIKDLRKIVGMYSSLSYSETETRLLLFEIFLLSLFSLAHII" misc_feature 23165..23677 /locus_tag="ClothDRAFT_2588" /note="Uncharacterized ACR, YagE family COG1723; Region: DUF155; cl00751" /db_xref="CDD:153973" gene complement(24293..24739) /locus_tag="ClothDRAFT_2589" CDS complement(24293..24739) /locus_tag="ClothDRAFT_2589" /inference="protein motif:PFAM:PF04509" /note="PFAM: CheC domain protein; KEGG: dal:Dalk_0295 CheC domain protein" /codon_start=1 /transl_table=11 /product="CheC domain protein" /protein_id="ZP_05430728.1" /db_xref="GI:256005775" /db_xref="InterPro:IPR007597" /translation="MDVKNAFVETAMGVLSEFGFSSVFAEKNETGGLVEAEYVNVVMG VNGAISGNLIMTAKKESALAIASAMLGGMEFTEVDDMVKSAIGELLNIIAGNAFSKVD VKAAVYISTPTLLIGEGISVLLQSPGTNKLVFDMDGQSMDVFLDIE" misc_feature complement(24299..24739) /locus_tag="ClothDRAFT_2589" /note="Predicted inhibitor of MCP methylation, homolog of CheC [Cell motility and secretion]; Region: COG1406" /db_xref="CDD:31596" gene complement(25067..26527) /locus_tag="ClothDRAFT_2590" CDS complement(25067..26527) /locus_tag="ClothDRAFT_2590" /EC_number="2.4.2.11" /inference="protein motif:TFAM:TIGR01513" /note="KEGG: msu:MS1889 nicotinate phosphoribosyltransferase; TIGRFAM: nicotinate phosphoribosyltransferase; PFAM: Nicotinate phosphoribosyltransferase-like; Quinolinate phosphoribosyl transferase" /codon_start=1 /transl_table=11 /product="nicotinate phosphoribosyltransferase" /protein_id="ZP_05430729.1" /db_xref="GI:256005776" /db_xref="InterPro:IPR002638" /db_xref="InterPro:IPR006405" /db_xref="InterPro:IPR015977" /translation="MKKINWNQSENLSMLTDFYELTMGNGYFENGIGDRIAYFDMFFR RVPENGGFAIMAGLAQVIEYINNLKFEDDDIEFLRSKGIFSEDFLKYLKDFKFCCDIW AIPEGTPIFPNEPIITVRGPVIQAQFIETMILLTINHQSLIATKANRIVRAAQGRPVL EFGTRRAQGYDGAVLGARAAYIGGCAGTACAIADRDFGVPASGTMAHSWVQLFPSELE AFRAYARVYPDNCVLLVDTYNVLKSGVPNAIKVFKEEVVPRGFRPKGIRIDSGDIAYL SKEARKMLDEAGFPDCKIVVSNSLDEYIIRDILQQGAQVDIFGVGERLITSKTEPVFG GVYKLVAVEENGTIIPKIKMSENVVKITNPGYKKVFRLFDRKNNKAIADVIVNAGEVI DDSKPYEIFDPDHTWKRKTVTDFYAKELQVQIFDKGKCVYKVPEINEIRDYCREQINT LWDEVLRFENPHKYYVDLSEELWNIKNKLLKEHTLL" misc_feature complement(25112..26515) /locus_tag="ClothDRAFT_2590" /note="nicotinate phosphoribosyltransferase; Validated; Region: PRK09243" /db_xref="CDD:181722" misc_feature complement(25508..26491) /locus_tag="ClothDRAFT_2590" /note="Nicotinate phosphoribosyltransferase (NAPRTase), subgroup A. Nicotinate phosphoribosyltransferase catalyses the formation of NAMN and PPi from 5-phosphoribosy -1-pyrophosphate (PRPP) and nicotinic acid, this is the first, and also rate limiting...; Region: NAPRTase_A; cd01570" /db_xref="CDD:29617" misc_feature complement(order(25553..25555,25562..25567,25571..25573, 25634..25639,25721..25723,25961..25966,26030..26038)) /locus_tag="ClothDRAFT_2590" /note="active site" /db_xref="CDD:29617" gene complement(26539..27213) /locus_tag="ClothDRAFT_2591" CDS complement(26539..27213) /locus_tag="ClothDRAFT_2591" /inference="protein motif:PFAM:PF00857" /note="PFAM: isochorismatase hydrolase; KEGG: ccv:CCV52592_0502 cytoplasmic membrane protein" /codon_start=1 /transl_table=11 /product="isochorismatase hydrolase" /protein_id="ZP_05430730.1" /db_xref="GI:256005777" /db_xref="InterPro:IPR000868" /translation="MKVLQKNEFLQKSNETLASILDMLEKLPVVKFDEIEADKAVLVI IDMTNGFAKEGALKSDAVKELIPRICELSEICDRRKIRKIAFADCHTDESPEFDAYPK HCMKGTAESEIVDEIKNIGGYTLIEKNSTNGFLEEAFRKWLLENPDINTFILTGDCTD ICVQQFAITLKAYFNMNNKRARVIVPLNAVDTYDLGVHDRNLMNVMAAYNMIINGVEV VRDIVE" misc_feature complement(26575..27096) /locus_tag="ClothDRAFT_2591" /note="Isochorismatase family; Region: Isochorismatase; pfam00857" /db_xref="CDD:144449" misc_feature complement(26599..27093) /locus_tag="ClothDRAFT_2591" /note="Cysteine hydrolases; This family contains amidohydrolases, like CSHase (N-carbamoylsarcosine amidohydrolase), involved in creatine metabolism and nicotinamidase, converting nicotinamide to nicotinic acid and ammonia in the pyridine nucleotide cycle. It...; Region: cysteine_hydrolases; cd00431" /db_xref="CDD:29548" misc_feature complement(order(26728..26730,26830..26832,27076..27078)) /locus_tag="ClothDRAFT_2591" /note="catalytic triad; other site" /db_xref="CDD:29548" misc_feature complement(26740..26745) /locus_tag="ClothDRAFT_2591" /note="conserved cis-peptide bond; other site" /db_xref="CDD:29548" gene complement(27380..27574) /locus_tag="ClothDRAFT_2592" CDS complement(27380..27574) /locus_tag="ClothDRAFT_2592" /inference="protein motif:TFAM:TIGR02861" /note="TIGRFAM: small acid-soluble spore protein, H-type; PFAM: small acid-soluble spore H family protein" /codon_start=1 /transl_table=11 /product="small acid-soluble spore protein, H-type" /protein_id="ZP_05430731.1" /db_xref="GI:256005778" /db_xref="InterPro:IPR012610" /translation="MDAARAQQIIESDQVIEVLHEGSPVWIEKVMDNNMAHVSYIHTK EEKDVPLYMLVEKELPKNFH" misc_feature complement(27407..27574) /locus_tag="ClothDRAFT_2592" /note="Small acid-soluble spore protein H family; Region: SspH; cl06949" /db_xref="CDD:186692" gene 28066..28185 /locus_tag="ClothDRAFT_2593" CDS 28066..28185 /locus_tag="ClothDRAFT_2593" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05430732.1" /db_xref="GI:256005779" /translation="MFFRGVLSEFFERISLCTYTNKSLNQKKKKKEKDREKEK" ORIGIN 1 aattcttcgg tctggacacc attagattta aattattgac cttcaggtaa tcgatatgtt 61 tgtcaaaata ctctctgcaa acctgtttat caacaaaaac ccttacacat ctttttggtt 121 ttgaaaaaaa agattctttc aataaataat tacagttttt ccaatctgac agtcatacct 181 aatccatcgt ttaaaaccgg cagtatattt aaaaaaaata atcccgcagc cgttcaggat 241 tcttcctgct tcgaccacgg aattttgaag caaacttatt tttattttat ttatagacta 301 aactttatta tcatggagtt gtatatttaa aataaactcc gctccaaacc actttccctc 361 aaacccttat gccttctagt cttaacccta ttctcctaat ctcttccaga taataaagtc 421 cgctctaaaa ttccatattt tcatcccatt tattaacact ttttccttat ttcttgtaac 481 attttttaaa ataaagtcgg ttctaaatag gggtaaggtg caagatgaac agggtaaagt 541 ttcaagggtt aagggataag agttcatttc acttttccat tgctttatca atattatctt 601 caatatagtc ttcaatccct ttaaaatcaa tacttctaac cttatctaat acttcttaac 661 cataataacc ttattcctta caccttaacc ctttcacctg ttaaaatgca aaccccgcag 721 caaatgaaga tttctcctgc atctactgcg aggttttgga acggactata tttttataga 781 gcgaagttta ttattatgga gtggagttta tttgtattat acacctacgt ccactccttt 841 tgcaaataac gcttcggcta ttggaagagt accgaatata tcagcataca ttggaatgcc 901 cactacagta gcaagcatca ctgcaaatgg attattacct ccaaccacat tttctatgaa 961 tgactgtgga atccagttat gaatagccgc ccctatgcct acaccgatta atacatatag 1021 ccaaaccctt ttgataatat ctctgacctg ttcctttgaa tatgatattc tttccttacg 1081 agtcatttca ggcacttccg catcaacatt ttcaatttcc cttacatatc cttctacata 1141 tttttcaagt ctaaactttt ctattaaagt tcctccaata actgccaaaa ttaagcctac 1201 tacaacatag gctatggcaa ttttaagacc gaaaaatgaa attaacaaca ttaatgacgc 1261 caaatctacc attggcgaag atattaagaa agaaaaggtt atgcctaaag gcaatccagc 1321 cgaagtaaaa cctataaaaa ttggtatact ggagcaactg caaaagggag ttatcgtacc 1381 aagcagtgcc ccaagtatat tccctttaat gccttttatc tttccgagaa tcttctttgt 1441 cctctctggc ggaaaataac tctggatata ggatatgaca aatattaata gtgataataa 1501 tataaatatt ttaattgtat cgtatataaa aaagtgaata cttccgccta tcctttcgct 1561 aacaggtaaa ccaaatactt tttccacaag aagtcttacc aattctgaaa gccatctcat 1621 ttttaatagt tggtcattta accaaccgaa tatcatggct aatatgttca tatgaaaaca 1681 tcccctttac cccttacaca cttcaagtta tttttcaaca tgtttgcact tttcaacttc 1741 actgcaattc tcttattttg attaattaca taccgcttat caaatctgat tgttctttac 1801 tctctgtatt aaatcctcga ctttttcctt aattatatct cttgtttttc tgtaatcctc 1861 tattggtccg cctgacgggt cactaagccc ccaatcttct atatgctggc atggtacata 1921 agggcattct acattacatc ccatcgttat taatatatct acttccgccg gaatatcgct 1981 taatagtttc ggatgatggt cactcatatc cactcctgct tcttccatta cctgtactgc 2041 tagtggcttc acttcagggt atttttccgt ccctgccgaa tatgcttcta atacgtcact 2101 tcccaacttc tttgcccaac cttctgccat ttgagaacgg caagagttgt ggacacatac 2161 aaaagcaacc ttctttttca ttcgatacca cctttttcta caaggttatt gaaaccaatg 2221 ccttgtacta tttgcaatcc tgaccaatgt aagcatgacc gggacttcaa ccaatacccc 2281 tacaactgtt gcaagagcgg ctccagattc cagtccaaag agtgaaattg ccactgcaac 2341 tgcaagttca aagaaattgc ttgctccaat cattcccgca ggtgctgcaa tatcatgggg 2401 aagtttccat atctttgccc atccataagc aatgaagaat ataaagaatg tctggataat 2461 taatggtatg gcaattaata taatatgcaa gggattactt aaaattattt caccctggaa 2521 cgagaaaata attactaaag tgagaagcaa acctacgatt gttacattat caaatttctt 2581 gagaaaaatg ttctcgaaat actctatact cttatgttta atgatgttcc ttctagtaag 2641 gtaccctcct gccaatggaa taacaacaaa caggattgtt gataatatca gcgtgtcata 2701 aggaacggtc acattactta cccctaatag gaatgcaaca attggtgtaa atgcaaacaa 2761 tattatcagg tcattcactg ctacctgcac taatgtataa gcagggtcgc cttttgtcag 2821 ataactccat acgaatacca tggcggtaca tggtgcggct cctaataata ctgcacctgc 2881 aagatagtct gtcgctaaat ccggaccaat ccacctactg aacactactt tcaagaaaaa 2941 cgctgcaata agatacattg taaaaggctt gataagccag tttgttacac aagtaactat 3001 tagtcccttc ggtttttttg ttgccctgac aatgcttgaa aaatcaattt tcagcatcat 3061 tgggtaaatc attagccata tgagaatagc aacaggaatt gatacatttg catattcaaa 3121 tttgcttaaa gtttcaggga ttgaaggaac taattgtcct attgcaactc ctactataat 3181 gcatactgct acccatactg taaggtactt ttcaaaaaaa cctaatcctt tattttcttg 3241 cattgtttct ttgtcactca agttttatgc cccctatcaa tttaaattat cttgttctta 3301 ctatatgatt atattcagtt ataatcatat agtgactaat ttaaagtttt tacagaaaaa 3361 taactaaaat cagttttcta ttattaataa ttttcattaa ttgttattgc actgctctcg 3421 aagatactta agaacctgac ttttatcttc ccgtagttgc tcacatgtaa agttactgtt 3481 tttatatttt ttaagtgtct ctatatctct taacaattgt gtattttcag ccatcttgtt 3541 tttaataaat tcatacagta ggttattttc ttcaataaac ttgttatcta ctctgtaata 3601 gacccattga gatttctttt cactggttat aatacctgaa gtttttaatt tatttagatg 3661 tcttgaagca ttagactgcg tcatatccag cactgtttct atctcgcaca cacagagttc 3721 ctgtcttatt agcaaattga gtattctaat tctgttttca tctcccaacg ctttaaagat 3781 ttctattaaa tccaatttat caccaccata tgattatatt caattatact catatatata 3841 atagtattga tttatttctc tgtcaacaat aaatacatta tcttataaat caaaaaatat 3901 gttttttata tttatcacat aattcaagaa tacgttccca taacataccc caaacctccc 3961 ctacgatgtg aaaatctaat tttgggaata actttattat tttagaacca actttattat 4021 catagagtca actttattat ttctaaaaca ttttccttat tccttttccc taaaaatcca 4081 tacccctaac tatgtatatt taaaataaac tccgctccaa acgactttcc ctcaaaccct 4141 tatcccttct aaccttaacc ctattcgccc aatctcttcc agataataaa gtcggttcaa 4201 aaactccata ttttcattcc atttaataac atttcttcct taattcttgt agtaattttt 4261 aaaataaagt cggttccgaa taagggcaat gtgcaaggga aaaggtataa ggttgcattt 4321 tctcatgtgc tttttccatt caagtatcaa tatataatac tctcaactcc tttaaaatca 4381 atgtctttag cctaatccct taccccttaa cccttccttc aaaaaacaaa ccccgcagca 4441 aatgaagatt tctcctgcat ctgctacggg attttggaac gaactttatt tttatagagc 4501 gaactttatt ttcctggaat caactttatt tgatttatac aggagtgaag tttatttctc 4561 ccgcccttac tccacagtca cactcttggc aagatttctg ggcttatcaa cgtcacaacc 4621 cttctgcaaa gccatgtaat aggcaaacaa ttgcagaggt gtcaccgcca ctatcggagc 4681 aataaacgaa tcaacatccg gtatggtaac aaccacgtcg gcaaccttgc acacctgctt 4741 gttgctctcc tttgctatcg caaggacaac cgcccctctg gcctttactt ccctgatatt 4801 gcttatcatc ttttccacga ggctgtcctg agtcacagga caaactacca gcgtaccctc 4861 ctcaataaga gcaatggtac cgtgtttcaa ctctcccccg gcataggcct cagagtgaat 4921 ataggaaatt tccttaagct tcagcgaacc ctccatggac agggcataat caaggcctct 4981 tccgataaag aaaatactct ttgcattata gtgctgtgat gcaaatttct gtattatatc 5041 cctgttggcc aaaacttttt ctatttcccg gggaacagcc tttaattctt ctatcacttt 5101 actgtaataa tccctgtcta ttctgcccag tttatatgca aaatccaggg ctataaggta 5161 caatgccgag agctgggtgt tgtatgcctt tgtggacgcc acggcaattt ccggacctgc 5221 ccaggtataa agaacatcat ccgactctct tgcaatcgaa cttcccacaa catttacaat 5281 ggacagaacc cttgcccctt ttttctttga ttcccttaat gcaaacaatg tgtcaatggt 5341 ctcgcccgac tgacttatta taattaccaa atccttgtcg cttataagag gatctctgta 5401 tctgaattcc gatgcaacat ccacctctac cggaattctt gccagctttt caattatata 5461 ttttccgaca accccagcat gatatgcggt gccgcatgca acaatgaaaa ttttccttat 5521 atttttcaaa tcttcagcag taatcctgat gttgtccagt actatattgc cgtcttttat 5581 tctcggattt acagtgtctc ttaccacttt aggctcctca cacatttctt tcatcatgaa 5641 atgttcgtag cctgcctttt ccgccgaagc aacatcccaa tttaccttga acactttctt 5701 ctgtaccgcc aaaccatggt tgttaaacac cttgacttcc ttgtcactca aaagtacaat 5761 ttctttatct tccaaaatat atacatccct tgtgtattca agtattgcag gaatatcaga 5821 agcaataaaa ttctcgccgt ttccaaggcc gacgataagc ggactgtctt ttcgggcggc 5881 aacaaatttg tcaggataat ctctgcaaag gacccccaat gcataagacc cctcaatttc 5941 atttatagag gtgataacag cctgaactat atcaccatga tagtggtaat ctataagatg 6001 cgccacaacc tctgtatcag tgtccgatac aaattcataa ccctccgccg caaggaactc 6061 tttcaattcg agataatttt caattatgcc gttatgtaca acggcaattt tgcctgaact 6121 gcttatatga ggatgggaat tcagatcatt cggctctccg tgagttgccc aacgggtatg 6181 acctattccg atatttccta ccggtgcgtc gcagttcacc ttttcctcca atttttcaag 6241 tcttcctttg cactttacca cttttatatt tccattgtct aaaattgcca ctccggcaga 6301 gtcatagccc ctgtactcaa gctttttaag cccgttcaga agtataggtg ctgcatctct 6361 gctacctata taaccaacta ttccacacac agatatctct cctttacagt tttatgttat 6421 ttttcaggta caaccgaaaa aagacaaaag aagtggctat catcttagac aggaaaattc 6481 actcagatcc cttttgtacc gcagttgcct gcgagtcttt gtaggaccct gacggtcgtg 6541 acaaccggaa ggtttccgcc gaaaactcga taactcaccg attgaaaaat taccggtgac 6601 ctccttctcc tcgtccacgt ggttaaaaca cgtgctggcg ctttttctat aaattcatta 6661 tggcctaaac cactatcccc ctttcgtggc acataatgaa caagatttcc ctgtccaaaa 6721 cttcttttat ttatacaaca acaggcatat tataatatat tacgccgttg tagtataatc 6781 aacttaaatt atttaatttt tatcattttt tgctcctctg tttaagtttc attttatcat 6841 ctatttatca tctaaccaag tctctcttca ataactttta caagctcaag agctcttttt 6901 tctatataat ccctgtcctt accctctatc ataaccctga caagaggttc cgttcctgaa 6961 ggcctgataa gcacccttcc ttcatcccgg aactcattct caagctcttt gcacatttcg 7021 catattactt catcttcaag atatttttcc ttattttgat tgcttacccg ggcattcatt 7081 aatacctgag gaagcacctg cattattgag gccagttcgg aaagcttttt accggaagat 7141 ttcacaacat taagaagctg tgctcccgta agaatgccgt ctcctgtagt actatgttca 7201 agaaaaataa tatgtcccga ctgctcgcct cccaaaacat gcccgttttc aagcatgttt 7261 tccagtacat atctgtctcc cacttttgtt ttaactatgt taattccttc tcttttcgcc 7321 attatatcaa gtccaagatt gctcataaca gtagctacaa tggtattgtt tgtaagcttt 7381 ccctgttttt ttagctcaag gccgattatg gccatgattt ggtcaccgtc aaccatgttg 7441 ccgttctcgt caaccgcaag aaccctgtca gcatccccgt caaaagcaag cccgacatca 7501 gctccgcttt caattacaaa tttctgcaac tgctcaatat gagtggagcc gcagtctttg 7561 ttaatattta caccgtcagg ctcgttgtta ataacacaga catccgcacc aagttcaaag 7621 aaagtaacgg gtgccacctg gtatgatgct ccgtttgcac agtcaattgc aactttaagc 7681 ccttttaaat ctcccttgat agtgctttta ataaaattta catagtcgtc caacggtgac 7741 tcaatttcaa ttttccttcc tattttctca cctgtgggaa gttgaatttt ctccgaattg 7801 tcaagaatta tggattctat tctttcttcc agggcatcgg aaagtttata tcctttgctg 7861 ttgaagaatt ttattccgtt aaactcgtaa ggattgtggg aagcagaaat taccacaccg 7921 gcatctgcat tatagtacct ggtaagataa gcaaccgtcg gagtaggagc tattcccaga 7981 caagccactt ccgctcccac cgaacataat cctgcaacaa gggaagcctc cagcatatct 8041 cccgatattc ttgtatccat gcccaccaaa attttaggtg tgtgctttgt ctcagaagtc 8101 aacacatacg ctcctgcctg ccccaattta tatgcaagct cggcggttaa ttccagattt 8161 gccactcctc ttactccatc agtaccaaac agacgtccca atacactcat ccccctaaat 8221 tatttcatct ttttaactta ttaacttaaa aacaaaatac ttcaattaaa tgtttccaga 8281 caaatatatt tataaattat tcataataac tatattatat tattcagtaa ggcaaatatc 8341 aaaaaccatt ttatgttatc cgatttgcaa aaaatttcag ataacgcatt aatatattat 8401 tcatatgcag ttactcgtat gaataggtac ttattatctt ttccgctatt ctaatgccgt 8461 caaccgctgc actcacaatt ccgcccgcat acccggctcc ttcaccggca ggatacaaac 8521 cctttatgcc aattgcttca agtgtgtccc ctcttggaat tcttacgggc gacgaggtcc 8581 tggtctccac tcctgtaata acggcatcct tcatgccaaa accttttatt ttggaatcaa 8641 aatagggtat ggcttttttt atggaatccg tcacaaatgt cggaagacag gaatgaatat 8701 cggcaagatt cgttcctccg gtataactgg gcttgactgt tcccaaaaaa gtggattttc 8761 ttccttcgat aaaatcccca agcctctgca ccggtgcccg gttgcaggaa ccgcccgcaa 8821 caaaagccag cctttcccac tttctctgaa aatcaacacc ggccagggga tggctgcttc 8881 caaaatcccc cggttccact gataccacaa gggcactgtt ggcattttcc ttgtcccttg 8941 caaattcact cattccgttt gtcacaatca tgcccggttc cgaagccgat gccacaacaa 9001 cgcctcccgg acacatgcag aatgaataca cggttctgtc gccaagtttt tgaaacagct 9061 ggtaatccgc cgctccaagt ctgggatgac ctgccgcttc accgtactgg gccctgtcaa 9121 tcagctcctg gggatgttca atcctgactc ctattgaaaa aggcttttgt atgaattcaa 9181 cccctttgtc aaaaagcatt ttgaaggtat cccttgcact atggcctatt gcaaggactg 9241 caacctcaca gggtatttct tccttgtcgt ttaccacaat tgaggttata cttccgtttt 9301 taacaattat tgaagtaact tttgaattaa accttacttc tcccccgtat tcaattatct 9361 tgttgcgcat gtttgatact acttttttta acacatcaga acctatatga ggctttgcct 9421 tgtataaaat ctcttcatgc gccccggatt tgtaaaattc ctctaaaaca atactgcagc 9481 gcctgtcatt tatcctggtg gtaagttttc cgtcagaaaa agtcccggca ccgccttctc 9541 caaactgtac attggtttct ggatcaagct cgccggtcgt ccaatacctg ttgacaattt 9601 gcgtgcgttt ttcaacacat tctccccgtt cgagaatcaa cggcctatag ccgttttggg 9661 ccagaacaag ccctgcaaac agacctgcag gacctgagcc gataaccaca ggcctgtttt 9721 taagctttat gctgccagga accaaaacct tttccgtctc ttgctctaaa atgctgatgt 9781 ccgtactttc ccttaccttt attttgcctt caatttcaac catcacagag tagacaagat 9841 tgataaaagg ttttttcctc gcatcaatgg actcttttac tatcctgaaa ttcttaaagt 9901 ccttttcact aactttaatt tttttacaaa caagtttttt taacgcatct atatcttcat 9961 ccaaagaaag ttttaaattt cgaactatta gtttcatctg cacctcgtta aacttaactt 10021 ccggtttttt tcacactgat tttaacatca tagcttccgg aaagattcac agtatcaggg 10081 ataaccacgt taaggggcct cttatactcc ccttccgaaa gcccgcctac atcaacgcta 10141 agcttgagac tctcaggcga aatcttgttc aactcctgtc tggtaccggt caaagttatt 10201 tttatctcat catccaaaat ttcatactta agtgaattat tttttactgc attgtcaaac 10261 gcaatgcttt ccttgttaaa gacaaattcc ctttctgcca gttcctcaat aaccacatcc 10321 acataaacac ttcttggagt gtcaacaagg cgaaccccat ccggcagaac gagatttaca 10381 attttggtca tgctctgcga catattttca atatcaatag gttcggtttt caagttgtca 10441 ataaggtcaa tgacgtcaga aggtcccgaa atccacgcct tttccggcac aaccctgtgt 10501 atgccgtcgg tgtaattttt tgccggtctc ccccttacgg ccggtactat aggcacttct 10561 ttcgcgattt caatattgat gtcaacactt atttttttat ccagctcaac tattttttct 10621 ccttctttgt tgtaaaccac acattccttg tttataataa tatcgttact gagattgtca 10681 acatcaacat aagccctgac ttcaccgatg gaatttatta tttcgtccgg cgcttcaatt 10741 gaaaccgttg tcggtattgc atttgccttt accactgtgt agccttcctt cggttttcct 10801 gtgataacta cattaacagg aaaaggattt tcacccagtt tttccagttc tatttccaca 10861 actctcggtg ttactccctg aaaagacaca ccttttttat ttgtataaac attgacatat 10921 aaaaactgag tattaacatc ctccaccttt gaaaggtcaa caattgcctc aatgtcattt 10981 aaacctatat tgttaaaagc gctttttctt ccctttagac tgacggaaac atttctcgga 11041 aagttctcat tcttaagcat tattcccttt tctttaagtg aactttcatt ttcaactttc 11101 aaaggcacat tcaattcaac ccaggttacc ggattagagc tgtccaaaac aataaaccag 11161 agaaatatgg cgaaaaagac agagattatt tttaaagtta aatccttctt cagtaactca 11221 ttcatttggc cttcaccttc catatcccca gtttcttgct tggattctct ttatctaaaa 11281 gatttttgct taaagccttt ctcaaagtat ccgaagtcaa gttcctggta aggccgccgt 11341 ttagggcaac cgaaatcctt ccggactctt cggaaaccac cacaacaatt gcgtctgaaa 11401 cttcacttat gccaagtgca gcccggtgcc ttgtccccag ttccttgctg agattcggat 11461 tttccgtaag gggcaaaaag catgccgccg cttttatctt gttgtccctg attactacgg 11521 caccgtcgtg taaaggcgta ttcggcgtga aaatatttat caaaagctcg gaggtaacat 11581 ttgaatccag gttaattccc gagttgataa tctcccccaa cttcgtttct ctttcaatta 11641 caataagcgc tcccgtaaag gtccttgaca tctccgttac ggcctttatt atttcctcaa 11701 tcagcgactt tactttaatg gtactgtctt cttcttcaaa gctgaaaaga tttctaaacc 11761 tgctccttcc cagctgctcc agtcctcttc tgaactcagg ctgaaacagt accacaagta 11821 ttatagccat atactctatg gtaagtctca gtataaaaga cagagtttta aaaccaatca 11881 gttcacttgc cctggccgca atcacaataa caagaatacc ttttataagc tgccacgccc 11941 gtgtctccct tatcagtttt attaatttgt atattacaaa tgacactata cctatatcta 12001 taattgtctt tatcaaatcc cacgggcttt ttatatctaa gtttgttgac aaatttgcaa 12061 tgatatccca aaaatttgtt gttcctacca gaaaaaacat ttgaaaacct cactctgagt 12121 gccaacgtta aaaatttctt ataaaagaat tataacttat ttctaaataa atgtaagctt 12181 tttttaataa aaatataatt aataattgat tacaaaaatg ttattctacc acacattgcc 12241 aagataaaca taatccagat atttttgtgc ttcttccctc gctctaaaca gagtgtcttt 12301 gggtgtcggc ggaatattca acattttgta atttggaaaa taccttgaaa gatgcagagg 12361 tatcttcctt gatatggatg aaagccactt tgcaatttcg gaaatttctt ttaactcgtc 12421 attcaatgtg ggaataacaa gggtggttac ttccacatgg catttttcgg ccgccagctc 12481 cacagtttct ttcacattct ccaaaacacc cccgcatata tttttgtaaa aagaggctgt 12541 gtaagctttt acatctatgt tcatggcatc aatataagga agcagcatta aaagcgcttc 12601 cctgccgata aatccgttgg tcaccaaaac atttgaaagg ccttcctctt ttgcaagtac 12661 cgccgtatca tacacaaact cataccatat agtgggttcg ttgtaggtat atgcaatccc 12721 tatattacct tcagatacaa gctcctttgc cttgctgaca acagtttcgg atgtcacttc 12781 ataaagcctg ggattatcat gggcaatctc ccaattctgg caaaaagaac atttgagatt 12841 gcatccaaaa gtgcctattg acaatatctt cgaaccactt ttaaatctgt acaggggctt 12901 tttttctata gggtccagcg caatggaaga aatcttccca taatttaaag aatacaaatc 12961 tccgtcaata tttttccgcg ccctgcaaac tcccaaattt ccgggactta tagtacaatt 13021 gtgggggcag agacggcaat gtacttttag atcctctcct ttatcgtaaa acatcgccgg 13081 ctttgctgct tccatattac cactcctcat ttgtgcctta taacctcaaa cctttccatt 13141 gtgtattttt cgtttggact tatgcctgcc ttttgaagcg caattgatac ctgctgctct 13201 acagtattaa cgttttcaag gtttggaagc aaaaggcccg tccttcttcc ggctcttaca 13261 atcaccccat attttactac atccagttca tccatggaat taatctcttc gggctccatt 13321 aaaacatcaa cggaatattc aagctcatcc agctcatagg gcttcacagg atagaaccgg 13381 ggatcggaag tacccgcgct tattgcatta tgaactatct cacttgctat attttccctt 13441 gtcggcccga tagtaccgat acagccccta agttcaccct ttttctttat tgaaacaaaa 13501 gttccggctc tactattcag catctcctcc ggaagaccgc tgtaatcatc caaaaccctg 13561 ccttccgtta cataagcctc cagggctctt ttggcaagag aaacatacgg atcggtactc 13621 ttttttcttt tgtttctcct gttttcaatt atccttcggg aagaatccat agctccgact 13681 ccgattcttg ccaccatata tcccactcca aaaggacctt cataagagta aacttcagga 13741 accacactgt atccgtccaa agctcccagc attattacaa aggatcttaa tccgcactct 13801 gcggcttcat cccgaagctt gtcatctata tcaagaatcc tgtcaatatc gtccttttcg 13861 atgcttttaa ccagaagctc atcaaattcc ggggcatgct tgttgtagcc atagggtccg 13921 tcactggtaa ggcggtgtgc caaatctcca cttgcgacaa ataccacgtc ttcatctgaa 13981 tttctgacgg cttcgcctat gcacatacca aacttgtaat gttcctccaa agtaagtgtg 14041 gacattgcaa catgaacaag tttaaaatcc gaatacaccc ggcttatata ataaagaggc 14101 accagcgctc catggtccag ttccccggaa atcccgtacc ttctgcctat accttcgctg 14161 attcctccgg catcaaagcc ttcttttttc gcaaactcaa taattgactc caccattttt 14221 aaattattct caaaaccaag ctccacctta cgggctccaa atcttgaaaa gttgcctttc 14281 agcgttttat ggtcattaat gaaaatataa tcctcaaaca aaggcgcgtg ggaagtcgta 14341 agaataatgg ttgaaggctt ctcttttctt atttgttcag ccgctttttc acatgcctct 14401 atagttttaa ttgcgccctt ctcatctccc ttgccaatct caggtacaat caaaggagga 14461 tgaggaaaaa tataagaact tattattctt cccataattt ataccactac cttcctaaaa 14521 aaatagacgc agtcataaca cccaccgaag ttataaaaaa cgtcaaaacc ataataaatg 14581 caatcagtct gacggtagac ttcttcatgt cctttcacat cctattctat atagtgttta 14641 taacaaaata aacatttatt caatttcccc cgctatattt tataatattt ttgtgtatag 14701 ataaatacct taatatcata ataaattatc caataaacca aatacctgcc gcattattta 14761 caatttaata atatattaag ttaattttaa attaatattt ttttgaattt taagaaggat 14821 tttaatttgt tttgtagaat agaattttat ataaatctct atatgaatca tgttataaaa 14881 ctcatcatta ataaaaccgg taaatatata gagaaaaaac aaaacaacaa gtcacttctc 14941 atgaaaacac tagtatggaa cgattctccc ctgttgcata gtagtgtttt tcttttgtct 15001 tcttgcttca aacaaatttg ttgtaaaatg tcgaaaaatg acgaaattta aaattaactc 15061 aacaaaggca gcaaacttta tctgtaagtc gcccatttaa aattgtactt aatttgatat 15121 ttctgataca atagaatttg tacattatac tcccctttat attttggtat aaggagatat 15181 aaatagagac ggttctgttt atattcttca gataatatag aaaggatacg ggtcttaaat 15241 atttccttat accattttat tttatcacct taattgtaca tacaatatgt acagtgtttc 15301 caaatttttt aatcaagatc ttttcccgat tgctttacaa cataatcgta aatcattttt 15361 gaaatatttg ctattgcttt attggccgat tgtccgtttt tcacattctt tgtcataaca 15421 acaactatat acggcttttc ggcataaaca atcccgacgt catgtacaac cccggtatag 15481 tttccggttt tgtgtgcaat ttttaggttt ttcggaagca ataccggaag ccggtcgtaa 15541 aatttcgtgt ttatcatgtt ttgtacaagt tccctgcccc aggggtcacc gttttcagaa 15601 agttcataca cttcttttaa gtacatcgcc atatccctgg gacatgacac atttttcccg 15661 tcatcaacca cgactccgcc caacctgcgc atatattcct tgacatttgc tttcccaaca 15721 catcgaagca acatgtttac cgcaacgttg tcactatata ctattgagag tctgagcagc 15781 tcctttatgg taaaagtttt cccaaaagac tcattattcc aaataattcc tgtaccacct 15841 tcaaaatctt cctcggtata ttccaaagaa gtcataggat caagcattcc ttttcttatc 15901 atgtcataaa catacaaatt caaaggaatt ttgaaagtgc tcgcagcaaa aaactcttcc 15961 gtgtcattaa taccaaattc ttttccgctt tccaggtcaa caaaatatat tccaaaataa 16021 cagttgtatt ttgatatgta ttttcgaagc ttgttttcca aagctgcgta agtatccttc 16081 tctacctgat tttcaagggt gttgtcaaaa tcgttatcca agtcttcata gtaaaagggc 16141 tctccgatat cctcaagata ttcaagctca tcatttaaaa gctcatcatc aaattccaaa 16201 gaatacaaat catcctcaac atcataatca gtaccatatt cgtaagttcc ggcatagtaa 16261 gctttatggg cttcataatt gcccttgtta tattcattgc ttttcatgcc catacttgcc 16321 aaattgccac tgtacataac aaacgccaca cccatgaaga atgtgaccac aagcacaaaa 16381 tagtttctta ttttaccttt cagtatcttg caaattcttt cttttacaga attctttttg 16441 cgaatacata taataaacac ttgctgtcaa actccccata aaacaagata gtacctgcta 16501 tattattttt atccaataaa aacttatatt attacaaaat acagttcgca aaaaaataaa 16561 gctgtggagc attatgccca tagcttgtat tcagaacaga aacacagaca gtgtcaaagc 16621 ttattaaaac cacatatgta tcactcttta actcttcaca gcactaaacc acacttacgg 16681 gtgattcttc aacatcattt ctgcattttt tgtatttctt ctttcttttt atttgttctt 16741 tttcaatata atcctccaaa accttgtgaa gattcaatac gtcgctcatt tcataatatc 16801 cgaccttgtc atgaataaac tcaatggctt ttatggctcc cagcgcaaaa gccctcctcg 16861 aaaaagactc atggcttatt tctatcttgt cgtcttcacc gacaatcata acctcatgtc 16921 tgccgaccac accaccggca cgaaccgcat ttatcggtat tactttttcc ttaatactaa 16981 cacctgccga atcaaggcct tttttaatct ctcctgcaat tttaattgca gtaccggagg 17041 gtacatccac ttttctcttg tggtgaatct ctgtaatctg aaaatcataa ttgttcagaa 17101 tactggcggc aagattggtc aaaagcatta acacgttcac acccaaagtt atattgggag 17161 cataacaaat tgcattgtga tactttcttg taagcacaaa cagttttttt aatgcaaaat 17221 ccgtaaatcc tgtggttccg acaactatat ttactttcat cttcgagaat atcttggcat 17281 ttctgatggt agcatcggga gtcgaaaaat caaccacaac atcgggtttt gttttaaata 17341 ttacctgttc caaattcttt tcactgtcaa caattattcc cgaatttctg catccgataa 17401 tctcatccag ggattttcca aggttttggc ttttagaact gcacacaacc gaaaccagct 17461 tcatgttctc ctgttccaaa ataacttttg caatttcttt ccctgtcttg ccgagtccta 17521 ccagacatac tctaatcaat tagatccccc ccatttcata atgatgtaaa acaaactgac 17581 agtcaaagta acagcttgtt agaaagaacc gttaatggaa tatgttgtta tatatatgtt 17641 aaaagccgca gagaagcttc tgcggcctga ttaacataca aaataaccaa ccatactcct 17701 ctatcaacgc ctacgaggtt agctgacggg ttcgggtcga aagagttaac cctacctggc 17761 aaaaaccaag attcacccca aaaaatggtt cccccgctca aaactgatta agcgcttaaa 17821 atctttatta agtttttatt tataccttgc aaccttcata cacttataag attaatacat 17881 tatatgcaaa tgaaaacaaa ttgattaacg tattctgtat tatttatctg actggtttcc 17941 taaatacgga tgagccttat tgacatccgc gatattgaac gatccttcat gcaaaaatca 18001 agttttgaac ctttacatct tgagaaaact ttatatagca taaattttac gattgcatta 18061 tatcaaattg ccaaacatat gtcaataaaa tatgttgtac aactacctga aagcaaactc 18121 aaattccgta aaactattta tttcccaggc ttgtaaacaa gctttagaaa cagccgcttt 18181 atcagcctca ctatatgata aaccgcaata aataattcta ttaccaaaag aatacacagc 18241 aatattacta tatccctgta ttccttcact tgatttatca acgactcaaa caagcccatc 18301 gaagagtaaa catcaaccgc cggatgcaga cttacttcaa taaccgttcc atcctccaaa 18361 gtatactttg caatgcctaa aacatcactt ttcagtacag gaggatcaaa cttttcagga 18421 actttaaatt caatattctt tatataattt tccccggcag ggtaagtata gtaatagtca 18481 cctatgctaa ccaaatctat aactttatcg ccgacggtaa ctttcttcaa aggttgtccc 18541 attgatacca gaatgcctgt cctgaaattt aaaaaaccat agtccagaag ctttaccgaa 18601 tcgtcataca tgctttcttc cggtgaatca agaactatgc atatcaacct ttgcccgttt 18661 cttgtggcag tggtaattgc cgtttgacgg tctatttcgt tatatccggt ctttccaccg 18721 tcaacgccgt catagctcca gaacaactca ttgctgttta ttaaaatctg cgttccgtca 18781 acccatggtc tggccttagc cgaaaacatc tcattgaaag tgctggattt tgtcagagca 18841 tatcttatta aaacggccag gtcatacgcc gttgtatatt gtttttcatc ataaagaccc 18901 gtgggatttg taaaataagt atccttcatc tcaagttcct gggccttttt attcataagc 18961 tcaacaaaac ccttctcgtc tccacctata tactcagcca gaacattggc actgtcattg 19021 gcggatccta acaaaaccga atatatcaaa tcttcaaccg ggtattttcc gccgacctcg 19081 agatttaaca cagctccttc aacagaaacc gccttcttgc tgacagtgat attggtgttc 19141 agttgattct gcattttttc caaagcaatg agtccggtca taattttatt tgcacacgaa 19201 acatgaagtt ttaattttgg attcttttga tagagtatct gtcccctctg cacttccatc 19261 aaaatagcgg aaggtgcctt gatttccgga ggttccgcaa ctgcgaaaac cggactttga 19321 gagaaaaaca aaatcatcat tgctactgta aagcactgaa tttgtatcaa gactcttcta 19381 tacatatcca acctcgtcca attctttttt tattggaaaa tcaatattta tattgccaac 19441 cacatagtta acaaaatagt tgtttgaatt tacaggtata ttgtttcaac attattatag 19501 tactttaatt ccactaatac aactcagaat ttatagaatt aaacatcctt cacacaaatc 19561 catttttctt gtatttcttt tctactattc aggaaaacta aaataggagg tgaaaccatg 19621 gctaaaaaca agaaaaaaca aaaagacgtc aaagatgcaa aatatgagtt tgcaaatgac 19681 cagttgggag aaaatacaga acccagatat gaagagatga aacaggataa aaaaggcggc 19741 aagaaagcag gcaagaagta acgtacagct tacaggaaaa atatgcatag tatgtagaaa 19801 aaattgcaaa caagcagagt taaaatattt tttctctttt attgcctggc actgcttgtt 19861 tgctttcttt ctttttcaca ctccccttta aatttttatc aatatatgct agtatagact 19921 acaaaaagaa aagcaaaagg tggttaacac taatgtcaaa agtggctcta atcagatgtg 19981 aaagttatga ctatgatgcc gtcaaatcag ccgtaaaaag ggggcttgac cttattggag 20041 gccctcaccg gtttgccgct cccaatgaaa aaatactctt aaaacccaat cttctttcgg 20101 cagacccgcc ggaaagatgc agcacaacgc acccttccgt atttaaagcc gtggcggaaa 20161 tattcatgga ggcaggaata accaatcttt cctacggcga ctcccccggc attcacaagc 20221 ccataaccgc ggcgagaaaa aacggaattg aaaaagctgc aaatgagctt ggaatcaaac 20281 ttgccgattt cctggaagga aaggaagtgt tctttgaaaa cgcaatccaa aataaaaagt 20341 ttataatagc aaacggtgtt cttgaaagcg acggcattat cagtctgccc aagctaaaaa 20401 cccatggatt tgccagaatg acgggttgtg tgaaaaacca gtttggatgc atacccggac 20461 ctctgaaagg agaatttcac gttcggattc ccagtataat cgatttttca aaaatgctgg 20521 tggatcttaa cgtttattta aaacctcgtc tttttgtcat ggacggtatc atagcaatgg 20581 aaggcaacgg acccagaggc gggactccca gaaaaataaa tgcgatactt ctttccgaag 20641 atccaattgc cctggatgcc actgtatgca gaatgataaa tttaaacccc gagtttgtgc 20701 ctaccatagt atttggaaaa gaagccggcc ttggaactta tgacgaaaat gaaattgaaa 20761 ttctcggaga tgatattcaa agcttcataa cttatgactt tgatgtaaga agagaacctg 20821 taaagccctt caagcccggc ggagccatcc agtttttcag aaatttcatc gttccaaagc 20881 cctacatttt aaaaaacaaa tgtattaaat gcggagtatg tgtaaatgcg tgtccggtaa 20941 aaccaaaagc agtagattgg cacaacggaa ataaaaaaga acctcctaca tatatttaca 21001 aaagatgtat aagatgttac tgctgtcagg aactttgtcc ggaaagcgca atccacctca 21061 aggttccttt tattcgcaaa tttttttata atccgaaata aaaaataaag ctttttatta 21121 caacttttct ttgaggtctt ttaaaaacct ttgctgcaac ccttttatac tttgaaggta 21181 aagccttaac aggttttgat tctgggcatc aatattggtt attttaagcc tgtattcaaa 21241 ataccttgta aaggcttcct tccttacaat atcagatctt aaagaaataa cggttttgtc 21301 aacatcctcg tctattttta cctcctgaaa tgtcggatat atcgtcactt caatattctt 21361 cttgagcgga aagtcggcag cggtgttaat catcagaccg tcaaagctca tatttttgat 21421 tgtggcaaca ttgattttat cagagtcatc acacttgatc tttgcataaa aagacacagg 21481 aaacctttca cattctcgtt gctcttttaa agatcttaca gattcaacct taagttttat 21541 atagctgcaa tccggatcta ttccctttac aatacaaccg gctataaata cttcgtcatt 21601 ttcctcatag cccagcacaa cagggtcatt ttcaagaaaa tttaaaatga caaactcttt 21661 tacaagcttt accacaagca aatccttttc aacttgaagc accacacttt taaaccacgt 21721 cttaccggaa taatggcaaa tagaggctat ttctccaact ttcatataca cattgacctc 21781 ctgtgctata aaaaaaagac ccgttgtttt gcccatattt tacttctaat atgtaccaat 21841 actgcagtgc catagaatta cattctacaa tattatatat tttctacaaa aacatataaa 21901 aatccttctt tgaaaaattt atcaacaagt caaactatct gcttttcatc ggccctttgt 21961 tatgatataa ttgtcataca agaattacct attgtaattt tgtactgtct tacaagctaa 22021 aatgtttgct tttttagtta aataccttcc ctgatgttat attataccat tgataatgtt 22081 attgattttt tatcaatcta tagaataaat aatgctatat aattcaaaaa ttaaaactga 22141 aggtgatcat gtttggataa aatggttttt aaggcctatg cagtaacgaa cgaaattgac 22201 cttaacagaa ttgccgccaa atgtaatatt cctaaaaagt atacgtggga ggaaccactt 22261 atccttaatg aaaatgtttt atcctcaatt tttaacaaag aaattccaga aggccaaaaa 22321 attcttgtat tttcttttgg aagcatagta tttataaact gtccttccga gcatgaaaaa 22381 ctttttattg aatatctcaa aaatgaaaaa atcgatatag acgttgaaaa ctacaaagaa 22441 tattccgacg attatgaact tcaagtgagg gaaaatgccg aaatagaact gactgacagt 22501 tatctgacgg taccgaagtt tgaatttttc tatcctgagc ttgtttcaac cgttattgcc 22561 aagtcggtgg ccctggaaaa aaccgaagag cacctcagca caatcctgga cactctggaa 22621 accatgattg ataaactgga aaaaggaaaa ctcaatgtcg gaaacaaaga aattgcaaaa 22681 accacgtcaa aaatagtacg gcatgagtac aacacaatag cttacataat gatattagac 22741 aaacctgaca ttacctggac caacagcgat gcaaaaaatc tttatgacat gatgtcagaa 22801 tttttcgaac ttaatgacag atatataaca ttaaaggaaa aaaccgatat tttaaataat 22861 gtactcagcg gtttttcttc gataagccat tcaatgagag gactttttgt tgaatgggtt 22921 atagttattc taatatttgt ggaaataatt cttatgctcg cagatttatt aaagtaattt 22981 caacggggaa ttggtaggta tgaaaacagt tcattttata agttacaaag tcgcagcatc 23041 tcttccttta gacaagatag ccgctttcct caaaaccaat atgaaattta catgggatga 23101 atacatagtg gtaggcggtg aacaacttga cacaatttta aaatatcaca gcgaagacaa 23161 ggccgtatat cttttcaaat acggctgcat ttcctttgtc aattttacgg ataaagaaat 23221 ttacagcttt cttaaatacc tggaatcaat aacgtcgaga ataaactaca acctgatgcc 23281 caggtaccac gaaagccaca atgtcacaat tgatgaaaac ttaaaatgca gtctttttga 23341 aaacaaaagc gtagaggttg attatgacaa aaacatagac cacattttgt ccatcgtgct 23401 ggcccgttca acacaaatgc tcttttttga aacacaggtt aataatctgc tggacagcgc 23461 ggaaaaattc gtcattttgc tgcagaaagg gcgtctatta acctttacta aaaaatctta 23521 tgccataatg gccaaaattc tgaggtttga atttgacagt ttaagttgta tcagaatttt 23581 tgaacatccc gcccttggca aacacagtat aaaattaaaa gaaatatatg atattcttgc 23641 agaatattac gaatttggcg gccgattcaa cgtaatgcaa agtaaaataa aagacctgag 23701 aaaaatagtg ggcatgtatt catcgctaag ctacagcgaa accgaaaccc gcctgctttt 23761 gtttgaaata tttctgcttt ctttgttttc attggcccat atcatatagg caaagaacta 23821 aatcagtcaa acaataaata atgaaaaaag ataataaaaa gaaagatgga gaaaacgaat 23881 tacacgtttt ccccatcttg cgtgagactt ttttggttat tacaagattt attgacatga 23941 cataataata accatcatta aaggattaga aatgaatatt caattcctaa caatttgtgt 24001 gctttatatg cacagggggt aaaaaactta tgctttatct ataataagag aaaagcagta 24061 tataatcaat gaaatattta ttccttcgat agagaattat tcattgtttt ccaatcgcct 24121 ccgatgaata tgaatcttat caggtcaaaa aatcgcttaa aacagcgaag cccgcataaa 24181 gaaggacctt tatgcaggct tcgctgctat cacaaagagg gaataagtat atattggttg 24241 tgtatagccc tcgcatccta aataaggaag tctctcaaaa atcaattaaa aactactcaa 24301 tgtcaagaaa aacatccatg gattgtccgt ccatgtcaaa aaccaatttg tttgtgccag 24361 ggctttgaag caaaacagaa attccctccc cgataagcaa tgtaggtgtg gaaatataaa 24421 ccgctgcctt tacgtcaact ttactgaaag catttcctgc aattatatta agcaattccc 24481 ctattgcact ttttaccatg tcatcaactt ccgtaaattc catgcccccc agcatagctg 24541 acgctatagc caaagcagat tctttctttg ccgtcataat cagattgccg cttattgccc 24601 cgttaactcc catgacaaca tttacatact ctgcttcaac taatccgcct gtctcattct 24661 tttcggcaaa cacggaagaa aacccaaatt cggacaatac acccattgca gtttcaacaa 24721 aggcattttt gacatccatt ctttgcactc ctcataaaac ggaactgcct tcaaaccctg 24781 aataaacaaa tatttgaact gccggtacga atacctgttg acgaaaacaa tgcacgatga 24841 aacaattaat gaacggccta cttcaaaatg caatttgtga gttgttttat cgtaacatgt 24901 tagaaaaatt ttctaaagta ttttatatat ataattatac gacctggcag ttcaatttcc 24961 ttctcaatag tcatgaaaaa aaatatataa aaaactccaa taatttttgt gcttttttca 25021 taaacagaat taaaataaac ctttaacaat tataatcctt taacaattat aataaagtat 25081 gctctttaag cagcttattc ttgatattcc acaattcttc actcaagtct acataatatt 25141 tgtgcggatt ttcaaacctg agcacctcat cccagagggt gttaatctgt tctctgcagt 25201 aatctctgat ttcatttatt tcaggtactt tatatacaca ttttccttta tcgaaaatct 25261 ggacctggag ctcctttgca taaaaatcgg tcacagtttt cctcttccat gtatgatccg 25321 ggtcgaaaat ctcataaggt ttgctgtcgt caatgacttc acccgcattt acgataacat 25381 ctgctatagc tttgttgttc tttctgtcaa acaatctgaa aacttttttg tatccggggt 25441 ttgttatctt taccacattt tcactcattt ttattttcgg tattatagtc ccgttttctt 25501 ccaccgccac aagtttatat actcctccga aaacaggttc ggtttttgaa gttatcagcc 25561 tctcaccaac accgaaaatg tcaacctgtg ctccttgctg caatatatcc ctgattatat 25621 attcatcaag cgaattggag acaacaattt tgcaatcggg gaatcctgcc tcatcaagca 25681 tttttcttgc ttctttcgaa agatacgcaa tatcccccga atcaattctg attcccttgg 25741 gtctgaaccc tcttggcaca acttcttctt taaatacctt aatggcgttg ggcacccctg 25801 attttaacac attatatgta tccacaagaa gaacgcagtt gtcaggatat actctcgcat 25861 aggctctaaa agcctccagc tccgaaggaa aaagctgaac ccagctgtga gccattgtac 25921 ccgaagcagg tacaccaaaa tctctgtcgg ctatggcaca tgcagtaccg gcacatcctc 25981 cgatatatgc cgctcttgct ccaagcacag ctccgtcata accctgggcc cttctggtgc 26041 caaattccag cacaggcctt ccctgtgcag ctcttacaat cctgttggct ttggtggcta 26101 taaggctctg atgattgatc gtgagtaaaa tcattgtttc tataaactgt gcctgaataa 26161 ccggtcccct taccgttata ataggttcat tgggaaaaat cggagttccc tcgggtatcg 26221 cccatatatc gcagcaaaac ttaaaatctt tgaggtattt taaaaagtct tcactgaata 26281 tccccttgct tcttaaaaac tcaatatcat catcctcaaa cttaaggttg tttatatatt 26341 caataacctg ggccaagccc gccattatgg caaatccgcc gttttccgga actcttctga 26401 aaaacatgtc aaagtaagca attctgtccc cgattccgtt ttcaaaataa ccgtttccca 26461 ttgtaagctc ataaaagtca gtgagcatgc ttaggttttc actttgattc caattgattt 26521 tcttcattgt tattccccct actcaacaat atcccgtaca acctcgaccc cgttgattat 26581 catattgtat gctgccataa cattcataag gtttctgtcg tgcactccca agtcataggt 26641 atcaaccgca ttcaacggaa cgattactct tgcccgttta ttattcatgt taaaataagc 26701 cttaagtgta atagcaaact gttgtacaca gatatcggtg caatctcccg tcaatatgaa 26761 ggtgttgata tcgggatttt ccaaaagcca ctttctgaaa gcttcttcca aaaatccgtt 26821 ggtagaattt ttttctataa gagtatatcc cccgatattt tttatttcat ccactatttc 26881 actttccgcc gtacctttca tgcaatgttt tggatacgcg tcaaattccg gtgattcatc 26941 ggtatgacag tctgcaaagg caatttttcg tatttttcgc ctatcacaaa tttcgctaag 27001 ctcacatatc ctgggtataa gctcttttac ggcatcgctt ttaagcgccc cttcttttgc 27061 aaaaccgttg gtcatgtcaa taataaccaa aacggcttta tcggcctcaa tttcatcaaa 27121 ttttacaaca ggaagttttt caagcatatc taaaattgat gccaaagttt cattgctctt 27181 ttgtaaaaat tcattctttt gcaaaacctt cataaaaaat tccccctcat cctttattga 27241 cattataact tccacatact tcatagtgtt attattgttt tgttattatc attataatac 27301 tatattgaaa taatgtcaac aaaaattttt cctgaggggg aatcaattaa ataaatacgg 27361 gcaaaggcat gccaaatgct taatggaagt ttttaggcaa ttccttttcc accagcatat 27421 ataaaggcac gtctttttcc tcttttgtat ggatatagga aacatgagcc atgttattat 27481 ccattacctt ttcaatccat accggtgagc cttcatgcaa tacctcgata acctggtccg 27541 attcaattat ttgttgcgct ctggcagcat ccatttgtat accatctccc gtttttattt 27601 tatcaattgt tttattaaat attttatcaa aattgtatga aataattaga tttgagaagg 27661 cagtataaaa tatttactgc tttatttata gtattgcctg tttcgtatct taatatttta 27721 ttataaaata ataagtttat tatattcatt tatatggata agttattgta taattaagat 27781 gcggggagga aatcaataaa aaccgcattg aaaggtcaaa taaaaattat taactcacat 27841 tttgaatcgc tttttatgag taagatctta ctaatatatc attttttctt agttggtttt 27901 tgtttatctt atttgtttcg attcatctaa ggggaatgga acggaaataa ctgcaggggc 27961 ttgcaaagat tacttgtcag cattgtcaca aaagagtgtt tgtactactt tcaagtagtc 28021 aggcaggtcc gcataatttt aggggagttt ttataaggaa aggtgatgtt ttttagggga 28081 gttttgagcg aattttttga acgaatttct ttgtgtacgt acacaaataa atctttaaat 28141 cagaaaaaga aaaagaaaga gaaagacaga gaaaaagaaa aatagaaaga gagaatttaa 28201 aaaaaataaa gataaaaaga aaaagagaga aaaatataat caaagataat ctgatttatc 28261 aaatgagaga aatggttgat cttttgtagg ggggaaggaa aagttaaaaa ataagttaat 28321 ttttttggca taacggaagc ttcctgttac cagagacaaa aataaaaaac tgttgcaaaa 28381 ctgattggtc atgttttttg caacagttt //