LOCUS NZ_ACVX01000056 13288 bp DNA linear CON 10-NOV-2010 DEFINITION Clostridium thermocellum DSM 2360 ctg00032, whole genome shotgun sequence. ACCESSION NZ_ACVX01000056 NZ_ACVX00000000 VERSION NZ_ACVX01000056.1 GI:256006027 KEYWORDS WGS. SOURCE Clostridium thermocellum DSM 2360 ORGANISM Clostridium thermocellum DSM 2360 Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae; Clostridium. COMMENT PREDICTED REFSEQ: This record has not been reviewed and the function is unknown. The reference sequence was derived from ACVX01000056. FEATURES Location/Qualifiers source 1..13288 /organism="Clostridium thermocellum DSM 2360" /mol_type="genomic DNA" /strain="DSM 2360" /isolation_source="contaminant of Clostridium thermocellum strain LQ8" /db_xref="taxon:572545" gene 1275..2051 /locus_tag="ClothDRAFT_2826" CDS 1275..2051 /locus_tag="ClothDRAFT_2826" /inference="ab initio prediction:Prodigal:1.4" /note="KEGG: hypothetical protein" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05430965.1" /db_xref="GI:256006028" /translation="MLRIVKSKKTEWEKLETLKQEKINSKATLEKLLEGASGIQREAL LKGDEGKRQEALAMVQSLQQQIAAVDRDIKFLEEEQSKVEAMHIEFKLKEIERQKEAI QKELEPYRKAYEDAKTAFKKAEQEWFAKNHEASRKFDALNRERDALRLRLDKLTPPPS PQPKHSVEEWLNLCRQGKVKTYIQGNDPNLDDAWRQYEEEKEIIRDWAKKSATRKKVC GETLPLPEVAKHYSQARLREIVSATHPKAANAVFGHLFGH" misc_feature <1392..>1739 /locus_tag="ClothDRAFT_2826" /note="Protein of unknown function (DUF3584); Region: DUF3584; pfam12128" /db_xref="CDD:152563" gene 2335..3003 /locus_tag="ClothDRAFT_2827" CDS 2335..3003 /locus_tag="ClothDRAFT_2827" /inference="protein motif:PFAM:PF00239" /note="PFAM: Resolvase domain; KEGG: glo:Glov_2327 resolvase domain" /codon_start=1 /transl_table=11 /product="Resolvase domain protein" /protein_id="ZP_05430966.1" /db_xref="GI:256006029" /db_xref="InterPro:IPR006118" /db_xref="InterPro:IPR006119" /translation="MPTTKIKTKAHPRLRQFRIYGYLRVSTIDQDTEKNKADILSFAN SKGFLGQVEFVEEKISGLKSWKKRKLKDLVESMSEGDILIVPELSRLGRSLVEVLEVL NELKDKGVKVFSVKENFQLNGDDIQSKVMRTMLGLFAEIERDLISARTKEGLAAVKAS GKRLGRPKGPGKSKLDKFKPEIVALLKNGSKKIFIAERYGVTPATLTNWLKRHGLDKL TPTP" misc_feature 2389..2979 /locus_tag="ClothDRAFT_2827" /note="multiple promoter invertase; Provisional; Region: mpi; PRK13413" /db_xref="CDD:184041" misc_feature 2389..2793 /locus_tag="ClothDRAFT_2827" /note="Serine Recombinase (SR) family, Resolvase and Invertase subfamily, catalytic domain; members contain a C-terminal DNA binding domain. Serine recombinases catalyze site-specific recombination of DNA molecules by a concerted, four-strand cleavage and...; Region: SR_ResInv; cd03768" /db_xref="CDD:58117" misc_feature order(2404..2406,2410..2412,2599..2604,2611..2613) /locus_tag="ClothDRAFT_2827" /note="catalytic residues; other site" /db_xref="CDD:58117" misc_feature 2410..2412 /locus_tag="ClothDRAFT_2827" /note="catalytic nucleophile; other site" /db_xref="CDD:58117" misc_feature order(2596..2598,2734..2739,2743..2748,2758..2760) /locus_tag="ClothDRAFT_2827" /note="Presynaptic Site I dimer interface; other site" /db_xref="CDD:58117" misc_feature order(2614..2616,2629..2634,2722..2724,2731..2736, 2743..2748,2755..2757,2764..2766) /locus_tag="ClothDRAFT_2827" /note="Synaptic Antiparallel dimer interface; other site" /db_xref="CDD:58117" misc_feature order(2683..2691,2722..2727,2734..2739,2746..2748, 2758..2760,2767..2769,2779..2781) /locus_tag="ClothDRAFT_2827" /note="Synaptic Flat tetramer interface; other site" /db_xref="CDD:58117" misc_feature order(2683..2685,2737..2739,2746..2748,2758..2760, 2767..2769,2779..2781) /locus_tag="ClothDRAFT_2827" /note="Synaptic Site I dimer interface; other site" /db_xref="CDD:58117" misc_feature order(2761..2763,2779..2784) /locus_tag="ClothDRAFT_2827" /note="DNA binding site" /db_xref="CDD:58117" gene 3164..5008 /locus_tag="ClothDRAFT_2828" CDS 3164..5008 /locus_tag="ClothDRAFT_2828" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05430967.1" /db_xref="GI:256006030" /translation="MKKSKSLIIGYLLAFFLGGVGAHLFYYHKRLRAWIYFLAVIFSA ARLLPLTMVLGWIDMFFIKKWHKEYLERGEKISEKLIDIPTRFTFTTEITQVGKLEPS LQKVLPKKEEKKFYKEEDIILPEYAHLKTPIHIRKDIEKLRNSVNAKKTNSPAIEINV FTRDTEFMKDSIRYADMVVRNADFVPLEVYWTTFRDLDERQKKWYFYWRYQALNGNYL DTDLSYVILFVYELINYTFNQNAAFNVSMMVRLREAYKDRLPALDKYIVPWIRDILVE LNEIELAYKWGLGAEPYSGLNFYRIFKEHQGDISKIPMEEWRKVVYGYSETTFFKANA QKVYAVFEQALKLFQKINAEEGLDLEKAWFRPEEKIENYRFFNSAVIGRNVSSRVIKY LKYVPTDYFYNEVTALFRLSENVTRLLAGVTRQLQVNEELLPPGFKEALLEEIRRLDL TENVGLKSRFSPDKKIKNRFYQVASKENEESKQTIPKRTTQTIGIGSEKIKPELDLLQ IDIPAHRSSISLADEEVNVEGFISSLTEEESKFISTFSNNKKSINEAEEQLRAQGVPV TIFVEQINAKAEEYLEDVFIELIGEEYVINEELVTVWEEIKRRKQHEN" sig_peptide 3164..3232 /locus_tag="ClothDRAFT_2828" /note="Signal predicted by SignalP 3.0 HMM (Signal peptide probabilty 0.992) with cleavage site probability 0.958 at residue 23" misc_feature 3170..>3286 /locus_tag="ClothDRAFT_2828" /note="TM2 domain; Region: TM2; cl00984" /db_xref="CDD:186291" gene 4998..5387 /locus_tag="ClothDRAFT_2829" CDS 4998..5387 /locus_tag="ClothDRAFT_2829" /inference="similar to AA sequence:KEGG:Mchl_5415" /note="KEGG: mch:Mchl_5415 hypothetical protein" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05430968.1" /db_xref="GI:256006031" /translation="MKIKRRDSADILNALAGGVVPKRGLQYIMVGREAEMKQIREELR DIRENGNSMIRFFIGTYGTGKSFMQNFIRQVALEEGFVVTNADFTPHRRLYGSDNQAL ALYNELIKNLSTKSAPQGNALPIILDQ" gene 5391..6329 /locus_tag="ClothDRAFT_2830" CDS 5391..6329 /locus_tag="ClothDRAFT_2830" /inference="similar to AA sequence:KEGG:PST_3462" /note="KEGG: psa:PST_3462 biotin carboxylase" /codon_start=1 /transl_table=11 /product="biotin carboxylase" /protein_id="ZP_05430969.1" /db_xref="GI:256006032" /translation="MSLQNKVMENLDYEDKTVLEDNVFVRAVEKEIVKAVSHLDELTG GYDFAKVLSIYYKSFVEQDKEKQRQALRWLRGEYLTKSDALRDLGIREIIDDSNYYAH LKVLCKFVRQAGYSGLIINLDEAVNLYKITHREAREKNYDYILTIYNDILQGSVEGLY ITFSGTPEFLEDERRGLYSYQALKRRLKPTVENEKYQDLKQAVIKLTPLTPEETLILL MNIRDIHAAHYGYEINVMDEEIRRYLLWIYKRPGAKEHIILGDVVRQFISFLNIKMEH PTLNFEELYMGEETSENNLPEEVIDIHKRFKRTQLS" misc_feature 5472..6266 /locus_tag="ClothDRAFT_2830" /note="Protein of unknown function (DUF2791); Region: DUF2791; pfam10923" /db_xref="CDD:151370" gene 6347..8485 /locus_tag="ClothDRAFT_2831" CDS 6347..8485 /locus_tag="ClothDRAFT_2831" /inference="protein motif:PFAM:PF00270" /note="PFAM: DEAD/DEAH box helicase domain protein; helicase domain protein; SMART: DEAD-like helicase ; helicase domain protein; KEGG: bxe:Bxe_B0141 DEAD/DEAH box helicase" /codon_start=1 /transl_table=11 /product="DEAD/DEAH box helicase domain protein" /protein_id="ZP_05430970.1" /db_xref="GI:256006033" /db_xref="InterPro:IPR001650" /db_xref="InterPro:IPR011545" /db_xref="InterPro:IPR014001" /db_xref="InterPro:IPR014021" /translation="MSQIFYKLSDKVQKKIWDIGWKHFTPIQEKAIPVIIDTEKDVVL SSGTASGKTEAAFLPIISKIHETASNVLKVLYVSPLKALINNQFERLQKLCEEMNIPV HRWHGDVSQHSKKKLINNPAGILQITPESIESLFINRTQFLKQLFQELEFIVIDELHA FIDTERGVQLRSLLSRIKQYTKRCPRIIGLSATIDNFSLIKKWINCNNPDNVEIIEVK GFERDIYYSLMHFEKSKTGNYPLELYEDILELTRNYTSLIFFNSRAAVEEATVILNRL AQREKLGERYFAHHSSIAKAEREFVEKLMSESTGIKSVIATSSLELGIDIGEIDLVIQ VDSTFTVSSLKQRLGRSGRKQGEGQYLQMYTTDKYGLLQSIAVMDLLLQGWTEPCKGY PYPYDILFHQIISICHQLNGIPLEKLVSLVSENAAFYELPESDIRMLVEHMIGKEYLE ILAGTQELIVGLEGERLLRQKDFYSVFMTPEVYEVFYGTKNIGEIEKTFLLNEGDNII LAGRLWKIEEIDFHRNKVYVKKAMDGKPPRYSGGLAPLHPRIPERMHEILCLDCKFDF IDDRAQTALEELKVPYKYFNVKPDERIIWQTKEKLLFETFTGTNIFRTLIWMLRYYGV DEVKTDGIGRMEIPLNDEFIDILQDIKSRKWSLRSLLPYTKEEEFFVSKYSDFLPSEL QIKMHGAYNVDIEGVLKFLDKFRIRIISLE" misc_feature 6347..>8209 /locus_tag="ClothDRAFT_2831" /note="Lhr-like helicases [General function prediction only]; Region: Lhr; COG1201" /db_xref="CDD:31394" misc_feature 6464..6928 /locus_tag="ClothDRAFT_2831" /note="DEAD-like helicases superfamily. A diverse family of proteins involved in ATP-dependent RNA or DNA unwinding. This domain contains the ATP-binding region; Region: DEXDc; cd00046" /db_xref="CDD:28927" misc_feature 6491..6505 /locus_tag="ClothDRAFT_2831" /note="ATP binding site; other site" /db_xref="CDD:28927" misc_feature 6812..6823 /locus_tag="ClothDRAFT_2831" /note="putative Mg++ binding site; other site" /db_xref="CDD:28927" misc_feature 7034..7423 /locus_tag="ClothDRAFT_2831" /note="Helicase superfamily c-terminal domain; associated with DEXDc-, DEAD-, and DEAH-box proteins, yeast initiation factor 4A, Ski2p, and Hepatitis C virus NS3 helicases; this domain is found in a wide variety of helicases and helicase related proteins; may...; Region: HELICc; cd00079" /db_xref="CDD:28960" misc_feature order(7127..7138,7214..7219,7295..7303) /locus_tag="ClothDRAFT_2831" /note="nucleotide binding region; other site" /db_xref="CDD:28960" misc_feature order(7319..7321,7382..7384,7394..7396,7403..7405) /locus_tag="ClothDRAFT_2831" /note="ATP-binding site; other site" /db_xref="CDD:28960" gene 8733..9065 /locus_tag="ClothDRAFT_2832" CDS 8733..9065 /locus_tag="ClothDRAFT_2832" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05430971.1" /db_xref="GI:256006034" /translation="MMTVEIKIIENPLSDWKLGDPCSICNRMFSYTEAEYVAVVYVDE ERDFICGDCLKKGPEAIKKAAQKRAQEIRDEIRLGLKEAELLEKIASGDIVYPWDDQE KFSKCANK" gene 9141..10292 /locus_tag="ClothDRAFT_2833" CDS 9141..10292 /locus_tag="ClothDRAFT_2833" /inference="protein motif:PFAM:PF00239" /note="PFAM: Resolvase domain; Recombinase; KEGG: geo:Geob_0720 recombinase" /codon_start=1 /transl_table=11 /product="Resolvase domain protein" /protein_id="ZP_05430972.1" /db_xref="GI:256006035" /db_xref="InterPro:IPR006119" /db_xref="InterPro:IPR011109" /translation="MEPKAYSYIRFSSPEQEKGDSLRRQIQLSEEYCKQHGLILDDTL KLTDRGLSAFKGIHRTKGALGEFLRLVEEGKIPPGSVLLVENLDRLSREQILDALNQF TSIIKAGIKIVTLQDGMEYDQESINQNWAQLIISITYMARAHDESETKSKRISAVWEN KRSKAGNGGEKLTAKAPAWLKLSQDRTKFILIPEAAKAIELIFRKKLAGKGAERIARE LNEDPNIWEPPRTGPKKTGGWRGSYINKILRSRAVIGEFQPHKLVDGKRQPIGDPIPD YFPPVIDKELFYQVQAQLQANAEKKGNAGGRTGKVSNLFTHVIKCGLCGYPMHFINKG KPPKGGKYLVCDASRRLKTCTAKPIRYEEFEQLFFDNFEELDISQLIPG" misc_feature 9159..9608 /locus_tag="ClothDRAFT_2833" /note="Serine Recombinase family, catalytic domain; a DNA binding domain may be present either N- or C-terminal to the catalytic domain. These enzymes perform site-specific recombination of DNA molecules by a concerted, four-strand cleavage and rejoining...; Region: Ser_Recombinase; cd00338" /db_xref="CDD:58115" misc_feature order(9168..9170,9174..9176,9402..9407,9414..9416) /locus_tag="ClothDRAFT_2833" /note="catalytic residues; other site" /db_xref="CDD:58115" misc_feature 9174..9176 /locus_tag="ClothDRAFT_2833" /note="catalytic nucleophile; other site" /db_xref="CDD:58115" misc_feature 9717..10022 /locus_tag="ClothDRAFT_2833" /note="Recombinase; Region: Recombinase; pfam07508" /db_xref="CDD:148873" gene 10374..10829 /locus_tag="ClothDRAFT_2834" CDS 10374..10829 /locus_tag="ClothDRAFT_2834" /inference="ab initio prediction:Prodigal:1.4" /note="KEGG: geo:Geob_0720 recombinase" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05430973.1" /db_xref="GI:256006036" /db_xref="InterPro:IPR000342" /translation="MENFSDTIGRTKDSRIREQLEKKLSQAFDDKESLESENKKFERE ITELRQQKAGLEKNIEQAKEIYQLLNSAQGETERIELRLRLRQQIQKSIEWIKIYPLQ EPYQEIQETEEPGIVKIMKSKYIDKVRIKFRGSRDLRVLYLKNHAELSE" misc_feature <10413..10568 /locus_tag="ClothDRAFT_2834" /note="Axonemal dynein light chain; Region: Ax_dynein_light; pfam10211" /db_xref="CDD:150826" gene complement(10862..11251) /locus_tag="ClothDRAFT_2835" CDS complement(10862..11251) /locus_tag="ClothDRAFT_2835" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05430974.1" /db_xref="GI:256006037" /translation="MGAVAGFSIPHRYDTNEAIEVLSRKGEEFSIPHRYDTNSGRMGS YRQCRQISIPHRYDTNLDSHARLPVQCFQISIPHRYDTNELQVYQRYCSNLISIPHRY DTNHLVAIKDHQHFLSFQFLIGTIQTG" gene 12618..12773 /locus_tag="ClothDRAFT_2836" CDS 12618..12773 /locus_tag="ClothDRAFT_2836" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05430975.1" /db_xref="GI:256006038" /translation="MYRTYEELELSIIYIIKSIITSFYPRCNKMRLNNYDAFSNFTSV SVALVMN" ORIGIN 1 atctgaaacc tggacgtctg ttaagacaca aaaccttaac gtctaaaatc gcctattaaa 61 acttaacggt tgccctatta aaacttaacc atatatctat aatatataga atttaattaa 121 aatttataga attattaggc tttgaacttt tccaagttca aagaatgtga gattcttcta 181 ttaaagaaaa gatagtattc ctccaattaa agaaaagata gtattccttc actaaagatt 241 tacaaagttt atttagaatt aaattagaat ttatttatgc attgaactaa agttcaatgg 301 atgattaatt aaatcaaatt cctccaataa agataaaaca agtttcctcc aattaaagat 361 aagataggtt cctccaataa ataaataaat gtattcagcc attactgctt ttagcagttc 421 ggcccattgc aagtaaaccc attctgtcca tccgtgaaga tgttacaagg ttccgccatc 481 ctgctttcag cagcccggcc agtcccatat aaaggctccg acagtcctgc gccggcctag 541 ctatgcattg accccggccc gtctatgcat cgcccccgcc tatgcaccga tttactgcca 601 attttttgcc attttaagcc gctgaaaagc cttccccata taaaaggtat tccccacagc 661 ctatagagca aaatagagca aatttgatgg cttatttttg ccctcagccc taaatagaac 721 catgtttgta taacatggat ggagggacaa acataaggat agacaccaga aaggagatat 781 agtgaagatg ataaaaagaa gaaacactag aaagaactag aaatttgcca ttttaagcca 841 ttgaaaaagc cttcaaaaag ccttccccat acaaagttat tctccatcac cttaaaacag 901 catatagggc caattaggtg gcatagaatt gaagttacga gccctgttct accatatact 961 ggaacagggc tttttaattt tgtatgaaaa aaagttaaat cctttacttt tcatattaaa 1021 accgttaaaa ttaggacaag acaataaatg acaaaattag acaaacctgg agaaaggagg 1081 gaaagacagt gccagagctg ttaaccgttt cagaagttgc ccagttaatg aaggttaccc 1141 cacaaacagt tcttcagtgg atttacacta aacgactgaa ggcttacaag gctggaggcc 1201 aatggcgaat ccggccggag gatttgcagc tttttctcaa gggttcataa agactgaatt 1261 aaggaggttt tgaaatgcta aggattgtca aatcaaaaaa aaccgaatgg gagaaacttg 1321 agacgttaaa acaagagaaa atcaattcca aggcaaccct agaaaaactg ctcgaaggcg 1381 ctagcggaat acagcgagag gccctgttga aaggtgacga aggtaagcgt caagaggccc 1441 tggcgatggt gcaatcttta cagcagcaaa ttgcagcagt tgatagggat ataaagttcc 1501 tggaagaaga gcaatctaaa gtcgaagcaa tgcatatcga atttaagctg aaggaaatag 1561 aacggcagaa ggaggctatt caaaaggagc tagaaccgta ccggaaagcc tatgaggatg 1621 ccaagacagc tttcaaaaaa gcagaacagg aatggtttgc taaaaaccat gaagctagta 1681 ggaagtttga tgcattgaat cgggaacggg atgcactaag gcttagactg gacaaattaa 1741 ctcctccccc ttctccacag ccaaagcata gcgtggaaga gtggctaaac ctttgccggc 1801 agggtaaagt aaaaacctac attcagggaa atgaccctaa ccttgacgat gcctggcggc 1861 agtatgagga agaaaaagag ataatccggg attgggcaaa gaaatccgct acacggaaga 1921 aggtttgtgg cgaaacgtta cccttaccgg aagttgcaaa acattacagc caggcccggc 1981 tacgggaaat agtttcagct acccacccga aggcggcaaa tgcagtattt ggacatttat 2041 ttggacatta atgaaatgaa agagtgtgaa tagcatggaa aaagcaccta ctccacctgg 2101 agtaggtgcc tccattaaag gaggtgaaca agaaaatgaa ttggaaagaa ccttgcccct 2161 atttatacta ccaaattgta ctttgtacta gccgaaaacg ttttgaacaa aatgaacata 2221 taaattataa ctaaatatat agaaaaaagg cttgactttc tctttctttt cctttataat 2281 taaattaaaa aatcctaatt atgtcaaaaa aaggaagata aaaggggggt taatatgcct 2341 actaccaaga ttaagacgaa ggctcacccg aggctaaggc aatttagaat ttacggctac 2401 ttaagagttt caactattga ccaggacacg gaaaaaaata aggctgatat attatccttt 2461 gccaattcaa agggattctt ggggcaggtt gaatttgtgg aggagaaaat ctcaggctta 2521 aaatcctgga aaaaaagaaa gttgaaagat ttggtagaat caatgtcaga gggtgacatc 2581 cttattgtcc ctgaattgtc caggctagga cgttccctag ttgaggtttt agaagtctta 2641 aacgaattaa aggataaagg agttaaagtt ttttctgtca aagaaaactt ccagctaaac 2701 ggggacgata tacaatcaaa agttatgcga acaatgttag ggctatttgc tgaaatagaa 2761 agggatttaa tatctgcaag gacaaaggaa ggactggccg cagttaaagc atctggaaaa 2821 cggctaggca ggcccaaagg ccctggcaag tcaaagctgg ataagttcaa gccggaaatc 2881 gttgcattgc taaagaacgg ctcaaaaaag attttcatag cagaacgcta tggcgttacc 2941 ccggctaccc tgactaactg gctgaagagg cacggcctgg acaaattgac gcctacaccg 3001 taaggaagga gggaaaatag atggccgaga ttatcgaaca ggcttcaatg aaattaaaaa 3061 gatttgtata atatggtaag ggaagggata aaacaaaaaa ggaggaaact atataaatct 3121 ttattggagg aatactatct tttctttaat ggagtggtat agaatgaaaa aaagcaagtc 3181 tttgataata ggttatttat tagctttttt cttaggcggg gttggggcgc acctttttta 3241 ttatcacaaa cgtctaagag cctggatata ctttttggct gtcatatttt cagcagctcg 3301 attgcttcct ttgactatgg tattgggttg gatagatatg ttttttatta aaaaatggca 3361 taaggagtat ttagaaagag gagaaaagat ttcagagaag cttatagaca taccaactcg 3421 atttactttt acgacagaaa tcactcaagt tggaaaactt gaaccttctt tgcaaaaggt 3481 tttacctaag aaggaagaaa agaaatttta taaggaagag gatatcatac taccagaata 3541 tgctcatctt aaaactccta tccatataag aaaagatatt gagaaactaa gaaattctgt 3601 taatgctaaa aagacgaatt cgcctgctat agaaattaat gtttttactc gagatacaga 3661 atttatgaaa gattcaataa ggtatgctga tatggtggtc agaaatgctg actttgtgcc 3721 gttggaggtg tattggacta cttttagaga tttggatgaa agacagaaaa agtggtattt 3781 ttattggaga tatcaagcac taaacggcaa ttatttggat actgatctaa gctacgtaat 3841 cttatttgtt tatgaactga taaactatac tttcaatcaa aatgctgcgt tcaatgttag 3901 tatgatggtt cgcttacggg aggcatacaa ggatagactt cctgctctgg ataaatatat 3961 tgtgccctgg ataagggata tattagtaga attgaatgaa attgaattag cttataaatg 4021 gggattagga gcagaaccat attctggact caatttttat cgcattttta aagaacacca 4081 aggtgatatt agcaagatac ctatggagga atggagaaag gttgtatatg gatactcaga 4141 aaccaccttt tttaaagcaa atgcccaaaa agtatatgct gtttttgaac aagctttaaa 4201 attatttcaa aagataaatg cagaagaagg gttagatctg gagaaagcct ggttcagacc 4261 agaagaaaag atagagaact atcgcttttt taatagtgca gtaataggtc gaaatgtttc 4321 aagccgggtt ataaagtact taaaatatgt gcctacagat tatttttata atgaagtaac 4381 agctttgttc cggctttcag aaaatgtcac tcgcttgctc gctggagtta ccaggcagct 4441 tcaagtaaat gaagaattgt tgcctcctgg gttcaaggaa gctttattag aggaaataag 4501 gagattagat ctaacggaga atgtaggact aaaaagccgt ttttctcctg ataaaaaaat 4561 aaagaatcgt ttttatcaag tagcatcaaa agagaatgag gaatcgaaac aaactatacc 4621 taaaagaaca acccaaacta taggaatagg cagcgaaaaa attaaacctg aactggacct 4681 gctgcaaata gacattcccg cacataggtc tagcatcagc ttggctgatg aagaagttaa 4741 tgtagaagga tttatttctt ccttaacaga agaggaatct aaatttatta gcacattttc 4801 caataataag aaaagcataa atgaagcaga ggagcaatta agagctcaag gtgttcctgt 4861 aacaattttt gtcgagcaga taaatgctaa ggcggaagaa tatttagaag atgtctttat 4921 tgagcttata ggagaagaat atgtgataaa cgaagaattg gtaactgtat gggaagaaat 4981 aaagaggagg aagcagcatg aaaattaaaa ggagagattc agcagatatt ttaaatgcat 5041 tggcaggtgg agtggttcct aaaagaggtc ttcagtatat aatggtgggc cgtgaggcgg 5101 aaatgaaaca aataagagaa gagttaagag atataagaga aaatggaaac tctatgatta 5161 ggttttttat cggcacctat gggactggga aaagttttat gcaaaatttt attagacaag 5221 tggctttaga agaaggattt gtagttacca atgcggattt tactccccat agaaggttat 5281 atgggagcga taatcaagct ttagcattgt ataatgaact gataaaaaat ctatcaacca 5341 agtctgcacc ccaaggaaat gccttgccta ttattttaga ccagtagata atgagtttac 5401 aaaataaggt aatggaaaac ctagattatg aagataaaac tgttttggaa gacaatgtat 5461 ttgtgcgagc agtagagaaa gaaattgtta aggctgtttc tcatttagat gagttaacgg 5521 gtggttacga ttttgcaaaa gttttaagta tttactataa aagttttgta gagcaagata 5581 aagagaaaca acgtcaagct ttgaggtggc tcagaggaga atatttgact aaaagcgatg 5641 cactgcgaga cttaggaatt agagagatta ttgatgatag caattattat gctcacttaa 5701 aagtattatg taaatttgtg aggcaagcag ggtattcggg cttgattatc aatttagatg 5761 aagcggtgaa tctatataag attactcata gagaagccag agaaaaaaac tatgactata 5821 ttcttacgat ctacaatgac attttacaag gttcagttga ggggttatat ataacgttca 5881 gcggtacccc cgaattttta gaagatgagc gccgtgggct ttatagctac caggcattaa 5941 aacggcgttt gaaaccgacg gtagaaaatg aaaaatatca agatttaaaa caggcagtga 6001 ttaaattgac tccccttact cctgaagaga ccttgatatt attgatgaat ataagggata 6061 tccacgcagc tcattatggt tatgaaataa atgtgatgga cgaagaaatt cggagatatt 6121 tgctgtggat atacaagcga cctggcgcta aagagcacat tatcttagga gatgtggtca 6181 ggcagtttat cagctttttg aatattaaaa tggaacaccc tactttaaat tttgaagaat 6241 tatatatggg cgaagagact agtgaaaaca acttgccaga agaagttatc gatatacata 6301 agcgttttaa aagaacccag ctttcatgac ctgggaggta gtaaatatga gccaaatatt 6361 ttataagcta tcagataaag tacaaaagaa aatatgggac attggatgga aacattttac 6421 tcctattcaa gaaaaagcaa ttcctgtgat tatagataca gaaaaagatg tggttttatc 6481 ttcgggcaca gcttcaggaa aaaccgaggc tgcttttttg ccaatcataa gcaaaattca 6541 cgagacagct tctaacgttc tgaaagttct ttatgtttct cctctaaagg ctttgattaa 6601 taatcaattt gaacgacttc agaaattgtg tgaagagatg aatattcctg ttcataggtg 6661 gcatggagac gtgagccagc acagtaagaa aaaattgatt aataatcccg ctggcatatt 6721 gcagattact cccgaatcca ttgagagctt gttcataaac agaacacaat ttttaaaaca 6781 attattccag gaacttgaat ttatcgtaat agacgaactc cacgctttta ttgatacaga 6841 aagaggagtc caacttcgct ccctcttatc tcggattaaa caatatacta agaggtgccc 6901 taggattatt ggattatcag caacaatcga taacttttct ctgattaaaa agtggattaa 6961 ctgcaacaat ccagataatg tggagattat tgaagtgaag gggtttgaga gggatatcta 7021 ttatagtttg atgcattttg aaaaaagtaa aacaggaaat tatcctcttg aattatatga 7081 agatattcta gaattgaccc gaaattatac ctctttgatt ttttttaata gtcgggcggc 7141 agtagaggag gccacagtaa ttttgaatcg attagctcaa agggagaaac tgggagaaag 7201 gtattttgcc catcattctt caatagctaa ggcagaacgg gaatttgtgg agaagctgat 7261 gtcagaatct acggggatta aaagcgttat agcaacaagc tcattagaac taggcatcga 7321 tataggggaa atcgatttgg taatacaggt agacagtaca tttacagttt cctctttaaa 7381 gcagagattg ggtaggtcag ggagaaagca aggagagggt cagtatttac aaatgtatac 7441 cacagacaaa tatggattac tacaatctat tgcagtaatg gatctcttgt tgcaaggctg 7501 gactgaaccc tgcaaaggtt atccataccc atatgatatt ttatttcatc aaattatttc 7561 tatatgccac caactgaatg gtattcctct tgagaaactt gtttcattag taagtgaaaa 7621 tgctgcattt tatgaactgc cagaatcaga tatccgtatg ttggttgagc acatgatcgg 7681 taaggaatat ttagaaatat tggccggtac acaagaatta attgtaggat tagaagggga 7741 acgattactg agacaaaaag atttttactc cgtctttatg actcccgaag tctatgaagt 7801 cttttacgga actaaaaata taggggaaat agaaaaaact tttcttttaa acgaaggaga 7861 caatattatt ttggctggac gattgtggaa aatagaagaa atagactttc atagaaataa 7921 agtatatgta aaaaaagcga tggatggaaa gcctccaaga tattcaggtg gactagcacc 7981 attgcacccc cgtattccag agcgcatgca cgaaatattg tgcttagatt gtaagtttga 8041 ttttattgat gatagggctc agactgcttt agaagaatta aaggtgcctt ataagtattt 8101 taacgttaag ccagacgaaa ggattatctg gcaaacgaaa gagaagttac tttttgaaac 8161 ttttactggc acaaatatct ttagaacttt gatatggatg ttgcgttatt atggagttga 8221 cgaagtgaaa acagacggaa ttggacgtat ggagatccca cttaatgatg aattcattga 8281 tattttacag gatattaaga gtagaaaatg gtctttaaga agtttattgc cctatactaa 8341 agaagaggaa tttttcgtct ccaagtatag cgattttctt ccttcggaat tgcaaataaa 8401 aatgcacgga gcttataatg tagatatcga aggggtattg aaatttttag ataaatttcg 8461 tattagaata ataagcttgg aataataatt gaaataatgg tgtttgggaa taatctactt 8521 gatttgtaag agtactcagt aagaaaagta ttttcttgtc atttacaagg gtagctaatt 8581 gggagagaag atcaatataa tttcaagcaa taagaaaata gtttttcttt aagcgtgaaa 8641 tatatcccac ttaaaagatt tgcggcaaaa agaaaaataa tccctccaaa aaattatgtg 8701 gagaaaaata aagaaatatt agggagatga ttatgatgac ggtagaaatt aaaatcatag 8761 aaaacccatt aagtgattgg aaactgggag acccttgttc aatatgcaat aggatgtttt 8821 cttacacgga agcggaatat gttgctgtcg tttacgtgga tgaagaaaga gactttattt 8881 gcggggattg tctcaagaag gggcctgaag caatcaagaa ggcagcgcaa aagcgtgctc 8941 aagaaatccg ggacgaaatt cggcttgggc taaaagaagc ggagttgtta gaaaagattg 9001 cttcaggcga tattgtttac ccctgggatg accaagaaaa gttttccaag tgtgctaata 9061 agtagtttgt ctggctaatg tggagcttta tcccttcccc cctttggttg atatataagc 9121 cctgaaagga tgaaagtaaa atggaaccta aagcctattc ttacatccgc ttctcttccc 9181 cggaacagga gaagggagac agtctaagaa ggcaaattca gttatccgaa gaatactgca 9241 aacagcatgg ccttatccta gacgatacac ttaaacttac agaccgtgga ctatcagcct 9301 tcaaaggcat tcaccgtacc aagggagcat taggggaatt cctcagattg gtggaagaag 9361 ggaaaatccc tccaggttcg gttctgctag tagaaaacct ggacaggctt tctagggagc 9421 aaatccttga tgcacttaat cagtttacaa gtatcattaa agcaggaatt aaaatcgtaa 9481 cactgcaaga cgggatggaa tatgaccagg aaagcattaa tcagaactgg gcacagctta 9541 taatttctat cacttatatg gcccgggcac acgatgaatc agaaaccaag tctaaacgta 9601 tatcagccgt ttgggagaac aaaaggagta aagccggcaa tggaggcgaa aagctgaccg 9661 caaaagcccc agcgtggcta aaactttctc aagacagaac taaatttatc ttaattcctg 9721 aagcagccaa ggcgattgag ctaattttcc gtaaaaagtt agccgggaaa ggcgcagaaa 9781 ggattgcccg ggaattaaat gaagacccga acatttggga accgcccaga acaggcccta 9841 aaaagacagg aggctggaga ggttcatata taaacaagat tttaagaagc cgggctgtta 9901 ttggggaatt ccagccacat aaattagttg atggcaagag gcaacccata ggtgacccta 9961 taccggatta ttttccacca gtcattgata aggaattgtt ttaccaggtg caggctcaat 10021 tacaagctaa tgcagagaaa aaaggcaatg ctggaggcag gacgggtaaa gtctcaaacc 10081 ttttcaccca tgtcattaaa tgcggtttat gtggttatcc catgcatttt ataaacaaag 10141 gcaaaccgcc aaaaggcggt aaataccttg tctgtgatgc ttctaggcgg ttgaaaacct 10201 gtactgctaa acctattcga tatgaggaat ttgagcaatt attttttgat aacttcgagg 10261 aactggacat cagccagcta ataccggggt aagatgaaac ccaggccaga ataaatgagt 10321 tagaaaaact tctaacagtt aataggcaga ggctgcttga aattgacagt aaagtggaga 10381 acttctccga caccatcgga cgaacaaagg acagcagaat cagggaacag cttgaaaaga 10441 agctatccca ggcctttgat gataaagaaa gcttagagag cgagaataag aaatttgaac 10501 gggaaataac ggaattacgg caacaaaagg ccgggctgga aaaaaacatt gaacaggcta 10561 aagaaatata tcagttatta aattccgccc aaggtgagac agagagaatt gaactacgct 10621 tgcgcttgcg ccagcagatt cagaaatcta ttgaatggat taaaatttat ccgcttcagg 10681 aaccttatca ggaaatacag gaaaccgaag aacccggcat tgttaagatt atgaaaagca 10741 aatatattga caaggtgcga attaagtttc ggggaagccg agacctccgg gtgctatacc 10801 taaagaacca tgcagaactg agcgaatagc ataaaaccgt ttataatatt ctgccatgtt 10861 atcaccctgt ttgtatcgta cctatgagga attgaaatga taaaaaatgt tggtggtctt 10921 tgatggccac caagtggttt gtatcgtacc tatgaggaat tgaaattaaa ttactgcaat 10981 atctctgata tacctgaagc tcgtttgtat cgtacctatg aggaattgaa atttgaaaac 11041 attgtacagg caatcgcgcg tgactgtcta ggtttgtatc gtacctatga ggaattgaaa 11101 tttgccggca ctgtcggtaa gatcccattc tgccggagtt tgtatcgtac ctatgaggaa 11161 ttgaaaattc ttcccccttc ctgctcagca cttcaatagc ttcgtttgta tcgtacctat 11221 gaggaattga aaagcctgcc actgctccca tctgaaacct tcctcctctt gtttgtatcg 11281 tacctatgag gaattgaaaa tcctattcat aggtactggg aaacccagca tgtttgtgtt 11341 tgtatcgtac ctatgaggaa ttgaaaattg gtgtttccga ggtctgcaat tgcgccagca 11401 acaggtttgt atcgtaccta tgaggaattg aaatttaaac aagctgccat tgaagcggtt 11461 gctgcttcca atccgtttgt atcgtaccta tgaggaattg aaataacttg aaaacattgg 11521 cattggaatc agtgaaataa gtttgtatcg tacctatgag gaattgaaat tattttcagc 11581 ttcttgctct gtgttatact taccaagcca gtttgtatcg tacctatgag aaattgaaat 11641 ggttctaata catgcataat cgaaatgttc gaaggggttt gtatcgtacc tatgaggaat 11701 tgaaatactg caagatatgg ctttccgtca acttcataat gagtttgtat cgtacctatg 11761 aggaattgaa ataaagcaaa agcgattgca gctcttgaaa aagcaaaagg gtttgtatcg 11821 tacctatgag gaattgaaat cgattgacag cagagaaata gcagacatgt tggaaatgtt 11881 tgtatcgtac ctatgaggaa ttgaaattgc gcaaaccgtt ttccacacaa aaaaccgttc 11941 cgtggtttgt atcgtaccta tgaggaattg aaattctttg ttaatctcta ctcttctcaa 12001 atcaccgttc caggtttgta tcgtacctat gaggaattga aatctatttt ttcattggat 12061 tgattccaca gccattcttc gtttgtatcg tacctatgag gaattgaaat tttgtgtttt 12121 actctggctt ggtattcacg gagtagtttg tatcgtacct atgaggaatt gaaatgggtc 12181 gaagggctca tagttgcctt ggaaacctat gcgtttgtat cgtacctatg aggaattgaa 12241 atacagcagg attaaagaaa catttatttt cgtgttctcg tttgtatcgt acctatgagg 12301 aattgaaatt ttcattccat caacatataa agatgaaagc ggtaaagttt gtatcgtacc 12361 tatgaggaat tgaaattaga gtattccaaa ctgcagaagt gggaggatac aagtttgtat 12421 cgtacctatg aggaattgaa attttctctc ttttctggca ggtaatccac ttggaatatg 12481 gtttgtatcg tacctatgag gaattgaaat gaggattttt tgaaaattgg gagagtcgca 12541 ggagaagttt gtatcgtacc tatgaggaat tgaaactccc aagtatctgt atctaactga 12601 tatcctgcag gacctgtgtg tatcgtacct atgaagaatt agaattaagt atcatctata 12661 taatcaaatc tattataacc agtttttatc ctagatgtaa caaaatgaga cttaataact 12721 atgatgcctt tagcaatttc acttctgttt ctgttgcact tgtgatgaat tgaaataggc 12781 agtaaatcta attttattaa tatacaataa ttgcctttct tgtacctaca ataaaatagg 12841 acaaagtttt gccttttgtc ttcatatact ttatgtcaat acgctttttg aatttacgac 12901 aaattgtaca atttacttct taaattctat tctctgtatc attccgttat aaaaactaaa 12961 tgtaaaagat taaaaatcaa aattaaattt gattattatg catcttatgg taatatactt 13021 atgtaacttt aagttgttaa ttggaaaata aactatgttc gttacgttac taatttgaaa 13081 ggtttggttt gattccaagc tgtgcaaaat gagatgtttt gcacatggtt aaaggatgtg 13141 aggaaatgta ggaacgatat gcaaaattat acagtattct gacattatca aaaaattaaa 13201 aaagattgca aaaaaatagt ttacctaaaa ttgattatgc tgaaaagagg gaggattaaa 13261 atgaaaaaaa atattttttt taagaaga //