LOCUS NZ_ACVX01000064 4799 bp DNA linear CON 10-NOV-2010 DEFINITION Clostridium thermocellum DSM 2360 ctg00235, whole genome shotgun sequence. ACCESSION NZ_ACVX01000064 NZ_ACVX00000000 VERSION NZ_ACVX01000064.1 GI:256006105 KEYWORDS WGS. SOURCE Clostridium thermocellum DSM 2360 ORGANISM Clostridium thermocellum DSM 2360 Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae; Clostridium. COMMENT PREDICTED REFSEQ: This record has not been reviewed and the function is unknown. The reference sequence was derived from ACVX01000064. FEATURES Location/Qualifiers source 1..4799 /organism="Clostridium thermocellum DSM 2360" /mol_type="genomic DNA" /strain="DSM 2360" /isolation_source="contaminant of Clostridium thermocellum strain LQ8" /db_xref="taxon:572545" gene complement(6..866) /locus_tag="ClothDRAFT_2896" CDS complement(6..866) /locus_tag="ClothDRAFT_2896" /inference="ab initio prediction:Prodigal:1.4" /note="KEGG: hypothetical protein" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431035.1" /db_xref="GI:256006106" /translation="MNKRLILFIISMLCFTTLTGCGIDRRELVGDIIIGNGYTGIADY LIKYNPAAKEFESVVPGFYYEVEYNEDKSKILCYKSLRYSEILNSEICEYDIKSNEFS EAIFNWSEYPDEFEGNVKYVPNSDSISFILGDALHIYDRSSGTLTKLFKVAFDWYSWD NTGKKLLYGDYDENIYMYDMESKEEKKILEGRHPVYSNSNEYIAYMGKDQKLTVYNVN TGENWKTVTIGSSTRYIFSPDDKYILLGTEYWDIVSIPHYIIYALDYKTGKKKRLFGG EGNVPSLDWK" misc_feature complement(<675..>866) /locus_tag="ClothDRAFT_2896" /note="Phosphoinositide 3-kinase (PI3K)-like family, catalytic domain; The PI3K-like catalytic domain family is part of a larger superfamily that includes the catalytic domains of other kinases such as the typical serine/threonine/tyrosine protein kinases (...; Region: PI3Kc_like; cl00119" /db_xref="CDD:163723" sig_peptide complement(804..866) /locus_tag="ClothDRAFT_2896" /note="Signal predicted by SignalP 3.0 HMM (Signal peptide probabilty 0.949) with cleavage site probability 0.775 at residue 21" misc_feature complement(<12..512) /locus_tag="ClothDRAFT_2896" /note="WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues...; Region: WD40; cl02567" /db_xref="CDD:154987" misc_feature complement(order(39..41,75..80,114..116,135..137,174..176, 219..224,240..242,255..257,294..296,330..335,351..353, 363..365,408..413,447..452,465..467,477..479)) /locus_tag="ClothDRAFT_2896" /note="structural tetrad; other site" /db_xref="CDD:29257" gene complement(1376..1873) /locus_tag="ClothDRAFT_2897" CDS complement(1376..1873) /locus_tag="ClothDRAFT_2897" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431036.1" /db_xref="GI:256006107" /translation="MKNGKKVAWMLVSVCFLSMIALVIIYVNISPPVEGWKDFKKNCI SNYSFVDDVNLDRITPVDFRISYTLNRKITQEEVDSVFSWTTKYIQSEKVFSDLKKYH AKRYRYSFARLAIVFTYRDNNEHFECNIFSSPVSNGEPNYADYKTWYIEYNGKSSEVY NPMLK" sig_peptide complement(1802..1873) /locus_tag="ClothDRAFT_2897" /note="Signal predicted by SignalP 3.0 HMM (Signal peptide probabilty 0.763) with cleavage site probability 0.686 at residue 24" gene complement(1915..2712) /locus_tag="ClothDRAFT_2898" CDS complement(1915..2712) /locus_tag="ClothDRAFT_2898" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431037.1" /db_xref="GI:256006108" /translation="MPSLDWNSDRYKNIGKDETCNEDIVKTSLTNTDFLKIVDDGKVY YGGNQNWFQKYTQSFGGCGPTAAANILAYMAMTDPKFAKLYEYDLKNITKADFVKFME EVYKYVTPLEVPVFSHMSDKKGKQAGIPSLGITGLAAFAKGVEKFAKSRGIKLKAKWS GEKPTFDNAVSYIREGLRKNRPVALLNMFNPVSMQWADPQTSKIKSMTYERHWVTITG MIENRKTGEVTLEVSTWGGKATLSFNELYNNMDWNEMIFPAGIIYFE" gene complement(3094..3471) /locus_tag="ClothDRAFT_2899" CDS complement(3094..3471) /locus_tag="ClothDRAFT_2899" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431038.1" /db_xref="GI:256006109" /translation="MSLIMLLNVGIGNVYADETGKNALNFRKIYKEHRTYSSAVGISA NSLGDIAIGFNDDYINVYDKQGSFKYSFAFEVNGNYFFEFDNENNIVIFSVTDGMRYY FNNDAELIKTEKISDPEELKKLL" gene 4324..4464 /locus_tag="ClothDRAFT_2900" CDS 4324..4464 /locus_tag="ClothDRAFT_2900" /inference="similar to AA sequence:KEGG:GSPATT00007287001" /note="KEGG: hypothetical protein" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431039.1" /db_xref="GI:256006110" /db_xref="InterPro:IPR013026" /translation="MNKVNEAIECYKPGIKNNPKELSFYMSLSDLLLYAGNVSEAMEC LN" gene 4575..>4799 /locus_tag="ClothDRAFT_2901" CDS 4575..>4799 /locus_tag="ClothDRAFT_2901" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431040.1" /db_xref="GI:256006111" /translation="MWKVVQENYGSVLGCKTIEASLVYDNKMYYRLYTAYDADSKNLK PKVFKPGMLVNVIKQEQYNFTFRYYYGCQLI" ORIGIN 1 tcctcctatt tccaatcaag gctgggaaca tttccctcac cgccaaataa tctttttttc 61 tttcccgtct tataatccag agcatatatt atataatgtg gaatacttac tatgtcccaa 121 tattccgttc ccaatagaat atatttgtca tccggagaaa aaatatatct tgtactactt 181 ccaattgtta cagttttcca attttctcct gtgttgacat tataaacagt taacttctga 241 tcttttccca tatatgcgat atattcattg ctgtttgagt aaacgggatg tctcccctct 301 aaaattttct tctcttcttt actctccata tcatacatat atatattttc atcataatca 361 ccataaagca gttttttccc tgtattatcc catgagtacc aatcaaacgc tactttaaat 421 aatttagtga gagttcctga tgacctgtca taaatatgca gtgcatcacc caaaatgaaa 481 ctaatgctgt cggaatttgg cacatattta acattacctt caaactcatc cgggtattca 541 ctccaattaa aaatagcttc actaaactca ttagacttaa tatcatactc acatatttct 601 gaattcagta tctcactata tcttaaagac ttatagcata atatctttga cttatcctca 661 ttatattcca cttcatagta aaagcccggc acaacacttt caaattcttt tgcagcagga 721 ttatatttta taagataatc agcaattccc gtataaccat tacctataat aatatcaccg 781 acaagctctc ttctgtctat tccacatccc gttaaggtag taaagcacag catacttatt 841 ataaatagaa ttaatctctt attcatttat tctctcctcc atttaaatgg attcaaagga 901 aatataggct tatcccccgt attttccaca attcggtctt caacagtcag atttcaaagt 961 ttttacaggc ttcctatagg tattttaagt ctttataaat tctttaactt ctcgtaattt 1021 tcattaaatt cgcttgtgcc acatgctact gttaaagata aaaatacaaa tttgatgtca 1081 attatgtaaa ttataccatc agacactttt ggattcaaca aattctcctg cttggtttca 1141 aatatcttca aatattaaat cttaggataa aatataaaaa agactgccaa ctaaatccct 1201 tttataagag aaatacttgt cagtccgttg tatcatctac agtttgcttc tacgcataaa 1261 attaatttca ttatactcat gcgcacaaat ttataagttg tattttttta tttctaactc 1321 tctgatttgg attataaaat atttataaaa acgctctctt ttcccgacat taaaattact 1381 ttaacattgg attgtacact tctgaagatt taccattata ttcaatatac catgttttat 1441 agtcggcata attgggctcc ccatttgaaa caggtgaaga aaaaatatta cattcaaaat 1501 gttcattatt gtctctgtat gtaaaaacaa ttgctaatct agcaaaacta tacctatatc 1561 ttttagcatg gtattttttt aaatcgctaa ataccttttc cgattgtata tattttgtcg 1621 tccaggaaaa tacactgtct acttcttctt gagttatttt tctgtttaaa gtgtagctaa 1681 tacgaaaatc tacaggcgta attctgtcca agttcacatc gtcaacaaat gaataattgc 1741 tgatacaatt cttcttaaaa tccttccatc cctctaccgg cggactaatg ttcacataaa 1801 taattactaa tgcaatcatc gaaagaaaac aaacagatac aagcatccaa gcaacttttt 1861 ttccgttttt cattggtagc ctcctcaata caaactatac aacccatgct ttttctattc 1921 aaaatatatt atccctgcag gaaaaatcat ctcattccaa tccatgttat tatataactc 1981 attaaaactc aacgttgctt ttcctcccca cgttgacacc tcaagggtta cctctcccgt 2041 ctttctattt tcaatcatac cggtaatagt tacccaatgc cgttcatagg tcattgattt 2101 aattttactt gtttgcggat cggcccactg catactaacc ggattaaaca tattcaggag 2161 cgcaacaggt ctgttttttc tcaatccttc ccgaatgtag cttacagcat tatcgaaagt 2221 tggcttttca ccactccatt ttgctttcag ctttatccct ctacttttgg caaatttctc 2281 aactccttta gcaaacgcag ccaaaccggt aatacctaag gacggtattc ccgcttgttt 2341 gcctttttta tcactcatat ggctaaaaac cgggacttcc aatggagtca catatttata 2401 tacttcttcc ataaacttca caaaatctgc tttagttata tttttcaaat catattcata 2461 cagttttgca aatttcgggt ccgtcattgc catatacgcc aatatattgg ctgccgcagt 2521 aggaccacag cctccaaaac tctgagtgta cttttgaaac cagttttggt taccgccgta 2581 atatacttta ccatcatcaa caattttcaa aaaatccgta ttggtaagac ttgttttaac 2641 tatatcttca ttgcaagtct catctttacc tatattttta taacgatctg aattccaatc 2701 caagcttggc atgtttctaa aaatattatt gaattattct cctataaaac agtctattgc 2761 aattatcata cttatgttac ttcaatatat cataaacttc ttttctttga gtaatttcat 2821 ctttgacagt gtctccttca tatcctcttt acacttccgt atattttttc atttccgttg 2881 atatagtttt aataaatccg catattacta tggccagaaa tgccagaacc gttaatgcca 2941 caaatgcctt aacagcgtat tgtaagccgg tttcatatat taccgattca ttaccgtcgg 3001 cgtcggtctt cgcaaattta atatatccaa ggacctgttt tagcgaataa ttaacaccat 3061 caatatttac attttctttg tccgggcgat tttttataat agttttttaa gctcttccgg 3121 atcagagatt ttttctgtct ttattagttc cgcatcgtta ttgaaataat aacgcatacc 3181 atctgtaacc gaaaaaatca cgatattgtt ttcattatca aattcaaaaa aataattgcc 3241 gttcacctca aaagcaaagg aatatttaaa gcttccctgc ttatcataga catttatata 3301 atcatcatta aatcctatag cgatatcacc taaagaatta gccgaaatac caactgctga 3361 tgaatacgtt ctatgctcct tataaatctt cctgaaattc aaggcatttt tgccggtttc 3421 atcggcatat acattgccaa ttcccacatt cagcagcatg attagtgaca taaataaaag 3481 aaatattttt cttttcactc gccatcacca caccaccatt ttcattataa ataccttcac 3541 ttactaagca attagtctaa aaaagtgctt atctatttcc ttcaacacga aactgcacat 3601 ccaaaatata tacttcaata aactacaaca gaaatccaaa taccaatcgc ccccgcaaat 3661 ggatattcaa gaccatccaa cttatcctca catgtgcatt gataatgact aaaatttaat 3721 aaaatatttt ataaatgaaa gattttttca tacaagaaag tgattcattt tgtcagtatc 3781 atattcaaca ccccgcctta tactttttaa ataatcttag ttccaatcta atattggtac 3841 aattataaaa acatctttta attatcccaa agtatcataa tttgaatctc aaaccaaaca 3901 ttataatgct tttaaaaacc ataccataca ttttctgtac ttcaaagaat taaacaaaaa 3961 taatttctat cactttttta gcaatcatgt aaatttcaat attaatataa tttaaaaatg 4021 tttttgaatt atagcttaat aaatctaaat atgtatgctt ctttcttatt tgtgttacat 4081 tagtccatat taatatcata ccaaagaaga taagaaatgc aactatattc cagtactaaa 4141 actaattaat ggatggaaat taaagcttta ttgataagct tttgcaataa tcatctcatt 4201 ttttaaataa tgcttttggt aatttaatca tttgatacaa tgcaaacttt aataaaacag 4261 ggaatcgctc ttgcaccaaa ccatatacgc ttatatgtgt ccaaagcatg gactttgttt 4321 gaaatgaata aagtaaacga agctatcgaa tgttacaagc ctggaataaa gaataacccg 4381 aaagaattgt ccttttatat gtcgttaagt gatctcctgc tttatgcagg caatgtcagc 4441 gaagcaatgg agtgtctaaa ttaagaaagc cattcaatta gacccttagc ttaaagctct 4501 cgcaataaat gataaggact ttaacaatat taataattca actgctttca aggcattgac 4561 aggagtaagt gtttatgtgg aaagttgtcc aggaaaatta cggttctgta ttgggatgta 4621 agactatcga agcatctttg gtttatgaca ataaaatgta ttacagactc tatactgcat 4681 atgatgccga ctctaagaat ctgaagccga aagttttcaa gccgggcatg cttgttaacg 4741 ttatcaaaca ggaacaatat aattttactt ttagatatta ttacggctgc caattgatt //