LOCUS NZ_ACVX01000069 3427 bp DNA linear CON 10-NOV-2010 DEFINITION Clostridium thermocellum DSM 2360 ctg00253, whole genome shotgun sequence. ACCESSION NZ_ACVX01000069 NZ_ACVX00000000 VERSION NZ_ACVX01000069.1 GI:256006134 KEYWORDS WGS. SOURCE Clostridium thermocellum DSM 2360 ORGANISM Clostridium thermocellum DSM 2360 Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae; Clostridium. COMMENT PREDICTED REFSEQ: This record has not been reviewed and the function is unknown. The reference sequence was derived from ACVX01000069. FEATURES Location/Qualifiers source 1..3427 /organism="Clostridium thermocellum DSM 2360" /mol_type="genomic DNA" /strain="DSM 2360" /isolation_source="contaminant of Clostridium thermocellum strain LQ8" /db_xref="taxon:572545" gene <1..889 /locus_tag="ClothDRAFT_2920" CDS <1..889 /locus_tag="ClothDRAFT_2920" /inference="ab initio prediction:Prodigal:1.4" /note="KEGG: vei:Veis_0254 hypothetical protein" /codon_start=2 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431059.1" /db_xref="GI:256006135" /db_xref="InterPro:IPR006141" /translation="AAGLVAIENIKAGDKVIATNPETFEVAEKTVLETYVRETTEFLH LTINGEVIKTTFEHPFYVKDVGFVEAGKLQVGDKLVDSKGNLLVVEEKKLEITDEPVK VYNFKVDDFHTYHVGKKGILVHNADYNPKMGFDDLDLEKATNKQKGNYGEYLADDNLI NNPKLKEAGYDLERIGGKVPTSPDDKITKGIDGIYINKNPNSNIKYVIDEAKFGKAGL SAKTRDGKQMSDSWLKGVRSGDNRILKAVNNDKQLARDIMRALRNNRIERVLSKVDAN GKVTTYRLDSSGNIIGIWP" misc_feature 2..379 /locus_tag="ClothDRAFT_2920" /note="Protein of unknown function (DUF1557); Region: DUF1557; pfam07591" /db_xref="CDD:148935" misc_feature 8..241 /locus_tag="ClothDRAFT_2920" /note="Hedgehog/Intein domain, found in Hedgehog proteins as well as proteins which contain inteins and undergo protein splicing (e.g. DnaB, RIR1-2, GyrA and Pol). In protein splicing an intervening polypeptide sequence - the intein - is excised from a...; Region: Hint; cl12032" /db_xref="CDD:175391" gene 913..2151 /locus_tag="ClothDRAFT_2921" CDS 913..2151 /locus_tag="ClothDRAFT_2921" /inference="protein motif:PFAM:PF08928" /note="PFAM: Domain of unknown function DUF1910; Domain of unknown function DUF1911; KEGG: aha:AHA_1829 hypothetical protein" /codon_start=1 /transl_table=11 /product="protein of unknown function DUF1910" /protein_id="ZP_05431060.1" /db_xref="GI:256006136" /db_xref="InterPro:IPR015024" /db_xref="InterPro:IPR015025" /translation="MRDPLCNKEDLIETIEFNQQTICEMKEEIEELKADIENGIQRYP RDNQSIIYITFADMFRYGMDMLLAKYSLGNHPDTMIDDYLDNITYLENCGEEEAGYIN LLWMVGLGILLEMDKEVLKRLARVIERQRIEDALMDFLLKACDIGWNHSTTKYEKKNP YEKTAEIIKIALHDKDKEAASKRLEKYMGKEWFKGHYDFGWRNAHKEPGYYGFWSFDT AALAKILGLDDSALKDNNHYPYDLAHYKNGMTFDLSWYSVPKEEEDKEEETVVYGIPG NPELERIIPGKFHSFVNEIINDYKTLPDEEFWKKYNLKEIWFDVEEYKEDNKDKNLLG TIIVFMLVDKDYILQLDYKEELIDYIENIHNYWAKKEVKLISFELDNDQQYYAYVPKD AEVGSLYEVKLTEVEKIEEV" misc_feature 916..1293 /locus_tag="ClothDRAFT_2921" /note="Domain of unknown function (DUF1910); Region: DUF1910; pfam08928" /db_xref="CDD:149863" misc_feature 1297..1638 /locus_tag="ClothDRAFT_2921" /note="Domain of unknown function (DUF1911); Region: DUF1911; pfam08929" /db_xref="CDD:149864" gene 2359..2886 /locus_tag="ClothDRAFT_2922" CDS 2359..2886 /locus_tag="ClothDRAFT_2922" /inference="ab initio prediction:Prodigal:1.4" /note="KEGG: xcb:XC_2059 hypothetical protein" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431061.1" /db_xref="GI:256006137" /translation="MVVNVNIINVNIINVKRYRNRTIAGESQNVHLAVKDKLKKEGRS FELIPEDLDVYKEALDLWLSPNLEEVKSVIDKMILYHSVLVSDIDNEPEFGDYTYGFY PYEILFLMHIRRKLGLPVPDKFEDLLMNTPEAKVVINEPEPYPEWDPLLRAIDEFYRK NYPNYIPNKHGKLFE" gene 2899..3369 /locus_tag="ClothDRAFT_2923" CDS 2899..3369 /locus_tag="ClothDRAFT_2923" /inference="ab initio prediction:Prodigal:1.4" /note="KEGG: sew:SeSA_A2876 hypothetical protein" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431062.1" /db_xref="GI:256006138" /translation="MAMEDIVGIIFEDIEEVKPILSDSEGNDLEGNDLSEAILEYGIS EGKFLCVDYGGEEGSEIINYIMDYEFSHGIELATQEELEELDEMEYDDLTDKIKEVNK ILEKAGYGLFCFPTGSDFYELFIAKLEDKEKLLEEKIVDDEELPLEERYIQYYV" ORIGIN 1 agcggcaggt ttggttgcga tagagaatat caaggcaggg gacaaggtaa ttgcgacgaa 61 tcctgaaact tttgaagtag cggaaaagac ggtgcttgag acatatgtga gagagacaac 121 ggagtttttg catttgacaa tcaatggaga ggtaatcaag acaacctttg agcatccgtt 181 ttatgtaaaa gatgtgggtt ttgttgaagc gggaaaactg caagtaggag ataagttggt 241 tgattcaaaa ggcaatcttt tggtggtgga agagaaaaag cttgagataa cagatgaacc 301 tgttaaggtt tataacttca aagtggatga ttttcatact tatcatgttg ggaaaaaagg 361 gatattggta cataatgcag actataaccc caaaatggga tttgatgatt tggaccttga 421 gaaagctacg aacaaacaaa aaggcaatta tggagagtat ctggcagatg ataatcttat 481 taataatcca aaattgaaag aagcagggta tgatttggag cggataggag gtaaggttcc 541 gacctcaccg gatgataaaa ttacaaaagg gatagacggt atatatataa acaagaatcc 601 taattcaaat attaaatatg tgattgatga agccaaattt ggaaaagcag gactgagtgc 661 aaagacaaga gatggaaaac aaatgtcaga ttcttggcta aagggtgtta gatcagggga 721 taatagaatt ttaaaagcag tgaataatga taaacaatta gcacgtgaca taatgagggc 781 attaagaaat aacagaatag aaagagtatt atccaaagta gatgcaaatg gaaaagtaac 841 aacatataga ctggatagca gtggtaatat aattggaatt tggccataag taattcgaag 901 gaggttacga taatgagaga tccgttatgt aataaagaag acttgataga gacgatagaa 961 tttaaccaac agactatttg cgagatgaaa gaagaaatag aggaactaaa agctgatatc 1021 gaaaatggta tacaaagata tccaagagat aatcagagta taatttatat tacgtttgct 1081 gacatgttta ggtatggtat ggacatgctt ttagcaaaat attccttggg caatcacccc 1141 gatacaatga tagatgacta tttagacaac ataacatatt tagagaattg cggtgaggaa 1201 gaggccggct acattaacct tttatggatg gttggactgg gtatcctttt ggaaatggat 1261 aaagaagtgt taaaaagact ggcaagagtt atagaaaggc aaagaataga agacgcactt 1321 atggattttc tattgaaagc ttgtgatata ggttggaacc acagtacaac gaaatatgaa 1381 aaaaagaacc cgtatgaaaa gacagcagag attataaaaa tagcattaca cgacaaagac 1441 aaggaagcgg catcaaaaag gcttgaaaaa tacatgggaa aagaatggtt caagggacat 1501 tacgactttg ggtggaggaa tgcccataag gaacctggct attatggttt ttggagtttt 1561 gatacagcgg cactggccaa gatactgggg ctggacgaca gtgcgttaaa agacaacaac 1621 cattatcctt atgatttggc acactataaa aatggaatga cctttgattt gagttggtat 1681 agtgtaccaa aggaagagga agataaggaa gaagaaacgg tggtatatgg tataccgggt 1741 aatcctgagt tggagaggat aatacctggg aagtttcaca gttttgtaaa tgagataata 1801 aatgattata aaacactgcc ggacgaagaa ttttggaaga aatacaattt gaaagaaatc 1861 tggtttgatg tggaggagta taaggaggat aataaagata agaatttgct aggaacgatt 1921 atagtattca tgcttgtgga caaagattat attttgcagt tggattataa agaagagtta 1981 atagactata tagagaatat acataattac tgggccaaga aagaagttaa gcttataagc 2041 tttgaattag acaatgacca gcagtactat gcatatgtgc cgaaggatgc ggaggttggt 2101 tcgttgtatg aggtaaaact gacagaagtg gagaaaatag aggaggttta gtgtttattg 2161 tgtaatagtg tgaagaagat gagttgttta tgaagaatct gctgtataat tggatatata 2221 tagtttgatt ttgggaatct ccttcctggc gaaacaaaaa ctataggaca gtatttggga 2281 aggagtattt tttgtgttat tttttttggg aagataatat tgtattgaga ataataagaa 2341 gttttattag gattgtttat ggttgtcaat gttaatataa tcaatgttaa tataatcaat 2401 gttaaaaggt ataggaacag aaccatagca ggggagagtc aaaatgtaca tttggcagtg 2461 aaagataagc tgaaaaaaga ggggcgttca tttgaattaa ttcctgaaga tcttgatgtt 2521 tataaagaag cattggattt atggttgagt ccaaatttgg aagaggttaa aagcgtgatt 2581 gataaaatga tattgtatca ttccgtatta gtttcggaca ttgataacga accggaattt 2641 ggtgattaca cgtatggatt ttatccatat gagatattgt ttttaatgca tataaggagg 2701 aaattaggtt tgccggtacc ggataaattt gaagacttgc tgatgaacac accggaagcg 2761 aaggtggtga ttaatgagcc ggagccatat ccggagtggg atcctttgtt gagagccata 2821 gatgagtttt accgaaagaa ttatccaaat tacattccca acaagcatgg aaaactgttt 2881 gaataggagg aaactgttat ggcaatggaa gatatagttg ggattatatt tgaagacatt 2941 gaggaagtga aaccaatttt aagtgattcg gaaggaaatg atttggaagg aaatgatttg 3001 agtgaggcga tattggaata cgggatatcg gaagggaagt ttctgtgtgt tgattatggt 3061 ggagaagagg ggagcgagat aataaattat ataatggatt atgaattcag tcatggaata 3121 gagcttgcaa cacaggagga gttggaagag ctggacgaga tggagtatga tgatttgaca 3181 gataagataa aagaagtgaa caagatattg gagaaagcag ggtatggact gttttgcttt 3241 ccaacaggaa gtgattttta tgagttgttt atagcgaagt tggaggataa agagaagtta 3301 ttggaggaaa agatagttga tgatgaggag ttgccattgg aagagaggta tattcagtat 3361 tatgtgtaag gggataatct gcagtattta gagttttgga taagaatatg gcttttataa 3421 aaatatt //