LOCUS NZ_ACVX01000067 3559 bp DNA linear CON 10-NOV-2010 DEFINITION Clostridium thermocellum DSM 2360 ctg00259, whole genome shotgun sequence. ACCESSION NZ_ACVX01000067 NZ_ACVX00000000 VERSION NZ_ACVX01000067.1 GI:256006125 KEYWORDS WGS. SOURCE Clostridium thermocellum DSM 2360 ORGANISM Clostridium thermocellum DSM 2360 Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae; Clostridium. COMMENT PREDICTED REFSEQ: This record has not been reviewed and the function is unknown. The reference sequence was derived from ACVX01000067. FEATURES Location/Qualifiers source 1..3559 /organism="Clostridium thermocellum DSM 2360" /mol_type="genomic DNA" /strain="DSM 2360" /isolation_source="contaminant of Clostridium thermocellum strain LQ8" /db_xref="taxon:572545" gene complement(19..2586) /locus_tag="ClothDRAFT_2913" CDS complement(19..2586) /locus_tag="ClothDRAFT_2913" /EC_number="2.4.1.1" /inference="protein motif:TFAM:TIGR02094" /note="KEGG: gsu:GSU0371 carbohydrate phosphorylase family protein; TIGRFAM: alpha-glucan phosphorylase; PFAM: glycosyl transferase family 35" /codon_start=1 /transl_table=11 /product="alpha-glucan phosphorylase" /protein_id="ZP_05431052.1" /db_xref="GI:256006126" /db_xref="InterPro:IPR000811" /db_xref="InterPro:IPR011834" /translation="MYLFGKITVTAVIPDELSKLKDIAYNLWWSWNSEAIDLFREIDL ALWEKLGKNPVRFLKEVSQKKLEAKLKDPDYMQRYKKVVNDFETYMNETDTWFSRNFP DKKDHMVAYFSAEYGLNEVLPIYSGGLGVLSGDHCKSASDLGIPFTAIGLFYKEGYFS QRINSEGWQETIFTPLNPSNLPIQPALNDKGEEVIISVELPGRVVYAKVWVVKVGRVN LYLMDTDIEQNSPYDRGLTARLYGGDQETRIQQEIFLGIGGARVLDALGIKATVYHMN EGHSAFLGLELIRKLVQNHNLPFNQAKEVVASSVIFTTHTPVPAGNDVFPLEMIDRYF GNYWPSLGINRHEFLDLGLRIGEHHNFNMTVLALTLAGQKNGVSELHGAVSRNIFKNV WPGIPEDEIPIGHITNGIHTLTWLSPSIKYLYDKYLDKDWKERLHEKEVWEKVDDIPD EELWKTHCVLKTKMIGYVREKLKEQRAANGESIERIKEVDTLLDSNALTIGFARRFAT YKRANLIFRDLARIQKLLNNPEKPVQIIFAGKAHPADGPAHEIIKHINDIAKQEGFNG KVILVENYNMTLARNLVQGVDIWLNNPRRPLEASGTSGQKVAINGIINFSVLDGWWCE GYNGKNGWAIGDDTFYDNEYHQDNADSESIYNILEKQIIPTFFDRNEKGVPEKWVKIM KESIKSIAAQYSTHRMVQDYINKYYIPAMERYDKIKASNYQFAANISEWKKKVAHLWP QVQIIAEKTANQLKERNFISGESIPIYATVNLGGLEPSDVKVQAYYGSIGKNNSIENP VIVDMDVVERNSDGTYLYSANITLYEGGEYGYTFRVIPNHPDIINPFDLGLIRWIVQ" misc_feature complement(187..2529) /locus_tag="ClothDRAFT_2913" /note="This family is most closely related to the oligosaccharide phosphorylase domain family and other unidentified sequences. Oligosaccharide phosphorylase catalyzes the breakdown of oligosaccharides into glucose-1-phosphate units. They are important...; Region: GT1_Glycogen_Phosphorylase_like; cd04299" /db_xref="CDD:99995" misc_feature complement(order(1867..1869,2392..2394,2413..2421, 2491..2499,2503..2508,2512..2514,2518..2520)) /locus_tag="ClothDRAFT_2913" /note="putative homodimer interface; other site" /db_xref="CDD:99995" misc_feature complement(order(769..771,778..789,793..795,859..864, 976..978,985..987,1000..1002,1078..1086,1090..1092, 1096..1101,1327..1329,1348..1350,1573..1578,1627..1629, 1639..1644,1750..1752,1756..1758,1843..1845,1867..1869, 1873..1878,2200..2208,2329..2331,2335..2337)) /locus_tag="ClothDRAFT_2913" /note="putative active site pocket; other site" /db_xref="CDD:99995" misc_feature complement(460..2262) /locus_tag="ClothDRAFT_2913" /note="alpha-glucan phosphorylases; Region: more_P_ylases; TIGR02094" /db_xref="CDD:162699" gene complement(2909..3442) /locus_tag="ClothDRAFT_2914" CDS complement(2909..3442) /locus_tag="ClothDRAFT_2914" /inference="ab initio prediction:Prodigal:1.4" /note="KEGG: hypothetical protein" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431053.1" /db_xref="GI:256006127" /translation="MTKVAEFKLNKFNSFFINLTALLIFFMGLIILEPVIGKEQWLIY IETAIYSGQILGLFTVLLAVTILHELFHGLAYIIFGAKLKFGIKYLNIYTMDISGTFY TSVQMAVILLFPIFILTILLLAVGILFPEFIYWIIVGIIYNIAGSFGDIFMLVFIIFM GKNCKIKDEEYGFGLYT" sig_peptide complement(3329..3442) /locus_tag="ClothDRAFT_2914" /note="Signal predicted by SignalP 3.0 HMM (Signal peptide probabilty 0.811) with cleavage site probability 0.799 at residue 38" misc_feature complement(2945..3262) /locus_tag="ClothDRAFT_2914" /note="Protein of unknown function (DUF3267); Region: DUF3267; pfam11667" /db_xref="CDD:152103" ORIGIN 1 tgaatttatg agcttttgtt actgtacaat ccatctgata agtcccaagt caaacggatt 61 gataatatcc ggatgattag gaatcactct gaaggtatat ccgtactctc cgccttcata 121 caaagtgatg tttgcagagt agagataagt tccgtcgctg tttctttcca ctacatccat 181 gtcaactatt acaggatttt cgatagagtt gttttttccg atgcttccgt agtaggcctg 241 aacctttacg tccgaaggtt caagacctcc aagattgaca gtggcgtata tcggtatgga 301 ttcaccggat ataaagtttc tttccttcaa ttggtttgca gttttttcag ctattatctg 361 tacctgaggc cacagatgcg ctaccttctt cttccattct gagatattgg ctgcaaattg 421 ataattgctt gcttttatct tatcatatct ttccattgca ggaatataat acttatttat 481 ataatcctga accattctgt gcgtgctgta ttgggcagcg atggatttta ttgattcctt 541 cattattttt acccactttt cgggtacacc tttttcattt ctgtcaaaga aagtaggtat 601 aatttgcttt tccagtatgt tgtaaattga ttcactgtcg gcattatcct gatgatattc 661 gttgtcgtag aaggtatcgt ctccgattgc ccaaccgttt ttgccgttgt aaccttcgca 721 ccaccaaccg tccagtacgc tgaagttgat tattccgttt atagccactt tttgtccgct 781 ggttccgctg gcttcaagag gtcttctcgg gttgttgagc caaatatcca ctccctgaac 841 caaattgcgg gcaagtgtca tattgtagtt ttccactaaa ataactttac cgttgaatcc 901 ttcctgcttt gcaatgtcat tgatatgttt gatgatttca tgagcaggtc cgtctgcagg 961 atgggctttt ccggcaaata ttatctgtac cggtttttcc gggttgttga gcaatttttg 1021 aattcgggca agatctctga atataaggtt tgccctttta taagttgcaa atcttcttgc 1081 aaatcctata gttaaagcat tggagtcaag cagtgtgtca acctctttga ttctttcgat 1141 tgactctccg tttgcagctc tctgctcttt aagtttttcg cgtacatatc caatcatttt 1201 tgttttcagg acgcaatggg ttttccaaag ctcttcgtcg ggaatgtcgt cgaccttctc 1261 ccagacttct ttttcatgaa gccgttcttt ccagtcttta tcaagatatt tgtcgtaaag 1321 atatttaatg cttggagaaa gccatgtaag agtatgaata ccgtttgtga tgtgcccgat 1381 cggtatttcg tcctcaggta ttccaggcca tacatttttg aagatgtttc ttgatactgc 1441 gccgtgaagc tcgcttacgc cgtttttctg tcctgccagt gtcaaggcaa ggacggtcat 1501 gttgaagttg tgatgctctc ctattcttaa tcccaaatct aaaaactcat gtctgtttat 1561 gcccaaagac ggccagtaat ttccgaaata cctgtctatc atttcaagcg ggaacacgtc 1621 gttaccagca ggtacaggtg tatgggttgt gaatataacg gatgaggcga cgacttcttt 1681 ggcctgattg aaaggaagat tatggttttg tactagcttt ctgataagct caaggccaag 1741 gaaagccgaa tgtccttcat tcatgtgata tacggtggct tttatgccta acgcgtcaag 1801 gactcttgca ccgcctattc caaggaagat ttcctgttgt attcttgttt cctggtctcc 1861 gccgtagagt ctggcggtaa gacctctgtc ataaggactg ttctgctcta tatcagtgtc 1921 cattaaatac agattcacac ggcccacctt taccacccag acttttgcgt atacaactct 1981 tccgggtagt tccacactta tgattacctc ttcacctttg tcatttaagg ccggttgtat 2041 tggaaggttt gaagggttta acggagtgaa tatcgtttcc tgccatcctt cagagtttat 2101 gcgctggctg aaatatcctt ctttatagaa caagccgatt gctgtaaagg gtattccgag 2161 gtcacttgcc gatttgcagt ggtcaccgga taatacgcca agcccgcctg aatatatggg 2221 gagtacttca ttcaatccat attccgcaga gaagtaagct accatatggt cttttttgtc 2281 ggggaagttc ctggaaaacc atgtatcggt ttcattcatg taagtttcaa aatcattgac 2341 tacttttttg tatctttgca tataatcagg gtctttaagc ttggcttcaa gctttttctg 2401 gcttacttcc ttgaggaatc ttaccggatt ctttccaagc ttttcccaca aagcaaggtc 2461 gatttctcta aaaaggtcga tagcttcaga gttccatgac caccacaagt tgtacgcgat 2521 gtctttgagc ttggatagtt cgtcaggtat tacagctgtt acggtaattt ttccaaaaag 2581 atacataggc accctccatt ttattatatg ctatattatt atcctttttt gaataataaa 2641 taacataaat atttttttat agaaattttt ataaaaagac agaataattt actttttatt 2701 ttttaacaat ttcactgtga tattctcaag agatttaata ttgaaagcac ggaaagatgg 2761 atcccctccc gcttttagcc gaatctcaca gagtgaaatg gcttggaata cggatatgat 2821 tacctgaatt cttattcaat atcatatcat aattagcttc tttttggtag agttttttga 2881 aaaaatttct ttatattttt tctttatgct atgtatatag cccaaatcca tactcctcat 2941 ccttgatttt gcagtttttg cccataaata ttatgaatac cagcataaaa atgtcaccga 3001 aagatccggc tatgttatat attattccaa ctattatcca gtaaataaat tcaggaaaaa 3061 gaattcctac cgctaaaagt aaaattgtta aaataaaaat tggaaacagt aatatcacag 3121 ccatctgaac acttgtataa aatgtccctg atatatccat cgtataaata tttaaatatt 3181 ttataccgaa tttgagtttt gcaccaaata ttatatatgc aagtccgtga aaaagctcat 3241 ggagtattgt aaccgccaaa aggactgtaa aaagtcctaa aatttgtccg ctgtaaattg 3301 cagtttcaat atatataagc cactgctctt tcccaatcac aggttccagt attattaaac 3361 ccataaaaaa gattaataaa gctgttaagt ttataaaaaa agaattaaat ttgtttaatt 3421 taaattctgc tactttagtc aaattaacac ctctttgcct gtaataaaat tcaatacaaa 3481 ttgtgtaaaa tttaaggatt cgatttaaaa agacataaaa aagcaactta aatatttgtt 3541 atatataatt ggcaaagag //