LOCUS NZ_ACVX01000068 3522 bp DNA linear CON 10-NOV-2010 DEFINITION Clostridium thermocellum DSM 2360 ctg00089, whole genome shotgun sequence. ACCESSION NZ_ACVX01000068 NZ_ACVX00000000 VERSION NZ_ACVX01000068.1 GI:256006128 KEYWORDS WGS. SOURCE Clostridium thermocellum DSM 2360 ORGANISM Clostridium thermocellum DSM 2360 Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae; Clostridium. COMMENT PREDICTED REFSEQ: This record has not been reviewed and the function is unknown. The reference sequence was derived from ACVX01000068. FEATURES Location/Qualifiers source 1..3522 /organism="Clostridium thermocellum DSM 2360" /mol_type="genomic DNA" /strain="DSM 2360" /isolation_source="contaminant of Clostridium thermocellum strain LQ8" /db_xref="taxon:572545" gene complement(145..657) /locus_tag="ClothDRAFT_2915" CDS complement(145..657) /locus_tag="ClothDRAFT_2915" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431054.1" /db_xref="GI:256006129" /translation="MIPNVHKNSIFWEGNIRLHDWDEYFGRELKIILNIGGDSIVDEV TALHKKGYDFLIAEQARILHTVIEAIFDKYPVWQEEYGYEGKEKEILMPDIDNKNELN QLIYPIKIFIMDVEKDGFPYIGIQFDCKWDQEHGVGVMLYKDNVVDIGGSDTAFMSWI AEEDKNRKKS" gene complement(969..1481) /locus_tag="ClothDRAFT_2916" CDS complement(969..1481) /locus_tag="ClothDRAFT_2916" /inference="protein motif:SMART:SM00306" /note="SMART: Hedgehog/intein hint domain protein; KEGG: hch:HCH_02073 rhs family protein" /codon_start=1 /transl_table=11 /product="Hedgehog/intein hint domain protein" /protein_id="ZP_05431055.1" /db_xref="GI:256006130" /db_xref="InterPro:IPR003587" /db_xref="InterPro:IPR006141" /translation="MYDNGKKIDFKCFVAGTMVLTAAGLVAIENIKAGDKVIATNPET FEVAEKTVLETYVRETTELLHLTINGEVIKTTFEHPFYVKDVSFVEAGKLQVGDKLLD SRGNVLVVEEKKLEIADKPVKVYNFKVDDFHTYHVGDNEVLVHNANYVEGDLDGITII IRSMQGKHIS" sig_peptide complement(1398..1481) /locus_tag="ClothDRAFT_2916" /note="Signal predicted by SignalP 3.0 HMM (Signal peptide probabilty 0.606) with cleavage site probability 0.574 at residue 28" misc_feature complement(1044..1448) /locus_tag="ClothDRAFT_2916" /note="Hedgehog/Intein domain, found in Hedgehog proteins as well as proteins which contain inteins and undergo protein splicing (e.g. DnaB, RIR1-2, GyrA and Pol). In protein splicing an intervening polypeptide sequence - the intein - is excised from a...; Region: Hint; cd00081" /db_xref="CDD:73181" misc_feature complement(order(1044..1049,1245..1247,1446..1448)) /locus_tag="ClothDRAFT_2916" /note="protein-splicing catalytic site; other site" /db_xref="CDD:73181" misc_feature complement(order(1245..1247,1254..1256,1446..1448)) /locus_tag="ClothDRAFT_2916" /note="thioester formation/cholesterol transfer; other site" /db_xref="CDD:73181" misc_feature complement(1041..1430) /locus_tag="ClothDRAFT_2916" /note="Protein of unknown function (DUF1557); Region: DUF1557; pfam07591" /db_xref="CDD:148935" gene complement(2104..2580) /locus_tag="ClothDRAFT_2917" CDS complement(2104..2580) /locus_tag="ClothDRAFT_2917" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431056.1" /db_xref="GI:256006131" /translation="MPKLNNIEGNILLEINLLNNDFLDVDEERQDSENWIPFEFVLNV PREKYVYTPDMGATFSVYEIKSLIEKFEQIAENKLSKKNFEKFEFSSSESYFDIIVDD PLEDGEIYMEIWLNIGTITDGELSGYDKGFRFVVKLDTFIEFTSELKRQYKRMMEL" gene complement(2626..2820) /locus_tag="ClothDRAFT_2918" CDS complement(2626..2820) /locus_tag="ClothDRAFT_2918" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431057.1" /db_xref="GI:256006132" /translation="MIGYSVSEISTNDLQYFYNNIKRFLMFEAQKEKIGNVTHFVMRK INQVVKKKTRISHFKNNWEL" gene complement(3026..>3522) /locus_tag="ClothDRAFT_2919" CDS complement(3026..>3522) /locus_tag="ClothDRAFT_2919" /inference="ab initio prediction:Prodigal:1.4" /note="KEGG: nmn:NMCC_1773 hypothetical protein" /codon_start=3 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431058.1" /db_xref="GI:256006133" /db_xref="InterPro:IPR006141" /translation="GFVEAGKLQVGDRLVDSRGNALVLEGKKLEITDKPVKVYNFKVD DFHTYHVAHIGVLVHNASSNYSNGMPEIKKTKHGEKRAKERGFSDEKINDIKNNYSQK VYQSGGRTVFAKKNGNYYDVVIVNKEGVVITTVGGKTKSLKTWKDVLKMLKNNGEISS LPID" misc_feature complement(3338..>3522) /locus_tag="ClothDRAFT_2919" /note="Protein of unknown function (DUF1557); Region: DUF1557; pfam07591" /db_xref="CDD:148935" ORIGIN 1 ttcgtcttcc tcacaatctt tcaattttct atttatctac catataataa aaaccataac 61 acccttattg accttgtata gattggtaac ataaactata tggtgttatg gtcgtcaatc 121 taaatattaa ctattttttc tattctaact tttttttcta ttcttatctt cttcagctat 181 ccaagacata aatgcagtat ctgaaccacc aatatctaca acgttatctt tatataacat 241 tacaccaact ccatgctctt gatcccactt acagtcaaac tgtattccaa tgtatgggaa 301 tccatctttt tcaacatcca taataaatat tttaattgga taaataagct gatttaattc 361 attcttatta tcaatatccg gcataagtat ttctttttct ttaccttcat aaccatattc 421 ttcttgccaa acaggatatt tatcaaatat agcttctata actgtatgta aaatacgtgc 481 ctgttcagca attaaaaaat cataaccctt tttatgcaat gcggtcactt cgtcaacaat 541 gctgtctcca ccaatgttta gtataatttt taattctcgt ccaaaatact catcccaatc 601 atgtaatcgt atgtttcctt cccagaaaat actattttta tgaacattag gtatcattaa 661 ctccacctct ttattatttt atggccttat tcccttcctt attaatgcag cgccacccgt 721 atgtttcact gctccatgta aatcagatgg tacaagcatc atagtaattc catcttcgac 781 atgatgccaa gtataccctt ttggtgttga tttatatcct gctgcttgat tagctttaat 841 aaaatcatag tatgtgtcac cttgtaatcc ttcaactttg actgtcttct tactataggg 901 actaaaatct ggaaaacctt cattcgtaaa tttaacacca tctggatact ttaatgctaa 961 atcaccactt aacttatatg tttgccctgc atacttctta ttataatagt aataccgtct 1021 aagtctcctt caacataatt tgcattatgc accaatactt cattatcgcc aacatgataa 1081 gtatggaagt catctacttt aaaattataa actttaacag gtttatctgc aatctctagc 1141 tttttctctt ccaccactaa aacattgcct cttgaatcaa gcagtttatc tcctacctgc 1201 agttttcctg cttcgacaaa gctcacatct ttaacataaa acggatgctc aaaggttgtc 1261 ttgattacct ctccattgat tgtcaaatgc aaaagctccg ttgtctctct cacatatgtc 1321 tcaagcaccg tcttctccgc tacttcaaaa gtctccggat tcgtcgcaat taccttgtct 1381 cctgccttga tattctctat cgcaaccaag cctgccgctg tcaataccat cgtacccgca 1441 acaaagcatt tgaaatctat tttcttgccg ttatcataca ccttgtaccg gttttcgtcg 1501 actaatttgt tgatttttga aacagtaatt ggtatgatac ttcaatttag cttaaagaaa 1561 ttcttgaata atgtctaaaa atatctttta ggtatgtcac atttacaata cttttgaaat 1621 tatttctctt gatcatgtta ttcatttctt cttttgataa tgttaacata agaaaatctc 1681 ttccttggat actatttgta attcttgcca agaaagaaac ttttcaatct ttttgtaggt 1741 aaagtgagac agatatgctt aaggtctact catgcggatt tccacctgtt ctcctccatt 1801 atcttgccca accgcaccac agaattattt atattcccta agaagtatca taattttatt 1861 ataaagtcaa cagtttatag tacaagcagg aagcccaagc cagtctagct tacaaactct 1921 tgctgcacca acaaaaatac cactgtcttc ttcaccgtta taacttaaat atatcatgct 1981 attaccagtt ttcattaatt tggtaatgca attgtgttta acttactttt ctgttttgtc 2041 agtcttaatt ttttagtatt attatactat gatttcaaat ttcccacgac agattcttct 2101 ttttcaaagt tccatcatac gtttatattg cctttttaat tcacttgtaa attcgataaa 2161 tgtatctaat tttaccacaa acctaaaccc tttgtcataa ccacttaatt caccgtcagt 2221 aattgtgcct atatttaacc aaatttccat gtatatttct ccatcttcca atgggtcatc 2281 cactataatg tcaaaatagg attcagaact tgaaaattca aatttctcaa agtttttttt 2341 agatagttta ttttctgcta tttgctcaaa tttttcaatc aaacttttaa tctcatatac 2401 actaaaagtt gctcccatat caggcgtata aacatatttt tcccgtggaa catttaagac 2461 aaattcaaat ggaatccaat tctcactatc ttgtctttcc tcatcaacat caagaaaatc 2521 attattaagc aagttaattt ctaacaaaat attaccctct atattgttta atttaggcat 2581 ataactcccc cttaattatt cttgaaatat ttttcttttc tgcttttata gctcccaatt 2641 atttttaaaa tgagaaattc tagttttctt ttttactact tgattaattt ttctcattac 2701 aaagtgcgtc acgttcccta ttttctcctt ttgagcttca aacattaaaa atctttttat 2761 gttattatag aaatattgta aatcattagt cgatatttca gaaactgaat acccaatcaa 2821 agtacactcc tctttttata tcaactctaa caatcagagt tctttctatg atttacatta 2881 tccctttatt ctaagtatac ttcatactaa atgttctttc gctttctcta atctattcac 2941 tgtccatgca actctcgtct taaattctac aatatggcat ccttttttca aagtttattt 3001 cattttagta caagaatact ctttcttaat ctattggcag tgaactaatc tctccattgt 3061 tttttaacat ttttaaaaca tctttccaag tttttaatga tttagttttt cctcctactg 3121 tcgttattac aacaccttcc ttattaacta taactacatc ataataattg ccattctttt 3181 ttgcaaatac agttctaccc cctgattgat agactttttg tgaataatta ttcttaatat 3241 catttatttt ttcatcacta aagcctcgct ctttagctct cttctctccg tgtttagttt 3301 ttttaatttc gggcattcca ttactatagt ttgaacttgc attatgcacc aatacaccaa 3361 tatgtgcaac atgataagta tgaaaatcat ccactttgaa gttgtaaacc tttacaggct 3421 tatctgttat ttcaagcttt ttaccttcca ataccaaagc attgcctctt gaatcaacca 3481 atctgtctcc tacctgcagt tttcctgctt cgacaaagcc ta //