LOCUS NZ_ACVX01000066 3611 bp DNA linear CON 10-NOV-2010 DEFINITION Clostridium thermocellum DSM 2360 ctg00005, whole genome shotgun sequence. ACCESSION NZ_ACVX01000066 NZ_ACVX00000000 VERSION NZ_ACVX01000066.1 GI:256006119 KEYWORDS WGS. SOURCE Clostridium thermocellum DSM 2360 ORGANISM Clostridium thermocellum DSM 2360 Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae; Clostridium. COMMENT PREDICTED REFSEQ: This record has not been reviewed and the function is unknown. The reference sequence was derived from ACVX01000066. FEATURES Location/Qualifiers source 1..3611 /organism="Clostridium thermocellum DSM 2360" /mol_type="genomic DNA" /strain="DSM 2360" /isolation_source="contaminant of Clostridium thermocellum strain LQ8" /db_xref="taxon:572545" gene complement(<1..184) /locus_tag="ClothDRAFT_2908" CDS complement(<1..184) /locus_tag="ClothDRAFT_2908" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431047.1" /db_xref="GI:256006120" /translation="MPEASVTTSSIARYALEKYVSDHIAKRDGTKILIEINTADATEE DIKNLYDLLSKLFDETK" gene complement(532..1131) /locus_tag="ClothDRAFT_2909" CDS complement(532..1131) /locus_tag="ClothDRAFT_2909" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431048.1" /db_xref="GI:256006121" /translation="MPRGVASVFSTLQNIDMFKQIEVLFNTKGIRLELPNTNKVQVWT TEGEMLNIEKKELLQNTSDISDYLIQFWWPQMDDVAIKLTCQGYLCVCDIYLDGLDES QTKVILDLLIIMTLQRFEIVGFVIDREELVSEFEWNKFFSNKEYLDSHYLELCGLKIF KKYELKEYKTEQLIDFKRDCVYVAIPNRERSTITLYLLC" gene complement(1147..2103) /locus_tag="ClothDRAFT_2910" CDS complement(1147..2103) /locus_tag="ClothDRAFT_2910" /inference="protein motif:SMART:SM00306" /note="SMART: Hedgehog/intein hint domain protein; KEGG: hch:HCH_02073 rhs family protein" /codon_start=1 /transl_table=11 /product="Hedgehog/intein hint domain protein" /protein_id="ZP_05431049.1" /db_xref="GI:256006122" /db_xref="InterPro:IPR003587" /db_xref="InterPro:IPR006141" /translation="MTTALSFSMDGFDMLAMGISLFEPSNALVEFNRKLHSNALYNGF QIAVNALAVFSAGAASTMNCFVAGTMILTATGLVAIENIKAGDKVIATNPETFEVAEK TVLETYVRDTTELLHLTINGEVIKTTFEHPFYVKDVGFVEAGKLQIGDRLVDSRGNVL VLEGKKLEITDKPVKVYNFKVDNFHTYHVGENRVLVHNANKYVKGTSSTTGKQAQIIG ATREQKVANITGGQVSGAKIKSSAGGTDIDVIGANGELIMVGGPAKANDLGKLGQVIK IYQDEAAIRGVGVKAYFAEGTPQNVIDFAIKKLGTDNVVIFK" misc_feature complement(1510..1914) /locus_tag="ClothDRAFT_2910" /note="Hedgehog/Intein domain, found in Hedgehog proteins as well as proteins which contain inteins and undergo protein splicing (e.g. DnaB, RIR1-2, GyrA and Pol). In protein splicing an intervening polypeptide sequence - the intein - is excised from a...; Region: Hint; cd00081" /db_xref="CDD:73181" misc_feature complement(order(1510..1515,1711..1713,1912..1914)) /locus_tag="ClothDRAFT_2910" /note="protein-splicing catalytic site; other site" /db_xref="CDD:73181" misc_feature complement(order(1711..1713,1720..1722,1912..1914)) /locus_tag="ClothDRAFT_2910" /note="thioester formation/cholesterol transfer; other site" /db_xref="CDD:73181" misc_feature complement(1507..1896) /locus_tag="ClothDRAFT_2910" /note="Protein of unknown function (DUF1557); Region: DUF1557; pfam07591" /db_xref="CDD:148935" gene complement(2317..2934) /locus_tag="ClothDRAFT_2911" CDS complement(2317..2934) /locus_tag="ClothDRAFT_2911" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431050.1" /db_xref="GI:256006123" /translation="MIDLIKLEITRTKFIKIYLPCEKKNIKPFDIISIKYLKDQIEYD LYVDDFATEAIQILKNLLKKALNFDLQIQRKYIDKGIGYYYNIYANELWTTDDENVIQ SLVDPSQNFSLWSTPTHIGIETFMYNIDDKIYIEISPIYKWNCDYPENESKYETFDNF LNNYKPIDIVSIDRSVAVRWLDFCCDMIKIFKENDKKYLKEDNTN" gene complement(3038..>3611) /locus_tag="ClothDRAFT_2912" CDS complement(3038..>3611) /locus_tag="ClothDRAFT_2912" /inference="similar to AA sequence:KEGG:NMB0655" /note="KEGG: nme:NMB0655 hypothetical protein" /codon_start=2 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431051.1" /db_xref="GI:256006124" /db_xref="InterPro:IPR006141" /translation="GFVEAGKLQVGDKLLDSKGNVLVVEEKKIKITDKPIKVYNFQVA DFHTYHVGNNEVLVHNVKYNSPDGKYTYKNGIYEDADYHGKVDDSIKSKKPQDGQFAL DNSVDIRDTSKRRVGIDINGDFVVLDHTGGEKFHGHVRPWSKGTPDLPPLTDRMKNAL KKAGYVKEVAKKPKLTSKIIDMINEISKSN" misc_feature complement(3431..>3611) /locus_tag="ClothDRAFT_2912" /note="Protein of unknown function (DUF1557); Region: DUF1557; pfam07591" /db_xref="CDD:148935" ORIGIN 1 cttttgtttc gtcaaacagc ttggaaagaa ggtcgtagag attctttatg tcctcttctg 61 tggcatctgc ggtgttgatt tcaattaaaa tttttgttcc atcacgcttg gcgatatggt 121 cgctcacata cttctccaaa gcgtatcttg ctatgcttga tgtggtaacg cttgcttccg 181 gcatttgcgc ttaaagttca tcgatgatag cgtccaattc atccgactgc ctttgtgtaa 241 gccttacccg taacatacta tccttttctg tagacattat tatacctcct gtatttctta 301 ttggtttaat tgtatcacaa tgtattataa tttgccaagc ttggataaag aagatagcca 361 caccagccga aacggtgtgg ccttaaaaga ttttctattc ttctgactta tagactttta 421 ttgttttatg attaccgtgc tcaaagacat aaattctttc tcatttagga caacgccaat 481 ttatttaaca tctcatgtac caataaaaac ttctctgcat cctttgaact tctagcagag 541 taagtataga gttattgtac tccgttcgcg atttggtata gcaacataaa cacaatctct 601 tttaaagtct atcaactgct ctgttttata ttctttgagc tcatacttct taaatatttt 661 taaaccgcat agttccaaat aatgactatc caaatactct ttgttactaa aaaatttgtt 721 ccattcgaat tctgaaacga gttcctctct atcaatgaca aacccaacta tttcgaatct 781 ttggagagtc ataatgatta ataagtcaag aataactttt gtttgacttt catctaatcc 841 gtctaaataa atatcacata cacataaata cccttgacaa gttagtttta ttgcaacatc 901 atccatctgg ggccaccaaa attgtattaa atagtcactt atatctgatg tgttttgaag 961 taattctttt ttctcaatat ttagcatttc accttctgta gtccatactt gcactttatt 1021 tgtattaggc aattcaagtc ttatcccctt agtgttaaaa agaacttcta tttgtttaaa 1081 catatcaata ttttgaagtg tagaaaatac gctagcaaca ccccttggca taagcaacct 1141 cctattctat ttaaatatta caacattatc tgtgcccagt ttttttatag caaaatcaat 1201 tacattttgt ggtgtacctt ctgcaaaata cgccttaaca ccaactcctc ttatggctgc 1261 ttcatcttga tatatcttaa taacttgacc caatttacca agatcatttg ctttcgctgg 1321 tccaccaacc attattaatt cgccattagc tccaattaca tctatatctg ttcctccagc 1381 acttgatttt atttttgctc cactaacttg tccacctgtt atatttgcaa ctttctgttc 1441 tctagtcgca cctataattt gagcttgttt tcctgtagta ctactcgttc ccttaacata 1501 cttattcgca ttatgaacca ataccctatt ttcgccaaca tgatacgtat gaaaattatc 1561 aaccttaaaa ttgtaaacct ttacaggctt atctgttatt tcaagctttt taccttccaa 1621 tactaaaaca ttacctcttg aatcaaccaa cctgtctcct atctgcagtt ttcccgcttc 1681 aacaaaaccc acatctttta cataaaacgg atgctcaaag gttgtcttga ttacctctcc 1741 attgattgtc aaatgcaaaa gctccgtcgt atctctcaca tatgtctcaa gcactgtctt 1801 ttccgctact tcaaaagtct ccggattcgt cgcaattacc ttgtcccctg ccttgatatt 1861 ctctatcgca accaagcctg tcgcagtcaa tatcattgta cctgcaacaa agcagttcat 1921 tgtcgatgcc gccccggcac tgaaaacagc cagcgcgttt acagcaatct ggaatccgtt 1981 ataaagtgca ttggaatgca gcttccggtt aaattcaacc aatgcattgg atggttcaaa 2041 caacgatatt cccattgcca gcatgtcaaa tccatccata ctaaaagaaa gtgctgtggt 2101 catataacat aaaacattcc actacctttg tacaacttgt aatgtgtttc ctgtctctga 2161 atataattga attaatatat aaatataata tatattaaac aaaaaggtca cattagttga 2221 aattacgtga cctgcaaatt ctccctatcc cttaagctta agttttttat gattcgttag 2281 tagctttgta caaataaaaa attgccatat aaaaagctaa tttgtgttat cttcttttaa 2341 gtacttttta tcgttttctt taaatatctt tatcatatca caacaaaagt ctagccatct 2401 cacagcaaca cttctgtcaa ttgaaacaat atcaattggt ttgtaattat ttagaaaatt 2461 gtcaaaagtt tcatatttac tttcattctc aggataatcg cagttccact tgtaaattgg 2521 acttatttca atatatattt tatcatcaat attatacata aaagtttcaa tacctatatg 2581 agttggagtt gaccaaaggc taaaattttg tgatggatca acaagacttt gaataacatt 2641 ttcgtcatca gttgtccaca attcatttgc ataaatatta tagtaatatc caattccctt 2701 atctatatat tttctctgta tttgtaagtc aaaatttaat gctttcttta gtaaattctt 2761 taatatttgt attgcctccg ttgcaaaatc atcaacatat aaatcatatt ctatttggtc 2821 tttcagatac tttatagata taatatcaaa tggctttata tttttctttt cacatggtaa 2881 gtatatttta ataaattttg ttcttgtaat ttctaattta attaaatcaa tcatttcttc 2941 aatcatcctt tactttttat ttgcacgaat ttcgtaaatt tcataaacta ctgctgaatt 3001 actctattat tgttgtaatt cggaaaacgt tttgttttta atttgatttt gatatttcat 3061 ttatcatatc aattatttta cttgtcaact taggtttttt agctacctcc ttaacatatc 3121 ctgccttttt gagagcattt ttcatcctgt cagtcaaagg cggaagatct ggagtacctt 3181 tactccaagg tctaacatgt ccatgaaact tttcaccacc tgtatgatct aacacaacaa 3241 aatctccatt tatgtcaatt ccaactcttc tttttgatgt atctcttata tcaacagagt 3301 tgtctaaagc aaactgaccg tcttgcggtt ttttactttt tatactatca tcaacttttc 3361 cgtgataatc agcatcttca tatattccat ttttatatgt gtatttacca tctggtgaat 3421 tatactttac gttatgaacc agcacttcat tattgccaac atgataagta tgaaaatcag 3481 ctacttgaaa gttgtaaact ttaatcggtt tatcagttat ttttattttt ttctcttcca 3541 ccaccaaaac attgcctttt gaatctagca gcttatctcc tacttgcagt tttcccgctt 3601 caacaaaacc c //