LOCUS NZ_ACVX01000065 3902 bp DNA linear CON 10-NOV-2010 DEFINITION Clostridium thermocellum DSM 2360 ctg00069, whole genome shotgun sequence. ACCESSION NZ_ACVX01000065 NZ_ACVX00000000 VERSION NZ_ACVX01000065.1 GI:256006112 KEYWORDS WGS. SOURCE Clostridium thermocellum DSM 2360 ORGANISM Clostridium thermocellum DSM 2360 Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae; Clostridium. COMMENT PREDICTED REFSEQ: This record has not been reviewed and the function is unknown. The reference sequence was derived from ACVX01000065. FEATURES Location/Qualifiers source 1..3902 /organism="Clostridium thermocellum DSM 2360" /mol_type="genomic DNA" /strain="DSM 2360" /isolation_source="contaminant of Clostridium thermocellum strain LQ8" /db_xref="taxon:572545" gene <1..144 /locus_tag="ClothDRAFT_2902" CDS <1..144 /locus_tag="ClothDRAFT_2902" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431041.1" /db_xref="GI:256006113" /translation="KADIDILRILNKYYYLVVEFKFVSEDMILLDVSAFTNVADAVKR EGE" gene 147..497 /locus_tag="ClothDRAFT_2903" CDS 147..497 /locus_tag="ClothDRAFT_2903" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431042.1" /db_xref="GI:256006114" /translation="MSKDIRTVRPPVQLLPKAIIAVRPASTAKADLEVMAAQVAQLTT VCCQENIQVDSIIITFGGIKDITKRVKQLTEQKDISYLIIYSGKQIAENESEYVNFKR DMQDWYNLKVVCYR" gene 765..1316 /locus_tag="ClothDRAFT_2904" CDS 765..1316 /locus_tag="ClothDRAFT_2904" /inference="ab initio prediction:Prodigal:1.4" /note="KEGG: ses:SARI_00048 hypothetical protein" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431043.1" /db_xref="GI:256006115" /translation="MVYAYFIENTGGEFKDNSCLFRYIKEQNISADNIYIDTADNKDE LDALLEKIEPGDTIVLRTITDLAEKRRELLHLLKELQDFGILIHSIMEPFFNGLEYFD RFQGSIEISKYYAEKKRRLAFEEARKQGVVGRPKIPEKQIETALKLYKSRLFTTEEIT KLSGVSSSTLYRALKEQGCLIRK" misc_feature 822..1157 /locus_tag="ClothDRAFT_2904" /note="Serine Recombinase family, catalytic domain; a DNA binding domain may be present either N- or C-terminal to the catalytic domain. These enzymes perform site-specific recombination of DNA molecules by a concerted, four-strand cleavage and rejoining...; Region: Ser_Recombinase; cl02788" /db_xref="CDD:155104" misc_feature 1161..1286 /locus_tag="ClothDRAFT_2904" /note="Helix-turn-helix domain of Hin and related proteins, a family of DNA-binding domains unique to bacteria and represented by the Hin protein of Salmonella. The basic HTH domain is a simple fold comprised of three core helices that form a right-handed...; Region: HTH_Hin_like; cl01116" /db_xref="CDD:186341" misc_feature order(1164..1169,1266..1271,1275..1283) /locus_tag="ClothDRAFT_2904" /note="DNA-binding interface; DNA binding site" /db_xref="CDD:119388" gene 1737..2996 /locus_tag="ClothDRAFT_2905" CDS 1737..2996 /locus_tag="ClothDRAFT_2905" /inference="protein motif:PFAM:PF02371" /note="PFAM: transposase IS116/IS110/IS902 family protein; transposase IS111A/IS1328/IS1533; KEGG: rhi:NGR_b13960 putative transposase for insertion sequence NGRIS-14b" /codon_start=1 /transl_table=11 /product="transposase IS116/IS110/IS902 family protein" /protein_id="ZP_05431044.1" /db_xref="GI:256006116" /db_xref="InterPro:IPR002525" /db_xref="InterPro:IPR003346" /translation="MRSGDKEKERIHIYNKRNICFVGVDMHKEKHCAVVIDCWMEKIG EVNFENRPSKFPAFVEDIRKICGTRDFVFGLEDTRGFGRNLASYLTGRKFEVKHVNPA YTSAVRLSNPIVYKDDSYDAYCVARVLRDMVDTLQDAKHEDVYWAIRQLVKRRDMIVK NNVMNKNQLHSQLSYSYPSYKKLFAQVDGKSALCFWENYPSPEHIWSTTSEKIYETIK PVHQALKIERIHAIIDMIKKDGNTQKGYQEERDSIVRNIVKDIKNNQELIKDIEEQLR KLLPQTGYKLQTMPGIDLITESKIVSEIGDINRFPDSDKLARFMGLAPVHFSSAGKGK DERCRNGNRELNAIFHFLAIQMVAISPSGKPRHPVFREYFEQKVKEGKNKPQALVCVA RRLVRIIYGMMKTKTEYRPYEKTDDKN" misc_feature 2001..2291 /locus_tag="ClothDRAFT_2905" /note="Transposase; Region: Transposase_9; pfam01548" /db_xref="CDD:144952" misc_feature 2592..2861 /locus_tag="ClothDRAFT_2905" /note="Transposase IS116/IS110/IS902 family; Region: Transposase_20; pfam02371" /db_xref="CDD:145490" gene 3125..3421 /locus_tag="ClothDRAFT_2906" CDS 3125..3421 /locus_tag="ClothDRAFT_2906" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431045.1" /db_xref="GI:256006117" /translation="MFESKIITKNGIEIGGLADVEINGKTLTLKDVAVYSNKGDIPNA VGARDIFKWQNEIAQQAKAQGFDTLIIKGVRAMNSTSANPGKVVEYIIDLTKLK" gene 3432..3746 /locus_tag="ClothDRAFT_2907" CDS 3432..3746 /locus_tag="ClothDRAFT_2907" /inference="ab initio prediction:Prodigal:1.4" /codon_start=1 /transl_table=11 /product="hypothetical protein" /protein_id="ZP_05431046.1" /db_xref="GI:256006118" /translation="MNEFSKTFSKEELEEIEVFKEGTEAMSVEGKEIICFQLLYQLIN GNIKISEVSKDKLLFTYAQLKGFKEISGSIGIFDTSLLESIVSKAKKIISEEIEKRKQ KR" ORIGIN 1 aaggcagata tagatattct taggatactt aataaatatt actatttggt agtggagttt 61 aaatttgtat cagaggatat gattctattg gatgtgagcg catttactaa tgtagcagat 121 gcagttaaaa gagaggggga gtaataatga gtaaagatat aagaacagta agaccacctg 181 tgcagttgtt acctaaagct ataatagcag taagaccagc aagtacagca aaagcagacc 241 ttgaagtaat ggcagcacag gtagcgcaat taacaacagt atgttgtcag gagaatatcc 301 aagtagacag tatcattata acttttgggg gtataaaaga tattacaaaa agagtaaaac 361 agctcacaga gcaaaaggat ataagctatc ttatcatata cagtggtaag cagattgcag 421 aaaatgaaag tgaatacgta aattttaaga gagatatgca ggactggtat aatttaaagg 481 ttgtttgtta caggtgatag ttgaggtttt ggtaaagtaa atatctcaaa tggtttaatg 541 aatatataaa tatgtgtttc gggtataaaa caagctcatt cccaaaatac atcaagattt 601 atctattact caaaacggtt gatatagaga tattttatga agaaaaaaga ataaggagta 661 attttgggaa tgagtagata agaattataa gaaattgatt taatctcaag gggtatagac 721 attctcaaat tgtaagaggt tttgagaaag gggggagagg aataatggta tacgcatatt 781 ttattgaaaa tacaggcggt gagttcaaag ataacagttg cttgtttaga tatataaaag 841 aacagaatat atcagcagat aacatataca ttgatacagc agataataaa gatgaattag 901 atgcgctttt agaaaagatt gagccaggag atacaatagt attaagaaca ataacagatt 961 tagcagaaaa gagaagagag ctattacatc tactaaagga actacaagac tttggtatct 1021 tgatacatag tataatggag ccatttttta atggtttaga gtatttcgac agatttcaag 1081 gttcaataga aatcagtaaa tattatgctg agaaaaaaag aagattagcc tttgaagaag 1141 caagaaagca aggggtagta ggaagaccaa agataccaga gaagcagatt gaaacagcat 1201 taaagctata caagagtaga ctatttacca cagaggaaat tacaaagtta tctggggtaa 1261 gcagtagtac cctttacaga gcattaaagg agcaggggtg cttaattcgc aaataggaat 1321 ggtattaata gatatagatt aacaggaaga gatcgggcgt gcagtgcccg atctcttcct 1381 gcataatgtt aaaaaatttt tttagtatta acttcaaatt tacagaagtc agaaaagcct 1441 tgaacgacaa gggaaaaagg gcagttgaaa attaagggta ggacataaat cggtataacc 1501 ctaacagtta gggttttcat gtgaacaaaa ataaagacag gttatggtat ataagcgagt 1561 gaaaattttc aagaagactg gactttagtg aatggtgacg gtaacatcat caaaaaagtg 1621 tagtcaataa aggctcgtgg tgccataatc acgtaatttg tcacattagg aacagatagg 1681 ctgtcgttcc cttgcgggct gtaaaaagct aacgctctta aattgaggtt gccgatgtgc 1741 gtagtggaga caaggaaaag gagaggatac atatttataa taaaagaaat atatgctttg 1801 taggggtaga tatgcacaag gaaaagcatt gtgcagttgt aattgattgc tggatggaaa 1861 aaatcggaga ggtcaacttt gaaaacagac catccaagtt tccagcattt gttgaggata 1921 tcaggaaaat atgtggtaca agagactttg tatttggact tgaggatacc agaggttttg 1981 ggcgtaatct ggcttcatac cttacaggaa ggaagtttga agtcaaacat gtgaatccag 2041 cctataccag tgcagtaagg ctttcaaatc ctattgtata caaggatgat tcctatgatg 2101 cctattgtgt tgcaagggta ttaagggata tggtggatac attacaggat gcaaaacatg 2161 aggatgtata ctgggcaatt cggcagttgg taaaaagacg ggatatgata gtaaaaaaca 2221 atgttatgaa caaaaaccaa ttacacagtc agttgtctta tagttatcca tcctataaga 2281 aattatttgc acaggttgat ggcaaaagtg cactatgctt ctgggaaaac tatccttcac 2341 cagagcatat ttggagtact acatcagaaa agatttatga aacaataaaa ccagtacatc 2401 aggcattaaa gatagagcgt attcatgcaa ttatcgatat gattaaaaag gacggaaata 2461 cacagaaggg gtatcaggaa gaaagagatt caattgtaag gaatattgta aaggatatta 2521 agaacaatca ggaactaata aaagacatag aagagcagtt aagaaaatta ttgccacaga 2581 cggggtataa gttgcaaacc atgccaggta tagaccttat tacagaatca aagattgtat 2641 ctgaaattgg tgatattaac agattcccag attcagataa gctggctcga tttatggggt 2701 tggcaccagt acatttcagt tcagcaggta aaggcaagga tgaacggtgc agaaatggaa 2761 acagagagtt gaatgcaata tttcattttt tggctataca aatggtagcc atatcaccat 2821 caggaaagcc aagacatcca gtattcagag agtattttga acagaaggtt aaagagggca 2881 agaacaagcc acaggcgctt gtatgcgtgg caaggcggct tgtgaggata atctacggta 2941 tgatgaaaac caagactgaa tacaggccat atgagaagac tgacgacaag aactgatttc 3001 atattctgga agcaaagcaa tggaagaaaa ttcttttttc attgagatat ggtagcagga 3061 attatataat agttatagtc cttgtagtga gggaacgagt aagactgtat ttgaaaatgg 3121 ggaaatgttt gaaagtaaaa ttattacgaa aaatggcatc gaaataggtg gacttgctga 3181 tgtagaaatc aatggaaaaa ctctaacact taaagatgtt gcagtatact caaataaagg 3241 agatattccc aatgctgttg gggcaagaga tatctttaaa tggcaaaacg agatagctca 3301 acaggcaaag gctcagggtt ttgatacact tattattaaa ggtgttagag ctatgaattc 3361 aacttctgca aatccaggaa aagttgttga atatataatt gacttaacta aacttaaatg 3421 aggtgaatat attgaatgaa tttagtaaaa ctttttcaaa ggaagaactt gaagaaattg 3481 aggtttttaa ggaaggaaca gaagctatga gtgttgaagg aaaagaaatt atttgctttc 3541 aattattgta ccaactgatt aatggaaata ttaaaatttc agaagtttca aaagataagc 3601 tgttatttac atatgctcaa ttaaaaggat ttaaggagat tagtggttct atcggaattt 3661 ttgatacaag tttattggag agtattgtaa gtaaggcaaa aaagataatt tctgaagaga 3721 tagaaaaaag aaagcaaaaa agataaaata ctgaggtcac acagttccaa ctgctgtgac 3781 cttgttttcc gtacgcagag attaacgtat caaaacaaag gagactgttt aaccttttat 3841 taatacataa ggagcaggac gaaggaatgg cacattcgat gccggaggac atgggaggtt 3901 tg //