LOCUS NZ_ACVX01000072 3331 bp DNA linear CON 10-NOV-2010 DEFINITION Clostridium thermocellum DSM 2360 ctg00126, whole genome shotgun sequence. ACCESSION NZ_ACVX01000072 NZ_ACVX00000000 VERSION NZ_ACVX01000072.1 GI:256006149 KEYWORDS WGS. SOURCE Clostridium thermocellum DSM 2360 ORGANISM Clostridium thermocellum DSM 2360 Bacteria; Firmicutes; Clostridia; Clostridiales; Clostridiaceae; Clostridium. COMMENT PREDICTED REFSEQ: This record has not been reviewed and the function is unknown. The reference sequence was derived from ACVX01000072. FEATURES Location/Qualifiers source 1..3331 /organism="Clostridium thermocellum DSM 2360" /mol_type="genomic DNA" /strain="DSM 2360" /isolation_source="contaminant of Clostridium thermocellum strain LQ8" /db_xref="taxon:572545" gene <1..2354 /locus_tag="ClothDRAFT_2932" CDS <1..2354 /locus_tag="ClothDRAFT_2932" /inference="protein motif:TFAM:TIGR01643" /note="TIGRFAM: YD repeat protein; PFAM: YD repeat-containing protein; KEGG: ppd:Ppro_0084 YD repeat-containing protein" /codon_start=3 /transl_table=11 /product="YD repeat protein" /protein_id="ZP_05431071.1" /db_xref="GI:256006150" /db_xref="InterPro:IPR006530" /translation="WGKVINITEPDGTNIKYDYDYAGNLVSTTDGNGNTTRYTYNSLN LLSEIIDPDGRKITFKYDRQGRMVQRIGKDGRSTYYNYNADNNITGRWEEEGQMEKYE YNVDGSLAASISGTTIHTYAYTLAGRLKSKTTNGQKVLEYDYNKNGLISRLPDISGTP VEYTYDVLGRLTTVTNGGKVSARYEYNIDNTIAQVLYGSGVCARYEYNLDKMITRLLN IDPTGKEMFAYRYAYDGNGNQILKEENDKVTAYSYDALNRLKEVAYPGSIKERFIYDA NGNRLKREYGDIFEQYEYDSCNRLIQRIKNGLLTEYEYDARGNLIKEKEGELTKLYSY DGFDRLIRVQNPDGTYMENIYDAENLRTVSIENGRYNRYVYNGRNIACEVDEDWSLKD RIVFGHTILQREDSDKNEYYYIHNAHGDITALTDGKGEVINSYSYDAFGNILDSVEKI ENRFKYSGEMLDPVTGQYYLRARYYNPSIGRFMQEDTFRGDGLNLYTYVANNPIKYID PTGHCKENAAIAYQVENILRRLRRNPIISLSKVSILLDYLIEGLSYNPVDHTATSGPT VMEAALIAKHVYSGEKGDELPGGWKMLEDPYMVGGLRMGVYGRKGEDGEMEYVIANAG TEPTSLIDWENNLKQPFGKSEDMKNSLAFVEEFMKNNPSINVTFVGHSKGGAEAAANA VLTNRNAILFNPATVNLESYLKPYGVNKSNYTAEMTAFIVEDEILNNIFGFISTPIDK VVYLPRQHSFFISIPLIDMVNSIRNHSMDATIKAIEEWEENRQ" misc_feature <27..1535 /locus_tag="ClothDRAFT_2932" /note="Rhs family protein [Cell envelope biogenesis, outer membrane]; Region: RhsA; COG3209" /db_xref="CDD:33022" misc_feature 57..170 /locus_tag="ClothDRAFT_2932" /note="RHS Repeat; Region: RHS_repeat; cl11982" /db_xref="CDD:159659" misc_feature 120..230 /locus_tag="ClothDRAFT_2932" /note="RHS Repeat; Region: RHS_repeat; cl11982" /db_xref="CDD:159659" misc_feature 1311..1538 /locus_tag="ClothDRAFT_2932" /note="RHS repeat-associated core domain; Region: Rhs_assc_core; TIGR03696" /db_xref="CDD:163408" gene 2351..3280 /locus_tag="ClothDRAFT_2933" CDS 2351..3280 /locus_tag="ClothDRAFT_2933" /inference="protein motif:PFAM:PF00023" /note="PFAM: Ankyrin; SMART: Ankyrin; KEGG: ankyrin repeat protein" /codon_start=1 /transl_table=11 /product="Ankyrin" /protein_id="ZP_05431072.1" /db_xref="GI:256006151" /db_xref="InterPro:IPR002110" /translation="MSRKKIMIVMLIVVMTFPILLSSCQFDILGKEEEYRITNVKIFK DTPVWELALAVKNEKTRTIEKLAKENPELLNYQEPKYGATLLLWAVGMEKYKSAEALL KCGADPNIASTVDGMTPLYLAAGFSWIDNYAKKDPKFVKLLLKYNADPNITYGGNAII EPGTSPLMNSIRCGIEKTKALVEAGAYINYKTKSGTTAAIKALLAGQNATLEALEYAH YLIVEKKAKVTDPYYPWLVYEENNIQELYPVDILRRWVYPLDSEEYRIKMEIVEEFAR QGVNYWDTEIDKYTLEQIKKLYPDTWEEYIKRY" sig_peptide 2351..2422 /locus_tag="ClothDRAFT_2933" /note="Signal predicted by SignalP 3.0 HMM (Signal peptide probabilty 0.952) with cleavage site probability 0.743 at residue 24" misc_feature 2588..2992 /locus_tag="ClothDRAFT_2933" /note="ankyrin repeats; ankyrin repeats mediate protein-protein interactions in very diverse families of proteins. The number of ANK repeats in a protein can range from 2 to over 20 (ankyrins, for example). ANK repeats may occur in combinations with other...; Region: ANK; cd00204" /db_xref="CDD:29261" ORIGIN 1 tgtggggtaa ggtaataaac ataacggaac ccgacggaac caatataaaa tacgattatg 61 actatgcggg aaatcttgta tccaccactg acggtaacgg aaacaccacc cgttatacat 121 acaacagctt gaaccttctg tcggagataa tagatcctga cggaaggaaa ataaccttca 181 agtatgacag acagggaaga atggtgcaga ggatagggaa agacggacgc agcacatatt 241 ataattacaa tgcggataac aatataaccg ggcgttggga agaagaaggg cagatggaaa 301 aatacgagta taatgtagac ggaagcctgg ctgcgtcaat aagcggtact actatacata 361 cttatgccta taccttggca ggaaggctga aaagtaagac aaccaacgga cagaaggtat 421 tggagtatga ttacaataaa aatgggctta tatcaaggct ccccgatata agtggaacac 481 cggtggagta tacatatgac gtattgggga gattaacaac ggtaacaaac ggaggcaaag 541 tttctgcgag gtatgaatat aatattgaca atacaatagc acaggtattg tacggaagcg 601 gagtatgtgc gaggtatgaa tacaacttgg ataagatgat aacaaggctt ttaaatatag 661 atccgacagg aaaagaaatg tttgcataca ggtatgccta tgacggaaac ggcaaccaga 721 ttttgaaaga agagaacgat aaagtaacgg cctacagtta tgatgcgctg aaccgtttga 781 aggaagtggc ataccctgga agtataaaag agagatttat atatgatgcg aacggtaaca 841 ggcttaagag agaatatgga gacatatttg agcaatatga atatgatagt tgtaatagat 901 tgattcaaag aataaaaaac ggactgttaa cggaatatga gtatgatgcg aggggaaatt 961 tgataaaaga aaaagagggt gagttgacta aattatacag ctatgacgga tttgacagac 1021 tgatacgtgt acaaaatccg gacggaacat atatggaaaa tatatacgat gccgagaatt 1081 tgagaacggt ctcgatagaa aacggtaggt acaacaggta tgtgtacaac ggaagaaata 1141 tagcgtgtga agtagacgag gattggagtc taaaagacag aatagtcttt gggcatacga 1201 tattacaaag agaagacagt gacaagaatg agtattatta tattcacaat gcccatgggg 1261 atattacagc tcttaccgat gggaaaggag aagtaataaa cagctacagt tacgatgctt 1321 ttggaaatat attggacagt gttgagaaga tagagaacag attcaaatat tcgggagaaa 1381 tgcttgatcc tgttacggga caatattacc tgagagcgag atattataac ccaagcatag 1441 gaaggtttat gcaggaagat accttcagag gagacggact caatttatat acttatgttg 1501 ccaacaaccc gataaagtac attgacccaa ccggtcactg caaagagaat gcagctattg 1561 cttaccaagt tgagaatatt ttgcgcagat tgcggagaaa ccccattatt tctctgtcga 1621 aagtgagtat tcttttggat tatttaatag agggtttaag ttataatcct gtagaccaca 1681 cagctacatc tggaccaact gtaatggaag ctgcactgat tgctaaacat gtttattcag 1741 gggaaaaagg agatgaatta cccggtggat ggaaaatgct tgaagatcca tatatggttg 1801 gaggtcttcg aatgggcgta tatgggagaa aaggtgagga tggagagatg gaatatgtaa 1861 ttgcaaatgc aggaacagaa cctactagtt tgatagattg ggagaataat ttgaaacaac 1921 cttttgggaa atcagaagat atgaaaaatt ctttagcttt tgttgaagag tttatgaaaa 1981 acaatccaag tattaatgta acatttgttg gacattcaaa aggtggggct gaagcagctg 2041 caaatgcggt acttacaaat aggaatgcaa tactatttaa tcctgccaca gtgaacttag 2101 aatcatattt aaagccatat ggtgtgaaca agtcaaatta tactgctgag atgacggcat 2161 ttattgtaga agacgaaatt ttgaataata tctttggatt tatatcaacg ccgatagaca 2221 aggtagttta tttacccaga cagcattctt ttttcatatc gattccactt atagatatgg 2281 taaattcgat tcgaaatcat tcgatggatg caacgataaa ggcaatagaa gaatgggagg 2341 aaaatagaca atgagtagga aaaagataat gattgttatg ctgattgttg taatgacttt 2401 tccgatttta ttatcttcat gtcaatttga tatattaggg aaagaggagg aatataggat 2461 tacaaacgta aaaattttta aggacacacc ggtatgggaa ctggcattgg ctgttaagaa 2521 tgagaaaacc cgtacaatag agaaattggc aaaagagaat ccggagttgc tgaattatca 2581 ggaaccgaaa tatggagcga ctttactgtt gtgggcagtt gggatggaaa agtataaatc 2641 tgcagaagca ctattaaaat gtggagctga ccccaatatt gcctcaacag ttgacggaat 2701 gactccgctt tatttggcag caggattttc ttggatagac aattacgcga aaaaagaccc 2761 taagtttgta aagctcctac tgaaatataa tgcagaccca aacataactt atggtggaaa 2821 tgccattatt gagccaggaa ctagtccgct tatgaactca atacgatgtg gtattgaaaa 2881 aacgaaagca ttagtagaag caggagctta tatcaactat aaaactaaaa gtgggactac 2941 agctgcaatt aaagcattgc tagccggtca aaatgcgaca ttggaagcat tggaatatgc 3001 acattatttg atagtagaga agaaagctaa ggtaacagat ccctattatc catggttggt 3061 ttatgaagaa aacaatatcc aagaattata tccggtggat atattaaggc gttgggttta 3121 tccattggat tcggaagaat accgaataaa aatggagatt gtagaggaat ttgcccgaca 3181 aggtgtaaat tattgggata cagaaattga taaatatact cttgaacaga taaaaaagct 3241 ttatcctgat acttgggagg aatatataaa aaggtattaa aataaatatg tattacttat 3301 aatatataat aactttttta tgcaaaagct t //