assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	1	629602-629699	1	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Orphan	TGATTAACTTCAACATGAGATGTATTTAAATA	32	0	0	NA	NA	II-B	1	1	Orphan	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|104aa|up_5|NC_020291.1_622688_623000_-,NA|108aa|down_1|NC_020291.1_631909_632233_+,NA|104aa|down_2|NC_020291.1_632331_632643_+,NA|78aa|down_8|NC_020291.1_641802_642036_+,NA|85aa|down_9|NC_020291.1_642048_642303_+	NA|273aa|up_9|NC_020291.1_618676_619495_+	PRK06182, PRK06182, short chain dehydrogenase; Validated	NA|161aa|up_8|NC_020291.1_619911_620394_+	PRK07116, PRK07116, flavodoxin; Provisional	NA|212aa|up_7|NC_020291.1_620808_621444_+	COG0300, DltE, Short-chain dehydrogenases of various substrate specificities [General function prediction only]	NA|330aa|up_6|NC_020291.1_621513_622503_+	COG2207, AraC, AraC-type DNA-binding domain-containing proteins [Transcription]	NA|104aa|up_5|NC_020291.1_622688_623000_-	NA	NA|136aa|up_4|NC_020291.1_623462_623870_+	pfam18765, Polbeta, Polymerase beta, Nucleotidyltransferase	NA|143aa|up_3|NC_020291.1_623866_624295_+	COG2445, COG2445, Uncharacterized conserved protein [Function unknown]	NA|553aa|up_2|NC_020291.1_624534_626193_+	cd00839, MPP_PAPs, purple acid phosphatases of the metallophosphatase superfamily, metallophosphatase domain	NA|422aa|up_1|NC_020291.1_626306_627572_+	pfam07907, YibE_F, YibE/F-like protein	NA|528aa|up_0|NC_020291.1_627797_629381_+	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|431aa|down_0|NC_020291.1_630538_631831_+	COG0124, HisS, Histidyl-tRNA synthetase [Translation, ribosomal structure and biogenesis]	NA|108aa|down_1|NC_020291.1_631909_632233_+	NA	NA|104aa|down_2|NC_020291.1_632331_632643_+	NA	NA|280aa|down_3|NC_020291.1_632792_633632_-	cd13530, PBP2_peptides_like, Peptide-binding protein and related homologs; type 2 periplasmic binding protein fold	NA|111aa|down_4|NC_020291.1_634422_634755_-	pfam03992, ABM, Antibiotic biosynthesis monooxygenase	NA|574aa|down_5|NC_020291.1_635271_636993_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|149aa|down_6|NC_020291.1_637393_637840_+	COG0537, Hit, Diadenosine tetraphosphate (Ap4A) hydrolase and other HIT family hydrolases [Nucleotide transport and metabolism / Carbohydrate transport and metabolism / General function prediction only]	NA|722aa|down_7|NC_020291.1_639394_641560_+	COG1511, COG1511, Predicted membrane protein [Function unknown]	NA|78aa|down_8|NC_020291.1_641802_642036_+	NA	NA|85aa|down_9|NC_020291.1_642048_642303_+	NA
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	2	629945-630175	2,1	CRISPRCasFinder,CRT	no		cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Orphan	TGATTAACTTCAACATGAGATGTATTTAAATA,AACATGAGATGTATTTAAATA	32,21	0	0	NA	NA	II-B:NA	3,3	3	Orphan	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|104aa|up_5|NC_020291.1_622688_623000_-,NA|108aa|down_1|NC_020291.1_631909_632233_+,NA|104aa|down_2|NC_020291.1_632331_632643_+,NA|78aa|down_8|NC_020291.1_641802_642036_+,NA|85aa|down_9|NC_020291.1_642048_642303_+	NA|273aa|up_9|NC_020291.1_618676_619495_+	PRK06182, PRK06182, short chain dehydrogenase; Validated	NA|161aa|up_8|NC_020291.1_619911_620394_+	PRK07116, PRK07116, flavodoxin; Provisional	NA|212aa|up_7|NC_020291.1_620808_621444_+	COG0300, DltE, Short-chain dehydrogenases of various substrate specificities [General function prediction only]	NA|330aa|up_6|NC_020291.1_621513_622503_+	COG2207, AraC, AraC-type DNA-binding domain-containing proteins [Transcription]	NA|104aa|up_5|NC_020291.1_622688_623000_-	NA	NA|136aa|up_4|NC_020291.1_623462_623870_+	pfam18765, Polbeta, Polymerase beta, Nucleotidyltransferase	NA|143aa|up_3|NC_020291.1_623866_624295_+	COG2445, COG2445, Uncharacterized conserved protein [Function unknown]	NA|553aa|up_2|NC_020291.1_624534_626193_+	cd00839, MPP_PAPs, purple acid phosphatases of the metallophosphatase superfamily, metallophosphatase domain	NA|422aa|up_1|NC_020291.1_626306_627572_+	pfam07907, YibE_F, YibE/F-like protein	NA|528aa|up_0|NC_020291.1_627797_629381_+	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|431aa|down_0|NC_020291.1_630538_631831_+	COG0124, HisS, Histidyl-tRNA synthetase [Translation, ribosomal structure and biogenesis]	NA|108aa|down_1|NC_020291.1_631909_632233_+	NA	NA|104aa|down_2|NC_020291.1_632331_632643_+	NA	NA|280aa|down_3|NC_020291.1_632792_633632_-	cd13530, PBP2_peptides_like, Peptide-binding protein and related homologs; type 2 periplasmic binding protein fold	NA|111aa|down_4|NC_020291.1_634422_634755_-	pfam03992, ABM, Antibiotic biosynthesis monooxygenase	NA|574aa|down_5|NC_020291.1_635271_636993_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|149aa|down_6|NC_020291.1_637393_637840_+	COG0537, Hit, Diadenosine tetraphosphate (Ap4A) hydrolase and other HIT family hydrolases [Nucleotide transport and metabolism / Carbohydrate transport and metabolism / General function prediction only]	NA|722aa|down_7|NC_020291.1_639394_641560_+	COG1511, COG1511, Predicted membrane protein [Function unknown]	NA|78aa|down_8|NC_020291.1_641802_642036_+	NA	NA|85aa|down_9|NC_020291.1_642048_642303_+	NA
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	3	634173-634260	3	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Orphan	GATTAACTTCAACATGAGATGTAT	24	0	0	NA	NA	II-B	1	1	Orphan	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|104aa|up_9|NC_020291.1_622688_623000_-,NA|108aa|up_2|NC_020291.1_631909_632233_+,NA|104aa|up_1|NC_020291.1_632331_632643_+,NA|78aa|down_4|NC_020291.1_641802_642036_+,NA|85aa|down_5|NC_020291.1_642048_642303_+	NA|104aa|up_9|NC_020291.1_622688_623000_-	NA	NA|136aa|up_8|NC_020291.1_623462_623870_+	pfam18765, Polbeta, Polymerase beta, Nucleotidyltransferase	NA|143aa|up_7|NC_020291.1_623866_624295_+	COG2445, COG2445, Uncharacterized conserved protein [Function unknown]	NA|553aa|up_6|NC_020291.1_624534_626193_+	cd00839, MPP_PAPs, purple acid phosphatases of the metallophosphatase superfamily, metallophosphatase domain	NA|422aa|up_5|NC_020291.1_626306_627572_+	pfam07907, YibE_F, YibE/F-like protein	NA|528aa|up_4|NC_020291.1_627797_629381_+	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|431aa|up_3|NC_020291.1_630538_631831_+	COG0124, HisS, Histidyl-tRNA synthetase [Translation, ribosomal structure and biogenesis]	NA|108aa|up_2|NC_020291.1_631909_632233_+	NA	NA|104aa|up_1|NC_020291.1_632331_632643_+	NA	NA|280aa|up_0|NC_020291.1_632792_633632_-	cd13530, PBP2_peptides_like, Peptide-binding protein and related homologs; type 2 periplasmic binding protein fold	NA|111aa|down_0|NC_020291.1_634422_634755_-	pfam03992, ABM, Antibiotic biosynthesis monooxygenase	NA|574aa|down_1|NC_020291.1_635271_636993_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|149aa|down_2|NC_020291.1_637393_637840_+	COG0537, Hit, Diadenosine tetraphosphate (Ap4A) hydrolase and other HIT family hydrolases [Nucleotide transport and metabolism / Carbohydrate transport and metabolism / General function prediction only]	NA|722aa|down_3|NC_020291.1_639394_641560_+	COG1511, COG1511, Predicted membrane protein [Function unknown]	NA|78aa|down_4|NC_020291.1_641802_642036_+	NA	NA|85aa|down_5|NC_020291.1_642048_642303_+	NA	NA|415aa|down_6|NC_020291.1_642938_644183_+	cd10923, CE4_COG5298, Putative NodB-like catalytic domain of uncharacterized proteins found in bacteria	NA|207aa|down_7|NC_020291.1_644466_645087_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|397aa|down_8|NC_020291.1_645138_646329_-	pfam06500, DUF1100, Alpha/beta hydrolase of unknown function (DUF1100)	NA|265aa|down_9|NC_020291.1_646473_647268_-	COG0300, DltE, Short-chain dehydrogenases of various substrate specificities [General function prediction only]
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	4	638183-638343	4	CRISPRCasFinder	no	RT	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Unclear	GATTAACTTTAACATGAGATGTATTTAAAT	30	0	0	NA	NA	II-B	2	2	Orphan	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|108aa|up_5|NC_020291.1_631909_632233_+,NA|104aa|up_4|NC_020291.1_632331_632643_+,NA|78aa|down_1|NC_020291.1_641802_642036_+,NA|85aa|down_2|NC_020291.1_642048_642303_+	NA|553aa|up_9|NC_020291.1_624534_626193_+	cd00839, MPP_PAPs, purple acid phosphatases of the metallophosphatase superfamily, metallophosphatase domain	NA|422aa|up_8|NC_020291.1_626306_627572_+	pfam07907, YibE_F, YibE/F-like protein	NA|528aa|up_7|NC_020291.1_627797_629381_+	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|431aa|up_6|NC_020291.1_630538_631831_+	COG0124, HisS, Histidyl-tRNA synthetase [Translation, ribosomal structure and biogenesis]	NA|108aa|up_5|NC_020291.1_631909_632233_+	NA	NA|104aa|up_4|NC_020291.1_632331_632643_+	NA	NA|280aa|up_3|NC_020291.1_632792_633632_-	cd13530, PBP2_peptides_like, Peptide-binding protein and related homologs; type 2 periplasmic binding protein fold	NA|111aa|up_2|NC_020291.1_634422_634755_-	pfam03992, ABM, Antibiotic biosynthesis monooxygenase	NA|574aa|up_1|NC_020291.1_635271_636993_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|149aa|up_0|NC_020291.1_637393_637840_+	COG0537, Hit, Diadenosine tetraphosphate (Ap4A) hydrolase and other HIT family hydrolases [Nucleotide transport and metabolism / Carbohydrate transport and metabolism / General function prediction only]	NA|722aa|down_0|NC_020291.1_639394_641560_+	COG1511, COG1511, Predicted membrane protein [Function unknown]	NA|78aa|down_1|NC_020291.1_641802_642036_+	NA	NA|85aa|down_2|NC_020291.1_642048_642303_+	NA	NA|415aa|down_3|NC_020291.1_642938_644183_+	cd10923, CE4_COG5298, Putative NodB-like catalytic domain of uncharacterized proteins found in bacteria	NA|207aa|down_4|NC_020291.1_644466_645087_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|397aa|down_5|NC_020291.1_645138_646329_-	pfam06500, DUF1100, Alpha/beta hydrolase of unknown function (DUF1100)	NA|265aa|down_6|NC_020291.1_646473_647268_-	COG0300, DltE, Short-chain dehydrogenases of various substrate specificities [General function prediction only]	NA|124aa|down_7|NC_020291.1_647376_647748_+	cd01109, HTH_YyaN, Helix-Turn-Helix DNA binding domain of the MerR-like transcription regulators YyaN and YraB	NA|234aa|down_8|NC_020291.1_647940_648642_+	COG0731, COG0731, Fe-S oxidoreductases [Energy production and conversion]	NA|84aa|down_9|NC_020291.1_648721_648973_+	pfam13684, Dak1_2, Dihydroxyacetone kinase family
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	5	1174106-1174207	5	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Orphan	ATCAGATGGTACTAGAGGTGCAATGAA	27	0	0	NA	NA	NA	1	1	Orphan	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|64aa|up_8|NC_020291.1_1164443_1164635_-,NA|127aa|down_4|NC_020291.1_1181956_1182337_-	NA|243aa|up_9|NC_020291.1_1163599_1164328_+	pfam04463, DUF523, Protein of unknown function (DUF523)	NA|64aa|up_8|NC_020291.1_1164443_1164635_-	NA	NA|492aa|up_7|NC_020291.1_1164734_1166210_-	PRK09852, PRK09852, cryptic 6-phospho-beta-glucosidase; Provisional	NA|486aa|up_6|NC_020291.1_1166430_1167888_+	cd17502, MFS_Azr1_MDR_like, Saccharomyces cerevisiae Azole resistance protein 1 (Azr1p), and similar multidrug resistance (MDR) transporters of the Major Facilitator Superfamily	NA|255aa|up_5|NC_020291.1_1168026_1168791_-	cd07363, 45_DOPA_Dioxygenase, The Class III extradiol dioxygenase, 4,5-DOPA Dioxygenase, catalyzes the incorporation of both atoms of molecular oxygen into 4,5-dihydroxy-phenylalanine	NA|145aa|up_4|NC_020291.1_1169040_1169475_+	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|158aa|up_3|NC_020291.1_1169573_1170047_+	COG0386, BtuE, Glutathione peroxidase [Posttranslational modification, protein turnover, chaperones]	NA|289aa|up_2|NC_020291.1_1170090_1170957_+	COG0492, TrxB, Thioredoxin reductase [Posttranslational modification, protein turnover, chaperones]	NA|104aa|up_1|NC_020291.1_1170973_1171285_+	TIGR01068, Thioredoxin-like_protein_slr0233, thioredoxin	NA|179aa|up_0|NC_020291.1_1171445_1171982_+	COG0386, BtuE, Glutathione peroxidase [Posttranslational modification, protein turnover, chaperones]	NA|412aa|down_0|NC_020291.1_1174587_1175823_+	COG0420, SbcD, DNA repair exonuclease [DNA replication, recombination, and repair]	NA|1163aa|down_1|NC_020291.1_1175797_1179286_+	TIGR00618, Nuclease_SbcCD_subunit_C, exonuclease SbcC	NA|549aa|down_2|NC_020291.1_1179358_1181005_-	PRK05290, PRK05290, hybrid cluster protein; Provisional	NA|248aa|down_3|NC_020291.1_1181194_1181938_-	COG3279, LytT, Response regulator of the LytR/AlgR family [Transcription / Signal transduction mechanisms]	NA|127aa|down_4|NC_020291.1_1181956_1182337_-	NA	NA|325aa|down_5|NC_020291.1_1182364_1183339_-	PRK13665, PRK13665, hypothetical protein; Provisional	NA|166aa|down_6|NC_020291.1_1183411_1183909_-	COG1030, NfeD, Membrane-bound serine protease (ClpP class) [Posttranslational modification, protein turnover, chaperones]	NA|283aa|down_7|NC_020291.1_1184108_1184957_-	COG3290, CitA, Signal transduction histidine kinase regulating citrate/malate metabolism [Signal transduction mechanisms]	NA|576aa|down_8|NC_020291.1_1185228_1186956_+	cd05799, PGM2, This CD includes PGM2 (phosphoglucomutase 2) and PGM2L1 (phosphoglucomutase 2-like 1)	NA|367aa|down_9|NC_020291.1_1187114_1188215_+	sd00006, TPR, Tetratricopeptide repeat
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	6	2066409-2066536	6	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Orphan	GCATAGCTGCTCTTTTTATAAGGGCA	26	1	4	2066435-2066454|2066435-2066454|2066435-2066454|2066435-2066454	NC_020291.1_2722980-2722999|NC_020291.1_910605-910586|NC_020291.1_4561423-4561442|NC_020291.1_5926267-5926286	NA	2	2	Orphan	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|48aa|up_7|NC_020291.1_2056237_2056381_+,NA|51aa|down_9|NC_020291.1_2078975_2079128_+	NA|742aa|up_9|NC_020291.1_2050799_2053025_+	pfam02011, Glyco_hydro_48, Glycosyl hydrolase family 48	NA|872aa|up_8|NC_020291.1_2053441_2056057_+	pfam00759, Glyco_hydro_9, Glycosyl hydrolase family 9	NA|48aa|up_7|NC_020291.1_2056237_2056381_+	NA	NA|714aa|up_6|NC_020291.1_2056653_2058795_+	pfam00759, Glyco_hydro_9, Glycosyl hydrolase family 9	NA|609aa|up_5|NC_020291.1_2058820_2060647_+	pfam12891, Glyco_hydro_44, Glycoside hydrolase family 44	NA|473aa|up_4|NC_020291.1_2060675_2062094_+	COG3934, COG3934, Endo-beta-mannanase [Carbohydrate transport and metabolism]	NA|441aa|up_3|NC_020291.1_2062163_2063486_-	cd16935, HATPase_AgrC-ComD-like, Histidine kinase-like ATPase domain of two-component sensor histidine kinases similar to Staphylococcus aureus AgrC and Streptococcus pneumoniae ComD which are involved in quorum sensing	NA|244aa|up_2|NC_020291.1_2063473_2064205_-	COG3279, LytT, Response regulator of the LytR/AlgR family [Transcription / Signal transduction mechanisms]	NA|199aa|up_1|NC_020291.1_2064492_2065089_-	PRK01100, PRK01100, accessory gene regulator ArgB-like protein	NA|179aa|up_0|NC_020291.1_2065459_2065996_+	pfam02517, Abi, CAAX protease self-immunity	NA|494aa|down_0|NC_020291.1_2066706_2068188_+	COG2730, BglC, Endoglucanase [Carbohydrate transport and metabolism]	NA|380aa|down_1|NC_020291.1_2068222_2069362_+	COG4124, ManB, Beta-mannanase [Carbohydrate transport and metabolism]	NA|407aa|down_2|NC_020291.1_2069753_2070974_-	cd17320, MFS_MdfA_MDR_like, Multidrug transporter MdfA and similar multidrug resistance (MDR) transporters of the Major Facilitator Superfamily	NA|295aa|down_3|NC_020291.1_2071263_2072148_-	cd07712, MBLAC2-like_MBL-fold, uncharacterized human metallo-beta-lactamase domain-containing protein 2 and related proteins; MBL-fold metallo hydrolase domain	NA|112aa|down_4|NC_020291.1_2072452_2072788_+	COG1733, COG1733, Predicted transcriptional regulators [Transcription]	NA|420aa|down_5|NC_020291.1_2073698_2074958_+	cd06174, MFS, Major Facilitator Superfamily	NA|653aa|down_6|NC_020291.1_2074941_2076900_+	COG0480, FusA, Translation elongation factors (GTPases) [Translation, ribosomal structure and biogenesis]	NA|100aa|down_7|NC_020291.1_2077233_2077533_+	pfam17098, Wtap, WTAP/Mum2p family	NA|251aa|down_8|NC_020291.1_2078239_2078992_+	cd00229, SGNH_hydrolase, SGNH_hydrolase, or GDSL_hydrolase, is a diverse family of lipases and esterases	NA|51aa|down_9|NC_020291.1_2078975_2079128_+	NA
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	7	4306294-4306455	7	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Orphan	TATTCCTAATGGGGTAACAAATAT	24	0	0	NA	NA	NA	2	2	Orphan	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|140aa|up_5|NC_020291.1_4298220_4298640_-,NA|430aa|up_0|NC_020291.1_4303977_4305267_-,NA|32aa|down_3|NC_020291.1_4309816_4309912_-	NA|310aa|up_9|NC_020291.1_4290879_4291809_-	TIGR00745, Putative_2-dehydropantoate_2-reductase, 2-dehydropantoate 2-reductase	NA|112aa|up_8|NC_020291.1_4292232_4292568_-	COG4538, COG4538, Uncharacterized conserved protein [Function unknown]	NA|213aa|up_7|NC_020291.1_4292595_4293234_-	pfam02589, LUD_dom, LUD domain	NA|1635aa|up_6|NC_020291.1_4293297_4298202_-	pfam13569, DUF4132, Domain of unknown function (DUF4132)	NA|140aa|up_5|NC_020291.1_4298220_4298640_-	NA	NA|574aa|up_4|NC_020291.1_4299244_4300966_-	cd18043, DEXXQc_SF1, DEXXQ-box helicase domain of Superfamily 1 helicases	NA|301aa|up_3|NC_020291.1_4301057_4301960_-	cd01174, ribokinase, Ribokinase catalyses the phosphorylation of ribose to ribose-5-phosphate using ATP	NA|299aa|up_2|NC_020291.1_4302101_4302998_-	cd08434, PBP2_GltC_like, The substrate binding domain of LysR-type transcriptional regulator GltC, which activates gltA expression of glutamate synthase operon, contains type 2 periplasmic binding fold	NA|187aa|up_1|NC_020291.1_4303327_4303888_+	cd02136, PnbA_NfnB-like, nitroreductase similar to Mycobacterium smegmatis NfnB	NA|430aa|up_0|NC_020291.1_4303977_4305267_-	NA	NA|261aa|down_0|NC_020291.1_4306753_4307536_-	COG1187, RsuA, 16S rRNA uridine-516 pseudouridylate synthase and related pseudouridylate synthases [Translation, ribosomal structure and biogenesis]	NA|319aa|down_1|NC_020291.1_4307633_4308590_-	cd12162, 2-Hacid_dh_4, Putative D-isomer specific 2-hydroxyacid dehydrogenases	NA|331aa|down_2|NC_020291.1_4308626_4309619_-	TIGR02917, TPR_domain_protein, putative PEP-CTERM system TPR-repeat lipoprotein	NA|32aa|down_3|NC_020291.1_4309816_4309912_-	NA	NA|152aa|down_4|NC_020291.1_4309984_4310440_-	pfam04074, DUF386, Domain of unknown function (DUF386)	NA|249aa|down_5|NC_020291.1_4310476_4311223_-	PRK05653, fabG, 3-oxoacyl-ACP reductase FabG	NA|399aa|down_6|NC_020291.1_4311483_4312680_-	COG4692, COG4692, Predicted neuraminidase (sialidase) [Carbohydrate transport and metabolism]	NA|471aa|down_7|NC_020291.1_4313017_4314430_-	cd10322, SLC5sbd, Solute carrier 5 family, sodium/glucose transporters and related proteins; solute-binding domain	NA|332aa|down_8|NC_020291.1_4314526_4315522_-	PRK00232, pdxA, 4-hydroxythreonine-4-phosphate dehydrogenase; Reviewed	NA|431aa|down_9|NC_020291.1_4315518_4316811_-	pfam07005, DUF1537, Putative sugar-binding N-terminal domain
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	8	4341559-4341685	8	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Orphan	GGAGTTACTGCATCATTCTTTTTTGCATTTACTTTTATA	39	0	0	NA	NA	NA	1	1	Orphan	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA,NA	NA|417aa|up_9|NC_020291.1_4326179_4327430_-	TIGR01730, COG0845:_Membrane-fusion_protein, RND family efflux transporter, MFP subunit	NA|1048aa|up_8|NC_020291.1_4327419_4330563_-	COG0841, AcrB, Cation/multidrug efflux pump [Defense mechanisms]	NA|290aa|up_7|NC_020291.1_4330726_4331596_-	PRK08185, PRK08185, hypothetical protein; Provisional	NA|287aa|up_6|NC_020291.1_4331636_4332497_-	pfam01116, F_bP_aldolase, Fructose-bisphosphate aldolase class-II	NA|359aa|up_5|NC_020291.1_4332524_4333601_-	COG1299, FruA, Phosphotransferase system, fructose-specific IIC component [Carbohydrate transport and metabolism]	NA|104aa|up_4|NC_020291.1_4333631_4333943_-	COG1445, FrwB, Phosphotransferase system fructose-specific component IIB [Carbohydrate transport and metabolism]	NA|800aa|up_3|NC_020291.1_4334015_4336415_-	pfam00359, PTS_EIIA_2, Phosphoenolpyruvate-dependent sugar phosphotransferase system, EIIA 2	NA|662aa|up_2|NC_020291.1_4336745_4338731_+	COG0840, Tar, Methyl-accepting chemotaxis protein [Cell motility and secretion / Signal transduction mechanisms]	NA|373aa|up_1|NC_020291.1_4339358_4340477_+	cd04735, OYE_like_4_FMN, Old yellow enzyme (OYE)-related FMN binding domain, group 4	NA|185aa|up_0|NC_020291.1_4340812_4341367_-	cd02209, cupin_XRE_C, XRE (Xenobiotic Response Element) family transcriptional regulators, C-terminal cupin domain	NA|297aa|down_0|NC_020291.1_4342865_4343756_-	COG3677, COG3677, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|334aa|down_1|NC_020291.1_4344110_4345112_-	COG1984, DUR1, Allophanate hydrolase subunit 2 [Amino acid transport and metabolism]	NA|237aa|down_2|NC_020291.1_4345111_4345822_-	COG2049, DUR1, Allophanate hydrolase subunit 1 [Amino acid transport and metabolism]	NA|260aa|down_3|NC_020291.1_4345969_4346749_-	cd10787, LamB_YcsF_like, LamB/YcsF family of  lactam utilization protein	NA|263aa|down_4|NC_020291.1_4347107_4347896_-	PRK05463, PRK05463, putative hydro-lyase	NA|358aa|down_5|NC_020291.1_4348316_4349390_-	pfam14336, DUF4392, Domain of unknown function (DUF4392)	NA|283aa|down_6|NC_020291.1_4349400_4350249_-	cd01558, D-AAT_like, D-Alanine aminotransferase (D-AAT_like): D-amino acid aminotransferase catalyzes transamination between D-amino acids and their respective alpha-keto acids	NA|152aa|down_7|NC_020291.1_4350629_4351085_-	COG1522, Lrp, Transcriptional regulators [Transcription]	NA|235aa|down_8|NC_020291.1_4351094_4351799_-	COG0410, LivF, ABC-type branched-chain amino acid transport systems, ATPase component [Amino acid transport and metabolism]	NA|257aa|down_9|NC_020291.1_4351800_4352571_-	COG0411, LivG, ABC-type branched-chain amino acid transport systems, ATPase component [Amino acid transport and metabolism]
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	9	4375620-4375720	9	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Orphan	ATAATCTTGGTTGCAGATAAGTT	23	0	0	NA	NA	NA	1	1	Orphan	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|316aa|up_5|NC_020291.1_4369224_4370172_-,NA|65aa|up_4|NC_020291.1_4370652_4370847_-,NA|249aa|up_1|NC_020291.1_4372789_4373536_-,NA|82aa|down_3|NC_020291.1_4377805_4378051_-,NA|197aa|down_4|NC_020291.1_4378431_4379022_-,NA|186aa|down_7|NC_020291.1_4381434_4381992_-,NA|60aa|down_8|NC_020291.1_4382042_4382222_-,NA|75aa|down_9|NC_020291.1_4382299_4382524_-	NA|171aa|up_9|NC_020291.1_4364456_4364969_-	pfam00232, Glyco_hydro_1, Glycosyl hydrolase family 1	NA|313aa|up_8|NC_020291.1_4365166_4366105_+	PRK00236, xerC, site-specific tyrosine recombinase XerC; Reviewed	NA|568aa|up_7|NC_020291.1_4366293_4367997_-	COG4715, COG4715, Uncharacterized conserved protein [Function unknown]	NA|293aa|up_6|NC_020291.1_4368104_4368983_-	TIGR01784, Uncharacterized_protein_pSLT051, conserved hypothetical protein (putative transposase or invertase)	NA|316aa|up_5|NC_020291.1_4369224_4370172_-	NA	NA|65aa|up_4|NC_020291.1_4370652_4370847_-	NA	NA|211aa|up_3|NC_020291.1_4370945_4371578_-	COG0727, COG0727, Predicted Fe-S-cluster oxidoreductase [General function prediction only]	NA|59aa|up_2|NC_020291.1_4372034_4372211_-	PRK00270, rpsU, 30S ribosomal protein S21; Reviewed	NA|249aa|up_1|NC_020291.1_4372789_4373536_-	NA	NA|645aa|up_0|NC_020291.1_4373620_4375555_-	pfam09848, DUF2075, Uncharacterized conserved protein (DUF2075)	NA|106aa|down_0|NC_020291.1_4375743_4376061_-	cd11537, NTP-PPase_RS21-C6_like, Nucleoside Triphosphate Pyrophosphohydrolase (EC 3	NA|294aa|down_1|NC_020291.1_4376329_4377211_-	TIGR01784, Uncharacterized_protein_pSLT051, conserved hypothetical protein (putative transposase or invertase)	NA|122aa|down_2|NC_020291.1_4377443_4377809_-	pfam13975, gag-asp_proteas, gag-polyprotein putative aspartyl protease	NA|82aa|down_3|NC_020291.1_4377805_4378051_-	NA	NA|197aa|down_4|NC_020291.1_4378431_4379022_-	NA	NA|359aa|down_5|NC_020291.1_4379240_4380317_+	PRK00558, uvrC, excinuclease ABC subunit UvrC	NA|219aa|down_6|NC_020291.1_4380634_4381291_-	sd00036, LRR_3, leucine-rich repeats	NA|186aa|down_7|NC_020291.1_4381434_4381992_-	NA	NA|60aa|down_8|NC_020291.1_4382042_4382222_-	NA	NA|75aa|down_9|NC_020291.1_4382299_4382524_-	NA
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	10	5276834-5278564	2,1,10	CRT,PILER-CR,CRISPRCasFinder	no	cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6,WYL	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Unclear	ATTTACATTCCTCATAGTTAATATAANNAAC,ATTTACATTCCTCATAGTTAATATAAAAC,ATTTACATTCCTCATAGTTAATATAAAAC	31,29,29	0	0	NA	NA	NA:I-A:I-A	26,24,25	26	Unclear	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|381aa|up_2|NC_020291.1_5272990_5274133_-,NA	NA|264aa|up_9|NC_020291.1_5263130_5263922_+	COG1120, FepC, ABC-type cobalamin/Fe3+-siderophores transport systems, ATPase components [Inorganic ion transport and metabolism / Coenzyme metabolism]	NA|347aa|up_8|NC_020291.1_5263950_5264991_+	cd01148, TroA_a, Metal binding protein TroA_a	NA|601aa|up_7|NC_020291.1_5265369_5267172_+	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|112aa|up_6|NC_020291.1_5267240_5267576_-	cd06983, cupin_dsy2733, Desulfitobacterium hafniense dsy2733 and related proteins, cupin domain	NA|113aa|up_5|NC_020291.1_5267580_5267919_-	cd02230, cupin_HP0902-like, Helicobacter pylori HP0902 and related proteins, cupin domain	NA|1290aa|up_4|NC_020291.1_5268096_5271966_-	COG1924, COG1924, Activator of 2-hydroxyglutaryl-CoA dehydratase (HSP70-class ATPase domain) [Lipid metabolism]	NA|228aa|up_3|NC_020291.1_5272072_5272756_+	COG0664, Crp, cAMP-binding proteins - catabolite gene activator and regulatory subunit of cAMP-dependent protein kinases [Signal transduction mechanisms]	NA|381aa|up_2|NC_020291.1_5272990_5274133_-	NA	NA|371aa|up_1|NC_020291.1_5274438_5275551_-	PRK06520, PRK06520, 5-methyltetrahydropteroyltriglutamate--homocysteine S-methyltransferase	NA|303aa|up_0|NC_020291.1_5275716_5276625_-	COG0583, LysR, Transcriptional regulator [Transcription]	cas2|88aa|down_0|NC_020291.1_5281036_5281300_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|328aa|down_1|NC_020291.1_5281301_5282285_-	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas4|173aa|down_2|NC_020291.1_5282289_5282808_-	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas3|739aa|down_3|NC_020291.1_5282851_5285068_-	TIGR01587, CRISPR-associated_endonuclease/helicase_Cas3, CRISPR-associated helicase Cas3	cas5|224aa|down_4|NC_020291.1_5285207_5285879_-	cd09658, Cas5_I-B, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|303aa|down_5|NC_020291.1_5285885_5286794_-	TIGR02585, conserved_protein, CRISPR-associated protein Cas7/Cst2/DevR, subtype I-B/TNEAP	cas8b2|608aa|down_6|NC_020291.1_5286795_5288619_-	cd09665, Cas8a1_I-A, CRISPR/Cas system-associated protein Cas8a1	cas6|246aa|down_7|NC_020291.1_5288633_5289371_-	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	WYL|317aa|down_8|NC_020291.1_5289462_5290413_-	pfam13280, WYL, WYL domain	NA|251aa|down_9|NC_020291.1_5290673_5291426_-	PRK10621, PRK10621, hypothetical protein; Provisional
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	11	5278601-5280855	3,2,11	CRT,PILER-CR,CRISPRCasFinder	no	cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6,WYL	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Unclear	ATTTACATTCCTCATAGTTAATATAAAAC,ATTTACATTCCTCATAGTTAATATAAAAC,ATTTACATTCCTCATAGTTAATATAAAAC	29,29,29	0	0	NA	NA	I-A:I-A:I-A	34,33,33	34	Unclear	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|381aa|up_2|NC_020291.1_5272990_5274133_-,NA	NA|264aa|up_9|NC_020291.1_5263130_5263922_+	COG1120, FepC, ABC-type cobalamin/Fe3+-siderophores transport systems, ATPase components [Inorganic ion transport and metabolism / Coenzyme metabolism]	NA|347aa|up_8|NC_020291.1_5263950_5264991_+	cd01148, TroA_a, Metal binding protein TroA_a	NA|601aa|up_7|NC_020291.1_5265369_5267172_+	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|112aa|up_6|NC_020291.1_5267240_5267576_-	cd06983, cupin_dsy2733, Desulfitobacterium hafniense dsy2733 and related proteins, cupin domain	NA|113aa|up_5|NC_020291.1_5267580_5267919_-	cd02230, cupin_HP0902-like, Helicobacter pylori HP0902 and related proteins, cupin domain	NA|1290aa|up_4|NC_020291.1_5268096_5271966_-	COG1924, COG1924, Activator of 2-hydroxyglutaryl-CoA dehydratase (HSP70-class ATPase domain) [Lipid metabolism]	NA|228aa|up_3|NC_020291.1_5272072_5272756_+	COG0664, Crp, cAMP-binding proteins - catabolite gene activator and regulatory subunit of cAMP-dependent protein kinases [Signal transduction mechanisms]	NA|381aa|up_2|NC_020291.1_5272990_5274133_-	NA	NA|371aa|up_1|NC_020291.1_5274438_5275551_-	PRK06520, PRK06520, 5-methyltetrahydropteroyltriglutamate--homocysteine S-methyltransferase	NA|303aa|up_0|NC_020291.1_5275716_5276625_-	COG0583, LysR, Transcriptional regulator [Transcription]	cas2|88aa|down_0|NC_020291.1_5281036_5281300_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|328aa|down_1|NC_020291.1_5281301_5282285_-	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas4|173aa|down_2|NC_020291.1_5282289_5282808_-	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas3|739aa|down_3|NC_020291.1_5282851_5285068_-	TIGR01587, CRISPR-associated_endonuclease/helicase_Cas3, CRISPR-associated helicase Cas3	cas5|224aa|down_4|NC_020291.1_5285207_5285879_-	cd09658, Cas5_I-B, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|303aa|down_5|NC_020291.1_5285885_5286794_-	TIGR02585, conserved_protein, CRISPR-associated protein Cas7/Cst2/DevR, subtype I-B/TNEAP	cas8b2|608aa|down_6|NC_020291.1_5286795_5288619_-	cd09665, Cas8a1_I-A, CRISPR/Cas system-associated protein Cas8a1	cas6|246aa|down_7|NC_020291.1_5288633_5289371_-	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	WYL|317aa|down_8|NC_020291.1_5289462_5290413_-	pfam13280, WYL, WYL domain	NA|251aa|down_9|NC_020291.1_5290673_5291426_-	PRK10621, PRK10621, hypothetical protein; Provisional
GCF_000340885.1_ASM34088v1	NC_020291	Clostridium saccharoperbutylacetonicum N1-4(HMT), complete sequence	12	6007076-6007161	12	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	Orphan	AACCAACCAGTTTTCATTGCTCCTGA	26	0	0	NA	NA	NA	1	1	Orphan	cas3,RT,DEDDh,csa3,PD-DExK,WYL,DinG,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6,cas14j	NA|105aa|up_8|NC_020291.1_5988032_5988347_-,NA|465aa|down_7|NC_020291.1_6021861_6023256_-	NA|776aa|up_9|NC_020291.1_5985560_5987888_-	cd02696, MurNAc-LAA, N-acetylmuramoyl-L-alanine amidase or MurNAc-LAA (also known as peptidoglycan aminohydrolase, NAMLA amidase, NAMLAA, Amidase 3, and peptidoglycan amidase; EC 3	NA|105aa|up_8|NC_020291.1_5988032_5988347_-	NA	NA|532aa|up_7|NC_020291.1_5988605_5990201_-	COG4108, PrfC, Peptide chain release factor RF-3 [Translation, ribosomal structure and biogenesis]	NA|355aa|up_6|NC_020291.1_5990744_5991809_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|1153aa|up_5|NC_020291.1_5991897_5995356_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|668aa|up_4|NC_020291.1_5996093_5998097_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|685aa|up_3|NC_020291.1_5998269_6000324_-	COG3437, COG3437, Response regulator containing a CheY-like receiver domain and an HD-GYP domain [Transcription / Signal transduction mechanisms]	NA|436aa|up_2|NC_020291.1_6000839_6002147_-	COG0840, Tar, Methyl-accepting chemotaxis protein [Cell motility and secretion / Signal transduction mechanisms]	NA|743aa|up_1|NC_020291.1_6002411_6004640_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|482aa|up_0|NC_020291.1_6005193_6006639_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|564aa|down_0|NC_020291.1_6009493_6011185_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|605aa|down_1|NC_020291.1_6011485_6013300_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|376aa|down_2|NC_020291.1_6013702_6014830_+	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|468aa|down_3|NC_020291.1_6014954_6016358_-	COG1672, COG1672, Predicted ATPase (AAA+ superfamily) [General function prediction only]	NA|517aa|down_4|NC_020291.1_6016657_6018208_-	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|561aa|down_5|NC_020291.1_6018268_6019951_-	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|567aa|down_6|NC_020291.1_6019984_6021685_-	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|465aa|down_7|NC_020291.1_6021861_6023256_-	NA	NA|391aa|down_8|NC_020291.1_6024362_6025535_+	COG1835, COG1835, Predicted acyltransferases [Lipid metabolism]	NA|318aa|down_9|NC_020291.1_6026015_6026969_-	cd04187, DPM1_like_bac, Bacterial DPM1_like enzymes are related to eukaryotic DPM1
