assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000016965.1_ASM1696v1	NC_009617	Clostridium beijerinckii NCIMB 8052, complete sequence	1	1015037-1015137	1	CRISPRCasFinder	no		cas3,DEDDh,csa3,DinG,RT,WYL	Orphan	AAAAAGTGCGAAGCACAATTAAGA	24	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,csa3,DinG,RT,WYL	NA|110aa|up_9|NC_009617.1_1002633_1002963_+,NA	NA|110aa|up_9|NC_009617.1_1002633_1002963_+	NA	NA|602aa|up_8|NC_009617.1_1003134_1004940_+	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	NA|147aa|up_7|NC_009617.1_1005120_1005561_+	cd07311, terB_like_1, tellurium resistance terB-like protein, subgroup 1	NA|376aa|up_6|NC_009617.1_1005776_1006904_+	PRK05799, PRK05799, oxygen-independent coproporphyrinogen III oxidase	NA|343aa|up_5|NC_009617.1_1007142_1008171_+	PRK00082, hrcA, heat-inducible transcription repressor; Provisional	NA|208aa|up_4|NC_009617.1_1008208_1008832_+	PRK14160, PRK14160, heat shock protein GrpE; Provisional	NA|615aa|up_3|NC_009617.1_1008937_1010782_+	PRK00290, dnaK, molecular chaperone DnaK; Provisional	NA|378aa|up_2|NC_009617.1_1010892_1012026_+	PRK14297, PRK14297, molecular chaperone DnaJ	NA|517aa|up_1|NC_009617.1_1012186_1013737_+	COG0155, CysI, Sulfite reductase, beta subunit (hemoprotein) [Inorganic ion transport and metabolism]	NA|220aa|up_0|NC_009617.1_1014158_1014818_+	PRK00121, trmB, tRNA (guanine-N(7)-)-methyltransferase; Reviewed	NA|315aa|down_0|NC_009617.1_1015517_1016462_+	pfam06325, PrmA, Ribosomal protein L11 methyltransferase (PrmA)	NA|256aa|down_1|NC_009617.1_1016668_1017436_+	PRK11713, PRK11713, 16S ribosomal RNA methyltransferase RsmE; Provisional	NA|468aa|down_2|NC_009617.1_1017435_1018839_+	COG0621, MiaB, 2-methylthioadenine synthetase [Translation, ribosomal structure and biogenesis]	NA|115aa|down_3|NC_009617.1_1018988_1019333_+	cd01276, PKCI_related, Protein Kinase C Interacting protein related (PKCI): PKCI and related proteins belong to the ubiquitous HIT family of hydrolases that act on alpha-phosphates of ribonucleotides	NA|59aa|down_4|NC_009617.1_1019475_1019652_+	PRK00270, rpsU, 30S ribosomal protein S21; Reviewed	NA|151aa|down_5|NC_009617.1_1019682_1020135_+	pfam09424, YqeY, Yqey-like protein	NA|93aa|down_6|NC_009617.1_1020423_1020702_+	TIGR02856, Uncharacterized_protein_YqfC, sporulation protein YqfC	NA|376aa|down_7|NC_009617.1_1020708_1021836_+	pfam06898, YqfD, Putative stage IV sporulation protein YqfD	NA|695aa|down_8|NC_009617.1_1021896_1023981_+	COG1480, COG1480, Predicted membrane-associated HD superfamily hydrolase [General function prediction only]	NA|168aa|down_9|NC_009617.1_1024007_1024511_+	PRK00016, PRK00016, metal-binding heat shock protein; Provisional
GCF_000016965.1_ASM1696v1	NC_009617	Clostridium beijerinckii NCIMB 8052, complete sequence	2	1516095-1516173	2	CRISPRCasFinder	no		cas3,DEDDh,csa3,DinG,RT,WYL	Orphan	ATGAAAAGAGTGCGGAGCACAATT	24	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,csa3,DinG,RT,WYL	NA|172aa|up_9|NC_009617.1_1505487_1506003_+,NA|313aa|down_9|NC_009617.1_1526935_1527874_+	NA|172aa|up_9|NC_009617.1_1505487_1506003_+	NA	NA|209aa|up_8|NC_009617.1_1506198_1506825_-	TIGR02840, conserved_hypothetical_protein, putative sporulation protein YtaF	NA|271aa|up_7|NC_009617.1_1507135_1507948_+	cd07516, HAD_Pase, phosphatase, similar to Escherichia coli Cof and Thermotoga maritima TM0651; belongs to the haloacid dehalogenase-like superfamily	NA|369aa|up_6|NC_009617.1_1508407_1509514_+	COG2206, COG2206, c-di-GMP phosphodiesterase class II (HD-GYP domain) [Signal transduction mechanisms]	NA|590aa|up_5|NC_009617.1_1509559_1511329_-	COG1001, AdeC, Adenine deaminase [Nucleotide transport and metabolism]	NA|353aa|up_4|NC_009617.1_1511586_1512645_-	pfam10282, Lactonase, Lactonase, 7-bladed beta-propeller	NA|305aa|up_3|NC_009617.1_1513234_1514149_+	PRK05368, PRK05368, homoserine O-succinyltransferase; Provisional	NA|203aa|up_2|NC_009617.1_1514234_1514843_+	pfam09997, DUF2238, Predicted membrane protein (DUF2238)	NA|89aa|up_1|NC_009617.1_1514881_1515148_-	pfam06961, DUF1294, Protein of unknown function (DUF1294)	NA|214aa|up_0|NC_009617.1_1515293_1515935_-	cd00475, Cis_IPPS, Cis (Z)-Isoprenyl Diphosphate Synthases	NA|402aa|down_0|NC_009617.1_1517020_1518226_+	PRK00045, hemA, glutamyl-tRNA reductase; Reviewed	NA|227aa|down_1|NC_009617.1_1518183_1518864_+	PRK05562, PRK05562, NAD(P)-dependent oxidoreductase	NA|292aa|down_2|NC_009617.1_1518907_1519783_+	PRK00072, hemC, porphobilinogen deaminase; Reviewed	NA|488aa|down_3|NC_009617.1_1519795_1521259_+	TIGR01469, Uroporphyrinogen-III_C-methyltransferase, uroporphyrin-III C-methyltransferase	NA|322aa|down_4|NC_009617.1_1521357_1522323_+	PRK09283, PRK09283, porphobilinogen synthase	NA|432aa|down_5|NC_009617.1_1522560_1523856_+	PRK00062, PRK00062, glutamate-1-semialdehyde 2,1-aminomutase	NA|214aa|down_6|NC_009617.1_1523898_1524540_+	pfam02677, DUF208, Uncharacterized BCR, COG1636	NA|186aa|down_7|NC_009617.1_1524623_1525181_+	pfam12983, DUF3867, Protein of unknown function (DUF3867)	NA|325aa|down_8|NC_009617.1_1525587_1526562_-	COG0657, Aes, Esterase/lipase [Lipid metabolism]	NA|313aa|down_9|NC_009617.1_1526935_1527874_+	NA
GCF_000016965.1_ASM1696v1	NC_009617	Clostridium beijerinckii NCIMB 8052, complete sequence	3	1588990-1589129	1	PILER-CR	no		cas3,DEDDh,csa3,DinG,RT,WYL	Orphan	AACCTATATAAACAATTTAAAATAAAA	27	0	0	NA	NA	NA	2	2	Orphan	cas3,DEDDh,csa3,DinG,RT,WYL	NA|242aa|up_8|NC_009617.1_1583738_1584464_+,NA|100aa|up_7|NC_009617.1_1584495_1584795_+,NA|218aa|up_4|NC_009617.1_1586346_1587000_+,NA|66aa|up_3|NC_009617.1_1587024_1587222_+,NA|54aa|up_2|NC_009617.1_1587311_1587473_+,NA|118aa|up_1|NC_009617.1_1587497_1587851_+,NA|319aa|up_0|NC_009617.1_1587939_1588896_+,NA|138aa|down_0|NC_009617.1_1589376_1589790_+,NA|66aa|down_1|NC_009617.1_1589898_1590096_+,NA|616aa|down_2|NC_009617.1_1590098_1591946_+,NA|1152aa|down_3|NC_009617.1_1592467_1595923_+,NA|212aa|down_5|NC_009617.1_1596635_1597271_+,NA|185aa|down_6|NC_009617.1_1597844_1598399_+,NA|102aa|down_7|NC_009617.1_1598409_1598715_+,NA|280aa|down_8|NC_009617.1_1598785_1599625_+	NA|59aa|up_9|NC_009617.1_1583464_1583641_+	pfam07411, DUF1508, Domain of unknown function (DUF1508)	NA|242aa|up_8|NC_009617.1_1583738_1584464_+	NA	NA|100aa|up_7|NC_009617.1_1584495_1584795_+	NA	NA|138aa|up_6|NC_009617.1_1585276_1585690_+	pfam09851, SHOCT, Short C-terminal domain	NA|67aa|up_5|NC_009617.1_1585993_1586194_-	pfam12651, RHH_3, Ribbon-helix-helix domain	NA|218aa|up_4|NC_009617.1_1586346_1587000_+	NA	NA|66aa|up_3|NC_009617.1_1587024_1587222_+	NA	NA|54aa|up_2|NC_009617.1_1587311_1587473_+	NA	NA|118aa|up_1|NC_009617.1_1587497_1587851_+	NA	NA|319aa|up_0|NC_009617.1_1587939_1588896_+	NA	NA|138aa|down_0|NC_009617.1_1589376_1589790_+	NA	NA|66aa|down_1|NC_009617.1_1589898_1590096_+	NA	NA|616aa|down_2|NC_009617.1_1590098_1591946_+	NA	NA|1152aa|down_3|NC_009617.1_1592467_1595923_+	NA	NA|60aa|down_4|NC_009617.1_1596126_1596306_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|212aa|down_5|NC_009617.1_1596635_1597271_+	NA	NA|185aa|down_6|NC_009617.1_1597844_1598399_+	NA	NA|102aa|down_7|NC_009617.1_1598409_1598715_+	NA	NA|280aa|down_8|NC_009617.1_1598785_1599625_+	NA	NA|84aa|down_9|NC_009617.1_1599763_1600015_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins
GCF_000016965.1_ASM1696v1	NC_009617	Clostridium beijerinckii NCIMB 8052, complete sequence	4	4694168-4694264	3	CRISPRCasFinder	no		cas3,DEDDh,csa3,DinG,RT,WYL	Orphan	CCATACTTGTATGGTAGTTATATTT	25	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,csa3,DinG,RT,WYL	NA,NA|99aa|down_3|NC_009617.1_4699933_4700230_+,NA|104aa|down_7|NC_009617.1_4702564_4702876_-	NA|300aa|up_9|NC_009617.1_4680079_4680979_-	cd01174, ribokinase, Ribokinase catalyses the phosphorylation of ribose to ribose-5-phosphate using ATP	NA|566aa|up_8|NC_009617.1_4681144_4682842_-	COG0840, Tar, Methyl-accepting chemotaxis protein [Cell motility and secretion / Signal transduction mechanisms]	NA|488aa|up_7|NC_009617.1_4682924_4684388_-	cd01536, PBP1_ABC_sugar_binding-like, periplasmic sugar-binding domain of active transport systems that are members of the type 1 periplasmic binding protein (PBP1) superfamily	NA|186aa|up_6|NC_009617.1_4684965_4685523_-	COG3963, COG3963, Phospholipid N-methyltransferase [Lipid metabolism]	NA|141aa|up_5|NC_009617.1_4686410_4686833_-	COG0537, Hit, Diadenosine tetraphosphate (Ap4A) hydrolase and other HIT family hydrolases [Nucleotide transport and metabolism / Carbohydrate transport and metabolism / General function prediction only]	NA|502aa|up_4|NC_009617.1_4687117_4688623_-	COG2211, MelB, Na+/melibiose symporter and related transporters [Carbohydrate transport and metabolism]	NA|474aa|up_3|NC_009617.1_4688661_4690083_-	pfam02614, UxaC, Glucuronate isomerase	NA|533aa|up_2|NC_009617.1_4690486_4692085_-	COG0246, MtlD, Mannitol-1-phosphate/altronate dehydrogenases [Carbohydrate transport and metabolism]	NA|354aa|up_1|NC_009617.1_4692213_4693275_-	PRK03906, PRK03906, mannonate dehydratase; Provisional	NA|224aa|up_0|NC_009617.1_4693465_4694137_-	COG1802, GntR, Transcriptional regulators [Transcription]	NA|560aa|down_0|NC_009617.1_4694483_4696163_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|392aa|down_1|NC_009617.1_4696244_4697420_+	COG4134, COG4134, ABC-type uncharacterized transport system, periplasmic component [General function prediction only]	NA|621aa|down_2|NC_009617.1_4697499_4699362_-	COG0531, PotE, Amino acid transporters [Amino acid transport and metabolism]	NA|99aa|down_3|NC_009617.1_4699933_4700230_+	NA	NA|148aa|down_4|NC_009617.1_4700367_4700811_-	pfam13508, Acetyltransf_7, Acetyltransferase (GNAT) domain	NA|52aa|down_5|NC_009617.1_4701099_4701255_-	PRK09857, PRK09857, recombination-promoting nuclease RpnA	NA|354aa|down_6|NC_009617.1_4701407_4702469_-	cd08174, G1PDH-like, Glycerol-1-phosphate dehydrogenase-like	NA|104aa|down_7|NC_009617.1_4702564_4702876_-	NA	NA|64aa|down_8|NC_009617.1_4702959_4703151_-	pfam04024, PspC, PspC domain	NA|572aa|down_9|NC_009617.1_4703555_4705271_-	pfam00920, ILVD_EDD, Dehydratase family
GCF_000016965.1_ASM1696v1	NC_009617	Clostridium beijerinckii NCIMB 8052, complete sequence	5	5491433-5491638	4	CRISPRCasFinder	no		cas3,DEDDh,csa3,DinG,RT,WYL	Orphan	TGGTTGAATGATAATGGAACTTGGTA	26	0	0	NA	NA	NA	3	3	Orphan	cas3,DEDDh,csa3,DinG,RT,WYL	NA|346aa|up_7|NC_009617.1_5477625_5478663_-,NA|95aa|up_3|NC_009617.1_5483585_5483870_+,NA	NA|439aa|up_9|NC_009617.1_5475067_5476384_-	COG0677, WecC, UDP-N-acetyl-D-mannosaminuronate dehydrogenase [Cell envelope biogenesis, outer membrane]	NA|297aa|up_8|NC_009617.1_5476716_5477607_-	cd03352, LbH_LpxD, UDP-3-O-acyl-glucosamine N-acyltransferase (LpxD): The enzyme catalyzes the transfer of 3-hydroxymyristic acid or 3-hydroxy-arachidic acid, depending on the organism, from the acyl carrier protein (ACP) to UDP-3-O-acyl-glucosamine to produce UDP-2,3-diacyl-GlcNAc	NA|346aa|up_7|NC_009617.1_5477625_5478663_-	NA	NA|368aa|up_6|NC_009617.1_5478655_5479759_-	cd00616, AHBA_syn, 3-amino-5-hydroxybenzoic acid synthase family (AHBA_syn)	NA|321aa|up_5|NC_009617.1_5479751_5480714_-	cd05230, UGD_SDR_e, UDP-glucuronate decarboxylase (UGD) and related proteins, extended (e) SDRs	NA|837aa|up_4|NC_009617.1_5480710_5483221_-	cd03801, GT4_PimA-like, phosphatidyl-myo-inositol mannosyltransferase	NA|95aa|up_3|NC_009617.1_5483585_5483870_+	NA	NA|320aa|up_2|NC_009617.1_5484283_5485243_+	pfam00688, TGFb_propeptide, TGF-beta propeptide	NA|532aa|up_1|NC_009617.1_5485394_5486990_-	PRK00741, prfC, peptide chain release factor 3; Provisional	NA|628aa|up_0|NC_009617.1_5487518_5489402_+	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|650aa|down_0|NC_009617.1_5492038_5493988_+	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|291aa|down_1|NC_009617.1_5494261_5495134_-	cd08563, GDPD_TtGDE_like, Glycerophosphodiester phosphodiesterase domain of Thermoanaerobacter tengcongensis and similar proteins	NA|356aa|down_2|NC_009617.1_5495425_5496493_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|1106aa|down_3|NC_009617.1_5496584_5499902_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|701aa|down_4|NC_009617.1_5500217_5502320_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|436aa|down_5|NC_009617.1_5502592_5503900_-	COG0840, Tar, Methyl-accepting chemotaxis protein [Cell motility and secretion / Signal transduction mechanisms]	NA|745aa|down_6|NC_009617.1_5504169_5506404_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|474aa|down_7|NC_009617.1_5506726_5508148_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|594aa|down_8|NC_009617.1_5508580_5510362_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|656aa|down_9|NC_009617.1_5511390_5513358_-	cd03255, ABC_MJ0796_LolCDE_FtsE, ATP-binding cassette domain of the transporters involved in export of lipoprotein and macrolide, and cell division protein
GCF_000016965.1_ASM1696v1	NC_009617	Clostridium beijerinckii NCIMB 8052, complete sequence	6	5552525-5552671	5	CRISPRCasFinder	no		cas3,DEDDh,csa3,DinG,RT,WYL	Orphan	CATAGCACCTGATCCATTTAAGTAGTA	27	0	0	NA	NA	NA	2	2	Orphan	cas3,DEDDh,csa3,DinG,RT,WYL	NA,NA|86aa|down_6|NC_009617.1_5564653_5564911_+,NA|74aa|down_7|NC_009617.1_5564931_5565153_+,NA|84aa|down_8|NC_009617.1_5565251_5565503_+,NA|48aa|down_9|NC_009617.1_5565548_5565692_+	NA|421aa|up_9|NC_009617.1_5539229_5540492_-	cd03220, ABC_KpsT_Wzt, ATP-binding cassette component of polysaccharide transport system	NA|459aa|up_8|NC_009617.1_5540504_5541881_-	COG1682, TagG, ABC-type polysaccharide/polyol phosphate export systems, permease component [Carbohydrate transport and metabolism / Cell envelope biogenesis, outer membrane]	NA|280aa|up_7|NC_009617.1_5541896_5542736_-	pfam04321, RmlD_sub_bind, RmlD substrate binding domain	NA|323aa|up_6|NC_009617.1_5542750_5543719_-	cd04196, GT_2_like_d, Subfamily of Glycosyltransferase Family GT2 of unknown function	NA|340aa|up_5|NC_009617.1_5543705_5544725_-	COG1088, RfbB, dTDP-D-glucose 4,6-dehydratase [Cell envelope biogenesis, outer membrane]	NA|184aa|up_4|NC_009617.1_5544890_5545442_-	pfam00908, dTDP_sugar_isom, dTDP-4-dehydrorhamnose 3,5-epimerase	NA|294aa|up_3|NC_009617.1_5545476_5546358_-	TIGR01207, Glucose-1-phosphate_thymidylyltransferase_1, glucose-1-phosphate thymidylyltransferase, short form	NA|473aa|up_2|NC_009617.1_5546785_5548204_+	TIGR03023, Sugar_transferase	NA|290aa|up_1|NC_009617.1_5548279_5549149_+	cd04186, GT_2_like_c, Subfamily of Glycosyltransferase Family GT2 of unknown function	NA|611aa|up_0|NC_009617.1_5549357_5551190_+	pfam04932, Wzy_C, O-Antigen ligase	NA|406aa|down_0|NC_009617.1_5555078_5556296_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|415aa|down_1|NC_009617.1_5556426_5557671_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|514aa|down_2|NC_009617.1_5557721_5559263_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|422aa|down_3|NC_009617.1_5559493_5560759_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|434aa|down_4|NC_009617.1_5560923_5562225_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|576aa|down_5|NC_009617.1_5562692_5564420_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|86aa|down_6|NC_009617.1_5564653_5564911_+	NA	NA|74aa|down_7|NC_009617.1_5564931_5565153_+	NA	NA|84aa|down_8|NC_009617.1_5565251_5565503_+	NA	NA|48aa|down_9|NC_009617.1_5565548_5565692_+	NA
