assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000307125.1_ASM30712v1	NC_018648	Clostridium botulinum B str. Eklund 17B (NRP), complete genome	1	592472-592577	1	CRISPRCasFinder	no		csx1,cas3,csa3,DEDDh,DinG,RT,WYL	Orphan	AAATTAACTAAATGAAAATTAAAT	24	0	0	NA	NA	NA	1	1	Orphan	csx1,cas3,csa3,DEDDh,DinG,RT,WYL	NA|235aa|up_5|NC_018648.1_588001_588706_+,NA|58aa|up_1|NC_018648.1_591687_591861_-,NA|101aa|down_5|NC_018648.1_594559_594862_+,NA|214aa|down_6|NC_018648.1_596526_597168_+,NA|159aa|down_8|NC_018648.1_598180_598657_-,NA|81aa|down_9|NC_018648.1_598921_599164_+	NA|432aa|up_9|NC_018648.1_583432_584728_+	COG1316, LytR, Transcriptional regulator [Transcription]	NA|299aa|up_8|NC_018648.1_584752_585649_+	COG0564, RluA, Pseudouridylate synthases, 23S RNA-specific [Translation, ribosomal structure and biogenesis]	NA|440aa|up_7|NC_018648.1_585662_586982_-	COG1686, DacC, D-alanyl-D-alanine carboxypeptidase [Cell envelope biogenesis, outer membrane]	NA|207aa|up_6|NC_018648.1_587198_587819_+	TIGR01259, ComE_operon_protein_1, comEA protein	NA|235aa|up_5|NC_018648.1_588001_588706_+	NA	NA|126aa|up_4|NC_018648.1_588731_589109_+	pfam06271, RDD, RDD family	NA|451aa|up_3|NC_018648.1_589125_590478_+	COG2265, TrmA, SAM-dependent methyltransferases related to tRNA (uracil-5-)-methyltransferase [Translation, ribosomal structure and biogenesis]	NA|386aa|up_2|NC_018648.1_590546_591704_-	cd01189, INT_ICEBs1_C_like, C-terminal catalytic domain of integrases from bacterial phages and conjugate transposons	NA|58aa|up_1|NC_018648.1_591687_591861_-	NA	NA|125aa|up_0|NC_018648.1_592045_592420_-	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|63aa|down_0|NC_018648.1_592619_592808_+	COG1476, COG1476, Predicted transcriptional regulators [Transcription]	NA|70aa|down_1|NC_018648.1_592859_593069_+	smart00530, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|74aa|down_2|NC_018648.1_593085_593307_+	pfam12728, HTH_17, Helix-turn-helix domain	NA|211aa|down_3|NC_018648.1_593384_594017_+	pfam09681, Phage_rep_org_N, N-terminal phage replisome organizer (Phage_rep_org_N)	NA|96aa|down_4|NC_018648.1_594089_594377_+	TIGR01446, replication_protein, DnaD and phage-associated domain	NA|101aa|down_5|NC_018648.1_594559_594862_+	NA	NA|214aa|down_6|NC_018648.1_596526_597168_+	NA	NA|67aa|down_7|NC_018648.1_597539_597740_-	pfam12841, YvrJ, YvrJ protein family	NA|159aa|down_8|NC_018648.1_598180_598657_-	NA	NA|81aa|down_9|NC_018648.1_598921_599164_+	NA
GCF_000307125.1_ASM30712v1	NC_018648	Clostridium botulinum B str. Eklund 17B (NRP), complete genome	2	973905-974004	2	CRISPRCasFinder	no		csx1,cas3,csa3,DEDDh,DinG,RT,WYL	Orphan	TTATAATTAATTACAATAAATTATAAT	27	0	0	NA	NA	NA	1	1	Orphan	csx1,cas3,csa3,DEDDh,DinG,RT,WYL	NA|111aa|up_8|NC_018648.1_969383_969716_+,NA|52aa|up_7|NC_018648.1_969715_969871_+,NA|184aa|up_6|NC_018648.1_970127_970679_+,NA|216aa|up_5|NC_018648.1_970846_971494_+,NA|52aa|up_4|NC_018648.1_971480_971636_-,NA|59aa|up_2|NC_018648.1_972016_972193_+,NA|134aa|up_0|NC_018648.1_973230_973632_+,NA|346aa|down_3|NC_018648.1_977329_978367_+	NA|484aa|up_9|NC_018648.1_967929_969381_+	COG1196, Smc, Chromosome segregation ATPases [Cell division and chromosome partitioning]	NA|111aa|up_8|NC_018648.1_969383_969716_+	NA	NA|52aa|up_7|NC_018648.1_969715_969871_+	NA	NA|184aa|up_6|NC_018648.1_970127_970679_+	NA	NA|216aa|up_5|NC_018648.1_970846_971494_+	NA	NA|52aa|up_4|NC_018648.1_971480_971636_-	NA	NA|71aa|up_3|NC_018648.1_971790_972003_+	pfam10779, XhlA, Haemolysin XhlA	NA|59aa|up_2|NC_018648.1_972016_972193_+	NA	NA|267aa|up_1|NC_018648.1_972238_973039_+	cd06525, GH25_Lyc-like, Lyc muramidase is an autolytic lysozyme (autolysin) from Clostridium acetobutylicum encoded by the lyc gene	NA|134aa|up_0|NC_018648.1_973230_973632_+	NA	NA|67aa|down_0|NC_018648.1_974881_975082_+	pfam10960, Holin_BhlA, BhlA holin family	NA|189aa|down_1|NC_018648.1_975391_975958_-	COG1670, RimL, Acetyltransferases, including N-acetylases of ribosomal proteins [Translation, ribosomal structure and biogenesis]	NA|348aa|down_2|NC_018648.1_976267_977311_+	pfam09992, NAGPA, Phosphodiester glycosidase	NA|346aa|down_3|NC_018648.1_977329_978367_+	NA	NA|370aa|down_4|NC_018648.1_978519_979629_+	PRK11650, ugpC, sn-glycerol-3-phosphate ABC transporter ATP-binding protein UgpC	NA|314aa|down_5|NC_018648.1_979650_980592_+	COG2508, COG2508, Regulator of polyketide synthase expression [Signal transduction mechanisms / Secondary metabolites biosynthesis, transport, and catabolism]	NA|340aa|down_6|NC_018648.1_980753_981773_+	COG1609, PurR, Transcriptional regulators [Transcription]	NA|496aa|down_7|NC_018648.1_981920_983408_+	PRK14508, PRK14508, 4-alpha-glucanotransferase; Provisional	NA|787aa|down_8|NC_018648.1_983407_985768_+	cd04300, GT35_Glycogen_Phosphorylase, glycogen phosphorylase and similar proteins	NA|580aa|down_9|NC_018648.1_986284_988024_+	pfam03814, KdpA, Potassium-transporting ATPase A subunit
GCF_000307125.1_ASM30712v1	NC_018648	Clostridium botulinum B str. Eklund 17B (NRP), complete genome	3	2143741-2144745	3,1,1	CRISPRCasFinder,CRT,PILER-CR	no		csx1,cas3,csa3,DEDDh,DinG,RT,WYL	Orphan	ATTTAAATACATCTCATGTTAAGGTTAATC,ATTTAAATACATCTCATGTTAAGGTTAATC,TTAAATACATCTCATGTTAAGGTTAATC	30,30,28	1	1	2143835-2143870	NC_018648.1_1998000-1998035	II-B:II-B:II-B	15,15,15	15	Orphan	csx1,cas3,csa3,DEDDh,DinG,RT,WYL	NA,NA	NA|139aa|up_9|NC_018648.1_2133597_2134014_-	PRK05568, PRK05568, flavodoxin; Provisional	NA|487aa|up_8|NC_018648.1_2134105_2135566_-	cd07082, ALDH_F11_NP-GAPDH, NADP+-dependent non-phosphorylating glyceraldehyde 3-phosphate dehydrogenase and ALDH family 11	NA|257aa|up_7|NC_018648.1_2135617_2136388_-	cd06184, flavohem_like_fad_nad_binding, FAD_NAD(P)H binding domain of flavohemoglobin	NA|411aa|up_6|NC_018648.1_2136880_2138113_+	COG0426, FpaA, Uncharacterized flavoproteins [Energy production and conversion]	NA|111aa|up_5|NC_018648.1_2138385_2138718_+	pfam13751, DDE_Tnp_1_6, Transposase DDE domain	NA|54aa|up_4|NC_018648.1_2138760_2138922_-	pfam00301, Rubredoxin, Rubredoxin	NA|78aa|up_3|NC_018648.1_2139119_2139353_-	COG4309, COG4309, Uncharacterized conserved protein [Function unknown]	NA|568aa|up_2|NC_018648.1_2139715_2141419_-	PRK05290, PRK05290, hybrid cluster protein; Provisional	NA|181aa|up_1|NC_018648.1_2141635_2142178_-	PRK14879, PRK14879, Kae1-associated kinase Bud32	NA|425aa|up_0|NC_018648.1_2142315_2143590_-	cd07563, Peptidase_S41_IRBP, Interphotoreceptor retinoid-binding protein; serine protease family S41	NA|264aa|down_0|NC_018648.1_2146548_2147340_-	COG2382, Fes, Enterochelin esterase and related enzymes [Inorganic ion transport and metabolism]	NA|290aa|down_1|NC_018648.1_2147582_2148452_+	COG2207, AraC, AraC-type DNA-binding domain-containing proteins [Transcription]	NA|243aa|down_2|NC_018648.1_2148648_2149377_+	pfam05857, TraX, TraX protein	NA|404aa|down_3|NC_018648.1_2149617_2150829_-	cd17335, MFS_MFSD6, Major facilitator superfamily domain-containing protein 6	NA|297aa|down_4|NC_018648.1_2150933_2151824_-	COG1940, NagC, Transcriptional regulator/sugar kinase [Transcription / Carbohydrate transport and metabolism]	NA|312aa|down_5|NC_018648.1_2151834_2152770_-	COG1482, ManA, Phosphomannose isomerase [Carbohydrate transport and metabolism]	NA|534aa|down_6|NC_018648.1_2152947_2154549_-	cd11333, AmyAc_SI_OligoGlu_DGase, Alpha amylase catalytic domain found in Sucrose isomerases, oligo-1,6-glucosidase (also called isomaltase; sucrase-isomaltase; alpha-limit dextrinase), dextran glucosidase (also called glucan 1,6-alpha-glucosidase), and related proteins	NA|306aa|down_7|NC_018648.1_2154563_2155481_-	pfam08950, DUF1861, Protein of unknown function (DUF1861)	NA|354aa|down_8|NC_018648.1_2155494_2156556_-	cd19974, PBP1_LacI-like, ligand-binding domain of uncharacterized DNA-binding regulatory proteins that are members of the LacI-GalR family of bacterial transcription repressors	NA|363aa|down_9|NC_018648.1_2156624_2157713_-	cd18612, GH130_Lin0857-like, Glycoside hydrolase family 130 such as Listeria innocua beta-1,2-mannobiose phosphorylase
GCF_000307125.1_ASM30712v1	NC_018648	Clostridium botulinum B str. Eklund 17B (NRP), complete genome	4	3372795-3372971	2	PILER-CR	no		csx1,cas3,csa3,DEDDh,DinG,RT,WYL	Orphan	CTCCTGATGCATTAGTGTAGTACCAAGTTCCATTATCATTAA	42	0	0	NA	NA	NA	2	2	Orphan	csx1,cas3,csa3,DEDDh,DinG,RT,WYL	NA|184aa|up_7|NC_018648.1_3360930_3361482_-,NA	NA|532aa|up_9|NC_018648.1_3354601_3356197_-	PRK00741, prfC, peptide chain release factor 3; Provisional	NA|1401aa|up_8|NC_018648.1_3356631_3360834_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|184aa|up_7|NC_018648.1_3360930_3361482_-	NA	NA|696aa|up_6|NC_018648.1_3361774_3363862_-	cd01949, GGDEF, Diguanylate-cyclase (DGC) or GGDEF domain	NA|478aa|up_5|NC_018648.1_3363905_3365339_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|410aa|up_4|NC_018648.1_3365994_3367224_-	pfam12733, Cadherin-like, Cadherin-like beta sandwich domain	NA|449aa|up_3|NC_018648.1_3367373_3368720_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|304aa|up_2|NC_018648.1_3368943_3369855_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|495aa|up_1|NC_018648.1_3370141_3371626_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|106aa|up_0|NC_018648.1_3372109_3372427_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|745aa|down_0|NC_018648.1_3374954_3377189_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|560aa|down_1|NC_018648.1_3377448_3379128_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|763aa|down_2|NC_018648.1_3379546_3381835_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|593aa|down_3|NC_018648.1_3382311_3384090_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|492aa|down_4|NC_018648.1_3384559_3386035_+	cd10923, CE4_COG5298, Putative NodB-like catalytic domain of uncharacterized proteins found in bacteria	NA|680aa|down_5|NC_018648.1_3386281_3388321_-	cd08662, M13, Peptidase family M13 includes neprilysin and endothelin-converting enzyme I	NA|392aa|down_6|NC_018648.1_3388706_3389882_-	pfam09681, Phage_rep_org_N, N-terminal phage replisome organizer (Phage_rep_org_N)	NA|283aa|down_7|NC_018648.1_3390101_3390950_-	cd02525, Succinoglycan_BP_ExoA, ExoA is involved in the biosynthesis of succinoglycan	NA|112aa|down_8|NC_018648.1_3391196_3391532_-	TIGR03340, phn_DUF6, phosphonate utilization associated putative membrane protein	NA|114aa|down_9|NC_018648.1_3391524_3391866_-	PRK15051, PRK15051, 4-amino-4-deoxy-L-arabinose-phosphoundecaprenol flippase subunit ArnE; Provisional
GCF_000307125.1_ASM30712v1	NC_018653	Clostridium botulinum B str. Eklund 17B (NRP) plasmid p17BNRP, complete sequence	1	12964-13339	1	CRISPRCasFinder	no			Orphan	GGAAAAATGCTTAATGGTTGGATTAATGATAATGGCAACTGGTATT	46	0	0	NA	NA	NA	3	3	Orphan	csx1,cas3,csa3,DEDDh,DinG,RT,WYL	NA|120aa|up_7|NC_018653.1_5319_5679_+,NA|74aa|up_6|NC_018653.1_5722_5944_-,NA|121aa|up_2|NC_018653.1_7635_7998_+,NA|63aa|up_1|NC_018653.1_8032_8221_+,NA|171aa|up_0|NC_018653.1_8317_8830_+,NA|63aa|down_1|NC_018653.1_13862_14051_+,NA|54aa|down_2|NC_018653.1_14073_14235_+,NA|79aa|down_3|NC_018653.1_14247_14484_+,NA|712aa|down_5|NC_018653.1_16771_18907_+,NA|213aa|down_7|NC_018653.1_19294_19933_+,NA|227aa|down_9|NC_018653.1_21903_22584_+	NA|257aa|up_9|NC_018653.1_3416_4187_+	pfam01841, Transglut_core, Transglutaminase-like superfamily	NA|298aa|up_8|NC_018653.1_4433_5327_+	cd10227, ParM_like, Plasmid segregation protein ParM and similar proteins	NA|120aa|up_7|NC_018653.1_5319_5679_+	NA	NA|74aa|up_6|NC_018653.1_5722_5944_-	NA	NA|85aa|up_5|NC_018653.1_6149_6404_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|236aa|up_4|NC_018653.1_6458_7166_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|79aa|up_3|NC_018653.1_7326_7563_+	smart00530, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|121aa|up_2|NC_018653.1_7635_7998_+	NA	NA|63aa|up_1|NC_018653.1_8032_8221_+	NA	NA|171aa|up_0|NC_018653.1_8317_8830_+	NA	NA|110aa|down_0|NC_018653.1_13471_13801_+	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|63aa|down_1|NC_018653.1_13862_14051_+	NA	NA|54aa|down_2|NC_018653.1_14073_14235_+	NA	NA|79aa|down_3|NC_018653.1_14247_14484_+	NA	NA|740aa|down_4|NC_018653.1_14547_16767_+	COG3505, VirD4, Type IV secretory pathway, VirD4 components [Intracellular trafficking and secretion]	NA|712aa|down_5|NC_018653.1_16771_18907_+	NA	NA|92aa|down_6|NC_018653.1_18907_19183_+	pfam17332, pXO2-11, Uncharacterized protein pXO2-11	NA|213aa|down_7|NC_018653.1_19294_19933_+	NA	NA|638aa|down_8|NC_018653.1_19988_21902_+	TIGR02746, hypothetical_protein, type-IV secretion system protein TraC	NA|227aa|down_9|NC_018653.1_21903_22584_+	NA
GCF_000307125.1_ASM30712v1	NC_018653	Clostridium botulinum B str. Eklund 17B (NRP) plasmid p17BNRP, complete sequence	2	27618-27744	2	CRISPRCasFinder	no			Orphan	ATGTAGATTTAAGAAATGCAAATTT	25	0	0	NA	NA	NA	2	2	Orphan	csx1,cas3,csa3,DEDDh,DinG,RT,WYL	NA|712aa|up_9|NC_018653.1_16771_18907_+,NA|213aa|up_7|NC_018653.1_19294_19933_+,NA|227aa|up_5|NC_018653.1_21903_22584_+,NA|92aa|up_2|NC_018653.1_24927_25203_+,NA|172aa|down_0|NC_018653.1_27983_28499_+,NA|117aa|down_1|NC_018653.1_28521_28872_+,NA|137aa|down_3|NC_018653.1_29437_29848_+,NA|53aa|down_4|NC_018653.1_29928_30087_+,NA|104aa|down_5|NC_018653.1_30102_30414_+,NA|105aa|down_6|NC_018653.1_30706_31021_+,NA|79aa|down_7|NC_018653.1_31579_31816_+,NA|72aa|down_8|NC_018653.1_31912_32128_+,NA|96aa|down_9|NC_018653.1_32201_32489_+	NA|712aa|up_9|NC_018653.1_16771_18907_+	NA	NA|92aa|up_8|NC_018653.1_18907_19183_+	pfam17332, pXO2-11, Uncharacterized protein pXO2-11	NA|213aa|up_7|NC_018653.1_19294_19933_+	NA	NA|638aa|up_6|NC_018653.1_19988_21902_+	TIGR02746, hypothetical_protein, type-IV secretion system protein TraC	NA|227aa|up_5|NC_018653.1_21903_22584_+	NA	NA|390aa|up_4|NC_018653.1_22644_23814_+	pfam00877, NLPC_P60, NlpC/P60 family	NA|271aa|up_3|NC_018653.1_23832_24645_+	TIGR02169, chromosome_segregation_protein_related_ptotein, chromosome segregation protein SMC, primarily archaeal type	NA|92aa|up_2|NC_018653.1_24927_25203_+	NA	NA|137aa|up_1|NC_018653.1_25208_25619_+	cd19586, serpin_mimivirus, serpin-like proteins found in mimiviruses	NA|380aa|up_0|NC_018653.1_25632_26772_+	pfam18555, MobL, MobL relaxases	NA|172aa|down_0|NC_018653.1_27983_28499_+	NA	NA|117aa|down_1|NC_018653.1_28521_28872_+	NA	NA|117aa|down_2|NC_018653.1_28885_29236_+	pfam00436, SSB, Single-strand binding protein family	NA|137aa|down_3|NC_018653.1_29437_29848_+	NA	NA|53aa|down_4|NC_018653.1_29928_30087_+	NA	NA|104aa|down_5|NC_018653.1_30102_30414_+	NA	NA|105aa|down_6|NC_018653.1_30706_31021_+	NA	NA|79aa|down_7|NC_018653.1_31579_31816_+	NA	NA|72aa|down_8|NC_018653.1_31912_32128_+	NA	NA|96aa|down_9|NC_018653.1_32201_32489_+	NA
