assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001548175.1_ASM154817v1	NZ_AP014864	Bacillus thuringiensis serovar tolworthi strain Pasteur Institute Standard strain	1	1149125-1149232	1	CRISPRCasFinder	no		cas3,cas14k,DEDDh,csa3,RT,WYL,DinG,c2c9_V-U4	Orphan	AAGTTGTGATAGATATATTTGAAAAA	26	1	1	1149151-1149206	NZ_AP014864.1_1149110-1149165	NA	1	1	Orphan	cas3,cas14k,DEDDh,csa3,RT,WYL,DinG,c2c9_V-U4,cas14j,cas7,cas8c,cas5	NA|59aa|up_3|NZ_AP014864.1_1144050_1144227_+,NA|63aa|down_7|NZ_AP014864.1_1157641_1157830_+,NA|71aa|down_9|NZ_AP014864.1_1158023_1158236_-	NA|755aa|up_9|NZ_AP014864.1_1134718_1136983_+	PRK13024, PRK13024, bifunctional preprotein translocase subunit SecD/SecF; Reviewed	NA|298aa|up_8|NZ_AP014864.1_1137139_1138033_+	COG0053, MMT1, Predicted Co/Zn/Cd cation transporters [Inorganic ion transport and metabolism]	NA|780aa|up_7|NZ_AP014864.1_1138134_1140474_+	TIGR00644, recJ, single-stranded-DNA-specific exonuclease RecJ	NA|171aa|up_6|NZ_AP014864.1_1140521_1141034_+	PRK02304, PRK02304, adenine phosphoribosyltransferase; Provisional	NA|728aa|up_5|NZ_AP014864.1_1141244_1143428_+	COG0317, SpoT, Guanosine polyphosphate pyrophosphohydrolases/synthetases [Signal transduction mechanisms / Transcription]	NA|147aa|up_4|NZ_AP014864.1_1143444_1143885_+	PRK05273, PRK05273, D-tyrosyl-tRNA(Tyr) deacylase; Provisional	NA|59aa|up_3|NZ_AP014864.1_1144050_1144227_+	NA	NA|424aa|up_2|NZ_AP014864.1_1144581_1145853_+	PRK00037, hisS, histidyl-tRNA synthetase; Reviewed	NA|592aa|up_1|NZ_AP014864.1_1145865_1147641_+	PRK00476, aspS, aspartyl-tRNA synthetase; Validated	NA|256aa|up_0|NZ_AP014864.1_1147982_1148750_+	COG1179, COG1179, Dinucleotide-utilizing enzymes involved in molybdopterin and thiamine biosynthesis family 1 [Coenzyme metabolism]	NA|214aa|down_0|NZ_AP014864.1_1149324_1149966_-	TIGR02894, DNA_bind_RsfA, transcription factor, RsfA family	NA|429aa|down_1|NZ_AP014864.1_1150003_1151290_-	PRK13342, PRK13342, recombination factor protein RarA; Reviewed	NA|139aa|down_2|NZ_AP014864.1_1151583_1152000_+	COG1959, COG1959, Predicted transcriptional regulator [Transcription]	NA|382aa|down_3|NZ_AP014864.1_1152035_1153181_+	COG1104, NifS, Cysteine sulfinate desulfinase/cysteine desulfurase and related enzymes [Amino acid transport and metabolism]	NA|372aa|down_4|NZ_AP014864.1_1153197_1154313_+	PRK00143, mnmA, tRNA-specific 2-thiouridylase MnmA; Reviewed	NA|220aa|down_5|NZ_AP014864.1_1154422_1155082_+	sd00006, TPR, Tetratricopeptide repeat	NA|779aa|down_6|NZ_AP014864.1_1155177_1157514_+	TIGR01448, recD_rel, helicase, putative, RecD/TraA family	NA|63aa|down_7|NZ_AP014864.1_1157641_1157830_+	NA	NA|43aa|down_8|NZ_AP014864.1_1157848_1157977_+	pfam13056, DUF3918, Protein of unknown function (DUF3918)	NA|71aa|down_9|NZ_AP014864.1_1158023_1158236_-	NA
GCF_001548175.1_ASM154817v1	NZ_AP014864	Bacillus thuringiensis serovar tolworthi strain Pasteur Institute Standard strain	2	2250361-2250471	2	CRISPRCasFinder	no		cas3,cas14k,DEDDh,csa3,RT,WYL,DinG,c2c9_V-U4	Orphan	GTAGGACCAGTTATTCCGATTCCGGTA	27	0	0	NA	NA	NA	1	1	Orphan	cas3,cas14k,DEDDh,csa3,RT,WYL,DinG,c2c9_V-U4,cas14j,cas7,cas8c,cas5	NA,NA	NA|386aa|up_9|NZ_AP014864.1_2237392_2238550_+	pfam04371, PAD_porph, Porphyromonas-type peptidyl-arginine deiminase	NA|139aa|up_8|NZ_AP014864.1_2238713_2239130_+	PRK02833, PRK02833, phosphate-starvation-inducible protein PsiE; Provisional	NA|311aa|up_7|NZ_AP014864.1_2239311_2240244_+	COG3781, COG3781, Predicted membrane protein [Function unknown]	NA|326aa|up_6|NZ_AP014864.1_2240473_2241451_+	pfam04371, PAD_porph, Porphyromonas-type peptidyl-arginine deiminase	NA|274aa|up_5|NZ_AP014864.1_2241493_2242315_+	cd01107, HTH_BmrR, Helix-Turn-Helix DNA binding domain of the BmrR transcription regulator	NA|581aa|up_4|NZ_AP014864.1_2242396_2244139_+	cd01300, YtcJ_like, YtcJ_like metal dependent amidohydrolases	NA|349aa|up_3|NZ_AP014864.1_2244246_2245293_+	pfam04371, PAD_porph, Porphyromonas-type peptidyl-arginine deiminase	NA|596aa|up_2|NZ_AP014864.1_2245339_2247127_-	cd09608, M3B_PepF, Peptidase family M3B, oligopeptidase F (PepF)	NA|264aa|up_1|NZ_AP014864.1_2247244_2248036_-	pfam00797, Acetyltransf_2, N-acetyltransferase	NA|514aa|up_0|NZ_AP014864.1_2248239_2249781_+	PRK09441, PRK09441, cytoplasmic alpha-amylase; Reviewed	NA|634aa|down_0|NZ_AP014864.1_2251254_2253156_+	PRK00409, PRK00409, recombination and DNA strand exchange inhibitor protein; Reviewed	NA|175aa|down_1|NZ_AP014864.1_2253162_2253687_+	COG3153, COG3153, Predicted acetyltransferase [General function prediction only]	NA|237aa|down_2|NZ_AP014864.1_2253847_2254558_+	pfam00300, His_Phos_1, Histidine phosphatase superfamily (branch 1)	NA|322aa|down_3|NZ_AP014864.1_2254623_2255589_-	cd05286, QOR2, Quinone oxidoreductase (QOR)	NA|298aa|down_4|NZ_AP014864.1_2255712_2256606_+	COG0583, LysR, Transcriptional regulator [Transcription]	NA|171aa|down_5|NZ_AP014864.1_2256897_2257410_+	pfam10901, DUF2690, Protein of unknown function (DUF2690)	NA|159aa|down_6|NZ_AP014864.1_2257427_2257904_+	pfam10901, DUF2690, Protein of unknown function (DUF2690)	NA|179aa|down_7|NZ_AP014864.1_2258016_2258553_-	COG1670, RimL, Acetyltransferases, including N-acetylases of ribosomal proteins [Translation, ribosomal structure and biogenesis]	NA|163aa|down_8|NZ_AP014864.1_2258780_2259269_-	pfam05163, DinB, DinB family	NA|152aa|down_9|NZ_AP014864.1_2259461_2259917_+	pfam12867, DinB_2, DinB superfamily
GCF_001548175.1_ASM154817v1	NZ_AP014864	Bacillus thuringiensis serovar tolworthi strain Pasteur Institute Standard strain	3	2846579-2846744	1	PILER-CR	no	RT	cas3,cas14k,DEDDh,csa3,RT,WYL,DinG,c2c9_V-U4	Unclear	AGGAATGAATATTCATTCCGAAACAAAAGTAAA	33	0	0	NA	NA	NA	2	2	Orphan	cas3,cas14k,DEDDh,csa3,RT,WYL,DinG,c2c9_V-U4,cas14j,cas7,cas8c,cas5	NA,NA|137aa|down_1|NZ_AP014864.1_2849252_2849663_+,NA|137aa|down_4|NZ_AP014864.1_2856125_2856536_+	NA|177aa|up_9|NZ_AP014864.1_2832818_2833349_+	cd01014, nicotinamidase_related, Nicotinamidase_ related amidohydrolases	NA|146aa|up_8|NZ_AP014864.1_2833499_2833937_-	pfam10710, DUF2512, Protein of unknown function (DUF2512)	NA|1161aa|up_7|NZ_AP014864.1_2834118_2837601_+	pfam13212, DUF4020, Domain of unknown function (DUF4020)	NA|359aa|up_6|NZ_AP014864.1_2838428_2839505_+	PRK12595, PRK12595, bifunctional 3-deoxy-7-phosphoheptulonate synthase/chorismate mutase; Reviewed	NA|391aa|up_5|NZ_AP014864.1_2839787_2840960_+	PRK12463, PRK12463, chorismate synthase; Reviewed	NA|367aa|up_4|NZ_AP014864.1_2840978_2842079_+	PRK01533, PRK01533, histidinol-phosphate aminotransferase; Validated	NA|367aa|up_3|NZ_AP014864.1_2842071_2843172_+	PRK06545, PRK06545, prephenate dehydrogenase; Validated	NA|430aa|up_2|NZ_AP014864.1_2843189_2844479_+	PRK02427, PRK02427, 3-phosphoshikimate 1-carboxyvinyltransferase; Provisional	NA|386aa|up_1|NZ_AP014864.1_2844604_2845762_+	COG4552, Eis, Predicted acetyltransferase involved in intracellular survival and related acetyltransferases [General function prediction only]	NA|189aa|up_0|NZ_AP014864.1_2845991_2846558_+	pfam16295, TetR_C_10, Tetracycline repressor, C-terminal all-alpha domain	NA|345aa|down_0|NZ_AP014864.1_2847795_2848830_+	PHA03169, PHA03169, hypothetical protein; Provisional	NA|137aa|down_1|NZ_AP014864.1_2849252_2849663_+	NA	RT|436aa|down_2|NZ_AP014864.1_2851374_2852682_+	TIGR04416, hypothetical_protein, group II intron reverse transcriptase/maturase	NA|479aa|down_3|NZ_AP014864.1_2853478_2854915_-	pfam01609, DDE_Tnp_1, Transposase DDE domain	NA|137aa|down_4|NZ_AP014864.1_2856125_2856536_+	NA	NA|477aa|down_5|NZ_AP014864.1_2856684_2858115_+	pfam01609, DDE_Tnp_1, Transposase DDE domain	NA|542aa|down_6|NZ_AP014864.1_2860009_2861635_+	PRK15064, PRK15064, ABC transporter ATP-binding protein; Provisional	NA|658aa|down_7|NZ_AP014864.1_2862162_2864136_+	COG1368, MdoB, Phosphoglycerol transferase and related proteins, alkaline phosphatase superfamily [Cell envelope biogenesis, outer membrane]	NA|225aa|down_8|NZ_AP014864.1_2864192_2864867_-	TIGR03717, R_switched_YjbE, integral membrane protein, YjbE family	NA|221aa|down_9|NZ_AP014864.1_2864977_2865640_-	pfam12952, DUF3841, Domain of unknown function (DUF3841)
GCF_001548175.1_ASM154817v1	NZ_AP014866	Bacillus thuringiensis serovar tolworthi strain Pasteur Institute Standard strain plasmid pKK2, complete sequence	1	6398-7021	1,1,1	CRISPRCasFinder,CRT,PILER-CR	no	cas7,cas8c,cas5,cas3	cas7,cas8c,cas5,cas3,RT,csa3,cas14j	Type I-U, Type I-U?,Type I-C	ATTTCAATCCACGCACCTATATGAGGTGCGAC,ATTTCAATCCACGCACCTATAT,ATTTCAATCCACGCACCTATATGAGGTGCGAC	32,22,32	0	0	NA	NA	I-C:NA:I-C	9,9,4	9	TypeI-U,TypeI-U?,TypeI-C	cas3,cas14k,DEDDh,csa3,RT,WYL,DinG,c2c9_V-U4,cas14j,cas7,cas8c,cas5	NA,NA|306aa|down_1|NZ_AP014866.1_9556_10474_-,NA|131aa|down_3|NZ_AP014866.1_11363_11756_-,NA|270aa|down_4|NZ_AP014866.1_13553_14363_+,NA|575aa|down_5|NZ_AP014866.1_14744_16469_-,NA|490aa|down_6|NZ_AP014866.1_16504_17974_-,NA|570aa|down_7|NZ_AP014866.1_18660_20370_+,NA|48aa|down_8|NZ_AP014866.1_21312_21456_+	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	cas7|287aa|up_3|NZ_AP014866.1_207_1068_-	COG3649, COG3649, CRISPR system related protein [Defense mechanisms]	cas8c|640aa|up_2|NZ_AP014866.1_1070_2990_-	cd09757, Cas8c_I-C, CRISPR/Cas system-associated protein Cas8c	cas5|240aa|up_1|NZ_AP014866.1_2990_3710_-	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas3|810aa|up_0|NZ_AP014866.1_3884_6314_-	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	NA|601aa|down_0|NZ_AP014866.1_7344_9147_-	sd00006, TPR, Tetratricopeptide repeat	NA|306aa|down_1|NZ_AP014866.1_9556_10474_-	NA	NA|261aa|down_2|NZ_AP014866.1_10488_11271_-	pfam06114, Peptidase_M78, IrrE N-terminal-like domain	NA|131aa|down_3|NZ_AP014866.1_11363_11756_-	NA	NA|270aa|down_4|NZ_AP014866.1_13553_14363_+	NA	NA|575aa|down_5|NZ_AP014866.1_14744_16469_-	NA	NA|490aa|down_6|NZ_AP014866.1_16504_17974_-	NA	NA|570aa|down_7|NZ_AP014866.1_18660_20370_+	NA	NA|48aa|down_8|NZ_AP014866.1_21312_21456_+	NA	NA|316aa|down_9|NZ_AP014866.1_21596_22544_+	cd00397, DNA_BRE_C, DNA breaking-rejoining enzymes, C-terminal catalytic domain
GCF_001548175.1_ASM154817v1	NZ_AP014866	Bacillus thuringiensis serovar tolworthi strain Pasteur Institute Standard strain plasmid pKK2, complete sequence	2	292316-292614	2	CRT	no	RT	cas7,cas8c,cas5,cas3,RT,csa3,cas14j	Unclear	ATATTTCAATCCACGCACCTATATAAGGTGCGACTT	36	0	0	NA	NA	I-C	4	4	Orphan	cas3,cas14k,DEDDh,csa3,RT,WYL,DinG,c2c9_V-U4,cas14j,cas7,cas8c,cas5	NA|193aa|up_9|NZ_AP014866.1_279084_279663_+,NA|212aa|up_8|NZ_AP014866.1_279713_280349_-,NA|210aa|up_7|NZ_AP014866.1_280348_280978_-,NA|238aa|up_6|NZ_AP014866.1_281314_282028_-,NA|60aa|up_3|NZ_AP014866.1_288316_288496_-,NA|46aa|up_1|NZ_AP014866.1_289707_289845_-,NA|142aa|up_0|NZ_AP014866.1_289866_290292_-,NA	NA|193aa|up_9|NZ_AP014866.1_279084_279663_+	NA	NA|212aa|up_8|NZ_AP014866.1_279713_280349_-	NA	NA|210aa|up_7|NZ_AP014866.1_280348_280978_-	NA	NA|238aa|up_6|NZ_AP014866.1_281314_282028_-	NA	NA|802aa|up_5|NZ_AP014866.1_282044_284450_-	COG0553, HepA, Superfamily II DNA/RNA helicases, SNF2 family [Transcription / DNA replication, recombination, and repair]	RT|622aa|up_4|NZ_AP014866.1_284724_286590_-	TIGR04416, hypothetical_protein, group II intron reverse transcriptase/maturase	NA|60aa|up_3|NZ_AP014866.1_288316_288496_-	NA	NA|364aa|up_2|NZ_AP014866.1_288511_289603_-	TIGR02987, m6_adenine_and_m5_cytosine_DNA_methyltransferase, type II restriction m6 adenine DNA methyltransferase, Alw26I/Eco31I/Esp3I family	NA|46aa|up_1|NZ_AP014866.1_289707_289845_-	NA	NA|142aa|up_0|NZ_AP014866.1_289866_290292_-	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA
GCF_001548175.1_ASM154817v1	NZ_AP014865	Bacillus thuringiensis serovar tolworthi strain Pasteur Institute Standard strain plasmid pKK1, complete sequence	1	384578-384680	1	CRISPRCasFinder	no		csa3,cas14j,cas3,RT	Orphan	AACTTGCAACAGGTTGCTCTTTCT	24	1	2	384602-384656|384602-384656	NZ_AP014865.1_384762-384816|NZ_AP014865.1_384922-384976	NA	1	1	Orphan	cas3,cas14k,DEDDh,csa3,RT,WYL,DinG,c2c9_V-U4,cas14j,cas7,cas8c,cas5	NA|137aa|up_6|NZ_AP014865.1_377280_377691_-,NA|570aa|down_0|NZ_AP014865.1_386085_387795_+,NA|49aa|down_1|NZ_AP014865.1_388737_388884_+,NA|98aa|down_6|NZ_AP014865.1_394711_395005_-,NA|570aa|down_7|NZ_AP014865.1_395936_397646_+,NA|91aa|down_9|NZ_AP014865.1_398952_399225_+	NA|72aa|up_9|NZ_AP014865.1_372969_373185_-	pfam00269, SASP, Small, acid-soluble spore proteins, alpha/beta type	NA|581aa|up_8|NZ_AP014865.1_373351_375094_-	cd11386, MCP_signal, Methyl-accepting chemotaxis protein (MCP), signaling domain	NA|160aa|up_7|NZ_AP014865.1_376082_376562_+	pfam02517, Abi, CAAX protease self-immunity	NA|137aa|up_6|NZ_AP014865.1_377280_377691_-	NA	NA|138aa|up_5|NZ_AP014865.1_378107_378521_-	pfam01934, DUF86, Protein of unknown function DUF86	NA|136aa|up_4|NZ_AP014865.1_378510_378918_-	pfam18765, Polbeta, Polymerase beta, Nucleotidyltransferase	NA|116aa|up_3|NZ_AP014865.1_379280_379628_-	pfam06486, DUF1093, Protein of unknown function (DUF1093)	NA|550aa|up_2|NZ_AP014865.1_379838_381488_-	cd04843, Peptidases_S8_11, Peptidase S8 family domain, uncharacterized subfamily 11	NA|156aa|up_1|NZ_AP014865.1_381842_382310_+	TIGR02894, DNA_bind_RsfA, transcription factor, RsfA family	NA|566aa|up_0|NZ_AP014865.1_382471_384169_-	pfam01418, HTH_6, Helix-turn-helix domain, rpiR family	NA|570aa|down_0|NZ_AP014865.1_386085_387795_+	NA	NA|49aa|down_1|NZ_AP014865.1_388737_388884_+	NA	NA|151aa|down_2|NZ_AP014865.1_390010_390463_-	pfam14567, SUKH_5, SMI1-KNR4 cell-wall	NA|107aa|down_3|NZ_AP014865.1_390467_390788_-	pfam14411, LHH, A nuclease of the HNH/ENDO VII superfamily with conserved LHH	NA|145aa|down_4|NZ_AP014865.1_391673_392108_-	pfam09346, SMI1_KNR4, SMI1 / KNR4 family (SUKH-1)	NA|565aa|down_5|NZ_AP014865.1_392256_393951_-	smart00530, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|98aa|down_6|NZ_AP014865.1_394711_395005_-	NA	NA|570aa|down_7|NZ_AP014865.1_395936_397646_+	NA	NA|41aa|down_8|NZ_AP014865.1_398702_398825_+	PRK10594, PRK10594, murein L,D-transpeptidase; Provisional	NA|91aa|down_9|NZ_AP014865.1_398952_399225_+	NA
