assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_007559025.1_ASM755902v1	NZ_CP041765	Tomitella sp. HY188 chromosome, complete genome	1	3557049-3557566	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	cas3,csa3,WYL,cas4,DEDDh,DinG,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	Type I-E	GTGCTCCCCGCGAACGCGGGGATGATCC,GTGCTCCCCGCGAACGCGGGGATGATCCG,GTGCTCCCCGCGAACGCGGGGATGATCC	28,29,28	0	0	NA	NA	I-E:I-E:I-E	7,8,8	8	TypeI-E	cas3,csa3,WYL,cas4,DEDDh,DinG,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	NA,NA|663aa|down_8|NZ_CP041765.1_3568393_3570382_-	NA|384aa|up_9|NZ_CP041765.1_3545715_3546867_+	cd01158, SCAD_SBCAD, Short chain acyl-CoA dehydrogenases and eukaryotic short/branched chain acyl-CoA dehydrogenases	NA|151aa|up_8|NZ_CP041765.1_3546952_3547405_+	pfam00990, GGDEF, Diguanylate cyclase, GGDEF domain	cas3|941aa|up_7|NZ_CP041765.1_3548007_3550830_+	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	cas8e|536aa|up_6|NZ_CP041765.1_3550819_3552427_+	pfam09481, CRISPR_Cse1, CRISPR-associated protein Cse1 (CRISPR_cse1)	cse2gr11|234aa|up_5|NZ_CP041765.1_3552423_3553125_+	pfam09485, CRISPR_Cse2, CRISPR-associated protein Cse2 (CRISPR_cse2)	cas7|380aa|up_4|NZ_CP041765.1_3553167_3554307_+	pfam09344, Cas_CT1975, CT1975-like protein	cas5|232aa|up_3|NZ_CP041765.1_3554303_3554999_+	cd09756, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|226aa|up_2|NZ_CP041765.1_3554998_3555676_+	pfam08798, CRISPR_assoc, CRISPR associated protein	cas1|324aa|up_1|NZ_CP041765.1_3555683_3556655_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|114aa|up_0|NZ_CP041765.1_3556648_3556990_+	pfam09707, Cas_Cas2CT1978, CRISPR-associated protein (Cas_Cas2CT1978)	NA|315aa|down_0|NZ_CP041765.1_3560023_3560968_-	pfam13828, DUF4190, Domain of unknown function (DUF4190)	NA|295aa|down_1|NZ_CP041765.1_3561137_3562022_-	pfam00582, Usp, Universal stress protein family	NA|261aa|down_2|NZ_CP041765.1_3562166_3562949_-	COG2258, COG2258, Uncharacterized protein conserved in bacteria [Function unknown]	NA|423aa|down_3|NZ_CP041765.1_3563049_3564318_-	pfam10011, DUF2254, Predicted membrane protein (DUF2254)	NA|129aa|down_4|NZ_CP041765.1_3564392_3564779_-	pfam09851, SHOCT, Short C-terminal domain	NA|143aa|down_5|NZ_CP041765.1_3564792_3565221_-	pfam06897, DUF1269, Protein of unknown function (DUF1269)	NA|402aa|down_6|NZ_CP041765.1_3565329_3566535_-	COG0628, yhhT, Predicted permease, member of the PurR regulon [General function prediction only]	NA|609aa|down_7|NZ_CP041765.1_3566570_3568397_-	cd06423, CESA_like, CESA_like is  the cellulose synthase superfamily	NA|663aa|down_8|NZ_CP041765.1_3568393_3570382_-	NA	NA|400aa|down_9|NZ_CP041765.1_3570374_3571574_-	cd05255, SQD1_like_SDR_e, UDP_sulfoquinovose_synthase (Arabidopsis thaliana SQD1 and related proteins), extended (e) SDRs
GCF_007559025.1_ASM755902v1	NZ_CP041765	Tomitella sp. HY188 chromosome, complete genome	2	3558646-3559944	2,2,2	CRT,CRISPRCasFinder,PILER-CR	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	cas3,csa3,WYL,cas4,DEDDh,DinG,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	Type I-E	CGAACGCGGGGATGATCC,GTGCTCCCCGCGAACGCGGGGATGATCCG,AGTGCTCCCCGCGAACGCGGGGATGATCC	18,29,29	0	0	NA	NA	NA:I-E:I-E	21,20,3	21	TypeI-E	cas3,csa3,WYL,cas4,DEDDh,DinG,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	NA,NA|663aa|down_8|NZ_CP041765.1_3568393_3570382_-	NA|384aa|up_9|NZ_CP041765.1_3545715_3546867_+	cd01158, SCAD_SBCAD, Short chain acyl-CoA dehydrogenases and eukaryotic short/branched chain acyl-CoA dehydrogenases	NA|151aa|up_8|NZ_CP041765.1_3546952_3547405_+	pfam00990, GGDEF, Diguanylate cyclase, GGDEF domain	cas3|941aa|up_7|NZ_CP041765.1_3548007_3550830_+	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	cas8e|536aa|up_6|NZ_CP041765.1_3550819_3552427_+	pfam09481, CRISPR_Cse1, CRISPR-associated protein Cse1 (CRISPR_cse1)	cse2gr11|234aa|up_5|NZ_CP041765.1_3552423_3553125_+	pfam09485, CRISPR_Cse2, CRISPR-associated protein Cse2 (CRISPR_cse2)	cas7|380aa|up_4|NZ_CP041765.1_3553167_3554307_+	pfam09344, Cas_CT1975, CT1975-like protein	cas5|232aa|up_3|NZ_CP041765.1_3554303_3554999_+	cd09756, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|226aa|up_2|NZ_CP041765.1_3554998_3555676_+	pfam08798, CRISPR_assoc, CRISPR associated protein	cas1|324aa|up_1|NZ_CP041765.1_3555683_3556655_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|114aa|up_0|NZ_CP041765.1_3556648_3556990_+	pfam09707, Cas_Cas2CT1978, CRISPR-associated protein (Cas_Cas2CT1978)	NA|315aa|down_0|NZ_CP041765.1_3560023_3560968_-	pfam13828, DUF4190, Domain of unknown function (DUF4190)	NA|295aa|down_1|NZ_CP041765.1_3561137_3562022_-	pfam00582, Usp, Universal stress protein family	NA|261aa|down_2|NZ_CP041765.1_3562166_3562949_-	COG2258, COG2258, Uncharacterized protein conserved in bacteria [Function unknown]	NA|423aa|down_3|NZ_CP041765.1_3563049_3564318_-	pfam10011, DUF2254, Predicted membrane protein (DUF2254)	NA|129aa|down_4|NZ_CP041765.1_3564392_3564779_-	pfam09851, SHOCT, Short C-terminal domain	NA|143aa|down_5|NZ_CP041765.1_3564792_3565221_-	pfam06897, DUF1269, Protein of unknown function (DUF1269)	NA|402aa|down_6|NZ_CP041765.1_3565329_3566535_-	COG0628, yhhT, Predicted permease, member of the PurR regulon [General function prediction only]	NA|609aa|down_7|NZ_CP041765.1_3566570_3568397_-	cd06423, CESA_like, CESA_like is  the cellulose synthase superfamily	NA|663aa|down_8|NZ_CP041765.1_3568393_3570382_-	NA	NA|400aa|down_9|NZ_CP041765.1_3570374_3571574_-	cd05255, SQD1_like_SDR_e, UDP_sulfoquinovose_synthase (Arabidopsis thaliana SQD1 and related proteins), extended (e) SDRs
GCF_007559025.1_ASM755902v1	NZ_CP041765	Tomitella sp. HY188 chromosome, complete genome	3	3809531-3809607	3	CRISPRCasFinder	no		cas3,csa3,WYL,cas4,DEDDh,DinG,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	Orphan	CGCGGGCGGTGACGGCGCGGCCGGCGGCG	29	1	33	3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578|3809560-3809578	NZ_CP041765.1_17604-17622|NZ_CP041765.1_162732-162750|NZ_CP041765.1_391653-391671|NZ_CP041765.1_865142-865160|NZ_CP041765.1_934984-935002|NZ_CP041765.1_1031498-1031516|NZ_CP041765.1_1664805-1664823|NZ_CP041765.1_1886421-1886439|NZ_CP041765.1_2101602-2101620|NZ_CP041765.1_2206604-2206622|NZ_CP041765.1_2249674-2249692|NZ_CP041765.1_2616933-2616951|NZ_CP041765.1_2750157-2750175|NZ_CP041765.1_3289125-3289143|NZ_CP041765.1_3564515-3564533|NZ_CP041765.1_293805-293787|NZ_CP041765.1_762830-762812|NZ_CP041765.1_767825-767807|NZ_CP041765.1_828327-828309|NZ_CP041765.1_983494-983476|NZ_CP041765.1_1948494-1948476|NZ_CP041765.1_2059987-2059969|NZ_CP041765.1_2569938-2569920|NZ_CP041765.1_2617382-2617364|NZ_CP041765.1_2645826-2645808|NZ_CP041765.1_2696434-2696416|NZ_CP041765.1_2993393-2993375|NZ_CP041765.1_3167120-3167102|NZ_CP041765.1_3433294-3433276|NZ_CP041765.1_3648082-3648064|NZ_CP041765.1_3755257-3755239|NZ_CP041766.1_49293-49275|NZ_CP041766.1_49392-49374	NA	1	1	Orphan	cas3,csa3,WYL,cas4,DEDDh,DinG,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	NA|101aa|up_5|NZ_CP041765.1_3802806_3803109_-,NA|158aa|down_1|NZ_CP041765.1_3812200_3812674_-	NA|596aa|up_9|NZ_CP041765.1_3798215_3800003_-	COG0768, FtsI, Cell division protein FtsI/penicillin-binding protein 2 [Cell envelope biogenesis, outer membrane]	NA|317aa|up_8|NZ_CP041765.1_3800071_3801022_-	pfam13354, Beta-lactamase2, Beta-lactamase enzyme family	NA|312aa|up_7|NZ_CP041765.1_3801014_3801950_-	COG0583, LysR, Transcriptional regulator [Transcription]	NA|235aa|up_6|NZ_CP041765.1_3802051_3802756_+	COG1051, COG1051, ADP-ribose pyrophosphatase [Nucleotide transport and metabolism]	NA|101aa|up_5|NZ_CP041765.1_3802806_3803109_-	NA	NA|295aa|up_4|NZ_CP041765.1_3803098_3803983_-	PRK07825, PRK07825, short chain dehydrogenase; Provisional	NA|325aa|up_3|NZ_CP041765.1_3804560_3805535_+	COG1075, LipA, Predicted acetyltransferases and hydrolases with the alpha/beta hydrolase fold [General function prediction only]	NA|207aa|up_2|NZ_CP041765.1_3805674_3806295_+	cd02145, BluB, 5,6-dimethylbenzimidazole synthase	NA|162aa|up_1|NZ_CP041765.1_3806399_3806885_+	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|550aa|up_0|NZ_CP041765.1_3806881_3808531_+	TIGR00711, Uncharacterized_MFS-type_transporter_YhcA, drug resistance transporter, EmrB/QacA subfamily	NA|494aa|down_0|NZ_CP041765.1_3810556_3812038_-	PRK07121, PRK07121, FAD-binding protein	NA|158aa|down_1|NZ_CP041765.1_3812200_3812674_-	NA	NA|364aa|down_2|NZ_CP041765.1_3812745_3813837_+	pfam14249, Tocopherol_cycl, Tocopherol cyclase	NA|257aa|down_3|NZ_CP041765.1_3813937_3814708_-	pfam00596, Aldolase_II, Class II Aldolase and Adducin N-terminal domain	NA|406aa|down_4|NZ_CP041765.1_3814709_3815927_-	pfam04909, Amidohydro_2, Amidohydrolase	NA|242aa|down_5|NZ_CP041765.1_3816080_3816806_+	COG1414, IclR, Transcriptional regulator [Transcription]	NA|133aa|down_6|NZ_CP041765.1_3816822_3817221_-	COG3189, COG3189, Uncharacterized conserved protein [Function unknown]	NA|235aa|down_7|NZ_CP041765.1_3817375_3818080_+	COG3393, COG3393, Predicted acetyltransferase [General function prediction only]	NA|127aa|down_8|NZ_CP041765.1_3818119_3818500_-	pfam18029, Glyoxalase_6, Glyoxalase-like domain	NA|461aa|down_9|NZ_CP041765.1_3818812_3820195_+	TIGR03026, NDP-sugDHase, nucleotide sugar dehydrogenase
