assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000307105.1_ASM30710v1	NC_018645	Desulfobacula toluolica Tol2, complete genome	1	1120959-1125463	1,1,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas5,cas3,cas8b6,cas7,cas6,cas4,cas1,cas2	csa3,RT,c2c9_V-U4,cas5,cas3,cas8b6,cas7,cas6,cas4,cas1,cas2,DEDDh,cas8b1,Cas9_archaeal,PD-DExK	Unclear	CTTTTAATCAGACCAGTGTGGAATTGAAAC,CTTTTAATCAGACCAGTGTGGAATTGAAAC,CTTTTAATCAGACCAGTGTGGAATTGAAAC,CTTTTAATCAGACCAGTGTGGAATTGAAAC	30,30,30,30	0	0	NA	NA	I-A,II-B,III-A:I-A,II-B,III-A:I-A,II-B,III-A:I-A,II-B,III-A	66,68,68,66	68	Unclear	csa3,RT,c2c9_V-U4,cas5,cas3,cas8b6,cas7,cas6,cas4,cas1,cas2,DEDDh,cas8b1,Cas9_archaeal,PD-DExK	NA|239aa|up_9|NC_018645.1_1111016_1111733_+,NA|264aa|up_8|NC_018645.1_1111745_1112537_+,cas5|193aa|up_7|NC_018645.1_1112810_1113389_+,cas8b6|467aa|up_5|NC_018645.1_1115564_1116965_+,NA|107aa|down_2|NC_018645.1_1127421_1127742_-	NA|239aa|up_9|NC_018645.1_1111016_1111733_+	NA	NA|264aa|up_8|NC_018645.1_1111745_1112537_+	NA	cas5|193aa|up_7|NC_018645.1_1112810_1113389_+	NA	cas3|720aa|up_6|NC_018645.1_1113391_1115551_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas8b6|467aa|up_5|NC_018645.1_1115564_1116965_+	NA	cas7|356aa|up_4|NC_018645.1_1117003_1118071_+	cd09687, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	cas6|268aa|up_3|NC_018645.1_1118125_1118929_+	COG1583, COG1583, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	cas4|165aa|up_2|NC_018645.1_1118964_1119459_+	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas1|330aa|up_1|NC_018645.1_1119556_1120546_+	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas2|94aa|up_0|NC_018645.1_1120548_1120830_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|511aa|down_0|NC_018645.1_1125500_1127033_-	pfam03050, DDE_Tnp_IS66, Transposase IS66 family	NA|116aa|down_1|NC_018645.1_1127077_1127425_-	pfam05717, TnpB_IS66, IS66 Orf2 like protein	NA|107aa|down_2|NC_018645.1_1127421_1127742_-	NA	NA|173aa|down_3|NC_018645.1_1128390_1128909_-	pfam03972, MmgE_PrpD, MmgE/PrpD family	NA|268aa|down_4|NC_018645.1_1128927_1129731_-	pfam03972, MmgE_PrpD, MmgE/PrpD family	NA|557aa|down_5|NC_018645.1_1129754_1131425_-	pfam08269, dCache_2, Cache domain	NA|390aa|down_6|NC_018645.1_1131452_1132622_-	cd06325, PBP1_ABC_unchar_transporter, type 1 periplasmic ligand-binding domain of uncharacterized ABC-type transport systems predicted to be involved in uptake of amino acids, peptides, or inorganic ions	NA|802aa|down_7|NC_018645.1_1132945_1135351_-	COG0466, Lon, ATP-dependent Lon protease, bacterial type [Posttranslational modification, protein turnover, chaperones]	NA|983aa|down_8|NC_018645.1_1135850_1138799_+	cd16434, CheB-CheR_fusion, Chemotaxis response regulator protein-glutamate methylesterase, CheB, fused with CheR domain	NA|721aa|down_9|NC_018645.1_1138810_1140973_+	PRK11360, PRK11360, two-component system sensor histidine kinase AtoS
GCF_000307105.1_ASM30710v1	NC_018645	Desulfobacula toluolica Tol2, complete genome	2	1127805-1128164	2,3,2	CRT,PILER-CR,CRISPRCasFinder	no	cas5,cas3,cas8b6,cas7,cas6,cas4,cas1,cas2	csa3,RT,c2c9_V-U4,cas5,cas3,cas8b6,cas7,cas6,cas4,cas1,cas2,DEDDh,cas8b1,Cas9_archaeal,PD-DExK	Unclear	CTTTTAATCAGACCAGTGTGGAATTGAAAC,CTTTTAATCAGACCAGTGTGGAATTGAAAC,CTTTTAATCAGACCAGTGTGGAATTGAAAC	30,30,30	0	0	NA	NA	I-A,II-B,III-A:I-A,II-B,III-A:I-A,II-B,III-A	5,4,4	5	Unclear	csa3,RT,c2c9_V-U4,cas5,cas3,cas8b6,cas7,cas6,cas4,cas1,cas2,DEDDh,cas8b1,Cas9_archaeal,PD-DExK	cas8b6|467aa|up_8|NC_018645.1_1115564_1116965_+,NA|107aa|up_0|NC_018645.1_1127421_1127742_-,NA|64aa|down_7|NC_018645.1_1141000_1141192_-	cas3|720aa|up_9|NC_018645.1_1113391_1115551_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas8b6|467aa|up_8|NC_018645.1_1115564_1116965_+	NA	cas7|356aa|up_7|NC_018645.1_1117003_1118071_+	cd09687, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	cas6|268aa|up_6|NC_018645.1_1118125_1118929_+	COG1583, COG1583, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	cas4|165aa|up_5|NC_018645.1_1118964_1119459_+	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas1|330aa|up_4|NC_018645.1_1119556_1120546_+	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas2|94aa|up_3|NC_018645.1_1120548_1120830_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|511aa|up_2|NC_018645.1_1125500_1127033_-	pfam03050, DDE_Tnp_IS66, Transposase IS66 family	NA|116aa|up_1|NC_018645.1_1127077_1127425_-	pfam05717, TnpB_IS66, IS66 Orf2 like protein	NA|107aa|up_0|NC_018645.1_1127421_1127742_-	NA	NA|173aa|down_0|NC_018645.1_1128390_1128909_-	pfam03972, MmgE_PrpD, MmgE/PrpD family	NA|268aa|down_1|NC_018645.1_1128927_1129731_-	pfam03972, MmgE_PrpD, MmgE/PrpD family	NA|557aa|down_2|NC_018645.1_1129754_1131425_-	pfam08269, dCache_2, Cache domain	NA|390aa|down_3|NC_018645.1_1131452_1132622_-	cd06325, PBP1_ABC_unchar_transporter, type 1 periplasmic ligand-binding domain of uncharacterized ABC-type transport systems predicted to be involved in uptake of amino acids, peptides, or inorganic ions	NA|802aa|down_4|NC_018645.1_1132945_1135351_-	COG0466, Lon, ATP-dependent Lon protease, bacterial type [Posttranslational modification, protein turnover, chaperones]	NA|983aa|down_5|NC_018645.1_1135850_1138799_+	cd16434, CheB-CheR_fusion, Chemotaxis response regulator protein-glutamate methylesterase, CheB, fused with CheR domain	NA|721aa|down_6|NC_018645.1_1138810_1140973_+	PRK11360, PRK11360, two-component system sensor histidine kinase AtoS	NA|64aa|down_7|NC_018645.1_1141000_1141192_-	NA	NA|409aa|down_8|NC_018645.1_1141365_1142592_-	cd07185, OmpA_C-like, Peptidoglycan binding domains similar to the C-terminal domain of outer-membrane protein OmpA	NA|45aa|down_9|NC_018645.1_1142790_1142925_-	PRK05826, PRK05826, pyruvate kinase; Provisional
GCF_000307105.1_ASM30710v1	NC_018645	Desulfobacula toluolica Tol2, complete genome	3	1808150-1808247	3	CRISPRCasFinder	no		csa3,RT,c2c9_V-U4,cas5,cas3,cas8b6,cas7,cas6,cas4,cas1,cas2,DEDDh,cas8b1,Cas9_archaeal,PD-DExK	Orphan	CGCTACTGGCAGGCCGTCGCCCGATG	26	0	0	NA	NA	NA	1	1	Orphan	csa3,RT,c2c9_V-U4,cas5,cas3,cas8b6,cas7,cas6,cas4,cas1,cas2,DEDDh,cas8b1,Cas9_archaeal,PD-DExK	NA|133aa|up_1|NC_018645.1_1803174_1803573_+,NA|444aa|down_0|NC_018645.1_1814734_1816066_-,NA|62aa|down_7|NC_018645.1_1822481_1822667_-	NA|142aa|up_9|NC_018645.1_1796910_1797336_+	COG4244, COG4244, Predicted membrane protein [Function unknown]	NA|182aa|up_8|NC_018645.1_1797351_1797897_+	cd09631, DOMON_DOH, DOMON-like domain of copper-dependent monooxygenases and related proteins	NA|288aa|up_7|NC_018645.1_1797992_1798856_+	cd02968, SCO, SCO (an acronym for Synthesis of Cytochrome c Oxidase) family; composed of proteins similar to Sco1, a membrane-anchored protein possessing a soluble domain with a TRX fold	NA|543aa|up_6|NC_018645.1_1798873_1800502_+	TIGR02891, Probable_cytochrome_c_oxidase_subunit_1-beta, cytochrome c oxidase, subunit I	NA|199aa|up_5|NC_018645.1_1800542_1801139_+	cd02862, NorE_like, NorE_like subfamily of heme-copper oxidase subunit III	NA|96aa|up_4|NC_018645.1_1801263_1801551_+	TIGR02229, hypothetical_protein, caa(3)-type oxidase, subunit IV	NA|204aa|up_3|NC_018645.1_1801558_1802170_+	COG1622, CyoA, Heme/copper-type cytochrome/quinol oxidases, subunit 2 [Energy production and conversion]	NA|307aa|up_2|NC_018645.1_1802159_1803080_+	cd13957, PT_UbiA_Cox10, Protoheme IX farnesyltransferase	NA|133aa|up_1|NC_018645.1_1803174_1803573_+	NA	NA|541aa|up_0|NC_018645.1_1803846_1805469_+	pfam03050, DDE_Tnp_IS66, Transposase IS66 family	NA|444aa|down_0|NC_018645.1_1814734_1816066_-	NA	NA|117aa|down_1|NC_018645.1_1816302_1816653_+	pfam05973, Gp49, Phage derived protein Gp49-like (DUF891)	NA|92aa|down_2|NC_018645.1_1816649_1816925_+	smart00530, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|451aa|down_3|NC_018645.1_1817216_1818569_+	pfam13751, DDE_Tnp_1_6, Transposase DDE domain	NA|303aa|down_4|NC_018645.1_1818813_1819722_+	COG0596, MhpC, Predicted hydrolases or acyltransferases (alpha/beta hydrolase superfamily) [General function prediction only]	NA|523aa|down_5|NC_018645.1_1819835_1821404_+	cd07574, nitrilase_Rim1_like, Uncharacterized subgroup of the nitrilase superfamily; some members of this subgroup have an N-terminal RimI domain (class 12 nitrilases)	NA|317aa|down_6|NC_018645.1_1821534_1822485_+	COG0731, COG0731, Fe-S oxidoreductases [Energy production and conversion]	NA|62aa|down_7|NC_018645.1_1822481_1822667_-	NA	NA|325aa|down_8|NC_018645.1_1822945_1823920_+	COG0714, COG0714, MoxR-like ATPases [General function prediction only]	NA|293aa|down_9|NC_018645.1_1823938_1824817_+	COG1721, COG1721, Uncharacterized conserved protein (some members contain a von Willebrand factor type A (vWA) domain) [General function prediction only]
GCF_000307105.1_ASM30710v1	NC_018645	Desulfobacula toluolica Tol2, complete genome	4	3489798-3490420	4,4,3	PILER-CR,CRISPRCasFinder,CRT	no	cas1,cas2,cas6,cas8b1,cas7,cas5,cas3,cas4	csa3,RT,c2c9_V-U4,cas5,cas3,cas8b6,cas7,cas6,cas4,cas1,cas2,DEDDh,cas8b1,Cas9_archaeal,PD-DExK	Type I-B	GTCTGAACGGCATATCCAGAAGAACAAGGATTGAAAC,GTCTGAACGGCATATCCAGAAGAACAAGGATTGAAAC,GTCTGAACGGCATATCCAGAAGAACAAGGATTGAAAC	37,37,37	0	0	NA	NA	I-B:I-B:I-B	8,8,8	8	TypeI-B	csa3,RT,c2c9_V-U4,cas5,cas3,cas8b6,cas7,cas6,cas4,cas1,cas2,DEDDh,cas8b1,Cas9_archaeal,PD-DExK	NA,NA|184aa|down_0|NC_018645.1_3490820_3491372_+,NA|183aa|down_6|NC_018645.1_3499995_3500544_-	NA|66aa|up_9|NC_018645.1_3480200_3480398_+	TIGR03833, TIGR03833, conserved hypothetical protein	NA|123aa|up_8|NC_018645.1_3480447_3480816_-	cd02230, cupin_HP0902-like, Helicobacter pylori HP0902 and related proteins, cupin domain	cas1|338aa|up_7|NC_018645.1_3481091_3482105_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	cas2|97aa|up_6|NC_018645.1_3482115_3482406_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas6|222aa|up_5|NC_018645.1_3482428_3483094_+	pfam17262, DUF5328, Family of unknown function (DUF5328)	cas8b1|617aa|up_4|NC_018645.1_3483090_3484941_+	pfam09484, Cas_TM1802, CRISPR-associated protein TM1802 (cas_TM1802)	cas7|331aa|up_3|NC_018645.1_3484944_3485937_+	TIGR02590, hypothetical_protein_MM_0563, CRISPR-associated protein Cas7/Csh2, subtype I-B/HMARI	cas5|237aa|up_2|NC_018645.1_3485936_3486647_+	TIGR02592, hypothetical_protein_CTC_01466, CRISPR-associated protein Cas5, subtype I-B/HMARI	cas3|801aa|up_1|NC_018645.1_3486633_3489036_+	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	cas4|201aa|up_0|NC_018645.1_3489036_3489639_+	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	NA|184aa|down_0|NC_018645.1_3490820_3491372_+	NA	NA|897aa|down_1|NC_018645.1_3491558_3494249_+	PRK04914, PRK04914, RNA polymerase-associated protein RapA	NA|283aa|down_2|NC_018645.1_3494275_3495124_-	PRK05778, PRK05778, 2-oxoglutarate ferredoxin oxidoreductase subunit beta; Validated	NA|587aa|down_3|NC_018645.1_3495123_3496884_-	TIGR03710, OAFO_sf, 2-oxoacid:acceptor oxidoreductase, alpha subunit	NA|344aa|down_4|NC_018645.1_3496914_3497946_-	COG1251, NirB, NAD(P)H-nitrite reductase [Energy production and conversion]	NA|566aa|down_5|NC_018645.1_3497975_3499673_-	PRK11749, PRK11749, dihydropyrimidine dehydrogenase subunit A; Provisional	NA|183aa|down_6|NC_018645.1_3499995_3500544_-	NA	NA|286aa|down_7|NC_018645.1_3500959_3501817_+	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|430aa|down_8|NC_018645.1_3502452_3503742_+	pfam07589, VPEP, PEP-CTERM motif	NA|698aa|down_9|NC_018645.1_3503902_3505996_+	TIGR02917, TPR_domain_protein, putative PEP-CTERM system TPR-repeat lipoprotein
