assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000208385.1_ASM20838v1	NC_015436	Sphaerochaeta coccoides DSM 17374, complete sequence	1	1302007-1306491	1,1,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas8e,cse2gr11,cas6e,cas7,cas5,cas1,cas2,PrimPol,cas6f,cas7f,cas5f,cas8f	DEDDh,DinG,cas3,csa3,c2c9_V-U4,cas8e,cse2gr11,cas6e,cas7,cas5,cas1,cas2,PrimPol,cas6f,cas7f,cas5f,cas8f,cas3f	Type I-F,Type I-E	CTATTCCCCGCAAGTGCGGGGGTGTTTC,CTATTCCCCGCAAGTGCGGGGGTGTTTC,CTATTCCCCGCAAGTGCGGGGGTGTTTC,TATTCCCCGCAAGTGCGGGGGTGTTTC	28,28,28,27	2	2	1306431-1306463|1306431-1306464	NC_015436.1_114033-114065|NC_015436.1_114033-114066	NA:NA:NA:NA	67,73,73,67	73	TypeI-F,TypeI-E	DEDDh,DinG,cas3,csa3,c2c9_V-U4,cas8e,cse2gr11,cas6e,cas7,cas5,cas1,cas2,PrimPol,cas6f,cas7f,cas5f,cas8f,cas3f	NA,NA|150aa|down_2|NC_015436.1_1307584_1308034_+,NA|109aa|down_3|NC_015436.1_1308123_1308450_+,NA|154aa|down_6|NC_015436.1_1310624_1311086_+	NA|253aa|up_9|NC_015436.1_1291568_1292327_+	COG4604, CeuD, ABC-type enterochelin transport system, ATPase component [Inorganic ion transport and metabolism]	NA|321aa|up_8|NC_015436.1_1292376_1293339_+	cd01140, FatB, Siderophore binding protein FatB	cas3|873aa|up_7|NC_015436.1_1293816_1296435_+	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	cas8e|503aa|up_6|NC_015436.1_1296428_1297937_+	cd09729, Cse1_I-E, CRISPR/Cas system-associated protein Cse1	cse2gr11|176aa|up_5|NC_015436.1_1297926_1298454_+	pfam09485, CRISPR_Cse2, CRISPR-associated protein Cse2 (CRISPR_cse2)	cas6e|199aa|up_4|NC_015436.1_1298450_1299047_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas7|358aa|up_3|NC_015436.1_1299043_1300117_+	pfam09344, Cas_CT1975, CT1975-like protein	cas5|233aa|up_2|NC_015436.1_1300127_1300826_+	TIGR01868, hypothetical_protein, CRISPR-associated protein Cas5/CasD, subtype I-E/ECOLI	cas1|282aa|up_1|NC_015436.1_1300825_1301671_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|93aa|up_0|NC_015436.1_1301673_1301952_+	pfam09707, Cas_Cas2CT1978, CRISPR-associated protein (Cas_Cas2CT1978)	NA|161aa|down_0|NC_015436.1_1306495_1306978_+	pfam18818, MPTase-PolyVal, Metallopeptidase superfamily domain	NA|197aa|down_1|NC_015436.1_1306970_1307561_+	pfam18819, MuF_C, Phage MuF-C-terminal domain	NA|150aa|down_2|NC_015436.1_1307584_1308034_+	NA	NA|109aa|down_3|NC_015436.1_1308123_1308450_+	NA	NA|295aa|down_4|NC_015436.1_1308618_1309503_-	pfam13391, HNH_2, HNH endonuclease	NA|144aa|down_5|NC_015436.1_1309879_1310311_-	COG2819, COG2819, Predicted hydrolase of the alpha/beta superfamily [General function prediction only]	NA|154aa|down_6|NC_015436.1_1310624_1311086_+	NA	NA|69aa|down_7|NC_015436.1_1311040_1311247_+	pfam07553, Lipoprotein_Ltp, Host cell surface-exposed lipoprotein	NA|64aa|down_8|NC_015436.1_1311303_1311495_-	cd09126, PLDc_C_DEXD_like, C-terminal putative phospholipase D-like domain of uncharacterized prokaryotic HKD family nucleases fused to DEAD/DEAH box helicases	PrimPol|861aa|down_9|NC_015436.1_1311572_1314155_-	COG4951, COG4951, Uncharacterized protein conserved in bacteria [Function unknown]
GCF_000208385.1_ASM20838v1	NC_015436	Sphaerochaeta coccoides DSM 17374, complete sequence	2	1319989-1322002	2,2,3	CRISPRCasFinder,CRT,PILER-CR	no	cas5,cas1,cas2,PrimPol,cas6f,cas7f,cas5f,cas8f,cas3f	DEDDh,DinG,cas3,csa3,c2c9_V-U4,cas8e,cse2gr11,cas6e,cas7,cas5,cas1,cas2,PrimPol,cas6f,cas7f,cas5f,cas8f,cas3f	Type I-F	TTTCTAAGCTGCCTATGCGGCAGCATAC,TTTCTAAGCTGCCTATGCGGCAGCATAC,TTTCTAAGCTGCCTATGCGGCAGCATAC	28,28,28	0	0	NA	NA	I-F:I-F:I-F	33,33,21	33	TypeI-F	DEDDh,DinG,cas3,csa3,c2c9_V-U4,cas8e,cse2gr11,cas6e,cas7,cas5,cas1,cas2,PrimPol,cas6f,cas7f,cas5f,cas8f,cas3f	NA|154aa|up_9|NC_015436.1_1310624_1311086_+,NA|204aa|up_4|NC_015436.1_1316354_1316966_-,NA|254aa|up_3|NC_015436.1_1317113_1317875_-,NA|174aa|up_2|NC_015436.1_1318114_1318636_+,NA|50aa|up_1|NC_015436.1_1318712_1318862_-,NA|109aa|up_0|NC_015436.1_1319130_1319457_-,NA	NA|154aa|up_9|NC_015436.1_1310624_1311086_+	NA	NA|69aa|up_8|NC_015436.1_1311040_1311247_+	pfam07553, Lipoprotein_Ltp, Host cell surface-exposed lipoprotein	NA|64aa|up_7|NC_015436.1_1311303_1311495_-	cd09126, PLDc_C_DEXD_like, C-terminal putative phospholipase D-like domain of uncharacterized prokaryotic HKD family nucleases fused to DEAD/DEAH box helicases	PrimPol|861aa|up_6|NC_015436.1_1311572_1314155_-	COG4951, COG4951, Uncharacterized protein conserved in bacteria [Function unknown]	NA|500aa|up_5|NC_015436.1_1314183_1315683_-	COG2865, COG2865, Predicted transcriptional regulator containing an HTH domain and an uncharacterized domain shared with the mammalian protein Schlafen [Transcription]	NA|204aa|up_4|NC_015436.1_1316354_1316966_-	NA	NA|254aa|up_3|NC_015436.1_1317113_1317875_-	NA	NA|174aa|up_2|NC_015436.1_1318114_1318636_+	NA	NA|50aa|up_1|NC_015436.1_1318712_1318862_-	NA	NA|109aa|up_0|NC_015436.1_1319130_1319457_-	NA	cas6f|194aa|down_0|NC_015436.1_1322086_1322668_-	pfam09618, Cas_Csy4, CRISPR-associated protein (Cas_Csy4)	cas7f|345aa|down_1|NC_015436.1_1322677_1323712_-	pfam09615, Cas_Csy3, CRISPR-associated protein (Cas_Csy3)	cas5f|298aa|down_2|NC_015436.1_1323713_1324607_-	pfam09614, Cas_Csy2, CRISPR-associated protein (Cas_Csy2)	cas8f|401aa|down_3|NC_015436.1_1324603_1325806_-	pfam09611, Cas_Csy1, CRISPR-associated protein (Cas_Csy1)	cas3f|1098aa|down_4|NC_015436.1_1325826_1329120_-	cd09673, Cas3_Cas2_I-F, CRISPR/Cas system-associated protein Cas3/Cas2	cas1|322aa|down_5|NC_015436.1_1329116_1330082_-	TIGR03637, cas1_YPEST, CRISPR-associated endonuclease Cas1, subtype I-F/YPEST	NA|67aa|down_6|NC_015436.1_1330172_1330373_-	pfam03852, Vsr, DNA mismatch endonuclease Vsr	NA|395aa|down_7|NC_015436.1_1330934_1332119_-	cd06173, MFS_MefA_like, Macrolide efflux protein A and similar proteins of the Major Facilitator Superfamily of transporters	NA|275aa|down_8|NC_015436.1_1332123_1332948_-	TIGR04470, hypothetical_protein_ALIPUT_00462, radical SAM mobile pair protein B	NA|479aa|down_9|NC_015436.1_1333233_1334670_-	COG2865, COG2865, Predicted transcriptional regulator containing an HTH domain and an uncharacterized domain shared with the mammalian protein Schlafen [Transcription]
GCF_000208385.1_ASM20838v1	NC_015436	Sphaerochaeta coccoides DSM 17374, complete sequence	3	1699847-1700061	3,4	CRISPRCasFinder,PILER-CR	no		DEDDh,DinG,cas3,csa3,c2c9_V-U4,cas8e,cse2gr11,cas6e,cas7,cas5,cas1,cas2,PrimPol,cas6f,cas7f,cas5f,cas8f,cas3f	Orphan	TGACTATTCCCCGCAGGTGCGGGGGTGTTTCT,CTATTCCCCGCAAGTGCGGGGGTGTTTC	32,28	0	0	NA	NA	NA:NA	3,3	3	Orphan	DEDDh,DinG,cas3,csa3,c2c9_V-U4,cas8e,cse2gr11,cas6e,cas7,cas5,cas1,cas2,PrimPol,cas6f,cas7f,cas5f,cas8f,cas3f	NA,NA|56aa|down_8|NC_015436.1_1710135_1710303_+	NA|434aa|up_9|NC_015436.1_1678545_1679847_+	PRK02427, PRK02427, 3-phosphoshikimate 1-carboxyvinyltransferase; Provisional	NA|348aa|up_8|NC_015436.1_1679833_1680877_+	PLN02721, PLN02721, threonine aldolase	NA|422aa|up_7|NC_015436.1_1680873_1682139_+	COG1168, MalY, Bifunctional PLP-dependent enzyme with beta-cystathionase and maltose regulon repressor activities [Amino acid transport and metabolism]	NA|1219aa|up_6|NC_015436.1_1682185_1685842_-	COG1074, RecB, ATP-dependent exoDNAse (exonuclease V) beta subunit (contains helicase and exonuclease domains) [DNA replication, recombination, and repair]	NA|1014aa|up_5|NC_015436.1_1685838_1688880_-	pfam12705, PDDEXK_1, PD-(D/E)XK nuclease superfamily	NA|327aa|up_4|NC_015436.1_1688918_1689899_+	COG1266, COG1266, Predicted metal-dependent membrane protease [General function prediction only]	NA|388aa|up_3|NC_015436.1_1689946_1691110_+	pfam01223, Endonuclease_NS, DNA/RNA non-specific endonuclease	NA|447aa|up_2|NC_015436.1_1691237_1692578_+	cd08175, G1PDH, Glycerol-1-phosphate dehydrogenase (G1PDH) catalyzes the reversible reduction of dihydroxyacetone phosphate (DHAP) to glycerol-1-phosphate (G1P) in an NADH-dependent manner	NA|77aa|up_1|NC_015436.1_1693415_1693646_+	pfam13936, HTH_38, Helix-turn-helix domain	NA|2085aa|up_0|NC_015436.1_1693572_1699827_+	pfam18760, ART-PolyVal, ADP-Ribosyltransferase in polyvalent proteins	NA|180aa|down_0|NC_015436.1_1700527_1701067_-	PRK06842, PRK06842, Fe-S-containing hydro-lyase	NA|309aa|down_1|NC_015436.1_1701059_1701986_-	pfam05681, Fumerase, Fumarate hydratase (Fumerase)	NA|187aa|down_2|NC_015436.1_1701985_1702546_-	COG5652, COG5652, Predicted integral membrane protein [Function unknown]	NA|334aa|down_3|NC_015436.1_1702520_1703522_-	COG1242, COG1242, Predicted Fe-S oxidoreductase [General function prediction only]	NA|812aa|down_4|NC_015436.1_1703521_1705957_-	COG1752, RssA, Predicted esterase of the alpha-beta hydrolase superfamily [General function prediction only]	NA|350aa|down_5|NC_015436.1_1705958_1707008_-	COG0223, Fmt, Methionyl-tRNA formyltransferase [Translation, ribosomal structure and biogenesis]	NA|168aa|down_6|NC_015436.1_1706964_1707468_-	PRK00150, def, peptide deformylase; Reviewed	NA|692aa|down_7|NC_015436.1_1707939_1710015_+	COG5184, ATS1, Alpha-tubulin suppressor and related RCC1 domain-containing proteins [Cell division and chromosome partitioning / Cytoskeleton]	NA|56aa|down_8|NC_015436.1_1710135_1710303_+	NA	NA|668aa|down_9|NC_015436.1_1710397_1712401_-	PRK05580, PRK05580, primosome assembly protein PriA; Validated
