assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001592425.1_ASM159242v1	NZ_CP010875	Streptococcus agalactiae strain CU_GBS_98 chromosome, complete genome	1	464180-464872	1,1,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type I-C,Type I-U, Type I-U?	GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT	32,32,32,32	0	0	NA	NA	I-C:I-C:I-C:I-C	8,9,10,8	10	TypeI-C,TypeI-U,TypeI-U?	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|231aa|up_9|NZ_CP010875.1_450627_451320_+,NA|260aa|up_7|NZ_CP010875.1_454210_454990_-,NA|97aa|down_6|NZ_CP010875.1_470535_470826_+	NA|231aa|up_9|NZ_CP010875.1_450627_451320_+	NA	NA|884aa|up_8|NZ_CP010875.1_451341_453993_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|260aa|up_7|NZ_CP010875.1_454210_454990_-	NA	cas3|808aa|up_6|NZ_CP010875.1_456001_458425_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|243aa|up_5|NZ_CP010875.1_458557_459286_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|632aa|up_4|NZ_CP010875.1_459285_461181_+	cd09642, Cas8c_I-C, CRISPR/Cas system-associated protein Cas8c	cas7|283aa|up_3|NZ_CP010875.1_461185_462034_+	COG3649, COG3649, CRISPR system related protein [Defense mechanisms]	cas4|224aa|up_2|NZ_CP010875.1_462035_462707_+	COG1468, COG1468, CRISPR-associated protein Cas4 (RecB family exonuclease) [Defense    mechanisms]	cas1|342aa|up_1|NZ_CP010875.1_462703_463729_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas2|98aa|up_0|NZ_CP010875.1_463739_464033_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|320aa|down_0|NZ_CP010875.1_465008_465968_+	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|301aa|down_1|NZ_CP010875.1_466128_467031_+	cd12827, EcCorA_ZntB-like_u2, uncharacterized bacterial subfamily of the Escherichia coli CorA-Salmonella typhimurium ZntB family	NA|355aa|down_2|NZ_CP010875.1_467190_468255_+	COG2315, MmcQ, Uncharacterized protein conserved in bacteria [Function unknown]	NA|331aa|down_3|NZ_CP010875.1_468367_469360_+	COG2502, AsnA, Asparagine synthetase A [Amino acid transport and metabolism]	NA|150aa|down_4|NZ_CP010875.1_469404_469854_-	TIGR01295, Pediocin_PA-1_biosynthesis_protein_PedC, bacteriocin transport accessory protein, putative	NA|180aa|down_5|NZ_CP010875.1_469984_470524_+	pfam03602, Cons_hypoth95, Conserved hypothetical protein 95	NA|97aa|down_6|NZ_CP010875.1_470535_470826_+	NA	NA|162aa|down_7|NZ_CP010875.1_470822_471308_+	cd02163, PPAT, Phosphopantetheine adenylyltransferase	NA|358aa|down_8|NZ_CP010875.1_471297_472371_+	COG3480, SdrC, Predicted secreted protein containing a PDZ domain [Signal transduction mechanisms]	NA|445aa|down_9|NZ_CP010875.1_472445_473780_+	cd00845, MPP_UshA_N_like, Escherichia coli UshA-like family, N-terminal metallophosphatase domain
GCF_001592425.1_ASM159242v1	NZ_CP010875	Streptococcus agalactiae strain CU_GBS_98 chromosome, complete genome	2	866399-867094	3,2,2	PILER-CR,CRISPRCasFinder,CRT	no	cas9,cas1,cas2,csn2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type II-B,Type II-A,Type II-C	GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC,GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC,GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC	36,36,36	0	0	NA	NA	II-A:II-A:II-A	9,9,10	10	TypeII-B,TypeII-A,TypeII-C	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA,NA	NA|124aa|up_9|NZ_CP010875.1_855780_856152_+	pfam08349, DUF1722, Protein of unknown function (DUF1722)	NA|127aa|up_8|NZ_CP010875.1_856176_856557_+	TIGR02328, TIGR02328, conserved hypothetical protein	NA|377aa|up_7|NZ_CP010875.1_856648_857779_+	PRK08599, PRK08599, oxygen-independent coproporphyrinogen III oxidase	NA|246aa|up_6|NZ_CP010875.1_857782_858520_+	pfam01643, Acyl-ACP_TE, Acyl-ACP thioesterase	NA|257aa|up_5|NZ_CP010875.1_858520_859291_+	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|219aa|up_4|NZ_CP010875.1_859280_859937_+	COG4478, COG4478, Predicted membrane protein [Function unknown]	cas9|1371aa|up_3|NZ_CP010875.1_860324_864437_+	TIGR01865, conserved_hypothetical_protein, CRISPR subtype II/NMENI RNA-guided endonuclease Cas9/Csn1	cas1|290aa|up_2|NZ_CP010875.1_864438_865308_+	TIGR03639, cas1_NMENI, CRISPR-associated endonuclease Cas1, subtype II/NMENI	cas2|114aa|up_1|NZ_CP010875.1_865304_865646_+	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	csn2|222aa|up_0|NZ_CP010875.1_865632_866298_+	cd09758, Csn2, CRISPR/Cas system-associated protein Csn2	NA|139aa|down_0|NZ_CP010875.1_867651_868068_+	PRK00668, ndk, mulitfunctional nucleoside diphosphate kinase/apyrimidinic endonuclease/3'-; Validated	NA|611aa|down_1|NZ_CP010875.1_868203_870036_+	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	NA|878aa|down_2|NZ_CP010875.1_870282_872916_+	NF033189, internalin_A, class 1 internalin InlA	NA|220aa|down_3|NZ_CP010875.1_873015_873675_+	COG1418, COG1418, Predicted HD superfamily hydrolase [General function prediction only]	NA|155aa|down_4|NZ_CP010875.1_873683_874148_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|130aa|down_5|NZ_CP010875.1_874147_874537_+	PRK00222, PRK00222, peptide-methionine (R)-S-oxide reductase MsrB	NA|931aa|down_6|NZ_CP010875.1_874688_877481_+	COG0474, MgtA, Cation transport ATPase [Inorganic ion transport and metabolism]	NA|368aa|down_7|NZ_CP010875.1_877480_878584_+	pfam11187, DUF2974, Protein of unknown function (DUF2974)	NA|213aa|down_8|NZ_CP010875.1_878704_879343_-	cd03349, LbH_XAT, Xenobiotic acyltransferase (XAT): The XAT class of hexapeptide acyltransferases is composed of a large number of microbial enzymes that catalyze the CoA-dependent acetylation of a variety of hydroxyl-bearing acceptors such as chloramphenicol and streptogramin, among others	NA|204aa|down_9|NZ_CP010875.1_880053_880665_+	COG0398, COG0398, Uncharacterized conserved protein [Function unknown]
GCF_001592425.1_ASM159242v1	NZ_CP010875	Streptococcus agalactiae strain CU_GBS_98 chromosome, complete genome	3	1887119-1887616	3	CRT	no		cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Orphan	CTGGTTTGGCNTCTGGNT	18	1	1	1887581-1887598	NZ_CP010875.1_1986981-1986964	NA	8	8	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|203aa|up_4|NZ_CP010875.1_1879478_1880087_+,NA	NA|746aa|up_9|NZ_CP010875.1_1868430_1870668_-	PRK05222, PRK05222, 5-methyltetrahydropteroyltriglutamate--homocysteine S-methyltransferase; Provisional	NA|108aa|up_8|NZ_CP010875.1_1871037_1871361_-	COG4392, COG4392, Predicted membrane protein [Function unknown]	NA|231aa|up_7|NZ_CP010875.1_1871350_1872043_-	COG1296, AzlC, Predicted branched-chain amino acid permease (azaleucine resistance) [Amino acid transport and metabolism]	NA|1572aa|up_6|NZ_CP010875.1_1872365_1877081_+	cd07475, Peptidases_S8_C5a_Peptidase, Peptidase S8 family domain in Streptococcal C5a peptidases	NA|463aa|up_5|NZ_CP010875.1_1877997_1879386_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|203aa|up_4|NZ_CP010875.1_1879478_1880087_+	NA	NA|834aa|up_3|NZ_CP010875.1_1880176_1882678_-	PRK00390, leuS, leucyl-tRNA synthetase; Validated	NA|416aa|up_2|NZ_CP010875.1_1883054_1884302_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|269aa|up_1|NZ_CP010875.1_1884959_1885765_-	pfam13359, DDE_Tnp_4, DDE superfamily endonuclease	NA|180aa|up_0|NZ_CP010875.1_1886188_1886728_-	PRK05609, nusG, transcription antitermination protein NusG; Validated	NA|58aa|down_0|NZ_CP010875.1_1889719_1889893_-	COG0690, SecE, Preprotein translocase subunit SecE [Intracellular trafficking and secretion]	NA|51aa|down_1|NZ_CP010875.1_1889928_1890081_-	PRK00504, rpmG, 50S ribosomal protein L33; Validated	NA|774aa|down_2|NZ_CP010875.1_1890129_1892451_-	COG0744, MrcB, Membrane carboxypeptidase (penicillin-binding protein) [Cell envelope biogenesis, outer membrane]	NA|295aa|down_3|NZ_CP010875.1_1892494_1893379_+	COG0564, RluA, Pseudouridylate synthases, 23S RNA-specific [Translation, ribosomal structure and biogenesis]	NA|547aa|down_4|NZ_CP010875.1_1893403_1895044_-	COG4640, COG4640, Predicted membrane protein [Function unknown]	NA|404aa|down_5|NZ_CP010875.1_1895213_1896425_-	PRK05362, PRK05362, phosphopentomutase; Provisional	NA|224aa|down_6|NZ_CP010875.1_1896491_1897163_-	PRK00507, PRK00507, deoxyribose-phosphate aldolase; Provisional	NA|401aa|down_7|NZ_CP010875.1_1897192_1898395_-	COG1972, NupC, Nucleoside permease [Nucleotide transport and metabolism]	NA|260aa|down_8|NZ_CP010875.1_1898415_1899195_-	cd17767, UP_EcUdp-like, uridine phosphorylases similar to Escherichia coli Udp and related phosphorylases	NA|246aa|down_9|NZ_CP010875.1_1899353_1900091_+	COG2188, PhnF, Transcriptional regulators [Transcription]
GCF_001592425.1_ASM159242v1	NZ_CP010875	Streptococcus agalactiae strain CU_GBS_98 chromosome, complete genome	4	1937169-1937255	3	CRISPRCasFinder	no	csa3	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type I-A	AGCAGTATCGTACTTAGTTTGAGC	24	0	0	NA	NA	NA	1	1	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|154aa|up_0|NZ_CP010875.1_1935823_1936285_-,NA|319aa|down_1|NZ_CP010875.1_1939674_1940631_-,NA|98aa|down_2|NZ_CP010875.1_1940865_1941159_+,NA|147aa|down_3|NZ_CP010875.1_1941240_1941681_+,NA|177aa|down_4|NZ_CP010875.1_1941677_1942208_+,NA|424aa|down_6|NZ_CP010875.1_1943117_1944389_+,NA|88aa|down_7|NZ_CP010875.1_1944471_1944735_+,NA|62aa|down_9|NZ_CP010875.1_1946301_1946487_-	NA|146aa|up_9|NZ_CP010875.1_1927164_1927602_-	TIGR01529, Arginine_repressor	NA|564aa|up_8|NZ_CP010875.1_1927823_1929515_+	PRK12451, PRK12451, arginyl-tRNA synthetase; Reviewed	NA|103aa|up_7|NZ_CP010875.1_1929602_1929911_+	pfam08951, EntA_Immun, Enterocin A Immunity	NA|291aa|up_6|NZ_CP010875.1_1929937_1930810_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|315aa|up_5|NZ_CP010875.1_1930917_1931862_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|584aa|up_4|NZ_CP010875.1_1931851_1933603_-	PRK00476, aspS, aspartyl-tRNA synthetase; Validated	NA|427aa|up_3|NZ_CP010875.1_1933695_1934976_-	PRK00037, hisS, histidyl-tRNA synthetase; Reviewed	NA|61aa|up_2|NZ_CP010875.1_1935195_1935378_+	PRK01110, rpmF, 50S ribosomal protein L32; Validated	NA|50aa|up_1|NZ_CP010875.1_1935393_1935543_+	PRK00595, rpmG, 50S ribosomal protein L33; Validated	NA|154aa|up_0|NZ_CP010875.1_1935823_1936285_-	NA	NA|112aa|down_0|NZ_CP010875.1_1939302_1939638_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|319aa|down_1|NZ_CP010875.1_1939674_1940631_-	NA	NA|98aa|down_2|NZ_CP010875.1_1940865_1941159_+	NA	NA|147aa|down_3|NZ_CP010875.1_1941240_1941681_+	NA	NA|177aa|down_4|NZ_CP010875.1_1941677_1942208_+	NA	NA|249aa|down_5|NZ_CP010875.1_1942207_1942954_+	COG1674, FtsK, DNA segregation ATPase FtsK/SpoIIIE and related proteins [Cell division and chromosome partitioning]	NA|424aa|down_6|NZ_CP010875.1_1943117_1944389_+	NA	NA|88aa|down_7|NZ_CP010875.1_1944471_1944735_+	NA	NA|422aa|down_8|NZ_CP010875.1_1944831_1946097_+	cd01189, INT_ICEBs1_C_like, C-terminal catalytic domain of integrases from bacterial phages and conjugate transposons	NA|62aa|down_9|NZ_CP010875.1_1946301_1946487_-	NA
