assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_900474745.1_41800_E02	NZ_LS483315	Streptococcus pyogenes strain NCTC12059 chromosome 1	1	119182-119384	1	PILER-CR	no		cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	Orphan	TAGATGGTGAAGAAGTCCCAGAAGTTCCAAGCGAGAGCTTAGAACCTGCGCTTCCCCCATT	61	0	0	NA	NA	NA	2	2	Orphan	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	NA,NA|222aa|down_8|NZ_LS483315.1_132023_132689_-	NA|257aa|up_9|NZ_LS483315.1_109467_110238_-	PRK11880, PRK11880, pyrroline-5-carboxylate reductase; Reviewed	NA|356aa|up_8|NZ_LS483315.1_110285_111353_-	TIGR03107, Glutamyl_aminopeptidase, glutamyl aminopeptidase	NA|98aa|up_7|NZ_LS483315.1_111808_112102_+	pfam15513, DUF4651, Domain of unknown function (DUF4651)	NA|106aa|up_6|NZ_LS483315.1_112098_112416_+	cd02947, TRX_family, TRX family; composed of two groups: Group I, which includes proteins that exclusively encode a TRX domain; and Group II, which are composed of fusion proteins of TRX and additional domains	NA|209aa|up_5|NZ_LS483315.1_112433_113060_+	cd02796, tRNA_bind_bactPheRS, tRNA-binding-domain-containing prokaryotic phenylalanly tRNA synthetase (PheRS) beta chain	NA|132aa|up_4|NZ_LS483315.1_113211_113607_+	PRK07274, PRK07274, single-stranded DNA-binding protein; Provisional	NA|214aa|up_3|NZ_LS483315.1_113865_114507_-	COG1428, COG1428, Deoxynucleoside kinases [Nucleotide transport and metabolism]	NA|326aa|up_2|NZ_LS483315.1_114526_115504_-	TIGR00737, Probable_tRNA-dihydrouridine_synthase, putative TIM-barrel protein, nifR3 family	NA|291aa|up_1|NZ_LS483315.1_115490_116363_-	PRK00114, hslO, Hsp33 family molecular chaperone HslO	NA|498aa|up_0|NZ_LS483315.1_116509_118003_-	pfam08270, PRD_Mga, M protein trans-acting positive regulator (MGA) PRD domain	NA|283aa|down_0|NZ_LS483315.1_120212_121061_+	cd05827, Sortase_C, Sortase domain found in class C sortases	NA|747aa|down_1|NZ_LS483315.1_121346_123587_+	NF033396, pilus_ancill_1, pilus ancillary protein 1	NA|174aa|down_2|NZ_LS483315.1_123583_124105_+	TIGR02227, Inactive_signal_peptidase_IA	NA|352aa|down_3|NZ_LS483315.1_124126_125182_+	TIGR03065, srtB_sig_QVPTGV, sortase B signal domain, QVPTGV class	NA|242aa|down_4|NZ_LS483315.1_125197_125923_+	TIGR03064, sortase_srtB, sortase, SrtB family	NA|196aa|down_5|NZ_LS483315.1_125939_126527_+	TIGR03786, strep_pil_rpt, streptococcal pilin isopeptide linkage domain	NA|402aa|down_6|NZ_LS483315.1_126685_127891_-	TIGR04094, AraC_family_transcriptional_regulator, YSIRK-targeted surface antigen transcriptional regulator	NA|1161aa|down_7|NZ_LS483315.1_128275_131758_+	NF033395, fibronec_SfbI, fibronectin-binding protein SfbI	NA|222aa|down_8|NZ_LS483315.1_132023_132689_-	NA	NA|469aa|down_9|NZ_LS483315.1_133041_134448_+	COG2031, AtoE, Short chain fatty acids transporter [Lipid metabolism]
GCF_900474745.1_41800_E02	NZ_LS483315	Streptococcus pyogenes strain NCTC12059 chromosome 1	2	569205-569633	2,1,1,3	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	Type I-C,Type I-U, Type I-U?	GTCTCACCCTTCGCGGGTGAGTGGATTGAAATT,GTCTCACCCTTCGCGGGTGAGTGGATTGAAAT,GTCTCACCCTTCNNGGGTGAGTGGATTGAAAT,TAGTCTCACCCTTCATGGGTGAGTGGATTGAAAT	33,32,32,34	0	0	NA	NA	I-C:I-C:I-C:I-C	5,6,6,5	6	TypeI-C,TypeI-U?,TypeI-U	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	NA,NA	NA|132aa|up_9|NZ_LS483315.1_556672_557068_+	PRK07758, PRK07758, hypothetical protein; Provisional	NA|188aa|up_8|NZ_LS483315.1_557669_558233_+	pfam13238, AAA_18, AAA domain	NA|883aa|up_7|NZ_LS483315.1_558234_560883_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	cas3|803aa|up_6|NZ_LS483315.1_561036_563445_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|243aa|up_5|NZ_LS483315.1_563577_564306_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|632aa|up_4|NZ_LS483315.1_564305_566201_+	TIGR01863, CRISPR-associated_protein_CT1133_family, CRISPR-associated protein Cas8c/Csd1, subtype I-C/DVULG	cas7|283aa|up_3|NZ_LS483315.1_566205_567054_+	COG3649, COG3649, CRISPR system related protein [Defense mechanisms]	cas4|225aa|up_2|NZ_LS483315.1_567055_567730_+	COG1468, COG1468, CRISPR-associated protein Cas4 (RecB family exonuclease) [Defense    mechanisms]	cas1|342aa|up_1|NZ_LS483315.1_567726_568752_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas2|98aa|up_0|NZ_LS483315.1_568762_569056_+	COG1343, COG1343, CRISPR-associated protein Cas2 [Defense mechanisms]	NA|237aa|down_0|NZ_LS483315.1_569792_570503_+	COG0785, CcdA, Cytochrome c biogenesis protein [Posttranslational modification, protein turnover, chaperones]	NA|208aa|down_1|NZ_LS483315.1_570515_571139_+	cd02966, TlpA_like_family, TlpA-like family; composed of  TlpA, ResA, DsbE and similar proteins	NA|369aa|down_2|NZ_LS483315.1_571181_572288_+	PRK14018, PRK14018, bifunctional peptide-methionine (S)-S-oxide reductase MsrA/peptide-methionine (R)-S-oxide reductase MsrB	NA|247aa|down_3|NZ_LS483315.1_572378_573119_+	COG4753, COG4753, Response regulator containing CheY-like receiver domain and AraC-type DNA-binding domain [Signal transduction mechanisms]	NA|578aa|down_4|NZ_LS483315.1_573115_574849_+	COG2972, COG2972, Predicted signal transduction protein with a C-terminal ATPase domain [Signal transduction mechanisms]	NA|360aa|down_5|NZ_LS483315.1_574921_576001_+	COG2315, MmcQ, Uncharacterized protein conserved in bacteria [Function unknown]	NA|239aa|down_6|NZ_LS483315.1_576014_576731_+	COG3382, COG3382, Solo B3/4 domain (OB-fold DNA/RNA-binding) of Phe-aaRS-beta [General function prediction only]	NA|158aa|down_7|NZ_LS483315.1_576896_577370_-	COG1438, ArgR, Arginine repressor [Transcription]	NA|227aa|down_8|NZ_LS483315.1_577511_578192_+	COG0664, Crp, cAMP-binding proteins - catabolite gene activator and regulatory subunit of cAMP-dependent protein kinases [Signal transduction mechanisms]	NA|412aa|down_9|NZ_LS483315.1_578465_579701_+	PRK01388, PRK01388, arginine deiminase; Provisional
GCF_900474745.1_41800_E02	NZ_LS483315	Streptococcus pyogenes strain NCTC12059 chromosome 1	3	794214-794314	2	CRISPRCasFinder	no		cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	Orphan	TATAATTAGACTATACCAATTTT	23	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	NA|262aa|up_5|NZ_LS483315.1_785598_786384_-,NA	NA|498aa|up_9|NZ_LS483315.1_779448_780942_+	PRK14508, PRK14508, 4-alpha-glucanotransferase; Provisional	NA|755aa|up_8|NZ_LS483315.1_780976_783241_+	cd04300, GT35_Glycogen_Phosphorylase, glycogen phosphorylase and similar proteins	NA|207aa|up_7|NZ_LS483315.1_783496_784117_-	pfam12978, DUF3862, Domain of Unknown Function with PDB structure (DUF3862)	NA|205aa|up_6|NZ_LS483315.1_784857_785472_+	COG0398, COG0398, Uncharacterized conserved protein [Function unknown]	NA|262aa|up_5|NZ_LS483315.1_785598_786384_-	NA	NA|124aa|up_4|NZ_LS483315.1_787090_787462_-	COG1725, COG1725, Predicted transcriptional regulators [Transcription]	NA|1037aa|up_3|NZ_LS483315.1_787646_790757_+	PRK07279, dnaE, DNA polymerase III DnaE; Reviewed	NA|338aa|up_2|NZ_LS483315.1_790836_791850_+	PRK03202, PRK03202, ATP-dependent 6-phosphofructokinase	NA|501aa|up_1|NZ_LS483315.1_791912_793415_+	PRK05826, PRK05826, pyruvate kinase; Provisional	NA|186aa|up_0|NZ_LS483315.1_793632_794190_+	TIGR02227, Inactive_signal_peptidase_IA	NA|605aa|down_0|NZ_LS483315.1_794365_796180_+	PRK00331, PRK00331, isomerizing glutamine--fructose-6-phosphate transaminase	NA|112aa|down_1|NZ_LS483315.1_796375_796711_+	COG2824, PhnA, Uncharacterized Zn-ribbon-containing protein involved in phosphonate metabolism [Inorganic ion transport and metabolism]	NA|214aa|down_2|NZ_LS483315.1_796817_797459_+	COG0765, HisM, ABC-type amino acid transport system, permease component [Amino acid transport and metabolism]	NA|210aa|down_3|NZ_LS483315.1_797468_798098_+	COG1126, GlnQ, ABC-type polar amino acid transport system, ATPase component [Amino acid transport and metabolism]	NA|279aa|down_4|NZ_LS483315.1_798113_798950_+	cd00996, PBP2_AatB_like, Polar amino acids-binding domain of ATP-binding cassette transporter-like systems that belong to the type 2 periplasmic binding fold protein superfamily	NA|258aa|down_5|NZ_LS483315.1_799319_800093_+	pfam07373, CAMP_factor, CAMP factor (Cfa)	NA|412aa|down_6|NZ_LS483315.1_800462_801698_-	COG0053, MMT1, Predicted Co/Zn/Cd cation transporters [Inorganic ion transport and metabolism]	NA|441aa|down_7|NZ_LS483315.1_801817_803140_-	COG1115, AlsT, Na+/alanine symporter [Amino acid transport and metabolism]	NA|773aa|down_8|NZ_LS483315.1_803669_805988_+	TIGR01073, ATP-dependent_DNA_helicase_PcrA, ATP-dependent DNA helicase PcrA	NA|83aa|down_9|NZ_LS483315.1_806350_806599_+	COG2261, COG2261, Predicted membrane protein [Function unknown]
GCF_900474745.1_41800_E02	NZ_LS483315	Streptococcus pyogenes strain NCTC12059 chromosome 1	4	983370-983567	2	CRT	no	csn2,cas2,cas1,cas9	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	Type II-C,Type II-A,Type II-B	ACCTGGAAGACCATCTTT	18	0	0	NA	NA	NA	4	4	TypeII-C,TypeII-A,TypeII-B	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	NA,NA|214aa|down_9|NZ_LS483315.1_997158_997800_-	NA|466aa|up_9|NZ_LS483315.1_973342_974740_-	cd07100, ALDH_SSADH1_GabD1, Mycobacterium tuberculosis succinate-semialdehyde dehydrogenase 1-like	NA|349aa|up_8|NZ_LS483315.1_974852_975899_-	cd13546, PBP2_BitB, Substrate binding domain of a putative iron transporter BitB, a member of the type 2 periplasmic binding fold superfamily	NA|263aa|up_7|NZ_LS483315.1_975892_976681_-	COG4753, COG4753, Response regulator containing CheY-like receiver domain and AraC-type DNA-binding domain [Signal transduction mechanisms]	NA|550aa|up_6|NZ_LS483315.1_976684_978334_-	COG2972, COG2972, Predicted signal transduction protein with a C-terminal ATPase domain [Signal transduction mechanisms]	NA|276aa|up_5|NZ_LS483315.1_978469_979297_-	COG3716, ManZ, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IID [Carbohydrate transport and metabolism]	NA|270aa|up_4|NZ_LS483315.1_979293_980103_-	COG3715, ManY, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IIC [Carbohydrate transport and metabolism]	NA|164aa|up_3|NZ_LS483315.1_980119_980611_-	COG3444, COG3444, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IIB [Carbohydrate transport and metabolism]	NA|142aa|up_2|NZ_LS483315.1_980629_981055_-	COG2893, ManX, Phosphotransferase system, mannose/fructose-specific component IIA [Carbohydrate transport and metabolism]	NA|340aa|up_1|NZ_LS483315.1_981261_982281_-	COG2855, COG2855, Predicted membrane protein [Function unknown]	NA|146aa|up_0|NZ_LS483315.1_982410_982848_-	PRK00222, PRK00222, peptide-methionine (R)-S-oxide reductase MsrB	NA|611aa|down_0|NZ_LS483315.1_984585_986418_-	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	csn2|221aa|down_1|NZ_LS483315.1_987398_988061_-	cd09758, Csn2, CRISPR/Cas system-associated protein Csn2	cas2|114aa|down_2|NZ_LS483315.1_988050_988392_-	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	cas1|290aa|down_3|NZ_LS483315.1_988388_989258_-	cd09720, Cas1_II, CRISPR/Cas system-associated protein Cas1	cas9|1369aa|down_4|NZ_LS483315.1_989257_993364_-	COG3513, COG3513, Predicted CRISPR-associated nuclease, contains McrA/HNH-nuclease and RuvC-like nuclease domain [Defense mechanisms]	NA|211aa|down_5|NZ_LS483315.1_993807_994440_-	COG4478, COG4478, Predicted membrane protein [Function unknown]	NA|255aa|down_6|NZ_LS483315.1_994439_995204_-	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|251aa|down_7|NZ_LS483315.1_995203_995956_-	COG3884, FatA, Acyl-ACP thioesterase [Lipid metabolism]	NA|377aa|down_8|NZ_LS483315.1_995965_997096_-	PRK08599, PRK08599, oxygen-independent coproporphyrinogen III oxidase	NA|214aa|down_9|NZ_LS483315.1_997158_997800_-	NA
GCF_900474745.1_41800_E02	NZ_LS483315	Streptococcus pyogenes strain NCTC12059 chromosome 1	5	987063-987296	3,3,4	CRISPRCasFinder,CRT,PILER-CR	no	csn2,cas2,cas1,cas9	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	Type II-C,Type II-A,Type II-B	GTTTTGGGACCATTCAAAACAGCATAGCTCTAAAAC,GTTTTGGGACCATTCAAAACAGCATAGCTCTAAAAC,CTCCTAGTTTTGGGACCATTCAAAACAGCATAGCTCTAAAAC	36,36,42	0	0	NA	NA	II-A:II-A:II-A	3,3,2	3	TypeII-C,TypeII-A,TypeII-B	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	NA,NA|214aa|down_8|NZ_LS483315.1_997158_997800_-	NA|263aa|up_9|NZ_LS483315.1_975892_976681_-	COG4753, COG4753, Response regulator containing CheY-like receiver domain and AraC-type DNA-binding domain [Signal transduction mechanisms]	NA|550aa|up_8|NZ_LS483315.1_976684_978334_-	COG2972, COG2972, Predicted signal transduction protein with a C-terminal ATPase domain [Signal transduction mechanisms]	NA|276aa|up_7|NZ_LS483315.1_978469_979297_-	COG3716, ManZ, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IID [Carbohydrate transport and metabolism]	NA|270aa|up_6|NZ_LS483315.1_979293_980103_-	COG3715, ManY, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IIC [Carbohydrate transport and metabolism]	NA|164aa|up_5|NZ_LS483315.1_980119_980611_-	COG3444, COG3444, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IIB [Carbohydrate transport and metabolism]	NA|142aa|up_4|NZ_LS483315.1_980629_981055_-	COG2893, ManX, Phosphotransferase system, mannose/fructose-specific component IIA [Carbohydrate transport and metabolism]	NA|340aa|up_3|NZ_LS483315.1_981261_982281_-	COG2855, COG2855, Predicted membrane protein [Function unknown]	NA|146aa|up_2|NZ_LS483315.1_982410_982848_-	PRK00222, PRK00222, peptide-methionine (R)-S-oxide reductase MsrB	NA|459aa|up_1|NZ_LS483315.1_983033_984410_-	PRK12678, PRK12678, transcription termination factor Rho; Provisional	NA|611aa|up_0|NZ_LS483315.1_984585_986418_-	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	csn2|221aa|down_0|NZ_LS483315.1_987398_988061_-	cd09758, Csn2, CRISPR/Cas system-associated protein Csn2	cas2|114aa|down_1|NZ_LS483315.1_988050_988392_-	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	cas1|290aa|down_2|NZ_LS483315.1_988388_989258_-	cd09720, Cas1_II, CRISPR/Cas system-associated protein Cas1	cas9|1369aa|down_3|NZ_LS483315.1_989257_993364_-	COG3513, COG3513, Predicted CRISPR-associated nuclease, contains McrA/HNH-nuclease and RuvC-like nuclease domain [Defense mechanisms]	NA|211aa|down_4|NZ_LS483315.1_993807_994440_-	COG4478, COG4478, Predicted membrane protein [Function unknown]	NA|255aa|down_5|NZ_LS483315.1_994439_995204_-	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|251aa|down_6|NZ_LS483315.1_995203_995956_-	COG3884, FatA, Acyl-ACP thioesterase [Lipid metabolism]	NA|377aa|down_7|NZ_LS483315.1_995965_997096_-	PRK08599, PRK08599, oxygen-independent coproporphyrinogen III oxidase	NA|214aa|down_8|NZ_LS483315.1_997158_997800_-	NA	NA|452aa|down_9|NZ_LS483315.1_997923_999279_-	PRK14316, glmM, phosphoglucosamine mutase; Provisional
