assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001039695.1_emm89-1	NZ_HG316453	Streptococcus pyogenes strain H293	1	118051-118147	1	CRISPRCasFinder	no		cas3,DinG,csm6,cas9,cas1,cas2,csn2,cas4,cas7,cas8c,cas5,DEDDh,csa3	Orphan	GCTAGATGGTGAAGAAGTCCCAGAA	25	0	0	NA	NA	NA	1	1	Orphan	cas3,DinG,csm6,cas9,cas1,cas2,csn2,cas4,cas7,cas8c,cas5,DEDDh,csa3	NA,NA|222aa|down_8|NZ_HG316453.1_131001_131667_-	NA|257aa|up_9|NZ_HG316453.1_108368_109139_-	PRK11880, PRK11880, pyrroline-5-carboxylate reductase; Reviewed	NA|356aa|up_8|NZ_HG316453.1_109186_110254_-	TIGR03107, Glutamyl_aminopeptidase, glutamyl aminopeptidase	NA|98aa|up_7|NZ_HG316453.1_110709_111003_+	pfam15513, DUF4651, Domain of unknown function (DUF4651)	NA|106aa|up_6|NZ_HG316453.1_110999_111317_+	cd02947, TRX_family, TRX family; composed of two groups: Group I, which includes proteins that exclusively encode a TRX domain; and Group II, which are composed of fusion proteins of TRX and additional domains	NA|209aa|up_5|NZ_HG316453.1_111334_111961_+	cd02796, tRNA_bind_bactPheRS, tRNA-binding-domain-containing prokaryotic phenylalanly tRNA synthetase (PheRS) beta chain	NA|132aa|up_4|NZ_HG316453.1_112112_112508_+	PRK07274, PRK07274, single-stranded DNA-binding protein; Provisional	NA|214aa|up_3|NZ_HG316453.1_112761_113403_-	COG1428, COG1428, Deoxynucleoside kinases [Nucleotide transport and metabolism]	NA|326aa|up_2|NZ_HG316453.1_113422_114400_-	TIGR00737, Probable_tRNA-dihydrouridine_synthase, putative TIM-barrel protein, nifR3 family	NA|291aa|up_1|NZ_HG316453.1_114386_115259_-	PRK00114, hslO, Hsp33 family molecular chaperone HslO	NA|498aa|up_0|NZ_HG316453.1_115405_116899_-	pfam08270, PRD_Mga, M protein trans-acting positive regulator (MGA) PRD domain	NA|283aa|down_0|NZ_HG316453.1_119274_120123_+	cd05827, Sortase_C, Sortase domain found in class C sortases	NA|754aa|down_1|NZ_HG316453.1_120408_122670_+	NF033396, pilus_ancill_1, pilus ancillary protein 1	NA|174aa|down_2|NZ_HG316453.1_122666_123188_+	TIGR02227, Inactive_signal_peptidase_IA	NA|350aa|down_3|NZ_HG316453.1_123209_124259_+	TIGR03786, strep_pil_rpt, streptococcal pilin isopeptide linkage domain	NA|242aa|down_4|NZ_HG316453.1_124274_125000_+	TIGR03064, sortase_srtB, sortase, SrtB family	NA|196aa|down_5|NZ_HG316453.1_125016_125604_+	TIGR03786, strep_pil_rpt, streptococcal pilin isopeptide linkage domain	NA|402aa|down_6|NZ_HG316453.1_125762_126968_-	TIGR04094, AraC_family_transcriptional_regulator, YSIRK-targeted surface antigen transcriptional regulator	NA|1126aa|down_7|NZ_HG316453.1_127358_130736_+	pfam05738, Cna_B, Cna protein B-type domain	NA|222aa|down_8|NZ_HG316453.1_131001_131667_-	NA	NA|469aa|down_9|NZ_HG316453.1_132019_133426_+	COG2031, AtoE, Short chain fatty acids transporter [Lipid metabolism]
GCF_001039695.1_emm89-1	NZ_HG316453	Streptococcus pyogenes strain H293	2	770899-771264	1,2,1	PILER-CR,CRISPRCasFinder,CRT	no	cas9,cas1,cas2,csn2	cas3,DinG,csm6,cas9,cas1,cas2,csn2,cas4,cas7,cas8c,cas5,DEDDh,csa3	Type II-A,Type II-C,Type II-B	GTTTTAGAGCTATGCTGTTTTGAATGGTCCCAAAAC,GTTTTAGAGCTATGCTGTTTTGAATGGTCCCAAAAC,GTTTTAGAGCTATGCTGTTTTGAATGGTCCCAAAAC	36,36,36	0	0	NA	NA	II-A:II-A:II-A	4,5,5	5	TypeII-A,TypeII-C,TypeII-B	cas3,DinG,csm6,cas9,cas1,cas2,csn2,cas4,cas7,cas8c,cas5,DEDDh,csa3	NA|214aa|up_8|NZ_HG316453.1_760360_761002_+,NA	NA|452aa|up_9|NZ_HG316453.1_758881_760237_+	PRK14316, glmM, phosphoglucosamine mutase; Provisional	NA|214aa|up_8|NZ_HG316453.1_760360_761002_+	NA	NA|377aa|up_7|NZ_HG316453.1_761064_762195_+	PRK08599, PRK08599, oxygen-independent coproporphyrinogen III oxidase	NA|251aa|up_6|NZ_HG316453.1_762204_762957_+	COG3884, FatA, Acyl-ACP thioesterase [Lipid metabolism]	NA|255aa|up_5|NZ_HG316453.1_762956_763721_+	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|211aa|up_4|NZ_HG316453.1_763720_764353_+	COG4478, COG4478, Predicted membrane protein [Function unknown]	cas9|1369aa|up_3|NZ_HG316453.1_764830_768937_+	COG3513, COG3513, Predicted CRISPR-associated nuclease, contains McrA/HNH-nuclease and RuvC-like nuclease domain [Defense mechanisms]	cas1|290aa|up_2|NZ_HG316453.1_768936_769806_+	cd09720, Cas1_II, CRISPR/Cas system-associated protein Cas1	cas2|114aa|up_1|NZ_HG316453.1_769802_770144_+	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	csn2|221aa|up_0|NZ_HG316453.1_770133_770796_+	cd09758, Csn2, CRISPR/Cas system-associated protein Csn2	NA|611aa|down_0|NZ_HG316453.1_771907_773740_+	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	NA|372aa|down_1|NZ_HG316453.1_774138_775254_+	PRK12678, PRK12678, transcription termination factor Rho; Provisional	NA|146aa|down_2|NZ_HG316453.1_775453_775891_+	PRK00222, PRK00222, peptide-methionine (R)-S-oxide reductase MsrB	NA|340aa|down_3|NZ_HG316453.1_776020_777040_+	COG2855, COG2855, Predicted membrane protein [Function unknown]	NA|142aa|down_4|NZ_HG316453.1_777246_777672_+	COG2893, ManX, Phosphotransferase system, mannose/fructose-specific component IIA [Carbohydrate transport and metabolism]	NA|164aa|down_5|NZ_HG316453.1_777690_778182_+	COG3444, COG3444, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IIB [Carbohydrate transport and metabolism]	NA|270aa|down_6|NZ_HG316453.1_778198_779008_+	COG3715, ManY, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IIC [Carbohydrate transport and metabolism]	NA|276aa|down_7|NZ_HG316453.1_779004_779832_+	COG3716, ManZ, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IID [Carbohydrate transport and metabolism]	NA|550aa|down_8|NZ_HG316453.1_779967_781617_+	COG2972, COG2972, Predicted signal transduction protein with a C-terminal ATPase domain [Signal transduction mechanisms]	NA|263aa|down_9|NZ_HG316453.1_781620_782409_+	COG4753, COG4753, Response regulator containing CheY-like receiver domain and AraC-type DNA-binding domain [Signal transduction mechanisms]
GCF_001039695.1_emm89-1	NZ_HG316453	Streptococcus pyogenes strain H293	3	967214-967315	3	CRISPRCasFinder	no		cas3,DinG,csm6,cas9,cas1,cas2,csn2,cas4,cas7,cas8c,cas5,DEDDh,csa3	Orphan	AATAATTGGTATAGTCTAATTATA	24	0	0	NA	NA	NA	1	1	Orphan	cas3,DinG,csm6,cas9,cas1,cas2,csn2,cas4,cas7,cas8c,cas5,DEDDh,csa3	NA,NA|262aa|down_6|NZ_HG316453.1_975145_975931_+	NA|83aa|up_9|NZ_HG316453.1_954930_955179_-	COG2261, COG2261, Predicted membrane protein [Function unknown]	NA|773aa|up_8|NZ_HG316453.1_955541_957860_-	TIGR01073, ATP-dependent_DNA_helicase_PcrA, ATP-dependent DNA helicase PcrA	NA|441aa|up_7|NZ_HG316453.1_958388_959711_+	COG1115, AlsT, Na+/alanine symporter [Amino acid transport and metabolism]	NA|412aa|up_6|NZ_HG316453.1_959830_961066_+	COG0053, MMT1, Predicted Co/Zn/Cd cation transporters [Inorganic ion transport and metabolism]	NA|258aa|up_5|NZ_HG316453.1_961435_962209_-	pfam07373, CAMP_factor, CAMP factor (Cfa)	NA|279aa|up_4|NZ_HG316453.1_962578_963415_-	cd00996, PBP2_AatB_like, Polar amino acids-binding domain of ATP-binding cassette transporter-like systems that belong to the type 2 periplasmic binding fold protein superfamily	NA|210aa|up_3|NZ_HG316453.1_963430_964060_-	COG1126, GlnQ, ABC-type polar amino acid transport system, ATPase component [Amino acid transport and metabolism]	NA|214aa|up_2|NZ_HG316453.1_964069_964711_-	COG0765, HisM, ABC-type amino acid transport system, permease component [Amino acid transport and metabolism]	NA|112aa|up_1|NZ_HG316453.1_964817_965153_-	COG2824, PhnA, Uncharacterized Zn-ribbon-containing protein involved in phosphonate metabolism [Inorganic ion transport and metabolism]	NA|605aa|up_0|NZ_HG316453.1_965348_967163_-	PRK00331, PRK00331, isomerizing glutamine--fructose-6-phosphate transaminase	NA|186aa|down_0|NZ_HG316453.1_967338_967896_-	TIGR02227, Inactive_signal_peptidase_IA	NA|501aa|down_1|NZ_HG316453.1_968113_969616_-	PRK05826, PRK05826, pyruvate kinase; Provisional	NA|338aa|down_2|NZ_HG316453.1_969678_970692_-	PRK03202, PRK03202, ATP-dependent 6-phosphofructokinase	NA|1037aa|down_3|NZ_HG316453.1_970771_973882_-	PRK07279, dnaE, DNA polymerase III DnaE; Reviewed	NA|124aa|down_4|NZ_HG316453.1_974066_974438_+	COG1725, COG1725, Predicted transcriptional regulators [Transcription]	NA|233aa|down_5|NZ_HG316453.1_974437_975136_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|262aa|down_6|NZ_HG316453.1_975145_975931_+	NA	NA|205aa|down_7|NZ_HG316453.1_976061_976676_-	COG0398, COG0398, Uncharacterized conserved protein [Function unknown]	NA|207aa|down_8|NZ_HG316453.1_977416_978037_+	pfam12978, DUF3862, Domain of Unknown Function with PDB structure (DUF3862)	NA|755aa|down_9|NZ_HG316453.1_978293_980558_-	cd04300, GT35_Glycogen_Phosphorylase, glycogen phosphorylase and similar proteins
GCF_001039695.1_emm89-1	NZ_HG316453	Streptococcus pyogenes strain H293	4	1161892-1162786	4,2,2	CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas4,cas7,cas8c,cas5,cas3	cas3,DinG,csm6,cas9,cas1,cas2,csn2,cas4,cas7,cas8c,cas5,DEDDh,csa3	 Type I-U?,Type I-C,Type I-U	ATTTCAATCCACTCACCCATGAAGGGTGAGAC,ATTTCAATCCACTCACCCATGAAGGGTGAGAC,ATTTCAATCCACTCACCCATGAAGGGTGAGAC	32,32,32	0	0	NA	NA	I-C:I-C:I-C	13,13,13	13	TypeI-U?,TypeI-C,TypeI-U	cas3,DinG,csm6,cas9,cas1,cas2,csn2,cas4,cas7,cas8c,cas5,DEDDh,csa3	NA,NA	NA|412aa|up_9|NZ_HG316453.1_1151826_1153062_-	PRK01388, PRK01388, arginine deiminase; Provisional	NA|227aa|up_8|NZ_HG316453.1_1153335_1154016_-	COG0664, Crp, cAMP-binding proteins - catabolite gene activator and regulatory subunit of cAMP-dependent protein kinases [Signal transduction mechanisms]	NA|158aa|up_7|NZ_HG316453.1_1154157_1154631_+	COG1438, ArgR, Arginine repressor [Transcription]	NA|239aa|up_6|NZ_HG316453.1_1154796_1155513_-	COG3382, COG3382, Solo B3/4 domain (OB-fold DNA/RNA-binding) of Phe-aaRS-beta [General function prediction only]	NA|360aa|up_5|NZ_HG316453.1_1155526_1156606_-	COG2315, MmcQ, Uncharacterized protein conserved in bacteria [Function unknown]	NA|578aa|up_4|NZ_HG316453.1_1156678_1158412_-	COG2972, COG2972, Predicted signal transduction protein with a C-terminal ATPase domain [Signal transduction mechanisms]	NA|247aa|up_3|NZ_HG316453.1_1158408_1159149_-	COG4753, COG4753, Response regulator containing CheY-like receiver domain and AraC-type DNA-binding domain [Signal transduction mechanisms]	NA|369aa|up_2|NZ_HG316453.1_1159236_1160343_-	PRK14018, PRK14018, bifunctional peptide-methionine (S)-S-oxide reductase MsrA/peptide-methionine (R)-S-oxide reductase MsrB	NA|208aa|up_1|NZ_HG316453.1_1160385_1161009_-	cd02966, TlpA_like_family, TlpA-like family; composed of  TlpA, ResA, DsbE and similar proteins	NA|237aa|up_0|NZ_HG316453.1_1161021_1161732_-	COG0785, CcdA, Cytochrome c biogenesis protein [Posttranslational modification, protein turnover, chaperones]	cas2|98aa|down_0|NZ_HG316453.1_1162934_1163228_-	COG1343, COG1343, CRISPR-associated protein Cas2 [Defense mechanisms]	cas1|342aa|down_1|NZ_HG316453.1_1163238_1164264_-	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas4|225aa|down_2|NZ_HG316453.1_1164260_1164935_-	COG1468, COG1468, CRISPR-associated protein Cas4 (RecB family exonuclease) [Defense    mechanisms]	cas7|283aa|down_3|NZ_HG316453.1_1164936_1165785_-	COG3649, COG3649, CRISPR system related protein [Defense mechanisms]	cas8c|632aa|down_4|NZ_HG316453.1_1165789_1167685_-	TIGR01863, CRISPR-associated_protein_CT1133_family, CRISPR-associated protein Cas8c/Csd1, subtype I-C/DVULG	cas5|243aa|down_5|NZ_HG316453.1_1167684_1168413_-	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas3|803aa|down_6|NZ_HG316453.1_1168545_1170954_-	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	NA|883aa|down_7|NZ_HG316453.1_1171107_1173756_-	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|188aa|down_8|NZ_HG316453.1_1173757_1174321_-	pfam13238, AAA_18, AAA domain	NA|132aa|down_9|NZ_HG316453.1_1174921_1175317_-	PRK07758, PRK07758, hypothetical protein; Provisional
GCF_001039695.1_emm89-1	NZ_HG316453	Streptococcus pyogenes strain H293	5	1557083-1557274	3	CRT	no		cas3,DinG,csm6,cas9,cas1,cas2,csn2,cas4,cas7,cas8c,cas5,DEDDh,csa3	Orphan	TGATGGAGATGGGGTTTC	18	0	0	NA	NA	NA	3	3	Orphan	cas3,DinG,csm6,cas9,cas1,cas2,csn2,cas4,cas7,cas8c,cas5,DEDDh,csa3	NA|75aa|up_8|NZ_HG316453.1_1547067_1547292_-,NA|84aa|down_5|NZ_HG316453.1_1568127_1568379_-	NA|234aa|up_9|NZ_HG316453.1_1546040_1546742_+	pfam02876, Stap_Strp_tox_C, Staphylococcal/Streptococcal toxin, beta-grasp domain	NA|75aa|up_8|NZ_HG316453.1_1547067_1547292_-	NA	NA|543aa|up_7|NZ_HG316453.1_1547470_1549099_+	cd08518, PBP2_NikA_DppA_OppA_like_19, The substrate-binding component of an uncharacterized ABC-type nickel/dipeptide/oligopeptide-like import system contains the type 2 periplasmic binding fold	NA|326aa|up_6|NZ_HG316453.1_1549211_1550189_+	COG0601, DppB, ABC-type dipeptide/oligopeptide/nickel transport systems, permease components [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|274aa|up_5|NZ_HG316453.1_1550185_1551007_+	COG1173, DppC, ABC-type dipeptide/oligopeptide/nickel transport systems, permease components [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|268aa|up_4|NZ_HG316453.1_1551018_1551822_+	COG0444, DppD, ABC-type dipeptide/oligopeptide/nickel transport system, ATPase component [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|209aa|up_3|NZ_HG316453.1_1551805_1552432_+	COG1124, DppF, ABC-type dipeptide/oligopeptide/nickel transport system, ATPase component [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|67aa|up_2|NZ_HG316453.1_1552511_1552712_-	COG3237, COG3237, Uncharacterized protein conserved in bacteria [Function unknown]	NA|824aa|up_1|NZ_HG316453.1_1552880_1555352_-	TIGR01363, pneumococcal_histidine_triad_A_protein, streptococcal histidine triad protein	NA|307aa|up_0|NZ_HG316453.1_1555364_1556285_-	cd01017, AdcA, Metal binding protein AdcA	NA|1183aa|down_0|NZ_HG316453.1_1557868_1561417_-	cd07475, Peptidases_S8_C5a_Peptidase, Peptidase S8 family domain in Streptococcal C5a peptidases	NA|369aa|down_1|NZ_HG316453.1_1561751_1562858_-	COG1196, Smc, Chromosome segregation ATPases [Cell division and chromosome partitioning]	NA|368aa|down_2|NZ_HG316453.1_1563067_1564171_-	COG1196, Smc, Chromosome segregation ATPases [Cell division and chromosome partitioning]	NA|426aa|down_3|NZ_HG316453.1_1564395_1565673_-	COG1196, Smc, Chromosome segregation ATPases [Cell division and chromosome partitioning]	NA|531aa|down_4|NZ_HG316453.1_1565859_1567452_-	pfam08270, PRD_Mga, M protein trans-acting positive regulator (MGA) PRD domain	NA|84aa|down_5|NZ_HG316453.1_1568127_1568379_-	NA	NA|543aa|down_6|NZ_HG316453.1_1568456_1570085_-	COG3942, COG3942, Surface antigen [General function prediction only]	NA|463aa|down_7|NZ_HG316453.1_1570186_1571575_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|218aa|down_8|NZ_HG316453.1_1571571_1572225_-	COG0745, OmpR, Response regulators consisting of a CheY-like receiver domain and a winged-helix DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|406aa|down_9|NZ_HG316453.1_1572318_1573536_-	PRK10535, PRK10535, macrolide ABC transporter ATP-binding protein/permease MacB
