assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000183345.1_ASM18334v1	NC_017634	Escherichia coli O83:H1 str. NRG 857C, complete sequence	1	144057-144140	1	CRISPRCasFinder	no		DEDDh,cas14j,DinG,cas1,cas3f,cas8f,cas5f,cas7f,cas6f,cas3,csa3,PD-DExK	Orphan	ACGCCGCATCCGGCACGAACAAA	23	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas14j,DinG,cas1,cas3f,cas8f,cas5f,cas7f,cas6f,cas3,csa3,PD-DExK	NA,NA	NA|888aa|up_9|NC_017634.1_128343_131007_+	PRK09405, aceE, pyruvate dehydrogenase subunit E1; Reviewed	NA|631aa|up_8|NC_017634.1_131021_132914_+	PRK11854, aceF, pyruvate dehydrogenase dihydrolipoyltransacetylase; Validated	NA|475aa|up_7|NC_017634.1_133121_134546_+	PRK06467, PRK06467, dihydrolipoamide dehydrogenase; Reviewed	NA|582aa|up_6|NC_017634.1_134787_136533_-	pfam11737, DUF3300, Protein of unknown function (DUF3300)	NA|866aa|up_5|NC_017634.1_136887_139485_+	PRK09238, PRK09238, bifunctional aconitate hydratase 2/2-methylisocitrate dehydratase; Validated	NA|121aa|up_4|NC_017634.1_139659_140022_+	PRK05248, PRK05248, hypothetical protein; Provisional	NA|265aa|up_3|NC_017634.1_140059_140854_-	PRK05462, PRK05462, adenosylmethionine decarboxylase	NA|289aa|up_2|NC_017634.1_140869_141736_-	PRK00811, PRK00811, polyamine aminopropyltransferase	NA|116aa|up_1|NC_017634.1_141841_142189_-	pfam09691, T2SS_PulS_OutS, Type II secretion system pilotin lipoprotein (PulS_OutS)	NA|517aa|up_0|NC_017634.1_142354_143905_+	PRK10965, PRK10965, multicopper oxidase; Provisional	NA|797aa|down_0|NC_017634.1_144169_146560_-	TIGR03074, PQQ_membr_DH, membrane-bound PQQ-dependent dehydrogenase, glucose/quinate/shikimate family	NA|179aa|down_1|NC_017634.1_146765_147302_+	PRK15423, PRK15423, hypoxanthine phosphoribosyltransferase; Provisional	NA|221aa|down_2|NC_017634.1_147342_148005_-	PRK10437, PRK10437, carbonic anhydrase; Provisional	NA|309aa|down_3|NC_017634.1_148113_149040_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|257aa|down_4|NC_017634.1_149036_149807_+	PRK15066, PRK15066, inner membrane transport permease; Provisional	NA|147aa|down_5|NC_017634.1_149911_150352_+	COG2893, ManX, Phosphotransferase system, mannose/fructose-specific component IIA [Carbohydrate transport and metabolism]	NA|410aa|down_6|NC_017634.1_150415_151645_+	cd10966, CE4_yadE_5s, Putative catalytic polysaccharide deacetylase domain of uncharacterized protein yadE and similar proteins	NA|127aa|down_7|NC_017634.1_151648_152029_-	TIGR00223, Aspartate_1-decarboxylase, L-aspartate-alpha-decarboxylase	NA|295aa|down_8|NC_017634.1_152302_153187_+	pfam04754, Transposase_31, Putative transposase, YhgA-like	NA|284aa|down_9|NC_017634.1_153268_154120_-	PRK00380, panC, pantoate--beta-alanine ligase; Reviewed
GCF_000183345.1_ASM18334v1	NC_017634	Escherichia coli O83:H1 str. NRG 857C, complete sequence	2	873114-873681	1,2,1	PILER-CR,CRISPRCasFinder,CRT	no	cas1,cas3f,cas8f,cas5f,cas7f,cas6f	DEDDh,cas14j,DinG,cas1,cas3f,cas8f,cas5f,cas7f,cas6f,cas3,csa3,PD-DExK	Type I-F	GTTCACTGCCGTACAGGCAGCTTAGAAA,GTTCACTGCCGTACAGGCAGCTTAGAAA,GTTCACTGCCGTACAGGCAGCTTAGAAA	28,28,28	0	0	NA	NA	I-F:I-F:I-F	8,9,9	9	TypeI-F	DEDDh,cas14j,DinG,cas1,cas3f,cas8f,cas5f,cas7f,cas6f,cas3,csa3,PD-DExK	NA,NA	NA|551aa|up_9|NC_017634.1_859522_861175_-	PRK05290, PRK05290, hybrid cluster protein; Provisional	NA|300aa|up_8|NC_017634.1_861318_862218_-	COG2431, COG2431, Predicted membrane protein [Function unknown]	NA|232aa|up_7|NC_017634.1_862712_863408_-	PRK05420, PRK05420, aquaporin Z; Provisional	NA|553aa|up_6|NC_017634.1_863833_865492_+	COG3593, COG3593, Predicted ATP-dependent endonuclease of the OLD family [DNA replication, recombination, and repair]	NA|319aa|up_5|NC_017634.1_865488_866445_-	COG2990, VirK, Uncharacterized protein conserved in bacteria [Function unknown]	NA|372aa|up_4|NC_017634.1_866595_867711_+	PRK11578, PRK11578, macrolide transporter subunit MacA; Provisional	NA|649aa|up_3|NC_017634.1_867707_869654_+	PRK10535, PRK10535, macrolide ABC transporter ATP-binding protein/permease MacB	NA|75aa|up_2|NC_017634.1_869726_869951_-	PRK09937, PRK09937, cold shock-like protein CspD	NA|107aa|up_1|NC_017634.1_870273_870594_+	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|759aa|up_0|NC_017634.1_870624_872901_+	PRK11034, clpA, ATP-dependent Clp protease ATP-binding subunit; Provisional	cas1|328aa|down_0|NC_017634.1_873853_874837_+	TIGR03637, cas1_YPEST, CRISPR-associated endonuclease Cas1, subtype I-F/YPEST	cas3f|1078aa|down_1|NC_017634.1_874833_878067_+	TIGR02562, conserved_hypothetical_protein, CRISPR-associated helicase Cas3, subtype I-F/YPEST	cas8f|436aa|down_2|NC_017634.1_878396_879704_+	cd09735, Csy1_I-F, CRISPR/Cas system-associated protein Csy1	cas5f|308aa|down_3|NC_017634.1_879700_880624_+	pfam09614, Cas_Csy2, CRISPR-associated protein (Cas_Csy2)	cas7f|334aa|down_4|NC_017634.1_880634_881636_+	pfam09615, Cas_Csy3, CRISPR-associated protein (Cas_Csy3)	cas6f|185aa|down_5|NC_017634.1_881646_882201_+	cd09739, Cas6_I-F, CRISPR/Cas system-associated RAMP superfamily protein Cas6f	NA|73aa|down_6|NC_017634.1_884142_884361_-	PRK00276, infA, translation initiation factor IF-1; Validated	NA|235aa|down_7|NC_017634.1_884645_885350_-	PRK00301, aat, leucyl/phenylalanyl-tRNA--protein transferase; Reviewed	NA|574aa|down_8|NC_017634.1_885391_887113_-	PRK11160, PRK11160, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|589aa|down_9|NC_017634.1_887113_888880_-	PRK11174, PRK11174, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed
GCF_000183345.1_ASM18334v1	NC_017634	Escherichia coli O83:H1 str. NRG 857C, complete sequence	3	882741-884030	2,3,2	PILER-CR,CRISPRCasFinder,CRT	no	cas1,cas3f,cas8f,cas5f,cas7f,cas6f	DEDDh,cas14j,DinG,cas1,cas3f,cas8f,cas5f,cas7f,cas6f,cas3,csa3,PD-DExK	Type I-F	GTTCACTGCCGTACAGGCAGCTTAGAAA,GTTCACTGCCGTACAGGCAGCTTAGAAA,GTTCACTGCCGTACAGGCAGCTTAGAAA	28,28,28	0	0	NA	NA	I-F:I-F:I-F	20,21,21	21	TypeI-F	DEDDh,cas14j,DinG,cas1,cas3f,cas8f,cas5f,cas7f,cas6f,cas3,csa3,PD-DExK	NA,NA	NA|649aa|up_9|NC_017634.1_867707_869654_+	PRK10535, PRK10535, macrolide ABC transporter ATP-binding protein/permease MacB	NA|75aa|up_8|NC_017634.1_869726_869951_-	PRK09937, PRK09937, cold shock-like protein CspD	NA|107aa|up_7|NC_017634.1_870273_870594_+	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|759aa|up_6|NC_017634.1_870624_872901_+	PRK11034, clpA, ATP-dependent Clp protease ATP-binding subunit; Provisional	cas1|328aa|up_5|NC_017634.1_873853_874837_+	TIGR03637, cas1_YPEST, CRISPR-associated endonuclease Cas1, subtype I-F/YPEST	cas3f|1078aa|up_4|NC_017634.1_874833_878067_+	TIGR02562, conserved_hypothetical_protein, CRISPR-associated helicase Cas3, subtype I-F/YPEST	cas8f|436aa|up_3|NC_017634.1_878396_879704_+	cd09735, Csy1_I-F, CRISPR/Cas system-associated protein Csy1	cas5f|308aa|up_2|NC_017634.1_879700_880624_+	pfam09614, Cas_Csy2, CRISPR-associated protein (Cas_Csy2)	cas7f|334aa|up_1|NC_017634.1_880634_881636_+	pfam09615, Cas_Csy3, CRISPR-associated protein (Cas_Csy3)	cas6f|185aa|up_0|NC_017634.1_881646_882201_+	cd09739, Cas6_I-F, CRISPR/Cas system-associated RAMP superfamily protein Cas6f	NA|73aa|down_0|NC_017634.1_884142_884361_-	PRK00276, infA, translation initiation factor IF-1; Validated	NA|235aa|down_1|NC_017634.1_884645_885350_-	PRK00301, aat, leucyl/phenylalanyl-tRNA--protein transferase; Reviewed	NA|574aa|down_2|NC_017634.1_885391_887113_-	PRK11160, PRK11160, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|589aa|down_3|NC_017634.1_887113_888880_-	PRK11174, PRK11174, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|322aa|down_4|NC_017634.1_889002_889968_-	PRK10262, PRK10262, thioredoxin reductase; Provisional	NA|165aa|down_5|NC_017634.1_890511_891006_+	PRK11169, PRK11169, leucine-responsive transcriptional regulator Lrp	NA|1351aa|down_6|NC_017634.1_891140_895193_+	PRK10263, PRK10263, DNA translocase FtsK; Provisional	NA|204aa|down_7|NC_017634.1_895351_895963_+	TIGR00547, Outer-membrane_lipoprotein_carrier_protein, periplasmic chaperone LolA	NA|448aa|down_8|NC_017634.1_895973_897317_+	PRK13342, PRK13342, recombination factor protein RarA; Reviewed	NA|431aa|down_9|NC_017634.1_897407_898700_+	PRK05431, PRK05431, seryl-tRNA synthetase; Provisional
GCF_000183345.1_ASM18334v1	NC_017634	Escherichia coli O83:H1 str. NRG 857C, complete sequence	4	2369407-2369520	4	CRISPRCasFinder	no		DEDDh,cas14j,DinG,cas1,cas3f,cas8f,cas5f,cas7f,cas6f,cas3,csa3,PD-DExK	Orphan	TTTGTAGGCCGGATAAGCGAAGCGCATCCGGCA	33	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas14j,DinG,cas1,cas3f,cas8f,cas5f,cas7f,cas6f,cas3,csa3,PD-DExK	NA,NA	NA|395aa|up_9|NC_017634.1_2348309_2349494_+	PRK05790, PRK05790, putative acyltransferase; Provisional	NA|259aa|up_8|NC_017634.1_2349567_2350344_-	COG4676, COG4676, Uncharacterized protein conserved in bacteria [Function unknown]	NA|550aa|up_7|NC_017634.1_2350348_2351998_-	COG5445, COG5445, Predicted secreted protein [Function unknown]	NA|1505aa|up_6|NC_017634.1_2351998_2356513_-	COG2373, COG2373, Large extracellular alpha-helical protein [General function prediction only]	NA|208aa|up_5|NC_017634.1_2356536_2357160_-	COG3234, COG3234, Uncharacterized protein conserved in bacteria [Function unknown]	NA|563aa|up_4|NC_017634.1_2357156_2358845_-	COG4685, COG4685, Uncharacterized protein conserved in bacteria [Function unknown]	NA|876aa|up_3|NC_017634.1_2358993_2361621_-	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|241aa|up_2|NC_017634.1_2361767_2362490_+	PRK05134, PRK05134, bifunctional 2-polyprenyl-6-hydroxyphenol methylase/3-demethylubiquinol 3-O-methyltransferase UbiG	NA|1253aa|up_1|NC_017634.1_2362629_2366388_-	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|762aa|up_0|NC_017634.1_2367069_2369355_+	PRK09103, PRK09103, ribonucleoside-diphosphate reductase subunit alpha	NA|377aa|down_0|NC_017634.1_2369544_2370675_+	PRK09101, nrdB, ribonucleotide-diphosphate reductase subunit beta; Reviewed	NA|85aa|down_1|NC_017634.1_2370674_2370929_+	PRK10713, PRK10713, 2Fe-2S ferredoxin-like protein	NA|217aa|down_2|NC_017634.1_2370982_2371633_-	PRK09902, PRK09902, lipopolysaccharide kinase InaA	NA|359aa|down_3|NC_017634.1_2371835_2372912_-	PRK11143, glpQ, glycerophosphodiester phosphodiesterase; Provisional	NA|453aa|down_4|NC_017634.1_2372916_2374275_-	PRK11273, glpT, glycerol-3-phosphate transporter	NA|543aa|down_5|NC_017634.1_2374547_2376176_+	PRK11101, glpA, anaerobic glycerol-3-phosphate dehydrogenase subunit A	NA|420aa|down_6|NC_017634.1_2376165_2377425_+	COG3075, GlpB, Anaerobic glycerol-3-phosphate dehydrogenase [Amino acid transport and metabolism]	NA|397aa|down_7|NC_017634.1_2377421_2378612_+	TIGR03379, glycerol3P_GlpC, glycerol-3-phosphate dehydrogenase, anaerobic, C subunit	NA|320aa|down_8|NC_017634.1_2378804_2379764_+	PRK09956, PRK09956, ISNCY family transposase	NA|66aa|down_9|NC_017634.1_2379776_2379974_+	PRK09956, PRK09956, ISNCY family transposase
GCF_000183345.1_ASM18334v1	NC_017634	Escherichia coli O83:H1 str. NRG 857C, complete sequence	5	4609610-4609749	5	CRISPRCasFinder	no		DEDDh,cas14j,DinG,cas1,cas3f,cas8f,cas5f,cas7f,cas6f,cas3,csa3,PD-DExK	Orphan	TGTGTAGGTCGGATAAGGCGTTCACGTCGCATCCGACAATAACA	44	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas14j,DinG,cas1,cas3f,cas8f,cas5f,cas7f,cas6f,cas3,csa3,PD-DExK	NA,NA	NA|335aa|up_9|NC_017634.1_4598154_4599159_-	PRK02102, PRK02102, ornithine carbamoyltransferase; Validated	NA|315aa|up_8|NC_017634.1_4599169_4600114_-	PRK12354, PRK12354, carbamate kinase; Reviewed	NA|407aa|up_7|NC_017634.1_4600124_4601345_-	PRK01388, PRK01388, arginine deiminase; Provisional	NA|151aa|up_6|NC_017634.1_4602022_4602475_+	COG2731, EbgC, Beta-galactosidase, beta subunit [Carbohydrate transport and metabolism]	NA|335aa|up_5|NC_017634.1_4602519_4603524_-	PRK03515, PRK03515, ornithine carbamoyltransferase subunit I; Provisional	NA|139aa|up_4|NC_017634.1_4603685_4604102_+	PRK11191, PRK11191, ribonuclease E inhibitor RraB	NA|168aa|up_3|NC_017634.1_4604279_4604783_-	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|396aa|up_2|NC_017634.1_4604975_4606163_+	COG4269, COG4269, Predicted membrane protein [Function unknown]	NA|952aa|up_1|NC_017634.1_4606209_4609065_-	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|148aa|up_0|NC_017634.1_4609064_4609508_-	PRK05728, PRK05728, DNA polymerase III subunit chi; Validated	NA|504aa|down_0|NC_017634.1_4609765_4611277_-	PRK00913, PRK00913, multifunctional aminopeptidase A; Provisional	NA|367aa|down_1|NC_017634.1_4611543_4612644_+	PRK15120, PRK15120, lipopolysaccharide ABC transporter permease LptF; Provisional	NA|361aa|down_2|NC_017634.1_4612643_4613726_+	PRK15071, PRK15071, lipopolysaccharide ABC transporter permease; Provisional	NA|501aa|down_3|NC_017634.1_4613886_4615389_-	pfam05872, DUF853, Bacterial protein of unknown function (DUF853)	NA|333aa|down_4|NC_017634.1_4615466_4616465_-	cd01575, PBP1_GntR, ligand-binding domain of DNA transcription repressor GntR specific for gluconate, a member of the LacI-GalR family of bacterial transcription regulators	NA|440aa|down_5|NC_017634.1_4616531_4617851_-	TIGR00791, Gluconate_permease, gluconate transporter	NA|255aa|down_6|NC_017634.1_4617915_4618680_-	PRK08085, PRK08085, gluconate 5-dehydrogenase; Provisional	NA|344aa|down_7|NC_017634.1_4618703_4619735_-	PRK09880, PRK09880, L-idonate 5-dehydrogenase; Provisional	NA|188aa|down_8|NC_017634.1_4619951_4620515_+	PRK09825, idnK, gluconokinase	NA|340aa|down_9|NC_017634.1_4620518_4621538_-	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)
