assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000167875.2_ASM16787v2	NZ_CP035751	Escherichia coli E110019 chromosome, complete genome	1	513286-513399	1	PILER-CR	no		DEDDh,DinG,RT,cas3,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK	Orphan	TTTTTTTACCTGATTCGGGTAAA	23	0	0	NA	NA	NA	2	2	Orphan	DEDDh,DinG,RT,cas3,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK	NA|50aa|up_3|NZ_CP035751.1_511225_511375_-,NA|101aa|up_1|NZ_CP035751.1_511822_512125_-,NA|94aa|down_9|NZ_CP035751.1_518828_519110_+	NA|182aa|up_9|NZ_CP035751.1_504893_505439_-	pfam07471, Phage_Nu1, Phage DNA packaging protein Nu1	NA|65aa|up_8|NZ_CP035751.1_505827_506022_+	pfam13132, DUF3950, Domain of unknown function (DUF3950)	NA|405aa|up_7|NZ_CP035751.1_506499_507713_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|266aa|up_6|NZ_CP035751.1_507818_508616_-	smart00342, HTH_ARAC, helix_turn_helix, arabinose operon control protein	NA|184aa|up_5|NZ_CP035751.1_508625_509177_-	PRK09818, PRK09818, kinase inhibitor	NA|509aa|up_4|NZ_CP035751.1_509641_511168_-	cd00338, Ser_Recombinase, Serine Recombinase family, catalytic domain; a DNA binding domain may be present either N- or C-terminal to the catalytic domain	NA|50aa|up_3|NZ_CP035751.1_511225_511375_-	NA	NA|111aa|up_2|NZ_CP035751.1_511422_511755_-	PRK09541, emrE, EmrE family multidrug efflux SMR transporter	NA|101aa|up_1|NZ_CP035751.1_511822_512125_-	NA	NA|234aa|up_0|NZ_CP035751.1_512121_512823_-	pfam06992, Phage_lambda_P, Replication protein P	NA|180aa|down_0|NZ_CP035751.1_513835_514375_-	pfam06254, YdaT_toxin, Putative bacterial toxin ydaT	NA|77aa|down_1|NZ_CP035751.1_514443_514674_-	pfam15943, YdaS_antitoxin, Putative antitoxin of bacterial toxin-antitoxin system, YdaS/YdaT	NA|252aa|down_2|NZ_CP035751.1_514712_515468_+	COG2932, COG2932, Predicted transcriptional regulator [Transcription]	NA|69aa|down_3|NZ_CP035751.1_516063_516270_+	PRK11354, kil, FtsZ inhibitor protein; Reviewed	NA|99aa|down_4|NZ_CP035751.1_516345_516642_+	pfam06064, Gam, Host-nuclease inhibitor protein Gam	NA|262aa|down_5|NZ_CP035751.1_516647_517433_+	TIGR01913, Uncharacterized_protein_UU154, phage recombination protein Bet	NA|227aa|down_6|NZ_CP035751.1_517429_518110_+	pfam09588, YqaJ, YqaJ-like viral recombinase domain	NA|54aa|down_7|NZ_CP035751.1_518106_518268_+	pfam07026, DUF1317, Protein of unknown function (DUF1317)	NA|186aa|down_8|NZ_CP035751.1_518260_518818_+	pfam05869, Dam, DNA N-6-adenine-methyltransferase (Dam)	NA|94aa|down_9|NZ_CP035751.1_518828_519110_+	NA
GCF_000167875.2_ASM16787v2	NZ_CP035751	Escherichia coli E110019 chromosome, complete genome	2	2509873-2510018	1	CRISPRCasFinder	no		DEDDh,DinG,RT,cas3,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK	Orphan	TAAGACGCGAACAGCGTCGCATCAGGCACACTGCCAATGTCGGATGCGG	49	0	0	NA	NA	NA	1	1	Orphan	DEDDh,DinG,RT,cas3,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK	NA,NA|22aa|down_2|NZ_CP035751.1_2511806_2511872_-	NA|214aa|up_9|NZ_CP035751.1_2497709_2498351_-	PRK05718, PRK05718, keto-hydroxyglutarate-aldolase/keto-deoxy-phosphogluconate aldolase; Provisional	NA|604aa|up_8|NZ_CP035751.1_2498387_2500199_-	PRK09054, PRK09054, phosphogluconate dehydratase; Validated	NA|492aa|up_7|NZ_CP035751.1_2500433_2501909_-	PRK05722, PRK05722, glucose-6-phosphate 1-dehydrogenase; Validated	NA|290aa|up_6|NZ_CP035751.1_2502246_2503116_+	PRK11302, PRK11302, DNA-binding transcriptional regulator HexR; Provisional	NA|481aa|up_5|NZ_CP035751.1_2503243_2504686_+	PRK05826, PRK05826, pyruvate kinase; Provisional	NA|324aa|up_4|NZ_CP035751.1_2504816_2505788_-	PRK08943, PRK08943, lipid A biosynthesis (KDO)2-(lauroyl)-lipid IVA acyltransferase; Validated	NA|441aa|up_3|NZ_CP035751.1_2505907_2507230_-	PRK11649, PRK11649, putative peptidase; Provisional	NA|311aa|up_2|NZ_CP035751.1_2507245_2508178_-	PRK09545, znuA, zinc ABC transporter substrate-binding protein ZnuA	NA|252aa|up_1|NZ_CP035751.1_2508256_2509012_+	PRK09544, znuC, high-affinity zinc transporter ATPase; Reviewed	NA|262aa|up_0|NZ_CP035751.1_2509008_2509794_+	PRK09543, znuB, zinc ABC transporter permease subunit ZnuB	NA|337aa|down_0|NZ_CP035751.1_2510037_2511048_-	PRK00080, ruvB, Holliday junction branch migration DNA helicase RuvB	NA|204aa|down_1|NZ_CP035751.1_2511056_2511668_-	PRK00116, ruvA, Holliday junction branch migration protein RuvA	NA|22aa|down_2|NZ_CP035751.1_2511806_2511872_-	NA	NA|201aa|down_3|NZ_CP035751.1_2511943_2512546_+	PRK11470, PRK11470, YebB family permuted papain-like enzyme	NA|174aa|down_4|NZ_CP035751.1_2512547_2513069_-	TIGR00228, Crossover_junction_endodeoxyribonuclease_RuvC, crossover junction endodeoxyribonuclease RuvC	NA|247aa|down_5|NZ_CP035751.1_2513103_2513844_-	PRK00110, PRK00110, YebC/PmpR family DNA-binding transcriptional regulator	NA|151aa|down_6|NZ_CP035751.1_2513872_2514325_-	PRK09438, nudB, dihydroneopterin triphosphate pyrophosphatase; Provisional	NA|591aa|down_7|NZ_CP035751.1_2514442_2516215_-	PRK00476, aspS, aspartyl-tRNA synthetase; Validated	NA|84aa|down_8|NZ_CP035751.1_2516524_2516776_+	PRK11440, PRK11440, putative hydrolase; Provisional	NA|93aa|down_9|NZ_CP035751.1_2516812_2517091_+	PRK11440, PRK11440, putative hydrolase; Provisional
GCF_000167875.2_ASM16787v2	NZ_CP035751	Escherichia coli E110019 chromosome, complete genome	3	3617485-3618123	1,2,2	CRT,PILER-CR,CRISPRCasFinder	no	cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	DEDDh,DinG,RT,cas3,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK	Type I-E	CGGTTTATCCCCGCTGGCGCGGGGAACAC,CGGTTTATCCCCGCTGGCGCGGGGAACAC,CGGTTTATCCCCGCTGGCGCGGGGAACAC	29,29,29	0	0	NA	NA	I-E:I-E:I-E	10,9,9	10	TypeI-E	DEDDh,DinG,RT,cas3,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK	NA,NA	NA|254aa|up_9|NZ_CP035751.1_3609358_3610120_-	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional	NA|350aa|up_8|NZ_CP035751.1_3610100_3611150_-	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|160aa|up_7|NZ_CP035751.1_3611146_3611626_-	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|237aa|up_6|NZ_CP035751.1_3611625_3612336_-	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|104aa|up_5|NZ_CP035751.1_3612354_3612666_-	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|108aa|up_4|NZ_CP035751.1_3612859_3613183_-	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|202aa|up_3|NZ_CP035751.1_3613232_3613838_-	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|476aa|up_2|NZ_CP035751.1_3613837_3615265_-	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|303aa|up_1|NZ_CP035751.1_3615266_3616175_-	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|346aa|up_0|NZ_CP035751.1_3616426_3617464_+	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	cas2|98aa|down_0|NZ_CP035751.1_3618219_3618513_-	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	cas1|307aa|down_1|NZ_CP035751.1_3618512_3619433_-	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas6e|217aa|down_2|NZ_CP035751.1_3619429_3620080_-	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas5|249aa|down_3|NZ_CP035751.1_3620061_3620808_-	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|352aa|down_4|NZ_CP035751.1_3620818_3621874_-	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cse2gr11|179aa|down_5|NZ_CP035751.1_3621885_3622422_-	TIGR02548, CRISPR_system_Cascade_subunit_CasB, CRISPR type I-E/ECOLI-associated protein CasB/Cse2	cas8e|521aa|down_6|NZ_CP035751.1_3622418_3623981_-	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	NA|51aa|down_7|NZ_CP035751.1_3626971_3627124_-	pfam01848, HOK_GEF, Hok/gef family	NA|245aa|down_8|NZ_CP035751.1_3627388_3628123_-	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|571aa|down_9|NZ_CP035751.1_3628196_3629909_-	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit
GCF_000167875.2_ASM16787v2	NZ_CP035751	Escherichia coli E110019 chromosome, complete genome	4	3643822-3644521	3,2,3	CRISPRCasFinder,CRT,PILER-CR	no		DEDDh,DinG,RT,cas3,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK	Orphan	CGGTTTATCCCCGCTGGCGCGGGGAACAC,CGGTTTATCCCCGCTGGCGCGGGGAACAC,CGGTTTATCCCCGCTGGCGCGGGGAACAC	29,29,29	0	0	NA	NA	I-E:I-E:I-E	11,11,10	11	Orphan	DEDDh,DinG,RT,cas3,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK	NA,NA|47aa|down_1|NZ_CP035751.1_3645670_3645811_+	NA|424aa|up_9|NZ_CP035751.1_3632466_3633738_+	PRK10015, PRK10015, oxidoreductase; Provisional	NA|87aa|up_8|NZ_CP035751.1_3633728_3633989_+	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|192aa|up_7|NZ_CP035751.1_3634005_3634581_+	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|298aa|up_6|NZ_CP035751.1_3634728_3635622_-	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|260aa|up_5|NZ_CP035751.1_3635585_3636365_-	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|470aa|up_4|NZ_CP035751.1_3636342_3637752_-	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|485aa|up_3|NZ_CP035751.1_3637773_3639228_-	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|262aa|up_2|NZ_CP035751.1_3639297_3640083_-	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|426aa|up_1|NZ_CP035751.1_3640401_3641679_+	cd06174, MFS, Major Facilitator Superfamily	NA|493aa|up_0|NZ_CP035751.1_3641705_3643184_+	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|224aa|down_0|NZ_CP035751.1_3644860_3645532_-	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|47aa|down_1|NZ_CP035751.1_3645670_3645811_+	NA	NA|291aa|down_2|NZ_CP035751.1_3645824_3646697_+	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|405aa|down_3|NZ_CP035751.1_3647192_3648406_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|433aa|down_4|NZ_CP035751.1_3649457_3650756_-	PRK00077, eno, enolase; Provisional	NA|546aa|down_5|NZ_CP035751.1_3650843_3652481_-	PRK05380, pyrG, CTP synthetase; Validated	NA|264aa|down_6|NZ_CP035751.1_3652708_3653500_-	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|112aa|down_7|NZ_CP035751.1_3653570_3653906_-	PRK09907, PRK09907, endoribonuclease MazF	NA|83aa|down_8|NZ_CP035751.1_3653905_3654154_-	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|745aa|down_9|NZ_CP035751.1_3654231_3656466_-	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional
GCF_000167875.2_ASM16787v2	NZ_CP035751	Escherichia coli E110019 chromosome, complete genome	5	4082218-4082613	4	PILER-CR	no		DEDDh,DinG,RT,cas3,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK	Orphan	CCGCTTCGGCGGGTTTTTGCTTTTGGAGGGGCAGAAAGATGAATGACTGTCCACGAC	57	0	0	NA	NA	NA	3	3	Orphan	DEDDh,DinG,RT,cas3,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK	NA,NA	NA|158aa|up_9|NZ_CP035751.1_4071727_4072201_-	PRK11425, PRK11425, PTS N-acetylgalactosamine transporter subunit IIB	NA|427aa|up_8|NZ_CP035751.1_4072223_4073504_-	PRK15458, PRK15458, tagatose 6-phosphate aldolase subunit KbaZ; Provisional	NA|270aa|up_7|NZ_CP035751.1_4073752_4074562_+	PRK09802, PRK09802, DeoR family transcriptional regulator	NA|155aa|up_6|NZ_CP035751.1_4074616_4075081_-	pfam11663, Toxin_YhaV, Toxin with endonuclease activity, of toxin-antitoxin system	NA|112aa|up_5|NZ_CP035751.1_4075080_4075416_-	PRK09974, PRK09974, type II toxin-antitoxin system PrlF family antitoxin	NA|524aa|up_4|NZ_CP035751.1_4075564_4077136_-	TIGR03248, galactar-dH20, galactarate dehydratase	NA|445aa|up_3|NZ_CP035751.1_4077510_4078845_+	TIGR00893, Probable_glucarate_transporter, D-galactonate transporter	NA|257aa|up_2|NZ_CP035751.1_4078860_4079631_+	PRK10558, PRK10558, alpha-dehydro-beta-deoxy-D-glucarate aldolase; Provisional	NA|297aa|up_1|NZ_CP035751.1_4079660_4080551_+	PRK11559, garR, tartronate semialdehyde reductase; Provisional	NA|382aa|up_0|NZ_CP035751.1_4080647_4081793_+	PRK10342, PRK10342, glycerate kinase I; Provisional	NA|327aa|down_0|NZ_CP035751.1_4082889_4083870_-	pfam02371, Transposase_20, Transposase IS116/IS110/IS902 family	NA|415aa|down_1|NZ_CP035751.1_4084128_4085373_-	PRK10483, PRK10483, tryptophan permease; Provisional	NA|630aa|down_2|NZ_CP035751.1_4085526_4087416_-	PRK11634, PRK11634, ATP-dependent RNA helicase DeaD; Provisional	NA|27aa|down_3|NZ_CP035751.1_4087408_4087489_-	NF033440, small_YrbN, protein YrbN	NA|295aa|down_4|NZ_CP035751.1_4087595_4088480_-	PRK11189, PRK11189, lipoprotein NlpI; Provisional	NA|712aa|down_5|NZ_CP035751.1_4088588_4090724_-	PRK11824, PRK11824, polynucleotide phosphorylase/polyadenylase; Provisional	NA|90aa|down_6|NZ_CP035751.1_4090970_4091240_-	PRK05626, rpsO, 30S ribosomal protein S15; Reviewed	NA|315aa|down_7|NZ_CP035751.1_4091388_4092333_-	PRK05033, truB, tRNA pseudouridine synthase B; Provisional	NA|134aa|down_8|NZ_CP035751.1_4092332_4092734_-	PRK00521, rbfA, 30S ribosome-binding factor RbfA	NA|891aa|down_9|NZ_CP035751.1_4092897_4095570_-	PRK05306, infB, translation initiation factor IF-2; Validated
