assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_008642395.1_ASM864239v1	NZ_CP040263	Escherichia coli strain 631 chromosome, complete genome	1	1130245-1131005	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no		cas3,csa3,PD-DExK,WYL,RT,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,c2c9_V-U4,cas14j,DinG	Orphan	GAGTTCCCCGCGCCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	11,12,12	12	Orphan	cas3,csa3,PD-DExK,WYL,RT,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,c2c9_V-U4,cas14j,DinG	NA,NA	NA|919aa|up_9|NZ_CP040263.1_1116837_1119594_-	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional	NA|434aa|up_8|NZ_CP040263.1_1119650_1120952_+	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|745aa|up_7|NZ_CP040263.1_1120999_1123234_+	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|83aa|up_6|NZ_CP040263.1_1123311_1123560_+	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|112aa|up_5|NZ_CP040263.1_1123559_1123895_+	PRK09907, PRK09907, endoribonuclease MazF	NA|264aa|up_4|NZ_CP040263.1_1123966_1124758_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_3|NZ_CP040263.1_1124985_1126623_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_2|NZ_CP040263.1_1126710_1128009_+	PRK00077, eno, enolase; Provisional	NA|291aa|up_1|NZ_CP040263.1_1128068_1128941_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|224aa|up_0|NZ_CP040263.1_1129234_1129906_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|493aa|down_0|NZ_CP040263.1_1131642_1133121_-	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|426aa|down_1|NZ_CP040263.1_1133147_1134425_-	cd06174, MFS, Major Facilitator Superfamily	NA|262aa|down_2|NZ_CP040263.1_1134743_1135529_+	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|485aa|down_3|NZ_CP040263.1_1135598_1137053_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|446aa|down_4|NZ_CP040263.1_1137146_1138484_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|260aa|down_5|NZ_CP040263.1_1138461_1139241_+	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|287aa|down_6|NZ_CP040263.1_1139237_1140098_+	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|450aa|down_7|NZ_CP040263.1_1140197_1141546_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|192aa|down_8|NZ_CP040263.1_1141680_1142256_-	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|87aa|down_9|NZ_CP040263.1_1142272_1142533_-	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]
GCF_008642395.1_ASM864239v1	NZ_CP040263	Escherichia coli strain 631 chromosome, complete genome	2	1158143-1158781	2,2,2	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	cas3,csa3,PD-DExK,WYL,RT,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,c2c9_V-U4,cas14j,DinG	Type I-E	GTGTTCCCCGCGTCAGCGGGGATAAACCG,GTGTTCCCCGCGTCAGCGGGGATAAACCG,GTGTTCCCCGCGNCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	10,10,10	10	TypeI-E	cas3,csa3,PD-DExK,WYL,RT,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,c2c9_V-U4,cas14j,DinG	NA,NA	NA|245aa|up_9|NZ_CP040263.1_1148138_1148873_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|51aa|up_8|NZ_CP040263.1_1149137_1149290_+	pfam01848, HOK_GEF, Hok/gef family	cas3|900aa|up_7|NZ_CP040263.1_1149484_1152184_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas8e|521aa|up_6|NZ_CP040263.1_1152281_1153844_+	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cse2gr11|179aa|up_5|NZ_CP040263.1_1153840_1154377_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|352aa|up_4|NZ_CP040263.1_1154391_1155447_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|249aa|up_3|NZ_CP040263.1_1155457_1156204_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|217aa|up_2|NZ_CP040263.1_1156185_1156836_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas1|308aa|up_1|NZ_CP040263.1_1156832_1157756_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|98aa|up_0|NZ_CP040263.1_1157752_1158046_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|346aa|down_0|NZ_CP040263.1_1158862_1159900_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|NZ_CP040263.1_1160151_1161060_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|476aa|down_2|NZ_CP040263.1_1161061_1162489_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|NZ_CP040263.1_1162488_1163094_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|108aa|down_4|NZ_CP040263.1_1163143_1163467_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|NZ_CP040263.1_1163660_1163972_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|NZ_CP040263.1_1163990_1164701_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|NZ_CP040263.1_1164700_1165180_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|NZ_CP040263.1_1165176_1166226_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|NZ_CP040263.1_1166206_1166968_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCF_008642395.1_ASM864239v1	NZ_CP040263	Escherichia coli strain 631 chromosome, complete genome	3	1618263-1618358	3	CRISPRCasFinder	no		cas3,csa3,PD-DExK,WYL,RT,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,c2c9_V-U4,cas14j,DinG	Orphan	ATTGTCCAACGGTTGTCCAACGGTTGTCCA	30	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,WYL,RT,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,c2c9_V-U4,cas14j,DinG	NA|92aa|up_9|NZ_CP040263.1_1613566_1613842_-,NA|157aa|up_8|NZ_CP040263.1_1613931_1614402_-,NA|89aa|up_7|NZ_CP040263.1_1614457_1614724_-,NA|65aa|up_6|NZ_CP040263.1_1614785_1614980_+,NA|121aa|up_5|NZ_CP040263.1_1614910_1615273_-,NA|91aa|up_4|NZ_CP040263.1_1615275_1615548_-,NA|123aa|up_3|NZ_CP040263.1_1615915_1616284_-,NA|69aa|down_1|NZ_CP040263.1_1621309_1621516_+,NA|119aa|down_2|NZ_CP040263.1_1621533_1621890_+	NA|92aa|up_9|NZ_CP040263.1_1613566_1613842_-	NA	NA|157aa|up_8|NZ_CP040263.1_1613931_1614402_-	NA	NA|89aa|up_7|NZ_CP040263.1_1614457_1614724_-	NA	NA|65aa|up_6|NZ_CP040263.1_1614785_1614980_+	NA	NA|121aa|up_5|NZ_CP040263.1_1614910_1615273_-	NA	NA|91aa|up_4|NZ_CP040263.1_1615275_1615548_-	NA	NA|123aa|up_3|NZ_CP040263.1_1615915_1616284_-	NA	NA|239aa|up_2|NZ_CP040263.1_1616301_1617018_-	COG1974, LexA, SOS-response transcriptional repressors (RecA-mediated autopeptidases) [Transcription / Signal transduction mechanisms]	NA|65aa|up_1|NZ_CP040263.1_1617124_1617319_+	pfam09048, Cro, Cro	NA|93aa|up_0|NZ_CP040263.1_1617427_1617706_+	pfam05269, Phage_CII, Bacteriophage CII protein	NA|822aa|down_0|NZ_CP040263.1_1618768_1621234_+	TIGR03600, phage_DnaB, phage replicative helicase, DnaB family, HK022 subfamily	NA|69aa|down_1|NZ_CP040263.1_1621309_1621516_+	NA	NA|119aa|down_2|NZ_CP040263.1_1621533_1621890_+	NA	NA|137aa|down_3|NZ_CP040263.1_1621861_1622272_+	pfam05772, NinB, NinB protein	NA|61aa|down_4|NZ_CP040263.1_1622268_1622451_+	pfam05322, NinE, NINE Protein	NA|57aa|down_5|NZ_CP040263.1_1622447_1622618_+	pfam05810, NinF, NinF protein	NA|241aa|down_6|NZ_CP040263.1_1622610_1623333_+	COG3645, COG3645, Uncharacterized phage-encoded protein [Function unknown]	NA|97aa|down_7|NZ_CP040263.1_1623332_1623623_+	pfam07102, DUF1364, Protein of unknown function (DUF1364)	NA|121aa|down_8|NZ_CP040263.1_1623619_1623982_+	PRK09786, PRK09786, endodeoxyribonuclease RUS; Reviewed	NA|63aa|down_9|NZ_CP040263.1_1623978_1624167_+	pfam06322, Phage_NinH, Phage NinH protein
GCF_008642395.1_ASM864239v1	NZ_CP040263	Escherichia coli strain 631 chromosome, complete genome	4	2445068-2445191	4	CRISPRCasFinder	no	DEDDh	cas3,csa3,PD-DExK,WYL,RT,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,c2c9_V-U4,cas14j,DinG	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,WYL,RT,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,c2c9_V-U4,cas14j,DinG	NA,NA|30aa|down_7|NZ_CP040263.1_2454088_2454178_+	NA|471aa|up_9|NZ_CP040263.1_2434521_2435934_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|NZ_CP040263.1_2436490_2436700_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|NZ_CP040263.1_2437155_2437782_+	PRK09898, PRK09898, ferredoxin-like protein	NA|701aa|up_6|NZ_CP040263.1_2437802_2439905_+	PRK09849, PRK09849, putative oxidoreductase; Provisional	NA|216aa|up_5|NZ_CP040263.1_2439908_2440556_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|NZ_CP040263.1_2440619_2441288_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|NZ_CP040263.1_2441284_2442070_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|271aa|up_2|NZ_CP040263.1_2442073_2442886_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|535aa|up_1|NZ_CP040263.1_2442897_2444502_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|102aa|up_0|NZ_CP040263.1_2444627_2444933_-	PRK11118, PRK11118, putative monooxygenase; Provisional	NA|419aa|down_0|NZ_CP040263.1_2445506_2446763_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|NZ_CP040263.1_2446803_2448177_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|214aa|down_2|NZ_CP040263.1_2448391_2449033_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|NZ_CP040263.1_2449072_2450221_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|NZ_CP040263.1_2450511_2451723_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|NZ_CP040263.1_2451835_2452768_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|NZ_CP040263.1_2452764_2453790_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|30aa|down_7|NZ_CP040263.1_2454088_2454178_+	NA	NA|390aa|down_8|NZ_CP040263.1_2454343_2455513_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|194aa|down_9|NZ_CP040263.1_2455658_2456240_-	PRK10543, PRK10543, superoxide dismutase [Fe]
GCF_008642395.1_ASM864239v1	NZ_CP040263	Escherichia coli strain 631 chromosome, complete genome	5	3141915-3142006	5	CRISPRCasFinder	no		cas3,csa3,PD-DExK,WYL,RT,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,c2c9_V-U4,cas14j,DinG	Orphan	CCACCTTTTTTACCTGCTTCAGATGC	26	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,WYL,RT,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,c2c9_V-U4,cas14j,DinG	NA|70aa|up_9|NZ_CP040263.1_3131165_3131375_-,NA	NA|70aa|up_9|NZ_CP040263.1_3131165_3131375_-	NA	NA|1321aa|up_8|NZ_CP040263.1_3131429_3135392_+	PRK11809, putA, trifunctional transcriptional regulator/proline dehydrogenase/pyrroline-5-carboxylate dehydrogenase; Reviewed	NA|213aa|up_7|NZ_CP040263.1_3135431_3136070_-	PRK15008, PRK15008, HTH-type transcriptional regulator RutR; Provisional	NA|364aa|up_6|NZ_CP040263.1_3136357_3137449_+	TIGR03612, RutA, pyrimidine utilization protein A	NA|231aa|up_5|NZ_CP040263.1_3137448_3138141_+	TIGR03614, RutB, pyrimidine utilization protein B	NA|129aa|up_4|NZ_CP040263.1_3138152_3138539_+	TIGR03610, RutC, pyrimidine utilization protein C	NA|267aa|up_3|NZ_CP040263.1_3138546_3139347_+	TIGR03611, RutD, pyrimidine utilization protein D	NA|197aa|up_2|NZ_CP040263.1_3139356_3139947_+	PRK05365, PRK05365, malonic semialdehyde reductase; Provisional	NA|165aa|up_1|NZ_CP040263.1_3139957_3140452_+	TIGR03615, flavoprotein_oxidoreductase, pyrimidine utilization flavin reductase protein F	NA|443aa|up_0|NZ_CP040263.1_3140472_3141801_+	TIGR03616, Putative_pyrimidine_permease_RutG, pyrimidine utilization transport protein G	NA|199aa|down_0|NZ_CP040263.1_3142429_3143026_+	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|76aa|down_1|NZ_CP040263.1_3143046_3143274_+	PRK10174, PRK10174, hypothetical protein; Provisional	NA|414aa|down_2|NZ_CP040263.1_3143311_3144553_-	PRK10173, PRK10173, glucose-1-phosphatase/inositol phosphatase; Provisional	NA|419aa|down_3|NZ_CP040263.1_3144844_3146101_-	PRK09784, PRK09784, YccE family protein	NA|307aa|down_4|NZ_CP040263.1_3146360_3147281_+	PRK10266, PRK10266, curved DNA-binding protein	NA|102aa|down_5|NZ_CP040263.1_3147280_3147586_+	PRK10265, PRK10265, chaperone modulator CbpM	NA|200aa|down_6|NZ_CP040263.1_3147737_3148337_-	PRK04976, torD, chaperone protein TorD; Validated	NA|849aa|down_7|NZ_CP040263.1_3148333_3150880_-	PRK15102, PRK15102, trimethylamine-N-oxide reductase TorA	NA|391aa|down_8|NZ_CP040263.1_3150879_3152052_-	PRK15032, PRK15032, pentaheme c-type cytochrome TorC	NA|231aa|down_9|NZ_CP040263.1_3152181_3152874_+	PRK10766, PRK10766, two-component system response regulator TorR
