assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_012934655.2_ASM1293465v2	NZ_CP051700	Escherichia coli strain SCU-125 chromosome, complete genome	1	585208-585331	1	CRISPRCasFinder	no	DEDDh	DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	NA,NA|30aa|down_7|NZ_CP051700.1_594227_594317_+	NA|471aa|up_9|NZ_CP051700.1_574660_576073_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|NZ_CP051700.1_576630_576840_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|NZ_CP051700.1_577295_577922_+	PRK09898, PRK09898, ferredoxin-like protein	NA|701aa|up_6|NZ_CP051700.1_577942_580045_+	PRK09849, PRK09849, putative oxidoreductase; Provisional	NA|213aa|up_5|NZ_CP051700.1_580057_580696_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|NZ_CP051700.1_580759_581428_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|NZ_CP051700.1_581424_582210_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|271aa|up_2|NZ_CP051700.1_582213_583026_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|535aa|up_1|NZ_CP051700.1_583037_584642_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|102aa|up_0|NZ_CP051700.1_584767_585073_-	PRK11118, PRK11118, putative monooxygenase; Provisional	NA|419aa|down_0|NZ_CP051700.1_585645_586902_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|NZ_CP051700.1_586942_588316_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|214aa|down_2|NZ_CP051700.1_588530_589172_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|NZ_CP051700.1_589211_590360_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|NZ_CP051700.1_590650_591862_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|NZ_CP051700.1_591974_592907_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|NZ_CP051700.1_592903_593929_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|30aa|down_7|NZ_CP051700.1_594227_594317_+	NA	NA|390aa|down_8|NZ_CP051700.1_594482_595652_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|194aa|down_9|NZ_CP051700.1_595797_596379_-	PRK10543, PRK10543, superoxide dismutase [Fe]
GCF_012934655.2_ASM1293465v2	NZ_CP051700	Escherichia coli strain SCU-125 chromosome, complete genome	2	1304151-1304242	2	CRISPRCasFinder	no		DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	Orphan	CCACCTTTTTTACCTGCTTCAGATGC	26	0	0	NA	NA	NA	1	1	Orphan	DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	NA|70aa|up_7|NZ_CP051700.1_1293400_1293610_-,NA	NA|277aa|up_9|NZ_CP051700.1_1290683_1291514_-	TIGR00145, Uncharacterized_protein_slr0964, FTR1 family protein	NA|503aa|up_8|NZ_CP051700.1_1291733_1293242_-	PRK15419, PRK15419, sodium/proline symporter PutP	NA|70aa|up_7|NZ_CP051700.1_1293400_1293610_-	NA	NA|1321aa|up_6|NZ_CP051700.1_1293664_1297627_+	PRK11809, putA, trifunctional transcriptional regulator/proline dehydrogenase/pyrroline-5-carboxylate dehydrogenase; Reviewed	NA|213aa|up_5|NZ_CP051700.1_1297666_1298305_-	PRK15008, PRK15008, HTH-type transcriptional regulator RutR; Provisional	NA|364aa|up_4|NZ_CP051700.1_1298592_1299684_+	TIGR03612, RutA, pyrimidine utilization protein A	NA|129aa|up_3|NZ_CP051700.1_1300388_1300775_+	TIGR03610, RutC, pyrimidine utilization protein C	NA|267aa|up_2|NZ_CP051700.1_1300782_1301583_+	TIGR03611, RutD, pyrimidine utilization protein D	NA|197aa|up_1|NZ_CP051700.1_1301592_1302183_+	PRK05365, PRK05365, malonic semialdehyde reductase; Provisional	NA|443aa|up_0|NZ_CP051700.1_1302708_1304037_+	TIGR03616, Putative_pyrimidine_permease_RutG, pyrimidine utilization transport protein G	NA|199aa|down_0|NZ_CP051700.1_1304665_1305262_+	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|76aa|down_1|NZ_CP051700.1_1305282_1305510_+	PRK10174, PRK10174, hypothetical protein; Provisional	NA|414aa|down_2|NZ_CP051700.1_1305547_1306789_-	PRK10173, PRK10173, glucose-1-phosphatase/inositol phosphatase; Provisional	NA|307aa|down_3|NZ_CP051700.1_1307323_1308244_+	PRK10266, PRK10266, curved DNA-binding protein	NA|102aa|down_4|NZ_CP051700.1_1308243_1308549_+	PRK10265, PRK10265, chaperone modulator CbpM	NA|200aa|down_5|NZ_CP051700.1_1308904_1309504_-	PRK04976, torD, chaperone protein TorD; Validated	NA|849aa|down_6|NZ_CP051700.1_1309500_1312047_-	PRK15102, PRK15102, trimethylamine-N-oxide reductase TorA	NA|391aa|down_7|NZ_CP051700.1_1312046_1313219_-	PRK15032, PRK15032, pentaheme c-type cytochrome TorC	NA|231aa|down_8|NZ_CP051700.1_1313348_1314041_+	PRK10766, PRK10766, two-component system response regulator TorR	NA|343aa|down_9|NZ_CP051700.1_1314013_1315042_-	PRK10936, PRK10936, TMAO reductase system periplasmic protein TorT; Provisional
GCF_012934655.2_ASM1293465v2	NZ_CP051700	Escherichia coli strain SCU-125 chromosome, complete genome	3	1948352-1948487	3	CRISPRCasFinder	no		DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	Orphan	GCGCCACTCGTAGGCCGGATAAGGCGTTCACGCCGCATCCGGC	43	0	0	NA	NA	NA	1	1	Orphan	DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	NA|82aa|up_9|NZ_CP051700.1_1937675_1937921_-,NA|272aa|up_8|NZ_CP051700.1_1938333_1939149_-,NA	NA|82aa|up_9|NZ_CP051700.1_1937675_1937921_-	NA	NA|272aa|up_8|NZ_CP051700.1_1938333_1939149_-	NA	NA|350aa|up_7|NZ_CP051700.1_1939391_1940441_-	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)	NA|319aa|up_6|NZ_CP051700.1_1940527_1941484_-	COG1172, AraH, Ribose/xylose/arabinose/galactoside ABC-type transport systems, permease components [Carbohydrate transport and metabolism]	NA|324aa|up_5|NZ_CP051700.1_1941480_1942452_-	COG1172, AraH, Ribose/xylose/arabinose/galactoside ABC-type transport systems, permease components [Carbohydrate transport and metabolism]	NA|495aa|up_4|NZ_CP051700.1_1942444_1943929_-	COG1129, MglA, ABC-type sugar transport system, ATPase component [Carbohydrate transport and metabolism]	NA|328aa|up_3|NZ_CP051700.1_1943977_1944961_-	cd20002, PBP1_LsrB_Quorum_Sensing-like, ligand-binding protein LsrB-like of ABC transporter periplasmic binding protein	NA|137aa|up_2|NZ_CP051700.1_1945214_1945625_-	COG4405, COG4405, Uncharacterized protein conserved in bacteria [Function unknown]	NA|461aa|up_1|NZ_CP051700.1_1945921_1947304_-	PRK06846, PRK06846, putative deaminase; Validated	NA|317aa|up_0|NZ_CP051700.1_1947313_1948264_-	PRK12352, PRK12352, putative carbamate kinase; Reviewed	NA|473aa|down_0|NZ_CP051700.1_1948510_1949929_-	pfam06545, DUF1116, Protein of unknown function (DUF1116)	NA|516aa|down_1|NZ_CP051700.1_1949928_1951476_-	PRK06091, PRK06091, membrane protein FdrA; Validated	NA|288aa|down_2|NZ_CP051700.1_1951465_1952329_-	pfam11392, DUF2877, Protein of unknown function (DUF2877)	NA|202aa|down_3|NZ_CP051700.1_1952368_1952974_-	sd00045, ANK, ankyrin repeats	NA|166aa|down_4|NZ_CP051700.1_1953231_1953729_+	pfam06496, DUF1097, Protein of unknown function (DUF1097)	NA|311aa|down_5|NZ_CP051700.1_1953820_1954753_+	PRK10094, PRK10094, HTH-type transcriptional activator AllS	NA|363aa|down_6|NZ_CP051700.1_1954794_1955883_-	smart00052, EAL, Putative diguanylate phosphodiesterase	NA|678aa|down_7|NZ_CP051700.1_1956758_1958792_-	PRK09928, PRK09928, choline transport protein BetT; Provisional	NA|196aa|down_8|NZ_CP051700.1_1958920_1959508_+	PRK00767, PRK00767, transcriptional regulator BetI; Validated	NA|491aa|down_9|NZ_CP051700.1_1959521_1960994_+	PRK13252, PRK13252, betaine aldehyde dehydrogenase; Provisional
GCF_012934655.2_ASM1293465v2	NZ_CP051700	Escherichia coli strain SCU-125 chromosome, complete genome	4	2261406-2261538	1	PILER-CR	no		DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	Orphan	ATCACCAATATTGAAAA	17	0	0	NA	NA	NA	2	2	Orphan	DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	NA,NA	NA|105aa|up_9|NZ_CP051700.1_2252777_2253092_-	pfam01845, CcdB, CcdB protein	NA|78aa|up_8|NZ_CP051700.1_2253094_2253328_-	COG5302, COG5302, Post-segregation antitoxin (ccd killing mechanism protein) encoded by the F plasmid [General function prediction only]	NA|160aa|up_7|NZ_CP051700.1_2253413_2253893_-	PRK10769, folA, type 3 dihydrofolate reductase	NA|621aa|up_6|NZ_CP051700.1_2254084_2255947_-	PRK03562, PRK03562, glutathione-regulated potassium-efflux system protein KefC; Provisional	NA|177aa|up_5|NZ_CP051700.1_2255939_2256470_-	PRK00871, PRK00871, glutathione-regulated potassium-efflux system oxidoreductase KefF	NA|444aa|up_4|NZ_CP051700.1_2256577_2257909_-	cd17316, MFS_SV2_like, Metazoan Synaptic vesicle glycoprotein 2 (SV2) and related small molecule transporters of the Major Facilitator Superfamily	NA|96aa|up_3|NZ_CP051700.1_2257967_2258255_-	PRK15449, PRK15449, ferredoxin-like protein FixX; Provisional	NA|429aa|up_2|NZ_CP051700.1_2258251_2259538_-	PRK10157, PRK10157, putative oxidoreductase FixC; Provisional	NA|314aa|up_1|NZ_CP051700.1_2259588_2260530_-	PRK03363, fixB, electron transfer flavoprotein subunit alpha/FixB family protein	NA|257aa|up_0|NZ_CP051700.1_2260544_2261315_-	PRK03359, PRK03359, putative electron transfer flavoprotein FixA; Reviewed	NA|505aa|down_0|NZ_CP051700.1_2261787_2263302_+	PRK03356, PRK03356, L-carnitine/gamma-butyrobetaine antiport BCCT transporter	NA|381aa|down_1|NZ_CP051700.1_2263332_2264475_+	PRK03354, PRK03354, crotonobetainyl-CoA dehydrogenase; Validated	NA|406aa|down_2|NZ_CP051700.1_2264603_2265821_+	PRK03525, PRK03525, L-carnitine CoA-transferase	NA|518aa|down_3|NZ_CP051700.1_2265893_2267447_+	PRK08008, caiC, putative crotonobetaine/carnitine-CoA ligase; Validated	NA|262aa|down_4|NZ_CP051700.1_2267555_2268341_+	PRK03580, PRK03580, crotonobetainyl-CoA hydratase	NA|197aa|down_5|NZ_CP051700.1_2268346_2268937_+	PRK13627, PRK13627, carnitine operon protein CaiE; Provisional	NA|132aa|down_6|NZ_CP051700.1_2269055_2269451_-	PRK11476, PRK11476, carnitine metabolism transcriptional regulator CaiF	NA|1074aa|down_7|NZ_CP051700.1_2269711_2272933_-	PRK05294, carB, carbamoyl-phosphate synthase large subunit	NA|383aa|down_8|NZ_CP051700.1_2272950_2274099_-	PRK12564, PRK12564, carbamoyl-phosphate synthase small subunit	NA|274aa|down_9|NZ_CP051700.1_2274554_2275376_-	COG0289, DapB, Dihydrodipicolinate reductase [Amino acid transport and metabolism]
GCF_012934655.2_ASM1293465v2	NZ_CP051700	Escherichia coli strain SCU-125 chromosome, complete genome	5	2473909-2474058	4	CRISPRCasFinder	no	cas3	DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	Unclear	TGAACGCCTTATCCGACCTACACAGCACTGAACTCGTAGGCCTGATAAGACGCG	54	0	0	NA	NA	NA	1	1	Unclear	DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	NA|284aa|up_6|NZ_CP051700.1_2464038_2464890_-,NA	NA|969aa|up_9|NZ_CP051700.1_2458211_2461118_-	cd18011, DEXDc_RapA, DEXH-box helicase domain of RapA	NA|378aa|up_8|NZ_CP051700.1_2461584_2462718_-	TIGR03187, hypothetical_protein, DGQHR domain	NA|417aa|up_7|NZ_CP051700.1_2462714_2463965_-	COG0343, Tgt, Queuine/archaeosine tRNA-ribosyltransferase [Translation, ribosomal structure and biogenesis]	NA|284aa|up_6|NZ_CP051700.1_2464038_2464890_-	NA	NA|415aa|up_5|NZ_CP051700.1_2465430_2466675_-	PRK09692, PRK09692, integrase; Provisional	NA|340aa|up_4|NZ_CP051700.1_2467141_2468161_+	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)	NA|501aa|up_3|NZ_CP051700.1_2468290_2469793_+	pfam05872, DUF853, Bacterial protein of unknown function (DUF853)	NA|361aa|up_2|NZ_CP051700.1_2469911_2470994_-	PRK15071, PRK15071, lipopolysaccharide ABC transporter permease; Provisional	NA|367aa|up_1|NZ_CP051700.1_2470993_2472094_-	PRK15120, PRK15120, lipopolysaccharide ABC transporter permease LptF; Provisional	NA|504aa|up_0|NZ_CP051700.1_2472360_2473872_+	PRK00913, PRK00913, multifunctional aminopeptidase A; Provisional	NA|148aa|down_0|NZ_CP051700.1_2474225_2474669_+	PRK05728, PRK05728, DNA polymerase III subunit chi; Validated	NA|952aa|down_1|NZ_CP051700.1_2474668_2477524_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|399aa|down_2|NZ_CP051700.1_2477577_2478774_-	COG4269, COG4269, Predicted membrane protein [Function unknown]	NA|168aa|down_3|NZ_CP051700.1_2478966_2479470_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|139aa|down_4|NZ_CP051700.1_2479515_2479932_-	PRK11191, PRK11191, ribonuclease E inhibitor RraB	NA|338aa|down_5|NZ_CP051700.1_2480093_2481107_+	PRK03515, PRK03515, ornithine carbamoyltransferase subunit I; Provisional	NA|151aa|down_6|NZ_CP051700.1_2482916_2483369_-	COG2731, EbgC, Beta-galactosidase, beta subunit [Carbohydrate transport and metabolism]	NA|198aa|down_7|NZ_CP051700.1_2483513_2484107_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|238aa|down_8|NZ_CP051700.1_2484177_2484891_+	PRK12742, PRK12742, SDR family oxidoreductase	NA|132aa|down_9|NZ_CP051700.1_2485021_2485417_+	cd02198, YjgH_like, YjgH belongs to a large family of YjgF/YER057c/UK114-like proteins present in bacteria, archaea, and eukaryotes with no definitive function
GCF_012934655.2_ASM1293465v2	NZ_CP051700	Escherichia coli strain SCU-125 chromosome, complete genome	6	4898378-4898491	5	CRISPRCasFinder	no		DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	Orphan	TGCCGGATGCGCTTCGCTTATCCGGCCTACAAA	33	0	0	NA	NA	NA	1	1	Orphan	DEDDh,DinG,cas3,cas14j,RT,c2c9_V-U4,WYL,csa3	NA,NA	NA|268aa|up_9|NZ_CP051700.1_4887285_4888089_+	PRK10128, PRK10128, 2-keto-3-deoxy-L-rhamnonate aldolase; Provisional	NA|321aa|up_8|NZ_CP051700.1_4888129_4889092_-	PRK09956, PRK09956, ISNCY family transposase	NA|397aa|up_7|NZ_CP051700.1_4889285_4890476_-	TIGR03379, glycerol3P_GlpC, glycerol-3-phosphate dehydrogenase, anaerobic, C subunit	NA|420aa|up_6|NZ_CP051700.1_4890472_4891732_-	COG3075, GlpB, Anaerobic glycerol-3-phosphate dehydrogenase [Amino acid transport and metabolism]	NA|543aa|up_5|NZ_CP051700.1_4891721_4893350_-	PRK11101, glpA, anaerobic glycerol-3-phosphate dehydrogenase subunit A	NA|453aa|up_4|NZ_CP051700.1_4893622_4894981_+	PRK11273, glpT, glycerol-3-phosphate transporter	NA|359aa|up_3|NZ_CP051700.1_4894985_4896062_+	PRK11143, glpQ, glycerophosphodiester phosphodiesterase; Provisional	NA|217aa|up_2|NZ_CP051700.1_4896264_4896915_+	PRK09902, PRK09902, lipopolysaccharide kinase InaA	NA|85aa|up_1|NZ_CP051700.1_4896968_4897223_-	PRK10713, PRK10713, 2Fe-2S ferredoxin-like protein	NA|377aa|up_0|NZ_CP051700.1_4897222_4898353_-	PRK09101, nrdB, ribonucleotide-diphosphate reductase subunit beta; Reviewed	NA|762aa|down_0|NZ_CP051700.1_4898543_4900829_-	PRK09103, PRK09103, ribonucleoside-diphosphate reductase subunit alpha	NA|1248aa|down_1|NZ_CP051700.1_4901510_4905254_+	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|241aa|down_2|NZ_CP051700.1_4905393_4906116_-	PRK05134, PRK05134, bifunctional 2-polyprenyl-6-hydroxyphenol methylase/3-demethylubiquinol 3-O-methyltransferase UbiG	NA|876aa|down_3|NZ_CP051700.1_4906262_4908890_+	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|563aa|down_4|NZ_CP051700.1_4909038_4910727_+	COG4685, COG4685, Uncharacterized protein conserved in bacteria [Function unknown]	NA|208aa|down_5|NZ_CP051700.1_4910723_4911347_+	COG3234, COG3234, Uncharacterized protein conserved in bacteria [Function unknown]	NA|1442aa|down_6|NZ_CP051700.1_4911490_4915816_+	COG2373, COG2373, Large extracellular alpha-helical protein [General function prediction only]	NA|550aa|down_7|NZ_CP051700.1_4915816_4917466_+	COG5445, COG5445, Predicted secreted protein [Function unknown]	NA|259aa|down_8|NZ_CP051700.1_4917470_4918247_+	COG4676, COG4676, Uncharacterized protein conserved in bacteria [Function unknown]	NA|395aa|down_9|NZ_CP051700.1_4918320_4919505_-	PRK05790, PRK05790, putative acyltransferase; Provisional
