assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCA_900635325.1_41556_D01	LR134092	Escherichia coli strain NCTC10444 genome assembly, chromosome: 1	1	1142689-1143449	1,1,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	Unclear	GAGTTCCCCGCGCTAGCGGGGATAAACCG,GAGTTCCCCGCGCTAGCGGGGATAAACCG,GAGTTCCCCGCGCNAGCGGGGATAAACCG,GTGGTGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29,32	0	0	NA	NA	I-E:I-E:I-E:I-E	9,12,12,9	12	Unclear	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	NA,NA	NA|83aa|up_9|LR134092.1_1133165_1133414_+	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|112aa|up_8|LR134092.1_1133413_1133749_+	PRK09907, PRK09907, endoribonuclease MazF	NA|264aa|up_7|LR134092.1_1133820_1134612_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_6|LR134092.1_1134839_1136477_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_5|LR134092.1_1136564_1137863_+	PRK00077, eno, enolase; Provisional	NA|305aa|up_4|LR134092.1_1137922_1138837_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|383aa|up_3|LR134092.1_1138833_1139982_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|298aa|up_2|LR134092.1_1139996_1140890_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|201aa|up_1|LR134092.1_1140903_1141506_-	COG1704, LemA, Uncharacterized conserved protein [Function unknown]	NA|224aa|up_0|LR134092.1_1141678_1142350_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|493aa|down_0|LR134092.1_1144086_1145565_-	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|426aa|down_1|LR134092.1_1145591_1146869_-	cd06174, MFS, Major Facilitator Superfamily	NA|262aa|down_2|LR134092.1_1147187_1147973_+	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|485aa|down_3|LR134092.1_1148042_1149497_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|470aa|down_4|LR134092.1_1149518_1150928_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|260aa|down_5|LR134092.1_1150905_1151685_+	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|287aa|down_6|LR134092.1_1151681_1152542_+	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|192aa|down_7|LR134092.1_1152688_1153264_-	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|87aa|down_8|LR134092.1_1153280_1153541_-	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|300aa|down_9|LR134092.1_1153531_1154431_-	PRK10015, PRK10015, oxidoreductase; Provisional
GCA_900635325.1_41556_D01	LR134092	Escherichia coli strain NCTC10444 genome assembly, chromosome: 1	2	1169149-1169970	3,2,2	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	Type I-E	GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	13,13,13	13	TypeI-E	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	NA,NA	NA|571aa|up_9|LR134092.1_1157360_1159073_+	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit	NA|245aa|up_8|LR134092.1_1159146_1159881_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	cas3|900aa|up_7|LR134092.1_1160490_1163190_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas8e|521aa|up_6|LR134092.1_1163287_1164850_+	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cse2gr11|179aa|up_5|LR134092.1_1164846_1165383_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|352aa|up_4|LR134092.1_1165397_1166453_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|249aa|up_3|LR134092.1_1166463_1167210_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|217aa|up_2|LR134092.1_1167191_1167842_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas1|308aa|up_1|LR134092.1_1167838_1168762_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|98aa|up_0|LR134092.1_1168758_1169052_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|346aa|down_0|LR134092.1_1170051_1171089_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|LR134092.1_1171340_1172249_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|476aa|down_2|LR134092.1_1172250_1173678_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|LR134092.1_1173677_1174283_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|108aa|down_4|LR134092.1_1174332_1174656_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|LR134092.1_1174849_1175161_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|LR134092.1_1175179_1175890_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|LR134092.1_1175889_1176369_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|LR134092.1_1176365_1177415_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|LR134092.1_1177395_1178157_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCA_900635325.1_41556_D01	LR134092	Escherichia coli strain NCTC10444 genome assembly, chromosome: 1	3	1691351-1691468	3	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	Orphan	CCGAGCCGTAGGCCGGATAAGGCGTTCACGC	31	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	NA|357aa|up_6|LR134092.1_1685330_1686401_-,NA|44aa|up_5|LR134092.1_1686579_1686711_-,NA	NA|543aa|up_9|LR134092.1_1680766_1682395_-	PRK11101, glpA, anaerobic glycerol-3-phosphate dehydrogenase subunit A	NA|453aa|up_8|LR134092.1_1682667_1684026_+	PRK11273, glpT, glycerol-3-phosphate transporter	NA|359aa|up_7|LR134092.1_1684030_1685107_+	PRK11143, glpQ, glycerophosphodiester phosphodiesterase; Provisional	NA|357aa|up_6|LR134092.1_1685330_1686401_-	NA	NA|44aa|up_5|LR134092.1_1686579_1686711_-	NA	NA|293aa|up_4|LR134092.1_1686864_1687743_-	cd05466, PBP2_LTTR_substrate, The substrate binding domain of LysR-type transcriptional regulators (LTTRs), a member of the type 2 periplasmic binding fold protein superfamily	NA|397aa|up_3|LR134092.1_1687894_1689085_+	cd17489, MFS_YfcJ_like, Escherichia coli YfcJ, YhhS, and similar transporters of the Major Facilitator Superfamily	NA|217aa|up_2|LR134092.1_1689165_1689816_+	PRK09902, PRK09902, lipopolysaccharide kinase InaA	NA|85aa|up_1|LR134092.1_1689869_1690124_-	PRK10713, PRK10713, 2Fe-2S ferredoxin-like protein	NA|377aa|up_0|LR134092.1_1690123_1691254_-	PRK09101, nrdB, ribonucleotide-diphosphate reductase subunit beta; Reviewed	NA|762aa|down_0|LR134092.1_1691487_1693773_-	PRK09103, PRK09103, ribonucleoside-diphosphate reductase subunit alpha	NA|1251aa|down_1|LR134092.1_1694468_1698221_+	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|241aa|down_2|LR134092.1_1698361_1699084_-	PRK05134, PRK05134, bifunctional 2-polyprenyl-6-hydroxyphenol methylase/3-demethylubiquinol 3-O-methyltransferase UbiG	NA|876aa|down_3|LR134092.1_1699230_1701858_+	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|563aa|down_4|LR134092.1_1702006_1703695_+	COG4685, COG4685, Uncharacterized protein conserved in bacteria [Function unknown]	NA|208aa|down_5|LR134092.1_1703691_1704315_+	COG3234, COG3234, Uncharacterized protein conserved in bacteria [Function unknown]	NA|1465aa|down_6|LR134092.1_1704458_1708853_+	COG2373, COG2373, Large extracellular alpha-helical protein [General function prediction only]	NA|550aa|down_7|LR134092.1_1708853_1710503_+	COG5445, COG5445, Predicted secreted protein [Function unknown]	NA|259aa|down_8|LR134092.1_1710507_1711284_+	COG4676, COG4676, Uncharacterized protein conserved in bacteria [Function unknown]	NA|395aa|down_9|LR134092.1_1711357_1712542_-	PRK05790, PRK05790, putative acyltransferase; Provisional
GCA_900635325.1_41556_D01	LR134092	Escherichia coli strain NCTC10444 genome assembly, chromosome: 1	4	2383703-2383826	4	CRISPRCasFinder	no	DEDDh	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	NA,NA	NA|471aa|up_9|LR134092.1_2373155_2374568_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|LR134092.1_2375124_2375334_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|LR134092.1_2375789_2376416_+	PRK09898, PRK09898, ferredoxin-like protein	NA|701aa|up_6|LR134092.1_2376436_2378539_+	PRK09849, PRK09849, putative oxidoreductase; Provisional	NA|213aa|up_5|LR134092.1_2378551_2379190_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|LR134092.1_2379253_2379922_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|LR134092.1_2379918_2380704_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|255aa|up_2|LR134092.1_2380755_2381520_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|393aa|up_1|LR134092.1_2381531_2382710_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|128aa|up_0|LR134092.1_2382753_2383137_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|419aa|down_0|LR134092.1_2384140_2385397_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|LR134092.1_2385437_2386811_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|214aa|down_2|LR134092.1_2387025_2387667_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|LR134092.1_2387706_2388855_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|LR134092.1_2389145_2390357_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|LR134092.1_2390469_2391402_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|LR134092.1_2391398_2392424_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|390aa|down_7|LR134092.1_2392977_2394147_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|194aa|down_8|LR134092.1_2394292_2394874_-	PRK10543, PRK10543, superoxide dismutase [Fe]	NA|276aa|down_9|LR134092.1_2395001_2395829_-	pfam00877, NLPC_P60, NlpC/P60 family
GCA_900635325.1_41556_D01	LR134092	Escherichia coli strain NCTC10444 genome assembly, chromosome: 1	6	3399377-3399525	6,4	CRISPRCasFinder,PILER-CR	no	PrimPol	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	Unclear	TTTCTAAGCTGCCTGTACGGCAGTGAAC,TTTCTAAGCTGCCTGTACGGCAGTGAAC	28,28	0	0	NA	NA	I-F:I-F	2,2	2	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	NA|63aa|up_6|LR134092.1_3389425_3389614_+,NA|612aa|up_3|LR134092.1_3394046_3395882_-,NA	NA|135aa|up_9|LR134092.1_3387433_3387838_+	COG2963, COG2963, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|116aa|up_8|LR134092.1_3387834_3388182_+	pfam05717, TnpB_IS66, IS66 Orf2 like protein	NA|311aa|up_7|LR134092.1_3388426_3389359_+	pfam03050, DDE_Tnp_IS66, Transposase IS66 family	NA|63aa|up_6|LR134092.1_3389425_3389614_+	NA	PrimPol|787aa|up_5|LR134092.1_3389631_3391992_-	COG4951, COG4951, Uncharacterized protein conserved in bacteria [Function unknown]	NA|188aa|up_4|LR134092.1_3392146_3392710_-	pfam11726, Inovirus_Gp2, Inovirus Gp2	NA|612aa|up_3|LR134092.1_3394046_3395882_-	NA	NA|96aa|up_2|LR134092.1_3395982_3396270_+	COG3311, AlpA, Predicted transcriptional regulator [Transcription]	NA|510aa|up_1|LR134092.1_3396241_3397771_+	pfam13148, DUF3987, Protein of unknown function (DUF3987)	NA|406aa|up_0|LR134092.1_3397940_3399158_-	cd00801, INT_P4_C, Bacteriophage P4 integrase, C-terminal catalytic domain	NA|759aa|down_0|LR134092.1_3399736_3402013_-	PRK11034, clpA, ATP-dependent Clp protease ATP-binding subunit; Provisional	NA|107aa|down_1|LR134092.1_3402043_3402364_-	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|75aa|down_2|LR134092.1_3402686_3402911_+	PRK09937, PRK09937, cold shock-like protein CspD	NA|649aa|down_3|LR134092.1_3402983_3404930_-	PRK10535, PRK10535, macrolide ABC transporter ATP-binding protein/permease MacB	NA|372aa|down_4|LR134092.1_3404926_3406042_-	PRK11578, PRK11578, macrolide transporter subunit MacA; Provisional	NA|331aa|down_5|LR134092.1_3406156_3407149_+	COG2990, VirK, Uncharacterized protein conserved in bacteria [Function unknown]	NA|553aa|down_6|LR134092.1_3407145_3408804_-	COG3593, COG3593, Predicted ATP-dependent endonuclease of the OLD family [DNA replication, recombination, and repair]	NA|232aa|down_7|LR134092.1_3409229_3409925_+	PRK05420, PRK05420, aquaporin Z; Provisional	NA|300aa|down_8|LR134092.1_3410382_3411282_+	COG2431, COG2431, Predicted membrane protein [Function unknown]	NA|551aa|down_9|LR134092.1_3411425_3413078_+	PRK05290, PRK05290, hybrid cluster protein; Provisional
GCA_900635325.1_41556_D01	LR134092	Escherichia coli strain NCTC10444 genome assembly, chromosome: 1	8	4663797-4663946	8	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	Orphan	TGAACGCCTTATCCGACCTACACAGCACTGAACTCGTAGGCCTGATAAGACGCG	54	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,cas14j,c2c9_V-U4,DEDDh,DinG,RT,PrimPol,WYL	NA,NA|551aa|down_6|LR134092.1_4671058_4672711_-	NA|340aa|up_9|LR134092.1_4651990_4653010_+	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)	NA|188aa|up_8|LR134092.1_4653013_4653577_-	PRK09825, idnK, gluconokinase	NA|344aa|up_7|LR134092.1_4653793_4654825_+	PRK09880, PRK09880, L-idonate 5-dehydrogenase; Provisional	NA|255aa|up_6|LR134092.1_4654848_4655613_+	PRK08085, PRK08085, gluconate 5-dehydrogenase; Provisional	NA|440aa|up_5|LR134092.1_4655674_4656994_+	TIGR00791, Gluconate_permease, gluconate transporter	NA|333aa|up_4|LR134092.1_4657060_4658059_+	cd01575, PBP1_GntR, ligand-binding domain of DNA transcription repressor GntR specific for gluconate, a member of the LacI-GalR family of bacterial transcription regulators	NA|501aa|up_3|LR134092.1_4658136_4659639_+	pfam05872, DUF853, Bacterial protein of unknown function (DUF853)	NA|361aa|up_2|LR134092.1_4659799_4660882_-	PRK15071, PRK15071, lipopolysaccharide ABC transporter permease; Provisional	NA|360aa|up_1|LR134092.1_4660881_4661961_-	PRK15120, PRK15120, lipopolysaccharide ABC transporter permease LptF; Provisional	NA|504aa|up_0|LR134092.1_4662248_4663760_+	PRK00913, PRK00913, multifunctional aminopeptidase A; Provisional	NA|148aa|down_0|LR134092.1_4664113_4664557_+	PRK05728, PRK05728, DNA polymerase III subunit chi; Validated	NA|952aa|down_1|LR134092.1_4664556_4667412_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|399aa|down_2|LR134092.1_4667465_4668662_-	COG4269, COG4269, Predicted membrane protein [Function unknown]	NA|168aa|down_3|LR134092.1_4668854_4669358_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|139aa|down_4|LR134092.1_4669403_4669820_-	PRK11191, PRK11191, ribonuclease E inhibitor RraB	NA|335aa|down_5|LR134092.1_4669981_4670986_+	PRK03515, PRK03515, ornithine carbamoyltransferase subunit I; Provisional	NA|551aa|down_6|LR134092.1_4671058_4672711_-	NA	NA|151aa|down_7|LR134092.1_4672833_4673286_-	COG2731, EbgC, Beta-galactosidase, beta subunit [Carbohydrate transport and metabolism]	NA|198aa|down_8|LR134092.1_4673430_4674024_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|238aa|down_9|LR134092.1_4674094_4674808_+	PRK12742, PRK12742, SDR family oxidoreductase
