assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_002804345.1_ASM280434v1	NZ_CP024997	Escherichia coli strain S17-13 chromosome, complete genome	1	169922-170071	1	CRISPRCasFinder	no		DEDDh,cas3,DinG,c2c9_V-U4,RT,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,WYL,PD-DExK	Orphan	CGCGTCTTATCAGGCCTACGAGTTCGGTGCTGTGTAGGTCGGATAAGGCGTTCA	54	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas3,DinG,c2c9_V-U4,RT,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,WYL,PD-DExK	NA|528aa|up_7|NZ_CP024997.1_161128_162712_+,NA|36aa|up_6|NZ_CP024997.1_162712_162820_+,NA	NA|198aa|up_9|NZ_CP024997.1_159815_160409_+	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|151aa|up_8|NZ_CP024997.1_160553_161006_+	COG2731, EbgC, Beta-galactosidase, beta subunit [Carbohydrate transport and metabolism]	NA|528aa|up_7|NZ_CP024997.1_161128_162712_+	NA	NA|36aa|up_6|NZ_CP024997.1_162712_162820_+	NA	NA|338aa|up_5|NZ_CP024997.1_162872_163886_-	PRK03515, PRK03515, ornithine carbamoyltransferase subunit I; Provisional	NA|139aa|up_4|NZ_CP024997.1_164047_164464_+	PRK11191, PRK11191, ribonuclease E inhibitor RraB	NA|168aa|up_3|NZ_CP024997.1_164509_165013_-	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|399aa|up_2|NZ_CP024997.1_165205_166402_+	COG4269, COG4269, Predicted membrane protein [Function unknown]	NA|952aa|up_1|NZ_CP024997.1_166455_169311_-	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|148aa|up_0|NZ_CP024997.1_169310_169754_-	PRK05728, PRK05728, DNA polymerase III subunit chi; Validated	NA|504aa|down_0|NZ_CP024997.1_170107_171619_-	PRK00913, PRK00913, multifunctional aminopeptidase A; Provisional	NA|367aa|down_1|NZ_CP024997.1_171885_172986_+	PRK15120, PRK15120, lipopolysaccharide ABC transporter permease LptF; Provisional	NA|361aa|down_2|NZ_CP024997.1_172985_174068_+	PRK15071, PRK15071, lipopolysaccharide ABC transporter permease; Provisional	NA|501aa|down_3|NZ_CP024997.1_174228_175731_-	pfam05872, DUF853, Bacterial protein of unknown function (DUF853)	NA|333aa|down_4|NZ_CP024997.1_175808_176807_-	cd01575, PBP1_GntR, ligand-binding domain of DNA transcription repressor GntR specific for gluconate, a member of the LacI-GalR family of bacterial transcription regulators	NA|440aa|down_5|NZ_CP024997.1_176873_178193_-	TIGR00791, Gluconate_permease, gluconate transporter	NA|255aa|down_6|NZ_CP024997.1_178255_179020_-	PRK08085, PRK08085, gluconate 5-dehydrogenase; Provisional	NA|344aa|down_7|NZ_CP024997.1_179043_180075_-	PRK09880, PRK09880, L-idonate 5-dehydrogenase; Provisional	NA|188aa|down_8|NZ_CP024997.1_180291_180855_+	PRK09825, idnK, gluconokinase	NA|340aa|down_9|NZ_CP024997.1_180858_181878_-	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)
GCF_002804345.1_ASM280434v1	NZ_CP024997	Escherichia coli strain S17-13 chromosome, complete genome	2	440348-440463	2	CRISPRCasFinder	no		DEDDh,cas3,DinG,c2c9_V-U4,RT,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,WYL,PD-DExK	Orphan	GATAAGACGCGCCAGCGTCGCATCAGGCGTT	31	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas3,DinG,c2c9_V-U4,RT,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,WYL,PD-DExK	NA,NA	NA|126aa|up_9|NZ_CP024997.1_426352_426730_-	PRK05461, apaG, CO2+/MG2+ efflux protein ApaG; Reviewed	NA|274aa|up_8|NZ_CP024997.1_426732_427554_-	PRK00274, ksgA, 16S rRNA (adenine(1518)-N(6)/adenine(1519)-N(6))-dimethyltransferase RsmA	NA|330aa|up_7|NZ_CP024997.1_427550_428540_-	PRK00232, pdxA, 4-hydroxythreonine-4-phosphate dehydrogenase; Reviewed	NA|429aa|up_6|NZ_CP024997.1_428539_429826_-	PRK10770, PRK10770, peptidyl-prolyl cis-trans isomerase SurA; Provisional	NA|785aa|up_5|NZ_CP024997.1_429878_432233_-	PRK03761, PRK03761, LPS assembly outer membrane complex protein LptD; Provisional	NA|272aa|up_4|NZ_CP024997.1_432487_433303_+	PRK09430, djlA, co-chaperone DjlA	NA|220aa|up_3|NZ_CP024997.1_433419_434079_-	PRK10158, PRK10158, bifunctional tRNA pseudouridine(32) synthase/23S rRNA pseudouridine(746) synthase RluA	NA|969aa|up_2|NZ_CP024997.1_434090_436997_-	PRK04914, PRK04914, RNA polymerase-associated protein RapA	NA|784aa|up_1|NZ_CP024997.1_437161_439513_-	PRK05762, PRK05762, DNA polymerase II; Reviewed	NA|232aa|up_0|NZ_CP024997.1_439587_440283_-	PRK08193, araD, L-ribulose-5-phosphate 4-epimerase AraD	NA|501aa|down_0|NZ_CP024997.1_440482_441985_-	PRK02929, PRK02929, L-arabinose isomerase; Provisional	NA|567aa|down_1|NZ_CP024997.1_441995_443696_-	PRK04123, PRK04123, ribulokinase; Provisional	NA|293aa|down_2|NZ_CP024997.1_444034_444913_+	PRK10572, PRK10572, arabinose operon transcriptional regulator AraC	NA|255aa|down_3|NZ_CP024997.1_444998_445763_+	COG0586, DedA, Uncharacterized membrane-associated protein [Function unknown]	NA|233aa|down_4|NZ_CP024997.1_445876_446575_-	PRK10771, thiQ, thiamine ABC transporter ATP-binding protein ThiQ	NA|537aa|down_5|NZ_CP024997.1_446558_448169_-	PRK09433, thiP, thiamine transporter membrane protein; Reviewed	NA|328aa|down_6|NZ_CP024997.1_448144_449128_-	PRK11205, tbpA, thiamine transporter substrate binding subunit; Provisional	NA|552aa|down_7|NZ_CP024997.1_449291_450947_-	PRK13626, PRK13626, HTH-type transcriptional regulator SgrR	NA|44aa|down_8|NZ_CP024997.1_451035_451167_+	pfam15894, SgrT, Inhibitor of glucose uptake transporter SgrT	NA|393aa|down_9|NZ_CP024997.1_451268_452447_+	TIGR00899, Sugar_efflux_transporter_A, sugar efflux transporter
GCF_002804345.1_ASM280434v1	NZ_CP024997	Escherichia coli strain S17-13 chromosome, complete genome	3	650191-650344	3	CRISPRCasFinder	no		DEDDh,cas3,DinG,c2c9_V-U4,RT,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,WYL,PD-DExK	Orphan	CGCGTCTTATCATGCCTACAAACCTGTGCCGGATCGGTAGGCCGGATAAGGCG	53	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas3,DinG,c2c9_V-U4,RT,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,WYL,PD-DExK	NA|150aa|up_8|NZ_CP024997.1_640163_640613_+,NA|63aa|down_4|NZ_CP024997.1_654615_654804_-	NA|1418aa|up_9|NZ_CP024997.1_635898_640152_+	COG3209, RhsA, Rhs family protein [Cell envelope biogenesis, outer membrane]	NA|150aa|up_8|NZ_CP024997.1_640163_640613_+	NA	NA|257aa|up_7|NZ_CP024997.1_642051_642822_-	PRK10438, PRK10438, C-N hydrolase family amidase; Provisional	NA|158aa|up_6|NZ_CP024997.1_642975_643449_+	PRK09993, PRK09993, C-lysozyme inhibitor; Provisional	NA|815aa|up_5|NZ_CP024997.1_643491_645936_-	PRK09463, fadE, acyl-CoA dehydrogenase; Reviewed	NA|193aa|up_4|NZ_CP024997.1_646175_646754_+	PRK00414, gmhA, D-sedoheptulose 7-phosphate isomerase	NA|256aa|up_3|NZ_CP024997.1_646959_647727_+	pfam13230, GATase_4, Glutamine amidotransferases class-II	NA|247aa|up_2|NZ_CP024997.1_647697_648438_-	COG3034, COG3034, Uncharacterized protein conserved in bacteria [Function unknown]	NA|253aa|up_1|NZ_CP024997.1_648729_649488_+	COG0791, Spr, Cell wall-associated hydrolases (invasion-associated proteins) [Cell envelope biogenesis, outer membrane]	NA|166aa|up_0|NZ_CP024997.1_649663_650161_+	COG1943, COG1943, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|580aa|down_0|NZ_CP024997.1_650478_652218_-	COG1298, FlhA, Flagellar biosynthesis pathway, component FlhA [Cell motility and secretion / Intracellular trafficking and secretion]	NA|263aa|down_1|NZ_CP024997.1_652159_652948_+	PRK06778, PRK06778, hypothetical protein; Validated	NA|352aa|down_2|NZ_CP024997.1_653018_654074_+	PRK02406, PRK02406, DNA polymerase IV; Validated	NA|151aa|down_3|NZ_CP024997.1_654070_654523_+	PRK09831, PRK09831, GNAT family N-acetyltransferase	NA|63aa|down_4|NZ_CP024997.1_654615_654804_-	NA	NA|89aa|down_5|NZ_CP024997.1_654829_655096_+	PRK09588, PRK09588, hypothetical protein; Reviewed	NA|486aa|down_6|NZ_CP024997.1_655452_656910_-	PRK15026, PRK15026, aminoacyl-histidine dipeptidase; Provisional	NA|153aa|down_7|NZ_CP024997.1_657170_657629_+	PRK09177, PRK09177, xanthine-guanine phosphoribosyltransferase; Validated	NA|415aa|down_8|NZ_CP024997.1_657720_658965_+	PRK05077, frsA, esterase FrsA	NA|134aa|down_9|NZ_CP024997.1_659022_659424_+	PRK10984, PRK10984, sigma factor-binding protein Crl
GCF_002804345.1_ASM280434v1	NZ_CP024997	Escherichia coli strain S17-13 chromosome, complete genome	4	3536636-3537030	4,1,1	CRISPRCasFinder,CRT,PILER-CR	no	cas3	DEDDh,cas3,DinG,c2c9_V-U4,RT,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,WYL,PD-DExK	Unclear	CGGTTTATCCCCGCTGGCGCGGGGAACTC,CGGTTTATCCCCGCTGGCGCGGGGAACTC,GGTTTATCCCCGCTGGCGCGGGGAACTC	29,29,28	0	0	NA	NA	I-E:I-E:I-E	6,6,6	6	Unclear	DEDDh,cas3,DinG,c2c9_V-U4,RT,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,WYL,PD-DExK	NA,NA|47aa|down_1|NZ_CP024997.1_3538179_3538320_+	NA|424aa|up_9|NZ_CP024997.1_3525280_3526552_+	PRK10015, PRK10015, oxidoreductase; Provisional	NA|87aa|up_8|NZ_CP024997.1_3526542_3526803_+	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|192aa|up_7|NZ_CP024997.1_3526819_3527395_+	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|287aa|up_6|NZ_CP024997.1_3527542_3528403_-	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|260aa|up_5|NZ_CP024997.1_3528399_3529179_-	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|446aa|up_4|NZ_CP024997.1_3529156_3530494_-	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|485aa|up_3|NZ_CP024997.1_3530587_3532042_-	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|262aa|up_2|NZ_CP024997.1_3532111_3532897_-	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|426aa|up_1|NZ_CP024997.1_3533215_3534493_+	cd06174, MFS, Major Facilitator Superfamily	NA|493aa|up_0|NZ_CP024997.1_3534519_3535998_+	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|224aa|down_0|NZ_CP024997.1_3537369_3538041_-	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|47aa|down_1|NZ_CP024997.1_3538179_3538320_+	NA	NA|291aa|down_2|NZ_CP024997.1_3538333_3539206_+	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|433aa|down_3|NZ_CP024997.1_3539265_3540564_-	PRK00077, eno, enolase; Provisional	NA|546aa|down_4|NZ_CP024997.1_3540651_3542289_-	PRK05380, pyrG, CTP synthetase; Validated	NA|264aa|down_5|NZ_CP024997.1_3542516_3543308_-	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|112aa|down_6|NZ_CP024997.1_3543378_3543714_-	PRK09907, PRK09907, endoribonuclease MazF	NA|83aa|down_7|NZ_CP024997.1_3543713_3543962_-	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|745aa|down_8|NZ_CP024997.1_3544039_3546274_-	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|434aa|down_9|NZ_CP024997.1_3546321_3547623_-	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD
GCF_002804345.1_ASM280434v1	NZ_CP024997	Escherichia coli strain S17-13 chromosome, complete genome	5	4070186-4070325	5	CRISPRCasFinder	no		DEDDh,cas3,DinG,c2c9_V-U4,RT,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,WYL,PD-DExK	Orphan	TGCCTGATGCGACGCTTGCCGCGTCTTATCAGGCCTACAACGACACAAA	49	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas3,DinG,c2c9_V-U4,RT,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,WYL,PD-DExK	NA,NA	NA|252aa|up_9|NZ_CP024997.1_4059456_4060212_+	PRK09762, PRK09762, galactosamine-6-phosphate isomerase; Provisional	NA|195aa|up_8|NZ_CP024997.1_4060612_4061197_+	COG3539, FimA, P pilus assembly protein, pilin FimA [Cell motility and secretion / Intracellular trafficking and secretion]	NA|232aa|up_7|NZ_CP024997.1_4061276_4061972_+	COG3121, FimC, P pilus assembly protein, chaperone PapD [Cell motility and secretion / Intracellular trafficking and secretion]	NA|839aa|up_6|NZ_CP024997.1_4062001_4064518_+	COG3188, FimD, P pilus assembly protein, porin PapC [Cell motility and secretion / Intracellular trafficking and secretion]	NA|364aa|up_5|NZ_CP024997.1_4064528_4065620_+	pfam00419, Fimbrial, Fimbrial protein	NA|287aa|up_4|NZ_CP024997.1_4065662_4066523_-	PRK14994, PRK14994, SAM-dependent 16S ribosomal RNA C1402 ribose 2'-O-methyltransferase; Provisional	NA|679aa|up_3|NZ_CP024997.1_4066587_4068624_+	COG3107, LppC, Putative lipoprotein [General function prediction only]	NA|132aa|up_2|NZ_CP024997.1_4068581_4068977_+	TIGR00252, UPF0102_protein_HI_1656, TIGR00252 family protein	NA|197aa|up_1|NZ_CP024997.1_4068996_4069587_+	PRK10886, PRK10886, DnaA initiator-associating protein DiaA; Provisional	NA|192aa|up_0|NZ_CP024997.1_4069596_4070172_+	PRK11023, PRK11023, divisome-associated lipoprotein YraP	NA|347aa|down_0|NZ_CP024997.1_4070376_4071417_-	COG0701, COG0701, Predicted permeases [General function prediction only]	NA|212aa|down_1|NZ_CP024997.1_4071489_4072125_-	cd05250, CC3_like_SDR_a, CC3(TIP30)-like, atypical (a) SDRs	NA|173aa|down_2|NZ_CP024997.1_4072252_4072771_+	cd03134, GATase1_PfpI_like, A type 1 glutamine amidotransferase (GATase1)-like domain found in PfpI from Pyrococcus furiosus	NA|148aa|down_3|NZ_CP024997.1_4072750_4073194_-	PRK03467, PRK03467, hypothetical protein; Provisional	NA|101aa|down_4|NZ_CP024997.1_4073244_4073547_+	PRK00329, PRK00329, GIY-YIG nuclease superfamily protein; Validated	NA|168aa|down_5|NZ_CP024997.1_4073533_4074037_-	COG3153, COG3153, Predicted acetyltransferase [General function prediction only]	NA|175aa|down_6|NZ_CP024997.1_4074030_4074555_-	COG3154, COG3154, Putative lipid carrier protein [Lipid metabolism]	NA|332aa|down_7|NZ_CP024997.1_4074763_4075759_+	COG0826, COG0826, Collagenase and related proteases [Posttranslational modification, protein turnover, chaperones]	NA|293aa|down_8|NZ_CP024997.1_4075767_4076646_+	PRK15447, PRK15447, putative protease; Provisional	NA|336aa|down_9|NZ_CP024997.1_4076851_4077859_+	PRK10508, PRK10508, luciferase-like monooxygenase
