assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	1	687113-687238	1	CRISPRCasFinder	no		WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Orphan	AGGCCTGATAAGACGCGGCAAGCGTCGCATCAGGCA	36	0	0	NA	NA	NA	1	1	Orphan	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA	NA|336aa|up_9|NZ_CP043414.1_679690_680698_-	PRK10508, PRK10508, luciferase-like monooxygenase	NA|293aa|up_8|NZ_CP043414.1_680778_681657_-	PRK15447, PRK15447, putative protease; Provisional	NA|332aa|up_7|NZ_CP043414.1_681665_682661_-	COG0826, COG0826, Collagenase and related proteases [Posttranslational modification, protein turnover, chaperones]	NA|175aa|up_6|NZ_CP043414.1_682869_683394_+	COG3154, COG3154, Putative lipid carrier protein [Lipid metabolism]	NA|168aa|up_5|NZ_CP043414.1_683387_683891_+	COG3153, COG3153, Predicted acetyltransferase [General function prediction only]	NA|101aa|up_4|NZ_CP043414.1_683877_684180_-	PRK00329, PRK00329, GIY-YIG nuclease superfamily protein; Validated	NA|148aa|up_3|NZ_CP043414.1_684230_684674_+	PRK03467, PRK03467, hypothetical protein; Provisional	NA|173aa|up_2|NZ_CP043414.1_684653_685172_-	cd03134, GATase1_PfpI_like, A type 1 glutamine amidotransferase (GATase1)-like domain found in PfpI from Pyrococcus furiosus	NA|212aa|up_1|NZ_CP043414.1_685299_685935_+	cd05250, CC3_like_SDR_a, CC3(TIP30)-like, atypical (a) SDRs	NA|347aa|up_0|NZ_CP043414.1_686007_687048_+	COG0701, COG0701, Predicted permeases [General function prediction only]	NA|192aa|down_0|NZ_CP043414.1_687251_687827_-	PRK11023, PRK11023, divisome-associated lipoprotein YraP	NA|197aa|down_1|NZ_CP043414.1_687836_688427_-	PRK10886, PRK10886, DnaA initiator-associating protein DiaA; Provisional	NA|132aa|down_2|NZ_CP043414.1_688446_688842_-	TIGR00252, UPF0102_protein_HI_1656, TIGR00252 family protein	NA|679aa|down_3|NZ_CP043414.1_688799_690836_-	COG3107, LppC, Putative lipoprotein [General function prediction only]	NA|288aa|down_4|NZ_CP043414.1_690900_691764_+	PRK14994, PRK14994, SAM-dependent 16S ribosomal RNA C1402 ribose 2'-O-methyltransferase; Provisional	NA|256aa|down_5|NZ_CP043414.1_691813_692581_-	PRK09762, PRK09762, galactosamine-6-phosphate isomerase; Provisional	NA|264aa|down_6|NZ_CP043414.1_692581_693373_-	PRK09855, PRK09855, PTS N-acetylgalactosamine transporter subunit IID	NA|268aa|down_7|NZ_CP043414.1_693362_694166_-	PRK09757, PRK09757, PTS N-acetylgalactosamine transporter subunit IIC	NA|159aa|down_8|NZ_CP043414.1_694204_694681_-	PRK09756, PRK09756, PTS N-acetylgalactosamine transporter subunit IIB	NA|287aa|down_9|NZ_CP043414.1_694847_695708_-	PRK12738, kbaY, tagatose-bisphosphate aldolase subunit KbaY
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	2	1148396-1149218	1,2,1	PILER-CR,CRISPRCasFinder,CRT	no	cas3	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Unclear	GAGTTCCCCGCGCCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	12,13,13	13	Unclear	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA	NA|83aa|up_9|NZ_CP043414.1_1138869_1139118_+	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|112aa|up_8|NZ_CP043414.1_1139117_1139453_+	PRK09907, PRK09907, endoribonuclease MazF	NA|264aa|up_7|NZ_CP043414.1_1139524_1140316_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_6|NZ_CP043414.1_1140543_1142181_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_5|NZ_CP043414.1_1142268_1143567_+	PRK00077, eno, enolase; Provisional	NA|301aa|up_4|NZ_CP043414.1_1143626_1144529_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|383aa|up_3|NZ_CP043414.1_1144525_1145674_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|303aa|up_2|NZ_CP043414.1_1145688_1146597_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|201aa|up_1|NZ_CP043414.1_1146610_1147213_-	COG1704, LemA, Uncharacterized conserved protein [Function unknown]	NA|224aa|up_0|NZ_CP043414.1_1147385_1148057_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|493aa|down_0|NZ_CP043414.1_1149855_1151334_-	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|426aa|down_1|NZ_CP043414.1_1151360_1152638_-	cd06174, MFS, Major Facilitator Superfamily	NA|262aa|down_2|NZ_CP043414.1_1152956_1153742_+	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|485aa|down_3|NZ_CP043414.1_1153811_1155266_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|470aa|down_4|NZ_CP043414.1_1155287_1156697_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|260aa|down_5|NZ_CP043414.1_1156674_1157454_+	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|287aa|down_6|NZ_CP043414.1_1157450_1158311_+	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|192aa|down_7|NZ_CP043414.1_1158456_1159032_-	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|87aa|down_8|NZ_CP043414.1_1159048_1159309_-	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|424aa|down_9|NZ_CP043414.1_1159299_1160571_-	PRK10015, PRK10015, oxidoreductase; Provisional
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	3	1174925-1175990	2,3,2	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Type I-E	GTGTTCCCCGCGCCAGCGGGGATAAACC,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	28,29,29	0	0	NA	NA	I-E:I-E:I-E	17,17,17	17	TypeI-E	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA	NA|245aa|up_9|NZ_CP043414.1_1164920_1165655_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|51aa|up_8|NZ_CP043414.1_1165918_1166071_+	pfam01848, HOK_GEF, Hok/gef family	cas3|886aa|up_7|NZ_CP043414.1_1166309_1168967_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas8e|521aa|up_6|NZ_CP043414.1_1169063_1170626_+	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cse2gr11|179aa|up_5|NZ_CP043414.1_1170622_1171159_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|352aa|up_4|NZ_CP043414.1_1171173_1172229_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|249aa|up_3|NZ_CP043414.1_1172239_1172986_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|217aa|up_2|NZ_CP043414.1_1172967_1173618_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas1|308aa|up_1|NZ_CP043414.1_1173614_1174538_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|98aa|up_0|NZ_CP043414.1_1174534_1174828_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|346aa|down_0|NZ_CP043414.1_1176072_1177110_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|NZ_CP043414.1_1177361_1178270_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|476aa|down_2|NZ_CP043414.1_1178271_1179699_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|NZ_CP043414.1_1179698_1180304_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|108aa|down_4|NZ_CP043414.1_1180353_1180677_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|NZ_CP043414.1_1180870_1181182_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|NZ_CP043414.1_1181200_1181911_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|NZ_CP043414.1_1181910_1182390_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|NZ_CP043414.1_1182386_1183436_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|NZ_CP043414.1_1183416_1184178_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	4	1269250-1269369	4	CRISPRCasFinder	no	csa3	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Type I-A	TGTCGGATGCGGCGTAAACGCCTTATCCGAC	31	0	0	NA	NA	NA	1	1	Orphan	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA|46aa|down_7|NZ_CP043414.1_1280636_1280774_+	NA|110aa|up_9|NZ_CP043414.1_1262879_1263209_-	PRK10132, PRK10132, hypothetical protein; Provisional	NA|115aa|up_8|NZ_CP043414.1_1263360_1263705_+	PRK10556, PRK10556, hypothetical protein; Provisional	NA|150aa|up_7|NZ_CP043414.1_1263741_1264191_-	pfam06610, AlaE, L-alanine exporter	NA|135aa|up_6|NZ_CP043414.1_1264857_1265262_+	PRK10328, PRK10328, DNA-binding protein StpA	NA|175aa|up_5|NZ_CP043414.1_1265308_1265833_-	cd01527, RHOD_YgaP, Member of the Rhodanese Homology Domain superfamily	csa3|100aa|up_4|NZ_CP043414.1_1265842_1266142_-	COG0640, ArsR, Predicted transcriptional regulators [Transcription]	NA|53aa|up_3|NZ_CP043414.1_1266324_1266483_+	COG0401, COG0401, Uncharacterized homolog of Blt101 [Function unknown]	NA|150aa|up_2|NZ_CP043414.1_1266566_1267016_+	PRK11198, PRK11198, LysM domain/BON superfamily protein; Provisional	NA|221aa|up_1|NZ_CP043414.1_1267016_1267679_-	PRK11534, PRK11534, DNA-binding transcriptional regulator CsiR; Provisional	NA|467aa|up_0|NZ_CP043414.1_1267699_1269100_-	PRK10197, PRK10197, GABA permease	NA|427aa|down_0|NZ_CP043414.1_1269426_1270707_-	PRK08088, PRK08088, 4-aminobutyrate--2-oxoglutarate transaminase	NA|483aa|down_1|NZ_CP043414.1_1270720_1272169_-	PRK11241, gabD, NADP-dependent succinate-semialdehyde dehydrogenase I	NA|423aa|down_2|NZ_CP043414.1_1272191_1273460_-	PRK11728, PRK11728, L-2-hydroxyglutarate oxidase	NA|326aa|down_3|NZ_CP043414.1_1273479_1274457_-	PRK02963, PRK02963, carbon starvation induced protein CsiD	NA|751aa|down_4|NZ_CP043414.1_1274791_1277044_-	cd11315, AmyAc_bac1_AmyA, Alpha amylase catalytic domain found in bacterial Alpha-amylases (also called 1,4-alpha-D-glucan-4-glucanohydrolase)	NA|485aa|down_5|NZ_CP043414.1_1278431_1279886_+	pfam17621, DUF5508, Family of unknown function (DUF5508)	NA|53aa|down_6|NZ_CP043414.1_1280216_1280375_+	cd03768, SR_ResInv, Serine Recombinase (SR) family, Resolvase and Invertase subfamily, catalytic domain; members contain a C-terminal DNA binding domain	NA|46aa|down_7|NZ_CP043414.1_1280636_1280774_+	NA	NA|1525aa|down_8|NZ_CP043414.1_1280821_1285396_+	TIGR01414, Contains:_AIDA-I_translocator, outer membrane autotransporter barrel domain	NA|67aa|down_9|NZ_CP043414.1_1286146_1286347_+	COG3311, AlpA, Predicted transcriptional regulator [Transcription]
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	5	1546507-1546648	5	CRISPRCasFinder	no		WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Orphan	CACATGTAGGGCGGATAAGGCGTTCACGCCGCATCCGCCAAT	42	0	0	NA	NA	NA	1	1	Orphan	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA|106aa|down_7|NZ_CP043414.1_1553940_1554258_-	NA|112aa|up_9|NZ_CP043414.1_1538978_1539314_+	PRK15468, PRK15468, ethanolamine utilization microcompartment protein EutS	NA|160aa|up_8|NZ_CP043414.1_1539326_1539806_+	PRK15467, PRK15467, ethanolamine utilization acetate kinase EutP	NA|234aa|up_7|NZ_CP043414.1_1539780_1540482_+	PRK15457, PRK15457, ethanolamine utilization acetate kinase EutQ	NA|268aa|up_6|NZ_CP043414.1_1540478_1541282_+	PRK15020, PRK15020, ethanolamine utilization cob(I)yrinic acid a,c-diamide adenosyltransferase EutT	NA|339aa|up_5|NZ_CP043414.1_1541278_1542295_+	PRK09653, eutD, phosphotransacetylase	NA|98aa|up_4|NZ_CP043414.1_1542333_1542627_+	PRK15474, PRK15474, ethanolamine utilization microcompartment protein EutM	NA|96aa|up_3|NZ_CP043414.1_1542733_1543021_+	PRK15448, PRK15448, ethanolamine utilization microcompartment protein EutN	NA|468aa|up_2|NZ_CP043414.1_1543032_1544436_+	PRK15398, PRK15398, aldehyde dehydrogenase	NA|279aa|up_1|NZ_CP043414.1_1544446_1545283_+	COG4820, EutJ, Ethanolamine utilization protein, possible chaperonin [Amino acid transport and metabolism]	NA|396aa|up_0|NZ_CP043414.1_1545272_1546460_+	PRK15454, PRK15454, ethanolamine utilization ethanol dehydrogenase EutG	NA|409aa|down_0|NZ_CP043414.1_1546676_1547903_+	COG3192, EutH, Ethanolamine utilization protein [Amino acid transport and metabolism]	NA|468aa|down_1|NZ_CP043414.1_1547899_1549303_+	PRK10719, eutA, ethanolamine ammonia-lyase reactivating factor EutA	NA|454aa|down_2|NZ_CP043414.1_1549314_1550676_+	COG4303, EutB, Ethanolamine ammonia-lyase, large subunit [Amino acid transport and metabolism]	NA|296aa|down_3|NZ_CP043414.1_1550696_1551584_+	COG4302, EutC, Ethanolamine ammonia-lyase, small subunit [Amino acid transport and metabolism]	NA|220aa|down_4|NZ_CP043414.1_1551593_1552253_+	PRK15405, PRK15405, ethanolamine utilization microcompartment protein EutL	NA|167aa|down_5|NZ_CP043414.1_1552265_1552766_+	PRK15466, PRK15466, ethanolamine utilization microcompartment protein EutK	NA|351aa|down_6|NZ_CP043414.1_1552811_1553864_+	PRK10130, PRK10130, HTH-type transcriptional regulator EutR	NA|106aa|down_7|NZ_CP043414.1_1553940_1554258_-	NA	NA|300aa|down_8|NZ_CP043414.1_1555698_1556598_-	PRK05330, PRK05330, oxygen-dependent coproporphyrinogen oxidase	NA|290aa|down_9|NZ_CP043414.1_1556601_1557471_-	PRK10319, PRK10319, N-acetylmuramoyl-L-alanine amidase AmiA
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	6	1757529-1757637	6	CRISPRCasFinder	no		WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Orphan	GCCGGATAAGGCATTTTACGCCGCATCC	28	0	0	NA	NA	NA	1	1	Orphan	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA|357aa|up_3|NZ_CP043414.1_1753457_1754528_-,NA	NA|301aa|up_9|NZ_CP043414.1_1745364_1746267_-	PRK09956, PRK09956, ISNCY family transposase	NA|397aa|up_8|NZ_CP043414.1_1746460_1747651_-	TIGR03379, glycerol3P_GlpC, glycerol-3-phosphate dehydrogenase, anaerobic, C subunit	NA|420aa|up_7|NZ_CP043414.1_1747647_1748907_-	COG3075, GlpB, Anaerobic glycerol-3-phosphate dehydrogenase [Amino acid transport and metabolism]	NA|543aa|up_6|NZ_CP043414.1_1748896_1750525_-	PRK11101, glpA, anaerobic glycerol-3-phosphate dehydrogenase subunit A	NA|453aa|up_5|NZ_CP043414.1_1750798_1752157_+	PRK11273, glpT, glycerol-3-phosphate transporter	NA|359aa|up_4|NZ_CP043414.1_1752161_1753238_+	PRK11143, glpQ, glycerophosphodiester phosphodiesterase; Provisional	NA|357aa|up_3|NZ_CP043414.1_1753457_1754528_-	NA	NA|217aa|up_2|NZ_CP043414.1_1755415_1756066_+	PRK09902, PRK09902, lipopolysaccharide kinase InaA	NA|85aa|up_1|NZ_CP043414.1_1756118_1756373_-	PRK10713, PRK10713, 2Fe-2S ferredoxin-like protein	NA|377aa|up_0|NZ_CP043414.1_1756372_1757503_-	PRK09101, nrdB, ribonucleotide-diphosphate reductase subunit beta; Reviewed	NA|762aa|down_0|NZ_CP043414.1_1757649_1759935_-	PRK09103, PRK09103, ribonucleoside-diphosphate reductase subunit alpha	NA|1253aa|down_1|NZ_CP043414.1_1760630_1764389_+	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|241aa|down_2|NZ_CP043414.1_1764528_1765251_-	PRK05134, PRK05134, bifunctional 2-polyprenyl-6-hydroxyphenol methylase/3-demethylubiquinol 3-O-methyltransferase UbiG	NA|876aa|down_3|NZ_CP043414.1_1765397_1768025_+	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|563aa|down_4|NZ_CP043414.1_1768171_1769860_+	COG4685, COG4685, Uncharacterized protein conserved in bacteria [Function unknown]	NA|208aa|down_5|NZ_CP043414.1_1769856_1770480_+	COG3234, COG3234, Uncharacterized protein conserved in bacteria [Function unknown]	NA|1465aa|down_6|NZ_CP043414.1_1770623_1775018_+	COG2373, COG2373, Large extracellular alpha-helical protein [General function prediction only]	NA|550aa|down_7|NZ_CP043414.1_1775018_1776668_+	COG5445, COG5445, Predicted secreted protein [Function unknown]	NA|259aa|down_8|NZ_CP043414.1_1776672_1777449_+	COG4676, COG4676, Uncharacterized protein conserved in bacteria [Function unknown]	NA|395aa|down_9|NZ_CP043414.1_1777522_1778707_-	PRK05790, PRK05790, putative acyltransferase; Provisional
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	7	1993398-1993539	7	CRISPRCasFinder	no		WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Orphan	TGTTTGTCGGATGCGGCGTGAACGCCTTATCCGACCTACGGTTCGGATTTGTAG	54	0	0	NA	NA	NA	1	1	Orphan	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA	NA|163aa|up_9|NZ_CP043414.1_1983909_1984398_+	PRK10191, PRK10191, putative acyl transferase; Provisional	NA|406aa|up_8|NZ_CP043414.1_1984394_1985612_+	TIGR04015, WcaC, colanic acid biosynthesis glycosyl transferase WcaC	NA|406aa|up_7|NZ_CP043414.1_1985586_1986804_+	TIGR04010, WcaD, putative colanic acid polymerase WcaD	NA|249aa|up_6|NZ_CP043414.1_1986814_1987561_+	PRK10063, PRK10063, colanic acid biosynthesis glycosyltransferase WcaE	NA|183aa|up_5|NZ_CP043414.1_1987576_1988125_+	TIGR04008, WcaF, colanic acid biosynthesis acetyltransferase WcaF	NA|374aa|up_4|NZ_CP043414.1_1988150_1989272_+	COG1089, Gmd, GDP-D-mannose dehydratase [Cell envelope biogenesis, outer membrane]	NA|322aa|up_3|NZ_CP043414.1_1989274_1990240_+	cd05239, GDP_FS_SDR_e, GDP-fucose synthetase, extended (e) SDRs	NA|160aa|up_2|NZ_CP043414.1_1990242_1990722_+	PRK15434, PRK15434, GDP-mannose mannosyl hydrolase	NA|408aa|up_1|NZ_CP043414.1_1990718_1991942_+	TIGR04007, wcaI, colanic acid biosynthesis glycosyl transferase WcaI	NA|479aa|up_0|NZ_CP043414.1_1991944_1993381_+	PRK15460, cpsB, mannose-1-phosphate guanyltransferase; Provisional	NA|457aa|down_0|NZ_CP043414.1_1993661_1995032_+	PRK15414, PRK15414, phosphomannomutase	NA|465aa|down_1|NZ_CP043414.1_1995167_1996562_+	PRK10124, PRK10124, putative UDP-glucose lipid carrier transferase; Provisional	NA|493aa|down_2|NZ_CP043414.1_1996563_1998042_+	PRK10459, PRK10459, MOP flippase family protein	NA|427aa|down_3|NZ_CP043414.1_1998113_1999394_+	TIGR04006, wcaK, colanic acid biosynthesis pyruvyl transferase WcaK	NA|407aa|down_4|NZ_CP043414.1_1999390_2000611_+	TIGR04005, wcaL, colanic acid biosynthesis glycosyltransferase WcaL	NA|465aa|down_5|NZ_CP043414.1_2000621_2002016_+	PRK10123, wcaM, putative colanic acid biosynthesis protein; Provisional	NA|332aa|down_6|NZ_CP043414.1_2002173_2003169_+	cd05238, Gne_like_SDR_e, Escherichia coli Gne (a nucleoside-diphosphate-sugar 4-epimerase)-like, extended (e) SDRs	NA|298aa|down_7|NZ_CP043414.1_2003411_2004305_+	PRK10122, PRK10122, UTP--glucose-1-phosphate uridylyltransferase GalF	NA|305aa|down_8|NZ_CP043414.1_2004521_2005436_+	cd04195, GT2_AmsE_like, GT2_AmsE_like is involved in exopolysaccharide amylovora biosynthesis	NA|589aa|down_9|NZ_CP043414.1_2005437_2007204_+	COG5610, COG5610, Predicted hydrolase (HAD superfamily) [General function prediction only]
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	8	2383640-2383763	8	CRISPRCasFinder	no	DEDDh	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA|30aa|down_7|NZ_CP043414.1_2392660_2392750_+	NA|471aa|up_9|NZ_CP043414.1_2373081_2374494_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|NZ_CP043414.1_2375050_2375260_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|NZ_CP043414.1_2375715_2376342_+	PRK09898, PRK09898, ferredoxin-like protein	NA|701aa|up_6|NZ_CP043414.1_2376362_2378465_+	PRK09849, PRK09849, putative oxidoreductase; Provisional	NA|217aa|up_5|NZ_CP043414.1_2378477_2379128_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|NZ_CP043414.1_2379191_2379860_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|NZ_CP043414.1_2379856_2380642_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|271aa|up_2|NZ_CP043414.1_2380645_2381458_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|537aa|up_1|NZ_CP043414.1_2381463_2383074_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|102aa|up_0|NZ_CP043414.1_2383199_2383505_-	PRK11118, PRK11118, putative monooxygenase; Provisional	NA|419aa|down_0|NZ_CP043414.1_2384078_2385335_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|NZ_CP043414.1_2385375_2386749_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|214aa|down_2|NZ_CP043414.1_2386963_2387605_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|NZ_CP043414.1_2387644_2388793_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|NZ_CP043414.1_2389083_2390295_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|NZ_CP043414.1_2390407_2391340_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|NZ_CP043414.1_2391336_2392362_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|30aa|down_7|NZ_CP043414.1_2392660_2392750_+	NA	NA|390aa|down_8|NZ_CP043414.1_2392915_2394085_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|194aa|down_9|NZ_CP043414.1_2394230_2394812_-	PRK10543, PRK10543, superoxide dismutase [Fe]
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	9	3085663-3085754	9	CRISPRCasFinder	no		WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Orphan	CCACCTTTTTTACCTGCTTCAGATGC	26	0	0	NA	NA	NA	1	1	Orphan	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA|70aa|up_9|NZ_CP043414.1_3074738_3074948_-,NA	NA|70aa|up_9|NZ_CP043414.1_3074738_3074948_-	NA	NA|1321aa|up_8|NZ_CP043414.1_3075002_3078965_+	PRK11809, putA, trifunctional transcriptional regulator/proline dehydrogenase/pyrroline-5-carboxylate dehydrogenase; Reviewed	NA|213aa|up_7|NZ_CP043414.1_3079004_3079643_-	PRK15008, PRK15008, HTH-type transcriptional regulator RutR; Provisional	NA|364aa|up_6|NZ_CP043414.1_3079930_3081022_+	TIGR03612, RutA, pyrimidine utilization protein A	NA|231aa|up_5|NZ_CP043414.1_3081021_3081714_+	TIGR03614, RutB, pyrimidine utilization protein B	NA|129aa|up_4|NZ_CP043414.1_3081725_3082112_+	TIGR03610, RutC, pyrimidine utilization protein C	NA|267aa|up_3|NZ_CP043414.1_3082119_3082920_+	TIGR03611, RutD, pyrimidine utilization protein D	NA|197aa|up_2|NZ_CP043414.1_3082929_3083520_+	PRK05365, PRK05365, malonic semialdehyde reductase; Provisional	NA|165aa|up_1|NZ_CP043414.1_3083530_3084025_+	TIGR03615, flavoprotein_oxidoreductase, pyrimidine utilization flavin reductase protein F	NA|443aa|up_0|NZ_CP043414.1_3084045_3085374_+	TIGR03616, Putative_pyrimidine_permease_RutG, pyrimidine utilization transport protein G	NA|199aa|down_0|NZ_CP043414.1_3086177_3086774_+	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|76aa|down_1|NZ_CP043414.1_3086794_3087022_+	PRK10174, PRK10174, hypothetical protein; Provisional	NA|414aa|down_2|NZ_CP043414.1_3087059_3088301_-	PRK10173, PRK10173, glucose-1-phosphatase/inositol phosphatase; Provisional	NA|418aa|down_3|NZ_CP043414.1_3088595_3089849_-	PRK09784, PRK09784, YccE family protein	NA|307aa|down_4|NZ_CP043414.1_3090106_3091027_+	PRK10266, PRK10266, curved DNA-binding protein	NA|102aa|down_5|NZ_CP043414.1_3091026_3091332_+	PRK10265, PRK10265, chaperone modulator CbpM	NA|200aa|down_6|NZ_CP043414.1_3091483_3092083_-	PRK04976, torD, chaperone protein TorD; Validated	NA|849aa|down_7|NZ_CP043414.1_3092079_3094626_-	PRK15102, PRK15102, trimethylamine-N-oxide reductase TorA	NA|391aa|down_8|NZ_CP043414.1_3094625_3095798_-	PRK15032, PRK15032, pentaheme c-type cytochrome TorC	NA|231aa|down_9|NZ_CP043414.1_3095927_3096620_+	PRK10766, PRK10766, two-component system response regulator TorR
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	10	3430179-3430315	10	CRISPRCasFinder	no		WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Orphan	GATAAGATACGTCAGCATCGCATCCGACAATAAGTGCCGGATGCG	45	0	0	NA	NA	NA	1	1	Orphan	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA|551aa|up_8|NZ_CP043414.1_3418744_3420397_+,NA	NA|766aa|up_9|NZ_CP043414.1_3415963_3418261_-	PRK15377, PRK15377, type III secretion system effector HECT-type E3 ubiquitin transferase	NA|551aa|up_8|NZ_CP043414.1_3418744_3420397_+	NA	NA|674aa|up_7|NZ_CP043414.1_3420555_3422577_-	PRK05298, PRK05298, excinuclease ABC subunit UvrB	NA|226aa|up_6|NZ_CP043414.1_3423155_3423833_-	PRK00090, bioD, ATP-dependent dethiobiotin synthetase BioD	NA|252aa|up_5|NZ_CP043414.1_3423825_3424581_-	PRK10258, PRK10258, biotin biosynthesis protein BioC; Provisional	NA|385aa|up_4|NZ_CP043414.1_3424567_3425722_-	PRK05958, PRK05958, 8-amino-7-oxononanoate synthase; Reviewed	NA|347aa|up_3|NZ_CP043414.1_3425718_3426759_-	PRK15108, PRK15108, biotin synthase; Provisional	NA|430aa|up_2|NZ_CP043414.1_3426845_3428135_+	PRK07986, PRK07986, adenosylmethionine--8-amino-7-oxononanoate transaminase; Validated	NA|159aa|up_1|NZ_CP043414.1_3428193_3428670_+	PRK10257, PRK10257, putative kinase inhibitor protein; Provisional	NA|428aa|up_0|NZ_CP043414.1_3428821_3430105_+	PRK10531, PRK10531, putative acyl-CoA thioester hydrolase	NA|754aa|down_0|NZ_CP043414.1_3430337_3432599_-	PRK11413, PRK11413, putative hydratase; Provisional	NA|478aa|down_1|NZ_CP043414.1_3432781_3434215_-	pfam00939, Na_sulph_symp, Sodium:sulfate symporter transmembrane region	NA|351aa|down_2|NZ_CP043414.1_3434289_3435342_-	NF033377, OMA_tautomer, 4-oxalomesaconate tautomerase	NA|318aa|down_3|NZ_CP043414.1_3435525_3436479_+	cd08440, PBP2_LTTR_like_4, TThe C-terminal substrate binding domain of an uncharacterized LysR-type transcriptional regulator, contains the type 2 periplasmic binding fold	NA|332aa|down_4|NZ_CP043414.1_3436519_3437515_-	PRK11028, PRK11028, 6-phosphogluconolactonase; Provisional	NA|273aa|down_5|NZ_CP043414.1_3437669_3438488_+	PRK10530, PRK10530, pyridoxal phosphate (PLP) phosphatase; Provisional	NA|353aa|down_6|NZ_CP043414.1_3438488_3439547_-	PRK11144, modC, molybdenum ABC transporter ATP-binding protein ModC	NA|230aa|down_7|NZ_CP043414.1_3439549_3440239_-	PRK09421, modB, molybdate ABC transporter permease subunit	NA|258aa|down_8|NZ_CP043414.1_3440238_3441012_-	PRK10677, modA, molybdate transporter periplasmic protein; Provisional	NA|50aa|down_9|NZ_CP043414.1_3441177_3441327_-	pfam10766, AcrZ, Multidrug efflux pump-associated protein AcrZ
GCF_009931435.1_ASM993143v1	NZ_CP043414	Escherichia coli strain EC42405 chromosome, complete genome	11	4649572-4649683	11	CRISPRCasFinder	no		WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Orphan	TGTAGGCCGGATAAGGCGTAGCCGCCATCCGGC	33	0	0	NA	NA	NA	1	1	Orphan	WYL,cas3,RT,csa3,PD-DExK,c2c9_V-U4,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA	NA|148aa|up_9|NZ_CP043414.1_4641775_4642219_+	PRK10148, PRK10148, VOC family metalloprotein YjdN	NA|263aa|up_8|NZ_CP043414.1_4642351_4643140_+	PRK09984, PRK09984, phosphonate ABC transporter ATP-binding protein	NA|339aa|up_7|NZ_CP043414.1_4643164_4644181_+	cd13575, PBP2_PnhD, Substrate binding domain of ABC-type phosphonate uptake system; contains the type 2 periplasmic binding fold	NA|260aa|up_6|NZ_CP043414.1_4644307_4645087_+	COG3639, COG3639, ABC-type phosphate/phosphonate transport system, permease component [Inorganic ion transport and metabolism]	NA|242aa|up_5|NZ_CP043414.1_4645107_4645833_+	PRK10079, PRK10079, phosphonate metabolism transcriptional regulator PhnF; Provisional	NA|151aa|up_4|NZ_CP043414.1_4645833_4646286_+	COG3624, PhnG, Uncharacterized enzyme of phosphonate metabolism [Inorganic ion transport and metabolism]	NA|195aa|up_3|NZ_CP043414.1_4646282_4646867_+	COG3625, PhnH, Uncharacterized enzyme of phosphonate metabolism [Inorganic ion transport and metabolism]	NA|355aa|up_2|NZ_CP043414.1_4646866_4647931_+	COG3626, PhnI, Uncharacterized enzyme of phosphonate metabolism [Inorganic ion transport and metabolism]	NA|282aa|up_1|NZ_CP043414.1_4647923_4648769_+	COG3627, PhnJ, Uncharacterized enzyme of phosphonate metabolism [Inorganic ion transport and metabolism]	NA|253aa|up_0|NZ_CP043414.1_4648765_4649524_+	PRK11701, phnK, phosphonate C-P lyase system protein PhnK; Provisional	NA|227aa|down_0|NZ_CP043414.1_4649703_4650384_+	COG4778, PhnL, ABC-type phosphonate transport system, ATPase component [Inorganic ion transport and metabolism]	NA|379aa|down_1|NZ_CP043414.1_4650380_4651517_+	PRK15446, PRK15446, phosphonate metabolism protein PhnM; Provisional	NA|186aa|down_2|NZ_CP043414.1_4651516_4652074_+	PRK10078, PRK10078, ribose 1,5-bisphosphokinase; Provisional	NA|145aa|down_3|NZ_CP043414.1_4652060_4652495_+	PRK10146, PRK10146, aminoalkylphosphonate N-acetyltransferase	NA|253aa|down_4|NZ_CP043414.1_4652496_4653255_+	PRK11244, phnP, carbon-phosphorus lyase complex accessory protein; Provisional	NA|103aa|down_5|NZ_CP043414.1_4653289_4653598_-	PRK12704, PRK12704, phosphodiesterase; Provisional	NA|106aa|down_6|NZ_CP043414.1_4653666_4653984_-	TIGR01120, Ribose-5-phosphate_isomerase_B, ribose 5-phosphate isomerase B	NA|662aa|down_7|NZ_CP043414.1_4654236_4656222_+	COG2015, COG2015, Alkyl sulfatase and related hydrolases [Secondary metabolites biosynthesis, transport, and catabolism]	NA|92aa|down_8|NZ_CP043414.1_4656430_4656706_+	pfam17090, Ytca, Uncharacterized protein family	NA|344aa|down_9|NZ_CP043414.1_4656724_4657756_+	PRK10476, PRK10476, multidrug transporter subunit MdtN
