assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_003031225.1_ASM303122v1	NZ_CP019961	Escherichia coli strain HKUOPY1 chromosome, complete genome	1	170644-170788	1	CRISPRCasFinder	no		RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	Orphan	GTAGGTCGGATAAGATGCGCAAGCATCGCATCCGACAATAAGTGCCGGATGC	52	0	0	NA	NA	NA	1	1	Orphan	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	NA,NA	NA|330aa|up_9|NZ_CP019961.1_158542_159532_-	PRK00164, moaA, GTP 3',8-cyclase MoaA	NA|303aa|up_8|NZ_CP019961.1_159928_160837_+	TIGR01826, Putative_gluconeogenesis_factor, conserved hypothetical protein, cofD-related	NA|674aa|up_7|NZ_CP019961.1_161028_163050_-	PRK05298, PRK05298, excinuclease ABC subunit UvrB	NA|226aa|up_6|NZ_CP019961.1_163628_164306_-	PRK00090, bioD, ATP-dependent dethiobiotin synthetase BioD	NA|252aa|up_5|NZ_CP019961.1_164298_165054_-	PRK10258, PRK10258, biotin biosynthesis protein BioC; Provisional	NA|385aa|up_4|NZ_CP019961.1_165040_166195_-	PRK05958, PRK05958, 8-amino-7-oxononanoate synthase; Reviewed	NA|347aa|up_3|NZ_CP019961.1_166191_167232_-	PRK15108, PRK15108, biotin synthase; Provisional	NA|430aa|up_2|NZ_CP019961.1_167318_168608_+	PRK07986, PRK07986, adenosylmethionine--8-amino-7-oxononanoate transaminase; Validated	NA|159aa|up_1|NZ_CP019961.1_168666_169143_+	PRK10257, PRK10257, putative kinase inhibitor protein; Provisional	NA|428aa|up_0|NZ_CP019961.1_169294_170578_+	PRK10531, PRK10531, putative acyl-CoA thioester hydrolase	NA|754aa|down_0|NZ_CP019961.1_170811_173073_-	PRK11413, PRK11413, putative hydratase; Provisional	NA|478aa|down_1|NZ_CP019961.1_173255_174689_-	pfam00939, Na_sulph_symp, Sodium:sulfate symporter transmembrane region	NA|351aa|down_2|NZ_CP019961.1_174764_175817_-	NF033377, OMA_tautomer, 4-oxalomesaconate tautomerase	NA|318aa|down_3|NZ_CP019961.1_176000_176954_+	cd08440, PBP2_LTTR_like_4, TThe C-terminal substrate binding domain of an uncharacterized LysR-type transcriptional regulator, contains the type 2 periplasmic binding fold	NA|332aa|down_4|NZ_CP019961.1_176994_177990_-	PRK11028, PRK11028, 6-phosphogluconolactonase; Provisional	NA|273aa|down_5|NZ_CP019961.1_178144_178963_+	PRK10530, PRK10530, pyridoxal phosphate (PLP) phosphatase; Provisional	NA|353aa|down_6|NZ_CP019961.1_178963_180022_-	PRK11144, modC, molybdenum ABC transporter ATP-binding protein ModC	NA|230aa|down_7|NZ_CP019961.1_180024_180714_-	PRK09421, modB, molybdate ABC transporter permease subunit	NA|258aa|down_8|NZ_CP019961.1_180713_181487_-	PRK10677, modA, molybdate transporter periplasmic protein; Provisional	NA|50aa|down_9|NZ_CP019961.1_181653_181803_-	pfam10766, AcrZ, Multidrug efflux pump-associated protein AcrZ
GCF_003031225.1_ASM303122v1	NZ_CP019961	Escherichia coli strain HKUOPY1 chromosome, complete genome	2	761416-761512	2	CRISPRCasFinder	no		RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	Orphan	GCCAGCGTCGCATCAGGCATCCGCGCA	27	0	0	NA	NA	NA	1	1	Orphan	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	NA,NA	NA|153aa|up_9|NZ_CP019961.1_753294_753753_-	PRK09177, PRK09177, xanthine-guanine phosphoribosyltransferase; Validated	NA|486aa|up_8|NZ_CP019961.1_754013_755471_+	PRK15026, PRK15026, aminoacyl-histidine dipeptidase; Provisional	NA|179aa|up_7|NZ_CP019961.1_755527_756064_-	PRK08179, prfH, peptide chain release factor-like protein; Reviewed	NA|89aa|up_6|NZ_CP019961.1_755996_756263_-	PRK09588, PRK09588, hypothetical protein; Reviewed	NA|151aa|up_5|NZ_CP019961.1_756496_756949_-	PRK09831, PRK09831, GNAT family N-acetyltransferase	NA|133aa|up_4|NZ_CP019961.1_756958_757357_-	PRK09885, PRK09885, type II toxin-antitoxin system YafO family toxin	NA|98aa|up_3|NZ_CP019961.1_757359_757653_-	PRK09778, PRK09778, type I toxin-antitoxin system antitoxin YafN	NA|352aa|up_2|NZ_CP019961.1_757704_758760_-	PRK02406, PRK02406, DNA polymerase IV; Validated	NA|257aa|up_1|NZ_CP019961.1_758830_759601_-	PRK06778, PRK06778, hypothetical protein; Validated	NA|580aa|up_0|NZ_CP019961.1_759560_761300_+	COG1298, FlhA, Flagellar biosynthesis pathway, component FlhA [Cell motility and secretion / Intracellular trafficking and secretion]	NA|166aa|down_0|NZ_CP019961.1_761515_762013_-	COG1943, COG1943, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|258aa|down_1|NZ_CP019961.1_762188_762962_-	COG0791, Spr, Cell wall-associated hydrolases (invasion-associated proteins) [Cell envelope biogenesis, outer membrane]	NA|87aa|down_2|NZ_CP019961.1_763147_763408_+	COG3077, RelB, DNA-damage-inducible protein J [DNA replication, recombination, and repair]	NA|93aa|down_3|NZ_CP019961.1_763410_763689_+	COG3041, COG3041, Uncharacterized protein conserved in bacteria [Function unknown]	NA|247aa|down_4|NZ_CP019961.1_763844_764585_+	COG3034, COG3034, Uncharacterized protein conserved in bacteria [Function unknown]	NA|256aa|down_5|NZ_CP019961.1_764555_765323_-	pfam13230, GATase_4, Glutamine amidotransferases class-II	NA|193aa|down_6|NZ_CP019961.1_765528_766107_-	PRK00414, gmhA, D-sedoheptulose 7-phosphate isomerase	NA|815aa|down_7|NZ_CP019961.1_766346_768791_+	PRK09463, fadE, acyl-CoA dehydrogenase; Reviewed	NA|158aa|down_8|NZ_CP019961.1_768833_769307_-	PRK09993, PRK09993, C-lysozyme inhibitor; Provisional	NA|257aa|down_9|NZ_CP019961.1_769460_770231_+	PRK10438, PRK10438, C-N hydrolase family amidase; Provisional
GCF_003031225.1_ASM303122v1	NZ_CP019961	Escherichia coli strain HKUOPY1 chromosome, complete genome	3	984429-984570	3	CRISPRCasFinder	no		RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	Orphan	GCTGGAGAGCAACCGTAGGCCGGATAAGATGCGCCAGCATCGCATCCGGCGA	52	0	0	NA	NA	NA	1	1	Orphan	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	NA,NA	NA|96aa|up_9|NZ_CP019961.1_973420_973708_-	PRK15449, PRK15449, ferredoxin-like protein FixX; Provisional	NA|429aa|up_8|NZ_CP019961.1_973704_974991_-	PRK10157, PRK10157, putative oxidoreductase FixC; Provisional	NA|314aa|up_7|NZ_CP019961.1_975041_975983_-	PRK03363, fixB, electron transfer flavoprotein subunit alpha/FixB family protein	NA|257aa|up_6|NZ_CP019961.1_975997_976768_-	PRK03359, PRK03359, putative electron transfer flavoprotein FixA; Reviewed	NA|505aa|up_5|NZ_CP019961.1_977240_978755_+	PRK03356, PRK03356, L-carnitine/gamma-butyrobetaine antiport BCCT transporter	NA|381aa|up_4|NZ_CP019961.1_978785_979928_+	PRK03354, PRK03354, crotonobetainyl-CoA dehydrogenase; Validated	NA|406aa|up_3|NZ_CP019961.1_980056_981274_+	PRK03525, PRK03525, L-carnitine CoA-transferase	NA|518aa|up_2|NZ_CP019961.1_981347_982901_+	PRK08008, caiC, putative crotonobetaine/carnitine-CoA ligase; Validated	NA|262aa|up_1|NZ_CP019961.1_983009_983795_+	PRK03580, PRK03580, crotonobetainyl-CoA hydratase	NA|197aa|up_0|NZ_CP019961.1_983800_984391_+	PRK13627, PRK13627, carnitine operon protein CaiE; Provisional	NA|132aa|down_0|NZ_CP019961.1_984599_984995_-	PRK11476, PRK11476, carnitine metabolism transcriptional regulator CaiF	NA|1074aa|down_1|NZ_CP019961.1_985256_988478_-	PRK05294, carB, carbamoyl-phosphate synthase large subunit	NA|383aa|down_2|NZ_CP019961.1_988495_989644_-	PRK12564, PRK12564, carbamoyl-phosphate synthase small subunit	NA|274aa|down_3|NZ_CP019961.1_990099_990921_-	COG0289, DapB, Dihydrodipicolinate reductase [Amino acid transport and metabolism]	NA|305aa|down_4|NZ_CP019961.1_991087_992002_-	PRK10768, PRK10768, ribonucleoside hydrolase RihC; Provisional	NA|317aa|down_5|NZ_CP019961.1_992067_993018_-	PRK01045, ispH, 4-hydroxy-3-methylbut-2-enyl diphosphate reductase; Reviewed	NA|150aa|down_6|NZ_CP019961.1_993019_993469_-	PRK15095, PRK15095, FKBP-type peptidyl-prolyl cis-trans isomerase; Provisional	NA|165aa|down_7|NZ_CP019961.1_993593_994088_-	PRK00376, lspA, lipoprotein signal peptidase	NA|939aa|down_8|NZ_CP019961.1_994087_996904_-	PRK05743, ileS, isoleucyl-tRNA synthetase; Reviewed	NA|314aa|down_9|NZ_CP019961.1_996946_997888_-	PRK05627, PRK05627, bifunctional riboflavin kinase/FAD synthetase
GCF_003031225.1_ASM303122v1	NZ_CP019961	Escherichia coli strain HKUOPY1 chromosome, complete genome	4	2772743-2773442	1,4,1	PILER-CR,CRISPRCasFinder,CRT	no	cas3	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	Unclear	GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	10,11,11	11	Unclear	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	NA|47aa|up_1|NZ_CP019961.1_2771452_2771593_-,NA	NA|434aa|up_9|NZ_CP019961.1_2762149_2763451_+	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|745aa|up_8|NZ_CP019961.1_2763498_2765733_+	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|83aa|up_7|NZ_CP019961.1_2765810_2766059_+	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|112aa|up_6|NZ_CP019961.1_2766058_2766394_+	PRK09907, PRK09907, endoribonuclease MazF	NA|264aa|up_5|NZ_CP019961.1_2766464_2767256_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_4|NZ_CP019961.1_2767483_2769121_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_3|NZ_CP019961.1_2769208_2770507_+	PRK00077, eno, enolase; Provisional	NA|291aa|up_2|NZ_CP019961.1_2770566_2771439_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|47aa|up_1|NZ_CP019961.1_2771452_2771593_-	NA	NA|224aa|up_0|NZ_CP019961.1_2771731_2772403_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|493aa|down_0|NZ_CP019961.1_2774080_2775559_-	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|426aa|down_1|NZ_CP019961.1_2775585_2776863_-	cd06174, MFS, Major Facilitator Superfamily	NA|262aa|down_2|NZ_CP019961.1_2777181_2777967_+	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|485aa|down_3|NZ_CP019961.1_2778036_2779491_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|446aa|down_4|NZ_CP019961.1_2779584_2780922_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|260aa|down_5|NZ_CP019961.1_2780899_2781679_+	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|287aa|down_6|NZ_CP019961.1_2781675_2782536_+	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|192aa|down_7|NZ_CP019961.1_2782683_2783259_-	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|87aa|down_8|NZ_CP019961.1_2783275_2783536_-	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|424aa|down_9|NZ_CP019961.1_2783526_2784798_-	PRK10015, PRK10015, oxidoreductase; Provisional
GCF_003031225.1_ASM303122v1	NZ_CP019961	Escherichia coli strain HKUOPY1 chromosome, complete genome	5	2798992-2799569	5,2,2	CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	Type I-E	GAGTTCCCCGCGCCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	9,9,3	9	TypeI-E	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	NA,NA	NA|571aa|up_9|NZ_CP019961.1_2787355_2789068_+	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit	NA|245aa|up_8|NZ_CP019961.1_2789142_2789877_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	cas3|889aa|up_7|NZ_CP019961.1_2790235_2792902_+	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	cas8e|503aa|up_6|NZ_CP019961.1_2793316_2794825_+	PRK09693, PRK09693, Cascade antiviral complex protein; Validated	cse2gr11|161aa|up_5|NZ_CP019961.1_2794817_2795300_+	cd09670, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|364aa|up_4|NZ_CP019961.1_2795312_2796404_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|225aa|up_3|NZ_CP019961.1_2796406_2797081_+	TIGR01868, hypothetical_protein, CRISPR-associated protein Cas5/CasD, subtype I-E/ECOLI	cas6e|200aa|up_2|NZ_CP019961.1_2797067_2797667_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas1|306aa|up_1|NZ_CP019961.1_2797682_2798600_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|95aa|up_0|NZ_CP019961.1_2798601_2798886_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|346aa|down_0|NZ_CP019961.1_2799589_2800627_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|NZ_CP019961.1_2800878_2801787_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|476aa|down_2|NZ_CP019961.1_2801788_2803216_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|NZ_CP019961.1_2803215_2803821_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|108aa|down_4|NZ_CP019961.1_2803870_2804194_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|NZ_CP019961.1_2804387_2804699_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|NZ_CP019961.1_2804717_2805428_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|NZ_CP019961.1_2805427_2805907_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|NZ_CP019961.1_2805903_2806953_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|NZ_CP019961.1_2806933_2807695_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCF_003031225.1_ASM303122v1	NZ_CP019961	Escherichia coli strain HKUOPY1 chromosome, complete genome	6	3331832-3331949	6	CRISPRCasFinder	no		RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	Orphan	CCGAGCCGTAGGCCGGATAAGGCGTTCACGC	31	0	0	NA	NA	NA	1	1	Orphan	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	NA,NA	NA|268aa|up_9|NZ_CP019961.1_3320468_3321272_+	PRK10128, PRK10128, 2-keto-3-deoxy-L-rhamnonate aldolase; Provisional	NA|301aa|up_8|NZ_CP019961.1_3321312_3322215_-	PRK09956, PRK09956, ISNCY family transposase	NA|397aa|up_7|NZ_CP019961.1_3322407_3323598_-	TIGR03379, glycerol3P_GlpC, glycerol-3-phosphate dehydrogenase, anaerobic, C subunit	NA|420aa|up_6|NZ_CP019961.1_3323594_3324854_-	COG3075, GlpB, Anaerobic glycerol-3-phosphate dehydrogenase [Amino acid transport and metabolism]	NA|543aa|up_5|NZ_CP019961.1_3324843_3326472_-	PRK11101, glpA, anaerobic glycerol-3-phosphate dehydrogenase subunit A	NA|453aa|up_4|NZ_CP019961.1_3326744_3328103_+	PRK11273, glpT, glycerol-3-phosphate transporter	NA|359aa|up_3|NZ_CP019961.1_3328107_3329184_+	PRK11143, glpQ, glycerophosphodiester phosphodiesterase; Provisional	NA|217aa|up_2|NZ_CP019961.1_3329646_3330297_+	PRK09902, PRK09902, lipopolysaccharide kinase InaA	NA|85aa|up_1|NZ_CP019961.1_3330350_3330605_-	PRK10713, PRK10713, 2Fe-2S ferredoxin-like protein	NA|377aa|up_0|NZ_CP019961.1_3330604_3331735_-	PRK09101, nrdB, ribonucleotide-diphosphate reductase subunit beta; Reviewed	NA|762aa|down_0|NZ_CP019961.1_3331968_3334254_-	PRK09103, PRK09103, ribonucleoside-diphosphate reductase subunit alpha	NA|241aa|down_1|NZ_CP019961.1_3338829_3339552_-	PRK05134, PRK05134, bifunctional 2-polyprenyl-6-hydroxyphenol methylase/3-demethylubiquinol 3-O-methyltransferase UbiG	NA|876aa|down_2|NZ_CP019961.1_3339698_3342326_+	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|563aa|down_3|NZ_CP019961.1_3342474_3344163_+	COG4685, COG4685, Uncharacterized protein conserved in bacteria [Function unknown]	NA|208aa|down_4|NZ_CP019961.1_3344159_3344783_+	COG3234, COG3234, Uncharacterized protein conserved in bacteria [Function unknown]	NA|1465aa|down_5|NZ_CP019961.1_3344926_3349321_+	COG2373, COG2373, Large extracellular alpha-helical protein [General function prediction only]	NA|550aa|down_6|NZ_CP019961.1_3349321_3350971_+	COG5445, COG5445, Predicted secreted protein [Function unknown]	NA|259aa|down_7|NZ_CP019961.1_3350975_3351752_+	COG4676, COG4676, Uncharacterized protein conserved in bacteria [Function unknown]	NA|395aa|down_8|NZ_CP019961.1_3351825_3353010_-	PRK05790, PRK05790, putative acyltransferase; Provisional	NA|441aa|down_9|NZ_CP019961.1_3353040_3354363_-	pfam02667, SCFA_trans, Short chain fatty acid transporter
GCF_003031225.1_ASM303122v1	NZ_CP019961	Escherichia coli strain HKUOPY1 chromosome, complete genome	7	3553509-3553649	7	CRISPRCasFinder	no		RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	Orphan	ACCTACGGTTCGGATTTGTAGGCCTGATAAGACGCGGCAGCGTCGCATCAGGC	53	0	0	NA	NA	NA	1	1	Orphan	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	NA,NA	NA|163aa|up_9|NZ_CP019961.1_3543987_3544476_+	PRK10191, PRK10191, putative acyl transferase; Provisional	NA|406aa|up_8|NZ_CP019961.1_3544472_3545690_+	TIGR04015, WcaC, colanic acid biosynthesis glycosyl transferase WcaC	NA|406aa|up_7|NZ_CP019961.1_3545664_3546882_+	TIGR04010, WcaD, putative colanic acid polymerase WcaD	NA|249aa|up_6|NZ_CP019961.1_3546892_3547639_+	PRK10063, PRK10063, colanic acid biosynthesis glycosyltransferase WcaE	NA|183aa|up_5|NZ_CP019961.1_3547654_3548203_+	TIGR04008, WcaF, colanic acid biosynthesis acetyltransferase WcaF	NA|374aa|up_4|NZ_CP019961.1_3548228_3549350_+	COG1089, Gmd, GDP-D-mannose dehydratase [Cell envelope biogenesis, outer membrane]	NA|322aa|up_3|NZ_CP019961.1_3549352_3550318_+	cd05239, GDP_FS_SDR_e, GDP-fucose synthetase, extended (e) SDRs	NA|160aa|up_2|NZ_CP019961.1_3550320_3550800_+	PRK15434, PRK15434, GDP-mannose mannosyl hydrolase	NA|408aa|up_1|NZ_CP019961.1_3550796_3552020_+	TIGR04007, wcaI, colanic acid biosynthesis glycosyl transferase WcaI	NA|479aa|up_0|NZ_CP019961.1_3552022_3553459_+	PRK15460, cpsB, mannose-1-phosphate guanyltransferase; Provisional	NA|457aa|down_0|NZ_CP019961.1_3553739_3555110_+	PRK15414, PRK15414, phosphomannomutase	NA|465aa|down_1|NZ_CP019961.1_3555164_3556559_+	PRK10124, PRK10124, putative UDP-glucose lipid carrier transferase; Provisional	NA|493aa|down_2|NZ_CP019961.1_3556560_3558039_+	PRK10459, PRK10459, MOP flippase family protein	NA|427aa|down_3|NZ_CP019961.1_3558410_3559691_+	TIGR04006, wcaK, colanic acid biosynthesis pyruvyl transferase WcaK	NA|407aa|down_4|NZ_CP019961.1_3559687_3560908_+	TIGR04005, wcaL, colanic acid biosynthesis glycosyltransferase WcaL	NA|465aa|down_5|NZ_CP019961.1_3560918_3562313_+	PRK10123, wcaM, putative colanic acid biosynthesis protein; Provisional	NA|298aa|down_6|NZ_CP019961.1_3562487_3563381_+	PRK10122, PRK10122, UTP--glucose-1-phosphate uridylyltransferase GalF	NA|362aa|down_7|NZ_CP019961.1_3563752_3564838_+	PRK10084, PRK10084, dTDP-glucose 4,6 dehydratase; Provisional	NA|300aa|down_8|NZ_CP019961.1_3564837_3565737_+	PRK09987, PRK09987, dTDP-4-dehydrorhamnose reductase; Provisional	NA|293aa|down_9|NZ_CP019961.1_3565794_3566673_+	PRK15480, PRK15480, glucose-1-phosphate thymidylyltransferase RfbA; Provisional
GCF_003031225.1_ASM303122v1	NZ_CP019961	Escherichia coli strain HKUOPY1 chromosome, complete genome	8	3995865-3995988	8	CRISPRCasFinder	no	DEDDh	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	NA,NA|30aa|down_7|NZ_CP019961.1_4004884_4004974_+	NA|471aa|up_9|NZ_CP019961.1_3985319_3986732_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|NZ_CP019961.1_3987288_3987498_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|NZ_CP019961.1_3987952_3988579_+	PRK09898, PRK09898, ferredoxin-like protein	NA|701aa|up_6|NZ_CP019961.1_3988599_3990702_+	PRK09849, PRK09849, putative oxidoreductase; Provisional	NA|216aa|up_5|NZ_CP019961.1_3990705_3991353_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|NZ_CP019961.1_3991416_3992085_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|NZ_CP019961.1_3992081_3992867_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|271aa|up_2|NZ_CP019961.1_3992870_3993683_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|535aa|up_1|NZ_CP019961.1_3993694_3995299_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|102aa|up_0|NZ_CP019961.1_3995424_3995730_-	PRK11118, PRK11118, putative monooxygenase; Provisional	NA|419aa|down_0|NZ_CP019961.1_3996302_3997559_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|NZ_CP019961.1_3997599_3998973_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|214aa|down_2|NZ_CP019961.1_3999187_3999829_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|NZ_CP019961.1_3999868_4001017_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|NZ_CP019961.1_4001307_4002519_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|NZ_CP019961.1_4002631_4003564_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|NZ_CP019961.1_4003560_4004586_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|30aa|down_7|NZ_CP019961.1_4004884_4004974_+	NA	NA|390aa|down_8|NZ_CP019961.1_4005139_4006309_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|194aa|down_9|NZ_CP019961.1_4006543_4007125_-	PRK10543, PRK10543, superoxide dismutase [Fe]
GCF_003031225.1_ASM303122v1	NZ_CP019961	Escherichia coli strain HKUOPY1 chromosome, complete genome	9	4648760-4648851	9	CRISPRCasFinder	no		RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	Orphan	CCACCTTTTTTACCTGCTTCAGATGC	26	0	0	NA	NA	NA	1	1	Orphan	RT,DinG,DEDDh,cas3,csa3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4	NA|70aa|up_9|NZ_CP019961.1_4637835_4638045_-,NA	NA|70aa|up_9|NZ_CP019961.1_4637835_4638045_-	NA	NA|1321aa|up_8|NZ_CP019961.1_4638099_4642062_+	PRK11809, putA, trifunctional transcriptional regulator/proline dehydrogenase/pyrroline-5-carboxylate dehydrogenase; Reviewed	NA|213aa|up_7|NZ_CP019961.1_4642101_4642740_-	PRK15008, PRK15008, HTH-type transcriptional regulator RutR; Provisional	NA|364aa|up_6|NZ_CP019961.1_4643027_4644119_+	TIGR03612, RutA, pyrimidine utilization protein A	NA|231aa|up_5|NZ_CP019961.1_4644118_4644811_+	TIGR03614, RutB, pyrimidine utilization protein B	NA|129aa|up_4|NZ_CP019961.1_4644822_4645209_+	TIGR03610, RutC, pyrimidine utilization protein C	NA|267aa|up_3|NZ_CP019961.1_4645216_4646017_+	TIGR03611, RutD, pyrimidine utilization protein D	NA|197aa|up_2|NZ_CP019961.1_4646026_4646617_+	PRK05365, PRK05365, malonic semialdehyde reductase; Provisional	NA|165aa|up_1|NZ_CP019961.1_4646627_4647122_+	TIGR03615, flavoprotein_oxidoreductase, pyrimidine utilization flavin reductase protein F	NA|443aa|up_0|NZ_CP019961.1_4647142_4648471_+	TIGR03616, Putative_pyrimidine_permease_RutG, pyrimidine utilization transport protein G	NA|199aa|down_0|NZ_CP019961.1_4649274_4649871_+	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|76aa|down_1|NZ_CP019961.1_4649891_4650119_+	PRK10174, PRK10174, hypothetical protein; Provisional	NA|414aa|down_2|NZ_CP019961.1_4650156_4651398_-	PRK10173, PRK10173, glucose-1-phosphatase/inositol phosphatase; Provisional	NA|83aa|down_3|NZ_CP019961.1_4651690_4651939_-	PRK09784, PRK09784, YccE family protein	NA|295aa|down_4|NZ_CP019961.1_4652056_4652941_-	PRK09784, PRK09784, YccE family protein	NA|307aa|down_5|NZ_CP019961.1_4653201_4654122_+	PRK10266, PRK10266, curved DNA-binding protein	NA|102aa|down_6|NZ_CP019961.1_4654121_4654427_+	PRK10265, PRK10265, chaperone modulator CbpM	NA|200aa|down_7|NZ_CP019961.1_4654578_4655178_-	PRK04976, torD, chaperone protein TorD; Validated	NA|849aa|down_8|NZ_CP019961.1_4655174_4657721_-	PRK15102, PRK15102, trimethylamine-N-oxide reductase TorA	NA|391aa|down_9|NZ_CP019961.1_4657720_4658893_-	PRK15032, PRK15032, pentaheme c-type cytochrome TorC
