assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001021595.1_ASM102159v1	NZ_CP007275	Escherichia coli strain O18 chromosome, complete genome	1	3391643-3391844	1	PILER-CR	no		cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	Orphan	GTAGACCGGATAAGGCGTTCACGCCGCATCCGGCAA	36	0	0	NA	NA	NA	2	2	Orphan	cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	NA,NA	NA|252aa|up_9|NZ_CP007275.1_3383192_3383948_+	PRK00216, ubiE, bifunctional demethylmenaquinone methyltransferase/2-methoxy-6-polyprenyl-1,4-benzoquinol methylase UbiE	NA|202aa|up_8|NZ_CP007275.1_3383961_3384567_+	COG3165, COG3165, Uncharacterized protein conserved in bacteria [Function unknown]	NA|547aa|up_7|NZ_CP007275.1_3384563_3386204_+	PRK04750, ubiB, putative ubiquinone biosynthesis protein UbiB; Reviewed	NA|90aa|up_6|NZ_CP007275.1_3386282_3386552_+	PRK03554, tatA, Sec-independent protein translocase subunit TatA	NA|172aa|up_5|NZ_CP007275.1_3386555_3387071_+	PRK01770, PRK01770, Sec-independent protein translocase subunit TatB	NA|259aa|up_4|NZ_CP007275.1_3387073_3387850_+	PRK10921, PRK10921, Sec-independent protein translocase subunit TatC	NA|261aa|up_3|NZ_CP007275.1_3387891_3388674_+	PRK10425, PRK10425, 3'-5' ssDNA/RNA exonuclease TatD	NA|163aa|up_2|NZ_CP007275.1_3388670_3389159_-	PRK09014, rfaH, transcription/translation regulatory transformer protein RfaH	NA|498aa|up_1|NZ_CP007275.1_3389325_3390819_+	PRK10922, PRK10922, 4-hydroxy-3-polyprenylbenzoate decarboxylase	NA|234aa|up_0|NZ_CP007275.1_3390864_3391566_+	PRK08051, fre, FMN reductase; Validated	NA|388aa|down_0|NZ_CP007275.1_3391848_3393012_-	PRK08947, fadA, 3-ketoacyl-CoA thiolase; Reviewed	NA|730aa|down_1|NZ_CP007275.1_3393021_3395211_-	PRK11730, fadB, fatty acid oxidation complex subunit alpha FadB	NA|444aa|down_2|NZ_CP007275.1_3395400_3396732_+	PRK13607, PRK13607, proline dipeptidase; Provisional	NA|205aa|down_3|NZ_CP007275.1_3396731_3397346_+	PRK11568, PRK11568, IMPACT family protein	NA|484aa|down_4|NZ_CP007275.1_3397384_3398836_+	PRK10750, PRK10750, Trk system potassium transporter TrkH	NA|182aa|down_5|NZ_CP007275.1_3398847_3399393_+	PRK11104, hemG, menaquinone-dependent protoporphyrinogen IX dehydrogenase	NA|176aa|down_6|NZ_CP007275.1_3404883_3405411_-	PRK10751, PRK10751, molybdopterin-guanine dinucleotide biosynthesis protein B; Provisional	NA|195aa|down_7|NZ_CP007275.1_3405392_3405977_-	PRK00317, mobA, molybdopterin-guanine dinucleotide biosynthesis protein MobA; Reviewed	NA|90aa|down_8|NZ_CP007275.1_3406046_3406316_+	pfam06288, DUF1040, Protein of unknown function (DUF1040)	NA|329aa|down_9|NZ_CP007275.1_3406392_3407379_+	PRK11768, PRK11768, serine/threonine protein kinase
GCF_001021595.1_ASM102159v1	NZ_CP007275	Escherichia coli strain O18 chromosome, complete genome	2	3672632-3672759	1	CRISPRCasFinder	no		cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	Orphan	GCCTGATGCGACGCTGTCGCGTCTTATCAGGCCTACA	37	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	NA,NA	NA|529aa|up_9|NZ_CP007275.1_3662227_3663814_+	COG4943, COG4943, Predicted signal transduction protein containing sensor and EAL domains [Signal transduction mechanisms]	NA|108aa|up_8|NZ_CP007275.1_3663816_3664140_-	PRK10219, PRK10219, superoxide response transcriptional regulator SoxS	NA|155aa|up_7|NZ_CP007275.1_3664225_3664690_+	PRK15002, PRK15002, redox-sensitive transcriptional activator SoxR	NA|450aa|up_6|NZ_CP007275.1_3665236_3666586_+	COG2252, COG2252, Xanthine/uracil/vitamin C permease [Nucleotide transport and    metabolism]	NA|550aa|up_5|NZ_CP007275.1_3666736_3668386_+	TIGR00831, Putative_Na+/H+_exchanger_Rv2287/MT2345/Mb2309	NA|295aa|up_4|NZ_CP007275.1_3668421_3669306_-	cd08438, PBP2_CidR, The C-terminal substrate binding domain of LysR-like transcriptional regulator CidR, contains the type 2 periplasmic binding fold	NA|137aa|up_3|NZ_CP007275.1_3669409_3669820_+	COG1380, COG1380, Putative effector of murein hydrolase LrgA [General function prediction only]	NA|230aa|up_2|NZ_CP007275.1_3669812_3670502_+	COG1346, LrgB, Putative effector of murein hydrolase [Cell envelope biogenesis, outer membrane]	NA|550aa|up_1|NZ_CP007275.1_3670540_3672190_-	PRK09395, actP, cation/acetate symporter ActP	NA|105aa|up_0|NZ_CP007275.1_3672186_3672501_-	COG3162, COG3162, Predicted membrane protein [Function unknown]	NA|653aa|down_0|NZ_CP007275.1_3672792_3674751_-	PRK00174, PRK00174, acetyl-CoA synthetase; Provisional	NA|479aa|down_1|NZ_CP007275.1_3675142_3676579_+	PRK11125, nrfA, ammonia-forming cytochrome c nitrite reductase	NA|189aa|down_2|NZ_CP007275.1_3676623_3677190_+	PRK11659, PRK11659, cytochrome c nitrite reductase pentaheme subunit; Provisional	NA|224aa|down_3|NZ_CP007275.1_3677186_3677858_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|319aa|down_4|NZ_CP007275.1_3677854_3678811_+	TIGR03148, cyt_nit_nrfD, cytochrome c nitrite reductase, NrfD subunit	NA|573aa|down_5|NZ_CP007275.1_3678830_3680549_+	PRK10369, PRK10369, heme lyase subunit NrfE; Provisional	NA|128aa|down_6|NZ_CP007275.1_3680541_3680925_+	PRK10144, PRK10144, formate-dependent nitrite reductase complex subunit NrfF; Provisional	NA|199aa|down_7|NZ_CP007275.1_3680921_3681518_+	PRK10370, PRK10370, formate-dependent nitrite reductase complex subunit NrfG; Provisional	NA|438aa|down_8|NZ_CP007275.1_3681860_3683174_+	PRK11283, gltP, glutamate/aspartate:proton symporter; Provisional	NA|230aa|down_9|NZ_CP007275.1_3683321_3684011_-	COG0790, COG0790, FOG: TPR repeat, SEL1 subfamily [General function prediction only]
GCF_001021595.1_ASM102159v1	NZ_CP007275	Escherichia coli strain O18 chromosome, complete genome	3	3883085-3883224	2	CRISPRCasFinder	no		cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	Orphan	TGTGTAGGTCGGATAAGGCGTTCACGTCGCATCCGACAATAACA	44	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	NA,NA	NA|335aa|up_9|NZ_CP007275.1_3871629_3872634_-	PRK02102, PRK02102, ornithine carbamoyltransferase; Validated	NA|315aa|up_8|NZ_CP007275.1_3872644_3873589_-	PRK12354, PRK12354, carbamate kinase; Reviewed	NA|407aa|up_7|NZ_CP007275.1_3873599_3874820_-	PRK01388, PRK01388, arginine deiminase; Provisional	NA|151aa|up_6|NZ_CP007275.1_3875497_3875950_+	COG2731, EbgC, Beta-galactosidase, beta subunit [Carbohydrate transport and metabolism]	NA|335aa|up_5|NZ_CP007275.1_3875995_3877000_-	PRK03515, PRK03515, ornithine carbamoyltransferase subunit I; Provisional	NA|139aa|up_4|NZ_CP007275.1_3877161_3877578_+	PRK11191, PRK11191, ribonuclease E inhibitor RraB	NA|168aa|up_3|NZ_CP007275.1_3877754_3878258_-	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|396aa|up_2|NZ_CP007275.1_3878450_3879638_+	COG4269, COG4269, Predicted membrane protein [Function unknown]	NA|952aa|up_1|NZ_CP007275.1_3879684_3882540_-	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|148aa|up_0|NZ_CP007275.1_3882539_3882983_-	PRK05728, PRK05728, DNA polymerase III subunit chi; Validated	NA|504aa|down_0|NZ_CP007275.1_3883240_3884752_-	PRK00913, PRK00913, multifunctional aminopeptidase A; Provisional	NA|367aa|down_1|NZ_CP007275.1_3885018_3886119_+	PRK15120, PRK15120, lipopolysaccharide ABC transporter permease LptF; Provisional	NA|361aa|down_2|NZ_CP007275.1_3886118_3887201_+	PRK15071, PRK15071, lipopolysaccharide ABC transporter permease; Provisional	NA|501aa|down_3|NZ_CP007275.1_3887361_3888864_-	pfam05872, DUF853, Bacterial protein of unknown function (DUF853)	NA|333aa|down_4|NZ_CP007275.1_3888941_3889940_-	cd01575, PBP1_GntR, ligand-binding domain of DNA transcription repressor GntR specific for gluconate, a member of the LacI-GalR family of bacterial transcription regulators	NA|440aa|down_5|NZ_CP007275.1_3890006_3891326_-	TIGR00791, Gluconate_permease, gluconate transporter	NA|255aa|down_6|NZ_CP007275.1_3891390_3892155_-	PRK08085, PRK08085, gluconate 5-dehydrogenase; Provisional	NA|344aa|down_7|NZ_CP007275.1_3892178_3893210_-	PRK09880, PRK09880, L-idonate 5-dehydrogenase; Provisional	NA|188aa|down_8|NZ_CP007275.1_3893426_3893990_+	PRK09825, idnK, gluconokinase	NA|340aa|down_9|NZ_CP007275.1_3893993_3895013_-	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)
GCF_001021595.1_ASM102159v1	NZ_CP007275	Escherichia coli strain O18 chromosome, complete genome	4	4790473-4790603	3	CRISPRCasFinder	no		cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	Orphan	AGGCCTGATAAGACGCGCAAGCGTCGCATCAGGCAA	36	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	NA|125aa|up_6|NZ_CP007275.1_4784725_4785100_-,NA|36aa|up_4|NZ_CP007275.1_4786736_4786844_-,NA	NA|245aa|up_9|NZ_CP007275.1_4781969_4782704_+	cd10800, LamB_YcsF_YbgL_like, Escherichia coli putative lactam utilization protein YbgL and similar proteins	NA|264aa|up_8|NZ_CP007275.1_4782739_4783531_+	PRK10445, PRK10445, endonuclease VIII; Provisional	NA|349aa|up_7|NZ_CP007275.1_4783527_4784574_-	COG3180, AbrB, Putative ammonia monooxygenase [General function prediction only]	NA|125aa|up_6|NZ_CP007275.1_4784725_4785100_-	NA	NA|428aa|up_5|NZ_CP007275.1_4785247_4786531_-	PRK05614, gltA, citrate synthase	NA|36aa|up_4|NZ_CP007275.1_4786736_4786844_-	NA	NA|135aa|up_3|NZ_CP007275.1_4787224_4787629_+	PRK09487, sdhC, succinate dehydrogenase cytochrome b556 subunit	NA|116aa|up_2|NZ_CP007275.1_4787622_4787970_+	PRK09488, sdhD, succinate dehydrogenase membrane anchor subunit	NA|589aa|up_1|NZ_CP007275.1_4787969_4789736_+	PRK08958, sdhA, succinate dehydrogenase flavoprotein subunit; Reviewed	NA|239aa|up_0|NZ_CP007275.1_4789751_4790468_+	PRK05950, sdhB, succinate dehydrogenase iron-sulfur subunit; Reviewed	NA|934aa|down_0|NZ_CP007275.1_4790828_4793630_+	PRK09404, sucA, 2-oxoglutarate dehydrogenase E1 component; Reviewed	NA|406aa|down_1|NZ_CP007275.1_4793644_4794862_+	PRK05704, PRK05704, 2-oxoglutarate dehydrogenase complex dihydrolipoyllysine-residue succinyltransferase	NA|389aa|down_2|NZ_CP007275.1_4794955_4796122_+	PRK00696, sucC, ADP-forming succinate--CoA ligase subunit beta	NA|290aa|down_3|NZ_CP007275.1_4796121_4796991_+	PRK05678, PRK05678, succinyl-CoA synthetase subunit alpha; Validated	NA|372aa|down_4|NZ_CP007275.1_4797230_4798346_+	sd00006, TPR, Tetratricopeptide repeat	NA|523aa|down_5|NZ_CP007275.1_4799675_4801244_+	PRK15097, PRK15097, cytochrome bd-I ubiquinol oxidase subunit CydA	NA|380aa|down_6|NZ_CP007275.1_4801259_4802399_+	PRK15003, PRK15003, cytochrome d ubiquinol oxidase subunit II	NA|38aa|down_7|NZ_CP007275.1_4802413_4802527_+	COG4890, COG4890, Predicted outer membrane lipoprotein [Function unknown]	NA|98aa|down_8|NZ_CP007275.1_4802526_4802820_+	PRK10588, PRK10588, hypothetical protein; Provisional	NA|135aa|down_9|NZ_CP007275.1_4802968_4803373_+	PRK10800, PRK10800, acyl-CoA thioesterase YbgC; Provisional
GCF_001021595.1_ASM102159v1	NZ_CP007275	Escherichia coli strain O18 chromosome, complete genome	5	4961160-4961727	2,4,1	PILER-CR,CRISPRCasFinder,CRT	no	cas1,cas3f,cas8f,cas7f,cas6f	cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	Type I-F	GTTCACTGCCGTACAGGCAGCTTAGAAA,GTTCACTGCCGTACAGGCAGCTTAGAAA,GTTCACTGCCGTACAGGCAGCTTAGAAA	28,28,28	0	0	NA	NA	I-F:I-F:I-F	8,9,9	9	TypeI-F	cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	NA|69aa|up_8|NZ_CP007275.1_4954304_4954511_+,NA|138aa|up_5|NZ_CP007275.1_4955925_4956339_+,NA|94aa|up_3|NZ_CP007275.1_4957345_4957627_+,NA|87aa|up_2|NZ_CP007275.1_4957776_4958037_-,NA	NA|141aa|up_9|NZ_CP007275.1_4953466_4953889_+	cd04496, SSB_OBF, SSB_OBF: A subfamily of OB folds similar to the OB fold of ssDNA-binding protein (SSB)	NA|69aa|up_8|NZ_CP007275.1_4954304_4954511_+	NA	NA|352aa|up_7|NZ_CP007275.1_4954510_4955566_+	pfam03864, Phage_cap_E, Phage major capsid protein E	NA|112aa|up_6|NZ_CP007275.1_4955577_4955913_+	pfam02924, HDPD, Bacteriophage lambda head decoration protein D	NA|138aa|up_5|NZ_CP007275.1_4955925_4956339_+	NA	NA|181aa|up_4|NZ_CP007275.1_4956546_4957089_+	COG4220, COG4220, Phage DNA packaging protein, Nu1 subunit of terminase [DNA replication, recombination, and repair]	NA|94aa|up_3|NZ_CP007275.1_4957345_4957627_+	NA	NA|87aa|up_2|NZ_CP007275.1_4957776_4958037_-	NA	NA|107aa|up_1|NZ_CP007275.1_4958319_4958640_+	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|759aa|up_0|NZ_CP007275.1_4958670_4960947_+	PRK11034, clpA, ATP-dependent Clp protease ATP-binding subunit; Provisional	cas1|328aa|down_0|NZ_CP007275.1_4961899_4962883_+	TIGR03637, cas1_YPEST, CRISPR-associated endonuclease Cas1, subtype I-F/YPEST	cas3f|1078aa|down_1|NZ_CP007275.1_4962879_4966113_+	TIGR02562, conserved_hypothetical_protein, CRISPR-associated helicase Cas3, subtype I-F/YPEST	cas8f|436aa|down_2|NZ_CP007275.1_4966442_4967750_+	cd09735, Csy1_I-F, CRISPR/Cas system-associated protein Csy1	cas7f|334aa|down_3|NZ_CP007275.1_4968680_4969682_+	pfam09615, Cas_Csy3, CRISPR-associated protein (Cas_Csy3)	cas6f|185aa|down_4|NZ_CP007275.1_4969692_4970247_+	cd09739, Cas6_I-F, CRISPR/Cas system-associated RAMP superfamily protein Cas6f	NA|73aa|down_5|NZ_CP007275.1_4971288_4971507_-	PRK00276, infA, translation initiation factor IF-1; Validated	NA|235aa|down_6|NZ_CP007275.1_4971791_4972496_-	PRK00301, aat, leucyl/phenylalanyl-tRNA--protein transferase; Reviewed	NA|574aa|down_7|NZ_CP007275.1_4972537_4974259_-	PRK11160, PRK11160, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|589aa|down_8|NZ_CP007275.1_4974259_4976026_-	PRK11174, PRK11174, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|322aa|down_9|NZ_CP007275.1_4976148_4977114_-	PRK10262, PRK10262, thioredoxin reductase; Provisional
GCF_001021595.1_ASM102159v1	NZ_CP007275	Escherichia coli strain O18 chromosome, complete genome	6	4970788-4971176	3,5,2	PILER-CR,CRISPRCasFinder,CRT	no	cas1,cas3f,cas8f,cas7f,cas6f	cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	Type I-F	GTTCACTGCCGTACAGGCAGCTTAGAAA,GTTCACTGCCGTACAGGCAGCTTAGAAA,GTTCACTGCCGTACAGGCAGCTTAGAAA	28,28,28	0	0	NA	NA	I-F:I-F:I-F	5,6,6	6	TypeI-F	cas3,DEDDh,DinG,csa3,cas1,cas3f,cas8f,cas7f,cas6f	NA|94aa|up_8|NZ_CP007275.1_4957345_4957627_+,NA|87aa|up_7|NZ_CP007275.1_4957776_4958037_-,NA	NA|181aa|up_9|NZ_CP007275.1_4956546_4957089_+	COG4220, COG4220, Phage DNA packaging protein, Nu1 subunit of terminase [DNA replication, recombination, and repair]	NA|94aa|up_8|NZ_CP007275.1_4957345_4957627_+	NA	NA|87aa|up_7|NZ_CP007275.1_4957776_4958037_-	NA	NA|107aa|up_6|NZ_CP007275.1_4958319_4958640_+	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|759aa|up_5|NZ_CP007275.1_4958670_4960947_+	PRK11034, clpA, ATP-dependent Clp protease ATP-binding subunit; Provisional	cas1|328aa|up_4|NZ_CP007275.1_4961899_4962883_+	TIGR03637, cas1_YPEST, CRISPR-associated endonuclease Cas1, subtype I-F/YPEST	cas3f|1078aa|up_3|NZ_CP007275.1_4962879_4966113_+	TIGR02562, conserved_hypothetical_protein, CRISPR-associated helicase Cas3, subtype I-F/YPEST	cas8f|436aa|up_2|NZ_CP007275.1_4966442_4967750_+	cd09735, Csy1_I-F, CRISPR/Cas system-associated protein Csy1	cas7f|334aa|up_1|NZ_CP007275.1_4968680_4969682_+	pfam09615, Cas_Csy3, CRISPR-associated protein (Cas_Csy3)	cas6f|185aa|up_0|NZ_CP007275.1_4969692_4970247_+	cd09739, Cas6_I-F, CRISPR/Cas system-associated RAMP superfamily protein Cas6f	NA|73aa|down_0|NZ_CP007275.1_4971288_4971507_-	PRK00276, infA, translation initiation factor IF-1; Validated	NA|235aa|down_1|NZ_CP007275.1_4971791_4972496_-	PRK00301, aat, leucyl/phenylalanyl-tRNA--protein transferase; Reviewed	NA|574aa|down_2|NZ_CP007275.1_4972537_4974259_-	PRK11160, PRK11160, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|589aa|down_3|NZ_CP007275.1_4974259_4976026_-	PRK11174, PRK11174, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|322aa|down_4|NZ_CP007275.1_4976148_4977114_-	PRK10262, PRK10262, thioredoxin reductase; Provisional	NA|165aa|down_5|NZ_CP007275.1_4977657_4978152_+	PRK11169, PRK11169, leucine-responsive transcriptional regulator Lrp	NA|1354aa|down_6|NZ_CP007275.1_4978286_4982348_+	PRK10263, PRK10263, DNA translocase FtsK; Provisional	NA|204aa|down_7|NZ_CP007275.1_4982506_4983118_+	TIGR00547, Outer-membrane_lipoprotein_carrier_protein, periplasmic chaperone LolA	NA|448aa|down_8|NZ_CP007275.1_4983128_4984472_+	PRK13342, PRK13342, recombination factor protein RarA; Reviewed	NA|431aa|down_9|NZ_CP007275.1_4984562_4985855_+	PRK05431, PRK05431, seryl-tRNA synthetase; Provisional
