assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_003018095.1_ASM301809v1	NZ_CP027452	Escherichia coli strain 2014C-3338 chromosome, complete genome	1	173657-173748	1	CRISPRCasFinder	no		cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	Orphan	CCACCTTTTTTACCTGCTTCAGATGC	26	0	0	NA	NA	NA	1	1	Orphan	cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	NA|70aa|up_8|NZ_CP027452.1_162907_163117_-,NA	NA|503aa|up_9|NZ_CP027452.1_161240_162749_-	PRK15419, PRK15419, sodium/proline symporter PutP	NA|70aa|up_8|NZ_CP027452.1_162907_163117_-	NA	NA|1321aa|up_7|NZ_CP027452.1_163171_167134_+	PRK11809, putA, trifunctional transcriptional regulator/proline dehydrogenase/pyrroline-5-carboxylate dehydrogenase; Reviewed	NA|213aa|up_6|NZ_CP027452.1_167173_167812_-	PRK15008, PRK15008, HTH-type transcriptional regulator RutR; Provisional	NA|364aa|up_5|NZ_CP027452.1_168099_169191_+	TIGR03612, RutA, pyrimidine utilization protein A	NA|231aa|up_4|NZ_CP027452.1_169190_169883_+	TIGR03614, RutB, pyrimidine utilization protein B	NA|129aa|up_3|NZ_CP027452.1_169894_170281_+	TIGR03610, RutC, pyrimidine utilization protein C	NA|271aa|up_2|NZ_CP027452.1_170288_171101_+	TIGR03611, RutD, pyrimidine utilization protein D	NA|165aa|up_1|NZ_CP027452.1_171699_172194_+	TIGR03615, flavoprotein_oxidoreductase, pyrimidine utilization flavin reductase protein F	NA|443aa|up_0|NZ_CP027452.1_172214_173543_+	TIGR03616, Putative_pyrimidine_permease_RutG, pyrimidine utilization transport protein G	NA|199aa|down_0|NZ_CP027452.1_174171_174768_+	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|76aa|down_1|NZ_CP027452.1_174788_175016_+	PRK10174, PRK10174, hypothetical protein; Provisional	NA|414aa|down_2|NZ_CP027452.1_175053_176295_-	PRK10173, PRK10173, glucose-1-phosphatase/inositol phosphatase; Provisional	NA|307aa|down_3|NZ_CP027452.1_176829_177750_+	PRK10266, PRK10266, curved DNA-binding protein	NA|102aa|down_4|NZ_CP027452.1_177749_178055_+	PRK10265, PRK10265, chaperone modulator CbpM	NA|200aa|down_5|NZ_CP027452.1_178410_179010_-	PRK04976, torD, chaperone protein TorD; Validated	NA|849aa|down_6|NZ_CP027452.1_179006_181553_-	PRK15102, PRK15102, trimethylamine-N-oxide reductase TorA	NA|391aa|down_7|NZ_CP027452.1_181552_182725_-	PRK15032, PRK15032, pentaheme c-type cytochrome TorC	NA|231aa|down_8|NZ_CP027452.1_182854_183547_+	PRK10766, PRK10766, two-component system response regulator TorR	NA|343aa|down_9|NZ_CP027452.1_183519_184548_-	PRK10936, PRK10936, TMAO reductase system periplasmic protein TorT; Provisional
GCF_003018095.1_ASM301809v1	NZ_CP027452	Escherichia coli strain 2014C-3338 chromosome, complete genome	2	675976-676088	1	PILER-CR	no		cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	Orphan	TTTTCTTACCTGATTCGGGTAAA	23	0	0	NA	NA	NA	2	2	Orphan	cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	NA|34aa|up_7|NZ_CP027452.1_670565_670667_-,NA|310aa|up_6|NZ_CP027452.1_670765_671695_-,NA|36aa|up_3|NZ_CP027452.1_673912_674020_-,NA|101aa|up_1|NZ_CP027452.1_674511_674814_-,NA|94aa|down_9|NZ_CP027452.1_681153_681435_+	NA|57aa|up_9|NZ_CP027452.1_669943_670114_-	PRK09689, PRK09689, prophage protein NinE; Provisional	NA|152aa|up_8|NZ_CP027452.1_670113_670569_-	PRK09741, PRK09741, hypothetical protein; Provisional	NA|34aa|up_7|NZ_CP027452.1_670565_670667_-	NA	NA|310aa|up_6|NZ_CP027452.1_670765_671695_-	NA	NA|106aa|up_5|NZ_CP027452.1_671899_672217_-	pfam10548, P22_AR_C, P22AR C-terminal domain	NA|509aa|up_4|NZ_CP027452.1_672328_673855_-	cd00338, Ser_Recombinase, Serine Recombinase family, catalytic domain; a DNA binding domain may be present either N- or C-terminal to the catalytic domain	NA|36aa|up_3|NZ_CP027452.1_673912_674020_-	NA	NA|111aa|up_2|NZ_CP027452.1_674111_674444_-	PRK09541, emrE, EmrE family multidrug efflux SMR transporter	NA|101aa|up_1|NZ_CP027452.1_674511_674814_-	NA	NA|234aa|up_0|NZ_CP027452.1_674810_675512_-	pfam06992, Phage_lambda_P, Replication protein P	NA|180aa|down_0|NZ_CP027452.1_676524_677064_-	pfam06254, YdaT_toxin, Putative bacterial toxin ydaT	NA|77aa|down_1|NZ_CP027452.1_677133_677364_-	pfam15943, YdaS_antitoxin, Putative antitoxin of bacterial toxin-antitoxin system, YdaS/YdaT	NA|230aa|down_2|NZ_CP027452.1_677468_678158_+	COG2932, COG2932, Predicted transcriptional regulator [Transcription]	NA|97aa|down_3|NZ_CP027452.1_678669_678960_+	PRK11354, kil, FtsZ inhibitor protein; Reviewed	NA|99aa|down_4|NZ_CP027452.1_679035_679332_+	pfam06064, Gam, Host-nuclease inhibitor protein Gam	NA|262aa|down_5|NZ_CP027452.1_679337_680123_+	TIGR01913, Uncharacterized_protein_UU154, phage recombination protein Bet	NA|227aa|down_6|NZ_CP027452.1_680119_680800_+	pfam09588, YqaJ, YqaJ-like viral recombinase domain	NA|61aa|down_7|NZ_CP027452.1_680796_680979_+	pfam07026, DUF1317, Protein of unknown function (DUF1317)	NA|64aa|down_8|NZ_CP027452.1_680951_681143_+	pfam07131, DUF1382, Protein of unknown function (DUF1382)	NA|94aa|down_9|NZ_CP027452.1_681153_681435_+	NA
GCF_003018095.1_ASM301809v1	NZ_CP027452	Escherichia coli strain 2014C-3338 chromosome, complete genome	3	3132313-3132768	2,2,1,3	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3	cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	Unclear	GAGTTCCCCACGTCAGCGGGGATAAACCG,GAGTTCCCCACGTCAGCGGGGATAAACCG,GAGTTCCCCNCGNCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29,29	0	0	NA	NA	I-E:I-E:I-E:I-E	6,7,7,6	7	Unclear	cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	NA,NA	NA|150aa|up_9|NZ_CP027452.1_3114371_3114821_+	PRK08105, PRK08105, flavodoxin; Provisional	NA|451aa|up_8|NZ_CP027452.1_3115255_3116608_+	TIGR00893, Probable_glucarate_transporter, D-galactonate transporter	NA|447aa|up_7|NZ_CP027452.1_3116609_3117950_+	TIGR03247, glucar-dehydr, glucarate dehydratase	NA|447aa|up_6|NZ_CP027452.1_3117970_3119311_+	TIGR03247, glucar-dehydr, glucarate dehydratase	NA|434aa|up_5|NZ_CP027452.1_3122353_3123655_+	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|745aa|up_4|NZ_CP027452.1_3123702_3125937_+	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|264aa|up_3|NZ_CP027452.1_3126032_3126824_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_2|NZ_CP027452.1_3127051_3128689_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_1|NZ_CP027452.1_3128775_3130074_+	PRK00077, eno, enolase; Provisional	NA|224aa|up_0|NZ_CP027452.1_3131301_3131973_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|493aa|down_0|NZ_CP027452.1_3133405_3134884_-	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|426aa|down_1|NZ_CP027452.1_3134910_3136188_-	cd06174, MFS, Major Facilitator Superfamily	NA|262aa|down_2|NZ_CP027452.1_3136506_3137292_+	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|485aa|down_3|NZ_CP027452.1_3137361_3138816_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|446aa|down_4|NZ_CP027452.1_3138909_3140247_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|260aa|down_5|NZ_CP027452.1_3140224_3141004_+	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|287aa|down_6|NZ_CP027452.1_3141000_3141861_+	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|192aa|down_7|NZ_CP027452.1_3142007_3142583_-	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|87aa|down_8|NZ_CP027452.1_3142599_3142860_-	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|424aa|down_9|NZ_CP027452.1_3142850_3144122_-	PRK10015, PRK10015, oxidoreductase; Provisional
GCF_003018095.1_ASM301809v1	NZ_CP027452	Escherichia coli strain 2014C-3338 chromosome, complete genome	4	3158469-3159534	4,3,2	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	Type I-E	GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	17,17,17	17	TypeI-E	cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	NA,NA	NA|571aa|up_9|NZ_CP027452.1_3146679_3148392_+	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit	NA|51aa|up_8|NZ_CP027452.1_3149462_3149615_+	pfam01848, HOK_GEF, Hok/gef family	cas3|886aa|up_7|NZ_CP027452.1_3149852_3152510_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas8e|521aa|up_6|NZ_CP027452.1_3152607_3154170_+	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cse2gr11|179aa|up_5|NZ_CP027452.1_3154166_3154703_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|352aa|up_4|NZ_CP027452.1_3154717_3155773_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|249aa|up_3|NZ_CP027452.1_3155783_3156530_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|217aa|up_2|NZ_CP027452.1_3156511_3157162_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas1|308aa|up_1|NZ_CP027452.1_3157158_3158082_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|98aa|up_0|NZ_CP027452.1_3158078_3158372_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|346aa|down_0|NZ_CP027452.1_3159615_3160653_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|NZ_CP027452.1_3160904_3161813_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|476aa|down_2|NZ_CP027452.1_3161814_3163242_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|NZ_CP027452.1_3163241_3163847_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|108aa|down_4|NZ_CP027452.1_3163896_3164220_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|NZ_CP027452.1_3164413_3164725_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|NZ_CP027452.1_3164743_3165454_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|NZ_CP027452.1_3165453_3165933_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|NZ_CP027452.1_3165929_3166979_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|NZ_CP027452.1_3166959_3167721_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCF_003018095.1_ASM301809v1	NZ_CP027452	Escherichia coli strain 2014C-3338 chromosome, complete genome	5	3743686-3743781	4	CRISPRCasFinder	no		cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	Orphan	GCGTTTTATCCGGCCTACAATGAG	24	0	0	NA	NA	NA	1	1	Orphan	cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	NA,NA	NA|294aa|up_9|NZ_CP027452.1_3730753_3731635_+	PRK10837, PRK10837, putative DNA-binding transcriptional regulator; Provisional	NA|490aa|up_8|NZ_CP027452.1_3731839_3733309_+	PRK10836, PRK10836, lysine transporter; Provisional	NA|660aa|up_7|NZ_CP027452.1_3733601_3735581_+	PRK10064, PRK10064, catecholate siderophore receptor CirA; Provisional	NA|279aa|up_6|NZ_CP027452.1_3735612_3736449_-	PLN02442, PLN02442, S-formylglutathione hydrolase	NA|223aa|up_5|NZ_CP027452.1_3736706_3737375_+	TIGR00063, GTP_cyclohydrolase_1, GTP cyclohydrolase I	NA|386aa|up_4|NZ_CP027452.1_3737391_3738549_+	PRK10835, PRK10835, hypothetical protein; Provisional	NA|347aa|up_3|NZ_CP027452.1_3738690_3739731_+	PRK10401, PRK10401, HTH-type transcriptional regulator GalS	NA|333aa|up_2|NZ_CP027452.1_3740010_3741009_+	PRK15395, PRK15395, galactose/glucose ABC transporter substrate-binding protein MglB	NA|507aa|up_1|NZ_CP027452.1_3741069_3742590_+	PRK10982, PRK10982, galactose/methyl galaxtoside transporter ATP-binding protein; Provisional	NA|337aa|up_0|NZ_CP027452.1_3742605_3743616_+	PRK09478, mglC, galactose/methyl galactoside ABC transporter permease MglC	NA|412aa|down_0|NZ_CP027452.1_3743874_3745110_-	PRK08318, PRK08318, NAD-dependent dihydropyrimidine dehydrogenase subunit PreA	NA|413aa|down_1|NZ_CP027452.1_3745103_3746342_-	PRK11749, PRK11749, dihydropyrimidine dehydrogenase subunit A; Provisional	NA|240aa|down_2|NZ_CP027452.1_3746903_3747623_-	PRK10834, PRK10834, outer membrane permeability protein SanA	NA|295aa|down_3|NZ_CP027452.1_3747772_3748657_-	PRK09027, PRK09027, cytidine deaminase; Provisional	NA|232aa|down_4|NZ_CP027452.1_3748786_3749482_-	PRK10711, PRK10711, hypothetical protein; Provisional	NA|133aa|down_5|NZ_CP027452.1_3749478_3749877_-	PRK01821, PRK01821, hypothetical protein; Provisional	NA|303aa|down_6|NZ_CP027452.1_3750007_3750916_-	TIGR02424, TF_pcaQ, pca operon transcription factor PcaQ	NA|453aa|down_7|NZ_CP027452.1_3751042_3752401_+	TIGR00895, transport_protein, benzoate transport	NA|343aa|down_8|NZ_CP027452.1_3752412_3753441_+	TIGR02272, gentisate_12-dioxygenase, gentisate 1,2-dioxygenase	NA|234aa|down_9|NZ_CP027452.1_3753456_3754158_+	COG0179, MhpD, 2-keto-4-pentenoate hydratase/2-oxohepta-3-ene-1,7-dioic acid hydratase (catechol pathway) [Secondary metabolites biosynthesis, transport, and catabolism]
GCF_003018095.1_ASM301809v1	NZ_CP027452	Escherichia coli strain 2014C-3338 chromosome, complete genome	6	4222868-4222991	5	CRISPRCasFinder	no	DEDDh	cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	cas3,DinG,DEDDh,WYL,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	NA,NA|30aa|down_7|NZ_CP027452.1_4231887_4231977_+	NA|471aa|up_9|NZ_CP027452.1_4212321_4213734_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|NZ_CP027452.1_4214290_4214500_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|NZ_CP027452.1_4214955_4215582_+	PRK09898, PRK09898, ferredoxin-like protein	NA|701aa|up_6|NZ_CP027452.1_4215602_4217705_+	PRK09849, PRK09849, putative oxidoreductase; Provisional	NA|216aa|up_5|NZ_CP027452.1_4217708_4218356_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|NZ_CP027452.1_4218419_4219088_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|NZ_CP027452.1_4219084_4219870_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|271aa|up_2|NZ_CP027452.1_4219873_4220686_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|537aa|up_1|NZ_CP027452.1_4220691_4222302_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|102aa|up_0|NZ_CP027452.1_4222427_4222733_-	PRK11118, PRK11118, putative monooxygenase; Provisional	NA|419aa|down_0|NZ_CP027452.1_4223306_4224563_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|NZ_CP027452.1_4224603_4225977_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|210aa|down_2|NZ_CP027452.1_4226202_4226832_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|NZ_CP027452.1_4226871_4228020_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|NZ_CP027452.1_4228310_4229522_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|NZ_CP027452.1_4229634_4230567_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|NZ_CP027452.1_4230563_4231589_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|30aa|down_7|NZ_CP027452.1_4231887_4231977_+	NA	NA|390aa|down_8|NZ_CP027452.1_4232142_4233312_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|194aa|down_9|NZ_CP027452.1_4233457_4234039_-	PRK10543, PRK10543, superoxide dismutase [Fe]
