assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_013315715.1_ASM1331571v1	NZ_CP054363	Escherichia coli strain SCU-171 chromosome, complete genome	1	943984-944079	1	CRISPRCasFinder	no		cas3,DEDDh,DinG,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,casR,WYL	Orphan	CTCATTGTAGGCCGGATAAAACGC	24	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,DinG,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,casR,WYL	NA,NA	NA|343aa|up_9|NZ_CP054363.1_934324_935353_-	TIGR02272, gentisate_12-dioxygenase, gentisate 1,2-dioxygenase	NA|453aa|up_8|NZ_CP054363.1_935364_936723_-	TIGR00895, transport_protein, benzoate transport	NA|303aa|up_7|NZ_CP054363.1_936849_937758_+	TIGR02424, TF_pcaQ, pca operon transcription factor PcaQ	NA|133aa|up_6|NZ_CP054363.1_937888_938287_+	PRK01821, PRK01821, hypothetical protein; Provisional	NA|232aa|up_5|NZ_CP054363.1_938283_938979_+	PRK10711, PRK10711, hypothetical protein; Provisional	NA|295aa|up_4|NZ_CP054363.1_939108_939993_+	PRK09027, PRK09027, cytidine deaminase; Provisional	NA|240aa|up_3|NZ_CP054363.1_940142_940862_+	PRK10834, PRK10834, outer membrane permeability protein SanA	NA|80aa|up_2|NZ_CP054363.1_940864_941104_+	pfam10808, DUF2542, Protein of unknown function (DUF2542)	NA|413aa|up_1|NZ_CP054363.1_941422_942661_+	PRK11749, PRK11749, dihydropyrimidine dehydrogenase subunit A; Provisional	NA|412aa|up_0|NZ_CP054363.1_942654_943890_+	PRK08318, PRK08318, NAD-dependent dihydropyrimidine dehydrogenase subunit PreA	NA|337aa|down_0|NZ_CP054363.1_944148_945159_-	PRK09478, mglC, galactose/methyl galactoside ABC transporter permease MglC	NA|507aa|down_1|NZ_CP054363.1_945174_946695_-	PRK10982, PRK10982, galactose/methyl galaxtoside transporter ATP-binding protein; Provisional	NA|333aa|down_2|NZ_CP054363.1_946755_947754_-	PRK15395, PRK15395, galactose/glucose ABC transporter substrate-binding protein MglB	NA|347aa|down_3|NZ_CP054363.1_948033_949074_-	PRK10401, PRK10401, HTH-type transcriptional regulator GalS	NA|386aa|down_4|NZ_CP054363.1_949215_950373_-	PRK10835, PRK10835, hypothetical protein; Provisional	NA|223aa|down_5|NZ_CP054363.1_950389_951058_-	TIGR00063, GTP_cyclohydrolase_1, GTP cyclohydrolase I	NA|279aa|down_6|NZ_CP054363.1_951315_952152_+	PLN02442, PLN02442, S-formylglutathione hydrolase	NA|660aa|down_7|NZ_CP054363.1_952183_954163_-	PRK10064, PRK10064, catecholate siderophore receptor CirA; Provisional	NA|490aa|down_8|NZ_CP054363.1_954455_955925_-	PRK10836, PRK10836, lysine transporter; Provisional	NA|294aa|down_9|NZ_CP054363.1_956129_957011_-	PRK10837, PRK10837, putative DNA-binding transcriptional regulator; Provisional
GCF_013315715.1_ASM1331571v1	NZ_CP054363	Escherichia coli strain SCU-171 chromosome, complete genome	2	1539870-1541424	1,2,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3	cas3,DEDDh,DinG,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,casR,WYL	Type I-E	CCGGTTTATCCCCGCTGGCGCGGGGAACACA,CGGTTTATCCCCGCTGGCGCGGGGAACAC,CGGTTTATCCCCGCTGGCGCGGGGAACAC,CGGTTTATCCCCGCTGGCGCGGGGAACAC	31,29,29,29	0	0	NA	NA	I-E:I-E:I-E:I-E	23,25,25,23	25	TypeI-E	cas3,DEDDh,DinG,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,casR,WYL	NA,NA	NA|254aa|up_9|NZ_CP054363.1_1531683_1532445_-	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional	NA|350aa|up_8|NZ_CP054363.1_1532425_1533475_-	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|160aa|up_7|NZ_CP054363.1_1533471_1533951_-	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|237aa|up_6|NZ_CP054363.1_1533950_1534661_-	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|104aa|up_5|NZ_CP054363.1_1534679_1534991_-	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|108aa|up_4|NZ_CP054363.1_1535184_1535508_-	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|202aa|up_3|NZ_CP054363.1_1535557_1536163_-	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|476aa|up_2|NZ_CP054363.1_1536162_1537590_-	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|303aa|up_1|NZ_CP054363.1_1537591_1538500_-	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|346aa|up_0|NZ_CP054363.1_1538751_1539789_+	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	cas2|98aa|down_0|NZ_CP054363.1_1541520_1541814_-	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	cas1|308aa|down_1|NZ_CP054363.1_1541810_1542734_-	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas6e|217aa|down_2|NZ_CP054363.1_1542730_1543381_-	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas5|249aa|down_3|NZ_CP054363.1_1543362_1544109_-	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|352aa|down_4|NZ_CP054363.1_1544119_1545175_-	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cse2gr11|179aa|down_5|NZ_CP054363.1_1545189_1545726_-	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas8e|521aa|down_6|NZ_CP054363.1_1545722_1547285_-	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cas3|886aa|down_7|NZ_CP054363.1_1547382_1550040_-	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	NA|51aa|down_8|NZ_CP054363.1_1550277_1550430_-	pfam01848, HOK_GEF, Hok/gef family	NA|245aa|down_9|NZ_CP054363.1_1550693_1551428_-	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase
GCF_013315715.1_ASM1331571v1	NZ_CP054363	Escherichia coli strain SCU-171 chromosome, complete genome	3	1567125-1567580	3,2,3,4	CRISPRCasFinder,CRT,PILER-CR,PILER-CR	no	cas3	cas3,DEDDh,DinG,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,casR,WYL	Unclear	CGGTTTATCCCCGCTGACGTGGGGAACTC,CGGTTTATCCCCGCTGNCGNGGGGAACTC,CGGTTTATCCCCGCTGGCGCGGGGAACTC,CGGTTTATCCCCGCTGACGTGGGGAACTC	29,29,29,29	0	0	NA	NA	I-E:I-E:I-E:I-E	7,7,6,6	7	Unclear	cas3,DEDDh,DinG,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,casR,WYL	NA,NA	NA|424aa|up_9|NZ_CP054363.1_1555771_1557043_+	PRK10015, PRK10015, oxidoreductase; Provisional	NA|87aa|up_8|NZ_CP054363.1_1557033_1557294_+	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|192aa|up_7|NZ_CP054363.1_1557310_1557886_+	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|287aa|up_6|NZ_CP054363.1_1558032_1558893_-	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|260aa|up_5|NZ_CP054363.1_1558889_1559669_-	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|470aa|up_4|NZ_CP054363.1_1559646_1561056_-	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|485aa|up_3|NZ_CP054363.1_1561077_1562532_-	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|262aa|up_2|NZ_CP054363.1_1562601_1563387_-	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|426aa|up_1|NZ_CP054363.1_1563704_1564982_+	cd06174, MFS, Major Facilitator Superfamily	NA|493aa|up_0|NZ_CP054363.1_1565008_1566487_+	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|224aa|down_0|NZ_CP054363.1_1567919_1568591_-	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|433aa|down_1|NZ_CP054363.1_1569818_1571117_-	PRK00077, eno, enolase; Provisional	NA|546aa|down_2|NZ_CP054363.1_1571203_1572841_-	PRK05380, pyrG, CTP synthetase; Validated	NA|264aa|down_3|NZ_CP054363.1_1573068_1573860_-	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|745aa|down_4|NZ_CP054363.1_1573955_1576190_-	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|434aa|down_5|NZ_CP054363.1_1576237_1577539_-	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|919aa|down_6|NZ_CP054363.1_1577595_1580352_+	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional	NA|447aa|down_7|NZ_CP054363.1_1580582_1581923_-	TIGR03247, glucar-dehydr, glucarate dehydratase	NA|447aa|down_8|NZ_CP054363.1_1581943_1583284_-	TIGR03247, glucar-dehydr, glucarate dehydratase	NA|451aa|down_9|NZ_CP054363.1_1583285_1584638_-	TIGR00893, Probable_glucarate_transporter, D-galactonate transporter
GCF_013315715.1_ASM1331571v1	NZ_CP054363	Escherichia coli strain SCU-171 chromosome, complete genome	4	4103992-4104136	4	CRISPRCasFinder	no		cas3,DEDDh,DinG,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,casR,WYL	Orphan	TGCCTTAACGGTAGGCCGGATAAGGCGTTCACGCCGCATCCGGC	44	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,DinG,c2c9_V-U4,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,casR,WYL	NA,NA	NA|379aa|up_9|NZ_CP054363.1_4093984_4095121_+	pfam13808, DDE_Tnp_1_assoc, DDE_Tnp_1-associated	NA|257aa|up_8|NZ_CP054363.1_4095190_4095961_-	PRK10438, PRK10438, C-N hydrolase family amidase; Provisional	NA|158aa|up_7|NZ_CP054363.1_4096114_4096588_+	PRK09993, PRK09993, C-lysozyme inhibitor; Provisional	NA|815aa|up_6|NZ_CP054363.1_4096630_4099075_-	PRK09463, fadE, acyl-CoA dehydrogenase; Reviewed	NA|193aa|up_5|NZ_CP054363.1_4099314_4099893_+	PRK00414, gmhA, D-sedoheptulose 7-phosphate isomerase	NA|256aa|up_4|NZ_CP054363.1_4100008_4100776_+	pfam13230, GATase_4, Glutamine amidotransferases class-II	NA|247aa|up_3|NZ_CP054363.1_4100746_4101487_-	COG3034, COG3034, Uncharacterized protein conserved in bacteria [Function unknown]	NA|87aa|up_2|NZ_CP054363.1_4102048_4102309_-	COG3077, RelB, DNA-damage-inducible protein J [DNA replication, recombination, and repair]	NA|258aa|up_1|NZ_CP054363.1_4102494_4103268_+	COG0791, Spr, Cell wall-associated hydrolases (invasion-associated proteins) [Cell envelope biogenesis, outer membrane]	NA|166aa|up_0|NZ_CP054363.1_4103444_4103942_+	COG1943, COG1943, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|580aa|down_0|NZ_CP054363.1_4104159_4105899_-	COG1298, FlhA, Flagellar biosynthesis pathway, component FlhA [Cell motility and secretion / Intracellular trafficking and secretion]	NA|263aa|down_1|NZ_CP054363.1_4105840_4106629_+	PRK06778, PRK06778, hypothetical protein; Validated	NA|352aa|down_2|NZ_CP054363.1_4106699_4107755_+	PRK02406, PRK02406, DNA polymerase IV; Validated	NA|151aa|down_3|NZ_CP054363.1_4107751_4108204_+	PRK09831, PRK09831, GNAT family N-acetyltransferase	NA|89aa|down_4|NZ_CP054363.1_4108382_4108649_+	PRK09588, PRK09588, hypothetical protein; Reviewed	NA|47aa|down_5|NZ_CP054363.1_4108808_4108949_+	PRK08179, prfH, peptide chain release factor-like protein; Reviewed	NA|486aa|down_6|NZ_CP054363.1_4109005_4110463_-	PRK15026, PRK15026, aminoacyl-histidine dipeptidase; Provisional	NA|153aa|down_7|NZ_CP054363.1_4110723_4111182_+	PRK09177, PRK09177, xanthine-guanine phosphoribosyltransferase; Validated	NA|415aa|down_8|NZ_CP054363.1_4111273_4112518_+	PRK05077, frsA, esterase FrsA	NA|134aa|down_9|NZ_CP054363.1_4112575_4112977_+	PRK10984, PRK10984, sigma factor-binding protein Crl
