assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCA_003856675.1_ASM385667v1	CP023820	Escherichia coli strain 7/2 chromosome, complete genome	1	46832-46963	1	PILER-CR	no		DEDDh,c2c9_V-U4,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,WYL,RT	Orphan	TTTTCAATATTGGTGAT	17	0	0	NA	NA	NA	2	2	Orphan	DEDDh,c2c9_V-U4,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,WYL,RT	NA|73aa|up_7|CP023820.1_38674_38893_-,NA	NA|383aa|up_9|CP023820.1_34279_35428_+	PRK12564, PRK12564, carbamoyl-phosphate synthase small subunit	NA|1074aa|up_8|CP023820.1_35445_38667_+	PRK05294, carB, carbamoyl-phosphate synthase large subunit	NA|73aa|up_7|CP023820.1_38674_38893_-	NA	NA|132aa|up_6|CP023820.1_38927_39323_+	PRK11476, PRK11476, carnitine metabolism transcriptional regulator CaiF	NA|197aa|up_5|CP023820.1_39441_40032_-	PRK13627, PRK13627, carnitine operon protein CaiE; Provisional	NA|262aa|up_4|CP023820.1_40037_40823_-	PRK03580, PRK03580, crotonobetainyl-CoA hydratase	NA|518aa|up_3|CP023820.1_40931_42485_-	PRK08008, caiC, putative crotonobetaine/carnitine-CoA ligase; Validated	NA|406aa|up_2|CP023820.1_42558_43776_-	PRK03525, PRK03525, L-carnitine CoA-transferase	NA|381aa|up_1|CP023820.1_43893_45036_-	PRK03354, PRK03354, crotonobetainyl-CoA dehydrogenase; Validated	NA|505aa|up_0|CP023820.1_45066_46581_-	PRK03356, PRK03356, L-carnitine/gamma-butyrobetaine antiport BCCT transporter	NA|257aa|down_0|CP023820.1_47053_47824_+	PRK03359, PRK03359, putative electron transfer flavoprotein FixA; Reviewed	NA|314aa|down_1|CP023820.1_47838_48780_+	PRK03363, fixB, electron transfer flavoprotein subunit alpha/FixB family protein	NA|429aa|down_2|CP023820.1_48830_50117_+	PRK10157, PRK10157, putative oxidoreductase FixC; Provisional	NA|96aa|down_3|CP023820.1_50113_50401_+	PRK15449, PRK15449, ferredoxin-like protein FixX; Provisional	NA|444aa|down_4|CP023820.1_50459_51791_+	cd17316, MFS_SV2_like, Metazoan Synaptic vesicle glycoprotein 2 (SV2) and related small molecule transporters of the Major Facilitator Superfamily	NA|177aa|down_5|CP023820.1_51898_52429_+	PRK00871, PRK00871, glutathione-regulated potassium-efflux system oxidoreductase KefF	NA|621aa|down_6|CP023820.1_52421_54284_+	PRK03562, PRK03562, glutathione-regulated potassium-efflux system protein KefC; Provisional	NA|160aa|down_7|CP023820.1_54475_54955_+	PRK10769, folA, type 3 dihydrofolate reductase	NA|78aa|down_8|CP023820.1_55040_55274_+	COG5302, COG5302, Post-segregation antitoxin (ccd killing mechanism protein) encoded by the F plasmid [General function prediction only]	NA|84aa|down_9|CP023820.1_55276_55528_+	pfam01845, CcdB, CcdB protein
GCA_003856675.1_ASM385667v1	CP023820	Escherichia coli strain 7/2 chromosome, complete genome	2	3166593-3167228	1,2,1	CRT,PILER-CR,CRISPRCasFinder	no	cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3	DEDDh,c2c9_V-U4,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,WYL,RT	Type I-E	TTTATCCCCGCTGGCGCGGGGAACAC,CGATTTATCCCCGCTGGCGCGGGGAACAC,TTTATCCCCGCTGGCGCGGGGAACAC	26,29,26	0	0	NA	NA	I-E:I-E:I-E	10,9,9	10	TypeI-E	DEDDh,c2c9_V-U4,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,WYL,RT	NA,NA	NA|254aa|up_9|CP023820.1_3158463_3159225_-	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional	NA|350aa|up_8|CP023820.1_3159205_3160255_-	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|160aa|up_7|CP023820.1_3160251_3160731_-	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|237aa|up_6|CP023820.1_3160730_3161441_-	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|104aa|up_5|CP023820.1_3161459_3161771_-	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|108aa|up_4|CP023820.1_3161964_3162288_-	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|202aa|up_3|CP023820.1_3162337_3162943_-	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|476aa|up_2|CP023820.1_3162942_3164370_-	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|303aa|up_1|CP023820.1_3164371_3165280_-	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|346aa|up_0|CP023820.1_3165531_3166569_+	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	cas2|98aa|down_0|CP023820.1_3167324_3167618_-	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	cas1|308aa|down_1|CP023820.1_3167614_3168538_-	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas6e|217aa|down_2|CP023820.1_3168534_3169185_-	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas5|249aa|down_3|CP023820.1_3169166_3169913_-	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|352aa|down_4|CP023820.1_3169923_3170979_-	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cse2gr11|179aa|down_5|CP023820.1_3170993_3171530_-	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas8e|521aa|down_6|CP023820.1_3171526_3173089_-	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cas3|900aa|down_7|CP023820.1_3173186_3175886_-	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	NA|51aa|down_8|CP023820.1_3176080_3176233_-	pfam01848, HOK_GEF, Hok/gef family	NA|245aa|down_9|CP023820.1_3176497_3177232_-	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase
GCA_003856675.1_ASM385667v1	CP023820	Escherichia coli strain 7/2 chromosome, complete genome	3	3194366-3194699	2,2,3	CRISPRCasFinder,CRT,PILER-CR	no		DEDDh,c2c9_V-U4,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,WYL,RT	Orphan	CGGTTTATCCCCGCTGGCGCGGGGAACTC,CGGTTTATCCCCGCTGGCGCGGGGAACTC,CGGTTTATCCCCGCTGGCGCGGGGAACTC	29,29,29	0	0	NA	NA	I-E:I-E:I-E	5,5,4	5	Orphan	DEDDh,c2c9_V-U4,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,WYL,RT	NA,NA	NA|192aa|up_9|CP023820.1_3183114_3183690_+	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|174aa|up_8|CP023820.1_3183824_3184346_+	COG2963, COG2963, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|241aa|up_7|CP023820.1_3184450_3185173_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|287aa|up_6|CP023820.1_3185272_3186133_-	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|260aa|up_5|CP023820.1_3186129_3186909_-	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|446aa|up_4|CP023820.1_3186886_3188224_-	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|485aa|up_3|CP023820.1_3188317_3189772_-	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|262aa|up_2|CP023820.1_3189841_3190627_-	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|426aa|up_1|CP023820.1_3190945_3192223_+	cd06174, MFS, Major Facilitator Superfamily	NA|493aa|up_0|CP023820.1_3192249_3193728_+	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|224aa|down_0|CP023820.1_3195037_3195709_-	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|291aa|down_1|CP023820.1_3196002_3196875_+	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|433aa|down_2|CP023820.1_3196934_3198233_-	PRK00077, eno, enolase; Provisional	NA|546aa|down_3|CP023820.1_3198319_3199957_-	PRK05380, pyrG, CTP synthetase; Validated	NA|264aa|down_4|CP023820.1_3200184_3200976_-	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|112aa|down_5|CP023820.1_3201047_3201383_-	PRK09907, PRK09907, endoribonuclease MazF	NA|83aa|down_6|CP023820.1_3201382_3201631_-	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|745aa|down_7|CP023820.1_3201708_3203943_-	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|434aa|down_8|CP023820.1_3203990_3205292_-	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|919aa|down_9|CP023820.1_3205348_3208105_+	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional
GCA_003856675.1_ASM385667v1	CP023820	Escherichia coli strain 7/2 chromosome, complete genome	4	4914622-4914771	3	CRISPRCasFinder	no		DEDDh,c2c9_V-U4,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,WYL,RT	Orphan	CGCGTCTTATCAGGCCTACGAGTTCGGTGCTGTGTAGGTCGGATAAGGCGTTCA	54	0	0	NA	NA	NA	1	1	Orphan	DEDDh,c2c9_V-U4,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,WYL,RT	NA|532aa|up_6|CP023820.1_4905928_4907524_+,NA	NA|238aa|up_9|CP023820.1_4903831_4904545_-	PRK12742, PRK12742, SDR family oxidoreductase	NA|198aa|up_8|CP023820.1_4904615_4905209_+	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|151aa|up_7|CP023820.1_4905353_4905806_+	COG2731, EbgC, Beta-galactosidase, beta subunit [Carbohydrate transport and metabolism]	NA|532aa|up_6|CP023820.1_4905928_4907524_+	NA	NA|335aa|up_5|CP023820.1_4907579_4908584_-	PRK03515, PRK03515, ornithine carbamoyltransferase subunit I; Provisional	NA|139aa|up_4|CP023820.1_4908745_4909162_+	PRK11191, PRK11191, ribonuclease E inhibitor RraB	NA|168aa|up_3|CP023820.1_4909207_4909711_-	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|399aa|up_2|CP023820.1_4909903_4911100_+	COG4269, COG4269, Predicted membrane protein [Function unknown]	NA|952aa|up_1|CP023820.1_4911155_4914011_-	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|148aa|up_0|CP023820.1_4914010_4914454_-	PRK05728, PRK05728, DNA polymerase III subunit chi; Validated	NA|504aa|down_0|CP023820.1_4914807_4916319_-	PRK00913, PRK00913, multifunctional aminopeptidase A; Provisional	NA|367aa|down_1|CP023820.1_4916585_4917686_+	PRK15120, PRK15120, lipopolysaccharide ABC transporter permease LptF; Provisional	NA|361aa|down_2|CP023820.1_4917685_4918768_+	PRK15071, PRK15071, lipopolysaccharide ABC transporter permease; Provisional	NA|501aa|down_3|CP023820.1_4918928_4920431_-	pfam05872, DUF853, Bacterial protein of unknown function (DUF853)	NA|333aa|down_4|CP023820.1_4920508_4921507_-	cd01575, PBP1_GntR, ligand-binding domain of DNA transcription repressor GntR specific for gluconate, a member of the LacI-GalR family of bacterial transcription regulators	NA|440aa|down_5|CP023820.1_4921573_4922893_-	TIGR00791, Gluconate_permease, gluconate transporter	NA|255aa|down_6|CP023820.1_4922955_4923720_-	PRK08085, PRK08085, gluconate 5-dehydrogenase; Provisional	NA|344aa|down_7|CP023820.1_4923743_4924775_-	PRK09880, PRK09880, L-idonate 5-dehydrogenase; Provisional	NA|188aa|down_8|CP023820.1_4924991_4925555_+	PRK09825, idnK, gluconokinase	NA|340aa|down_9|CP023820.1_4925558_4926578_-	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)
GCA_003856675.1_ASM385667v1	CP023822	Escherichia coli strain 7/2 plasmid p7_2.2, complete sequence	1	28370-28543	1,1	CRISPRCasFinder,CRT	no			Orphan	TGTACCGCTTTGTTGGTTAAAGTGTACCT,ACCGCTTTGTTGGTTAAAGTGTACCT	29,26	0	0	NA	NA	NA:NA	1,3	3	Orphan	DEDDh,c2c9_V-U4,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,PD-DExK,WYL,RT	NA|60aa|up_8|CP023822.1_21107_21287_-,NA|133aa|up_5|CP023822.1_24481_24880_-,NA|105aa|up_4|CP023822.1_24937_25252_-,NA|137aa|up_2|CP023822.1_26041_26452_-,NA|83aa|down_0|CP023822.1_29112_29361_+,NA|213aa|down_2|CP023822.1_30562_31201_+,NA|86aa|down_3|CP023822.1_31242_31500_+,NA|80aa|down_4|CP023822.1_31697_31937_+,NA|102aa|down_5|CP023822.1_32297_32603_+,NA|233aa|down_7|CP023822.1_33785_34484_+,NA|112aa|down_8|CP023822.1_34523_34859_+,NA|74aa|down_9|CP023822.1_34868_35090_+	NA|266aa|up_9|CP023822.1_20310_21108_-	cd16424, VirB8, periplasmic domain of VirB8 protein	NA|60aa|up_8|CP023822.1_21107_21287_-	NA	NA|218aa|up_7|CP023822.1_21338_21992_-	pfam07996, T4SS, Type IV secretion system proteins	NA|838aa|up_6|CP023822.1_22002_24516_-	TIGR00929, CAG_pathogenicity_island_protein_23, type IV secretion/conjugal transfer ATPase, VirB4 family	NA|133aa|up_5|CP023822.1_24481_24880_-	NA	NA|105aa|up_4|CP023822.1_24937_25252_-	NA	NA|226aa|up_3|CP023822.1_25268_25946_-	cd16892, LT_VirB1-like, VirB1-like subfamily	NA|137aa|up_2|CP023822.1_26041_26452_-	NA	NA|168aa|up_1|CP023822.1_26661_27165_-	cd06170, LuxR_C_like, C-terminal DNA-binding domain of LuxR-like proteins	NA|354aa|up_0|CP023822.1_27168_28230_-	pfam01051, Rep_3, Initiator Replication protein	NA|83aa|down_0|CP023822.1_29112_29361_+	NA	NA|351aa|down_1|CP023822.1_29380_30433_+	pfam04610, TrbL, TrbL/VirB6 plasmid conjugal transfer protein	NA|213aa|down_2|CP023822.1_30562_31201_+	NA	NA|86aa|down_3|CP023822.1_31242_31500_+	NA	NA|80aa|down_4|CP023822.1_31697_31937_+	NA	NA|102aa|down_5|CP023822.1_32297_32603_+	NA	NA|328aa|down_6|CP023822.1_32746_33730_+	TIGR00180, Probable_chromosome-partitioning_protein_ParB, ParB/RepB/Spo0J family partition protein	NA|233aa|down_7|CP023822.1_33785_34484_+	NA	NA|112aa|down_8|CP023822.1_34523_34859_+	NA	NA|74aa|down_9|CP023822.1_34868_35090_+	NA
