assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000182745.2_ASM18274v1	NC_016027	Komagataeibacter medellinensis NBRC 3288, complete genome	1	883982-884437	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no	cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3	DEDDh,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3,csa3,DinG	Type I-E	GTGTTCCCCGCACGCGCGGGGATGAACCG,GTGTTCCCCGCACGCGCGGGGATGAACCG,GTGTTCCCCGCACGCGCGGGGATGAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	6,7,7	7	TypeI-E	DEDDh,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3,csa3,DinG,WYL	NA|392aa|up_3|NC_016027.1_877331_878507_-,NA|206aa|up_0|NC_016027.1_883143_883761_-,NA|70aa|down_2|NC_016027.1_889598_889808_+	NA|663aa|up_9|NC_016027.1_869812_871801_-	pfam13624, SurA_N_3, SurA N-terminal domain	NA|248aa|up_8|NC_016027.1_872004_872748_+	PRK00042, tpiA, triosephosphate isomerase; Provisional	NA|105aa|up_7|NC_016027.1_872785_873100_+	COG1314, SecG, Preprotein translocase subunit SecG [Intracellular trafficking and secretion]	NA|550aa|up_6|NC_016027.1_873228_874878_+	PRK05380, pyrG, CTP synthetase; Validated	NA|283aa|up_5|NC_016027.1_874874_875723_+	PRK05198, PRK05198, 2-dehydro-3-deoxyphosphooctonate aldolase; Provisional	NA|367aa|up_4|NC_016027.1_876175_877276_-	cd03801, GT4_PimA-like, phosphatidyl-myo-inositol mannosyltransferase	NA|392aa|up_3|NC_016027.1_877331_878507_-	NA	NA|697aa|up_2|NC_016027.1_878753_880844_-	COG5001, COG5001, Predicted signal transduction protein containing a membrane domain, an EAL and a GGDEF domain [Signal transduction mechanisms]	NA|560aa|up_1|NC_016027.1_881073_882753_-	pfam07396, Porin_O_P, Phosphate-selective porin O and P	NA|206aa|up_0|NC_016027.1_883143_883761_-	NA	NA|800aa|down_0|NC_016027.1_885039_887439_-	TIGR02505, RTPR, ribonucleoside-triphosphate reductase, adenosylcobalamin-dependent	NA|392aa|down_1|NC_016027.1_887722_888898_+	pfam06772, LtrA, Bacterial low temperature requirement A protein (LtrA)	NA|70aa|down_2|NC_016027.1_889598_889808_+	NA	cas2|114aa|down_3|NC_016027.1_890955_891297_-	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	cas1|320aa|down_4|NC_016027.1_891277_892237_-	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas6e|236aa|down_5|NC_016027.1_892246_892954_-	smart01101, CRISPR_assoc, This domain forms an anti-parallel beta strand structure with flanking alpha helical regions	cas5|262aa|down_6|NC_016027.1_892950_893736_-	TIGR01868, hypothetical_protein, CRISPR-associated protein Cas5/CasD, subtype I-E/ECOLI	cas7|353aa|down_7|NC_016027.1_893739_894798_-	pfam09344, Cas_CT1975, CT1975-like protein	cse2gr11|183aa|down_8|NC_016027.1_894918_895467_-	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas8e|548aa|down_9|NC_016027.1_895466_897110_-	cd09729, Cse1_I-E, CRISPR/Cas system-associated protein Cse1
GCF_000182745.2_ASM18274v1	NC_016027	Komagataeibacter medellinensis NBRC 3288, complete genome	2	889939-890882	2,2,2	CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3	DEDDh,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3,csa3,DinG	Type I-E	CGGTTCATCCCCGCGTGTGCGGGGAACAC,CGGTTCATCCCCGCGTGTGCGGGGAACAC,CGGTTCATCCCCGCGTGTGCGGGGAACAC	29,29,29	0	0	NA	NA	I-E:I-E:I-E	15,15,14	15	TypeI-E	DEDDh,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3,csa3,DinG,WYL	NA|392aa|up_6|NC_016027.1_877331_878507_-,NA|206aa|up_3|NC_016027.1_883143_883761_-,NA|70aa|up_0|NC_016027.1_889598_889808_+,NA	NA|550aa|up_9|NC_016027.1_873228_874878_+	PRK05380, pyrG, CTP synthetase; Validated	NA|283aa|up_8|NC_016027.1_874874_875723_+	PRK05198, PRK05198, 2-dehydro-3-deoxyphosphooctonate aldolase; Provisional	NA|367aa|up_7|NC_016027.1_876175_877276_-	cd03801, GT4_PimA-like, phosphatidyl-myo-inositol mannosyltransferase	NA|392aa|up_6|NC_016027.1_877331_878507_-	NA	NA|697aa|up_5|NC_016027.1_878753_880844_-	COG5001, COG5001, Predicted signal transduction protein containing a membrane domain, an EAL and a GGDEF domain [Signal transduction mechanisms]	NA|560aa|up_4|NC_016027.1_881073_882753_-	pfam07396, Porin_O_P, Phosphate-selective porin O and P	NA|206aa|up_3|NC_016027.1_883143_883761_-	NA	NA|800aa|up_2|NC_016027.1_885039_887439_-	TIGR02505, RTPR, ribonucleoside-triphosphate reductase, adenosylcobalamin-dependent	NA|392aa|up_1|NC_016027.1_887722_888898_+	pfam06772, LtrA, Bacterial low temperature requirement A protein (LtrA)	NA|70aa|up_0|NC_016027.1_889598_889808_+	NA	cas2|114aa|down_0|NC_016027.1_890955_891297_-	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	cas1|320aa|down_1|NC_016027.1_891277_892237_-	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas6e|236aa|down_2|NC_016027.1_892246_892954_-	smart01101, CRISPR_assoc, This domain forms an anti-parallel beta strand structure with flanking alpha helical regions	cas5|262aa|down_3|NC_016027.1_892950_893736_-	TIGR01868, hypothetical_protein, CRISPR-associated protein Cas5/CasD, subtype I-E/ECOLI	cas7|353aa|down_4|NC_016027.1_893739_894798_-	pfam09344, Cas_CT1975, CT1975-like protein	cse2gr11|183aa|down_5|NC_016027.1_894918_895467_-	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas8e|548aa|down_6|NC_016027.1_895466_897110_-	cd09729, Cse1_I-E, CRISPR/Cas system-associated protein Cse1	cas3|904aa|down_7|NC_016027.1_897570_900282_-	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	NA|168aa|down_8|NC_016027.1_901431_901935_-	pfam01613, Flavin_Reduct, Flavin reductase like domain	NA|457aa|down_9|NC_016027.1_902305_903676_+	cd07100, ALDH_SSADH1_GabD1, Mycobacterium tuberculosis succinate-semialdehyde dehydrogenase 1-like
GCF_000182745.2_ASM18274v1	NC_016027	Komagataeibacter medellinensis NBRC 3288, complete genome	3	900439-901260	3,3,3	CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3	DEDDh,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3,csa3,DinG	Type I-E	CGGTTCATCCCCGCGCGTGCGGGGAACAC,CGGTTCATCCCCGCGCGTGCGGGGAACAC,CGGTTCATCCCCGCGCGTGCGGGGAACAC	29,29,29	0	0	NA	NA	I-E:I-E:I-E	13,13,12	13	TypeI-E	DEDDh,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3,csa3,DinG,WYL	NA|70aa|up_8|NC_016027.1_889598_889808_+,NA|127aa|down_4|NC_016027.1_913573_913954_+	NA|392aa|up_9|NC_016027.1_887722_888898_+	pfam06772, LtrA, Bacterial low temperature requirement A protein (LtrA)	NA|70aa|up_8|NC_016027.1_889598_889808_+	NA	cas2|114aa|up_7|NC_016027.1_890955_891297_-	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	cas1|320aa|up_6|NC_016027.1_891277_892237_-	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas6e|236aa|up_5|NC_016027.1_892246_892954_-	smart01101, CRISPR_assoc, This domain forms an anti-parallel beta strand structure with flanking alpha helical regions	cas5|262aa|up_4|NC_016027.1_892950_893736_-	TIGR01868, hypothetical_protein, CRISPR-associated protein Cas5/CasD, subtype I-E/ECOLI	cas7|353aa|up_3|NC_016027.1_893739_894798_-	pfam09344, Cas_CT1975, CT1975-like protein	cse2gr11|183aa|up_2|NC_016027.1_894918_895467_-	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas8e|548aa|up_1|NC_016027.1_895466_897110_-	cd09729, Cse1_I-E, CRISPR/Cas system-associated protein Cse1	cas3|904aa|up_0|NC_016027.1_897570_900282_-	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	NA|168aa|down_0|NC_016027.1_901431_901935_-	pfam01613, Flavin_Reduct, Flavin reductase like domain	NA|457aa|down_1|NC_016027.1_902305_903676_+	cd07100, ALDH_SSADH1_GabD1, Mycobacterium tuberculosis succinate-semialdehyde dehydrogenase 1-like	NA|181aa|down_2|NC_016027.1_910651_911194_+	COG2032, SodC, Cu/Zn superoxide dismutase [Inorganic ion transport and metabolism]	NA|534aa|down_3|NC_016027.1_911805_913407_-	PRK00074, guaA, GMP synthase; Reviewed	NA|127aa|down_4|NC_016027.1_913573_913954_+	NA	NA|170aa|down_5|NC_016027.1_914047_914557_+	cd04673, Nudix_Hydrolase_15, Members of the Nudix hydrolase superfamily catalyze the hydrolysis of NUcleoside DIphosphates linked to other moieties, X	NA|117aa|down_6|NC_016027.1_914553_914904_+	cd00156, REC, phosphoacceptor receiver (REC) domain of response regulators (RRs) and pseudo response regulators (PRRs)	NA|483aa|down_7|NC_016027.1_915011_916460_-	pfam13231, PMT_2, Dolichyl-phosphate-mannose-protein mannosyltransferase	NA|157aa|down_8|NC_016027.1_916480_916951_-	COG1522, Lrp, Transcriptional regulators [Transcription]	NA|319aa|down_9|NC_016027.1_917091_918048_+	TIGR01292, Thioredoxin_reductase, thioredoxin-disulfide reductase
GCF_000182745.2_ASM18274v1	NC_016027	Komagataeibacter medellinensis NBRC 3288, complete genome	4	1851600-1851709	4	CRISPRCasFinder	no		DEDDh,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3,csa3,DinG	Orphan	CTGCCCGACATGCCCGACTGCCCGA	25	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3,csa3,DinG,WYL	NA,NA|91aa|down_2|NC_016027.1_1854636_1854909_-,NA|136aa|down_3|NC_016027.1_1854905_1855313_-,NA|258aa|down_5|NC_016027.1_1855814_1856588_-,NA|63aa|down_6|NC_016027.1_1856590_1856779_-,NA|110aa|down_7|NC_016027.1_1856775_1857105_-,NA|83aa|down_8|NC_016027.1_1857101_1857350_-,NA|78aa|down_9|NC_016027.1_1857346_1857580_-	NA|288aa|up_9|NC_016027.1_1838779_1839643_+	COG1108, ZnuB, ABC-type Mn2+/Zn2+ transport systems, permease components [Inorganic ion transport and metabolism]	NA|299aa|up_8|NC_016027.1_1839656_1840553_+	cd01137, PsaA, Metal binding protein PsaA	NA|590aa|up_7|NC_016027.1_1840524_1842294_-	COG4178, COG4178, ABC-type uncharacterized transport system, permease and ATPase components [General function prediction only]	NA|150aa|up_6|NC_016027.1_1842678_1843128_+	PRK11667, PRK11667, hypothetical protein; Provisional	NA|560aa|up_5|NC_016027.1_1843200_1844880_-	cd08506, PBP2_clavulanate_OppA2, The substrate-binding domain of an oligopeptide binding protein (OppA2) from the biosynthesis pathway of the beta-lactamase inhibitor clavulanic acid contains the type 2 periplasmic binding fold	NA|210aa|up_4|NC_016027.1_1844894_1845524_-	pfam02630, SCO1-SenC, SCO1/SenC	NA|925aa|up_3|NC_016027.1_1845523_1848298_-	PRK05755, PRK05755, DNA polymerase I; Provisional	NA|72aa|up_2|NC_016027.1_1848312_1848528_-	pfam10276, zf-CHCC, Zinc-finger domain	NA|362aa|up_1|NC_016027.1_1848600_1849686_+	pfam12146, Hydrolase_4, Serine aminopeptidase, S33	NA|187aa|up_0|NC_016027.1_1850165_1850726_-	cd03768, SR_ResInv, Serine Recombinase (SR) family, Resolvase and Invertase subfamily, catalytic domain; members contain a C-terminal DNA binding domain	NA|866aa|down_0|NC_016027.1_1851736_1854334_-	pfam06048, DUF927, Domain of unknown function (DUF927)	NA|101aa|down_1|NC_016027.1_1854337_1854640_-	PRK07078, PRK07078, hypothetical protein; Validated	NA|91aa|down_2|NC_016027.1_1854636_1854909_-	NA	NA|136aa|down_3|NC_016027.1_1854905_1855313_-	NA	NA|69aa|down_4|NC_016027.1_1855513_1855720_-	TIGR01764, Probable_excisionase, DNA binding domain, excisionase family	NA|258aa|down_5|NC_016027.1_1855814_1856588_-	NA	NA|63aa|down_6|NC_016027.1_1856590_1856779_-	NA	NA|110aa|down_7|NC_016027.1_1856775_1857105_-	NA	NA|83aa|down_8|NC_016027.1_1857101_1857350_-	NA	NA|78aa|down_9|NC_016027.1_1857346_1857580_-	NA
GCF_000182745.2_ASM18274v1	NC_016021	Komagataeibacter medellinensis NBRC 3288 plasmid pGXY020, complete sequence	1	968-1321	1,1	CRT,PILER-CR	no	csa3	csa3	Type I-A	NCGGTGCAATCNCCACCC,CGGTGCAATCGCCACCC	18,17	0	0	NA	NA	NA:NA	7,7	7	Orphan	DEDDh,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3,csa3,DinG,WYL	NA,NA|121aa|down_1|NC_016021.1_3369_3732_+,NA|132aa|down_7|NC_016021.1_8241_8637_+	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|302aa|up_0|NC_016021.1_39_945_+	pfam04796, RepA_C, Plasmid encoded RepA protein	NA|190aa|down_0|NC_016021.1_2302_2872_+	cd03768, SR_ResInv, Serine Recombinase (SR) family, Resolvase and Invertase subfamily, catalytic domain; members contain a C-terminal DNA binding domain	NA|121aa|down_1|NC_016021.1_3369_3732_+	NA	NA|237aa|down_2|NC_016021.1_3790_4501_+	cd16892, LT_VirB1-like, VirB1-like subfamily	NA|108aa|down_3|NC_016021.1_4504_4828_+	PRK13857, PRK13857, pilin major subunit VirB2	NA|108aa|down_4|NC_016021.1_4831_5155_+	PRK13854, PRK13854, type IV secretion system protein VirB3; Provisional	NA|791aa|down_5|NC_016021.1_5154_7527_+	PRK13853, PRK13853, type IV secretion system protein VirB4; Provisional	NA|229aa|down_6|NC_016021.1_7543_8230_+	pfam07996, T4SS, Type IV secretion system proteins	NA|132aa|down_7|NC_016021.1_8241_8637_+	NA	NA|307aa|down_8|NC_016021.1_8681_9602_+	PRK13852, PRK13852, type IV secretion system protein	NA|57aa|down_9|NC_016021.1_9640_9811_+	PRK13859, PRK13859, type IV secretion system lipoprotein VirB7; Provisional
