assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_007741555.1_ASM774155v1	NZ_CP036526	Planctomycetes bacterium K23_9 chromosome, complete genome	1	14950-15164	1	CRISPRCasFinder	no		Cas9_archaeal,cas3,csa3,RT,DEDDh,WYL,DinG,cas1,cas2,csb2gr5,csb1gr7	Orphan	AAGAAAAAAGCAGCTAAGAAGAAGCCTGCTAAGAA	35	0	0	NA	NA	NA	3	3	Orphan	Cas9_archaeal,cas3,csa3,RT,DEDDh,WYL,DinG,cas1,cas2,csb2gr5,csb1gr7	NA|205aa|up_7|NZ_CP036526.1_6944_7559_+,NA|110aa|up_6|NZ_CP036526.1_7599_7929_+,NA|136aa|down_1|NZ_CP036526.1_16776_17184_-,NA|108aa|down_3|NZ_CP036526.1_18736_19060_-,NA|470aa|down_4|NZ_CP036526.1_19379_20789_+,NA|227aa|down_5|NZ_CP036526.1_20857_21538_+,NA|243aa|down_6|NZ_CP036526.1_21766_22495_+	NA|102aa|up_9|NZ_CP036526.1_5910_6216_+	pfam05258, DUF721, Protein of unknown function (DUF721)	NA|211aa|up_8|NZ_CP036526.1_6234_6867_+	pfam03352, Adenine_glyco, Methyladenine glycosylase	NA|205aa|up_7|NZ_CP036526.1_6944_7559_+	NA	NA|110aa|up_6|NZ_CP036526.1_7599_7929_+	NA	NA|401aa|up_5|NZ_CP036526.1_7957_9160_-	sd00006, TPR, Tetratricopeptide repeat	NA|376aa|up_4|NZ_CP036526.1_9299_10427_-	PRK00578, prfB, peptide chain release factor 2; Validated	NA|384aa|up_3|NZ_CP036526.1_10494_11646_+	PRK00143, mnmA, tRNA-specific 2-thiouridylase MnmA; Reviewed	NA|311aa|up_2|NZ_CP036526.1_11895_12828_+	COG0705, COG0705, Membrane associated serine protease [Amino acid transport and metabolism]	NA|193aa|up_1|NZ_CP036526.1_12881_13460_+	pfam00578, AhpC-TSA, AhpC/TSA family	NA|265aa|up_0|NZ_CP036526.1_13558_14353_+	cd06164, S2P-M50_SpoIVFB_CBS, SpoIVFB Site-2 protease (S2P), a zinc metalloprotease (MEROPS family M50B), regulates intramembrane proteolysis (RIP), and is involved in the pro-sigmaK pathway of bacterial spore formation	NA|359aa|down_0|NZ_CP036526.1_15426_16503_-	pfam10609, ParA, NUBPL iron-transfer P-loop NTPase	NA|136aa|down_1|NZ_CP036526.1_16776_17184_-	NA	NA|486aa|down_2|NZ_CP036526.1_17180_18638_-	COG3829, RocR, Transcriptional regulator containing PAS, AAA-type ATPase, and DNA-binding domains [Transcription / Signal transduction mechanisms]	NA|108aa|down_3|NZ_CP036526.1_18736_19060_-	NA	NA|470aa|down_4|NZ_CP036526.1_19379_20789_+	NA	NA|227aa|down_5|NZ_CP036526.1_20857_21538_+	NA	NA|243aa|down_6|NZ_CP036526.1_21766_22495_+	NA	NA|392aa|down_7|NZ_CP036526.1_22553_23729_-	pfam14486, DUF4432, Domain of unknown function (DUF4432)	NA|334aa|down_8|NZ_CP036526.1_24421_25423_+	pfam01261, AP_endonuc_2, Xylose isomerase-like TIM barrel	NA|380aa|down_9|NZ_CP036526.1_26057_27197_+	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]
GCF_007741555.1_ASM774155v1	NZ_CP036526	Planctomycetes bacterium K23_9 chromosome, complete genome	2	4211209-4211289	2	CRISPRCasFinder	no		Cas9_archaeal,cas3,csa3,RT,DEDDh,WYL,DinG,cas1,cas2,csb2gr5,csb1gr7	Orphan	TCATCGAACAGGCTCCCGTCATCG	24	0	0	NA	NA	NA	1	1	Orphan	Cas9_archaeal,cas3,csa3,RT,DEDDh,WYL,DinG,cas1,cas2,csb2gr5,csb1gr7	NA|78aa|up_9|NZ_CP036526.1_4197090_4197324_-,NA|79aa|down_3|NZ_CP036526.1_4216836_4217073_+,NA|325aa|down_4|NZ_CP036526.1_4217069_4218044_-,NA|169aa|down_6|NZ_CP036526.1_4220226_4220733_+,NA|283aa|down_7|NZ_CP036526.1_4221434_4222283_+,NA|186aa|down_8|NZ_CP036526.1_4222481_4223039_+	NA|78aa|up_9|NZ_CP036526.1_4197090_4197324_-	NA	NA|858aa|up_8|NZ_CP036526.1_4197396_4199970_-	COG4232, COG4232, Thiol:disulfide interchange protein [Posttranslational modification, protein turnover, chaperones / Energy production and conversion]	NA|373aa|up_7|NZ_CP036526.1_4200094_4201213_-	pfam01636, APH, Phosphotransferase enzyme family	NA|192aa|up_6|NZ_CP036526.1_4201209_4201785_-	pfam02367, TsaE, Threonylcarbamoyl adenosine biosynthesis protein TsaE	NA|362aa|up_5|NZ_CP036526.1_4202092_4203178_+	cd06853, GT_WecA_like, This subfamily contains Escherichia coli WecA, Bacillus subtilis TagO and related proteins	NA|830aa|up_4|NZ_CP036526.1_4203156_4205646_+	pfam04932, Wzy_C, O-Antigen ligase	NA|418aa|up_3|NZ_CP036526.1_4205745_4206999_+	pfam07610, DUF1573, Protein of unknown function (DUF1573)	NA|528aa|up_2|NZ_CP036526.1_4207814_4209398_+	pfam13435, Cytochrome_C554, Cytochrome c554 and c-prime	NA|154aa|up_1|NZ_CP036526.1_4209460_4209922_-	pfam13673, Acetyltransf_10, Acetyltransferase (GNAT) domain	NA|289aa|up_0|NZ_CP036526.1_4209939_4210806_-	COG0384, COG0384, Predicted epimerase, PhzC/PhzF homolog [General function prediction only]	NA|801aa|down_0|NZ_CP036526.1_4211993_4214396_+	pfam07631, PSD4, Protein of unknown function (DUF1592)	NA|420aa|down_1|NZ_CP036526.1_4214452_4215712_+	pfam07586, HXXSHH, Protein of unknown function (DUF1552)	NA|261aa|down_2|NZ_CP036526.1_4216035_4216818_+	pfam13240, zinc_ribbon_2, zinc-ribbon domain	NA|79aa|down_3|NZ_CP036526.1_4216836_4217073_+	NA	NA|325aa|down_4|NZ_CP036526.1_4217069_4218044_-	NA	NA|547aa|down_5|NZ_CP036526.1_4218323_4219964_-	PRK06676, rpsA, 30S ribosomal protein S1; Reviewed	NA|169aa|down_6|NZ_CP036526.1_4220226_4220733_+	NA	NA|283aa|down_7|NZ_CP036526.1_4221434_4222283_+	NA	NA|186aa|down_8|NZ_CP036526.1_4222481_4223039_+	NA	NA|3201aa|down_9|NZ_CP036526.1_4223109_4232712_-	pfam07452, CHRD, CHRD domain
GCF_007741555.1_ASM774155v1	NZ_CP036526	Planctomycetes bacterium K23_9 chromosome, complete genome	3	7478642-7478733	3	CRISPRCasFinder	no		Cas9_archaeal,cas3,csa3,RT,DEDDh,WYL,DinG,cas1,cas2,csb2gr5,csb1gr7	Orphan	AGCTTGGCGAACAATCCGCCACCGCT	26	0	0	NA	NA	NA	1	1	Orphan	Cas9_archaeal,cas3,csa3,RT,DEDDh,WYL,DinG,cas1,cas2,csb2gr5,csb1gr7	NA,NA|231aa|down_0|NZ_CP036526.1_7479348_7480041_-,NA|64aa|down_1|NZ_CP036526.1_7481255_7481447_+,NA|355aa|down_9|NZ_CP036526.1_7489945_7491010_+	NA|658aa|up_9|NZ_CP036526.1_7466059_7468033_-	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|272aa|up_8|NZ_CP036526.1_7468280_7469096_+	cd05372, ENR_SDR, Enoyl acyl carrier protein (ACP) reductase (ENR), divergent SDR	NA|200aa|up_7|NZ_CP036526.1_7469141_7469741_+	cd02969, PRX_like1, Peroxiredoxin (PRX)-like 1 family; hypothetical proteins that show sequence similarity to PRXs	NA|310aa|up_6|NZ_CP036526.1_7469931_7470861_+	cd00688, ISOPREN_C2_like, This group contains class II terpene cyclases, protein prenyltransferases beta subunit, two broadly specific proteinase inhibitors alpha2-macroglobulin (alpha (2)-M) and pregnancy zone protein (PZP) and, the C3 C4 and C5 components of vertebrate complement	NA|223aa|up_5|NZ_CP036526.1_7470891_7471560_+	cd03255, ABC_MJ0796_LolCDE_FtsE, ATP-binding cassette domain of the transporters involved in export of lipoprotein and macrolide, and cell division protein	NA|203aa|up_4|NZ_CP036526.1_7471846_7472455_+	PRK05327, rpsD, 30S ribosomal protein S4; Validated	NA|476aa|up_3|NZ_CP036526.1_7472735_7474163_+	PRK06467, PRK06467, dihydrolipoamide dehydrogenase; Reviewed	NA|301aa|up_2|NZ_CP036526.1_7475407_7476310_-	cd06533, Glyco_transf_WecG_TagA, The glycosyltransferase WecG/TagA superfamily contains Escherichia coli WecG, Bacillus subtilis TagA and related proteins	NA|398aa|up_1|NZ_CP036526.1_7476532_7477726_+	cd16148, sulfatase_like, uncharacterized sulfatase subfamily	NA|78aa|up_0|NZ_CP036526.1_7477803_7478037_-	PRK05704, PRK05704, 2-oxoglutarate dehydrogenase complex dihydrolipoyllysine-residue succinyltransferase	NA|231aa|down_0|NZ_CP036526.1_7479348_7480041_-	NA	NA|64aa|down_1|NZ_CP036526.1_7481255_7481447_+	NA	NA|451aa|down_2|NZ_CP036526.1_7481446_7482799_+	PRK09496, trkA, Trk system potassium transporter TrkA	NA|198aa|down_3|NZ_CP036526.1_7482809_7483403_+	pfam12867, DinB_2, DinB superfamily	NA|452aa|down_4|NZ_CP036526.1_7483599_7484955_+	pfam00404, Dockerin_1, Dockerin type I repeat	NA|410aa|down_5|NZ_CP036526.1_7485033_7486263_-	pfam07596, SBP_bac_10, Protein of unknown function (DUF1559)	NA|264aa|down_6|NZ_CP036526.1_7487220_7488012_+	cd08970, AcNei1_N, N-terminal domain of the actinomycetal Nei1 and related DNA glycosylases	NA|323aa|down_7|NZ_CP036526.1_7488134_7489103_+	pfam01916, DS, Deoxyhypusine synthase	NA|181aa|down_8|NZ_CP036526.1_7489406_7489949_+	COG4970, FimT, Tfp pilus assembly protein FimT [Cell motility and secretion / Intracellular trafficking and secretion]	NA|355aa|down_9|NZ_CP036526.1_7489945_7491010_+	NA
GCF_007741555.1_ASM774155v1	NZ_CP036526	Planctomycetes bacterium K23_9 chromosome, complete genome	4	7496801-7497856	1,4,1	PILER-CR,CRISPRCasFinder,CRT	no	cas1,cas2,cas3,csb2gr5,csb1gr7,WYL	Cas9_archaeal,cas3,csa3,RT,DEDDh,WYL,DinG,cas1,cas2,csb2gr5,csb1gr7	Unclear	GCTTCAATGAGGCCGCGTTCGGATGAACGCGGAAAG,GCTTCAATGAGGCCGCGTTCGGATGAACGCGGAAAG,GCTTCAATGAGGCCGCGTTCGGATGAACGCGGAAAG	36,36,36	0	0	NA	NA	NA:NA:NA	14,14,14	14	Unclear	Cas9_archaeal,cas3,csa3,RT,DEDDh,WYL,DinG,cas1,cas2,csb2gr5,csb1gr7	NA|355aa|up_5|NZ_CP036526.1_7489945_7491010_+,NA|230aa|up_4|NZ_CP036526.1_7491006_7491696_+,NA|423aa|up_3|NZ_CP036526.1_7491818_7493087_+,NA|73aa|down_5|NZ_CP036526.1_7507923_7508142_-,NA|83aa|down_6|NZ_CP036526.1_7508606_7508855_+	NA|410aa|up_9|NZ_CP036526.1_7485033_7486263_-	pfam07596, SBP_bac_10, Protein of unknown function (DUF1559)	NA|264aa|up_8|NZ_CP036526.1_7487220_7488012_+	cd08970, AcNei1_N, N-terminal domain of the actinomycetal Nei1 and related DNA glycosylases	NA|323aa|up_7|NZ_CP036526.1_7488134_7489103_+	pfam01916, DS, Deoxyhypusine synthase	NA|181aa|up_6|NZ_CP036526.1_7489406_7489949_+	COG4970, FimT, Tfp pilus assembly protein FimT [Cell motility and secretion / Intracellular trafficking and secretion]	NA|355aa|up_5|NZ_CP036526.1_7489945_7491010_+	NA	NA|230aa|up_4|NZ_CP036526.1_7491006_7491696_+	NA	NA|423aa|up_3|NZ_CP036526.1_7491818_7493087_+	NA	NA|204aa|up_2|NZ_CP036526.1_7493122_7493734_+	cd02165, NMNAT, Nicotinamide/nicotinate mononucleotide adenylyltransferase	NA|538aa|up_1|NZ_CP036526.1_7493753_7495367_-	COG0034, PurF, Glutamine phosphoribosylpyrophosphate amidotransferase [Nucleotide transport and metabolism]	NA|384aa|up_0|NZ_CP036526.1_7495599_7496751_+	PRK05429, PRK05429, gamma-glutamyl kinase; Provisional	cas1|705aa|down_0|NZ_CP036526.1_7498047_7500162_-	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	cas2|97aa|down_1|NZ_CP036526.1_7500201_7500492_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas3|1376aa|down_2|NZ_CP036526.1_7500803_7504931_-	TIGR02621, CRISPR-associated_helicase_Cas3, CRISPR-associated helicase Cas3, subtype Dpsyc	csb2gr5|544aa|down_3|NZ_CP036526.1_7504927_7506559_-	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	csb1gr7|391aa|down_4|NZ_CP036526.1_7506693_7507866_-	pfam09617, Cas_GSU0053, CRISPR-associated protein GSU0053 (Cas_GSU0053)	NA|73aa|down_5|NZ_CP036526.1_7507923_7508142_-	NA	NA|83aa|down_6|NZ_CP036526.1_7508606_7508855_+	NA	NA|122aa|down_7|NZ_CP036526.1_7508875_7509241_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	WYL|341aa|down_8|NZ_CP036526.1_7509249_7510272_-	pfam13280, WYL, WYL domain	NA|299aa|down_9|NZ_CP036526.1_7510409_7511306_-	COG0596, MhpC, Predicted hydrolases or acyltransferases (alpha/beta hydrolase superfamily) [General function prediction only]
