assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_007971385.1_ASM797138v1	NZ_CP042434	Arachidicoccus ginsenosidivorans strain Gsoil 809 chromosome, complete genome	1	3980775-3984533	1,1,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas6,cas7,cas3,cas1,cas2	cas3,PD-DExK,RT,csa3,c2c10_CAS-V-U3,PrimPol,WYL,Cas14u_CAS-V,DEDDh,cas14i,cas6,cas7,cas1,cas2,cas14j	Unclear	GGCTTAATCGAACAATAGTTGAATTGAAAT,GGCTTAATCGAACAATAGTTGAATTGAAAT,GGCTTAATCGAACAATAGTTGAATTGAAAT,GGCTTAATCGAACAATAGTTGAATTGAAAT	30,30,30,30	0	0	NA	NA	NA:NA:NA:NA	53,56,56,53	56	Unclear	cas3,PD-DExK,RT,csa3,c2c10_CAS-V-U3,PrimPol,WYL,Cas14u_CAS-V,DEDDh,cas14i,cas6,cas7,cas1,cas2,cas14j	NA|201aa|up_6|NZ_CP042434.1_3972706_3973309_+,NA|472aa|up_5|NZ_CP042434.1_3973356_3974772_+,NA|118aa|down_2|NZ_CP042434.1_3989207_3989561_-,NA|187aa|down_4|NZ_CP042434.1_3990906_3991467_-	NA|320aa|up_9|NZ_CP042434.1_3969200_3970160_+	PRK10416, PRK10416, signal recognition particle-docking protein FtsY; Provisional	NA|189aa|up_8|NZ_CP042434.1_3970635_3971202_-	pfam14066, DUF4256, Protein of unknown function (DUF4256)	cas6|260aa|up_7|NZ_CP042434.1_3971613_3972393_+	cd09759, Cas6_I-A, CRISPR/Cas system-associated RAMP superfamily protein Cas6	NA|201aa|up_6|NZ_CP042434.1_3972706_3973309_+	NA	NA|472aa|up_5|NZ_CP042434.1_3973356_3974772_+	NA	cas7|343aa|up_4|NZ_CP042434.1_3974780_3975809_+	TIGR02585, conserved_protein, CRISPR-associated protein Cas7/Cst2/DevR, subtype I-B/TNEAP	NA|227aa|up_3|NZ_CP042434.1_3975801_3976482_+	TIGR01895, conserved_hypothetical_protein, CRISPR-associated protein Cas5, subtype I-B/TNEAP	cas3|767aa|up_2|NZ_CP042434.1_3976474_3978775_+	TIGR01587, CRISPR-associated_endonuclease/helicase_Cas3, CRISPR-associated helicase Cas3	cas1|337aa|up_1|NZ_CP042434.1_3979280_3980291_+	cd09722, Cas1_I-B, CRISPR/Cas system-associated protein Cas1	cas2|88aa|up_0|NZ_CP042434.1_3980292_3980556_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|241aa|down_0|NZ_CP042434.1_3986729_3987452_+	pfam13568, OMP_b-brl_2, Outer membrane protein beta-barrel domain	NA|447aa|down_1|NZ_CP042434.1_3987730_3989071_-	PRK09414, PRK09414, NADP-specific glutamate dehydrogenase	NA|118aa|down_2|NZ_CP042434.1_3989207_3989561_-	NA	NA|426aa|down_3|NZ_CP042434.1_3989621_3990899_-	pfam12697, Abhydrolase_6, Alpha/beta hydrolase family	NA|187aa|down_4|NZ_CP042434.1_3990906_3991467_-	NA	NA|91aa|down_5|NZ_CP042434.1_3991471_3991744_-	pfam09862, DUF2089, Protein of unknown function (DUF2089)	NA|292aa|down_6|NZ_CP042434.1_3992981_3993857_-	cd05374, 17beta-HSD-like_SDR_c, 17beta hydroxysteroid dehydrogenase-like, classical (c) SDRs	NA|497aa|down_7|NZ_CP042434.1_3994067_3995558_-	pfam12771, SusD-like_2, Starch-binding associating with outer membrane	NA|1107aa|down_8|NZ_CP042434.1_3995659_3998980_-	TIGR04056, OMP_RagA_SusC, TonB-linked outer membrane protein, SusC/RagA family	NA|398aa|down_9|NZ_CP042434.1_3999304_4000498_-	COG3712, FecR, periplasmic ferric-dicitrate binding protein FecR, regulates iron transport through sigma-19 [Inorganic ion transport and metabolism, Signal transduction mechanisms]
GCF_007971385.1_ASM797138v1	NZ_CP042434	Arachidicoccus ginsenosidivorans strain Gsoil 809 chromosome, complete genome	2	3985505-3986442	2,2,3	CRISPRCasFinder,CRT,PILER-CR	no	cas6,cas7,cas3,cas1,cas2	cas3,PD-DExK,RT,csa3,c2c10_CAS-V-U3,PrimPol,WYL,Cas14u_CAS-V,DEDDh,cas14i,cas6,cas7,cas1,cas2,cas14j	Unclear	GGCTTAATCGAACAATAGTTGAATTGAAAT,GGCTTAATCGAACAATAGTTGAATTGAAAT,GGCTTAATCGAACAATAGTTGAATTGAAAT	30,30,30	0	0	NA	NA	NA:NA:NA	14,14,9	14	Unclear	cas3,PD-DExK,RT,csa3,c2c10_CAS-V-U3,PrimPol,WYL,Cas14u_CAS-V,DEDDh,cas14i,cas6,cas7,cas1,cas2,cas14j	NA|201aa|up_6|NZ_CP042434.1_3972706_3973309_+,NA|472aa|up_5|NZ_CP042434.1_3973356_3974772_+,NA|118aa|down_2|NZ_CP042434.1_3989207_3989561_-,NA|187aa|down_4|NZ_CP042434.1_3990906_3991467_-	NA|320aa|up_9|NZ_CP042434.1_3969200_3970160_+	PRK10416, PRK10416, signal recognition particle-docking protein FtsY; Provisional	NA|189aa|up_8|NZ_CP042434.1_3970635_3971202_-	pfam14066, DUF4256, Protein of unknown function (DUF4256)	cas6|260aa|up_7|NZ_CP042434.1_3971613_3972393_+	cd09759, Cas6_I-A, CRISPR/Cas system-associated RAMP superfamily protein Cas6	NA|201aa|up_6|NZ_CP042434.1_3972706_3973309_+	NA	NA|472aa|up_5|NZ_CP042434.1_3973356_3974772_+	NA	cas7|343aa|up_4|NZ_CP042434.1_3974780_3975809_+	TIGR02585, conserved_protein, CRISPR-associated protein Cas7/Cst2/DevR, subtype I-B/TNEAP	NA|227aa|up_3|NZ_CP042434.1_3975801_3976482_+	TIGR01895, conserved_hypothetical_protein, CRISPR-associated protein Cas5, subtype I-B/TNEAP	cas3|767aa|up_2|NZ_CP042434.1_3976474_3978775_+	TIGR01587, CRISPR-associated_endonuclease/helicase_Cas3, CRISPR-associated helicase Cas3	cas1|337aa|up_1|NZ_CP042434.1_3979280_3980291_+	cd09722, Cas1_I-B, CRISPR/Cas system-associated protein Cas1	cas2|88aa|up_0|NZ_CP042434.1_3980292_3980556_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|241aa|down_0|NZ_CP042434.1_3986729_3987452_+	pfam13568, OMP_b-brl_2, Outer membrane protein beta-barrel domain	NA|447aa|down_1|NZ_CP042434.1_3987730_3989071_-	PRK09414, PRK09414, NADP-specific glutamate dehydrogenase	NA|118aa|down_2|NZ_CP042434.1_3989207_3989561_-	NA	NA|426aa|down_3|NZ_CP042434.1_3989621_3990899_-	pfam12697, Abhydrolase_6, Alpha/beta hydrolase family	NA|187aa|down_4|NZ_CP042434.1_3990906_3991467_-	NA	NA|91aa|down_5|NZ_CP042434.1_3991471_3991744_-	pfam09862, DUF2089, Protein of unknown function (DUF2089)	NA|292aa|down_6|NZ_CP042434.1_3992981_3993857_-	cd05374, 17beta-HSD-like_SDR_c, 17beta hydroxysteroid dehydrogenase-like, classical (c) SDRs	NA|497aa|down_7|NZ_CP042434.1_3994067_3995558_-	pfam12771, SusD-like_2, Starch-binding associating with outer membrane	NA|1107aa|down_8|NZ_CP042434.1_3995659_3998980_-	TIGR04056, OMP_RagA_SusC, TonB-linked outer membrane protein, SusC/RagA family	NA|398aa|down_9|NZ_CP042434.1_3999304_4000498_-	COG3712, FecR, periplasmic ferric-dicitrate binding protein FecR, regulates iron transport through sigma-19 [Inorganic ion transport and metabolism, Signal transduction mechanisms]
GCF_007971385.1_ASM797138v1	NZ_CP042434	Arachidicoccus ginsenosidivorans strain Gsoil 809 chromosome, complete genome	3	4328993-4329134	3	CRT	no		cas3,PD-DExK,RT,csa3,c2c10_CAS-V-U3,PrimPol,WYL,Cas14u_CAS-V,DEDDh,cas14i,cas6,cas7,cas1,cas2,cas14j	Orphan	TATACCTTTTAGGGTATAAT	20	0	0	NA	NA	NA	3	3	Orphan	cas3,PD-DExK,RT,csa3,c2c10_CAS-V-U3,PrimPol,WYL,Cas14u_CAS-V,DEDDh,cas14i,cas6,cas7,cas1,cas2,cas14j	NA|103aa|up_7|NZ_CP042434.1_4319698_4320007_-,NA|261aa|up_6|NZ_CP042434.1_4320158_4320941_-,NA|145aa|down_4|NZ_CP042434.1_4336117_4336552_-,NA|110aa|down_5|NZ_CP042434.1_4336695_4337025_-,NA|1050aa|down_9|NZ_CP042434.1_4343392_4346542_+	NA|565aa|up_9|NZ_CP042434.1_4315007_4316702_-	pfam03929, PepSY_TM, PepSY-associated TM region	NA|818aa|up_8|NZ_CP042434.1_4316720_4319174_-	cd01347, ligand_gated_channel, TonB dependent/Ligand-Gated channels are created by a monomeric 22 strand (22,24) anti-parallel beta-barrel	NA|103aa|up_7|NZ_CP042434.1_4319698_4320007_-	NA	NA|261aa|up_6|NZ_CP042434.1_4320158_4320941_-	NA	NA|328aa|up_5|NZ_CP042434.1_4321163_4322147_+	TIGR00950, Uncharacterized_inner_membrane_transporter_YicL, Carboxylate/Amino Acid/Amine Transporter	NA|892aa|up_4|NZ_CP042434.1_4322192_4324868_-	PRK05580, PRK05580, primosome assembly protein PriA; Validated	NA|221aa|up_3|NZ_CP042434.1_4325120_4325783_+	cd04502, SGNH_hydrolase_like_7, Members of the SGNH-hydrolase superfamily, a diverse family of lipases and esterases	NA|442aa|up_2|NZ_CP042434.1_4325880_4327206_-	cd13131, MATE_NorM_like, Subfamily of the multidrug and toxic compound extrusion (MATE)-like proteins similar to Vibrio cholerae NorM	NA|112aa|up_1|NZ_CP042434.1_4328454_4328790_-	TIGR03071, couple_hipA, HipA N-terminal domain	NA|69aa|up_0|NZ_CP042434.1_4328783_4328990_-	TIGR03070, couple_hipB, transcriptional regulator, y4mF family	NA|234aa|down_0|NZ_CP042434.1_4329345_4330047_+	pfam02405, MlaE, Permease MlaE	NA|355aa|down_1|NZ_CP042434.1_4330200_4331265_+	TIGR04018, thioredoxin_reductase, putative bacillithiol system oxidoreductase, YpdA family	NA|1132aa|down_2|NZ_CP042434.1_4331863_4335259_-	TIGR03696, tRNA_nuclease_WapA, RHS repeat-associated core domain	NA|158aa|down_3|NZ_CP042434.1_4335435_4335909_-	pfam02371, Transposase_20, Transposase IS116/IS110/IS902 family	NA|145aa|down_4|NZ_CP042434.1_4336117_4336552_-	NA	NA|110aa|down_5|NZ_CP042434.1_4336695_4337025_-	NA	NA|108aa|down_6|NZ_CP042434.1_4337205_4337529_-	pfam15580, Imm53, Immunity protein 53	NA|1438aa|down_7|NZ_CP042434.1_4337494_4341808_-	TIGR03696, tRNA_nuclease_WapA, RHS repeat-associated core domain	NA|434aa|down_8|NZ_CP042434.1_4341923_4343225_-	sd00010, SLR, Sel1-like repeat	NA|1050aa|down_9|NZ_CP042434.1_4343392_4346542_+	NA
GCF_007971385.1_ASM797138v1	NZ_CP042434	Arachidicoccus ginsenosidivorans strain Gsoil 809 chromosome, complete genome	4	5419329-5419665	4,3,4	CRT,CRISPRCasFinder,PILER-CR	no		cas3,PD-DExK,RT,csa3,c2c10_CAS-V-U3,PrimPol,WYL,Cas14u_CAS-V,DEDDh,cas14i,cas6,cas7,cas1,cas2,cas14j	Orphan	CTAACGCGTTCCTCTTTACAATTTTT,TAACGCGTTCCTCTTTACAATTTTT,CTAACGCGTTCCTCTTTACAATTTTT	26,25,26	0	0	NA	NA	NA:NA:NA	3,4,2	4	Orphan	cas3,PD-DExK,RT,csa3,c2c10_CAS-V-U3,PrimPol,WYL,Cas14u_CAS-V,DEDDh,cas14i,cas6,cas7,cas1,cas2,cas14j	NA|365aa|up_9|NZ_CP042434.1_5410506_5411601_-,NA|93aa|up_8|NZ_CP042434.1_5412422_5412701_-,NA|91aa|up_6|NZ_CP042434.1_5413239_5413512_-,NA|89aa|up_5|NZ_CP042434.1_5413730_5413997_-,NA|264aa|down_2|NZ_CP042434.1_5424595_5425387_-,NA|154aa|down_6|NZ_CP042434.1_5427026_5427488_-	NA|365aa|up_9|NZ_CP042434.1_5410506_5411601_-	NA	NA|93aa|up_8|NZ_CP042434.1_5412422_5412701_-	NA	NA|163aa|up_7|NZ_CP042434.1_5412733_5413222_-	pfam14054, DUF4249, Domain of unknown function (DUF4249)	NA|91aa|up_6|NZ_CP042434.1_5413239_5413512_-	NA	NA|89aa|up_5|NZ_CP042434.1_5413730_5413997_-	NA	NA|354aa|up_4|NZ_CP042434.1_5414016_5415078_-	COG5421, COG5421, Transposase [DNA replication, recombination, and repair]	NA|277aa|up_3|NZ_CP042434.1_5416109_5416940_-	PRK09183, PRK09183, transposase/IS protein; Provisional	NA|480aa|up_2|NZ_CP042434.1_5416932_5418372_-	COG4584, COG4584, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|217aa|up_1|NZ_CP042434.1_5418361_5419012_-	TIGR04285, parB-like_partition_protein, nucleoid occlusion protein	NA|84aa|up_0|NZ_CP042434.1_5419027_5419279_-	smart00470, ParB, ParB-like nuclease domain	NA|299aa|down_0|NZ_CP042434.1_5421055_5421952_-	cd05242, SDR_a8, atypical (a) SDRs, subgroup 8	NA|271aa|down_1|NZ_CP042434.1_5422495_5423308_-	cd05266, SDR_a4, atypical (a) SDRs, subgroup 4	NA|264aa|down_2|NZ_CP042434.1_5424595_5425387_-	NA	NA|239aa|down_3|NZ_CP042434.1_5425383_5426100_-	TIGR03462, Bifunctional_lycopene_cyclase/phytoene_synthase, lycopene cyclase domain	NA|153aa|down_4|NZ_CP042434.1_5426096_5426555_-	PLN02601, PLN02601, beta-carotene hydroxylase	NA|158aa|down_5|NZ_CP042434.1_5426551_5427025_-	cd07820, SRPBCC_3, Ligand-binding SRPBCC domain of an uncharacterized subfamily of proteins	NA|154aa|down_6|NZ_CP042434.1_5427026_5427488_-	NA	NA|279aa|down_7|NZ_CP042434.1_5427484_5428321_-	cd00683, Trans_IPPS_HH, Trans-Isoprenyl Diphosphate Synthases, head-to-head	NA|498aa|down_8|NZ_CP042434.1_5428304_5429798_-	TIGR02734, Phytoene_desaturase_lycopene-forming, phytoene desaturase	NA|227aa|down_9|NZ_CP042434.1_5429924_5430605_-	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein
