assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCA_002863805.1_ASM286380v1	CP020026	Rhodocyclaceae bacterium strain Thauera-like chromosome, complete genome	1	377963-378494	1,1,1	CRISPRCasFinder,CRT,PILER-CR	no		cas3,csa3,DEDDh,DinG,csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1,WYL,cas8e,cse2gr11,cas7,cas5,cas6e	Orphan	GTCTTAATCCCTTTGAAATCAGGGCAACTGCTTGGAC,GTCTTAATCCCTTTGAAATCAGGGCAACTGCTTGGAC,GTCTTAATCCCTTTGAAATCAGGGCAACTGCTTGGAC	37,37,37	0	0	NA	NA	NA:NA:NA	7,7,6	7	Orphan	cas3,csa3,DEDDh,DinG,csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1,WYL,cas8e,cse2gr11,cas7,cas5,cas6e	NA|75aa|up_5|CP020026.1_372711_372936_+,NA|116aa|up_3|CP020026.1_374221_374569_-,NA|261aa|down_8|CP020026.1_386610_387393_-	NA|278aa|up_9|CP020026.1_369578_370412_+	PRK00450, dapF, diaminopimelate epimerase; Provisional	NA|217aa|up_8|CP020026.1_370470_371121_+	COG3159, COG3159, Uncharacterized protein conserved in bacteria [Function unknown]	NA|295aa|up_7|CP020026.1_371159_372044_+	PRK00236, xerC, site-specific tyrosine recombinase XerC; Reviewed	NA|157aa|up_6|CP020026.1_372231_372702_+	smart00419, HTH_CRP, helix_turn_helix, cAMP Regulatory protein	NA|75aa|up_5|CP020026.1_372711_372936_+	NA	NA|397aa|up_4|CP020026.1_373007_374198_+	PRK15128, PRK15128, 23S rRNA (cytosine(1962)-C(5))-methyltransferase RlmI	NA|116aa|up_3|CP020026.1_374221_374569_-	NA	NA|353aa|up_2|CP020026.1_374630_375689_-	PRK00080, ruvB, Holliday junction branch migration DNA helicase RuvB	NA|332aa|up_1|CP020026.1_375797_376793_-	pfam07589, VPEP, PEP-CTERM motif	NA|347aa|up_0|CP020026.1_376886_377927_-	pfam13358, DDE_3, DDE superfamily endonuclease	NA|378aa|down_0|CP020026.1_378632_379766_+	pfam13808, DDE_Tnp_1_assoc, DDE_Tnp_1-associated	NA|202aa|down_1|CP020026.1_381159_381765_-	PRK00116, ruvA, Holliday junction branch migration protein RuvA	NA|329aa|down_2|CP020026.1_381801_382788_-	cd13962, PT_UbiA_UBIAD1, 1,4-Dihydroxy-2-naphthoate octaprenyltransferase	NA|485aa|down_3|CP020026.1_382784_384239_-	PRK11712, PRK11712, ribonuclease G; Provisional	NA|208aa|down_4|CP020026.1_384375_384999_-	PRK00032, PRK00032, septum formation inhibitor Maf	NA|157aa|down_5|CP020026.1_385104_385575_-	PRK00103, PRK00103, rRNA large subunit methyltransferase; Provisional	NA|122aa|down_6|CP020026.1_385581_385947_-	TIGR00090, rsfS_iojap_ybeB, ribosome silencing factor RsfS/YbeB/iojap	NA|226aa|down_7|CP020026.1_385946_386624_-	PRK00071, nadD, nicotinate-nucleotide adenylyltransferase	NA|261aa|down_8|CP020026.1_386610_387393_-	NA	NA|258aa|down_9|CP020026.1_387403_388177_-	COG5473, COG5473, Predicted integral membrane protein [Function unknown]
GCA_002863805.1_ASM286380v1	CP020026	Rhodocyclaceae bacterium strain Thauera-like chromosome, complete genome	2	379808-380968	2,2,2	PILER-CR,CRISPRCasFinder,CRT	no		cas3,csa3,DEDDh,DinG,csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1,WYL,cas8e,cse2gr11,cas7,cas5,cas6e	Orphan	GTCTTAATCCCTTTGAAATCAGGGCAACTGCTTGGAC,GTCTTAATCCCTTTGAAATCAGGGCAACTGCTTGGAC,GTCTTAATCCCTTTGAAATCAGGGCAACTGCTTGGAC	37,37,37	0	0	NA	NA	NA:NA:NA	16,16,16	16	Orphan	cas3,csa3,DEDDh,DinG,csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1,WYL,cas8e,cse2gr11,cas7,cas5,cas6e	NA|75aa|up_6|CP020026.1_372711_372936_+,NA|116aa|up_4|CP020026.1_374221_374569_-,NA|261aa|down_7|CP020026.1_386610_387393_-	NA|217aa|up_9|CP020026.1_370470_371121_+	COG3159, COG3159, Uncharacterized protein conserved in bacteria [Function unknown]	NA|295aa|up_8|CP020026.1_371159_372044_+	PRK00236, xerC, site-specific tyrosine recombinase XerC; Reviewed	NA|157aa|up_7|CP020026.1_372231_372702_+	smart00419, HTH_CRP, helix_turn_helix, cAMP Regulatory protein	NA|75aa|up_6|CP020026.1_372711_372936_+	NA	NA|397aa|up_5|CP020026.1_373007_374198_+	PRK15128, PRK15128, 23S rRNA (cytosine(1962)-C(5))-methyltransferase RlmI	NA|116aa|up_4|CP020026.1_374221_374569_-	NA	NA|353aa|up_3|CP020026.1_374630_375689_-	PRK00080, ruvB, Holliday junction branch migration DNA helicase RuvB	NA|332aa|up_2|CP020026.1_375797_376793_-	pfam07589, VPEP, PEP-CTERM motif	NA|347aa|up_1|CP020026.1_376886_377927_-	pfam13358, DDE_3, DDE superfamily endonuclease	NA|378aa|up_0|CP020026.1_378632_379766_+	pfam13808, DDE_Tnp_1_assoc, DDE_Tnp_1-associated	NA|202aa|down_0|CP020026.1_381159_381765_-	PRK00116, ruvA, Holliday junction branch migration protein RuvA	NA|329aa|down_1|CP020026.1_381801_382788_-	cd13962, PT_UbiA_UBIAD1, 1,4-Dihydroxy-2-naphthoate octaprenyltransferase	NA|485aa|down_2|CP020026.1_382784_384239_-	PRK11712, PRK11712, ribonuclease G; Provisional	NA|208aa|down_3|CP020026.1_384375_384999_-	PRK00032, PRK00032, septum formation inhibitor Maf	NA|157aa|down_4|CP020026.1_385104_385575_-	PRK00103, PRK00103, rRNA large subunit methyltransferase; Provisional	NA|122aa|down_5|CP020026.1_385581_385947_-	TIGR00090, rsfS_iojap_ybeB, ribosome silencing factor RsfS/YbeB/iojap	NA|226aa|down_6|CP020026.1_385946_386624_-	PRK00071, nadD, nicotinate-nucleotide adenylyltransferase	NA|261aa|down_7|CP020026.1_386610_387393_-	NA	NA|258aa|down_8|CP020026.1_387403_388177_-	COG5473, COG5473, Predicted integral membrane protein [Function unknown]	NA|317aa|down_9|CP020026.1_388173_389124_-	PRK05231, PRK05231, homoserine kinase; Provisional
GCA_002863805.1_ASM286380v1	CP020026	Rhodocyclaceae bacterium strain Thauera-like chromosome, complete genome	3	975505-975578	3	CRISPRCasFinder	no		cas3,csa3,DEDDh,DinG,csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1,WYL,cas8e,cse2gr11,cas7,cas5,cas6e	Orphan	AATCGTTACCAAACCGTAACCGA	23	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,DEDDh,DinG,csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1,WYL,cas8e,cse2gr11,cas7,cas5,cas6e	NA,NA|159aa|down_9|CP020026.1_987049_987526_+	NA|581aa|up_9|CP020026.1_962350_964093_+	COG0581, PstA, ABC-type phosphate transport system, permease component [Inorganic ion transport and metabolism]	NA|277aa|up_8|CP020026.1_964112_964943_+	PRK14236, PRK14236, phosphate transporter ATP-binding protein; Provisional	NA|451aa|up_7|CP020026.1_964983_966336_-	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|493aa|up_6|CP020026.1_966292_967771_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|293aa|up_5|CP020026.1_967767_968646_-	cd13571, PBP2_PnhD_1, Substrate binding domain of uncharacterized ABC-type phosphonate-like transporter; contains the type 2 periplasmic binding fold	NA|320aa|up_4|CP020026.1_968721_969681_-	COG3381, TorD, Uncharacterized component of anaerobic dehydrogenases [General function prediction only]	NA|431aa|up_3|CP020026.1_969589_970882_-	COG5557, COG5557, Polysulphide reductase [Energy production and conversion]	NA|250aa|up_2|CP020026.1_970894_971644_-	cd10551, PsrB, polysulfide reductase beta (PsrB) subunit	NA|846aa|up_1|CP020026.1_971674_974212_-	cd02757, MopB_Arsenate-R, This CD includes the respiratory arsenate reductase, As(V), catalytic subunit (ArrA) and other related proteins	NA|269aa|up_0|CP020026.1_974204_975011_-	cd10549, MtMvhB_like, Uncharacterized polyferredoxin-like protein	NA|494aa|down_0|CP020026.1_976426_977908_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|442aa|down_1|CP020026.1_977886_979212_+	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|237aa|down_2|CP020026.1_979635_980346_+	cd10551, PsrB, polysulfide reductase beta (PsrB) subunit	NA|286aa|down_3|CP020026.1_980356_981214_+	pfam03916, NrfD, Polysulphide reductase, NrfD	NA|880aa|down_4|CP020026.1_981237_983877_+	cd02757, MopB_Arsenate-R, This CD includes the respiratory arsenate reductase, As(V), catalytic subunit (ArrA) and other related proteins	NA|347aa|down_5|CP020026.1_984013_985054_+	pfam13358, DDE_3, DDE superfamily endonuclease	NA|280aa|down_6|CP020026.1_985066_985906_+	pfam02613, Nitrate_red_del, Nitrate reductase delta subunit	NA|150aa|down_7|CP020026.1_985920_986370_+	pfam03745, DUF309, Domain of unknown function (DUF309)	NA|229aa|down_8|CP020026.1_986366_987053_+	pfam00977, His_biosynth, Histidine biosynthesis protein	NA|159aa|down_9|CP020026.1_987049_987526_+	NA
GCA_002863805.1_ASM286380v1	CP020026	Rhodocyclaceae bacterium strain Thauera-like chromosome, complete genome	4	1867363-1870074	3,4,3	PILER-CR,CRISPRCasFinder,CRT	no	csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1	cas3,csa3,DEDDh,DinG,csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1,WYL,cas8e,cse2gr11,cas7,cas5,cas6e	Type III-A,Type III-B,Type III-C,Type III-D	GTCTTAATCCCTTTGAAATCAGGGCAACCGCTTGGAC,GTCCAAGCGGTTGCCCTGATTTCAAAGGGATTAAGAC,GTCCAAGCGGTTGCCCTGATTTCAAAGGGATTAAGAC	37,37,37	0	0	NA	NA	NA:NA:NA	38,38,38	38	TypeIII-A,TypeIII-B,TypeIII-C,TypeIII-D	cas3,csa3,DEDDh,DinG,csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1,WYL,cas8e,cse2gr11,cas7,cas5,cas6e	NA,NA|149aa|down_0|CP020026.1_1870152_1870599_+,NA|64aa|down_1|CP020026.1_1870600_1870792_-	cmr4gr7|314aa|up_9|CP020026.1_1859667_1860609_+	TIGR02580, putative_CRISPR-associated_protein, CRISPR type III-B/RAMP module RAMP protein Cmr4	cmr5gr11|136aa|up_8|CP020026.1_1860623_1861031_+	pfam09701, Cas_Cmr5, CRISPR-associated protein (Cas_Cmr5)	cmr6gr7|404aa|up_7|CP020026.1_1861041_1862253_+	TIGR01898, repair_system, CRISPR type III-B/RAMP module RAMP protein Cmr6	csx16|99aa|up_6|CP020026.1_1862249_1862546_+	pfam09652, Cas_VVA1548, Putative CRISPR-associated protein (Cas_VVA1548)	csx1|393aa|up_5|CP020026.1_1862568_1863747_+	TIGR02221, CRISPR-associated_protein_Csx1_2, CRISPR-associated protein, TM1812 family	cas6|361aa|up_4|CP020026.1_1863637_1864720_+	pfam10040, CRISPR_Cas6, CRISPR-associated endoribonuclease Cas6	cas2|95aa|up_3|CP020026.1_1864806_1865091_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|331aa|up_2|CP020026.1_1865095_1866088_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	NA|269aa|up_1|CP020026.1_1866090_1866897_+	cd09634, Cas1_I-II-III, CRISPR/Cas system-associated protein Cas1	cas2|116aa|up_0|CP020026.1_1866887_1867235_+	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|149aa|down_0|CP020026.1_1870152_1870599_+	NA	NA|64aa|down_1|CP020026.1_1870600_1870792_-	NA	NA|162aa|down_2|CP020026.1_1871010_1871496_-	PRK07994, PRK07994, DNA polymerase III subunits gamma and tau; Validated	NA|1039aa|down_3|CP020026.1_1871495_1874612_-	COG0841, AcrB, Cation/multidrug efflux pump [Defense mechanisms]	NA|355aa|down_4|CP020026.1_1874627_1875692_-	TIGR01730, COG0845:_Membrane-fusion_protein, RND family efflux transporter, MFP subunit	NA|349aa|down_5|CP020026.1_1875825_1876872_-	PRK05385, PRK05385, phosphoribosylaminoimidazole synthetase; Provisional	NA|368aa|down_6|CP020026.1_1877019_1878123_+	COG0628, yhhT, Predicted permease, member of the PurR regulon [General function prediction only]	NA|224aa|down_7|CP020026.1_1878119_1878791_+	PRK08903, PRK08903, DnaA regulatory inactivator Hda; Validated	NA|223aa|down_8|CP020026.1_1878848_1879517_+	cd02612, HAD_PGPPase, phosphatidylglycerol-phosphate phosphatase, similar to Escherichia coli K-12 phosphatidylglycerol-phosphate phosphatase C	NA|334aa|down_9|CP020026.1_1879599_1880601_-	COG1858, MauG, Cytochrome c peroxidase [Inorganic ion transport and metabolism]
GCA_002863805.1_ASM286380v1	CP020026	Rhodocyclaceae bacterium strain Thauera-like chromosome, complete genome	5	3093715-3096440	4,5,4,5	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	cas3,csa3,DEDDh,DinG,csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1,WYL,cas8e,cse2gr11,cas7,cas5,cas6e	Type I-E	GTGTTCCCCACGCCCGTGGGGATGAACCG,GTGTTCCCCACGCCCGTGGGGATGAACCG,GTGTTCCCCACGCCCGTGGGGATGAACCG,GTGTTCCCCACGCCCGTGGGGATGAACC	29,29,29,28	0	0	NA	NA	I-E:I-E:I-E:I-E	33,44,44,33	44	TypeI-E	cas3,csa3,DEDDh,DinG,csx1,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx16,cas6,cas2,cas1,WYL,cas8e,cse2gr11,cas7,cas5,cas6e	NA,NA|132aa|down_0|CP020026.1_3096518_3096914_+,NA|130aa|down_1|CP020026.1_3096986_3097376_+	NA|380aa|up_9|CP020026.1_3083640_3084780_+	cd17324, MFS_NepI_like, Purine ribonucleoside efflux pump NepI and similar transporters of the Major Facilitator Superfamily	cas3|860aa|up_8|CP020026.1_3085030_3087610_+	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	cas8e|519aa|up_7|CP020026.1_3087623_3089180_+	cd09729, Cse1_I-E, CRISPR/Cas system-associated protein Cse1	cse2gr11|182aa|up_6|CP020026.1_3089176_3089722_+	PRK13921, PRK13921, CRISPR-associated Cse2 family protein; Provisional	cas7|386aa|up_5|CP020026.1_3089718_3090876_+	pfam09344, Cas_CT1975, CT1975-like protein	cas5|223aa|up_4|CP020026.1_3090879_3091548_+	pfam09704, Cas_Cas5d, CRISPR-associated protein (Cas_Cas5)	cas6e|211aa|up_3|CP020026.1_3091522_3092155_+	pfam08798, CRISPR_assoc, CRISPR associated protein	NA|82aa|up_2|CP020026.1_3092174_3092420_+	COG2405, COG2405, Predicted nucleic acid-binding protein, contains PIN domain [General function prediction only]	cas1|309aa|up_1|CP020026.1_3092422_3093349_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|99aa|up_0|CP020026.1_3093329_3093626_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|132aa|down_0|CP020026.1_3096518_3096914_+	NA	NA|130aa|down_1|CP020026.1_3096986_3097376_+	NA	NA|138aa|down_2|CP020026.1_3097759_3098173_-	cd18738, PIN_VapC4-5_FitB-like, uncharacterized subgroup of the PIN_VapC4-5_FitB-like subfamily of the PIN domain superfamily	NA|89aa|down_3|CP020026.1_3098166_3098433_-	pfam02604, PhdYeFM_antitox, Antitoxin Phd_YefM, type II toxin-antitoxin system	NA|1230aa|down_4|CP020026.1_3098901_3102591_-	PRK09490, metH, B12-dependent methionine synthase; Provisional	NA|214aa|down_5|CP020026.1_3102821_3103463_-	pfam04355, SmpA_OmlA, SmpA / OmlA family	NA|257aa|down_6|CP020026.1_3103717_3104488_+	COG0411, LivG, ABC-type branched-chain amino acid transport systems, ATPase component [Amino acid transport and metabolism]	NA|244aa|down_7|CP020026.1_3104477_3105209_+	COG0410, LivF, ABC-type branched-chain amino acid transport systems, ATPase component [Amino acid transport and metabolism]	NA|410aa|down_8|CP020026.1_3105228_3106458_-	cd17320, MFS_MdfA_MDR_like, Multidrug transporter MdfA and similar multidrug resistance (MDR) transporters of the Major Facilitator Superfamily	NA|500aa|down_9|CP020026.1_3106576_3108076_-	COG0606, COG0606, Predicted ATPase with chaperone activity [Posttranslational modification, protein turnover, chaperones]
