assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000012865.1_ASM1286v1	NC_007503	Carboxydothermus hydrogenoformans Z-2901, complete sequence	1	187603-187704	1	CRISPRCasFinder	no	cas3	cas3,Cas14b_CAS-V-F,Cas14u_CAS-V,csa3,DEDDh,csm6,csx1,WYL,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,cas4,cas5,cas7,cas8b1,cas3HD	Unclear	GAACATTTAAATTTAAAATTCCTTATCTAGATGAAG	36	0	0	NA	NA	NA	1	1	Unclear	cas3,Cas14b_CAS-V-F,Cas14u_CAS-V,csa3,DEDDh,csm6,csx1,WYL,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,cas4,cas5,cas7,cas8b1,cas3HD	NA,NA|98aa|down_3|NC_007503.1_193695_193989_+,NA|208aa|down_4|NC_007503.1_194082_194706_+	NA|78aa|up_9|NC_007503.1_174744_174978_+	pfam08281, Sigma70_r4_2, Sigma-70, region 4	NA|108aa|up_8|NC_007503.1_174977_175301_+	pfam04977, DivIC, Septum formation initiator	NA|296aa|up_7|NC_007503.1_175284_176172_+	COG0248, GppA, Exopolyphosphatase [Nucleotide transport and metabolism / Inorganic ion transport and metabolism]	NA|800aa|up_6|NC_007503.1_176241_178641_+	TIGR02865, Stage_II_sporulation_protein_E, stage II sporulation protein E	NA|447aa|up_5|NC_007503.1_178630_179971_+	cd01992, PP-ATPase, N-terminal domain of predicted ATPase of the PP-loop faimly implicated in cell cycle control [Cell division and chromosome partitioning]	NA|620aa|up_4|NC_007503.1_180028_181888_+	TIGR01241, ATP-dependent_zinc_metalloprotease_FtsH, ATP-dependent metalloprotease FtsH	NA|150aa|up_3|NC_007503.1_181953_182403_+	PRK00668, ndk, mulitfunctional nucleoside diphosphate kinase/apyrimidinic endonuclease/3'-; Validated	NA|369aa|up_2|NC_007503.1_182542_183649_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|367aa|up_1|NC_007503.1_183775_184876_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|843aa|up_0|NC_007503.1_184902_187431_-	pfam09699, Paired_CXXCH_1, Doubled CXXCH motif (Paired_CXXCH_1)	NA|451aa|down_0|NC_007503.1_190371_191724_+	TIGR03153, cytochr_NrfH, cytochrome c nitrite reductase, small subunit	NA|219aa|down_1|NC_007503.1_191740_192397_+	sd00006, TPR, Tetratricopeptide repeat	NA|336aa|down_2|NC_007503.1_192409_193417_+	cd14963, NHL_like_5, Uncharacterized NHL-repeat domain in bacterial proteins	NA|98aa|down_3|NC_007503.1_193695_193989_+	NA	NA|208aa|down_4|NC_007503.1_194082_194706_+	NA	NA|236aa|down_5|NC_007503.1_194784_195492_-	pfam13649, Methyltransf_25, Methyltransferase domain	NA|325aa|down_6|NC_007503.1_195505_196480_-	TIGR02163, Ferredoxin-type_protein_NapH_homolog, ferredoxin-type protein, NapH/MauN family	cas3|431aa|down_7|NC_007503.1_196710_198003_+	COG0513, SrmB, Superfamily II DNA and RNA helicases [DNA replication, recombination, and repair / Transcription / Translation, ribosomal structure and biogenesis]	NA|172aa|down_8|NC_007503.1_198205_198721_+	pfam09515, Thia_YuaJ, Thiamine transporter protein (Thia_YuaJ)	NA|204aa|down_9|NC_007503.1_198721_199333_+	cd07995, TPK, Thiamine pyrophosphokinase
GCF_000012865.1_ASM1286v1	NC_007503	Carboxydothermus hydrogenoformans Z-2901, complete sequence	2	1402684-1402782	2	CRISPRCasFinder	no		cas3,Cas14b_CAS-V-F,Cas14u_CAS-V,csa3,DEDDh,csm6,csx1,WYL,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,cas4,cas5,cas7,cas8b1,cas3HD	Orphan	GAGGGGTTTACTTTAAATATACCTCCGTTGC	31	0	0	NA	NA	NA	1	1	Orphan	cas3,Cas14b_CAS-V-F,Cas14u_CAS-V,csa3,DEDDh,csm6,csx1,WYL,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,cas4,cas5,cas7,cas8b1,cas3HD	NA|51aa|up_8|NC_007503.1_1388128_1388281_-,NA	NA|458aa|up_9|NC_007503.1_1386648_1388022_-	PRK09613, thiH, thiamine biosynthesis protein ThiH; Reviewed	NA|51aa|up_8|NC_007503.1_1388128_1388281_-	NA	NA|229aa|up_7|NC_007503.1_1388446_1389133_-	PRK00507, PRK00507, deoxyribose-phosphate aldolase; Provisional	NA|133aa|up_6|NC_007503.1_1389132_1389531_-	COG0295, Cdd, Cytidine deaminase [Nucleotide transport and metabolism]	NA|443aa|up_5|NC_007503.1_1389523_1390852_-	PRK06078, PRK06078, pyrimidine-nucleoside phosphorylase; Reviewed	NA|211aa|up_4|NC_007503.1_1390861_1391494_-	pfam00596, Aldolase_II, Class II Aldolase and Adducin N-terminal domain	NA|344aa|up_3|NC_007503.1_1391495_1392527_-	PRK05720, mtnA, methylthioribose-1-phosphate isomerase; Reviewed	NA|200aa|up_2|NC_007503.1_1398202_1398802_-	TIGR02832, conserved_hypothetical_protein, sporulation protein YunB	NA|412aa|up_1|NC_007503.1_1398891_1400127_-	PRK05912, PRK05912, tyrosyl-tRNA synthetase; Validated	NA|806aa|up_0|NC_007503.1_1400265_1402683_+	TIGR02074, Includes:_Penicillin-insensitive_transglycosylase, penicillin-binding protein, 1A family	NA|830aa|down_0|NC_007503.1_1405095_1407585_-	COG0826, COG0826, Collagenase and related proteases [Posttranslational modification, protein turnover, chaperones]	NA|317aa|down_1|NC_007503.1_1407630_1408581_-	pfam01784, NIF3, NIF3 (NGG1p interacting factor 3)	NA|192aa|down_2|NC_007503.1_1408596_1409172_-	cd00540, AAG, Alkyladenine DNA glycosylase catalyzes the first step in base excision repair	NA|551aa|down_3|NC_007503.1_1409221_1410874_-	cd07436, PHP_PolX, Polymerase and Histidinol Phosphatase domain of bacterial polymerase X	NA|85aa|down_4|NC_007503.1_1410870_1411125_-	pfam05164, ZapA, Cell division protein ZapA	NA|799aa|down_5|NC_007503.1_1411187_1413584_-	PRK00629, pheT, phenylalanyl-tRNA synthetase subunit beta; Reviewed	NA|341aa|down_6|NC_007503.1_1413597_1414620_-	PRK00488, pheS, phenylalanyl-tRNA synthetase subunit alpha; Validated	NA|259aa|down_7|NC_007503.1_1415037_1415814_-	COG0566, SpoU, rRNA methylases [Translation, ribosomal structure and biogenesis]	NA|221aa|down_8|NC_007503.1_1415806_1416469_-	COG0569, TrkA, K+ transport systems, NAD-binding component [Inorganic ion transport and metabolism]	NA|450aa|down_9|NC_007503.1_1416481_1417831_-	TIGR00933, Trk_system_potassium_uptake_protein_trkH
GCF_000012865.1_ASM1286v1	NC_007503	Carboxydothermus hydrogenoformans Z-2901, complete sequence	3	1926257-1930135	3,1,1	CRISPRCasFinder,CRT,PILER-CR	no	WYL,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,cas4,cas3,cas5,cas7,cas8b1	cas3,Cas14b_CAS-V-F,Cas14u_CAS-V,csa3,DEDDh,csm6,csx1,WYL,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,cas4,cas5,cas7,cas8b1,cas3HD	Type III-A,Type III-B,Type I-B,Type III-D,Type III-C	GTTTCAATCCCAGAATGGTTCGATTAAAAC,GTTTCAATCCCAGAATGGTTCGATTAAAAC,CAATCCCAGAATGGTTCGATTAAAAC	30,30,26	0	0	NA	NA	I-A,II-B,III-A:I-A,II-B,III-A:I-A,II-B,III-A	58,58,58	58	TypeIII-A,TypeIII-B,TypeI-B,TypeIII-D,TypeIII-C	cas3,Cas14b_CAS-V-F,Cas14u_CAS-V,csa3,DEDDh,csm6,csx1,WYL,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,cas4,cas5,cas7,cas8b1,cas3HD	NA|101aa|up_2|NC_007503.1_1924077_1924380_-,NA|82aa|up_1|NC_007503.1_1924876_1925122_-,NA|107aa|down_8|NC_007503.1_1939511_1939832_+	NA|156aa|up_9|NC_007503.1_1916281_1916749_-	cd12208, septicolysin_like, putative septicolysin, cholesterol-dependent cytolysin family and related proteins	cas6|249aa|up_8|NC_007503.1_1917739_1918486_-	cd09759, Cas6_I-A, CRISPR/Cas system-associated RAMP superfamily protein Cas6	csm5gr7|367aa|up_7|NC_007503.1_1918546_1919647_-	cd09662, Csm5_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm5	csm4gr5|319aa|up_6|NC_007503.1_1919647_1920604_-	TIGR01903, Hypothetical_protein	csm3gr7|267aa|up_5|NC_007503.1_1920617_1921418_-	cd09684, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	csm2gr11|145aa|up_4|NC_007503.1_1921430_1921865_-	pfam03750, Csm2_III-A, Csm2 Type III-A	cas10|739aa|up_3|NC_007503.1_1921864_1924081_-	cd09680, Cas10_III, CRISPR/Cas system-associated protein Cas10	NA|101aa|up_2|NC_007503.1_1924077_1924380_-	NA	NA|82aa|up_1|NC_007503.1_1924876_1925122_-	NA	NA|70aa|up_0|NC_007503.1_1925143_1925353_-	pfam16277, DUF4926, Domain of unknown function (DUF4926)	cas2|88aa|down_0|NC_007503.1_1930462_1930726_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|331aa|down_1|NC_007503.1_1930727_1931720_-	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas4|167aa|down_2|NC_007503.1_1931730_1932231_-	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas3|815aa|down_3|NC_007503.1_1932315_1934760_-	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|249aa|down_4|NC_007503.1_1934759_1935506_-	cd09692, Cas5_I-B, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|314aa|down_5|NC_007503.1_1935522_1936464_-	pfam05107, Cas_Cas7, CRISPR-associated protein Cas7	cas8b1|647aa|down_6|NC_007503.1_1936464_1938405_-	cd09730, Cas8a1_I-A, CRISPR/Cas system-associated protein Cas8a1	cas6|249aa|down_7|NC_007503.1_1938476_1939223_-	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	NA|107aa|down_8|NC_007503.1_1939511_1939832_+	NA	NA|412aa|down_9|NC_007503.1_1940457_1941693_-	COG1222, RPT1, ATP-dependent 26S proteasome regulatory subunit [Posttranslational modification, protein turnover, chaperones]
GCF_000012865.1_ASM1286v1	NC_007503	Carboxydothermus hydrogenoformans Z-2901, complete sequence	4	1944006-1949572	2,4,2,3	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas4,cas3,cas5,cas7,cas8b1,cas6	cas3,Cas14b_CAS-V-F,Cas14u_CAS-V,csa3,DEDDh,csm6,csx1,WYL,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,cas4,cas5,cas7,cas8b1,cas3HD	Type I-B	GTTTCAATCCCAGATTGGTTCGATTAAAAC,GTTTCAATCCCAGATTGGTTCGATTAAAAC,NNGTTTCAATCCCAGATTGGTTCGATTAAAAC,GTTTCAATCCCAGATTGGTTCGATTAAAAC	30,30,32,30	0	0	NA	NA	I-A,II-B,III-A:I-A,II-B,III-A:I-A,II-B,III-A:I-A,II-B,III-A	80,83,83,80	83	TypeI-B	cas3,Cas14b_CAS-V-F,Cas14u_CAS-V,csa3,DEDDh,csm6,csx1,WYL,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,cas4,cas5,cas7,cas8b1,cas3HD	NA|107aa|up_4|NC_007503.1_1939511_1939832_+,NA|51aa|up_0|NC_007503.1_1943720_1943873_-,NA|58aa|down_2|NC_007503.1_1953506_1953680_-,NA|162aa|down_3|NC_007503.1_1953751_1954237_-,NA|143aa|down_4|NC_007503.1_1954276_1954705_-,NA|62aa|down_5|NC_007503.1_1955103_1955289_+,NA|86aa|down_6|NC_007503.1_1955291_1955549_+,NA|63aa|down_7|NC_007503.1_1955700_1955889_+,NA|260aa|down_8|NC_007503.1_1956096_1956876_-	cas3|815aa|up_9|NC_007503.1_1932315_1934760_-	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|249aa|up_8|NC_007503.1_1934759_1935506_-	cd09692, Cas5_I-B, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|314aa|up_7|NC_007503.1_1935522_1936464_-	pfam05107, Cas_Cas7, CRISPR-associated protein Cas7	cas8b1|647aa|up_6|NC_007503.1_1936464_1938405_-	cd09730, Cas8a1_I-A, CRISPR/Cas system-associated protein Cas8a1	cas6|249aa|up_5|NC_007503.1_1938476_1939223_-	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	NA|107aa|up_4|NC_007503.1_1939511_1939832_+	NA	NA|412aa|up_3|NC_007503.1_1940457_1941693_-	COG1222, RPT1, ATP-dependent 26S proteasome regulatory subunit [Posttranslational modification, protein turnover, chaperones]	NA|186aa|up_2|NC_007503.1_1941750_1942308_-	smart00318, SNc, Staphylococcal nuclease homologues	NA|291aa|up_1|NC_007503.1_1942571_1943444_-	pfam01610, DDE_Tnp_ISL3, Transposase	NA|51aa|up_0|NC_007503.1_1943720_1943873_-	NA	NA|357aa|down_0|NC_007503.1_1949952_1951023_-	pfam09992, NAGPA, Phosphodiester glycosidase	NA|625aa|down_1|NC_007503.1_1951128_1953003_-	TIGR02552, Low_calcium_response_locus_protein_H, type III secretion low calcium response chaperone LcrH/SycD	NA|58aa|down_2|NC_007503.1_1953506_1953680_-	NA	NA|162aa|down_3|NC_007503.1_1953751_1954237_-	NA	NA|143aa|down_4|NC_007503.1_1954276_1954705_-	NA	NA|62aa|down_5|NC_007503.1_1955103_1955289_+	NA	NA|86aa|down_6|NC_007503.1_1955291_1955549_+	NA	NA|63aa|down_7|NC_007503.1_1955700_1955889_+	NA	NA|260aa|down_8|NC_007503.1_1956096_1956876_-	NA	NA|231aa|down_9|NC_007503.1_1956954_1957647_-	pfam06940, DUF1287, Domain of unknown function (DUF1287)
