assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000020965.1_ASM2096v1	NC_011297	Dictyoglomus thermophilum H-6-12, complete sequence	1	46252-50335	1,1,1	CRISPRCasFinder,CRT,PILER-CR	no		cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6,WYL,cas8b1,csx3,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csx1,csa3	Orphan	GTTTGTAGCGTGCCTATAAGGGATTGAAAC,GTTTGTAGCGTGCCTATAAGGGATTGAAAC,GTTTGTAGCGTGCCTATAAGGGATTGAAAC	30,30,30	0	0	NA	NA	NA:NA:NA	61,61,59	61	Orphan	cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6,WYL,cas8b1,csx3,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csx1,csa3	NA|51aa|up_9|NC_011297.1_33814_33967_+,NA|278aa|up_7|NC_011297.1_35785_36619_-,NA|403aa|up_6|NC_011297.1_36741_37950_+,NA|169aa|down_8|NC_011297.1_61827_62334_+	NA|51aa|up_9|NC_011297.1_33814_33967_+	NA	NA|523aa|up_8|NC_011297.1_34161_35730_+	cd02808, GltS_FMN, Glutamate synthase (GltS) FMN-binding domain	NA|278aa|up_7|NC_011297.1_35785_36619_-	NA	NA|403aa|up_6|NC_011297.1_36741_37950_+	NA	NA|310aa|up_5|NC_011297.1_37946_38876_+	COG0530, ECM27, Ca2+/Na+ antiporter [Inorganic ion transport and metabolism]	NA|567aa|up_4|NC_011297.1_38920_40621_-	cd13582, PBP2_AlgQ_like_3, Periplasmic-binding component of alginate-specific ABC uptake system-like; contains the type 2 periplasmic binding fold	NA|297aa|up_3|NC_011297.1_40718_41609_-	COG0395, UgpE, ABC-type sugar transport system, permease component [Carbohydrate transport and metabolism]	NA|305aa|up_2|NC_011297.1_41619_42534_-	COG4209, LplB, ABC-type polysaccharide transport system, permease component [Carbohydrate transport and metabolism]	NA|579aa|up_1|NC_011297.1_42684_44421_+	COG2972, COG2972, Predicted signal transduction protein with a C-terminal ATPase domain [Signal transduction mechanisms]	NA|497aa|up_0|NC_011297.1_44410_45901_+	COG4753, COG4753, Response regulator containing CheY-like receiver domain and AraC-type DNA-binding domain [Signal transduction mechanisms]	NA|465aa|down_0|NC_011297.1_50411_51806_-	smart00812, Alpha_L_fucos, Alpha-L-fucosidase	NA|133aa|down_1|NC_011297.1_52006_52405_+	pfam02537, CRCB, CrcB-like protein, Camphor Resistance (CrcB)	NA|121aa|down_2|NC_011297.1_52401_52764_+	pfam02537, CRCB, CrcB-like protein, Camphor Resistance (CrcB)	NA|776aa|down_3|NC_011297.1_52841_55169_-	PRK10658, PRK10658, putative alpha-glucosidase; Provisional	NA|928aa|down_4|NC_011297.1_55181_57965_-	PLN03080, PLN03080, Probable beta-xylosidase; Provisional	NA|251aa|down_5|NC_011297.1_59056_59809_-	pfam01063, Aminotran_4, Amino-transferase class IV	NA|445aa|down_6|NC_011297.1_59814_61149_-	COG0147, TrpE, Anthranilate/para-aminobenzoate synthases component I [Amino acid transport and metabolism / Coenzyme metabolism]	NA|188aa|down_7|NC_011297.1_61145_61709_-	PRK05670, PRK05670, anthranilate synthase component II; Provisional	NA|169aa|down_8|NC_011297.1_61827_62334_+	NA	NA|372aa|down_9|NC_011297.1_62396_63512_-	COG2407, FucI, L-fucose isomerase and related proteins [Carbohydrate transport and metabolism]
GCF_000020965.1_ASM2096v1	NC_011297	Dictyoglomus thermophilum H-6-12, complete sequence	2	71018-73143	2,2,2	CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6	cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6,WYL,cas8b1,csx3,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csx1,csa3	Unclear	GTTTAAATCCCACATAGTTCAGATCAAAC,GTTTAAATCCCACATAGTTCAGATCAAAC,GTTTAAATCCCACATAGTTCAGATCAAAC	29,29,29	0	0	NA	NA	I-A:I-A:I-A	32,32,31	32	Unclear	cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6,WYL,cas8b1,csx3,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csx1,csa3	NA|169aa|up_7|NC_011297.1_61827_62334_+,NA	NA|445aa|up_9|NC_011297.1_59814_61149_-	COG0147, TrpE, Anthranilate/para-aminobenzoate synthases component I [Amino acid transport and metabolism / Coenzyme metabolism]	NA|188aa|up_8|NC_011297.1_61145_61709_-	PRK05670, PRK05670, anthranilate synthase component II; Provisional	NA|169aa|up_7|NC_011297.1_61827_62334_+	NA	NA|372aa|up_6|NC_011297.1_62396_63512_-	COG2407, FucI, L-fucose isomerase and related proteins [Carbohydrate transport and metabolism]	NA|169aa|up_5|NC_011297.1_63515_64022_-	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|428aa|up_4|NC_011297.1_64287_65571_+	COG1653, UgpB, ABC-type sugar transport system, periplasmic component [Carbohydrate transport and metabolism]	NA|292aa|up_3|NC_011297.1_65673_66549_+	COG1175, UgpA, ABC-type sugar transport systems, permease components [Carbohydrate transport and metabolism]	NA|279aa|up_2|NC_011297.1_66548_67385_+	COG0395, UgpE, ABC-type sugar transport system, permease component [Carbohydrate transport and metabolism]	NA|486aa|up_1|NC_011297.1_67430_68888_+	COG1621, SacC, Beta-fructosidases (levanase/invertase) [Carbohydrate transport and metabolism]	NA|329aa|up_0|NC_011297.1_68908_69895_-	cd06291, PBP1_Qymf-like, ligand binding domain of the lacI-like transcription regulator from a novel metal-reducing bacterium Alkaliphilus Metalliredigens (strain Qymf) and its close homologs	cas2|88aa|down_0|NC_011297.1_73359_73623_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|327aa|down_1|NC_011297.1_73625_74606_-	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas4|171aa|down_2|NC_011297.1_74610_75123_-	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas3|756aa|down_3|NC_011297.1_75143_77411_-	cd09639, Cas3_I, CRISPR/Cas system-associated protein Cas3	cas5|234aa|down_4|NC_011297.1_77388_78090_-	TIGR01895, conserved_hypothetical_protein, CRISPR-associated protein Cas5, subtype I-B/TNEAP	cas7|300aa|down_5|NC_011297.1_78076_78976_-	TIGR02585, conserved_protein, CRISPR-associated protein Cas7/Cst2/DevR, subtype I-B/TNEAP	cas8b2|559aa|down_6|NC_011297.1_78991_80668_-	cd09665, Cas8a1_I-A, CRISPR/Cas system-associated protein Cas8a1	cas6|248aa|down_7|NC_011297.1_80669_81413_-	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	NA|397aa|down_8|NC_011297.1_81673_82864_+	cd08185, Fe-ADH-like, Iron-containing alcohol dehydrogenases-like	NA|347aa|down_9|NC_011297.1_82943_83984_+	cd00761, Glyco_tranf_GTA_type, Glycosyltransferase family A (GT-A) includes diverse families of glycosyl transferases with a common GT-A type structural fold
GCF_000020965.1_ASM2096v1	NC_011297	Dictyoglomus thermophilum H-6-12, complete sequence	3	178426-182925	3,3,3	CRISPRCasFinder,CRT,PILER-CR	no	WYL,cas6,cas8b1,cas7,cas5,cas3,cas4,cas1,cas2,csx3,cas10,csm2gr11,csm3gr7	cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6,WYL,cas8b1,csx3,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csx1,csa3	Type I-B,Type III-C,Type III-A,Type III-D,Type III-B	GTTTGTAGCGTGCCTATAAGGGATTGAAAC,GTTTGTAGCGTGCCTATAAGGGATTGAAAC,GTTTGTAGCGTGCCTATAAGGGATTGAAAC	30,30,30	0	0	NA	NA	NA:NA:NA	67,67,66	67	TypeI-B,TypeIII-C,TypeIII-A,TypeIII-D,TypeIII-B	cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6,WYL,cas8b1,csx3,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csx1,csa3	NA|55aa|up_9|NC_011297.1_168384_168549_+,NA|56aa|down_0|NC_011297.1_183387_183555_+	NA|55aa|up_9|NC_011297.1_168384_168549_+	NA	WYL|281aa|up_8|NC_011297.1_168533_169376_+	pfam13280, WYL, WYL domain	cas6|261aa|up_7|NC_011297.1_169448_170231_+	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	cas8b1|655aa|up_6|NC_011297.1_170220_172185_+	TIGR02556, hypothetical_protein_MM_0564, CRISPR-associated protein, TM1802 family	cas7|318aa|up_5|NC_011297.1_172185_173139_+	pfam05107, Cas_Cas7, CRISPR-associated protein Cas7	cas5|251aa|up_4|NC_011297.1_173155_173908_+	cd09692, Cas5_I-B, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas3|802aa|up_3|NC_011297.1_173909_176315_+	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	cas4|165aa|up_2|NC_011297.1_176331_176826_+	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas1|332aa|up_1|NC_011297.1_176822_177818_+	cd09722, Cas1_I-B, CRISPR/Cas system-associated protein Cas1	cas2|88aa|up_0|NC_011297.1_177819_178083_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|56aa|down_0|NC_011297.1_183387_183555_+	NA	NA|366aa|down_1|NC_011297.1_183823_184921_+	cd01907, GlxB, Glutamine amidotransferases class-II (Gn-AT)_GlxB-type	NA|503aa|down_2|NC_011297.1_184917_186426_+	COG0069, GltB, Glutamate synthase domain 2 [Amino acid transport and metabolism]	NA|152aa|down_3|NC_011297.1_186429_186885_+	cd10563, CooF_like, CooF, iron-sulfur subunit of carbon monoxide dehydrogenase	NA|418aa|down_4|NC_011297.1_186898_188152_+	COG1251, NirB, NAD(P)H-nitrite reductase [Energy production and conversion]	NA|247aa|down_5|NC_011297.1_188172_188913_+	cd00981, arch_gltB, Archaeal-type gltB domain	NA|541aa|down_6|NC_011297.1_188941_190564_+	PRK13981, PRK13981, NAD synthetase; Provisional	NA|447aa|down_7|NC_011297.1_190645_191986_-	COG0174, GlnA, Glutamine synthetase [Amino acid transport and metabolism]	NA|113aa|down_8|NC_011297.1_192218_192557_-	COG0347, GlnK, Nitrogen regulatory protein PII [Amino acid transport and metabolism]	NA|447aa|down_9|NC_011297.1_192553_193894_-	TIGR03644, marine_trans_1, probable ammonium transporter, marine subtype
GCF_000020965.1_ASM2096v1	NC_011297	Dictyoglomus thermophilum H-6-12, complete sequence	4	1230930-1231048	4	CRISPRCasFinder	no		cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6,WYL,cas8b1,csx3,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csx1,csa3	Orphan	TGGTCGGGGCGACTGGACTTGAACCAGCGACCT	33	0	0	NA	NA	NA	1	1	Orphan	cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6,WYL,cas8b1,csx3,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csx1,csa3	NA|100aa|up_4|NC_011297.1_1228159_1228459_-,NA|150aa|down_5|NC_011297.1_1236371_1236821_-	NA|169aa|up_9|NC_011297.1_1221418_1221925_-	cd01275, FHIT, FHIT (fragile histidine family): FHIT proteins, related to the HIT family carry a motif HxHxH/Qxx (x, is a hydrophobic amino acid), On the basis of sequence, substrate specificity, structure, evolution and mechanism, HIT proteins are classified into three  branches: the Hint branch, which consists of adenosine 5' -monophosphoramide hydrolases, the Fhit branch, that consists of diadenosine polyphosphate hydrolases, and the GalT branch consisting of specific nucloside monophosphate transferases	NA|319aa|up_8|NC_011297.1_1222095_1223052_-	PRK03202, PRK03202, ATP-dependent 6-phosphofructokinase	NA|272aa|up_7|NC_011297.1_1223051_1223867_-	PRK05724, PRK05724, acetyl-CoA carboxylase carboxyltransferase subunit alpha; Validated	NA|281aa|up_6|NC_011297.1_1223860_1224703_-	PRK05654, PRK05654, acetyl-CoA carboxylase carboxyltransferase subunit beta	NA|1128aa|up_5|NC_011297.1_1224748_1228132_-	PRK06826, dnaE, DNA polymerase III DnaE; Reviewed	NA|100aa|up_4|NC_011297.1_1228159_1228459_-	NA	NA|211aa|up_3|NC_011297.1_1228495_1229128_-	cd10030, UDG-F4_TTUDGA_SPO1dp_like, Uracil DNA glycosylase family 4, includes Thermotoga maritima TTUDGA, Bacillus phage SPO1 DNA polymerase, and similar proteins	NA|221aa|up_2|NC_011297.1_1229115_1229778_-	PRK00312, pcm, protein-L-isoaspartate(D-aspartate) O-methyltransferase	NA|286aa|up_1|NC_011297.1_1229783_1230641_-	PRK00811, PRK00811, polyamine aminopropyltransferase	NA|91aa|up_0|NC_011297.1_1230647_1230920_-	pfam00708, Acylphosphatase, Acylphosphatase	NA|626aa|down_0|NC_011297.1_1231121_1232999_-	TIGR01073, ATP-dependent_DNA_helicase_PcrA, ATP-dependent DNA helicase PcrA	NA|81aa|down_1|NC_011297.1_1233003_1233246_-	pfam03776, MinE, Septum formation topological specificity factor MinE	NA|265aa|down_2|NC_011297.1_1233258_1234053_-	COG2894, MinD, Septum formation inhibitor-activating ATPase [Cell division and chromosome partitioning]	NA|203aa|down_3|NC_011297.1_1234045_1234654_-	pfam03775, MinC_C, Septum formation inhibitor MinC, C-terminal domain	NA|575aa|down_4|NC_011297.1_1234650_1236375_-	TIGR03423, pbp2_mrdA, penicillin-binding protein 2	NA|150aa|down_5|NC_011297.1_1236371_1236821_-	NA	NA|263aa|down_6|NC_011297.1_1236805_1237594_-	PRK13922, PRK13922, rod shape-determining protein MreC; Provisional	NA|349aa|down_7|NC_011297.1_1237593_1238640_-	PRK13927, PRK13927, rod shape-determining protein MreB; Provisional	NA|194aa|down_8|NC_011297.1_1238675_1239257_-	pfam02545, Maf, Maf-like protein	NA|279aa|down_9|NC_011297.1_1239253_1240090_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]
