assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	1	90010-90102	1	CRISPRCasFinder	no		csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Orphan	CGGCGGCCCTTGCAGGTCTCGCAG	24	0	0	NA	NA	NA	1	1	Orphan	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|170aa|up_1|NZ_AP019796.1_87501_88011_+,NA|106aa|down_1|NZ_AP019796.1_93166_93484_+,NA|313aa|down_6|NZ_AP019796.1_101038_101977_-,NA|61aa|down_7|NZ_AP019796.1_102078_102261_+	NA|526aa|up_9|NZ_AP019796.1_74527_76105_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|143aa|up_8|NZ_AP019796.1_76105_76534_-	cd12152, F1-ATPase_delta, mitochondrial ATP synthase delta subunit	NA|502aa|up_7|NZ_AP019796.1_76536_78042_-	PRK09280, PRK09280, F0F1 ATP synthase subunit beta; Validated	NA|835aa|up_6|NZ_AP019796.1_78295_80800_+	cd06238, M14-like, Peptidase M14-like domain; uncharacterized subgroup	NA|447aa|up_5|NZ_AP019796.1_80803_82144_-	PRK05820, deoA, thymidine phosphorylase; Reviewed	NA|838aa|up_4|NZ_AP019796.1_82145_84659_-	cd02850, E_set_Cellulase_N, N-terminal Early set domain associated with the catalytic domain of cellulase	NA|84aa|up_3|NZ_AP019796.1_84776_85028_-	pfam01197, Ribosomal_L31, Ribosomal protein L31	NA|628aa|up_2|NZ_AP019796.1_85110_86994_-	PRK09284, PRK09284, thiamine biosynthesis protein ThiC; Provisional	NA|170aa|up_1|NZ_AP019796.1_87501_88011_+	NA	NA|362aa|up_0|NZ_AP019796.1_88282_89368_+	cd14956, NHL_like_3, Uncharacterized NHL-repeat domain in bacterial proteins	NA|198aa|down_0|NZ_AP019796.1_92492_93086_+	COG2095, MarC, Multiple antibiotic transporter [Intracellular trafficking and secretion]	NA|106aa|down_1|NZ_AP019796.1_93166_93484_+	NA	NA|816aa|down_2|NZ_AP019796.1_93564_96012_-	pfam14498, Glyco_hyd_65N_2, Glycosyl hydrolase family 65, N-terminal domain	NA|353aa|down_3|NZ_AP019796.1_96295_97354_+	TIGR02800, Protein_TolB, tol-pal system beta propeller repeat protein TolB	NA|777aa|down_4|NZ_AP019796.1_97373_99704_+	TIGR03921, T7SS_mycosin, type VII secretion-associated serine protease mycosin	NA|333aa|down_5|NZ_AP019796.1_99974_100973_-	cd19143, AKR_AKR6C1_2, AKR6C family of aldo-keto reductase (AKR)	NA|313aa|down_6|NZ_AP019796.1_101038_101977_-	NA	NA|61aa|down_7|NZ_AP019796.1_102078_102261_+	NA	NA|922aa|down_8|NZ_AP019796.1_102376_105142_+	COG0612, PqqL, Predicted Zn-dependent peptidases [General function prediction only]	NA|262aa|down_9|NZ_AP019796.1_105242_106028_+	COG1842, PspA, Phage shock protein A (IM30), suppresses sigma54-dependent transcription [Transcription / Signal transduction mechanisms]
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	2	358280-358380	2	CRISPRCasFinder	no		csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Orphan	GGTGCCGGTTGCAGATGCCGAGCGTAAGCGAT	32	0	0	NA	NA	NA	1	1	Orphan	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|298aa|up_8|NZ_AP019796.1_348474_349368_-,NA|725aa|down_5|NZ_AP019796.1_371504_373679_+,NA|539aa|down_7|NZ_AP019796.1_375977_377594_+,NA|355aa|down_9|NZ_AP019796.1_380510_381575_+	NA|1218aa|up_9|NZ_AP019796.1_344785_348439_-	sd00008, TPR_YbbN, C-terminal Tetratricopeptide repeat (TPR) region of YbbN and similar motifs	NA|298aa|up_8|NZ_AP019796.1_348474_349368_-	NA	NA|234aa|up_7|NZ_AP019796.1_349695_350397_-	TIGR04508, queE_Cx14CxxC, 7-carboxy-7-deazaguanine synthase, Cx14CxxC type	NA|239aa|up_6|NZ_AP019796.1_350399_351116_-	pfam06508, QueC, Queuosine biosynthesis protein QueC	NA|157aa|up_5|NZ_AP019796.1_351075_351546_-	pfam01242, PTPS, 6-pyruvoyl tetrahydropterin synthase	NA|169aa|up_4|NZ_AP019796.1_351685_352192_+	PRK13258, PRK13258, 7-cyano-7-deazaguanine reductase; Provisional	NA|586aa|up_3|NZ_AP019796.1_352188_353946_-	cd09912, DLP_2, Dynamin-like protein including dynamins, mitofusins, and guanylate-binding proteins	NA|459aa|up_2|NZ_AP019796.1_354003_355380_-	PRK13341, PRK13341, AAA family ATPase	NA|572aa|up_1|NZ_AP019796.1_355417_357133_-	PRK00911, PRK00911, dihydroxy-acid dehydratase; Provisional	NA|218aa|up_0|NZ_AP019796.1_357222_357876_+	pfam09601, DUF2459, Protein of unknown function (DUF2459)	NA|333aa|down_0|NZ_AP019796.1_359195_360194_+	pfam13546, DDE_5, DDE superfamily endonuclease	NA|279aa|down_1|NZ_AP019796.1_363171_364008_-	pfam10881, DUF2726, Protein of unknown function (DUF2726)	NA|801aa|down_2|NZ_AP019796.1_364071_366474_+	COG1506, DAP2, Dipeptidyl aminopeptidases/acylaminoacyl-peptidases [Amino acid transport and metabolism]	NA|469aa|down_3|NZ_AP019796.1_366515_367922_-	COG5563, COG5563, Predicted integral membrane proteins containing uncharacterized repeats [Function unknown]	NA|1048aa|down_4|NZ_AP019796.1_368064_371208_-	pfam13620, CarboxypepD_reg, Carboxypeptidase regulatory-like domain	NA|725aa|down_5|NZ_AP019796.1_371504_373679_+	NA	NA|733aa|down_6|NZ_AP019796.1_373708_375907_+	TIGR04183, hypothetical_protein, Por secretion system C-terminal sorting domain	NA|539aa|down_7|NZ_AP019796.1_375977_377594_+	NA	NA|972aa|down_8|NZ_AP019796.1_377590_380506_+	pfam13715, CarbopepD_reg_2, CarboxypepD_reg-like domain	NA|355aa|down_9|NZ_AP019796.1_380510_381575_+	NA
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	3	567791-568673	1,3,1	PILER-CR,CRISPRCasFinder,CRT	no	DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Type I-E	GGTGTCCCCGCACCCGCGGGGATAGTCC,GGTGTCCCCGCACCCGCGGGGATAGTCCC,GGTGTCCCCGCACCCGCGGGGATAGTCC	28,29,28	0	0	NA	NA	NA:NA:NA	14,14,14	14	TypeI-E	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|194aa|up_7|NZ_AP019796.1_560870_561452_+,NA|850aa|down_1|NZ_AP019796.1_570076_572626_+	DEDDh|168aa|up_9|NZ_AP019796.1_557619_558123_+	cd06127, DEDDh, DEDDh 3'-5' exonuclease domain family	cas3|877aa|up_8|NZ_AP019796.1_558142_560773_+	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	NA|194aa|up_7|NZ_AP019796.1_560870_561452_+	NA	cas8e|520aa|up_6|NZ_AP019796.1_561468_563028_+	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cse2gr11|180aa|up_5|NZ_AP019796.1_563024_563564_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|424aa|up_4|NZ_AP019796.1_563611_564883_+	pfam09344, Cas_CT1975, CT1975-like protein	cas5|253aa|up_3|NZ_AP019796.1_564882_565641_+	TIGR01868, hypothetical_protein, CRISPR-associated protein Cas5/CasD, subtype I-E/ECOLI	cas6e|266aa|up_2|NZ_AP019796.1_565630_566428_+	smart01101, CRISPR_assoc, This domain forms an anti-parallel beta strand structure with flanking alpha helical regions	cas1|298aa|up_1|NZ_AP019796.1_566445_567339_+	cd09719, Cas1_I-E, CRISPR/Cas system-associated protein Cas1	cas2|143aa|up_0|NZ_AP019796.1_567310_567739_+	pfam09707, Cas_Cas2CT1978, CRISPR-associated protein (Cas_Cas2CT1978)	NA|163aa|down_0|NZ_AP019796.1_569343_569832_-	COG2318, DinB, Uncharacterized protein conserved in bacteria [Function unknown]	NA|850aa|down_1|NZ_AP019796.1_570076_572626_+	NA	NA|415aa|down_2|NZ_AP019796.1_572631_573876_-	COG0153, GalK, Galactokinase [Carbohydrate transport and metabolism]	NA|510aa|down_3|NZ_AP019796.1_573889_575419_-	cd10325, SLC5sbd_vSGLT, Vibrio parahaemolyticus Na(+)/galactose cotransporter (vSGLT) and related proteins; solute binding domain	NA|352aa|down_4|NZ_AP019796.1_575441_576497_-	PRK11720, PRK11720, UDP-glucose--hexose-1-phosphate uridylyltransferase	NA|114aa|down_5|NZ_AP019796.1_576756_577098_+	pfam04342, DMT_6, Putative member of DMT superfamily (DUF486)	NA|306aa|down_6|NZ_AP019796.1_577194_578112_+	cd00408, DHDPS-like, Dihydrodipicolinate synthase family	NA|483aa|down_7|NZ_AP019796.1_578131_579580_+	cd07097, ALDH_KGSADH-YcbD, Bacillus subtilis NADP+-dependent alpha-ketoglutaric semialdehyde dehydrogenase ycbD-like	NA|219aa|down_8|NZ_AP019796.1_579583_580240_+	COG1802, GntR, Transcriptional regulators [Transcription]	NA|588aa|down_9|NZ_AP019796.1_580236_582000_+	pfam05960, DUF885, Bacterial protein of unknown function (DUF885)
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	4	610758-610898	4	CRISPRCasFinder	no		csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Orphan	GAGGCGAAACTGGAAAAGCAGATCGCCGAGGTGGAGGGTCGG	42	0	0	NA	NA	NA	1	1	Orphan	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|207aa|up_9|NZ_AP019796.1_598706_599327_-,NA|169aa|up_2|NZ_AP019796.1_608534_609041_+,NA|84aa|up_0|NZ_AP019796.1_609270_609522_-,NA	NA|207aa|up_9|NZ_AP019796.1_598706_599327_-	NA	NA|431aa|up_8|NZ_AP019796.1_599345_600638_+	COG2133, COG2133, Glucose/sorbosone dehydrogenases [Carbohydrate transport and metabolism]	NA|490aa|up_7|NZ_AP019796.1_600622_602092_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|229aa|up_6|NZ_AP019796.1_602095_602782_-	COG0745, OmpR, Response regulators consisting of a CheY-like receiver domain and a winged-helix DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|394aa|up_5|NZ_AP019796.1_602945_604127_+	TIGR01730, COG0845:_Membrane-fusion_protein, RND family efflux transporter, MFP subunit	NA|1048aa|up_4|NZ_AP019796.1_604130_607274_+	COG3696, COG3696, Putative silver efflux pump [Inorganic ion transport and metabolism]	NA|414aa|up_3|NZ_AP019796.1_607286_608528_+	COG1538, TolC, Outer membrane protein [Cell envelope biogenesis, outer membrane / Intracellular trafficking and secretion]	NA|169aa|up_2|NZ_AP019796.1_608534_609041_+	NA	NA|85aa|up_1|NZ_AP019796.1_609061_609316_-	COG2026, RelE, Cytotoxic translational repressor of toxin-antitoxin stability system [Translation, ribosomal structure and biogenesis / Cell division and chromosome partitioning]	NA|84aa|up_0|NZ_AP019796.1_609270_609522_-	NA	NA|779aa|down_0|NZ_AP019796.1_611034_613371_+	cd07551, P-type_ATPase_HM_ZosA_PfeT-like, P-type heavy metal-transporting ATPase, similar to Bacillus subtilis ZosA/PfeT which transports copper, and perhaps zinc under oxidative stress, and perhaps ferrous iron	NA|330aa|down_1|NZ_AP019796.1_613371_614361_-	COG3292, COG3292, Predicted periplasmic ligand-binding sensor domain [Signal transduction mechanisms]	NA|677aa|down_2|NZ_AP019796.1_614608_616639_+	COG1785, PhoA, Alkaline phosphatase [Inorganic ion transport and metabolism]	NA|544aa|down_3|NZ_AP019796.1_616876_618508_-	COG0578, GlpA, Glycerol-3-phosphate dehydrogenase [Energy production and conversion]	NA|982aa|down_4|NZ_AP019796.1_618604_621550_+	pfam15979, Glyco_hydro_115, Glycosyl hydrolase family 115	NA|172aa|down_5|NZ_AP019796.1_621933_622449_+	COG2080, CoxS, Aerobic-type carbon monoxide dehydrogenase, small subunit CoxS/CutS homologs [Energy production and conversion]	NA|791aa|down_6|NZ_AP019796.1_622488_624861_+	COG1529, CoxL, Aerobic-type carbon monoxide dehydrogenase, large subunit CoxL/CutL homologs [Energy production and conversion]	NA|290aa|down_7|NZ_AP019796.1_624885_625755_+	COG1319, CoxM, Aerobic-type carbon monoxide dehydrogenase, middle subunit CoxM/CutM homologs [Energy production and conversion]	NA|124aa|down_8|NZ_AP019796.1_625818_626190_-	TIGR03879, Uncharacterized_protein_MJ1053, probable regulatory domain	NA|302aa|down_9|NZ_AP019796.1_626192_627098_-	TIGR03878, thermo_KaiC_2, KaiC domain protein, AF_0795 family
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	5	1680847-1682485	2,5,2	PILER-CR,CRISPRCasFinder,CRT	no	c2c9_V-U4,cas6,cas8b1,cas7,cas5,cas3,cas4,cas1,cas2	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Type I-B	GTTTGTAGCCTACCTATGAGGGATTGAAAT,GTTTGTAGCCTACCTATGAGGGATTGAAAT,GTTTGTAGCCTACCTATGAGGGATTGAAAT	30,30,30	0	0	NA	NA	NA:NA:NA	24,24,24	24	TypeI-B	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|111aa|up_9|NZ_AP019796.1_1671417_1671750_+,NA|89aa|up_0|NZ_AP019796.1_1680353_1680620_-,NA|84aa|down_0|NZ_AP019796.1_1684532_1684784_+,NA|217aa|down_1|NZ_AP019796.1_1685612_1686263_-,NA|356aa|down_5|NZ_AP019796.1_1694593_1695661_-,NA|1132aa|down_6|NZ_AP019796.1_1695632_1699028_-	NA|111aa|up_9|NZ_AP019796.1_1671417_1671750_+	NA	cas6|263aa|up_8|NZ_AP019796.1_1671775_1672564_+	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	cas8b1|584aa|up_7|NZ_AP019796.1_1672610_1674362_+	pfam09484, Cas_TM1802, CRISPR-associated protein TM1802 (cas_TM1802)	cas7|306aa|up_6|NZ_AP019796.1_1674358_1675276_+	TIGR02590, hypothetical_protein_MM_0563, CRISPR-associated protein Cas7/Csh2, subtype I-B/HMARI	cas5|259aa|up_5|NZ_AP019796.1_1675272_1676049_+	TIGR02592, hypothetical_protein_CTC_01466, CRISPR-associated protein Cas5, subtype I-B/HMARI	cas3|828aa|up_4|NZ_AP019796.1_1676009_1678493_+	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	cas4|172aa|up_3|NZ_AP019796.1_1678518_1679034_+	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas1|331aa|up_2|NZ_AP019796.1_1679035_1680028_+	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas2|88aa|up_1|NZ_AP019796.1_1680039_1680303_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|89aa|up_0|NZ_AP019796.1_1680353_1680620_-	NA	NA|84aa|down_0|NZ_AP019796.1_1684532_1684784_+	NA	NA|217aa|down_1|NZ_AP019796.1_1685612_1686263_-	NA	NA|297aa|down_2|NZ_AP019796.1_1686520_1687411_-	pfam13354, Beta-lactamase2, Beta-lactamase enzyme family	NA|1757aa|down_3|NZ_AP019796.1_1687438_1692709_-	TIGR04183, hypothetical_protein, Por secretion system C-terminal sorting domain	NA|543aa|down_4|NZ_AP019796.1_1692965_1694594_-	cd06583, PGRP, Peptidoglycan recognition proteins (PGRPs) are pattern recognition receptors that bind, and in certain cases, hydrolyze peptidoglycans (PGNs) of bacterial cell walls	NA|356aa|down_5|NZ_AP019796.1_1694593_1695661_-	NA	NA|1132aa|down_6|NZ_AP019796.1_1695632_1699028_-	NA	NA|898aa|down_7|NZ_AP019796.1_1699042_1701736_-	cd01347, ligand_gated_channel, TonB dependent/Ligand-Gated channels are created by a monomeric 22 strand (22,24) anti-parallel beta-barrel	NA|903aa|down_8|NZ_AP019796.1_1701808_1704517_-	PRK06655, flgD, flagellar hook assembly protein FlgD	csm5gr7|552aa|down_9|NZ_AP019796.1_1706257_1707913_-	cd09662, Csm5_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm5
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	6	1683359-1683792	6,3,3	CRISPRCasFinder,CRT,PILER-CR	no	c2c9_V-U4,cas6,cas8b1,cas7,cas5,cas3,cas4,cas1,cas2	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Type I-B	GTTTGTAGCCTACCTATGAGGGATTGAAAT,GTTTGTAGCCTACCTATGAGGGATTGAAAT,GTTTGTAGCCTACCTATGAGGGATTGAAAT	30,30,30	1	1	1683389-1683423	NZ_AP019796.1_1682485-1682519	NA:NA:NA	6,6,5	6	TypeI-B	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|111aa|up_9|NZ_AP019796.1_1671417_1671750_+,NA|89aa|up_0|NZ_AP019796.1_1680353_1680620_-,NA|84aa|down_0|NZ_AP019796.1_1684532_1684784_+,NA|217aa|down_1|NZ_AP019796.1_1685612_1686263_-,NA|356aa|down_5|NZ_AP019796.1_1694593_1695661_-,NA|1132aa|down_6|NZ_AP019796.1_1695632_1699028_-	NA|111aa|up_9|NZ_AP019796.1_1671417_1671750_+	NA	cas6|263aa|up_8|NZ_AP019796.1_1671775_1672564_+	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	cas8b1|584aa|up_7|NZ_AP019796.1_1672610_1674362_+	pfam09484, Cas_TM1802, CRISPR-associated protein TM1802 (cas_TM1802)	cas7|306aa|up_6|NZ_AP019796.1_1674358_1675276_+	TIGR02590, hypothetical_protein_MM_0563, CRISPR-associated protein Cas7/Csh2, subtype I-B/HMARI	cas5|259aa|up_5|NZ_AP019796.1_1675272_1676049_+	TIGR02592, hypothetical_protein_CTC_01466, CRISPR-associated protein Cas5, subtype I-B/HMARI	cas3|828aa|up_4|NZ_AP019796.1_1676009_1678493_+	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	cas4|172aa|up_3|NZ_AP019796.1_1678518_1679034_+	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas1|331aa|up_2|NZ_AP019796.1_1679035_1680028_+	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas2|88aa|up_1|NZ_AP019796.1_1680039_1680303_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|89aa|up_0|NZ_AP019796.1_1680353_1680620_-	NA	NA|84aa|down_0|NZ_AP019796.1_1684532_1684784_+	NA	NA|217aa|down_1|NZ_AP019796.1_1685612_1686263_-	NA	NA|297aa|down_2|NZ_AP019796.1_1686520_1687411_-	pfam13354, Beta-lactamase2, Beta-lactamase enzyme family	NA|1757aa|down_3|NZ_AP019796.1_1687438_1692709_-	TIGR04183, hypothetical_protein, Por secretion system C-terminal sorting domain	NA|543aa|down_4|NZ_AP019796.1_1692965_1694594_-	cd06583, PGRP, Peptidoglycan recognition proteins (PGRPs) are pattern recognition receptors that bind, and in certain cases, hydrolyze peptidoglycans (PGNs) of bacterial cell walls	NA|356aa|down_5|NZ_AP019796.1_1694593_1695661_-	NA	NA|1132aa|down_6|NZ_AP019796.1_1695632_1699028_-	NA	NA|898aa|down_7|NZ_AP019796.1_1699042_1701736_-	cd01347, ligand_gated_channel, TonB dependent/Ligand-Gated channels are created by a monomeric 22 strand (22,24) anti-parallel beta-barrel	NA|903aa|down_8|NZ_AP019796.1_1701808_1704517_-	PRK06655, flgD, flagellar hook assembly protein FlgD	csm5gr7|552aa|down_9|NZ_AP019796.1_1706257_1707913_-	cd09662, Csm5_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm5
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	7	1705337-1706070	4,7,4,5	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,Cas14u_CAS-V,csx20,cas6	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Type III-A,Type III-D,Type III-C,Type III-B	GTCGTAATCCCCTTTTCATCGGGTCAGGTCTTCAGAC,GTCGTAATCCCCTTTTCATCGGGTCAGGTCTTCAGAC,GTCGTAATCCCCTTTTCATCGGGTCAGGTCTTCAGAC,TGTCGTAATCCCCTTTTCATCGGGTCAGGTCTTCAGACGC	37,37,37,40	0	0	NA	NA	NA:NA:NA:NA	8,9,9,8	9	TypeIII-A,TypeIII-D,TypeIII-C,TypeIII-B	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|89aa|up_9|NZ_AP019796.1_1680353_1680620_-,NA|84aa|up_8|NZ_AP019796.1_1684532_1684784_+,NA|217aa|up_7|NZ_AP019796.1_1685612_1686263_-,NA|356aa|up_3|NZ_AP019796.1_1694593_1695661_-,NA|1132aa|up_2|NZ_AP019796.1_1695632_1699028_-,NA|343aa|down_7|NZ_AP019796.1_1714974_1716003_+,NA|273aa|down_9|NZ_AP019796.1_1717817_1718636_+	NA|89aa|up_9|NZ_AP019796.1_1680353_1680620_-	NA	NA|84aa|up_8|NZ_AP019796.1_1684532_1684784_+	NA	NA|217aa|up_7|NZ_AP019796.1_1685612_1686263_-	NA	NA|297aa|up_6|NZ_AP019796.1_1686520_1687411_-	pfam13354, Beta-lactamase2, Beta-lactamase enzyme family	NA|1757aa|up_5|NZ_AP019796.1_1687438_1692709_-	TIGR04183, hypothetical_protein, Por secretion system C-terminal sorting domain	NA|543aa|up_4|NZ_AP019796.1_1692965_1694594_-	cd06583, PGRP, Peptidoglycan recognition proteins (PGRPs) are pattern recognition receptors that bind, and in certain cases, hydrolyze peptidoglycans (PGNs) of bacterial cell walls	NA|356aa|up_3|NZ_AP019796.1_1694593_1695661_-	NA	NA|1132aa|up_2|NZ_AP019796.1_1695632_1699028_-	NA	NA|898aa|up_1|NZ_AP019796.1_1699042_1701736_-	cd01347, ligand_gated_channel, TonB dependent/Ligand-Gated channels are created by a monomeric 22 strand (22,24) anti-parallel beta-barrel	NA|903aa|up_0|NZ_AP019796.1_1701808_1704517_-	PRK06655, flgD, flagellar hook assembly protein FlgD	csm5gr7|552aa|down_0|NZ_AP019796.1_1706257_1707913_-	cd09662, Csm5_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm5	csm4gr5|338aa|down_1|NZ_AP019796.1_1707930_1708944_-	cd09663, Csm4_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm4	csm3gr7|265aa|down_2|NZ_AP019796.1_1708940_1709735_-	cd09684, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	csm2gr11|129aa|down_3|NZ_AP019796.1_1709751_1710138_-	pfam03750, Csm2_III-A, Csm2 Type III-A	cas10|738aa|down_4|NZ_AP019796.1_1710167_1712381_-	cd09680, Cas10_III, CRISPR/Cas system-associated protein Cas10	csx1|306aa|down_5|NZ_AP019796.1_1712483_1713401_-	cd09741, Csx1_III-U, CRISPR/Cas system-associated protein Csx1	NA|62aa|down_6|NZ_AP019796.1_1714666_1714852_+	pfam14020, DUF4236, Protein of unknown function (DUF4236)	NA|343aa|down_7|NZ_AP019796.1_1714974_1716003_+	NA	NA|596aa|down_8|NZ_AP019796.1_1716023_1717811_+	TIGR04211, hypothetical_protein, SH3 domain protein	NA|273aa|down_9|NZ_AP019796.1_1717817_1718636_+	NA
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	8	1713542-1714377	8,5,6	CRISPRCasFinder,CRT,PILER-CR	no	csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,Cas14u_CAS-V,csx20,cas6,cas2,cas1	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Type III-A,Type III-D,Type III-C,Type III-B	GTCGTAATCCCCTTTTCATCGGGTCAGGTTTTCAGAC,GTCGTAATCCCCTTTTCATCGGGTCAGGTTTTCAGAC,GTCGTAATCCCCTTTTCATCGGGTCAGGTTTTCAGAC	37,37,37	0	0	NA	NA	NA:NA:NA	10,10,6	10	TypeIII-A,TypeIII-D,TypeIII-C,TypeIII-B	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|356aa|up_9|NZ_AP019796.1_1694593_1695661_-,NA|1132aa|up_8|NZ_AP019796.1_1695632_1699028_-,NA|343aa|down_1|NZ_AP019796.1_1714974_1716003_+,NA|273aa|down_3|NZ_AP019796.1_1717817_1718636_+,csx20|131aa|down_6|NZ_AP019796.1_1721073_1721466_+,NA|133aa|down_7|NZ_AP019796.1_1721578_1721977_+,NA|122aa|down_8|NZ_AP019796.1_1721980_1722346_+	NA|356aa|up_9|NZ_AP019796.1_1694593_1695661_-	NA	NA|1132aa|up_8|NZ_AP019796.1_1695632_1699028_-	NA	NA|898aa|up_7|NZ_AP019796.1_1699042_1701736_-	cd01347, ligand_gated_channel, TonB dependent/Ligand-Gated channels are created by a monomeric 22 strand (22,24) anti-parallel beta-barrel	NA|903aa|up_6|NZ_AP019796.1_1701808_1704517_-	PRK06655, flgD, flagellar hook assembly protein FlgD	csm5gr7|552aa|up_5|NZ_AP019796.1_1706257_1707913_-	cd09662, Csm5_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm5	csm4gr5|338aa|up_4|NZ_AP019796.1_1707930_1708944_-	cd09663, Csm4_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm4	csm3gr7|265aa|up_3|NZ_AP019796.1_1708940_1709735_-	cd09684, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	csm2gr11|129aa|up_2|NZ_AP019796.1_1709751_1710138_-	pfam03750, Csm2_III-A, Csm2 Type III-A	cas10|738aa|up_1|NZ_AP019796.1_1710167_1712381_-	cd09680, Cas10_III, CRISPR/Cas system-associated protein Cas10	csx1|306aa|up_0|NZ_AP019796.1_1712483_1713401_-	cd09741, Csx1_III-U, CRISPR/Cas system-associated protein Csx1	NA|62aa|down_0|NZ_AP019796.1_1714666_1714852_+	pfam14020, DUF4236, Protein of unknown function (DUF4236)	NA|343aa|down_1|NZ_AP019796.1_1714974_1716003_+	NA	NA|596aa|down_2|NZ_AP019796.1_1716023_1717811_+	TIGR04211, hypothetical_protein, SH3 domain protein	NA|273aa|down_3|NZ_AP019796.1_1717817_1718636_+	NA	csx1|283aa|down_4|NZ_AP019796.1_1718639_1719488_+	pfam09455, Cas_DxTHG, CRISPR-associated (Cas) DxTHG family	Cas14u_CAS-V|383aa|down_5|NZ_AP019796.1_1719538_1720687_+	COG0675, COG0675, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	csx20|131aa|down_6|NZ_AP019796.1_1721073_1721466_+	NA	NA|133aa|down_7|NZ_AP019796.1_1721578_1721977_+	NA	NA|122aa|down_8|NZ_AP019796.1_1721980_1722346_+	NA	csx1|395aa|down_9|NZ_AP019796.1_1722399_1723584_+	cd09686, Csx1_III-U, CRISPR/Cas system-associated protein Csx1
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	9	1730758-1731513	9,6,7	CRISPRCasFinder,CRT,PILER-CR	no	csx1,Cas14u_CAS-V,csx20,cas6,cas2,cas1	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Unclear	GTCGTAATCCCCTTTTCATCGGGTCAGGTTTTCAGAC,GTCGTAATCCCCTTTTCATCGGGTCAGGTTTTCAGAC,GTCGTAATCCCCTTTTCATCGGGTCAGGTTTTCAGAC	37,37,37	0	0	NA	NA	NA:NA:NA	9,9,8	9	Unclear	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|122aa|up_9|NZ_AP019796.1_1721980_1722346_+,NA|242aa|up_2|NZ_AP019796.1_1728827_1729553_-,NA|125aa|down_0|NZ_AP019796.1_1731731_1732106_-,NA|107aa|down_1|NZ_AP019796.1_1732166_1732487_-,NA|494aa|down_5|NZ_AP019796.1_1735612_1737094_+,NA|1032aa|down_7|NZ_AP019796.1_1741029_1744125_+,NA|72aa|down_9|NZ_AP019796.1_1744820_1745036_-	NA|122aa|up_9|NZ_AP019796.1_1721980_1722346_+	NA	csx1|395aa|up_8|NZ_AP019796.1_1722399_1723584_+	cd09686, Csx1_III-U, CRISPR/Cas system-associated protein Csx1	csx1|448aa|up_7|NZ_AP019796.1_1723590_1724934_+	cd09732, Csx1_III-U, CRISPR/Cas system-associated protein Csx1	cas6|330aa|up_6|NZ_AP019796.1_1724919_1725909_-	pfam10040, CRISPR_Cas6, CRISPR-associated endoribonuclease Cas6	NA|292aa|up_5|NZ_AP019796.1_1725970_1726846_-	cd06257, DnaJ, DnaJ domain or J-domain	cas2|94aa|up_4|NZ_AP019796.1_1726860_1727142_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|526aa|up_3|NZ_AP019796.1_1727142_1728720_-	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	NA|242aa|up_2|NZ_AP019796.1_1728827_1729553_-	NA	NA|161aa|up_1|NZ_AP019796.1_1729549_1730032_-	pfam04343, DUF488, Protein of unknown function, DUF488	NA|199aa|up_0|NZ_AP019796.1_1730034_1730631_-	pfam04343, DUF488, Protein of unknown function, DUF488	NA|125aa|down_0|NZ_AP019796.1_1731731_1732106_-	NA	NA|107aa|down_1|NZ_AP019796.1_1732166_1732487_-	NA	NA|119aa|down_2|NZ_AP019796.1_1732745_1733102_-	pfam00436, SSB, Single-strand binding protein family	NA|90aa|down_3|NZ_AP019796.1_1733109_1733379_-	PRK11747, dinG, ATP-dependent DNA helicase DinG; Provisional	NA|679aa|down_4|NZ_AP019796.1_1733567_1735604_+	cd17933, DEXSc_RecD-like, DEXS-box helicase domain of RecD and similar proteins	NA|494aa|down_5|NZ_AP019796.1_1735612_1737094_+	NA	csx1|514aa|down_6|NZ_AP019796.1_1739320_1740862_-	cd09747, Csx1_III-U, CRISPR/Cas system-associated protein Csx1	NA|1032aa|down_7|NZ_AP019796.1_1741029_1744125_+	NA	NA|181aa|down_8|NZ_AP019796.1_1744090_1744633_+	TIGR02168, Chromosome_partition_protein_Smc, chromosome segregation protein SMC, common bacterial type	NA|72aa|down_9|NZ_AP019796.1_1744820_1745036_-	NA
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	10	1737827-1739136	10,7,8,9	CRISPRCasFinder,CRT,PILER-CR,PILER-CR	no	csx1,Cas14u_CAS-V,csx20,cas6,cas2,cas1	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Unclear	GTCGTAATCCCCTTTTCATCGGGTCAGGTTTTCAGAC,GTCGTAATCCCCTTTTCATCGGGTCAGGTTTTCAGAC,GTCGTAATCCCCTTTTCATCGGGTCAGGTTTTCAGAC,GTCGTAATCCCCTTTTCATCGGGTCAGGTTTTCAGAC	37,37,37,37	0	0	NA	NA	NA:NA:NA:NA	16,16,12,12	16	Unclear	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|242aa|up_8|NZ_AP019796.1_1728827_1729553_-,NA|125aa|up_5|NZ_AP019796.1_1731731_1732106_-,NA|107aa|up_4|NZ_AP019796.1_1732166_1732487_-,NA|494aa|up_0|NZ_AP019796.1_1735612_1737094_+,NA|1032aa|down_1|NZ_AP019796.1_1741029_1744125_+,NA|72aa|down_3|NZ_AP019796.1_1744820_1745036_-,NA|91aa|down_4|NZ_AP019796.1_1744945_1745218_-	cas1|526aa|up_9|NZ_AP019796.1_1727142_1728720_-	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	NA|242aa|up_8|NZ_AP019796.1_1728827_1729553_-	NA	NA|161aa|up_7|NZ_AP019796.1_1729549_1730032_-	pfam04343, DUF488, Protein of unknown function, DUF488	NA|199aa|up_6|NZ_AP019796.1_1730034_1730631_-	pfam04343, DUF488, Protein of unknown function, DUF488	NA|125aa|up_5|NZ_AP019796.1_1731731_1732106_-	NA	NA|107aa|up_4|NZ_AP019796.1_1732166_1732487_-	NA	NA|119aa|up_3|NZ_AP019796.1_1732745_1733102_-	pfam00436, SSB, Single-strand binding protein family	NA|90aa|up_2|NZ_AP019796.1_1733109_1733379_-	PRK11747, dinG, ATP-dependent DNA helicase DinG; Provisional	NA|679aa|up_1|NZ_AP019796.1_1733567_1735604_+	cd17933, DEXSc_RecD-like, DEXS-box helicase domain of RecD and similar proteins	NA|494aa|up_0|NZ_AP019796.1_1735612_1737094_+	NA	csx1|514aa|down_0|NZ_AP019796.1_1739320_1740862_-	cd09747, Csx1_III-U, CRISPR/Cas system-associated protein Csx1	NA|1032aa|down_1|NZ_AP019796.1_1741029_1744125_+	NA	NA|181aa|down_2|NZ_AP019796.1_1744090_1744633_+	TIGR02168, Chromosome_partition_protein_Smc, chromosome segregation protein SMC, common bacterial type	NA|72aa|down_3|NZ_AP019796.1_1744820_1745036_-	NA	NA|91aa|down_4|NZ_AP019796.1_1744945_1745218_-	NA	NA|348aa|down_5|NZ_AP019796.1_1745465_1746509_+	COG1609, PurR, Transcriptional regulators [Transcription]	NA|329aa|down_6|NZ_AP019796.1_1746513_1747500_+	PRK12607, PRK12607, phosphoribosylaminoimidazole-succinocarboxamide synthase; Provisional	NA|269aa|down_7|NZ_AP019796.1_1747484_1748291_-	cd07577, Ph0642_like, Pyrococcus horikoshii Ph0642 and related proteins, members of the nitrilase superfamily (putative class 13 nitrilases)	NA|139aa|down_8|NZ_AP019796.1_1748295_1748712_-	cd00756, MoaE, MoaE family	NA|88aa|down_9|NZ_AP019796.1_1748779_1749043_-	cd00754, Ubl_MoaD, ubiquitin-like (Ubl) domain found in molybdenum cofactor biosynthesis protein D (MoaD) and similar proteins
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	11	2074729-2080688	11,8,10,11	CRISPRCasFinder,CRT,PILER-CR,PILER-CR	no	cas2,cas1,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cas10,cmr1gr7,cas4,cas3,cas5,cas7,cas8b1,cas6,WYL	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Type III-A,Type III-B,Type III-C,Type III-D,Type I-B	ATTTCAATACCAAAAAGGTGCGATTAAAAC,ATTTCAATACCAAAAAGGTGCGATTAAAAC,TATTTCAATACCAAAAAGGTGCGATTAAAACCA,ATTTCAATACCAAAAAGGTGCGATTAAAAC	30,30,33,30	0	0	NA	NA	I-A,II-B,III-A:I-A,II-B,III-A:I-A,II-B,III-A:I-A,II-B,III-A	89,89,86,86	89	TypeIII-A,TypeIII-B,TypeIII-C,TypeIII-D,TypeI-B	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA,NA	NA|437aa|up_9|NZ_AP019796.1_2061854_2063165_-	PRK00037, hisS, histidyl-tRNA synthetase; Reviewed	NA|188aa|up_8|NZ_AP019796.1_2063161_2063725_-	pfam00359, PTS_EIIA_2, Phosphoenolpyruvate-dependent sugar phosphotransferase system, EIIA 2	NA|356aa|up_7|NZ_AP019796.1_2063791_2064859_-	COG0564, RluA, Pseudouridylate synthases, 23S RNA-specific [Translation, ribosomal structure and biogenesis]	NA|369aa|up_6|NZ_AP019796.1_2064939_2066046_+	cd05651, M20_ArgE_DapE-like, M20 peptidases with similarity to acetylornithine deacetylases and succinyl-diaminopimelate desuccinylases	NA|256aa|up_5|NZ_AP019796.1_2066129_2066897_-	pfam06439, DUF1080, Domain of Unknown Function (DUF1080)	NA|643aa|up_4|NZ_AP019796.1_2067464_2069393_-	COG0840, Tar, Methyl-accepting chemotaxis protein [Cell motility and secretion / Signal transduction mechanisms]	NA|440aa|up_3|NZ_AP019796.1_2069536_2070856_+	PRK00855, PRK00855, argininosuccinate lyase; Provisional	NA|97aa|up_2|NZ_AP019796.1_2070856_2071147_-	pfam08734, GYD, GYD domain	NA|262aa|up_1|NZ_AP019796.1_2071721_2072507_-	pfam01670, Glyco_hydro_12, Glycosyl hydrolase family 12	NA|678aa|up_0|NZ_AP019796.1_2072582_2074616_-	pfam03629, SASA, Carbohydrate esterase, sialic acid-specific acetylesterase	cas2|89aa|down_0|NZ_AP019796.1_2080949_2081216_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|361aa|down_1|NZ_AP019796.1_2081217_2082300_-	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	NA|230aa|down_2|NZ_AP019796.1_2082296_2082986_-	cd05782, DNA_polB_like1_exo, Uncharacterized bacterial subgroup of the DEDDy 3'-5' exonuclease domain of family-B DNA polymerases	csm6|355aa|down_3|NZ_AP019796.1_2083137_2084202_-	cd09742, Csm6_III-A, CRISPR/Cas system-associated protein Csm6	cmr6gr7|361aa|down_4|NZ_AP019796.1_2084212_2085295_-	cd09661, Cmr6_III-B, CRISPR/Cas system-associated RAMP superfamily protein Cmr6	cmr5gr11|141aa|down_5|NZ_AP019796.1_2085392_2085815_-	pfam09701, Cas_Cmr5, CRISPR-associated protein (Cas_Cmr5)	cmr4gr7|323aa|down_6|NZ_AP019796.1_2085811_2086780_-	TIGR02580, putative_CRISPR-associated_protein, CRISPR type III-B/RAMP module RAMP protein Cmr4	cmr3gr5|376aa|down_7|NZ_AP019796.1_2086791_2087919_-	cd09748, Cmr3_III-B, CRISPR/Cas system-associated RAMP superfamily protein Cmr3	cas10|956aa|down_8|NZ_AP019796.1_2087915_2090783_-	cd09679, Cas10_III, CRISPR/Cas system-associated protein Cas10	cmr1gr7|316aa|down_9|NZ_AP019796.1_2090776_2091724_-	cd09657, Cmr1_III-B, CRISPR/Cas system-associated RAMP superfamily protein Cmr1
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	12	2276178-2277152	12,12,9	PILER-CR,CRISPRCasFinder,CRT	no		csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Orphan	ATTTCAATACCAAAAAGGTGCGATTAAAAC,ATTTCAATACCAAAAAGGTGCGATTAAAAC,ATTTCAATACCAAAAAGGTGCGATTAAAAC	30,30,30	0	0	NA	NA	I-A,II-B,III-A:I-A,II-B,III-A:I-A,II-B,III-A	14,14,14	14	Orphan	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|55aa|up_5|NZ_AP019796.1_2271144_2271309_+,NA	NA|509aa|up_9|NZ_AP019796.1_2266467_2267994_-	TIGR03521, gliding_motility_protein_GldG, gliding-associated putative ABC transporter substrate-binding component GldG	NA|236aa|up_8|NZ_AP019796.1_2267997_2268705_-	TIGR03518, ABC_transporter_permease_protein, gliding motility-associated ABC transporter permease protein GldF	NA|309aa|up_7|NZ_AP019796.1_2268718_2269645_-	TIGR03522, GldA_ABC_ATP, gliding motility-associated ABC transporter ATP-binding subunit GldA	NA|392aa|up_6|NZ_AP019796.1_2269820_2270996_-	COG1373, COG1373, Predicted ATPase (AAA+ superfamily) [General function prediction only]	NA|55aa|up_5|NZ_AP019796.1_2271144_2271309_+	NA	NA|342aa|up_4|NZ_AP019796.1_2271299_2272325_+	pfam04966, OprB, Carbohydrate-selective porin, OprB family	NA|123aa|up_3|NZ_AP019796.1_2272321_2272690_-	pfam18480, DUF5615, Domain of unknown function (DUF5615)	NA|85aa|up_2|NZ_AP019796.1_2272686_2272941_-	pfam04255, DUF433, Protein of unknown function (DUF433)	NA|445aa|up_1|NZ_AP019796.1_2272966_2274301_-	pfam01204, Trehalase, Trehalase	NA|556aa|up_0|NZ_AP019796.1_2274435_2276103_+	PLN02791, PLN02791, Nudix hydrolase homolog	NA|219aa|down_0|NZ_AP019796.1_2277657_2278314_+	pfam00440, TetR_N, Bacterial regulatory proteins, tetR family	NA|322aa|down_1|NZ_AP019796.1_2278326_2279292_+	PRK03598, PRK03598, putative efflux pump membrane fusion protein; Provisional	NA|316aa|down_2|NZ_AP019796.1_2279295_2280243_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|445aa|down_3|NZ_AP019796.1_2280263_2281598_+	COG1538, TolC, Outer membrane protein [Cell envelope biogenesis, outer membrane / Intracellular trafficking and secretion]	NA|313aa|down_4|NZ_AP019796.1_2281594_2282533_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|382aa|down_5|NZ_AP019796.1_2282540_2283686_+	pfam12698, ABC2_membrane_3, ABC-2 family transporter protein	NA|365aa|down_6|NZ_AP019796.1_2283692_2284787_+	COG0842, COG0842, ABC-type multidrug transport system, permease component [Defense mechanisms]	NA|270aa|down_7|NZ_AP019796.1_2284801_2285611_-	cd07177, terB_like, tellurium resistance terB-like protein	NA|930aa|down_8|NZ_AP019796.1_2285752_2288542_-	COG1042, COG1042, Acyl-CoA synthetase (NDP forming) [Energy production and conversion]	NA|459aa|down_9|NZ_AP019796.1_2288642_2290019_-	cd05803, PGM_like4, This PGM-like (phosphoglucomutase-like) domain is located C-terminal to a mannose-1-phosphate guanyltransferase domain in a protein of unknown function that is found in both prokaryotes and eukaryotes
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	13	3047818-3047914	13	CRISPRCasFinder	no	csa3	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Type I-A	CGCTACAACGCGCCATGAAGACGATCGAACT	31	0	0	NA	NA	NA	1	1	Orphan	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|163aa|up_8|NZ_AP019796.1_3035529_3036018_+,NA|122aa|down_1|NZ_AP019796.1_3052927_3053293_+,NA|120aa|down_8|NZ_AP019796.1_3065579_3065939_+	NA|109aa|up_9|NZ_AP019796.1_3035065_3035392_+	COG2608, CopZ, Copper chaperone [Inorganic ion transport and metabolism]	NA|163aa|up_8|NZ_AP019796.1_3035529_3036018_+	NA	NA|428aa|up_7|NZ_AP019796.1_3036114_3037398_+	COG1538, TolC, Outer membrane protein [Cell envelope biogenesis, outer membrane / Intracellular trafficking and secretion]	NA|574aa|up_6|NZ_AP019796.1_3037401_3039123_+	pfam16576, HlyD_D23, Barrel-sandwich domain of CusB or HlyD membrane-fusion	NA|1055aa|up_5|NZ_AP019796.1_3039138_3042303_+	COG3696, COG3696, Putative silver efflux pump [Inorganic ion transport and metabolism]	NA|251aa|up_4|NZ_AP019796.1_3043914_3044667_+	pfam03413, PepSY, Peptidase propeptide and YPEB domain	NA|137aa|up_3|NZ_AP019796.1_3044659_3045070_-	cd18683, PIN_VapC-like, Uncharacterized subfamily of the VapC (virulence-associated protein C)-like family of the PIN domain superfamily	NA|87aa|up_2|NZ_AP019796.1_3045085_3045346_-	smart00966, SpoVT_AbrB, SpoVT / AbrB like domain	NA|410aa|up_1|NZ_AP019796.1_3045412_3046642_-	cd17325, MFS_MdtG_SLC18_like, bacterial MdtG-like and eukaryotic solute carrier 18 (SLC18) family of the Major Facilitator Superfamily of transporters	NA|238aa|up_0|NZ_AP019796.1_3046657_3047371_-	cd19366, TenA_C_BhTenA-like, TenA_C proteins similar to Bacillus halodurans TenA	NA|881aa|down_0|NZ_AP019796.1_3050086_3052729_+	TIGR03346, chaperone_ClpB, ATP-dependent chaperone ClpB	NA|122aa|down_1|NZ_AP019796.1_3052927_3053293_+	NA	NA|392aa|down_2|NZ_AP019796.1_3053329_3054505_-	TIGR00937, Chromate_transport_protein, chromate transporter, chromate ion transporter (CHR) family	NA|426aa|down_3|NZ_AP019796.1_3054588_3055866_-	COG0412, COG0412, Dienelactone hydrolase and related enzymes [Secondary metabolites biosynthesis, transport, and catabolism]	NA|747aa|down_4|NZ_AP019796.1_3055838_3058079_-	pfam16153, DUF4861, Domain of unknown function (DUF4861)	NA|394aa|down_5|NZ_AP019796.1_3058181_3059363_-	pfam07470, Glyco_hydro_88, Glycosyl Hydrolase Family 88	NA|577aa|down_6|NZ_AP019796.1_3059465_3061196_-	pfam13860, FlgD_ig, FlgD Ig-like domain	NA|1005aa|down_7|NZ_AP019796.1_3062078_3065093_-	TIGR01782, TonB-dependent_receptor, TonB-dependent receptor	NA|120aa|down_8|NZ_AP019796.1_3065579_3065939_+	NA	NA|211aa|down_9|NZ_AP019796.1_3065919_3066552_+	cd02503, MobA, MobA catalyzes the formation of molybdopterin guanine dinucleotide
GCF_009936255.1_ASM993625v1	NZ_AP019796	Rhodothermus marinus strain AA2-13	14	3377903-3378049	13	PILER-CR	no	cas3,WYL	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	Unclear	ATGTTTCACGTGAAACGCTGC	21	0	0	NA	NA	NA	3	3	Unclear	csa3,DEDDh,cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,Cas14u_CAS-V,c2c9_V-U4,cas14j,WYL,cas6,cas8b1,cas4,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,csx1,csx20,csm6,cmr6gr7,cmr5gr11,cmr4gr7,cmr3gr5,cmr1gr7,cas3HD,DinG	NA|163aa|up_8|NZ_AP019796.1_3366998_3367487_+,NA|302aa|up_6|NZ_AP019796.1_3369045_3369951_+,NA	NA|368aa|up_9|NZ_AP019796.1_3365898_3367002_+	cd03799, GT4_AmsK-like, Erwinia amylovora AmsK and similar proteins	NA|163aa|up_8|NZ_AP019796.1_3366998_3367487_+	NA	NA|522aa|up_7|NZ_AP019796.1_3367483_3369049_+	smart00752, HTTM, Horizontally Transferred TransMembrane Domain	NA|302aa|up_6|NZ_AP019796.1_3369045_3369951_+	NA	NA|278aa|up_5|NZ_AP019796.1_3369932_3370766_-	cd00761, Glyco_tranf_GTA_type, Glycosyltransferase family A (GT-A) includes diverse families of glycosyl transferases with a common GT-A type structural fold	NA|141aa|up_4|NZ_AP019796.1_3370914_3371337_+	cd03449, R_hydratase, (R)-hydratase [(R)-specific enoyl-CoA hydratase] catalyzes the hydration of trans-2-enoyl CoA to (R)-3-hydroxyacyl-CoA as part of the PHA (polyhydroxyalkanoate) biosynthetic pathway	NA|494aa|up_3|NZ_AP019796.1_3371344_3372826_-	cd07333, M48C_bepA_like, Peptidase M48C Ste24p bepA-like, integral membrane protein	NA|388aa|up_2|NZ_AP019796.1_3372857_3374021_-	PRK00064, recF, recombination protein F; Reviewed	NA|894aa|up_1|NZ_AP019796.1_3374310_3376992_+	pfam12770, CHAT, CHAT domain	NA|311aa|up_0|NZ_AP019796.1_3376969_3377902_+	PRK05441, murQ, N-acetylmuramic acid-6-phosphate etherase; Reviewed	cas3|1113aa|down_0|NZ_AP019796.1_3378128_3381467_+	COG1197, Mfd, Transcription-repair coupling factor (superfamily II helicase) [DNA replication, recombination, and repair / Transcription]	WYL|337aa|down_1|NZ_AP019796.1_3381439_3382450_-	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	NA|240aa|down_2|NZ_AP019796.1_3382489_3383209_-	PRK00107, gidB, 16S rRNA (guanine(527)-N(7))-methyltransferase RsmG	NA|634aa|down_3|NZ_AP019796.1_3383209_3385111_-	PRK05192, PRK05192, tRNA uridine-5-carboxymethylaminomethyl(34) synthesis enzyme MnmG	NA|322aa|down_4|NZ_AP019796.1_3385250_3386216_-	pfam13546, DDE_5, DDE superfamily endonuclease	NA|858aa|down_5|NZ_AP019796.1_3386347_3388921_+	TIGR02956, sensor_protein_TorS, TMAO reductase sytem sensor TorS	NA|786aa|down_6|NZ_AP019796.1_3388922_3391280_+	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional	NA|463aa|down_7|NZ_AP019796.1_3391256_3392645_-	PRK05291, trmE, tRNA uridine-5-carboxymethylaminomethyl(34) synthesis GTPase MnmE	NA|608aa|down_8|NZ_AP019796.1_3392663_3394487_-	PRK01318, PRK01318, membrane protein insertase; Provisional	NA|135aa|down_9|NZ_AP019796.1_3394562_3394967_-	PRK01903, rnpA, ribonuclease P protein component
