assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000166415.1_ASM16641v1	NC_014654	Halanaerobium hydrogeniformans, complete sequence	1	9304-9387	1	CRISPRCasFinder	no		csa3,cas14k,RT,WYL,cas4,cas3,DinG,DEDDh,cas6,cas2,cas1,cas5,cas7,cas8b1	Orphan	TTGTTCTATTAAAGAAGATCAGTG	24	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14k,RT,WYL,cas4,cas3,DinG,DEDDh,cas6,cas2,cas1,cas5,cas7,cas8b1	NA,NA|292aa|down_0|NC_014654.1_15338_16214_+	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|474aa|up_6|NC_014654.1_76_1498_+	TIGR00362, DnaA, chromosomal replication initiator protein DnaA	NA|372aa|up_5|NC_014654.1_1759_2875_+	PRK05643, PRK05643, DNA polymerase III subunit beta; Validated	NA|73aa|up_4|NC_014654.1_2888_3107_+	pfam13275, S4_2, S4 domain	NA|374aa|up_3|NC_014654.1_3110_4232_+	PRK00064, recF, recombination protein F; Reviewed	NA|87aa|up_2|NC_014654.1_4240_4501_+	pfam04025, DUF370, Domain of unknown function (DUF370)	NA|641aa|up_1|NC_014654.1_4500_6423_+	PRK05644, gyrB, DNA gyrase subunit B; Validated	NA|833aa|up_0|NC_014654.1_6455_8954_+	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|292aa|down_0|NC_014654.1_15338_16214_+	NA	NA|499aa|down_1|NC_014654.1_16341_17838_+	PRK00047, glpK, glycerol kinase GlpK	NA|493aa|down_2|NC_014654.1_17976_19455_+	COG0579, COG0579, Predicted dehydrogenase [General function prediction only]	NA|427aa|down_3|NC_014654.1_19447_20728_+	pfam07992, Pyr_redox_2, Pyridine nucleotide-disulphide oxidoreductase	NA|126aa|down_4|NC_014654.1_20728_21106_+	pfam07892, DUF1667, Protein of unknown function (DUF1667)	NA|174aa|down_5|NC_014654.1_21109_21631_+	cd03134, GATase1_PfpI_like, A type 1 glutamine amidotransferase (GATase1)-like domain found in PfpI from Pyrococcus furiosus	NA|331aa|down_6|NC_014654.1_21922_22915_+	PRK14481, PRK14481, dihydroxyacetone kinase subunit DhaK; Provisional	NA|210aa|down_7|NC_014654.1_22950_23580_+	TIGR02365, dha_L_ycgS, dihydroxyacetone kinase, phosphoprotein-dependent, L subunit	NA|131aa|down_8|NC_014654.1_23607_24000_+	TIGR02364, dha_pts, dihydroxyacetone kinase, phosphotransfer subunit	NA|254aa|down_9|NC_014654.1_24166_24928_+	COG1349, GlpR, Transcriptional regulators of sugar metabolism [Transcription / Carbohydrate transport and metabolism]
GCF_000166415.1_ASM16641v1	NC_014654	Halanaerobium hydrogeniformans, complete sequence	2	594431-594556	2	CRISPRCasFinder	no		csa3,cas14k,RT,WYL,cas4,cas3,DinG,DEDDh,cas6,cas2,cas1,cas5,cas7,cas8b1	Orphan	ATGGGACAATCGAGAATATCTCTATAAAAGATGTAGATATAA	42	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14k,RT,WYL,cas4,cas3,DinG,DEDDh,cas6,cas2,cas1,cas5,cas7,cas8b1	NA|193aa|up_9|NC_014654.1_579060_579639_+,NA	NA|193aa|up_9|NC_014654.1_579060_579639_+	NA	NA|354aa|up_8|NC_014654.1_579823_580885_+	COG3947, COG3947, Response regulator containing CheY-like receiver and SARP domains [Signal transduction mechanisms]	NA|617aa|up_7|NC_014654.1_581077_582928_+	PRK00558, uvrC, excinuclease ABC subunit UvrC	NA|396aa|up_6|NC_014654.1_582946_584134_+	TIGR01292, Thioredoxin_reductase, thioredoxin-disulfide reductase	NA|331aa|up_5|NC_014654.1_584330_585323_+	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|534aa|up_4|NC_014654.1_585426_587028_+	PRK05270, PRK05270, UDP-glucose--hexose-1-phosphate uridylyltransferase	NA|229aa|up_3|NC_014654.1_587051_587738_+	COG1802, GntR, Transcriptional regulators [Transcription]	NA|615aa|up_2|NC_014654.1_587784_589629_+	COG2206, COG2206, c-di-GMP phosphodiesterase class II (HD-GYP domain) [Signal transduction mechanisms]	NA|319aa|up_1|NC_014654.1_589707_590664_-	COG2206, COG2206, c-di-GMP phosphodiesterase class II (HD-GYP domain) [Signal transduction mechanisms]	NA|402aa|up_0|NC_014654.1_590828_592034_-	pfam08447, PAS_3, PAS fold	NA|62aa|down_0|NC_014654.1_597538_597724_-	pfam18765, Polbeta, Polymerase beta, Nucleotidyltransferase	NA|383aa|down_1|NC_014654.1_597889_599038_+	pfam02595, Gly_kinase, Glycerate kinase family	NA|1531aa|down_2|NC_014654.1_599236_603829_+	PRK11750, gltB, glutamate synthase subunit alpha; Provisional	NA|489aa|down_3|NC_014654.1_603850_605317_+	PRK12810, gltD, glutamate synthase subunit beta; Reviewed	NA|245aa|down_4|NC_014654.1_605497_606232_+	cd13624, PBP2_Arg_Lys_His, Substrate binding domain of the arginine-, lysine-, histidine-binding protein ArtJ; the type 2 periplasmic binding protein fold	NA|230aa|down_5|NC_014654.1_606395_607085_+	COG0765, HisM, ABC-type amino acid transport system, permease component [Amino acid transport and metabolism]	NA|253aa|down_6|NC_014654.1_607074_607833_+	COG1126, GlnQ, ABC-type polar amino acid transport system, ATPase component [Amino acid transport and metabolism]	NA|221aa|down_7|NC_014654.1_607832_608495_+	COG0765, HisM, ABC-type amino acid transport system, permease component [Amino acid transport and metabolism]	NA|506aa|down_8|NC_014654.1_608775_610293_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|429aa|down_9|NC_014654.1_610540_611827_+	cd06174, MFS, Major Facilitator Superfamily
GCF_000166415.1_ASM16641v1	NC_014654	Halanaerobium hydrogeniformans, complete sequence	3	1520849-1520931	3	CRISPRCasFinder	no		csa3,cas14k,RT,WYL,cas4,cas3,DinG,DEDDh,cas6,cas2,cas1,cas5,cas7,cas8b1	Orphan	CCTTCGCGCTATATCTTCATTTTA	24	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14k,RT,WYL,cas4,cas3,DinG,DEDDh,cas6,cas2,cas1,cas5,cas7,cas8b1	NA|70aa|up_9|NC_014654.1_1511397_1511607_-,NA	NA|70aa|up_9|NC_014654.1_1511397_1511607_-	NA	NA|186aa|up_8|NC_014654.1_1511610_1512168_-	PRK00083, frr, ribosome recycling factor; Reviewed	NA|240aa|up_7|NC_014654.1_1512186_1512906_-	PRK00358, pyrH, uridylate kinase; Provisional	NA|300aa|up_6|NC_014654.1_1513022_1513922_-	PRK09377, tsf, elongation factor Ts; Provisional	NA|253aa|up_5|NC_014654.1_1514028_1514787_-	PRK05299, rpsB, 30S ribosomal protein S2; Provisional	NA|261aa|up_4|NC_014654.1_1515033_1515816_-	PRK04158, PRK04158, GTP-sensing pleiotropic transcriptional regulator CodY	NA|458aa|up_3|NC_014654.1_1515847_1517221_-	PRK05201, hslU, ATP-dependent protease ATPase subunit HslU	NA|188aa|up_2|NC_014654.1_1517213_1517777_-	PRK05456, PRK05456, ATP-dependent protease subunit HslV	NA|692aa|up_1|NC_014654.1_1517999_1520075_-	PRK05582, PRK05582, type I DNA topoisomerase	NA|160aa|up_0|NC_014654.1_1520104_1520584_-	pfam04361, DUF494, Protein of unknown function (DUF494)	NA|382aa|down_0|NC_014654.1_1521004_1522150_-	pfam02481, DNA_processg_A, DNA recombination-mediator protein A	NA|497aa|down_1|NC_014654.1_1522282_1523773_+	COG0168, TrkG, Trk-type K+ transport systems, membrane components [Inorganic ion transport and metabolism]	NA|224aa|down_2|NC_014654.1_1523796_1524468_+	PRK09496, trkA, Trk system potassium transporter TrkA	NA|253aa|down_3|NC_014654.1_1524530_1525289_-	pfam04402, SIMPL, Protein of unknown function (DUF541)	NA|133aa|down_4|NC_014654.1_1525437_1525836_-	pfam02472, ExbD, Biopolymer transport protein ExbD/TolR	NA|206aa|down_5|NC_014654.1_1525837_1526455_-	pfam01618, MotA_ExbB, MotA/TolQ/ExbB proton channel family	NA|363aa|down_6|NC_014654.1_1526469_1527558_-	pfam03544, TonB_C, Gram-negative bacterial TonB protein C-terminal	NA|595aa|down_7|NC_014654.1_1527583_1529368_-	cd01347, ligand_gated_channel, TonB dependent/Ligand-Gated channels are created by a monomeric 22 strand (22,24) anti-parallel beta-barrel	NA|122aa|down_8|NC_014654.1_1529922_1530288_+	PRK12497, PRK12497, YraN family protein	NA|513aa|down_9|NC_014654.1_1530306_1531845_+	COG0606, COG0606, Predicted ATPase with chaperone activity [Posttranslational modification, protein turnover, chaperones]
GCF_000166415.1_ASM16641v1	NC_014654	Halanaerobium hydrogeniformans, complete sequence	4	1666592-1670122	1,4,1	PILER-CR,CRISPRCasFinder,CRT	no	cas6,cas4,cas2,cas1,cas3,cas5,cas7,cas8b1,WYL	csa3,cas14k,RT,WYL,cas4,cas3,DinG,DEDDh,cas6,cas2,cas1,cas5,cas7,cas8b1	Type I-B	GTTTCAATCCTTATTTTAATGGATTAGTCATTGGAGC,GTTTCAATCCTTATTTTAATGGATTAGTCATTGGAGC,GTTTCAATCCTTATTTTAATGGATTAGTCATTGGAGC	37,37,37	0	0	NA	NA	I-B:I-B:I-B	48,48,48	48	TypeI-B	csa3,cas14k,RT,WYL,cas4,cas3,DinG,DEDDh,cas6,cas2,cas1,cas5,cas7,cas8b1	NA|378aa|up_0|NC_014654.1_1665305_1666439_+,NA	NA|241aa|up_9|NC_014654.1_1649411_1650134_-	COG1285, SapB, Uncharacterized membrane protein [Function unknown]	NA|277aa|up_8|NC_014654.1_1650550_1651381_-	NF033188, internalin_H, InlH/InlC2 family class 1 internalin	NA|393aa|up_7|NC_014654.1_1651401_1652580_-	pfam07907, YibE_F, YibE/F-like protein	NA|531aa|up_6|NC_014654.1_1654400_1655993_-	cd16012, ALP, Alkaline Phosphatase	NA|357aa|up_5|NC_014654.1_1656628_1657699_-	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|423aa|up_4|NC_014654.1_1658138_1659406_+	pfam00665, rve, Integrase core domain	NA|277aa|up_3|NC_014654.1_1659677_1660508_-	NF033189, internalin_A, class 1 internalin InlA	NA|393aa|up_2|NC_014654.1_1660528_1661707_-	pfam07907, YibE_F, YibE/F-like protein	NA|528aa|up_1|NC_014654.1_1661837_1663421_-	cd16012, ALP, Alkaline Phosphatase	NA|378aa|up_0|NC_014654.1_1665305_1666439_+	NA	cas6|230aa|down_0|NC_014654.1_1670380_1671070_-	pfam17262, DUF5328, Family of unknown function (DUF5328)	cas4|197aa|down_1|NC_014654.1_1671084_1671675_-	cd09637, Cas4_I-A_I-B_I-C_I-D_II-B, CRISPR/Cas system-associated protein Cas4	cas2|97aa|down_2|NC_014654.1_1671691_1671982_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|327aa|down_3|NC_014654.1_1671981_1672962_-	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	cas3|820aa|down_4|NC_014654.1_1672986_1675446_-	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	cas5|240aa|down_5|NC_014654.1_1675464_1676184_-	TIGR02592, hypothetical_protein_CTC_01466, CRISPR-associated protein Cas5, subtype I-B/HMARI	cas7|305aa|down_6|NC_014654.1_1676250_1677165_-	TIGR02590, hypothetical_protein_MM_0563, CRISPR-associated protein Cas7/Csh2, subtype I-B/HMARI	cas8b1|610aa|down_7|NC_014654.1_1677167_1678997_-	pfam09484, Cas_TM1802, CRISPR-associated protein TM1802 (cas_TM1802)	WYL|322aa|down_8|NC_014654.1_1679256_1680222_-	pfam13280, WYL, WYL domain	NA|882aa|down_9|NC_014654.1_1680736_1683382_-	cd02080, P-type_ATPase_cation, P-type cation-transporting ATPase similar to Exiguobacterium aurantiacum Mna, an Na(+)-ATPase, and Synechocystis sp
GCF_000166415.1_ASM16641v1	NC_014654	Halanaerobium hydrogeniformans, complete sequence	5	2151542-2151626	5	CRISPRCasFinder	no		csa3,cas14k,RT,WYL,cas4,cas3,DinG,DEDDh,cas6,cas2,cas1,cas5,cas7,cas8b1	Orphan	CACTGAATCTTCTTTAATAGAACAA	25	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14k,RT,WYL,cas4,cas3,DinG,DEDDh,cas6,cas2,cas1,cas5,cas7,cas8b1	NA,NA	NA|264aa|up_9|NC_014654.1_2135038_2135830_-	pfam09021, HutP, HutP	NA|178aa|up_8|NC_014654.1_2135816_2136350_-	pfam02542, YgbB, YgbB family	NA|230aa|up_7|NC_014654.1_2136350_2137040_-	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|362aa|up_6|NC_014654.1_2137056_2138142_-	COG4956, COG4956, Integral membrane protein (PIN domain superfamily) [General function prediction only]	NA|167aa|up_5|NC_014654.1_2138175_2138676_-	COG1329, COG1329, Transcriptional regulators, similar to M	NA|360aa|up_4|NC_014654.1_2138793_2139873_-	PRK13482, PRK13482, DNA integrity scanning protein DisA; Provisional	NA|818aa|up_3|NC_014654.1_2141429_2143883_-	COG0542, clpA, ATP-binding subunits of Clp protease and DnaK/DnaJ chaperones [Posttranslational modification, protein turnover, chaperones]	NA|343aa|up_2|NC_014654.1_2143902_2144931_-	PRK01059, PRK01059, ATP:guanido phosphotransferase; Provisional	NA|182aa|up_1|NC_014654.1_2144911_2145457_-	COG3880, COG3880, Modulator of heat shock repressor CtsR, McsA [Signal transduction    mechanisms]	NA|156aa|up_0|NC_014654.1_2145460_2145928_-	COG4463, CtsR, Transcriptional repressor of class III stress genes [Transcription]	NA|134aa|down_0|NC_014654.1_2152041_2152443_-	pfam01894, UPF0047, Uncharacterized protein family UPF0047	NA|492aa|down_1|NC_014654.1_2152527_2154003_-	PRK00484, lysS, lysyl-tRNA synthetase; Reviewed	NA|161aa|down_2|NC_014654.1_2154099_2154582_-	PRK00226, greA, transcription elongation factor GreA; Reviewed	NA|326aa|down_3|NC_014654.1_2154741_2155719_-	TIGR00737, Probable_tRNA-dihydrouridine_synthase, putative TIM-barrel protein, nifR3 family	NA|258aa|down_4|NC_014654.1_2155726_2156500_-	PRK13318, PRK13318, type III pantothenate kinase	NA|314aa|down_5|NC_014654.1_2156513_2157455_-	cd04730, NPD_like, 2-Nitropropane dioxygenase (NPD), one of the nitroalkane oxidizing enzyme families, catalyzes oxidative denitrification of nitroalkanes to their corresponding carbonyl compounds and nitrites	NA|324aa|down_6|NC_014654.1_2157585_2158557_-	cd06354, PBP1_PrnA-like, periplasmic binding domain of basic membrane lipoprotein, PnrA, in Treponema pallidum and its homologs from other bacteria and Archaea	NA|285aa|down_7|NC_014654.1_2158584_2159439_-	COG0340, BirA, Biotin-(acetyl-CoA carboxylase) ligase [Coenzyme metabolism]	NA|210aa|down_8|NC_014654.1_2159511_2160141_-	TIGR04518, conserved_hypothetical_protein, ECF transporter S component, folate family	NA|557aa|down_9|NC_014654.1_2160273_2161944_-	pfam01268, FTHFS, Formate--tetrahydrofolate ligase
