assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_002222595.2_ASM222259v2	NZ_CP022413	Blautia hansenii DSM 20583 chromosome, complete genome	1	996449-996775	1	CRT	no		cas3,DEDDh,csa3,RT,DinG,cas14j,c2c9_V-U4,PD-DExK,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6	Orphan	TGGGGAGCAATGTGCACCGGCTGGGTA	27	3	5	996476-996508|996536-996568|996536-996568|996536-996568|996656-996688	NZ_CP022413.2_996416-996448|NZ_CP022413.2_2596881-2596849|NZ_CP022413.2_2596581-2596549|NZ_CP022413.2_2596701-2596669|NZ_CP022413.2_996416-996448	NA	5	5	Orphan	cas3,DEDDh,csa3,RT,DinG,cas14j,c2c9_V-U4,PD-DExK,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6	NA,NA|98aa|down_1|NZ_CP022413.2_998792_999086_+	NA|42aa|up_9|NZ_CP022413.2_980399_980525_+	pfam09339, HTH_IclR, IclR helix-turn-helix domain	NA|141aa|up_8|NZ_CP022413.2_980521_980944_+	pfam02028, BCCT, BCCT, betaine/carnitine/choline family transporter	NA|214aa|up_7|NZ_CP022413.2_981031_981673_+	TIGR01367, Orotate_phosphoribosyltransferase, orotate phosphoribosyltransferase, Thermus family	NA|456aa|up_6|NZ_CP022413.2_981806_983174_-	COG5263, COG5263, FOG: Glucan-binding domain (YG repeat) [General function prediction only]	NA|383aa|up_5|NZ_CP022413.2_983378_984527_+	pfam13785, DUF4178, Domain of unknown function (DUF4178)	NA|142aa|up_4|NZ_CP022413.2_984551_984977_+	pfam03994, DUF350, Domain of Unknown Function (DUF350)	NA|509aa|up_3|NZ_CP022413.2_984976_986503_+	PRK03612, PRK03612, polyamine aminopropyltransferase	NA|973aa|up_2|NZ_CP022413.2_986594_989513_+	COG1026, COG1026, Predicted Zn-dependent peptidases, insulinase-like [General function prediction only]	NA|302aa|up_1|NZ_CP022413.2_989524_990430_+	PRK00089, era, GTPase Era; Reviewed	NA|248aa|up_0|NZ_CP022413.2_990429_991173_+	PRK00085, recO, DNA repair protein RecO; Reviewed	NA|465aa|down_0|NZ_CP022413.2_996995_998390_+	PRK04173, PRK04173, glycyl-tRNA synthetase; Provisional	NA|98aa|down_1|NZ_CP022413.2_998792_999086_+	NA	NA|89aa|down_2|NZ_CP022413.2_999063_999330_+	cd01948, EAL, EAL domain	NA|428aa|down_3|NZ_CP022413.2_999349_1000633_+	pfam09587, PGA_cap, Bacterial capsule synthesis protein PGA_cap	NA|416aa|down_4|NZ_CP022413.2_1000773_1002021_+	PRK14072, PRK14072, diphosphate--fructose-6-phosphate 1-phosphotransferase	NA|308aa|down_5|NZ_CP022413.2_1002170_1003094_+	cd04181, NTP_transferase, NTP_transferases catalyze the transfer of nucleotides onto phosphosugars	NA|449aa|down_6|NZ_CP022413.2_1003179_1004526_+	cd05802, GlmM, GlmM is a bacterial phosphoglucosamine mutase (PNGM) that belongs to the alpha-D-phosphohexomutase superfamily	NA|333aa|down_7|NZ_CP022413.2_1004580_1005579_+	sd00006, TPR, Tetratricopeptide repeat	NA|368aa|down_8|NZ_CP022413.2_1005621_1006725_+	pfam11258, DUF3048, Protein of unknown function (DUF3048) N-terminal domain	NA|298aa|down_9|NZ_CP022413.2_1006862_1007756_+	TIGR00762, DegV, EDD domain protein, DegV family
GCF_002222595.2_ASM222259v2	NZ_CP022413	Blautia hansenii DSM 20583 chromosome, complete genome	2	1172933-1173030	1	CRISPRCasFinder	no		cas3,DEDDh,csa3,RT,DinG,cas14j,c2c9_V-U4,PD-DExK,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6	Orphan	AACCGACCAAACAACCGTTTTAA	23	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,csa3,RT,DinG,cas14j,c2c9_V-U4,PD-DExK,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6	NA,NA	NA|705aa|up_9|NZ_CP022413.2_1160809_1162924_+	cd07731, ComA-like_MBL-fold, Competence protein ComA, ComEC and related proteins; MBL-fold metallo hydrolase domain	NA|279aa|up_8|NZ_CP022413.2_1163032_1163869_-	COG0613, COG0613, Predicted metal-dependent phosphoesterases (PHP family) [General function prediction only]	NA|182aa|up_7|NZ_CP022413.2_1164246_1164792_+	cd03392, PAP2_like_2, PAP2_like_2 proteins	NA|641aa|up_6|NZ_CP022413.2_1164835_1166758_+	PRK05644, gyrB, DNA gyrase subunit B; Validated	NA|749aa|up_5|NZ_CP022413.2_1166768_1169015_+	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|389aa|up_4|NZ_CP022413.2_1169035_1170202_+	COG5279, CYK3, Uncharacterized protein involved in cytokinesis, contains TGc (transglutaminase/protease-like) domain [Cell division and chromosome partitioning]	NA|155aa|up_3|NZ_CP022413.2_1170335_1170800_+	PRK00092, PRK00092, ribosome maturation protein RimP; Reviewed	NA|385aa|up_2|NZ_CP022413.2_1170820_1171975_+	PRK12327, nusA, transcription elongation factor NusA; Provisional	NA|93aa|up_1|NZ_CP022413.2_1171984_1172263_+	pfam04296, DUF448, Protein of unknown function (DUF448)	NA|105aa|up_0|NZ_CP022413.2_1172249_1172564_+	PRK07714, PRK07714, YlxQ family RNA-binding protein	NA|129aa|down_0|NZ_CP022413.2_1175370_1175757_+	PRK00521, rbfA, 30S ribosome-binding factor RbfA	NA|321aa|down_1|NZ_CP022413.2_1175737_1176700_+	COG0618, COG0618, Exopolyphosphatase-related proteins [General function prediction only]	NA|299aa|down_2|NZ_CP022413.2_1176702_1177599_+	PRK00130, truB, tRNA pseudouridine synthase B; Provisional	NA|317aa|down_3|NZ_CP022413.2_1177614_1178565_+	PRK05627, PRK05627, bifunctional riboflavin kinase/FAD synthetase	NA|545aa|down_4|NZ_CP022413.2_1178609_1180244_+	COG1283, NptA, Na+/phosphate symporter [Inorganic ion transport and metabolism]	NA|255aa|down_5|NZ_CP022413.2_1180340_1181105_+	COG0791, Spr, Cell wall-associated hydrolases (invasion-associated proteins) [Cell envelope biogenesis, outer membrane]	NA|89aa|down_6|NZ_CP022413.2_1181233_1181500_+	PRK05626, rpsO, 30S ribosomal protein S15; Reviewed	NA|698aa|down_7|NZ_CP022413.2_1181693_1183787_+	PRK11824, PRK11824, polynucleotide phosphorylase/polyadenylase; Provisional	NA|179aa|down_8|NZ_CP022413.2_1183822_1184359_+	pfam13353, Fer4_12, 4Fe-4S single cluster domain	NA|172aa|down_9|NZ_CP022413.2_1184367_1184883_+	COG0756, Dut, dUTPase [Nucleotide transport and metabolism]
GCF_002222595.2_ASM222259v2	NZ_CP022413	Blautia hansenii DSM 20583 chromosome, complete genome	3	1920180-1920343	2	CRISPRCasFinder	no	RT,cas14j,c2c9_V-U4	cas3,DEDDh,csa3,RT,DinG,cas14j,c2c9_V-U4,PD-DExK,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6	Unclear	GATGCATTTTATATATATAAGTGGATTGAAATC	33	0	0	NA	NA	NA	2	2	TypeV	cas3,DEDDh,csa3,RT,DinG,cas14j,c2c9_V-U4,PD-DExK,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6	NA|91aa|up_7|NZ_CP022413.2_1916394_1916667_+,NA|95aa|up_6|NZ_CP022413.2_1916653_1916938_+,NA|108aa|up_4|NZ_CP022413.2_1917625_1917949_+,NA|116aa|up_3|NZ_CP022413.2_1917968_1918316_+,NA|52aa|up_2|NZ_CP022413.2_1918331_1918487_+,NA|67aa|down_1|NZ_CP022413.2_1921535_1921736_+,NA|188aa|down_2|NZ_CP022413.2_1921756_1922320_+,NA|65aa|down_4|NZ_CP022413.2_1923031_1923226_+,NA|227aa|down_5|NZ_CP022413.2_1923232_1923913_+,NA|247aa|down_7|NZ_CP022413.2_1925467_1926208_+,NA|224aa|down_8|NZ_CP022413.2_1926195_1926867_+,NA|56aa|down_9|NZ_CP022413.2_1926921_1927089_+	NA|47aa|up_9|NZ_CP022413.2_1914210_1914351_-	pfam10139, Virul_Fac, Putative bacterial virulence factor	NA|397aa|up_8|NZ_CP022413.2_1914993_1916184_+	pfam00004, AAA, ATPase family associated with various cellular activities (AAA)	NA|91aa|up_7|NZ_CP022413.2_1916394_1916667_+	NA	NA|95aa|up_6|NZ_CP022413.2_1916653_1916938_+	NA	NA|229aa|up_5|NZ_CP022413.2_1916937_1917624_+	cd00844, MPP_Dbr1_N, Dbr1 RNA lariat debranching enzyme, N-terminal metallophosphatase domain	NA|108aa|up_4|NZ_CP022413.2_1917625_1917949_+	NA	NA|116aa|up_3|NZ_CP022413.2_1917968_1918316_+	NA	NA|52aa|up_2|NZ_CP022413.2_1918331_1918487_+	NA	cas14j|374aa|up_1|NZ_CP022413.2_1918509_1919631_+	pfam01385, OrfB_IS605, Probable transposase	c2c9_V-U4|99aa|up_0|NZ_CP022413.2_1919602_1919899_+	pfam07282, OrfB_Zn_ribbon, Putative transposase DNA-binding domain	NA|151aa|down_0|NZ_CP022413.2_1920945_1921398_+	pfam09424, YqeY, Yqey-like protein	NA|67aa|down_1|NZ_CP022413.2_1921535_1921736_+	NA	NA|188aa|down_2|NZ_CP022413.2_1921756_1922320_+	NA	NA|241aa|down_3|NZ_CP022413.2_1922309_1923032_+	pfam18346, SH3_15, Mind bomb SH3 repeat domain	NA|65aa|down_4|NZ_CP022413.2_1923031_1923226_+	NA	NA|227aa|down_5|NZ_CP022413.2_1923232_1923913_+	NA	NA|413aa|down_6|NZ_CP022413.2_1923896_1925135_+	smart00487, DEXDc, DEAD-like helicases superfamily	NA|247aa|down_7|NZ_CP022413.2_1925467_1926208_+	NA	NA|224aa|down_8|NZ_CP022413.2_1926195_1926867_+	NA	NA|56aa|down_9|NZ_CP022413.2_1926921_1927089_+	NA
GCF_002222595.2_ASM222259v2	NZ_CP022413	Blautia hansenii DSM 20583 chromosome, complete genome	4	1920674-1920906	1,2,3	PILER-CR,CRT,CRISPRCasFinder	no	RT,cas14j,c2c9_V-U4	cas3,DEDDh,csa3,RT,DinG,cas14j,c2c9_V-U4,PD-DExK,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6	Unclear	TCTGATGCATTTTATATATATAAGTGGATTGAAATC,TGATGCATTTTATATATATAAGTGGATTGAAATC,GATGCATTTTATATATATAAGTGGATTGAAATC	36,34,33	0	0	NA	NA	NA:NA:NA	2,3,3	3	TypeV	cas3,DEDDh,csa3,RT,DinG,cas14j,c2c9_V-U4,PD-DExK,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6	NA|91aa|up_7|NZ_CP022413.2_1916394_1916667_+,NA|95aa|up_6|NZ_CP022413.2_1916653_1916938_+,NA|108aa|up_4|NZ_CP022413.2_1917625_1917949_+,NA|116aa|up_3|NZ_CP022413.2_1917968_1918316_+,NA|52aa|up_2|NZ_CP022413.2_1918331_1918487_+,NA|67aa|down_1|NZ_CP022413.2_1921535_1921736_+,NA|188aa|down_2|NZ_CP022413.2_1921756_1922320_+,NA|65aa|down_4|NZ_CP022413.2_1923031_1923226_+,NA|227aa|down_5|NZ_CP022413.2_1923232_1923913_+,NA|247aa|down_7|NZ_CP022413.2_1925467_1926208_+,NA|224aa|down_8|NZ_CP022413.2_1926195_1926867_+,NA|56aa|down_9|NZ_CP022413.2_1926921_1927089_+	NA|47aa|up_9|NZ_CP022413.2_1914210_1914351_-	pfam10139, Virul_Fac, Putative bacterial virulence factor	NA|397aa|up_8|NZ_CP022413.2_1914993_1916184_+	pfam00004, AAA, ATPase family associated with various cellular activities (AAA)	NA|91aa|up_7|NZ_CP022413.2_1916394_1916667_+	NA	NA|95aa|up_6|NZ_CP022413.2_1916653_1916938_+	NA	NA|229aa|up_5|NZ_CP022413.2_1916937_1917624_+	cd00844, MPP_Dbr1_N, Dbr1 RNA lariat debranching enzyme, N-terminal metallophosphatase domain	NA|108aa|up_4|NZ_CP022413.2_1917625_1917949_+	NA	NA|116aa|up_3|NZ_CP022413.2_1917968_1918316_+	NA	NA|52aa|up_2|NZ_CP022413.2_1918331_1918487_+	NA	cas14j|374aa|up_1|NZ_CP022413.2_1918509_1919631_+	pfam01385, OrfB_IS605, Probable transposase	c2c9_V-U4|99aa|up_0|NZ_CP022413.2_1919602_1919899_+	pfam07282, OrfB_Zn_ribbon, Putative transposase DNA-binding domain	NA|151aa|down_0|NZ_CP022413.2_1920945_1921398_+	pfam09424, YqeY, Yqey-like protein	NA|67aa|down_1|NZ_CP022413.2_1921535_1921736_+	NA	NA|188aa|down_2|NZ_CP022413.2_1921756_1922320_+	NA	NA|241aa|down_3|NZ_CP022413.2_1922309_1923032_+	pfam18346, SH3_15, Mind bomb SH3 repeat domain	NA|65aa|down_4|NZ_CP022413.2_1923031_1923226_+	NA	NA|227aa|down_5|NZ_CP022413.2_1923232_1923913_+	NA	NA|413aa|down_6|NZ_CP022413.2_1923896_1925135_+	smart00487, DEXDc, DEAD-like helicases superfamily	NA|247aa|down_7|NZ_CP022413.2_1925467_1926208_+	NA	NA|224aa|down_8|NZ_CP022413.2_1926195_1926867_+	NA	NA|56aa|down_9|NZ_CP022413.2_1926921_1927089_+	NA
GCF_002222595.2_ASM222259v2	NZ_CP022413	Blautia hansenii DSM 20583 chromosome, complete genome	5	2644919-2647259	3,2,4	CRT,PILER-CR,CRISPRCasFinder	no	cas2,cas1,cas4,cas3,cas5,cas7,cas8b2,cas6	cas3,DEDDh,csa3,RT,DinG,cas14j,c2c9_V-U4,PD-DExK,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6	Unclear	ATTTACATTCCAATATGTTTCTATTAATAC,ATTTACATTCCAATATGTTTCTATTAATAC,ATTTACATTCCAATATGTTTCTATTAATAC	30,30,30	0	0	NA	NA	NA:NA:NA	35,34,34	35	Unclear	cas3,DEDDh,csa3,RT,DinG,cas14j,c2c9_V-U4,PD-DExK,cas2,cas1,cas4,cas5,cas7,cas8b2,cas6	NA|302aa|up_4|NZ_CP022413.2_2637475_2638381_-,NA|475aa|up_2|NZ_CP022413.2_2639371_2640796_-,NA|122aa|up_1|NZ_CP022413.2_2641243_2641609_+,NA	NA|429aa|up_9|NZ_CP022413.2_2632397_2633684_-	pfam06824, Glyco_hydro_125, Metal-independent alpha-mannosidase (GH125)	NA|120aa|up_8|NZ_CP022413.2_2633705_2634065_-	PRK11770, PRK11770, YccF domain-containing protein	NA|249aa|up_7|NZ_CP022413.2_2634210_2634957_+	PRK05557, fabG, 3-ketoacyl-(acyl-carrier-protein) reductase; Validated	NA|295aa|up_6|NZ_CP022413.2_2634981_2635866_-	COG0583, LysR, Transcriptional regulator [Transcription]	NA|477aa|up_5|NZ_CP022413.2_2635995_2637426_+	cd06450, DOPA_deC_like, DOPA decarboxylase family	NA|302aa|up_4|NZ_CP022413.2_2637475_2638381_-	NA	NA|280aa|up_3|NZ_CP022413.2_2638377_2639217_-	pfam13676, TIR_2, TIR domain	NA|475aa|up_2|NZ_CP022413.2_2639371_2640796_-	NA	NA|122aa|up_1|NZ_CP022413.2_2641243_2641609_+	NA	NA|121aa|up_0|NZ_CP022413.2_2641598_2641961_+	pfam05717, TnpB_IS66, IS66 Orf2 like protein	cas2|93aa|down_0|NZ_CP022413.2_2647424_2647703_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|331aa|down_1|NZ_CP022413.2_2647704_2648697_-	cd09722, Cas1_I-B, CRISPR/Cas system-associated protein Cas1	cas4|165aa|down_2|NZ_CP022413.2_2648709_2649204_-	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas3|794aa|down_3|NZ_CP022413.2_2649222_2651604_-	TIGR01587, CRISPR-associated_endonuclease/helicase_Cas3, CRISPR-associated helicase Cas3	cas5|242aa|down_4|NZ_CP022413.2_2651649_2652375_-	cd09658, Cas5_I-B, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|292aa|down_5|NZ_CP022413.2_2652358_2653234_-	cd09687, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	cas8b2|561aa|down_6|NZ_CP022413.2_2653236_2654919_-	cd09754, Cas8a1_I-A, CRISPR/Cas system-associated protein Cas8a1	cas6|241aa|down_7|NZ_CP022413.2_2654934_2655657_-	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	NA|550aa|down_8|NZ_CP022413.2_2656820_2658470_-	COG1595, RpoE, DNA-directed RNA polymerase specialized sigma subunit, sigma24 homolog [Transcription]	NA|121aa|down_9|NZ_CP022413.2_2658841_2659204_-	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins
