assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000210515.1_ASM21051v1	NC_017465	Lactobacillus fermentum CECT 5716, complete sequence	1	286320-286408	1	CRISPRCasFinder	no	cas14j	cas14j,DEDDh,cas3,cse2gr11,cas7,cas5,cas6e,cas1,WYL,cas2,csa3,cas4,cas8c	Unclear	GAGCCTCCAGCGGGTGAATGGGATGGTG	28	0	0	NA	NA	NA	1	1	TypeV	cas14j,DEDDh,cas3,cse2gr11,cas7,cas5,cas6e,cas1,WYL,cas2,csa3,cas4,cas8c	NA|171aa|up_5|NC_017465.1_280606_281119_+,NA|135aa|up_4|NC_017465.1_281193_281598_+,NA|71aa|up_0|NC_017465.1_285814_286027_-,NA|170aa|down_0|NC_017465.1_286557_287067_-,NA|112aa|down_1|NC_017465.1_287081_287417_-,NA|117aa|down_2|NC_017465.1_287430_287781_-,NA|50aa|down_5|NC_017465.1_290886_291036_-	NA|183aa|up_9|NC_017465.1_266965_267514_+	COG0634, Hpt, Hypoxanthine-guanine phosphoribosyltransferase [Nucleotide transport and metabolism]	NA|723aa|up_8|NC_017465.1_267597_269766_+	TIGR01241, ATP-dependent_zinc_metalloprotease_FtsH, ATP-dependent metalloprotease FtsH	NA|294aa|up_7|NC_017465.1_269847_270729_+	PRK00114, hslO, Hsp33 family molecular chaperone HslO	NA|498aa|up_6|NC_017465.1_271835_273329_+	PRK00484, lysS, lysyl-tRNA synthetase; Reviewed	NA|171aa|up_5|NC_017465.1_280606_281119_+	NA	NA|135aa|up_4|NC_017465.1_281193_281598_+	NA	NA|255aa|up_3|NC_017465.1_282318_283083_+	pfam10479, FSA_C, Fragile site-associated protein C-terminus	NA|110aa|up_2|NC_017465.1_283269_283599_+	pfam13240, zinc_ribbon_2, zinc-ribbon domain	NA|105aa|up_1|NC_017465.1_283610_283925_+	pfam13248, zf-ribbon_3, zinc-ribbon domain	NA|71aa|up_0|NC_017465.1_285814_286027_-	NA	NA|170aa|down_0|NC_017465.1_286557_287067_-	NA	NA|112aa|down_1|NC_017465.1_287081_287417_-	NA	NA|117aa|down_2|NC_017465.1_287430_287781_-	NA	NA|523aa|down_3|NC_017465.1_288098_289667_-	COG3378, COG3378, Phage associated DNA primase [General function prediction only]	NA|275aa|down_4|NC_017465.1_289721_290546_-	cd04859, Prim_Pol, Prim_Pol: Primase-polymerase (primpol) domain of the type found in bifunctional replicases from archaeal plasmids, including ORF904 protein of the crenarchaeal plasmid pRN1 from Sulfolobus islandicus (pRN1 primpol)	NA|50aa|down_5|NC_017465.1_290886_291036_-	NA	NA|89aa|down_6|NC_017465.1_291207_291474_-	pfam12728, HTH_17, Helix-turn-helix domain	NA|61aa|down_7|NC_017465.1_291490_291673_-	pfam12728, HTH_17, Helix-turn-helix domain	NA|371aa|down_8|NC_017465.1_291789_292902_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|368aa|down_9|NC_017465.1_293019_294123_+	cd01189, INT_ICEBs1_C_like, C-terminal catalytic domain of integrases from bacterial phages and conjugate transposons
GCF_000210515.1_ASM21051v1	NC_017465	Lactobacillus fermentum CECT 5716, complete sequence	2	817592-818780	1,2,1	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cse2gr11,cas7,cas5,cas6e,cas1	cas14j,DEDDh,cas3,cse2gr11,cas7,cas5,cas6e,cas1,WYL,cas2,csa3,cas4,cas8c	Type I-E	GTATTCCCCATGTATGTGGGGGTGATCC,GTATTCCCCATGTATGTGGGGGTGATCCT,GTATTCCCCATGTATGTGGGGGTGATCCT	28,29,29	0	0	NA	NA	I-B,III-A,III-B:I-B,III-A,III-B:I-B,III-A,III-B	19,19,19	19	TypeI-E	cas14j,DEDDh,cas3,cse2gr11,cas7,cas5,cas6e,cas1,WYL,cas2,csa3,cas4,cas8c	NA,NA|121aa|down_0|NC_017465.1_823491_823854_+,NA|107aa|down_3|NC_017465.1_825742_826063_-	NA|293aa|up_9|NC_017465.1_800645_801524_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|413aa|up_8|NC_017465.1_802573_803812_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|96aa|up_7|NC_017465.1_803922_804210_+	COG2963, COG2963, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	cas3|908aa|up_6|NC_017465.1_805672_808396_+	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	NA|396aa|up_5|NC_017465.1_808599_809787_+	pfam00872, Transposase_mut, Transposase, Mutator family	cse2gr11|198aa|up_4|NC_017465.1_811464_812058_+	pfam09485, CRISPR_Cse2, CRISPR-associated protein Cse2 (CRISPR_cse2)	cas7|361aa|up_3|NC_017465.1_812084_813167_+	pfam09344, Cas_CT1975, CT1975-like protein	cas5|236aa|up_2|NC_017465.1_813147_813855_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|214aa|up_1|NC_017465.1_813872_814514_+	pfam08798, CRISPR_assoc, CRISPR associated protein	cas1|314aa|up_0|NC_017465.1_814527_815469_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	NA|121aa|down_0|NC_017465.1_823491_823854_+	NA	NA|231aa|down_1|NC_017465.1_824055_824748_+	pfam13518, HTH_28, Helix-turn-helix domain	NA|317aa|down_2|NC_017465.1_824672_825623_+	pfam00665, rve, Integrase core domain	NA|107aa|down_3|NC_017465.1_825742_826063_-	NA	NA|408aa|down_4|NC_017465.1_826191_827415_+	pfam04087, DUF389, Domain of unknown function (DUF389)	NA|445aa|down_5|NC_017465.1_827436_828771_-	TIGR00909, putative_amino_acid_transporter, amino acid transporter	NA|229aa|down_6|NC_017465.1_828863_829550_+	COG3316, COG3316, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|209aa|down_7|NC_017465.1_831310_831937_-	PRK00215, PRK00215, transcriptional repressor LexA	NA|84aa|down_8|NC_017465.1_832092_832344_+	pfam05979, DUF896, Bacterial protein of unknown function (DUF896)	NA|76aa|down_9|NC_017465.1_832420_832648_+	pfam03672, UPF0154, Uncharacterized protein family (UPF0154)
GCF_000210515.1_ASM21051v1	NC_017465	Lactobacillus fermentum CECT 5716, complete sequence	3	820218-821650	2,3,2	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cse2gr11,cas7,cas5,cas6e,cas1	cas14j,DEDDh,cas3,cse2gr11,cas7,cas5,cas6e,cas1,WYL,cas2,csa3,cas4,cas8c	Type I-E	GTATTCCCCATGTATGTGGGGGTGATCC,GTATTCCCCATGTATGTGGGGGTGATCCT,GTATTCCCCATGTATGTGGGGGTGATCCT	28,29,29	0	0	NA	NA	I-B,III-A,III-B:I-B,III-A,III-B:I-B,III-A,III-B	23,23,23	23	TypeI-E	cas14j,DEDDh,cas3,cse2gr11,cas7,cas5,cas6e,cas1,WYL,cas2,csa3,cas4,cas8c	NA,NA|121aa|down_0|NC_017465.1_823491_823854_+,NA|107aa|down_3|NC_017465.1_825742_826063_-	NA|293aa|up_9|NC_017465.1_800645_801524_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|413aa|up_8|NC_017465.1_802573_803812_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|96aa|up_7|NC_017465.1_803922_804210_+	COG2963, COG2963, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	cas3|908aa|up_6|NC_017465.1_805672_808396_+	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	NA|396aa|up_5|NC_017465.1_808599_809787_+	pfam00872, Transposase_mut, Transposase, Mutator family	cse2gr11|198aa|up_4|NC_017465.1_811464_812058_+	pfam09485, CRISPR_Cse2, CRISPR-associated protein Cse2 (CRISPR_cse2)	cas7|361aa|up_3|NC_017465.1_812084_813167_+	pfam09344, Cas_CT1975, CT1975-like protein	cas5|236aa|up_2|NC_017465.1_813147_813855_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|214aa|up_1|NC_017465.1_813872_814514_+	pfam08798, CRISPR_assoc, CRISPR associated protein	cas1|314aa|up_0|NC_017465.1_814527_815469_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	NA|121aa|down_0|NC_017465.1_823491_823854_+	NA	NA|231aa|down_1|NC_017465.1_824055_824748_+	pfam13518, HTH_28, Helix-turn-helix domain	NA|317aa|down_2|NC_017465.1_824672_825623_+	pfam00665, rve, Integrase core domain	NA|107aa|down_3|NC_017465.1_825742_826063_-	NA	NA|408aa|down_4|NC_017465.1_826191_827415_+	pfam04087, DUF389, Domain of unknown function (DUF389)	NA|445aa|down_5|NC_017465.1_827436_828771_-	TIGR00909, putative_amino_acid_transporter, amino acid transporter	NA|229aa|down_6|NC_017465.1_828863_829550_+	COG3316, COG3316, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|209aa|down_7|NC_017465.1_831310_831937_-	PRK00215, PRK00215, transcriptional repressor LexA	NA|84aa|down_8|NC_017465.1_832092_832344_+	pfam05979, DUF896, Bacterial protein of unknown function (DUF896)	NA|76aa|down_9|NC_017465.1_832420_832648_+	pfam03672, UPF0154, Uncharacterized protein family (UPF0154)
GCF_000210515.1_ASM21051v1	NC_017465	Lactobacillus fermentum CECT 5716, complete sequence	4	880947-881067	4	CRISPRCasFinder	no		cas14j,DEDDh,cas3,cse2gr11,cas7,cas5,cas6e,cas1,WYL,cas2,csa3,cas4,cas8c	Orphan	TAGAGACTCTGATTTAGTATAATTAATGAAGTAAATTGGAGGATC	45	1	10	880992-881022|880992-881022|880992-881022|880992-881022|880992-881022|880992-881022|880992-881022|880992-881022|880992-881022|880992-881022	NC_017465.1_801916-801886|NC_017465.1_803842-803872|NC_017465.1_1347690-1347720|NC_017465.1_1393235-1393265|NC_017465.1_1405765-1405735|NC_017465.1_1601916-1601946|NC_017465.1_1616086-1616056|NC_017465.1_1663644-1663674|NC_017465.1_1777680-1777650|NC_017465.1_1616343-1616313	NA	1	1	Orphan	cas14j,DEDDh,cas3,cse2gr11,cas7,cas5,cas6e,cas1,WYL,cas2,csa3,cas4,cas8c	NA|106aa|up_6|NC_017465.1_872032_872350_+,NA|122aa|down_1|NC_017465.1_883109_883475_-	NA|565aa|up_9|NC_017465.1_867766_869461_-	cd11333, AmyAc_SI_OligoGlu_DGase, Alpha amylase catalytic domain found in Sucrose isomerases, oligo-1,6-glucosidase (also called isomaltase; sucrase-isomaltase; alpha-limit dextrinase), dextran glucosidase (also called glucan 1,6-alpha-glucosidase), and related proteins	NA|329aa|up_8|NC_017465.1_869617_870604_+	COG1609, PurR, Transcriptional regulators [Transcription]	NA|200aa|up_7|NC_017465.1_871452_872052_+	PRK03103, PRK03103, DNA polymerase IV; Reviewed	NA|106aa|up_6|NC_017465.1_872032_872350_+	NA	NA|391aa|up_5|NC_017465.1_872502_873675_+	cd08188, PDDH, 1,3-Propanediol (1,3-PD) dehydrogenase	NA|322aa|up_4|NC_017465.1_875325_876291_+	COG1893, ApbA, Ketopantoate reductase [Coenzyme metabolism]	NA|118aa|up_3|NC_017465.1_876636_876990_-	pfam06993, DUF1304, Protein of unknown function (DUF1304)	NA|204aa|up_2|NC_017465.1_877002_877614_-	COG1073, COG1073, Hydrolases of the alpha/beta superfamily [General function prediction only]	NA|443aa|up_1|NC_017465.1_877788_879117_-	PRK02991, PRK02991, D-serine dehydratase; Provisional	NA|467aa|up_0|NC_017465.1_879406_880807_-	COG1113, AnsP, Gamma-aminobutyrate permease and related permeases [Amino acid transport and metabolism]	NA|96aa|down_0|NC_017465.1_881072_881360_+	COG2963, COG2963, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|122aa|down_1|NC_017465.1_883109_883475_-	NA	NA|349aa|down_2|NC_017465.1_883600_884647_+	PRK00082, hrcA, heat-inducible transcription repressor; Provisional	NA|196aa|down_3|NC_017465.1_884657_885245_+	PRK14162, PRK14162, heat shock protein GrpE; Provisional	NA|619aa|down_4|NC_017465.1_885282_887139_+	PRK00290, dnaK, molecular chaperone DnaK; Provisional	NA|56aa|down_5|NC_017465.1_889393_889561_+	PRK02083, PRK02083, imidazole glycerol phosphate synthase subunit HisF; Provisional	NA|189aa|down_6|NC_017465.1_889579_890146_+	PRK02083, PRK02083, imidazole glycerol phosphate synthase subunit HisF; Provisional	NA|280aa|down_7|NC_017465.1_890353_891193_+	PRK08123, PRK08123, histidinol-phosphatase HisJ	NA|205aa|down_8|NC_017465.1_892668_893283_+	PRK01686, hisG, ATP phosphoribosyltransferase catalytic subunit; Reviewed	NA|195aa|down_9|NC_017465.1_894570_895155_+	PRK00951, hisB, imidazoleglycerol-phosphate dehydratase HisB
GCF_000210515.1_ASM21051v1	NC_017465	Lactobacillus fermentum CECT 5716, complete sequence	5	1394541-1394782	3,3,5	CRT,PILER-CR,CRISPRCasFinder	no	cas2,cas1,cas4,cas7,cas8c,cas5,cas3	cas14j,DEDDh,cas3,cse2gr11,cas7,cas5,cas6e,cas1,WYL,cas2,csa3,cas4,cas8c	Type I-C, Type I-U?,Type I-U	ATTTCAATCCACGCACCCCCGCGAAGGAGTGCGAC,ATTTCAATCCACGCACCCCCGCGAAGGAGTGCGAC,ATTTCAATCCACGCACCCCCGCGAAGGAGTGCGACC	35,35,36	0	0	NA	NA	I-C:I-C:I-C	3,2,2	3	TypeI-C,TypeI-U,TypeI-U?	cas14j,DEDDh,cas3,cse2gr11,cas7,cas5,cas6e,cas1,WYL,cas2,csa3,cas4,cas8c	NA,NA	NA|243aa|up_9|NC_017465.1_1369364_1370093_-	COG3935, DnaD, Putative primosome component and related proteins [DNA replication, recombination, and repair]	NA|432aa|up_8|NC_017465.1_1370184_1371480_-	PRK03932, asnC, asparaginyl-tRNA synthetase; Validated	NA|173aa|up_7|NC_017465.1_1371506_1372025_-	COG5353, COG5353, Uncharacterized protein conserved in bacteria [Function unknown]	NA|378aa|up_6|NC_017465.1_1379507_1380641_-	PRK14237, PRK14237, phosphate transporter ATP-binding protein; Provisional	NA|396aa|up_5|NC_017465.1_1380850_1382038_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|269aa|up_4|NC_017465.1_1384137_1384944_+	cd07516, HAD_Pase, phosphatase, similar to Escherichia coli Cof and Thermotoga maritima TM0651; belongs to the haloacid dehalogenase-like superfamily	NA|306aa|up_3|NC_017465.1_1385175_1386093_-	PRK07259, PRK07259, dihydroorotate dehydrogenase	NA|322aa|up_2|NC_017465.1_1391665_1392631_-	PRK00856, pyrB, aspartate carbamoyltransferase catalytic subunit	NA|96aa|up_1|NC_017465.1_1393315_1393603_+	COG2963, COG2963, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|293aa|up_0|NC_017465.1_1393626_1394505_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	cas2|97aa|down_0|NC_017465.1_1394940_1395231_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|344aa|down_1|NC_017465.1_1395240_1396272_-	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas4|219aa|down_2|NC_017465.1_1396268_1396925_-	cd09637, Cas4_I-A_I-B_I-C_I-D_II-B, CRISPR/Cas system-associated protein Cas4	cas7|293aa|down_3|NC_017465.1_1396928_1397807_-	cd09689, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	cas8c|634aa|down_4|NC_017465.1_1397828_1399730_-	pfam09709, Cas_Csd1, CRISPR-associated protein (Cas_Csd1)	cas5|250aa|down_5|NC_017465.1_1399726_1400476_-	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	NA|407aa|down_6|NC_017465.1_1400535_1401756_-	pfam00872, Transposase_mut, Transposase, Mutator family	cas3|825aa|down_7|NC_017465.1_1401786_1404261_-	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	NA|293aa|down_8|NC_017465.1_1404494_1405373_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|96aa|down_9|NC_017465.1_1405396_1405684_-	COG2963, COG2963, Transposase and inactivated derivatives [DNA replication, recombination, and repair]
