assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_002355515.1_ASM235551v1	NZ_AP014809	Methylorubrum populi strain P-1M	1	2740824-2740902	1	CRISPRCasFinder	no		DEDDh,csa3,c2c9_V-U4,WYL,cas3,RT,Cas9_archaeal	Orphan	ACGGCAACAACGTCGTGCTCGGCG	24	0	0	NA	NA	NA	1	1	Orphan	DEDDh,csa3,c2c9_V-U4,WYL,cas3,RT,Cas9_archaeal,c2c4_V-U1	NA|292aa|up_5|NZ_AP014809.1_2699308_2700184_+,NA|89aa|down_9|NZ_AP014809.1_2765105_2765372_+	NA|99aa|up_9|NZ_AP014809.1_2694512_2694809_-	pfam11950, DUF3467, Protein of unknown function (DUF3467)	NA|355aa|up_8|NZ_AP014809.1_2695180_2696245_+	pfam00891, Methyltransf_2, O-methyltransferase	NA|220aa|up_7|NZ_AP014809.1_2696241_2696901_+	PRK08233, PRK08233, hypothetical protein; Provisional	NA|794aa|up_6|NZ_AP014809.1_2696930_2699312_+	pfam04820, Trp_halogenase, Tryptophan halogenase	NA|292aa|up_5|NZ_AP014809.1_2699308_2700184_+	NA	NA|311aa|up_4|NZ_AP014809.1_2700291_2701224_+	COG0535, COG0535, Predicted Fe-S oxidoreductases [General function prediction only]	NA|318aa|up_3|NZ_AP014809.1_2701281_2702235_-	PRK09685, PRK09685, DNA-binding transcriptional activator FeaR; Provisional	NA|267aa|up_2|NZ_AP014809.1_2703154_2703955_+	pfam07277, SapC, SapC	NA|9087aa|up_1|NZ_AP014809.1_2704146_2731407_+	NF012206, LktA_tand_53, tandem repeat-containing filamentous protein	NA|408aa|up_0|NZ_AP014809.1_2731387_2732611_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|272aa|down_0|NZ_AP014809.1_2752090_2752906_+	pfam13640, 2OG-FeII_Oxy_3, 2OG-Fe(II) oxygenase superfamily	NA|264aa|down_1|NZ_AP014809.1_2752910_2753702_+	pfam08241, Methyltransf_11, Methyltransferase domain	NA|460aa|down_2|NZ_AP014809.1_2753893_2755273_+	COG1032, COG1032, Fe-S oxidoreductase [Energy production and conversion]	NA|438aa|down_3|NZ_AP014809.1_2755269_2756583_+	COG1032, COG1032, Fe-S oxidoreductase [Energy production and conversion]	NA|485aa|down_4|NZ_AP014809.1_2756589_2758044_-	COG2132, SufI, Putative multicopper oxidases [Secondary metabolites biosynthesis, transport, and catabolism]	NA|475aa|down_5|NZ_AP014809.1_2758404_2759829_+	PRK01490, tig, trigger factor; Provisional	NA|209aa|down_6|NZ_AP014809.1_2759964_2760591_+	PRK00277, clpP, ATP-dependent Clp protease proteolytic subunit; Reviewed	NA|424aa|down_7|NZ_AP014809.1_2760842_2762114_+	PRK05342, clpX, ATP-dependent Clp protease ATP-binding subunit ClpX	NA|808aa|down_8|NZ_AP014809.1_2762382_2764806_+	COG0466, Lon, ATP-dependent Lon protease, bacterial type [Posttranslational modification, protein turnover, chaperones]	NA|89aa|down_9|NZ_AP014809.1_2765105_2765372_+	NA
GCF_002355515.1_ASM235551v1	NZ_AP014809	Methylorubrum populi strain P-1M	2	2740995-2741096	2	CRISPRCasFinder	no		DEDDh,csa3,c2c9_V-U4,WYL,cas3,RT,Cas9_archaeal	Orphan	ACGGCAACAACGTCGTGCTCGGCG	24	0	0	NA	NA	NA	1	1	Orphan	DEDDh,csa3,c2c9_V-U4,WYL,cas3,RT,Cas9_archaeal,c2c4_V-U1	NA|292aa|up_5|NZ_AP014809.1_2699308_2700184_+,NA|89aa|down_9|NZ_AP014809.1_2765105_2765372_+	NA|99aa|up_9|NZ_AP014809.1_2694512_2694809_-	pfam11950, DUF3467, Protein of unknown function (DUF3467)	NA|355aa|up_8|NZ_AP014809.1_2695180_2696245_+	pfam00891, Methyltransf_2, O-methyltransferase	NA|220aa|up_7|NZ_AP014809.1_2696241_2696901_+	PRK08233, PRK08233, hypothetical protein; Provisional	NA|794aa|up_6|NZ_AP014809.1_2696930_2699312_+	pfam04820, Trp_halogenase, Tryptophan halogenase	NA|292aa|up_5|NZ_AP014809.1_2699308_2700184_+	NA	NA|311aa|up_4|NZ_AP014809.1_2700291_2701224_+	COG0535, COG0535, Predicted Fe-S oxidoreductases [General function prediction only]	NA|318aa|up_3|NZ_AP014809.1_2701281_2702235_-	PRK09685, PRK09685, DNA-binding transcriptional activator FeaR; Provisional	NA|267aa|up_2|NZ_AP014809.1_2703154_2703955_+	pfam07277, SapC, SapC	NA|9087aa|up_1|NZ_AP014809.1_2704146_2731407_+	NF012206, LktA_tand_53, tandem repeat-containing filamentous protein	NA|408aa|up_0|NZ_AP014809.1_2731387_2732611_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|272aa|down_0|NZ_AP014809.1_2752090_2752906_+	pfam13640, 2OG-FeII_Oxy_3, 2OG-Fe(II) oxygenase superfamily	NA|264aa|down_1|NZ_AP014809.1_2752910_2753702_+	pfam08241, Methyltransf_11, Methyltransferase domain	NA|460aa|down_2|NZ_AP014809.1_2753893_2755273_+	COG1032, COG1032, Fe-S oxidoreductase [Energy production and conversion]	NA|438aa|down_3|NZ_AP014809.1_2755269_2756583_+	COG1032, COG1032, Fe-S oxidoreductase [Energy production and conversion]	NA|485aa|down_4|NZ_AP014809.1_2756589_2758044_-	COG2132, SufI, Putative multicopper oxidases [Secondary metabolites biosynthesis, transport, and catabolism]	NA|475aa|down_5|NZ_AP014809.1_2758404_2759829_+	PRK01490, tig, trigger factor; Provisional	NA|209aa|down_6|NZ_AP014809.1_2759964_2760591_+	PRK00277, clpP, ATP-dependent Clp protease proteolytic subunit; Reviewed	NA|424aa|down_7|NZ_AP014809.1_2760842_2762114_+	PRK05342, clpX, ATP-dependent Clp protease ATP-binding subunit ClpX	NA|808aa|down_8|NZ_AP014809.1_2762382_2764806_+	COG0466, Lon, ATP-dependent Lon protease, bacterial type [Posttranslational modification, protein turnover, chaperones]	NA|89aa|down_9|NZ_AP014809.1_2765105_2765372_+	NA
GCF_002355515.1_ASM235551v1	NZ_AP014809	Methylorubrum populi strain P-1M	3	2776560-2776654	3	CRISPRCasFinder	no		DEDDh,csa3,c2c9_V-U4,WYL,cas3,RT,Cas9_archaeal	Orphan	TCGTCGAACCGGTCGAAGAAGTT	23	0	0	NA	NA	NA	1	1	Orphan	DEDDh,csa3,c2c9_V-U4,WYL,cas3,RT,Cas9_archaeal,c2c4_V-U1	NA|193aa|up_9|NZ_AP014809.1_2765368_2765947_+,NA|113aa|up_8|NZ_AP014809.1_2766014_2766353_-,NA|136aa|up_7|NZ_AP014809.1_2766357_2766765_-,NA|87aa|up_6|NZ_AP014809.1_2766764_2767025_-,NA|379aa|up_3|NZ_AP014809.1_2769441_2770578_-,NA|120aa|up_2|NZ_AP014809.1_2771081_2771441_-,NA|129aa|up_1|NZ_AP014809.1_2771450_2771837_-,NA|409aa|up_0|NZ_AP014809.1_2771842_2773069_-,NA|240aa|down_1|NZ_AP014809.1_2778814_2779534_-,NA|474aa|down_2|NZ_AP014809.1_2779662_2781084_-,NA|143aa|down_3|NZ_AP014809.1_2781088_2781517_-,NA|195aa|down_4|NZ_AP014809.1_2781529_2782114_-,NA|135aa|down_6|NZ_AP014809.1_2783561_2783966_-,NA|293aa|down_9|NZ_AP014809.1_2785906_2786785_-	NA|193aa|up_9|NZ_AP014809.1_2765368_2765947_+	NA	NA|113aa|up_8|NZ_AP014809.1_2766014_2766353_-	NA	NA|136aa|up_7|NZ_AP014809.1_2766357_2766765_-	NA	NA|87aa|up_6|NZ_AP014809.1_2766764_2767025_-	NA	NA|291aa|up_5|NZ_AP014809.1_2767027_2767900_-	pfam11860, Muraidase, N-acetylmuramidase	NA|447aa|up_4|NZ_AP014809.1_2768115_2769456_+	pfam04577, DUF563, Protein of unknown function (DUF563)	NA|379aa|up_3|NZ_AP014809.1_2769441_2770578_-	NA	NA|120aa|up_2|NZ_AP014809.1_2771081_2771441_-	NA	NA|129aa|up_1|NZ_AP014809.1_2771450_2771837_-	NA	NA|409aa|up_0|NZ_AP014809.1_2771842_2773069_-	NA	NA|715aa|down_0|NZ_AP014809.1_2776665_2778810_-	pfam18013, Phage_lysozyme2, Phage tail lysozyme	NA|240aa|down_1|NZ_AP014809.1_2778814_2779534_-	NA	NA|474aa|down_2|NZ_AP014809.1_2779662_2781084_-	NA	NA|143aa|down_3|NZ_AP014809.1_2781088_2781517_-	NA	NA|195aa|down_4|NZ_AP014809.1_2781529_2782114_-	NA	NA|481aa|down_5|NZ_AP014809.1_2782115_2783558_-	pfam01391, Collagen, Collagen triple helix repeat (20 copies)	NA|135aa|down_6|NZ_AP014809.1_2783561_2783966_-	NA	NA|177aa|down_7|NZ_AP014809.1_2784015_2784546_-	TIGR04211, hypothetical_protein, SH3 domain protein	NA|412aa|down_8|NZ_AP014809.1_2784643_2785879_-	pfam11651, P22_CoatProtein, P22 coat protein - gene protein 5	NA|293aa|down_9|NZ_AP014809.1_2785906_2786785_-	NA
GCF_002355515.1_ASM235551v1	NZ_AP014809	Methylorubrum populi strain P-1M	4	4482492-4482584	4	CRISPRCasFinder	no		DEDDh,csa3,c2c9_V-U4,WYL,cas3,RT,Cas9_archaeal	Orphan	ACCGTGTCGTAGACCGGCGGCGTC	24	0	0	NA	NA	NA	1	1	Orphan	DEDDh,csa3,c2c9_V-U4,WYL,cas3,RT,Cas9_archaeal,c2c4_V-U1	NA|253aa|up_6|NZ_AP014809.1_4476096_4476855_+,NA|75aa|up_5|NZ_AP014809.1_4476943_4477168_+,NA|81aa|down_5|NZ_AP014809.1_4488520_4488763_-,NA|95aa|down_6|NZ_AP014809.1_4488880_4489165_+,NA|64aa|down_7|NZ_AP014809.1_4489619_4489811_+	NA|234aa|up_9|NZ_AP014809.1_4473430_4474132_-	cd05373, SDR_c10, classical (c) SDR, subgroup  10	NA|148aa|up_8|NZ_AP014809.1_4474239_4474683_-	COG0590, CumB, Cytosine/adenosine deaminases [Nucleotide transport and metabolism / Translation, ribosomal structure and biogenesis]	NA|436aa|up_7|NZ_AP014809.1_4474682_4475990_-	PRK00885, PRK00885, phosphoribosylamine--glycine ligase; Provisional	NA|253aa|up_6|NZ_AP014809.1_4476096_4476855_+	NA	NA|75aa|up_5|NZ_AP014809.1_4476943_4477168_+	NA	NA|523aa|up_4|NZ_AP014809.1_4477336_4478905_+	PRK00286, xseA, exodeoxyribonuclease VII large subunit; Reviewed	NA|76aa|up_3|NZ_AP014809.1_4479055_4479283_+	pfam13773, DUF4170, Domain of unknown function (DUF4170)	NA|315aa|up_2|NZ_AP014809.1_4479436_4480381_+	PRK01259, PRK01259, ribose-phosphate diphosphokinase	NA|155aa|up_1|NZ_AP014809.1_4480507_4480972_-	PRK06342, PRK06342, transcription elongation factor GreA	NA|329aa|up_0|NZ_AP014809.1_4481026_4482013_-	cd08288, MDR_yhdh, Yhdh putative quinone oxidoreductases	NA|113aa|down_0|NZ_AP014809.1_4483237_4483576_+	pfam11953, DUF3470, Domain of unknown function (DUF3470)	NA|197aa|down_1|NZ_AP014809.1_4484078_4484669_+	COG1329, COG1329, Transcriptional regulators, similar to M	NA|291aa|down_2|NZ_AP014809.1_4484952_4485825_+	PRK07500, rpoH2, RNA polymerase factor sigma-32; Reviewed	NA|318aa|down_3|NZ_AP014809.1_4485910_4486864_-	cd08422, PBP2_CrgA_like, The C-terminal substrate binding domain of LysR-type transcriptional regulator CrgA and its related homologs, contains the type 2 periplasmic binding domain	NA|138aa|down_4|NZ_AP014809.1_4488044_4488458_+	cd01184, INT_C_like_1, Uncharacterized site-specific tyrosine recombinase, C-terminal catalytic domain	NA|81aa|down_5|NZ_AP014809.1_4488520_4488763_-	NA	NA|95aa|down_6|NZ_AP014809.1_4488880_4489165_+	NA	NA|64aa|down_7|NZ_AP014809.1_4489619_4489811_+	NA	NA|475aa|down_8|NZ_AP014809.1_4490177_4491602_-	PRK05335, PRK05335, tRNA (uracil-5-)-methyltransferase Gid; Reviewed	NA|717aa|down_9|NZ_AP014809.1_4491739_4493890_-	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)
GCF_002355515.1_ASM235551v1	NZ_AP014809	Methylorubrum populi strain P-1M	5	4904944-4905041	5	CRISPRCasFinder	no		DEDDh,csa3,c2c9_V-U4,WYL,cas3,RT,Cas9_archaeal	Orphan	CGCGGCGGCGGATCGCGGCTCGG	23	0	0	NA	NA	NA	1	1	Orphan	DEDDh,csa3,c2c9_V-U4,WYL,cas3,RT,Cas9_archaeal,c2c4_V-U1	NA|156aa|up_7|NZ_AP014809.1_4897470_4897938_-,NA|135aa|up_4|NZ_AP014809.1_4900729_4901134_+,NA|96aa|down_4|NZ_AP014809.1_4910077_4910365_-,NA|55aa|down_5|NZ_AP014809.1_4910509_4910674_+,NA|356aa|down_7|NZ_AP014809.1_4914597_4915665_+	NA|30aa|up_9|NZ_AP014809.1_4896393_4896483_+	PRK00284, pqqA, pyrroloquinoline quinone precursor peptide PqqA	NA|173aa|up_8|NZ_AP014809.1_4896790_4897309_-	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|156aa|up_7|NZ_AP014809.1_4897470_4897938_-	NA	NA|386aa|up_6|NZ_AP014809.1_4897934_4899092_-	pfam16113, ECH_2, Enoyl-CoA hydratase/isomerase	NA|352aa|up_5|NZ_AP014809.1_4899636_4900692_+	PRK09283, PRK09283, porphobilinogen synthase	NA|135aa|up_4|NZ_AP014809.1_4900729_4901134_+	NA	NA|165aa|up_3|NZ_AP014809.1_4901257_4901752_+	pfam06271, RDD, RDD family	NA|249aa|up_2|NZ_AP014809.1_4901903_4902650_+	PRK01305, PRK01305, arginyl-tRNA-protein transferase; Provisional	NA|188aa|up_1|NZ_AP014809.1_4902685_4903249_-	cd03357, LbH_MAT_GAT, Maltose O-acetyltransferase (MAT) and Galactoside O-acetyltransferase (GAT): MAT and GAT catalyze the CoA-dependent acetylation of the 6-hydroxyl group of their respective sugar substrates	NA|301aa|up_0|NZ_AP014809.1_4903273_4904176_-	COG2321, COG2321, Predicted metalloprotease [General function prediction only]	NA|558aa|down_0|NZ_AP014809.1_4905429_4907103_+	COG0644, FixC, Dehydrogenases (flavoproteins) [Energy production and conversion]	NA|335aa|down_1|NZ_AP014809.1_4907207_4908212_-	cd02252, nylC_like, nylC-like family; composed of proteins with similarity to Flavobacterium endo-type 6-aminohexanoate-oligomer hydrolase (EIII), the product of the nylon oligomer degradation gene, nylC	NA|254aa|down_2|NZ_AP014809.1_4908338_4909100_-	pfam05257, CHAP, CHAP domain	NA|285aa|down_3|NZ_AP014809.1_4909165_4910020_-	COG2962, RarD, Predicted permeases [General function prediction only]	NA|96aa|down_4|NZ_AP014809.1_4910077_4910365_-	NA	NA|55aa|down_5|NZ_AP014809.1_4910509_4910674_+	NA	NA|398aa|down_6|NZ_AP014809.1_4910745_4911939_+	PRK05967, PRK05967, cystathionine beta-lyase; Provisional	NA|356aa|down_7|NZ_AP014809.1_4914597_4915665_+	NA	NA|199aa|down_8|NZ_AP014809.1_4915906_4916503_-	TIGR04026, hypothetical_protein, PPOX class probable FMN-dependent enzyme, alr4036 family	NA|1087aa|down_9|NZ_AP014809.1_4916938_4920199_+	PRK13557, PRK13557, histidine kinase; Provisional
