assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001542565.1_ASM154256v1	NZ_CP014196	Arthrobacter sp. ATCC 21022, complete genome	1	1517049-1517146	1	CRISPRCasFinder	no		csa3,cas3,DinG,WYL,PD-DExK,DEDDh,RT	Orphan	CCGCGTCCGGGCAACAACCCCTT	23	0	0	NA	NA	NA	1	1	Orphan	csa3,cas3,DinG,WYL,PD-DExK,DEDDh,RT	NA|247aa|up_8|NZ_CP014196.1_1506683_1507424_+,NA|118aa|down_4|NZ_CP014196.1_1522812_1523166_+,NA|155aa|down_5|NZ_CP014196.1_1523167_1523632_+	NA|293aa|up_9|NZ_CP014196.1_1505715_1506594_+	pfam13312, DUF4081, Domain of unknown function (DUF4081)	NA|247aa|up_8|NZ_CP014196.1_1506683_1507424_+	NA	NA|248aa|up_7|NZ_CP014196.1_1507520_1508264_-	TIGR00025, Mtu_efflux, ABC transporter efflux protein, DrrB family	NA|254aa|up_6|NZ_CP014196.1_1508272_1509034_-	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|604aa|up_5|NZ_CP014196.1_1509508_1511320_+	PRK09194, PRK09194, prolyl-tRNA synthetase; Provisional	NA|265aa|up_4|NZ_CP014196.1_1511316_1512111_+	PRK10621, PRK10621, hypothetical protein; Provisional	NA|336aa|up_3|NZ_CP014196.1_1512107_1513115_-	pfam04655, APH_6_hur, Aminoglycoside/hydroxyurea antibiotic resistance kinase	NA|204aa|up_2|NZ_CP014196.1_1514370_1514982_+	PRK00092, PRK00092, ribosome maturation protein RimP; Reviewed	NA|327aa|up_1|NZ_CP014196.1_1514981_1515962_+	PRK12327, nusA, transcription elongation factor NusA; Provisional	NA|118aa|up_0|NZ_CP014196.1_1516092_1516446_+	pfam04296, DUF448, Protein of unknown function (DUF448)	NA|168aa|down_0|NZ_CP014196.1_1519559_1520063_+	PRK00521, rbfA, 30S ribosome-binding factor RbfA	NA|161aa|down_1|NZ_CP014196.1_1520141_1520624_+	cd01285, nucleoside_deaminase, Nucleoside deaminases include adenosine, guanine and cytosine deaminases	NA|388aa|down_2|NZ_CP014196.1_1520655_1521819_-	COG0436, COG0436, Aspartate/tyrosine/aromatic aminotransferase [Amino acid transport and metabolism]	NA|334aa|down_3|NZ_CP014196.1_1521808_1522810_+	PRK03287, truB, tRNA pseudouridine synthase B; Provisional	NA|118aa|down_4|NZ_CP014196.1_1522812_1523166_+	NA	NA|155aa|down_5|NZ_CP014196.1_1523167_1523632_+	NA	NA|328aa|down_6|NZ_CP014196.1_1523715_1524699_+	PRK05627, PRK05627, bifunctional riboflavin kinase/FAD synthetase	NA|90aa|down_7|NZ_CP014196.1_1524855_1525125_+	PRK05626, rpsO, 30S ribosomal protein S15; Reviewed	NA|750aa|down_8|NZ_CP014196.1_1525358_1527608_+	TIGR02696, polyribonucleotide_nucleotidyltransferase, guanosine pentaphosphate synthetase I/polynucleotide phosphorylase	NA|448aa|down_9|NZ_CP014196.1_1527683_1529027_+	COG0612, PqqL, Predicted Zn-dependent peptidases [General function prediction only]
GCF_001542565.1_ASM154256v1	NZ_CP014196	Arthrobacter sp. ATCC 21022, complete genome	2	2315389-2315530	2	CRISPRCasFinder	no		csa3,cas3,DinG,WYL,PD-DExK,DEDDh,RT	Orphan	GTGACAGAGGAACCCCCGAAACCCGACGGGACATGACAGAGGAAC	45	0	0	NA	NA	NA	1	1	Orphan	csa3,cas3,DinG,WYL,PD-DExK,DEDDh,RT	NA,NA	NA|272aa|up_9|NZ_CP014196.1_2303630_2304446_+	PRK00042, tpiA, triosephosphate isomerase; Provisional	NA|86aa|up_8|NZ_CP014196.1_2304482_2304740_+	PRK06870, secG, preprotein translocase subunit SecG; Reviewed	NA|132aa|up_7|NZ_CP014196.1_2304849_2305245_+	pfam13397, RbpA, RNA polymerase-binding protein	NA|273aa|up_6|NZ_CP014196.1_2305197_2306016_-	pfam01182, Glucosamine_iso, Glucosamine-6-phosphate isomerases/6-phosphogluconolactonase	NA|314aa|up_5|NZ_CP014196.1_2306005_2306947_-	pfam10128, OpcA_G6PD_assem, Glucose-6-phosphate dehydrogenase subunit	NA|519aa|up_4|NZ_CP014196.1_2306943_2308500_-	PRK05722, PRK05722, glucose-6-phosphate 1-dehydrogenase; Validated	NA|544aa|up_3|NZ_CP014196.1_2308515_2310147_-	PRK09533, PRK09533, bifunctional transaldolase/phosoglucose isomerase; Validated	NA|373aa|up_2|NZ_CP014196.1_2310153_2311272_-	PRK03343, PRK03343, transaldolase; Validated	NA|706aa|up_1|NZ_CP014196.1_2311303_2313421_-	COG0021, TktA, Transketolase [Carbohydrate transport and metabolism]	NA|321aa|up_0|NZ_CP014196.1_2313862_2314825_+	PRK04375, PRK04375, protoheme IX farnesyltransferase; Provisional	NA|315aa|down_0|NZ_CP014196.1_2315554_2316499_-	COG1612, CtaA, Uncharacterized protein required for cytochrome oxidase assembly [Posttranslational modification, protein turnover, chaperones]	NA|255aa|down_1|NZ_CP014196.1_2316521_2317286_-	TIGR00025, Mtu_efflux, ABC transporter efflux protein, DrrB family	NA|320aa|down_2|NZ_CP014196.1_2317282_2318242_-	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|274aa|down_3|NZ_CP014196.1_2318352_2319174_+	COG2345, COG2345, Predicted transcriptional regulator [Transcription]	NA|492aa|down_4|NZ_CP014196.1_2319173_2320649_+	TIGR01980, UPF0051_protein_slr0074, FeS assembly protein SufB	NA|435aa|down_5|NZ_CP014196.1_2320651_2321956_+	pfam01458, UPF0051, Uncharacterized protein family (UPF0051)	NA|119aa|down_6|NZ_CP014196.1_2322009_2322366_+	cd03528, Rieske_RO_ferredoxin, Rieske non-heme iron oxygenase (RO) family, Rieske ferredoxin component; composed of the Rieske ferredoxin component of some three-component RO systems including biphenyl dioxygenase (BPDO) and carbazole 1,9a-dioxygenase (CARDO)	NA|262aa|down_7|NZ_CP014196.1_2322411_2323197_+	COG0396, sufC, Cysteine desulfurase activator ATPase [Posttranslational modification, protein turnover, chaperones]	NA|111aa|down_8|NZ_CP014196.1_2323210_2323543_+	COG2151, PaaD, Predicted metal-sulfur cluster biosynthetic enzyme [General function prediction only]	NA|300aa|down_9|NZ_CP014196.1_2323621_2324521_-	COG2321, COG2321, Predicted metalloprotease [General function prediction only]
GCF_001542565.1_ASM154256v1	NZ_CP014196	Arthrobacter sp. ATCC 21022, complete genome	3	2864815-2864894	3	CRISPRCasFinder	no	WYL	csa3,cas3,DinG,WYL,PD-DExK,DEDDh,RT	Unclear	GCCGGGACACTCTAGTCCGGCGGGA	25	0	0	NA	NA	NA	1	1	Orphan	csa3,cas3,DinG,WYL,PD-DExK,DEDDh,RT	NA|101aa|up_8|NZ_CP014196.1_2853216_2853519_+,NA	NA|339aa|up_9|NZ_CP014196.1_2852122_2853139_+	cd09597, M4_TLP, Peptidase M4 family including thermolysin, protealysin, aureolysin, and neutral protease	NA|101aa|up_8|NZ_CP014196.1_2853216_2853519_+	NA	NA|323aa|up_7|NZ_CP014196.1_2853556_2854525_-	PRK09393, ftrA, transcriptional activator FtrA; Provisional	WYL|331aa|up_6|NZ_CP014196.1_2854942_2855935_+	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	NA|1328aa|up_5|NZ_CP014196.1_2855948_2859932_+	PRK11131, PRK11131, ATP-dependent RNA helicase HrpA; Provisional	NA|143aa|up_4|NZ_CP014196.1_2859941_2860370_-	COG0537, Hit, Diadenosine tetraphosphate (Ap4A) hydrolase and other HIT family hydrolases [Nucleotide transport and metabolism / Carbohydrate transport and metabolism / General function prediction only]	NA|385aa|up_3|NZ_CP014196.1_2860366_2861521_-	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)	NA|298aa|up_2|NZ_CP014196.1_2861517_2862411_-	COG2897, SseA, Rhodanese-related sulfurtransferase [Inorganic ion transport and metabolism]	NA|361aa|up_1|NZ_CP014196.1_2862518_2863601_+	COG0031, CysK, Cysteine synthase [Amino acid transport and metabolism]	NA|224aa|up_0|NZ_CP014196.1_2863597_2864269_-	COG2220, COG2220, Predicted Zn-dependent hydrolases of the beta-lactamase fold [General function prediction only]	NA|297aa|down_0|NZ_CP014196.1_2864902_2865793_-	COG1108, ZnuB, ABC-type Mn2+/Zn2+ transport systems, permease components [Inorganic ion transport and metabolism]	NA|268aa|down_1|NZ_CP014196.1_2865792_2866596_-	COG1121, ZnuC, ABC-type Mn/Zn transport systems, ATPase component [Inorganic ion transport and metabolism]	NA|333aa|down_2|NZ_CP014196.1_2866721_2867720_-	cd01020, TroA_b, Metal binding protein TroA_b	NA|358aa|down_3|NZ_CP014196.1_2867810_2868884_-	COG1253, TlyC, Hemolysins and related proteins containing CBS domains [General function prediction only]	NA|451aa|down_4|NZ_CP014196.1_2868880_2870233_-	COG1253, TlyC, Hemolysins and related proteins containing CBS domains [General function prediction only]	NA|1267aa|down_5|NZ_CP014196.1_2870711_2874512_+	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|210aa|down_6|NZ_CP014196.1_2874617_2875247_+	cd01835, SGNH_hydrolase_like_3, SGNH_hydrolase subfamily	NA|283aa|down_7|NZ_CP014196.1_2875344_2876193_+	pfam13349, DUF4097, Putative adhesin	NA|209aa|down_8|NZ_CP014196.1_2876192_2876819_+	COG1695, COG1695, Predicted transcriptional regulators [Transcription]	NA|87aa|down_9|NZ_CP014196.1_2877088_2877349_-	TIGR03988, antisig_RsrA, mycothiol system anti-sigma-R factor
GCF_001542565.1_ASM154256v1	NZ_CP014196	Arthrobacter sp. ATCC 21022, complete genome	4	3704777-3704889	4	CRISPRCasFinder	no		csa3,cas3,DinG,WYL,PD-DExK,DEDDh,RT	Orphan	GCACAGCCAATCGATCCGCAGCAGCC	26	0	0	NA	NA	NA	1	1	Orphan	csa3,cas3,DinG,WYL,PD-DExK,DEDDh,RT	NA|116aa|up_6|NZ_CP014196.1_3698234_3698582_+,NA	NA|277aa|up_9|NZ_CP014196.1_3696308_3697139_+	cd03392, PAP2_like_2, PAP2_like_2 proteins	NA|170aa|up_8|NZ_CP014196.1_3697297_3697807_+	TIGR03180, UraD_2, OHCU decarboxylase	NA|114aa|up_7|NZ_CP014196.1_3697803_3698145_+	TIGR02962, Probable_5-hydroxyisourate_hydrolase_R09H10	NA|116aa|up_6|NZ_CP014196.1_3698234_3698582_+	NA	NA|548aa|up_5|NZ_CP014196.1_3698738_3700382_+	PRK07847, PRK07847, amidophosphoribosyltransferase; Provisional	NA|385aa|up_4|NZ_CP014196.1_3700378_3701533_+	PRK05385, PRK05385, phosphoribosylaminoimidazole synthetase; Provisional	NA|261aa|up_3|NZ_CP014196.1_3701656_3702439_-	cd07247, SgaA_N_like, N-terminal domain of Streptomyces griseus SgaA and similar domains	NA|247aa|up_2|NZ_CP014196.1_3702435_3703176_-	cd07247, SgaA_N_like, N-terminal domain of Streptomyces griseus SgaA and similar domains	NA|156aa|up_1|NZ_CP014196.1_3703423_3703891_+	pfam14325, DUF4383, Domain of unknown function (DUF4383)	NA|75aa|up_0|NZ_CP014196.1_3704171_3704396_-	pfam11273, DUF3073, Protein of unknown function (DUF3073)	NA|891aa|down_0|NZ_CP014196.1_3705525_3708198_-	TIGR03346, chaperone_ClpB, ATP-dependent chaperone ClpB	NA|206aa|down_1|NZ_CP014196.1_3708522_3709140_+	TIGR04025, hypothetical_protein, PPOX class probable FMN-dependent enzyme, DR_2398 family	NA|357aa|down_2|NZ_CP014196.1_3709143_3710214_-	COG3842, PotA, ABC-type spermidine/putrescine transport systems, ATPase components [Amino acid transport and metabolism]	NA|279aa|down_3|NZ_CP014196.1_3710210_3711047_-	TIGR01581, Molybdenum_transport_system_permease_protein_modB	NA|260aa|down_4|NZ_CP014196.1_3711074_3711854_-	cd13538, PBP2_ModA_like_1, Substrate binding domain of putative molybdate-binding protein;the type 2 periplasmic binding protein fold	NA|137aa|down_5|NZ_CP014196.1_3711850_3712261_-	cd04762, HTH_MerR-trunc, Helix-Turn-Helix DNA binding domain of truncated MerR-like proteins	NA|445aa|down_6|NZ_CP014196.1_3712552_3713887_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|295aa|down_7|NZ_CP014196.1_3714039_3714924_+	COG4339, COG4339, Uncharacterized protein conserved in bacteria [Function unknown]	NA|576aa|down_8|NZ_CP014196.1_3714934_3716662_+	cd15482, Sialidase_non-viral, Non-viral sialidases	NA|134aa|down_9|NZ_CP014196.1_3716682_3717084_-	PRK11770, PRK11770, YccF domain-containing protein
GCF_001542565.1_ASM154256v1	NZ_CP014196	Arthrobacter sp. ATCC 21022, complete genome	5	3794252-3794341	5	CRISPRCasFinder	no		csa3,cas3,DinG,WYL,PD-DExK,DEDDh,RT	Orphan	ACGAGCACCCGGAAAGCGCACAACAGG	27	0	0	NA	NA	NA	1	1	Orphan	csa3,cas3,DinG,WYL,PD-DExK,DEDDh,RT	NA|172aa|up_4|NZ_CP014196.1_3788766_3789282_-,NA|221aa|up_2|NZ_CP014196.1_3791228_3791891_+,NA|252aa|down_0|NZ_CP014196.1_3794863_3795619_+,NA|113aa|down_2|NZ_CP014196.1_3797149_3797488_+,NA|153aa|down_6|NZ_CP014196.1_3801149_3801608_+	NA|238aa|up_9|NZ_CP014196.1_3783287_3784001_-	pfam13305, WHG, WHG domain	NA|310aa|up_8|NZ_CP014196.1_3784133_3785063_+	cd05229, SDR_a3, atypical (a) SDRs, subgroup 3	NA|268aa|up_7|NZ_CP014196.1_3785123_3785927_+	COG1414, IclR, Transcriptional regulator [Transcription]	NA|260aa|up_6|NZ_CP014196.1_3786081_3786861_-	cd01015, CSHase, N-carbamoylsarcosine amidohydrolase (CSHase) hydrolyzes N-carbamoylsarcosine to sarcosine, carbon dioxide and ammonia	NA|460aa|up_5|NZ_CP014196.1_3787170_3788550_+	cd17369, MFS_ShiA_like, Shikimate transporter and similar proteins of the Major Facilitator Superfamily	NA|172aa|up_4|NZ_CP014196.1_3788766_3789282_-	NA	NA|527aa|up_3|NZ_CP014196.1_3789468_3791049_+	COG3540, PhoD, Phosphodiesterase/alkaline phosphatase D [Inorganic ion transport and metabolism]	NA|221aa|up_2|NZ_CP014196.1_3791228_3791891_+	NA	NA|445aa|up_1|NZ_CP014196.1_3791926_3793261_+	COG3497, COG3497, Phage tail sheath protein FI [General function prediction only]	NA|160aa|up_0|NZ_CP014196.1_3793262_3793742_+	pfam06841, Phage_T4_gp19, T4-like virus tail tube protein gp19	NA|252aa|down_0|NZ_CP014196.1_3794863_3795619_+	NA	NA|507aa|down_1|NZ_CP014196.1_3795615_3797136_+	PHA02561, D, tail protein; Provisional	NA|113aa|down_2|NZ_CP014196.1_3797149_3797488_+	NA	NA|145aa|down_3|NZ_CP014196.1_3797513_3797948_+	pfam04965, GPW_gp25, Gene 25-like lysozyme	NA|869aa|down_4|NZ_CP014196.1_3797944_3800551_+	TIGR02243, hypothetical_protein_SCD8A	NA|188aa|down_5|NZ_CP014196.1_3800537_3801101_+	TIGR02242, putative_secreted_protein, phage tail protein domain	NA|153aa|down_6|NZ_CP014196.1_3801149_3801608_+	NA	NA|312aa|down_7|NZ_CP014196.1_3801653_3802589_+	sd00037, PASTA, PASTA domain	NA|409aa|down_8|NZ_CP014196.1_3802632_3803859_+	PRK09265, PRK09265, aminotransferase AlaT; Validated	NA|346aa|down_9|NZ_CP014196.1_3803939_3804977_-	cd08260, Zn_ADH6, Alcohol dehydrogenases of the MDR family
