assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001484605.1_ASM148460v1	NZ_CP013747	Pseudarthrobacter sulfonivorans strain Ar51 chromosome, complete genome	1	744977-745078	1	CRISPRCasFinder	no		RT,csa3,DinG,cas3,DEDDh,PD-DExK,WYL	Orphan	GCGAACGGGTTGTTACCCGGACGGGGA	27	0	0	NA	NA	NA	1	1	Orphan	RT,csa3,DinG,cas3,DEDDh,PD-DExK,WYL	NA|118aa|up_5|NZ_CP013747.1_737443_737797_-,NA	NA|416aa|up_9|NZ_CP013747.1_733620_734868_-	COG3844, COG3844, Kynureninase [Amino acid transport and metabolism]	NA|285aa|up_8|NZ_CP013747.1_734876_735731_-	TIGR03036, trp_2_3_diox, tryptophan 2,3-dioxygenase	NA|328aa|up_7|NZ_CP013747.1_735771_736755_-	PRK05627, PRK05627, bifunctional riboflavin kinase/FAD synthetase	NA|151aa|up_6|NZ_CP013747.1_736971_737424_-	TIGR01478, Plasmodium_falciparum, variant surface antigen, stevor family	NA|118aa|up_5|NZ_CP013747.1_737443_737797_-	NA	NA|328aa|up_4|NZ_CP013747.1_737799_738783_-	PRK03287, truB, tRNA pseudouridine synthase B; Provisional	NA|391aa|up_3|NZ_CP013747.1_738870_740043_+	COG0436, COG0436, Aspartate/tyrosine/aromatic aminotransferase [Amino acid transport and metabolism]	NA|162aa|up_2|NZ_CP013747.1_740058_740544_-	cd01285, nucleoside_deaminase, Nucleoside deaminases include adenosine, guanine and cytosine deaminases	NA|366aa|up_1|NZ_CP013747.1_740725_741823_+	NF033206, ScyE_fam, ScyD/ScyE family protein	NA|170aa|up_0|NZ_CP013747.1_741897_742407_-	PRK00521, rbfA, 30S ribosome-binding factor RbfA	NA|126aa|down_0|NZ_CP013747.1_745721_746099_-	pfam04296, DUF448, Protein of unknown function (DUF448)	NA|327aa|down_1|NZ_CP013747.1_746268_747249_-	PRK12327, nusA, transcription elongation factor NusA; Provisional	NA|205aa|down_2|NZ_CP013747.1_747248_747863_-	PRK00092, PRK00092, ribosome maturation protein RimP; Reviewed	NA|383aa|down_3|NZ_CP013747.1_747969_749118_+	pfam14530, DUF4439, Domain of unknown function (DUF4439)	NA|243aa|down_4|NZ_CP013747.1_749169_749898_+	cd02432, Nodulin-21_like_1, Nodulin-21 and CCC1-related protein family	NA|344aa|down_5|NZ_CP013747.1_749894_750926_+	pfam04655, APH_6_hur, Aminoglycoside/hydroxyurea antibiotic resistance kinase	NA|265aa|down_6|NZ_CP013747.1_752475_753270_-	PRK10621, PRK10621, hypothetical protein; Provisional	NA|603aa|down_7|NZ_CP013747.1_753279_755088_-	PRK09194, PRK09194, prolyl-tRNA synthetase; Provisional	NA|263aa|down_8|NZ_CP013747.1_755498_756287_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|248aa|down_9|NZ_CP013747.1_756295_757039_+	TIGR00025, Mtu_efflux, ABC transporter efflux protein, DrrB family
GCF_001484605.1_ASM148460v1	NZ_CP013747	Pseudarthrobacter sulfonivorans strain Ar51 chromosome, complete genome	2	777176-777261	2	CRISPRCasFinder	no		RT,csa3,DinG,cas3,DEDDh,PD-DExK,WYL	Orphan	GCGTCGGTTTCGACAGGCTCAACCAC	26	0	0	NA	NA	NA	1	1	Orphan	RT,csa3,DinG,cas3,DEDDh,PD-DExK,WYL	NA,NA|152aa|down_3|NZ_CP013747.1_780797_781253_+	NA|248aa|up_9|NZ_CP013747.1_764762_765506_-	pfam01925, TauE, Sulfite exporter TauE/SafE	NA|487aa|up_8|NZ_CP013747.1_765555_767016_+	pfam06762, LMF1, Lipase maturation factor	NA|280aa|up_7|NZ_CP013747.1_767032_767872_-	COG2301, CitE, Citrate lyase beta subunit [Carbohydrate transport and metabolism]	NA|206aa|up_6|NZ_CP013747.1_767868_768486_-	cd03451, FkbR2, FkbR2 is a Streptomyces hygroscopicus protein with a hot dog fold that belongs to a conserved family of proteins found in prokaryotes and archaea but not in eukaryotes	NA|256aa|up_5|NZ_CP013747.1_768482_769250_-	TIGR02428, 3-oxoadipate_CoA-transferase_subunit_B, 3-oxoacid CoA-transferase, B subunit	NA|265aa|up_4|NZ_CP013747.1_769252_770047_-	COG1788, AtoD, Acyl CoA:acetate/3-ketoacid CoA transferase, alpha subunit [Lipid metabolism]	NA|388aa|up_3|NZ_CP013747.1_770112_771276_-	cd01158, SCAD_SBCAD, Short chain acyl-CoA dehydrogenases and eukaryotic short/branched chain acyl-CoA dehydrogenases	NA|741aa|up_2|NZ_CP013747.1_771278_773501_-	COG4770, COG4770, Acetyl/propionyl-CoA carboxylase, alpha subunit [Lipid metabolism]	NA|536aa|up_1|NZ_CP013747.1_773508_775116_-	PLN02820, PLN02820, 3-methylcrotonyl-CoA carboxylase, beta chain	NA|207aa|up_0|NZ_CP013747.1_775415_776036_+	pfam00440, TetR_N, Bacterial regulatory proteins, tetR family	NA|337aa|down_0|NZ_CP013747.1_777686_778697_-	COG0022, AcoB, Pyruvate/2-oxoglutarate dehydrogenase complex, dehydrogenase (E1) component, eukaryotic type, beta subunit [Energy production and conversion]	NA|377aa|down_1|NZ_CP013747.1_778696_779827_-	TIGR03181, PDH_E1_alph_x, pyruvate dehydrogenase E1 component, alpha subunit	NA|158aa|down_2|NZ_CP013747.1_780001_780475_+	COG1522, Lrp, Transcriptional regulators [Transcription]	NA|152aa|down_3|NZ_CP013747.1_780797_781253_+	NA	NA|539aa|down_4|NZ_CP013747.1_781363_782980_-	PRK09395, actP, cation/acetate symporter ActP	NA|127aa|down_5|NZ_CP013747.1_782976_783357_-	pfam04341, DUF485, Protein of unknown function, DUF485	NA|397aa|down_6|NZ_CP013747.1_783535_784726_+	COG3275, LytS, Putative regulator of cell autolysis [Signal transduction mechanisms]	NA|241aa|down_7|NZ_CP013747.1_784772_785495_+	COG3279, LytT, Response regulator of the LytR/AlgR family [Transcription / Signal transduction mechanisms]	NA|117aa|down_8|NZ_CP013747.1_785491_785842_+	pfam04341, DUF485, Protein of unknown function, DUF485	NA|489aa|down_9|NZ_CP013747.1_785849_787316_+	cd11480, SLC5sbd_u4, Uncharacterized bacterial solute carrier 5 subfamily; putative solute-binding domain
GCF_001484605.1_ASM148460v1	NZ_CP013747	Pseudarthrobacter sulfonivorans strain Ar51 chromosome, complete genome	3	2880991-2881094	3	CRISPRCasFinder	no		RT,csa3,DinG,cas3,DEDDh,PD-DExK,WYL	Orphan	CGCAGTTAACATGTTGGAAACATTC	25	0	0	NA	NA	NA	1	1	Orphan	RT,csa3,DinG,cas3,DEDDh,PD-DExK,WYL	NA,NA	NA|158aa|up_9|NZ_CP013747.1_2867553_2868027_+	PRK05571, PRK05571, ribose-5-phosphate isomerase B; Provisional	NA|340aa|up_8|NZ_CP013747.1_2868109_2869129_+	PRK09197, PRK09197, fructose-bisphosphate aldolase; Provisional	NA|342aa|up_7|NZ_CP013747.1_2869135_2870161_-	TIGR02483, ATP-dependent_6-phosphofructokinase_1, phosphofructokinase	NA|498aa|up_6|NZ_CP013747.1_2870473_2871967_-	PRK08289, PRK08289, glyceraldehyde-3-phosphate dehydrogenase; Reviewed	NA|121aa|up_5|NZ_CP013747.1_2872217_2872580_+	COG3450, COG3450, Predicted enzyme of the cupin superfamily [General function prediction only]	NA|319aa|up_4|NZ_CP013747.1_2872809_2873766_+	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|344aa|up_3|NZ_CP013747.1_2873846_2874878_+	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|394aa|up_2|NZ_CP013747.1_2874988_2876170_-	COG0475, KefB, Kef-type K+ transport systems, membrane components [Inorganic ion transport and metabolism]	NA|220aa|up_1|NZ_CP013747.1_2876230_2876890_-	pfam17197, DUF5134, Domain of unknown function (DUF5134)	NA|494aa|up_0|NZ_CP013747.1_2876982_2878464_-	pfam13520, AA_permease_2, Amino acid permease	NA|450aa|down_0|NZ_CP013747.1_2881338_2882688_+	COG0531, PotE, Amino acid transporters [Amino acid transport and metabolism]	NA|248aa|down_1|NZ_CP013747.1_2882684_2883428_+	COG1414, IclR, Transcriptional regulator [Transcription]	NA|583aa|down_2|NZ_CP013747.1_2883564_2885313_+	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|632aa|down_3|NZ_CP013747.1_2885471_2887367_+	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|607aa|down_4|NZ_CP013747.1_2887783_2889604_+	COG3387, SGA1, Glucoamylase and related glycosyl hydrolases [Carbohydrate transport and metabolism]	NA|468aa|down_5|NZ_CP013747.1_2889625_2891029_-	COG2186, FadR, Transcriptional regulators [Transcription]	NA|494aa|down_6|NZ_CP013747.1_2891993_2893475_-	pfam13520, AA_permease_2, Amino acid permease	NA|113aa|down_7|NZ_CP013747.1_2893719_2894058_-	cd02228, cupin_EutQ, Clostridium difficile EutQ and related proteins, cupin domain	NA|127aa|down_8|NZ_CP013747.1_2894583_2894964_+	cd02228, cupin_EutQ, Clostridium difficile EutQ and related proteins, cupin domain	NA|467aa|down_9|NZ_CP013747.1_2895126_2896527_+	COG2072, TrkA, Predicted flavoprotein involved in K+ transport [Inorganic ion transport and metabolism]
GCF_001484605.1_ASM148460v1	NZ_CP013747	Pseudarthrobacter sulfonivorans strain Ar51 chromosome, complete genome	4	3290708-3291012	1	CRT	no		RT,csa3,DinG,cas3,DEDDh,PD-DExK,WYL	Orphan	GGATCCGNCNNCNNNCCC	18	0	0	NA	NA	NA	5	5	Orphan	RT,csa3,DinG,cas3,DEDDh,PD-DExK,WYL	NA|150aa|up_6|NZ_CP013747.1_3282371_3282821_-,NA|180aa|down_3|NZ_CP013747.1_3298184_3298724_-	NA|92aa|up_9|NZ_CP013747.1_3280265_3280541_+	pfam05768, DUF836, Glutaredoxin-like domain (DUF836)	NA|246aa|up_8|NZ_CP013747.1_3280598_3281336_+	PRK05472, PRK05472, redox-sensing transcriptional repressor Rex; Provisional	NA|266aa|up_7|NZ_CP013747.1_3281393_3282191_-	PRK10263, PRK10263, DNA translocase FtsK; Provisional	NA|150aa|up_6|NZ_CP013747.1_3282371_3282821_-	NA	NA|183aa|up_5|NZ_CP013747.1_3283177_3283726_-	pfam04264, YceI, YceI-like domain	NA|227aa|up_4|NZ_CP013747.1_3283928_3284609_+	pfam00300, His_Phos_1, Histidine phosphatase superfamily (branch 1)	NA|212aa|up_3|NZ_CP013747.1_3284610_3285246_+	cd02966, TlpA_like_family, TlpA-like family; composed of  TlpA, ResA, DsbE and similar proteins	NA|252aa|up_2|NZ_CP013747.1_3285261_3286017_+	pfam02683, DsbD, Cytochrome C biogenesis protein transmembrane region	NA|586aa|up_1|NZ_CP013747.1_3286016_3287774_+	pfam05140, ResB, ResB-like family	NA|375aa|up_0|NZ_CP013747.1_3287773_3288898_+	TIGR03144, cytochrome_c_biogenesis_protein_chloroplast, cytochrome c-type biogenesis protein CcsB	NA|685aa|down_0|NZ_CP013747.1_3291169_3293224_+	smart00421, HTH_LUXR, helix_turn_helix, Lux Regulon	NA|382aa|down_1|NZ_CP013747.1_3293388_3294534_+	COG5271, MDN1, AAA ATPase containing von Willebrand factor type A (vWA) domain [General function prediction only]	NA|498aa|down_2|NZ_CP013747.1_3296681_3298175_+	cd09912, DLP_2, Dynamin-like protein including dynamins, mitofusins, and guanylate-binding proteins	NA|180aa|down_3|NZ_CP013747.1_3298184_3298724_-	NA	NA|154aa|down_4|NZ_CP013747.1_3298818_3299280_-	pfam13396, PLDc_N, Phospholipase_D-nuclease N-terminal	NA|119aa|down_5|NZ_CP013747.1_3299340_3299697_+	pfam14012, DUF4229, Protein of unknown function (DUF4229)	NA|294aa|down_6|NZ_CP013747.1_3299729_3300611_-	PRK06080, PRK06080, 1,4-dihydroxy-2-naphthoate octaprenyltransferase; Validated	NA|401aa|down_7|NZ_CP013747.1_3300690_3301893_-	PRK07824, PRK07824, o-succinylbenzoate--CoA ligase	NA|318aa|down_8|NZ_CP013747.1_3301966_3302920_-	PRK08321, PRK08321, 1,4-dihydroxy-2-naphthoyl-CoA synthase	NA|254aa|down_9|NZ_CP013747.1_3303063_3303825_-	COG1266, COG1266, Predicted metal-dependent membrane protease [General function prediction only]
