assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	1	204115-204214	1	CRISPRCasFinder	no		cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Orphan	AGCGGGGTGCGGTCATGAGCGAA	23	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA|190aa|up_5|NZ_CP046171.1_198073_198643_+,NA	NA|431aa|up_9|NZ_CP046171.1_194215_195508_+	TIGR02669, stage_II_sporulation_protein_D, SpoIID/LytB domain	NA|167aa|up_8|NZ_CP046171.1_195540_196041_-	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|336aa|up_7|NZ_CP046171.1_196148_197156_+	TIGR00950, Uncharacterized_inner_membrane_transporter_YicL, Carboxylate/Amino Acid/Amine Transporter	NA|252aa|up_6|NZ_CP046171.1_197236_197992_+	pfam07739, TipAS, TipAS antibiotic-recognition domain	NA|190aa|up_5|NZ_CP046171.1_198073_198643_+	NA	NA|202aa|up_4|NZ_CP046171.1_198709_199315_-	pfam00440, TetR_N, Bacterial regulatory proteins, tetR family	NA|241aa|up_3|NZ_CP046171.1_199418_200141_+	cd05233, SDR_c, classical (c) SDRs	NA|409aa|up_2|NZ_CP046171.1_200316_201543_+	COG0562, Glf, UDP-galactopyranose mutase [Cell envelope biogenesis, outer membrane]	NA|647aa|up_1|NZ_CP046171.1_201539_203480_+	pfam17994, Glft2_N, Galactofuranosyltransferase 2 N-terminal	NA|181aa|up_0|NZ_CP046171.1_203557_204100_+	cd03392, PAP2_like_2, PAP2_like_2 proteins	NA|644aa|down_0|NZ_CP046171.1_205151_207083_+	pfam10101, DUF2339, Predicted membrane protein (DUF2339)	NA|359aa|down_1|NZ_CP046171.1_207343_208420_+	COG0627, COG0627, Predicted esterase [General function prediction only]	NA|354aa|down_2|NZ_CP046171.1_208722_209784_+	COG0627, COG0627, Predicted esterase [General function prediction only]	NA|315aa|down_3|NZ_CP046171.1_210182_211127_+	COG0627, COG0627, Predicted esterase [General function prediction only]	NA|336aa|down_4|NZ_CP046171.1_211480_212488_+	COG0627, COG0627, Predicted esterase [General function prediction only]	NA|596aa|down_5|NZ_CP046171.1_212816_214604_+	COG0627, COG0627, Predicted esterase [General function prediction only]	NA|168aa|down_6|NZ_CP046171.1_214741_215245_+	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|329aa|down_7|NZ_CP046171.1_215241_216228_+	pfam01083, Cutinase, Cutinase	NA|340aa|down_8|NZ_CP046171.1_216417_217437_+	TIGR03621, F420_MSMEG_2516, probable F420-dependent oxidoreductase, MSMEG_2516 family	NA|639aa|down_9|NZ_CP046171.1_217632_219549_+	PRK07769, PRK07769, long-chain-fatty-acid--CoA ligase; Validated
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	2	490416-490534	2	CRISPRCasFinder	no	cas3	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Unclear	GCGCGCACCGAGTTGGCGCGTGCGATGGAGTTGTGCGG	38	0	0	NA	NA	NA	1	1	Unclear	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA|120aa|up_8|NZ_CP046171.1_478354_478714_+,NA|465aa|down_0|NZ_CP046171.1_490673_492068_-,NA|99aa|down_3|NZ_CP046171.1_493888_494185_-,NA|63aa|down_5|NZ_CP046171.1_494870_495059_+	NA|39aa|up_9|NZ_CP046171.1_478220_478337_+	pfam14029, DUF4244, Protein of unknown function (DUF4244)	NA|120aa|up_8|NZ_CP046171.1_478354_478714_+	NA	NA|130aa|up_7|NZ_CP046171.1_479149_479539_+	TIGR03816, tadE_like_DECH, helicase/secretion neighborhood TadE-like protein	cas3|791aa|up_6|NZ_CP046171.1_479849_482222_-	TIGR03817, DECH_helic, helicase/secretion neighborhood putative DEAH-box helicase	NA|69aa|up_5|NZ_CP046171.1_482658_482865_+	COG1278, CspC, Cold shock proteins [Transcription]	NA|966aa|up_4|NZ_CP046171.1_483186_486084_+	PRK07561, PRK07561, DNA topoisomerase I subunit omega; Validated	NA|155aa|up_3|NZ_CP046171.1_486182_486647_+	pfam04978, DUF664, Protein of unknown function (DUF664)	NA|184aa|up_2|NZ_CP046171.1_486651_487203_-	cd03169, GATase1_PfpI_1, Type 1 glutamine amidotransferase (GATase1)-like domain found in a subgroup of proteins similar to PfpI from Pyrococcus furiosus	NA|402aa|up_1|NZ_CP046171.1_487293_488499_+	PRK07940, PRK07940, DNA polymerase III subunit delta'; Validated	NA|318aa|up_0|NZ_CP046171.1_489229_490183_-	cd02034, CooC1, accessory protein CooC1	NA|465aa|down_0|NZ_CP046171.1_490673_492068_-	NA	NA|97aa|down_1|NZ_CP046171.1_492184_492475_-	pfam03992, ABM, Antibiotic biosynthesis monooxygenase	NA|351aa|down_2|NZ_CP046171.1_492610_493663_-	COG0596, MhpC, Predicted hydrolases or acyltransferases (alpha/beta hydrolase superfamily) [General function prediction only]	NA|99aa|down_3|NZ_CP046171.1_493888_494185_-	NA	NA|155aa|down_4|NZ_CP046171.1_494351_494816_+	pfam10825, DUF2752, Protein of unknown function (DUF2752)	NA|63aa|down_5|NZ_CP046171.1_494870_495059_+	NA	NA|445aa|down_6|NZ_CP046171.1_495055_496390_-	cd09603, M1_APN_like, Peptidase M1 family similar to aminopeptidase N catalytic domain	NA|1306aa|down_7|NZ_CP046171.1_496389_500307_-	TIGR02353, NON-RIBOSOMAL_PEPTIDE_SYNTHETASE, non-ribosomal peptide synthetase terminal domain of unknown function	NA|213aa|down_8|NZ_CP046171.1_500463_501102_-	COG1280, RhtB, Putative threonine efflux protein [Amino acid transport and metabolism]	NA|440aa|down_9|NZ_CP046171.1_501373_502693_+	cd06453, SufS_like, Cysteine desulfurase (SufS)-like
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	3	1959604-1959712	3	CRISPRCasFinder	no		cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Orphan	TGAGCGCCAGCGAAGTTGCGCTGTGAGCGA	30	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA,NA|272aa|down_7|NZ_CP046171.1_1965879_1966695_-	NA|350aa|up_9|NZ_CP046171.1_1945442_1946492_-	cd00830, KAS_III, Ketoacyl-acyl carrier protein synthase III (KASIII) initiates the elongation in type II fatty acid synthase systems	NA|279aa|up_8|NZ_CP046171.1_1946579_1947416_-	cd05327, retinol-DH_like_SDR_c_like, retinol dehydrogenase (retinol-DH), Light dependent Protochlorophyllide (Pchlide) OxidoReductase (LPOR) and related proteins, classical (c) SDRs	NA|256aa|up_7|NZ_CP046171.1_1947696_1948464_+	PRK14103, PRK14103, trans-aconitate 2-methyltransferase; Provisional	NA|236aa|up_6|NZ_CP046171.1_1948388_1949096_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|417aa|up_5|NZ_CP046171.1_1949163_1950414_-	pfam00144, Beta-lactamase, Beta-lactamase	NA|865aa|up_4|NZ_CP046171.1_1950573_1953168_-	TIGR04075, Ser/Thr_phosphatase_family_protein, polynucleotide kinase-phosphatase	NA|525aa|up_3|NZ_CP046171.1_1953167_1954742_-	TIGR04074, Methyltransferase_type_12, 3' terminal RNA ribose 2'-O-methyltransferase Hen1	NA|793aa|up_2|NZ_CP046171.1_1954815_1957194_-	PRK05261, PRK05261, phosphoketolase	NA|191aa|up_1|NZ_CP046171.1_1957456_1958029_+	pfam00254, FKBP_C, FKBP-type peptidyl-prolyl cis-trans isomerase	NA|463aa|up_0|NZ_CP046171.1_1958199_1959588_+	PRK01490, tig, trigger factor; Provisional	NA|197aa|down_0|NZ_CP046171.1_1959846_1960437_+	PRK00277, clpP, ATP-dependent Clp protease proteolytic subunit; Reviewed	NA|222aa|down_1|NZ_CP046171.1_1960506_1961172_+	PRK12553, PRK12553, ATP-dependent Clp protease proteolytic subunit; Reviewed	NA|427aa|down_2|NZ_CP046171.1_1961616_1962897_+	PRK05342, clpX, ATP-dependent Clp protease ATP-binding subunit ClpX	NA|140aa|down_3|NZ_CP046171.1_1963132_1963552_+	cd07043, STAS_anti-anti-sigma_factors, Sulphate Transporter and Anti-Sigma factor antagonist) domain of anti-anti-sigma factors, key regulators of anti-sigma factors by phosphorylation	NA|97aa|down_4|NZ_CP046171.1_1963589_1963880_+	COG0222, RplL, Ribosomal protein L7/L12 [Translation, ribosomal structure and biogenesis]	NA|151aa|down_5|NZ_CP046171.1_1963898_1964351_-	COG1522, Lrp, Transcriptional regulators [Transcription]	NA|206aa|down_6|NZ_CP046171.1_1964462_1965080_+	COG1280, RhtB, Putative threonine efflux protein [Amino acid transport and metabolism]	NA|272aa|down_7|NZ_CP046171.1_1965879_1966695_-	NA	NA|126aa|down_8|NZ_CP046171.1_1966886_1967264_-	cd00781, ketosteroid_isomerase, ketosteroid isomerase: Many biological reactions proceed by enzymatic cleavage of a C-H bond adjacent to carbonyl or a carboxyl group, leading to an enol or a enolate intermediate that is subsequently re-protonated at the same or an adjacent carbon	NA|442aa|down_9|NZ_CP046171.1_1967383_1968709_-	PRK07812, PRK07812, O-acetylhomoserine aminocarboxypropyltransferase; Validated
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	4	2666713-2666815	4	CRISPRCasFinder	no		cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Orphan	GGTCCGGCCGCCGCCGTAGGCCCTGTCGCT	30	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA,NA|112aa|down_0|NZ_CP046171.1_2667668_2668004_-,NA|78aa|down_1|NZ_CP046171.1_2668457_2668691_-,NA|131aa|down_4|NZ_CP046171.1_2671226_2671619_+	NA|216aa|up_9|NZ_CP046171.1_2653243_2653891_+	pfam02909, TetR_C, Tetracyclin repressor, C-terminal all-alpha domain	NA|77aa|up_8|NZ_CP046171.1_2654237_2654468_-	PRK14129, PRK14129, heat shock protein HspQ; Provisional	NA|206aa|up_7|NZ_CP046171.1_2655420_2656038_+	COG3707, AmiR, Response regulator with putative antiterminator output domain [Signal transduction mechanisms]	NA|399aa|up_6|NZ_CP046171.1_2656325_2657522_+	cd06342, PBP1_ABC_LIVBP-like, type 1 periplasmic ligand-binding domain of ABC (Atpase Binding Cassette)-type active transport systems involved in the transport of all three branched chain aliphatic amino acids (leucine, isoleucine and valine)	NA|346aa|up_5|NZ_CP046171.1_2657619_2658657_+	cd06582, TM_PBP1_LivH_like, Transmembrane subunit (TM) of Escherichia coli LivH and related proteins	NA|477aa|up_4|NZ_CP046171.1_2658653_2660084_+	cd06581, TM_PBP1_LivM_like, Transmembrane subunit (TM) of Escherichia coli LivM and related proteins	NA|332aa|up_3|NZ_CP046171.1_2660080_2661076_+	COG0411, LivG, ABC-type branched-chain amino acid transport systems, ATPase component [Amino acid transport and metabolism]	NA|253aa|up_2|NZ_CP046171.1_2661084_2661843_+	COG0410, LivF, ABC-type branched-chain amino acid transport systems, ATPase component [Amino acid transport and metabolism]	NA|563aa|up_1|NZ_CP046171.1_2661885_2663574_+	pfam05960, DUF885, Bacterial protein of unknown function (DUF885)	NA|915aa|up_0|NZ_CP046171.1_2663699_2666444_+	PRK05755, PRK05755, DNA polymerase I; Provisional	NA|112aa|down_0|NZ_CP046171.1_2667668_2668004_-	NA	NA|78aa|down_1|NZ_CP046171.1_2668457_2668691_-	NA	NA|397aa|down_2|NZ_CP046171.1_2669016_2670207_-	PRK05868, PRK05868, FAD-binding protein	NA|191aa|down_3|NZ_CP046171.1_2670577_2671150_-	pfam00440, TetR_N, Bacterial regulatory proteins, tetR family	NA|131aa|down_4|NZ_CP046171.1_2671226_2671619_+	NA	NA|163aa|down_5|NZ_CP046171.1_2671615_2672104_+	pfam08592, DUF1772, Domain of unknown function (DUF1772)	NA|243aa|down_6|NZ_CP046171.1_2672112_2672841_-	cd00592, HTH_MerR-like, Helix-Turn-Helix DNA binding domain of MerR-like transcription regulators	NA|301aa|down_7|NZ_CP046171.1_2673031_2673934_-	COG0596, MhpC, Predicted hydrolases or acyltransferases (alpha/beta hydrolase superfamily) [General function prediction only]	NA|165aa|down_8|NZ_CP046171.1_2674293_2674788_+	cd03379, beta_CA_cladeD, Carbonic anhydrases (CA) are zinc-containing enzymes that catalyze the reversible hydration of carbon dioxide in a two-step mechanism in which the nucleophilic attack of a zinc-bound hydroxide ion on carbon dioxide is followed by the regeneration of an active site by ionization of the zinc-bound water molecule and removal of a proton from the active site	NA|145aa|down_9|NZ_CP046171.1_2675280_2675715_+	PRK03739, PRK03739, 2-isopropylmalate synthase; Validated
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	5	3491001-3491107	5	CRISPRCasFinder	no	WYL	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Unclear	ACGGGTAGCACCCCGAGCCCGTTCGAGAAGG	31	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA,NA	NA|313aa|up_9|NZ_CP046171.1_3471552_3472491_-	pfam11175, DUF2961, Protein of unknown function (DUF2961)	NA|158aa|up_8|NZ_CP046171.1_3472577_3473051_-	TIGR01068, Thioredoxin-like_protein_slr0233, thioredoxin	NA|498aa|up_7|NZ_CP046171.1_3473110_3474604_-	cd07804, FGGY_XK_like_1, uncharacterized xylulose kinase-like proteins; a subgroup of the FGGY family of carbohydrate kinases	NA|300aa|up_6|NZ_CP046171.1_3474612_3475512_-	cd08995, GH32_EcAec43-like, Glycosyl hydrolase family 32, such as the putative glycoside hydrolase Escherichia coli Aec43 (FosGH2)	NA|268aa|up_5|NZ_CP046171.1_3475579_3476383_+	pfam13350, Y_phosphatase3, Tyrosine phosphatase family	NA|768aa|up_4|NZ_CP046171.1_3476321_3478625_-	COG0178, UvrA, Excinuclease ATPase subunit [DNA replication, recombination, and repair]	WYL|324aa|up_3|NZ_CP046171.1_3478687_3479659_+	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	NA|676aa|up_2|NZ_CP046171.1_3479725_3481753_+	TIGR02123, conserved_inner_membrane_protein, TRAP transporter, 4TM/12TM fusion protein	NA|332aa|up_1|NZ_CP046171.1_3481749_3482745_+	cd13569, PBP2_TAXI_TRAP_like_1, Substrate binding domain of putative TAXI proteins of the tripartite ATP-independent periplasmic transporters; the type 2 periplasmic binding protein fold	NA|332aa|up_0|NZ_CP046171.1_3482896_3483892_+	cd13569, PBP2_TAXI_TRAP_like_1, Substrate binding domain of putative TAXI proteins of the tripartite ATP-independent periplasmic transporters; the type 2 periplasmic binding protein fold	NA|195aa|down_0|NZ_CP046171.1_3491249_3491834_+	pfam13649, Methyltransf_25, Methyltransferase domain	NA|289aa|down_1|NZ_CP046171.1_3492118_3492985_-	COG1414, IclR, Transcriptional regulator [Transcription]	NA|264aa|down_2|NZ_CP046171.1_3493111_3493903_+	PRK07814, PRK07814, SDR family oxidoreductase	NA|361aa|down_3|NZ_CP046171.1_3493904_3494987_+	COG3804, COG3804, Uncharacterized conserved protein related to dihydrodipicolinate reductase [Function unknown]	NA|411aa|down_4|NZ_CP046171.1_3494968_3496201_-	pfam01070, FMN_dh, FMN-dependent dehydrogenase	NA|259aa|down_5|NZ_CP046171.1_3496197_3496974_-	cd05233, SDR_c, classical (c) SDRs	NA|96aa|down_6|NZ_CP046171.1_3498472_3498760_+	pfam05336, rhaM, L-rhamnose mutarotase	NA|307aa|down_7|NZ_CP046171.1_3498752_3499673_+	cd19152, AKR_AKR15A, AKR15A family of aldo-keto reductase	NA|223aa|down_8|NZ_CP046171.1_3499706_3500375_-	COG2186, FadR, Transcriptional regulators [Transcription]	NA|278aa|down_9|NZ_CP046171.1_3500434_3501268_+	COG3618, COG3618, Predicted metal-dependent hydrolase of the TIM-barrel fold [General function prediction only]
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	6	3976802-3976972	6	CRISPRCasFinder	no		cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Orphan	CACGCGCTCGAGCGATTGCCAAATCGGACCCACACGCGCTC	41	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA,NA|575aa|down_1|NZ_CP046171.1_3978679_3980404_+,NA|318aa|down_2|NZ_CP046171.1_3980604_3981558_+,NA|124aa|down_5|NZ_CP046171.1_3983084_3983456_+	NA|441aa|up_9|NZ_CP046171.1_3962365_3963688_+	PRK06075, PRK06075, NADH-quinone oxidoreductase subunit D	NA|243aa|up_8|NZ_CP046171.1_3963752_3964481_+	PRK07539, PRK07539, NADH-quinone oxidoreductase subunit NuoE	NA|438aa|up_7|NZ_CP046171.1_3964482_3965796_+	TIGR01959, NADH-quinone_oxidoreductase_subunit_F, NADH-quinone oxidoreductase, F subunit	NA|812aa|up_6|NZ_CP046171.1_3965942_3968378_+	PRK07860, PRK07860, NADH dehydrogenase subunit G; Validated	NA|612aa|up_5|NZ_CP046171.1_3968447_3970283_+	PRK06076, PRK06076, NADH-quinone oxidoreductase subunit NuoH	NA|270aa|up_4|NZ_CP046171.1_3970279_3971089_+	PRK06638, PRK06638, NADH-quinone oxidoreductase subunit J	NA|100aa|up_3|NZ_CP046171.1_3971085_3971385_+	PRK05715, PRK05715, NADH-quinone oxidoreductase subunit NuoK	NA|629aa|up_2|NZ_CP046171.1_3971386_3973273_+	PRK06590, PRK06590, NADH:ubiquinone oxidoreductase subunit L; Reviewed	NA|540aa|up_1|NZ_CP046171.1_3973266_3974886_+	PRK05846, PRK05846, NADH:ubiquinone oxidoreductase subunit M; Reviewed	NA|540aa|up_0|NZ_CP046171.1_3974891_3976511_+	PRK05777, PRK05777, NADH-quinone oxidoreductase subunit NuoN	NA|264aa|down_0|NZ_CP046171.1_3977533_3978325_-	PRK05557, fabG, 3-ketoacyl-(acyl-carrier-protein) reductase; Validated	NA|575aa|down_1|NZ_CP046171.1_3978679_3980404_+	NA	NA|318aa|down_2|NZ_CP046171.1_3980604_3981558_+	NA	NA|143aa|down_3|NZ_CP046171.1_3981596_3982025_-	cd04781, HTH_MerR-like_sg6, Helix-Turn-Helix DNA binding domain of putative transcription regulators from the MerR superfamily	NA|249aa|down_4|NZ_CP046171.1_3982137_3982884_+	PRK06523, PRK06523, short chain dehydrogenase; Provisional	NA|124aa|down_5|NZ_CP046171.1_3983084_3983456_+	NA	NA|195aa|down_6|NZ_CP046171.1_3983871_3984456_+	pfam13305, WHG, WHG domain	NA|283aa|down_7|NZ_CP046171.1_3984452_3985301_+	COG0596, MhpC, Predicted hydrolases or acyltransferases (alpha/beta hydrolase superfamily) [General function prediction only]	NA|165aa|down_8|NZ_CP046171.1_3985324_3985819_-	cd00464, SK, Shikimate kinase (SK) is the fifth enzyme in the shikimate pathway, a seven-step biosynthetic pathway which converts erythrose-4-phosphate to chorismic acid, found in bacteria, fungi and plants	NA|200aa|down_9|NZ_CP046171.1_3986144_3986744_-	pfam01872, RibD_C, RibD C-terminal domain
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	7	5172057-5172159	7	CRISPRCasFinder	no		cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Orphan	GCCCCACCGTGCGCGATGCACCCTGC	26	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA|83aa|up_6|NZ_CP046171.1_5161734_5161983_-,NA|160aa|up_5|NZ_CP046171.1_5163449_5163929_-,NA|86aa|down_2|NZ_CP046171.1_5174577_5174835_-,NA|180aa|down_8|NZ_CP046171.1_5182663_5183203_+,NA|552aa|down_9|NZ_CP046171.1_5183253_5184909_-	NA|151aa|up_9|NZ_CP046171.1_5156277_5156730_+	COG1989, PulO, Type II secretory pathway, prepilin signal peptidase PulO and related peptidases [Cell motility and secretion / Posttranslational modification, protein turnover, chaperones / Intracellular trafficking and secretion]	NA|404aa|up_8|NZ_CP046171.1_5156946_5158158_+	PRK05382, PRK05382, chorismate synthase; Validated	NA|374aa|up_7|NZ_CP046171.1_5160478_5161600_+	PRK00002, aroB, 3-dehydroquinate synthase; Reviewed	NA|83aa|up_6|NZ_CP046171.1_5161734_5161983_-	NA	NA|160aa|up_5|NZ_CP046171.1_5163449_5163929_-	NA	NA|291aa|up_4|NZ_CP046171.1_5164846_5165719_-	PRK00258, aroE, shikimate 5-dehydrogenase; Reviewed	NA|515aa|up_3|NZ_CP046171.1_5165648_5167193_-	pfam02618, YceG, YceG-like family	NA|207aa|up_2|NZ_CP046171.1_5167189_5167810_-	PRK00109, PRK00109, Holliday junction resolvase RuvX	NA|888aa|up_1|NZ_CP046171.1_5167809_5170473_-	PRK00252, alaS, alanyl-tRNA synthetase; Reviewed	NA|449aa|up_0|NZ_CP046171.1_5170687_5172034_-	PRK13342, PRK13342, recombination factor protein RarA; Reviewed	NA|538aa|down_0|NZ_CP046171.1_5172474_5174088_+	COG3540, PhoD, Phosphodiesterase/alkaline phosphatase D [Inorganic ion transport and metabolism]	NA|104aa|down_1|NZ_CP046171.1_5174237_5174549_-	PLN03138, PLN03138, Protein TOC75; Provisional	NA|86aa|down_2|NZ_CP046171.1_5174577_5174835_-	NA	NA|390aa|down_3|NZ_CP046171.1_5174927_5176097_-	PLN02421, PLN02421, phosphotransferase, alcohol group as acceptor/kinase	NA|231aa|down_4|NZ_CP046171.1_5176753_5177446_+	COG5473, COG5473, Predicted integral membrane protein [Function unknown]	NA|326aa|down_5|NZ_CP046171.1_5177481_5178459_-	pfam04087, DUF389, Domain of unknown function (DUF389)	NA|598aa|down_6|NZ_CP046171.1_5178602_5180396_-	PRK00476, aspS, aspartyl-tRNA synthetase; Validated	NA|308aa|down_7|NZ_CP046171.1_5181013_5181937_+	COG2321, COG2321, Predicted metalloprotease [General function prediction only]	NA|180aa|down_8|NZ_CP046171.1_5182663_5183203_+	NA	NA|552aa|down_9|NZ_CP046171.1_5183253_5184909_-	NA
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	8	5913990-5914307	1	CRT	no		cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Orphan	CCCGGCGGCGCNGGCGCA	18	1	1	5914233-5914250	NZ_CP046171.1_2767025-2767042	NA	8	8	Orphan	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA|124aa|up_5|NZ_CP046171.1_5907399_5907771_+,NA|169aa|up_0|NZ_CP046171.1_5913125_5913632_+,NA|646aa|down_6|NZ_CP046171.1_5921380_5923318_-	NA|407aa|up_9|NZ_CP046171.1_5904368_5905589_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|134aa|up_8|NZ_CP046171.1_5905625_5906027_+	cd03443, PaaI_thioesterase, PaaI_thioesterase is a tetrameric acyl-CoA thioesterase with a hot dog fold and one of several proteins responsible for phenylacetic acid (PA) degradation in bacteria	NA|146aa|up_7|NZ_CP046171.1_5906171_5906609_-	COG4270, COG4270, Predicted membrane protein [Function unknown]	NA|189aa|up_6|NZ_CP046171.1_5906723_5907290_+	pfam13305, WHG, WHG domain	NA|124aa|up_5|NZ_CP046171.1_5907399_5907771_+	NA	NA|368aa|up_4|NZ_CP046171.1_5907944_5909048_+	COG4585, COG4585, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|226aa|up_3|NZ_CP046171.1_5909044_5909722_+	COG2197, CitB, Response regulator containing a CheY-like receiver domain and an HTH DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|498aa|up_2|NZ_CP046171.1_5909787_5911281_+	PRK00302, lnt, apolipoprotein N-acyltransferase; Reviewed	NA|439aa|up_1|NZ_CP046171.1_5911531_5912848_+	cd17366, MFS_ProP, Proline/betaine transporter of the Major Facilitator Superfamily of transporters	NA|169aa|up_0|NZ_CP046171.1_5913125_5913632_+	NA	NA|155aa|down_0|NZ_CP046171.1_5914875_5915340_+	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|255aa|down_1|NZ_CP046171.1_5915412_5916177_-	PRK06057, PRK06057, short chain dehydrogenase; Provisional	NA|454aa|down_2|NZ_CP046171.1_5916205_5917567_-	pfam00171, Aldedh, Aldehyde dehydrogenase family	NA|254aa|down_3|NZ_CP046171.1_5917563_5918325_-	COG2071, COG2071, Predicted glutamine amidotransferases [General function prediction only]	NA|451aa|down_4|NZ_CP046171.1_5918305_5919658_-	COG0174, GlnA, Glutamine synthetase [Amino acid transport and metabolism]	NA|531aa|down_5|NZ_CP046171.1_5919763_5921356_-	cd06268, PBP1_ABC_transporter_LIVBP-like, periplasmic binding domain of ATP-binding cassette transporter-like systems that belong to the type 1 periplasmic binding fold protein superfamily	NA|646aa|down_6|NZ_CP046171.1_5921380_5923318_-	NA	NA|438aa|down_7|NZ_CP046171.1_5923456_5924770_-	pfam03583, LIP, Secretory lipase	NA|421aa|down_8|NZ_CP046171.1_5925214_5926477_+	pfam13556, HTH_30, PucR C-terminal helix-turn-helix domain	NA|133aa|down_9|NZ_CP046171.1_5926878_5927277_+	cd04762, HTH_MerR-trunc, Helix-Turn-Helix DNA binding domain of truncated MerR-like proteins
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	9	6119833-6121150	8,2,1	CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Type I-E	GGATCATCCCCGCGTGCGCGGGGAGCAC,GGATCATCCCCGCGTGCGCGGGGAGCAC,GGATCATCCCCGCGTGCGCGGGGAGCAC	28,28,28	0	0	NA	NA	I-E:I-E:I-E	21,21,20	21	TypeI-E	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA|205aa|up_8|NZ_CP046171.1_6109619_6110234_-,NA|126aa|up_5|NZ_CP046171.1_6111776_6112154_-,NA|183aa|up_4|NZ_CP046171.1_6112417_6112966_-,NA|55aa|down_9|NZ_CP046171.1_6133003_6133168_-	NA|229aa|up_9|NZ_CP046171.1_6109004_6109691_+	COG2345, COG2345, Predicted transcriptional regulator [Transcription]	NA|205aa|up_8|NZ_CP046171.1_6109619_6110234_-	NA	NA|296aa|up_7|NZ_CP046171.1_6110518_6111406_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|59aa|up_6|NZ_CP046171.1_6111537_6111714_-	pfam01527, HTH_Tnp_1, Transposase	NA|126aa|up_5|NZ_CP046171.1_6111776_6112154_-	NA	NA|183aa|up_4|NZ_CP046171.1_6112417_6112966_-	NA	NA|345aa|up_3|NZ_CP046171.1_6112971_6114006_-	PRK07764, PRK07764, DNA polymerase III subunits gamma and tau; Validated	NA|180aa|up_2|NZ_CP046171.1_6114086_6114626_-	pfam09203, MspA, MspA	NA|537aa|up_1|NZ_CP046171.1_6115796_6117407_+	cd13123, MATE_MurJ_like, MurJ/MviN, a subfamily of the multidrug and toxic compound extrusion (MATE)-like proteins	NA|138aa|up_0|NZ_CP046171.1_6119224_6119638_+	pfam04218, CENP-B_N, CENP-B N-terminal DNA-binding domain	cas2|152aa|down_0|NZ_CP046171.1_6121242_6121698_-	pfam09707, Cas_Cas2CT1978, CRISPR-associated protein (Cas_Cas2CT1978)	cas1|254aa|down_1|NZ_CP046171.1_6121640_6122402_-	cd09719, Cas1_I-E, CRISPR/Cas system-associated protein Cas1	cas6e|223aa|down_2|NZ_CP046171.1_6122443_6123112_-	pfam08798, CRISPR_assoc, CRISPR associated protein	cas5|237aa|down_3|NZ_CP046171.1_6123111_6123822_-	cd09756, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|372aa|down_4|NZ_CP046171.1_6123818_6124934_-	pfam09344, Cas_CT1975, CT1975-like protein	cse2gr11|213aa|down_5|NZ_CP046171.1_6124926_6125565_-	pfam09485, CRISPR_Cse2, CRISPR-associated protein Cse2 (CRISPR_cse2)	cas8e|560aa|down_6|NZ_CP046171.1_6125561_6127241_-	pfam09481, CRISPR_Cse1, CRISPR-associated protein Cse1 (CRISPR_cse1)	cas3|915aa|down_7|NZ_CP046171.1_6127237_6129982_-	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	NA|54aa|down_8|NZ_CP046171.1_6131201_6131363_-	pfam18019, HD_6, HD domain	NA|55aa|down_9|NZ_CP046171.1_6133003_6133168_-	NA
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	10	6131721-6131810	9	CRISPRCasFinder	no	cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Type I-E	CGGATCATCCCCGCGTGCGCGGGGAGCAC	29	0	0	NA	NA	I-E	1	1	TypeI-E	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA,NA|55aa|down_0|NZ_CP046171.1_6133003_6133168_-,NA|219aa|down_9|NZ_CP046171.1_6140559_6141216_-	NA|138aa|up_9|NZ_CP046171.1_6119224_6119638_+	pfam04218, CENP-B_N, CENP-B N-terminal DNA-binding domain	cas2|152aa|up_8|NZ_CP046171.1_6121242_6121698_-	pfam09707, Cas_Cas2CT1978, CRISPR-associated protein (Cas_Cas2CT1978)	cas1|254aa|up_7|NZ_CP046171.1_6121640_6122402_-	cd09719, Cas1_I-E, CRISPR/Cas system-associated protein Cas1	cas6e|223aa|up_6|NZ_CP046171.1_6122443_6123112_-	pfam08798, CRISPR_assoc, CRISPR associated protein	cas5|237aa|up_5|NZ_CP046171.1_6123111_6123822_-	cd09756, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|372aa|up_4|NZ_CP046171.1_6123818_6124934_-	pfam09344, Cas_CT1975, CT1975-like protein	cse2gr11|213aa|up_3|NZ_CP046171.1_6124926_6125565_-	pfam09485, CRISPR_Cse2, CRISPR-associated protein Cse2 (CRISPR_cse2)	cas8e|560aa|up_2|NZ_CP046171.1_6125561_6127241_-	pfam09481, CRISPR_Cse1, CRISPR-associated protein Cse1 (CRISPR_cse1)	cas3|915aa|up_1|NZ_CP046171.1_6127237_6129982_-	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	NA|54aa|up_0|NZ_CP046171.1_6131201_6131363_-	pfam18019, HD_6, HD domain	NA|55aa|down_0|NZ_CP046171.1_6133003_6133168_-	NA	NA|138aa|down_1|NZ_CP046171.1_6133170_6133584_-	pfam15633, Tox-ART-HYD1, HYD1 signature containing ADP-ribosyltransferase	NA|459aa|down_2|NZ_CP046171.1_6133743_6135120_-	cd19533, starter-C_NRPS, Starter Condensation domains, found in the first module of nonribosomal peptide synthetases (NRPSs)	NA|63aa|down_3|NZ_CP046171.1_6135140_6135329_-	pfam00301, Rubredoxin, Rubredoxin	NA|356aa|down_4|NZ_CP046171.1_6135372_6136440_-	cd03507, Delta12-FADS-like, The Delta12 Fatty Acid Desaturase (Delta12-FADS)-like CD includes the integral-membrane enzymes, delta-12 acyl-lipid desaturases, oleate 12-hydroxylases, omega3 and omega6 fatty acid desaturases, and other related proteins, found in a wide range of organisms including higher plants, green algae, diatoms, nematodes, fungi, and bacteria	NA|97aa|down_5|NZ_CP046171.1_6136462_6136753_-	smart00823, PKS_PP, Phosphopantetheine attachment site	NA|308aa|down_6|NZ_CP046171.1_6136787_6137711_-	COG1398, OLE1, Fatty-acid desaturase [Lipid metabolism]	NA|309aa|down_7|NZ_CP046171.1_6137761_6138688_-	COG1398, OLE1, Fatty-acid desaturase [Lipid metabolism]	NA|557aa|down_8|NZ_CP046171.1_6138684_6140355_-	cd05931, FAAL, Fatty acyl-AMP ligase (FAAL)	NA|219aa|down_9|NZ_CP046171.1_6140559_6141216_-	NA
GCF_011801125.1_ASM1180112v1	NZ_CP046171	Nocardia brasiliensis strain AUSMDU00024985 chromosome, complete genome	11	6159657-6160172	2,10,3	PILER-CR,CRISPRCasFinder,CRT	no		cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	Orphan	GGATCATCCCCGCGTGCGCGGGGAGCAC,GGATCATCCCCGCGTGCGCGGGGAGCAC,GGATCATCCCCGCGTGCGCGGGGAGCAC	28,28,28	0	0	NA	NA	I-E:I-E:I-E	8,8,8	8	Orphan	cas3,csa3,DinG,DEDDh,WYL,casR,cas4,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	NA,NA	NA|255aa|up_9|NZ_CP046171.1_6147793_6148558_-	cd01641, Bacterial_IMPase_like_1, Predominantly bacterial family of Mg++ dependend phosphatases, related to inositol monophosphatases	NA|299aa|up_8|NZ_CP046171.1_6148566_6149463_-	pfam01636, APH, Phosphotransferase enzyme family	NA|517aa|up_7|NZ_CP046171.1_6149569_6151120_+	COG2303, BetA, Choline dehydrogenase and related flavoproteins [Amino acid transport and metabolism]	NA|256aa|up_6|NZ_CP046171.1_6151132_6151900_-	COG3622, Hfi, Hydroxypyruvate isomerase [Carbohydrate transport and metabolism]	NA|275aa|up_5|NZ_CP046171.1_6151984_6152809_+	cd05327, retinol-DH_like_SDR_c_like, retinol dehydrogenase (retinol-DH), Light dependent Protochlorophyllide (Pchlide) OxidoReductase (LPOR) and related proteins, classical (c) SDRs	NA|91aa|up_4|NZ_CP046171.1_6152825_6153098_-	pfam00550, PP-binding, Phosphopantetheine attachment site	NA|557aa|up_3|NZ_CP046171.1_6153094_6154765_-	cd05931, FAAL, Fatty acyl-AMP ligase (FAAL)	NA|223aa|up_2|NZ_CP046171.1_6154954_6155623_+	COG1960, CaiA, Acyl-CoA dehydrogenases [Lipid metabolism]	NA|467aa|up_1|NZ_CP046171.1_6157097_6158498_+	pfam00067, p450, Cytochrome P450	NA|351aa|up_0|NZ_CP046171.1_6158531_6159584_+	pfam18007, DUF5593, Domain of unknown function (DUF5593)	NA|146aa|down_0|NZ_CP046171.1_6160807_6161245_-	pfam11774, Lsr2, Lsr2	NA|469aa|down_1|NZ_CP046171.1_6163732_6165139_+	pfam02720, DUF222, Domain of unknown function (DUF222)	NA|268aa|down_2|NZ_CP046171.1_6165621_6166425_-	pfam04672, Methyltransf_19, S-adenosyl methyltransferase	NA|234aa|down_3|NZ_CP046171.1_6166529_6167231_-	pfam13462, Thioredoxin_4, Thioredoxin	NA|480aa|down_4|NZ_CP046171.1_6167341_6168781_-	cd17325, MFS_MdtG_SLC18_like, bacterial MdtG-like and eukaryotic solute carrier 18 (SLC18) family of the Major Facilitator Superfamily of transporters	NA|547aa|down_5|NZ_CP046171.1_6168773_6170414_-	PRK07564, PRK07564, phosphoglucomutase; Validated	NA|80aa|down_6|NZ_CP046171.1_6170461_6170701_-	PRK14232, PRK14232, fluoride efflux transporter CrcB	NA|136aa|down_7|NZ_CP046171.1_6170697_6171105_-	pfam02641, DUF190, Uncharacterized ACR, COG1993	NA|384aa|down_8|NZ_CP046171.1_6171593_6172745_+	pfam03583, LIP, Secretory lipase	NA|500aa|down_9|NZ_CP046171.1_6173058_6174558_-	TIGR00711, Uncharacterized_MFS-type_transporter_YhcA, drug resistance transporter, EmrB/QacA subfamily
