assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000306785.1_ASM30678v1	NC_017955	Modestobacter marinus, complete genome	1	15901-16009	1	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	Orphan	ATCCTCGACGAGCTGGCCGAGATCG	25	0	0	NA	NA	NA	1	1	Orphan	cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	NA|306aa|up_3|NC_017955.1_6659_7577_+,NA|48aa|down_1|NC_017955.1_18374_18518_+	NA|NA	NA	NA|617aa|up_8|NC_017955.1_208_2059_+	PRK14086, dnaA, chromosomal replication initiator protein DnaA	NA|388aa|up_7|NC_017955.1_2665_3829_+	PRK07761, PRK07761, DNA polymerase III subunit beta; Validated	NA|323aa|up_6|NC_017955.1_3952_4921_+	PRK09599, PRK09599, NADP-dependent phosphogluconate dehydrogenase	NA|394aa|up_5|NC_017955.1_4953_6135_+	PRK00064, recF, recombination protein F; Reviewed	NA|167aa|up_4|NC_017955.1_6127_6628_+	PRK03195, PRK03195, DUF721 family protein	NA|306aa|up_3|NC_017955.1_6659_7577_+	NA	NA|635aa|up_2|NC_017955.1_7459_9364_+	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|468aa|up_1|NC_017955.1_9497_10901_+	TIGR00909, putative_amino_acid_transporter, amino acid transporter	NA|679aa|up_0|NC_017955.1_11156_13193_+	PRK05644, gyrB, DNA gyrase subunit B; Validated	NA|236aa|down_0|NC_017955.1_17418_18126_+	pfam12089, DUF3566, Transmembrane domain of unknown function (DUF3566)	NA|48aa|down_1|NC_017955.1_18374_18518_+	NA	NA|659aa|down_2|NC_017955.1_18763_20740_+	pfam07228, SpoIIE, Stage II sporulation protein E (SpoIIE)	NA|179aa|down_3|NC_017955.1_20855_21392_+	COG0652, PpiB, Peptidyl-prolyl cis-trans isomerase (rotamase) - cyclophilin family [Posttranslational modification, protein turnover, chaperones]	NA|247aa|down_4|NC_017955.1_21535_22276_+	pfam01694, Rhomboid, Rhomboid family	NA|253aa|down_5|NC_017955.1_22285_23044_-	pfam10756, bPH_6, Bacterial PH domain	NA|91aa|down_6|NC_017955.1_23282_23555_-	pfam06781, CrgA, Cell division protein CrgA	NA|260aa|down_7|NC_017955.1_23710_24490_+	pfam05949, DUF881, Bacterial protein of unknown function (DUF881)	NA|222aa|down_8|NC_017955.1_24522_25188_+	PRK07765, PRK07765, aminodeoxychorismate/anthranilate synthase component II	NA|596aa|down_9|NC_017955.1_25202_26990_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins
GCF_000306785.1_ASM30678v1	NC_017955	Modestobacter marinus, complete genome	2	84998-85121	2	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	Orphan	TGCCCCCCACGACTCGCAGGCTCGCCGCGGGCCCCTGCA	39	0	0	NA	NA	NA	1	1	Orphan	cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	NA|112aa|up_7|NC_017955.1_75503_75839_-,NA|113aa|up_6|NC_017955.1_75835_76174_-,NA|520aa|down_8|NC_017955.1_94542_96102_+	NA|517aa|up_9|NC_017955.1_71956_73507_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|640aa|up_8|NC_017955.1_73603_75523_+	pfam07228, SpoIIE, Stage II sporulation protein E (SpoIIE)	NA|112aa|up_7|NC_017955.1_75503_75839_-	NA	NA|113aa|up_6|NC_017955.1_75835_76174_-	NA	NA|428aa|up_5|NC_017955.1_76714_77998_+	PRK00549, PRK00549, competence damage-inducible protein A; Provisional	NA|726aa|up_4|NC_017955.1_78777_80955_+	PHA03247, PHA03247, large tegument protein UL36; Provisional	NA|130aa|up_3|NC_017955.1_81430_81820_+	cd08862, SRPBCC_Smu440-like, Ligand-binding SRPBCC domain of Streptococcus mutans Smu	NA|543aa|up_2|NC_017955.1_81861_83490_+	PRK11561, PRK11561, isovaleryl CoA dehydrogenase; Provisional	NA|254aa|up_1|NC_017955.1_83497_84259_+	cd10911, PIN_LabA, PIN domain of Synechococcus elongatus LabA (low-amplitude and bright) and related proteins	NA|116aa|up_0|NC_017955.1_84262_84610_-	TIGR01150, Reaction_center_protein_H_chain, photosynthetic reaction center, subunit H, bacterial	NA|134aa|down_0|NC_017955.1_85198_85600_+	pfam13671, AAA_33, AAA domain	NA|164aa|down_1|NC_017955.1_85603_86095_-	cd16936, HATPase_RsbW-like, Histidine kinase-like ATPase domain of RsbW, an anti sigma-B factor and serine-protein kinase involved in regulating sigma-B during stress in Bacilli, and related domains	NA|101aa|down_2|NC_017955.1_86186_86489_-	cd07043, STAS_anti-anti-sigma_factors, Sulphate Transporter and Anti-Sigma factor antagonist) domain of anti-anti-sigma factors, key regulators of anti-sigma factors by phosphorylation	NA|342aa|down_3|NC_017955.1_86722_87748_-	COG1957, URH1, Inosine-uridine nucleoside N-ribohydrolase [Nucleotide transport and metabolism]	NA|607aa|down_4|NC_017955.1_88776_90597_+	COG0405, Ggt, Gamma-glutamyltransferase [Amino acid transport and metabolism]	NA|870aa|down_5|NC_017955.1_90634_93244_+	pfam07228, SpoIIE, Stage II sporulation protein E (SpoIIE)	NA|147aa|down_6|NC_017955.1_93250_93691_-	cd16936, HATPase_RsbW-like, Histidine kinase-like ATPase domain of RsbW, an anti sigma-B factor and serine-protein kinase involved in regulating sigma-B during stress in Bacilli, and related domains	NA|229aa|down_7|NC_017955.1_93852_94539_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|520aa|down_8|NC_017955.1_94542_96102_+	NA	NA|256aa|down_9|NC_017955.1_96105_96873_-	COG0619, CbiQ, ABC-type cobalt transport system, permease component CbiQ and related transporters [Inorganic ion transport and metabolism]
GCF_000306785.1_ASM30678v1	NC_017955	Modestobacter marinus, complete genome	3	2275729-2276041	3	CRISPRCasFinder	no		cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	Orphan	GGCGGCGTCCCTGACCCCGACGCCGTCC	28	0	0	NA	NA	NA	5	5	Orphan	cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	NA|201aa|up_8|NC_017955.1_2267813_2268416_+,NA|146aa|up_3|NC_017955.1_2271398_2271836_-,NA|86aa|up_0|NC_017955.1_2274432_2274690_+,NA|114aa|down_8|NC_017955.1_2285117_2285459_-	NA|566aa|up_9|NC_017955.1_2266119_2267817_+	cd03392, PAP2_like_2, PAP2_like_2 proteins	NA|201aa|up_8|NC_017955.1_2267813_2268416_+	NA	NA|366aa|up_7|NC_017955.1_2268412_2269510_+	COG0392, COG0392, Predicted integral membrane protein [Function unknown]	NA|209aa|up_6|NC_017955.1_2269506_2270133_+	cd03392, PAP2_like_2, PAP2_like_2 proteins	NA|233aa|up_5|NC_017955.1_2270132_2270831_+	cd03392, PAP2_like_2, PAP2_like_2 proteins	NA|147aa|up_4|NC_017955.1_2270851_2271292_-	cd16936, HATPase_RsbW-like, Histidine kinase-like ATPase domain of RsbW, an anti sigma-B factor and serine-protein kinase involved in regulating sigma-B during stress in Bacilli, and related domains	NA|146aa|up_3|NC_017955.1_2271398_2271836_-	NA	NA|199aa|up_2|NC_017955.1_2271896_2272493_-	COG4122, COG4122, Predicted O-methyltransferase [General function prediction only]	NA|584aa|up_1|NC_017955.1_2272619_2274371_+	cd01662, Ubiquinol_Oxidase_I, Ubiquinol oxidase subunit I	NA|86aa|up_0|NC_017955.1_2274432_2274690_+	NA	NA|134aa|down_0|NC_017955.1_2277082_2277484_-	COG3607, COG3607, Predicted lactoylglutathione lyase [General function prediction only]	NA|393aa|down_1|NC_017955.1_2277486_2278665_-	COG0412, COG0412, Dienelactone hydrolase and related enzymes [Secondary metabolites biosynthesis, transport, and catabolism]	NA|325aa|down_2|NC_017955.1_2278692_2279667_-	pfam01557, FAA_hydrolase, Fumarylacetoacetate (FAA) hydrolase family	NA|314aa|down_3|NC_017955.1_2279666_2280608_-	cd07239, BphC5-RK37_C_like, C-terminal, catalytic domain of BphC5 (2,3-dihydroxybiphenyl 1,2-dioxygenase)	NA|377aa|down_4|NC_017955.1_2280624_2281755_-	PRK06847, PRK06847, hypothetical protein; Provisional	NA|332aa|down_5|NC_017955.1_2281763_2282759_-	pfam04199, Cyclase, Putative cyclase	NA|321aa|down_6|NC_017955.1_2282865_2283828_+	cd08417, PBP2_Nitroaromatics_like, The C-terminal substrate binding domain of LysR-type transcriptional regulators that involved in the catabolism of nitroaromatic/naphthalene compounds and that of related regulators; contains the type 2 periplasmic binding fold	NA|428aa|down_7|NC_017955.1_2283870_2285154_+	cd17473, MFS_arabinose_efflux_permease_like, Putative arabinose efflux permease family transporters of the Major Facilitator Superfamily	NA|114aa|down_8|NC_017955.1_2285117_2285459_-	NA	NA|727aa|down_9|NC_017955.1_2285497_2287678_-	COG2409, COG2409, Predicted drug exporters of the RND superfamily [General function prediction only]
GCF_000306785.1_ASM30678v1	NC_017955	Modestobacter marinus, complete genome	4	2580352-2580499	1	PILER-CR	no	WYL	cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	Unclear	CAGGGCGGCTGGGGGCCGCCGAGCCAGTACGGC	33	0	0	NA	NA	NA	2	2	Orphan	cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	NA|357aa|up_8|NC_017955.1_2569732_2570803_+,NA|64aa|up_4|NC_017955.1_2574782_2574974_+,NA|283aa|down_4|NC_017955.1_2585314_2586163_-	NA|453aa|up_9|NC_017955.1_2568352_2569711_+	TIGR03686, pupylate_PafA, Pup--protein ligase	NA|357aa|up_8|NC_017955.1_2569732_2570803_+	NA	NA|341aa|up_7|NC_017955.1_2571581_2572604_-	pfam12982, DUF3866, Protein of unknown function (DUF3866)	WYL|326aa|up_6|NC_017955.1_2572773_2573751_+	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	WYL|313aa|up_5|NC_017955.1_2573774_2574713_+	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	NA|64aa|up_4|NC_017955.1_2574782_2574974_+	NA	NA|114aa|up_3|NC_017955.1_2575070_2575412_+	PRK00191, tatA, twin arginine translocase protein A; Provisional	NA|286aa|up_2|NC_017955.1_2575500_2576358_+	pfam00902, TatC, Sec-independent protein translocase protein (TatC)	NA|299aa|up_1|NC_017955.1_2576368_2577265_+	PRK11914, PRK11914, diacylglycerol kinase; Reviewed	NA|951aa|up_0|NC_017955.1_2577344_2580197_+	COG4581, COG4581, Superfamily II RNA helicase [DNA replication, recombination, and repair]	NA|303aa|down_0|NC_017955.1_2580991_2581900_-	smart00475, 53EXOc, 5'-3' exonuclease	NA|381aa|down_1|NC_017955.1_2581974_2583117_+	COG0006, PepP, Xaa-Pro aminopeptidase [Amino acid transport and metabolism]	NA|164aa|down_2|NC_017955.1_2583091_2583583_+	smart00344, HTH_ASNC, helix_turn_helix ASNC type	NA|541aa|down_3|NC_017955.1_2583681_2585304_+	cd00081, Hint, Hedgehog/Intein domain, found in Hedgehog proteins as well as proteins which contain inteins and undergo protein splicing (e	NA|283aa|down_4|NC_017955.1_2585314_2586163_-	NA	NA|252aa|down_5|NC_017955.1_2586327_2587083_-	cd07729, AHL_lactonase_MBL-fold, quorum-quenching N-acyl-homoserine lactonase, MBL-fold metallo-hydrolase domain	NA|224aa|down_6|NC_017955.1_2587287_2587959_+	COG3836, HpcH, 2,4-dihydroxyhept-2-ene-1,7-dioic acid aldolase [Carbohydrate transport and metabolism]	NA|288aa|down_7|NC_017955.1_2588013_2588877_+	cd07989, LPLAT_AGPAT-like, Lysophospholipid Acyltransferases (LPLATs) of Glycerophospholipid Biosynthesis: AGPAT-like	NA|483aa|down_8|NC_017955.1_2588860_2590309_-	pfam06762, LMF1, Lipase maturation factor	NA|171aa|down_9|NC_017955.1_2590327_2590840_-	pfam13302, Acetyltransf_3, Acetyltransferase (GNAT) domain
GCF_000306785.1_ASM30678v1	NC_017955	Modestobacter marinus, complete genome	5	4510226-4510467	1	CRT	no		cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	Orphan	GCCCCGGCGAAGCGGACCCGCAAGGCCGC	29	0	0	NA	NA	NA	3	3	Orphan	cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	NA,NA|625aa|down_6|NC_017955.1_4521083_4522958_+,NA|70aa|down_9|NC_017955.1_4524557_4524767_-	NA|280aa|up_9|NC_017955.1_4494285_4495125_-	COG4132, COG4132, ABC-type uncharacterized transport system, permease component [General function prediction only]	NA|383aa|up_8|NC_017955.1_4495220_4496369_-	cd13549, PBP2_Fbp_like_3, Substrate binding domain of an uncharacterized ferric iron transporter, a member of the type 2 periplasmic binding fold superfamily	NA|262aa|up_7|NC_017955.1_4496532_4497318_-	PRK08138, PRK08138, enoyl-CoA hydratase; Provisional	NA|274aa|up_6|NC_017955.1_4497365_4498187_-	COG1119, ModF, ABC-type molybdenum transport system, ATPase component/photorepair protein PhrA [Inorganic ion transport and metabolism]	NA|715aa|up_5|NC_017955.1_4498259_4500404_+	TIGR02100, Glycogen_operon_protein_GlgX_homolog, glycogen debranching enzyme GlgX	NA|325aa|up_4|NC_017955.1_4500802_4501777_-	cd00060, FHA, Forkhead associated domain (FHA); found in eukaryotic and prokaryotic proteins	NA|850aa|up_3|NC_017955.1_4501989_4504539_-	cd04299, GT35_Glycogen_Phosphorylase-like, proteins similar to glycogen phosphorylase	NA|669aa|up_2|NC_017955.1_4504664_4506671_+	cd11344, AmyAc_GlgE_like, Alpha amylase catalytic domain found in GlgE-like proteins	NA|622aa|up_1|NC_017955.1_4506771_4508637_+	TIGR02456, Trehalose_synthase, trehalose synthase	NA|458aa|up_0|NC_017955.1_4508636_4510010_+	COG3281, Ble, Uncharacterized protein, probably involved in trehalose biosynthesis [Carbohydrate transport and metabolism]	NA|484aa|down_0|NC_017955.1_4513367_4514819_+	COG2321, COG2321, Predicted metalloprotease [General function prediction only]	NA|305aa|down_1|NC_017955.1_4514931_4515846_-	COG3118, COG3118, Thioredoxin domain-containing protein [Posttranslational modification, protein turnover, chaperones]	NA|491aa|down_2|NC_017955.1_4515962_4517435_-	COG1233, COG1233, Phytoene dehydrogenase and related proteins [Secondary metabolites biosynthesis, transport, and catabolism]	NA|410aa|down_3|NC_017955.1_4517495_4518725_-	PRK05790, PRK05790, putative acyltransferase; Provisional	NA|150aa|down_4|NC_017955.1_4518939_4519389_+	TIGR03081, Methylmalonyl-CoA_epimerase_mitochondrial, methylmalonyl-CoA epimerase	NA|475aa|down_5|NC_017955.1_4519463_4520888_+	pfam09770, PAT1, Topoisomerase II-associated protein PAT1	NA|625aa|down_6|NC_017955.1_4521083_4522958_+	NA	NA|298aa|down_7|NC_017955.1_4523004_4523898_+	pfam14344, DUF4397, Domain of unknown function (DUF4397)	NA|192aa|down_8|NC_017955.1_4523972_4524548_+	cd05829, Sortase_F, Sortase domain found in the class F family of sortases	NA|70aa|down_9|NC_017955.1_4524557_4524767_-	NA
GCF_000306785.1_ASM30678v1	NC_017955	Modestobacter marinus, complete genome	6	5166512-5166589	4	CRISPRCasFinder	no	csa3	cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	Type I-A	CCGCCGAAGATGTCGCCCAGGCCG	24	0	0	NA	NA	NA	1	1	Orphan	cas3,RT,DEDDh,csa3,WYL,cas4,casR,Cas9_archaeal	NA,NA|187aa|down_3|NC_017955.1_5172312_5172873_+	NA|415aa|up_9|NC_017955.1_5153890_5155135_+	pfam02515, CoA_transf_3, CoA-transferase family III	NA|257aa|up_8|NC_017955.1_5155131_5155902_+	PRK06144, PRK06144, enoyl-CoA hydratase; Provisional	NA|269aa|up_7|NC_017955.1_5155882_5156689_-	COG1414, IclR, Transcriptional regulator [Transcription]	NA|534aa|up_6|NC_017955.1_5156919_5158521_+	PRK09255, PRK09255, malate synthase; Validated	NA|473aa|up_5|NC_017955.1_5158741_5160160_+	PRK11230, PRK11230, glycolate oxidase subunit GlcD; Provisional	NA|423aa|up_4|NC_017955.1_5160159_5161428_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|467aa|up_3|NC_017955.1_5161427_5162828_+	PRK11274, glcF, glycolate oxidase subunit GlcF	NA|585aa|up_2|NC_017955.1_5162921_5164676_+	COG1620, LldP, L-lactate permease [Energy production and conversion]	NA|176aa|up_1|NC_017955.1_5164694_5165222_-	COG1846, MarR, Transcriptional regulators [Transcription]	NA|144aa|up_0|NC_017955.1_5165257_5165689_-	cd04766, HTH_HspR, Helix-Turn-Helix DNA binding domain of the HspR transcription regulator	NA|244aa|down_0|NC_017955.1_5166997_5167729_-	PRK14164, PRK14164, heat shock protein GrpE; Provisional	NA|623aa|down_1|NC_017955.1_5167791_5169660_-	PRK00290, dnaK, molecular chaperone DnaK; Provisional	NA|764aa|down_2|NC_017955.1_5169948_5172240_+	COG0247, GlpC, Fe-S oxidoreductase [Energy production and conversion]	NA|187aa|down_3|NC_017955.1_5172312_5172873_+	NA	NA|322aa|down_4|NC_017955.1_5172935_5173901_+	TIGR00271, Uncharacterized_protein_MJ0678, uncharacterized hydrophobic domain	NA|433aa|down_5|NC_017955.1_5173944_5175243_+	cd17339, MFS_NIMT_CynX_like, 2-nitroimidazole and cyanate transporters and similar proteins of the Major Facilitator Superfamily of transporters	NA|249aa|down_6|NC_017955.1_5175239_5175986_-	COG2890, HemK, Methylase of polypeptide chain release factors [Translation, ribosomal structure and biogenesis]	NA|203aa|down_7|NC_017955.1_5176087_5176696_-	PRK00416, dcd, deoxycytidine triphosphate deaminase; Reviewed	NA|136aa|down_8|NC_017955.1_5177504_5177912_-	cd04770, HTH_HMRTR, Helix-Turn-Helix DNA binding domain of Heavy Metal Resistance transcription regulators	NA|327aa|down_9|NC_017955.1_5178012_5178993_+	COG0798, ACR3, Arsenite efflux pump ACR3 and related permeases [Inorganic ion transport and metabolism]
