assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000355675.1_ASM35567v1	NC_020888	Thalassolituus oleivorans MIL-1, complete genome	1	140787-140908	1	CRISPRCasFinder	no		WYL,cas3,csa3,RT,PD-DExK,DEDDh,DinG,cas2,cas1,cas4,cas7,cas8c,cas5	Orphan	TGCGGCGGTAAATCAGAAGCCGAAGGCAA	29	1	1	140816-140879	NC_020888.1_140909-140972	NA	1	1	Orphan	WYL,cas3,csa3,RT,PD-DExK,DEDDh,DinG,cas2,cas1,cas4,cas7,cas8c,cas5	NA,NA|255aa|down_5|NC_020888.1_145647_146412_-	NA|353aa|up_9|NC_020888.1_130219_131278_-	cd00118, LysM, Lysin Motif is a small domain involved in binding peptidoglycan	NA|174aa|up_8|NC_020888.1_131394_131916_+	PRK00150, def, peptide deformylase; Reviewed	NA|317aa|up_7|NC_020888.1_131919_132870_+	PRK00005, fmt, methionyl-tRNA formyltransferase; Reviewed	NA|434aa|up_6|NC_020888.1_132920_134222_+	PRK10901, PRK10901, 16S rRNA (cytosine(967)-C(5))-methyltransferase RsmB	NA|458aa|up_5|NC_020888.1_134274_135648_+	PRK09496, trkA, Trk system potassium transporter TrkA	NA|483aa|up_4|NC_020888.1_135659_137108_+	PRK10750, PRK10750, Trk system potassium transporter TrkH	NA|496aa|up_3|NC_020888.1_137264_138752_+	COG0659, SUL1, Sulfate permease and related transporters (MFS superfamily) [Inorganic ion transport and metabolism]	NA|284aa|up_2|NC_020888.1_138788_139640_+	cd00293, USP_Like, Usp: Universal stress protein family	NA|184aa|up_1|NC_020888.1_139775_140327_+	PRK12544, PRK12544, RNA polymerase factor sigma-70	NA|66aa|up_0|NC_020888.1_140323_140521_+	pfam13490, zf-HC2, Putative zinc-finger	NA|206aa|down_0|NC_020888.1_141074_141692_+	pfam07681, DoxX, DoxX	NA|302aa|down_1|NC_020888.1_141718_142624_-	COG1560, HtrB, Lauroyl/myristoyl acyltransferase [Cell envelope biogenesis, outer membrane]	NA|549aa|down_2|NC_020888.1_142759_144406_+	cd17589, REC_TPR, phosphoacceptor receiver (REC) domain of uncharacterized tetratricopeptide repeat (TPR)-containing response regulators	NA|220aa|down_3|NC_020888.1_144425_145085_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|187aa|down_4|NC_020888.1_145096_145657_-	COG0742, COG0742, N6-adenine-specific methylase [DNA replication, recombination, and repair]	NA|255aa|down_5|NC_020888.1_145647_146412_-	NA	NA|423aa|down_6|NC_020888.1_146547_147816_+	PRK10416, PRK10416, signal recognition particle-docking protein FtsY; Provisional	NA|237aa|down_7|NC_020888.1_147840_148551_+	COG2884, FtsE, Predicted ATPase involved in cell division [Cell division and chromosome partitioning]	NA|312aa|down_8|NC_020888.1_148651_149587_+	COG2177, FtsX, Cell division protein [Cell division and chromosome partitioning]	NA|290aa|down_9|NC_020888.1_149712_150582_+	PRK06596, PRK06596, RNA polymerase factor sigma-32; Reviewed
GCF_000355675.1_ASM35567v1	NC_020888	Thalassolituus oleivorans MIL-1, complete genome	2	439471-439691	2	CRISPRCasFinder	no		WYL,cas3,csa3,RT,PD-DExK,DEDDh,DinG,cas2,cas1,cas4,cas7,cas8c,cas5	Orphan	GGCGCGGTGACCGGTGATTATTATGTCGGCGGCTTGGCTGGCTATCTATCGAG	53	0	0	NA	NA	NA	1	1	Orphan	WYL,cas3,csa3,RT,PD-DExK,DEDDh,DinG,cas2,cas1,cas4,cas7,cas8c,cas5	NA|365aa|up_9|NC_020888.1_417332_418427_-,NA|448aa|up_8|NC_020888.1_418429_419773_-,NA|195aa|up_6|NC_020888.1_420105_420690_-,NA|2368aa|down_0|NC_020888.1_446615_453719_+,NA|104aa|down_3|NC_020888.1_457893_458205_+	NA|365aa|up_9|NC_020888.1_417332_418427_-	NA	NA|448aa|up_8|NC_020888.1_418429_419773_-	NA	NA|98aa|up_7|NC_020888.1_419808_420102_-	cd14738, PAAR_2, proline-alanine-alanine-arginine (PAAR) domain	NA|195aa|up_6|NC_020888.1_420105_420690_-	NA	NA|629aa|up_5|NC_020888.1_420701_422588_-	TIGR03361, VI_Rhs_Vgr, type VI secretion system Vgr family protein	NA|163aa|up_4|NC_020888.1_422739_423228_-	pfam05638, T6SS_HCP, Type VI secretion system effector, Hcp	NA|243aa|up_3|NC_020888.1_423640_424369_-	COG1943, COG1943, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|291aa|up_2|NC_020888.1_424620_425493_+	COG0631, PTC1, Serine/threonine protein phosphatase [Signal transduction mechanisms]	NA|684aa|up_1|NC_020888.1_425902_427954_+	COG2831, FhaC, Hemolysin activation/secretion protein [Intracellular trafficking and secretion]	NA|3592aa|up_0|NC_020888.1_428051_438827_+	TIGR01901, Heme/hemopexin-binding_protein, filamentous hemagglutinin family N-terminal domain	NA|2368aa|down_0|NC_020888.1_446615_453719_+	NA	NA|702aa|down_1|NC_020888.1_453992_456098_+	COG1593, DctQ, TRAP-type C4-dicarboxylate transport system, large permease component [Carbohydrate transport and metabolism]	NA|530aa|down_2|NC_020888.1_456185_457775_+	PRK00741, prfC, peptide chain release factor 3; Provisional	NA|104aa|down_3|NC_020888.1_457893_458205_+	NA	NA|144aa|down_4|NC_020888.1_458350_458782_+	PRK09216, rplM, 50S ribosomal protein L13; Reviewed	NA|131aa|down_5|NC_020888.1_458786_459179_+	PRK00132, rpsI, 30S ribosomal protein S9; Reviewed	NA|199aa|down_6|NC_020888.1_459399_459996_+	TIGR01416, Rieske_proteo, ubiquinol-cytochrome c reductase, iron-sulfur subunit	NA|403aa|down_7|NC_020888.1_460019_461228_+	MTH00145, CYTB, cytochrome b; Provisional	NA|253aa|down_8|NC_020888.1_461230_461989_+	COG2857, CYT1, Cytochrome c1 [Energy production and conversion]	NA|209aa|down_9|NC_020888.1_462084_462711_+	PRK09481, sspA, stringent starvation protein A; Provisional
GCF_000355675.1_ASM35567v1	NC_020888	Thalassolituus oleivorans MIL-1, complete genome	3	2060414-2060500	3	CRISPRCasFinder	no		WYL,cas3,csa3,RT,PD-DExK,DEDDh,DinG,cas2,cas1,cas4,cas7,cas8c,cas5	Orphan	GTGTCTAAGAAACTAGGGGCGATTCAG	27	1	9	2060441-2060473|2060441-2060473|2060441-2060473|2060441-2060473|2060441-2060473|2060441-2060473|2060441-2060473|2060441-2060473|2060441-2060473	NC_020888.1_476805-476837|NC_020888.1_1429188-1429220|NC_020888.1_2291199-2291167|NC_020888.1_2692277-2692245|NC_020888.1_2944140-2944108|NC_020888.1_3498826-3498794|NC_020888.1_11381-11413|NC_020888.1_2059266-2059234|NC_020888.1_2049491-2049523	NA	1	1	Orphan	WYL,cas3,csa3,RT,PD-DExK,DEDDh,DinG,cas2,cas1,cas4,cas7,cas8c,cas5	NA|530aa|up_7|NC_020888.1_2049535_2051125_-,NA|175aa|down_0|NC_020888.1_2060640_2061165_+,NA|126aa|down_6|NC_020888.1_2066222_2066600_+,NA|250aa|down_7|NC_020888.1_2067461_2068211_+	NA|466aa|up_9|NC_020888.1_2046760_2048158_-	TIGR03696, tRNA_nuclease_WapA, RHS repeat-associated core domain	NA|384aa|up_8|NC_020888.1_2048380_2049531_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|530aa|up_7|NC_020888.1_2049535_2051125_-	NA	NA|192aa|up_6|NC_020888.1_2051680_2052256_-	pfam01292, Ni_hydr_CYTB, Prokaryotic cytochrome b561	NA|230aa|up_5|NC_020888.1_2052300_2052990_-	cd02432, Nodulin-21_like_1, Nodulin-21 and CCC1-related protein family	NA|327aa|up_4|NC_020888.1_2053130_2054111_-	pfam05275, CopB, Copper resistance protein B precursor (CopB)	NA|579aa|up_3|NC_020888.1_2054107_2055844_-	TIGR01480, unnamed_protein_product, copper-resistance protein, CopA family	NA|435aa|up_2|NC_020888.1_2056365_2057670_-	PRK10337, PRK10337, sensor protein QseC; Provisional	NA|219aa|up_1|NC_020888.1_2057666_2058323_-	PRK10643, PRK10643, two-component system response regulator PmrA	NA|384aa|up_0|NC_020888.1_2059225_2060376_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|175aa|down_0|NC_020888.1_2060640_2061165_+	NA	NA|194aa|down_1|NC_020888.1_2061476_2062058_-	cd02135, YdjA-like, nitroreductase family protein similar to Escherichia coli YdjA	NA|463aa|down_2|NC_020888.1_2062233_2063622_+	cd07302, CHD, cyclase homology domain	NA|279aa|down_3|NC_020888.1_2063653_2064490_-	PRK11792, queF, 7-cyano-7-deazaguanine reductase; Provisional	NA|259aa|down_4|NC_020888.1_2064504_2065281_-	PRK15066, PRK15066, inner membrane transport permease; Provisional	NA|307aa|down_5|NC_020888.1_2065277_2066198_-	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|126aa|down_6|NC_020888.1_2066222_2066600_+	NA	NA|250aa|down_7|NC_020888.1_2067461_2068211_+	NA	NA|157aa|down_8|NC_020888.1_2068201_2068672_-	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|162aa|down_9|NC_020888.1_2068671_2069157_-	COG0386, BtuE, Glutathione peroxidase [Posttranslational modification, protein turnover, chaperones]
GCF_000355675.1_ASM35567v1	NC_020888	Thalassolituus oleivorans MIL-1, complete genome	4	2343575-2351279	1,4,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas4,cas7,cas8c,cas5,cas3,WYL	WYL,cas3,csa3,RT,PD-DExK,DEDDh,DinG,cas2,cas1,cas4,cas7,cas8c,cas5	Type I-U, Type I-U?,Type I-C	GTTTCTATCCGCGCGCCCGTGAAGGACGCGAC,GTTTCTATCCGCGCGCCCGTGAAGGACGCGAC,GTTTCTATCCGCGCGCCCGTGAAGGACGCGAC,GTTTCTATCCGCGCGCCCGTGAAGGACGCGAC	32,32,32,32	0	0	NA	NA	NA:NA:NA:NA	114,116,116,114	116	TypeI-U,TypeI-U?,TypeI-C	WYL,cas3,csa3,RT,PD-DExK,DEDDh,DinG,cas2,cas1,cas4,cas7,cas8c,cas5	NA|140aa|up_7|NC_020888.1_2338924_2339344_-,NA|58aa|up_6|NC_020888.1_2339552_2339726_-,NA|174aa|up_5|NC_020888.1_2339722_2340244_-,NA|188aa|up_4|NC_020888.1_2340577_2341141_-,NA|86aa|up_3|NC_020888.1_2341334_2341592_-,NA|81aa|up_2|NC_020888.1_2341789_2342032_+,NA|190aa|up_1|NC_020888.1_2342154_2342724_-,NA|133aa|down_9|NC_020888.1_2362962_2363361_+	NA|371aa|up_9|NC_020888.1_2336645_2337758_-	PRK11784, PRK11784, tRNA 2-selenouridine synthase; Provisional	NA|355aa|up_8|NC_020888.1_2337754_2338819_-	PRK00943, PRK00943, selenide, water dikinase SelD	NA|140aa|up_7|NC_020888.1_2338924_2339344_-	NA	NA|58aa|up_6|NC_020888.1_2339552_2339726_-	NA	NA|174aa|up_5|NC_020888.1_2339722_2340244_-	NA	NA|188aa|up_4|NC_020888.1_2340577_2341141_-	NA	NA|86aa|up_3|NC_020888.1_2341334_2341592_-	NA	NA|81aa|up_2|NC_020888.1_2341789_2342032_+	NA	NA|190aa|up_1|NC_020888.1_2342154_2342724_-	NA	NA|209aa|up_0|NC_020888.1_2342726_2343353_-	pfam14412, AHH, A nuclease family of the HNH/ENDO VII superfamily with conserved AHH	cas2|98aa|down_0|NC_020888.1_2351467_2351761_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|339aa|down_1|NC_020888.1_2351762_2352779_-	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas4|209aa|down_2|NC_020888.1_2352775_2353402_-	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	cas7|287aa|down_3|NC_020888.1_2353417_2354278_-	pfam05107, Cas_Cas7, CRISPR-associated protein Cas7	cas8c|587aa|down_4|NC_020888.1_2354261_2356022_-	pfam09709, Cas_Csd1, CRISPR-associated protein (Cas_Csd1)	cas5|219aa|down_5|NC_020888.1_2356018_2356675_-	cd09752, Cas5_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas3|757aa|down_6|NC_020888.1_2357001_2359272_-	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	WYL|288aa|down_7|NC_020888.1_2359367_2360231_-	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	NA|352aa|down_8|NC_020888.1_2360662_2361718_+	TIGR02899, hypothetical_conserved_protein, spore coat assembly protein SafA	NA|133aa|down_9|NC_020888.1_2362962_2363361_+	NA
