assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	1	4713-5156	1,1	CRT,PILER-CR	no		csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Orphan	NAAGAAGAAGAAAGCCGCCGC,AAGAAGAAGAAAGCCGCCGCCGCGGAA	21,27	0	0	NA	NA	NA:NA	6,2	6	Orphan	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA,NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|NA	NA	NA|373aa|up_3|NZ_LR593887.1_97_1216_+	COG0593, DnaA, ATPase involved in DNA replication initiation [DNA replication, recombination, and repair]	NA|369aa|up_2|NZ_LR593887.1_1548_2655_+	cd00140, beta_clamp, Beta clamp domain	NA|168aa|up_1|NZ_LR593887.1_2651_3155_+	pfam05258, DUF721, Protein of unknown function (DUF721)	NA|385aa|up_0|NZ_LR593887.1_3185_4340_+	cd03894, M20_ArgE, M20 Peptidase acetylornithine deacetylase	NA|334aa|down_0|NZ_LR593887.1_5408_6410_+	pfam07596, SBP_bac_10, Protein of unknown function (DUF1559)	NA|297aa|down_1|NZ_LR593887.1_6406_7297_-	COG2129, COG2129, Predicted phosphoesterases, related to the Icc protein [General function prediction only]	NA|438aa|down_2|NZ_LR593887.1_7440_8754_-	sd00033, LRR_RI, leucine-rich repeats, ribonuclease inhibitor (RI)-like subfamily	NA|784aa|down_3|NZ_LR593887.1_8827_11179_-	pfam00326, Peptidase_S9, Prolyl oligopeptidase family	NA|415aa|down_4|NZ_LR593887.1_11244_12489_-	PRK00711, PRK00711, D-amino acid dehydrogenase	NA|310aa|down_5|NZ_LR593887.1_12485_13415_-	PRK13970, PRK13970, 4-hydroxyproline epimerase	NA|306aa|down_6|NZ_LR593887.1_13534_14452_-	cd00408, DHDPS-like, Dihydrodipicolinate synthase family	NA|295aa|down_7|NZ_LR593887.1_14594_15479_+	COG1802, GntR, Transcriptional regulators [Transcription]	NA|897aa|down_8|NZ_LR593887.1_16258_18949_+	pfam07583, PSCyt2, Protein of unknown function (DUF1549)	NA|159aa|down_9|NZ_LR593887.1_18965_19442_+	PRK13557, PRK13557, histidine kinase; Provisional
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	2	282870-282979	1	CRISPRCasFinder	no		csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Orphan	GACAACGGCGGAGCCGGAAGCGGATC	26	1	1	282896-282953	NZ_LR593887.1_297133-297190	NA	1	1	Orphan	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA|113aa|up_8|NZ_LR593887.1_274794_275133_+,NA|75aa|up_6|NZ_LR593887.1_276894_277119_+,NA|269aa|up_5|NZ_LR593887.1_277322_278129_+,NA|271aa|up_3|NZ_LR593887.1_279463_280276_+,NA|215aa|up_1|NZ_LR593887.1_281560_282205_+,NA|152aa|up_0|NZ_LR593887.1_282201_282657_-,NA|401aa|down_0|NZ_LR593887.1_283139_284342_+,NA|129aa|down_1|NZ_LR593887.1_284332_284719_+,NA|177aa|down_3|NZ_LR593887.1_286115_286646_+,NA|153aa|down_7|NZ_LR593887.1_291513_291972_+,NA|179aa|down_9|NZ_LR593887.1_295267_295804_+	NA|153aa|up_9|NZ_LR593887.1_273823_274282_+	pfam14433, SUKH-3, SUKH-3 immunity protein	NA|113aa|up_8|NZ_LR593887.1_274794_275133_+	NA	NA|196aa|up_7|NZ_LR593887.1_275656_276244_+	pfam07591, PT-HINT, Pretoxin HINT domain	NA|75aa|up_6|NZ_LR593887.1_276894_277119_+	NA	NA|269aa|up_5|NZ_LR593887.1_277322_278129_+	NA	NA|298aa|up_4|NZ_LR593887.1_278546_279440_+	pfam07591, PT-HINT, Pretoxin HINT domain	NA|271aa|up_3|NZ_LR593887.1_279463_280276_+	NA	NA|325aa|up_2|NZ_LR593887.1_280583_281558_+	pfam07591, PT-HINT, Pretoxin HINT domain	NA|215aa|up_1|NZ_LR593887.1_281560_282205_+	NA	NA|152aa|up_0|NZ_LR593887.1_282201_282657_-	NA	NA|401aa|down_0|NZ_LR593887.1_283139_284342_+	NA	NA|129aa|down_1|NZ_LR593887.1_284332_284719_+	NA	NA|262aa|down_2|NZ_LR593887.1_285144_285930_+	pfam07591, PT-HINT, Pretoxin HINT domain	NA|177aa|down_3|NZ_LR593887.1_286115_286646_+	NA	NA|234aa|down_4|NZ_LR593887.1_287079_287781_+	pfam15526, Ntox21, Novel toxin 21	NA|154aa|down_5|NZ_LR593887.1_287783_288245_+	pfam18228, CdiI_N, CdiI N-terminal domain	NA|1052aa|down_6|NZ_LR593887.1_288343_291499_+	pfam07591, PT-HINT, Pretoxin HINT domain	NA|153aa|down_7|NZ_LR593887.1_291513_291972_+	NA	NA|996aa|down_8|NZ_LR593887.1_292275_295263_+	pfam10354, DUF2431, Domain of unknown function (DUF2431)	NA|179aa|down_9|NZ_LR593887.1_295267_295804_+	NA
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	3	301588-301695	2	CRISPRCasFinder	no		csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Orphan	GGGATGATCGACGATGTTCCCACTCCTGGAAAACCGCCC	39	0	0	NA	NA	NA	1	1	Orphan	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA|179aa|up_8|NZ_LR593887.1_295267_295804_+,NA|403aa|up_5|NZ_LR593887.1_297376_298585_+,NA|162aa|up_4|NZ_LR593887.1_298581_299067_+,NA|219aa|up_3|NZ_LR593887.1_299299_299956_+,NA|129aa|up_2|NZ_LR593887.1_299974_300361_+,NA|48aa|up_1|NZ_LR593887.1_300384_300528_+,NA|62aa|up_0|NZ_LR593887.1_300557_300743_-,NA|96aa|down_1|NZ_LR593887.1_303888_304176_+,NA|165aa|down_2|NZ_LR593887.1_305100_305595_-,NA|82aa|down_3|NZ_LR593887.1_306453_306699_-,NA|81aa|down_4|NZ_LR593887.1_307131_307374_-,NA|72aa|down_5|NZ_LR593887.1_307948_308164_-,NA|87aa|down_7|NZ_LR593887.1_309171_309432_-,NA|136aa|down_8|NZ_LR593887.1_310017_310425_-,NA|75aa|down_9|NZ_LR593887.1_310476_310701_-	NA|996aa|up_9|NZ_LR593887.1_292275_295263_+	pfam10354, DUF2431, Domain of unknown function (DUF2431)	NA|179aa|up_8|NZ_LR593887.1_295267_295804_+	NA	NA|190aa|up_7|NZ_LR593887.1_295780_296350_-	pfam13532, 2OG-FeII_Oxy_2, 2OG-Fe(II) oxygenase superfamily	NA|70aa|up_6|NZ_LR593887.1_297042_297252_-	PRK15313, PRK15313, intestinal colonization autotransporter adhesin MisL	NA|403aa|up_5|NZ_LR593887.1_297376_298585_+	NA	NA|162aa|up_4|NZ_LR593887.1_298581_299067_+	NA	NA|219aa|up_3|NZ_LR593887.1_299299_299956_+	NA	NA|129aa|up_2|NZ_LR593887.1_299974_300361_+	NA	NA|48aa|up_1|NZ_LR593887.1_300384_300528_+	NA	NA|62aa|up_0|NZ_LR593887.1_300557_300743_-	NA	NA|237aa|down_0|NZ_LR593887.1_303013_303724_+	pfam07591, PT-HINT, Pretoxin HINT domain	NA|96aa|down_1|NZ_LR593887.1_303888_304176_+	NA	NA|165aa|down_2|NZ_LR593887.1_305100_305595_-	NA	NA|82aa|down_3|NZ_LR593887.1_306453_306699_-	NA	NA|81aa|down_4|NZ_LR593887.1_307131_307374_-	NA	NA|72aa|down_5|NZ_LR593887.1_307948_308164_-	NA	NA|171aa|down_6|NZ_LR593887.1_308300_308813_-	pfam15640, Tox-MPTase4, Metallopeptidase toxin 4	NA|87aa|down_7|NZ_LR593887.1_309171_309432_-	NA	NA|136aa|down_8|NZ_LR593887.1_310017_310425_-	NA	NA|75aa|down_9|NZ_LR593887.1_310476_310701_-	NA
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	4	480156-481428	2,3,2	PILER-CR,CRISPRCasFinder,CRT	no		csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Orphan	GGCGCAGTCCGCACGAGCGATTAGAGCTCATTGAAAC,GGCGCAGTCCGCACGAGCGATTAGAGCTCATTGAAAC,GGCGCAGTCCGCACGAGCGATTNGAGCTCATTGAAAC	37,37,37	0	0	NA	NA	NA:NA:NA	15,15,16	16	Orphan	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA|183aa|up_9|NZ_LR593887.1_468723_469272_+,NA|170aa|up_7|NZ_LR593887.1_471191_471701_+,NA|98aa|up_0|NZ_LR593887.1_479600_479894_-,NA|119aa|down_0|NZ_LR593887.1_481454_481811_+	NA|183aa|up_9|NZ_LR593887.1_468723_469272_+	NA	NA|545aa|up_8|NZ_LR593887.1_469429_471064_+	PHA03247, PHA03247, large tegument protein UL36; Provisional	NA|170aa|up_7|NZ_LR593887.1_471191_471701_+	NA	NA|214aa|up_6|NZ_LR593887.1_471755_472397_+	pfam04299, FMN_bind_2, Putative FMN-binding domain	NA|474aa|up_5|NZ_LR593887.1_472478_473900_+	cd17324, MFS_NepI_like, Purine ribonucleoside efflux pump NepI and similar transporters of the Major Facilitator Superfamily	NA|311aa|up_4|NZ_LR593887.1_474081_475014_+	PRK07003, PRK07003, DNA polymerase III subunit gamma/tau	NA|150aa|up_3|NZ_LR593887.1_475039_475489_+	cd04301, NAT_SF, N-Acyltransferase superfamily: Various enzymes that characteristically catalyze the transfer of an acyl group to a substrate	NA|799aa|up_2|NZ_LR593887.1_475604_478001_-	pfam17963, Big_9, Bacterial Ig domain	NA|438aa|up_1|NZ_LR593887.1_478220_479534_-	COG0523, COG0523, Putative GTPases (G3E family) [General function prediction only]	NA|98aa|up_0|NZ_LR593887.1_479600_479894_-	NA	NA|119aa|down_0|NZ_LR593887.1_481454_481811_+	NA	NA|511aa|down_1|NZ_LR593887.1_481924_483457_-	pfam13360, PQQ_2, PQQ-like domain	NA|359aa|down_2|NZ_LR593887.1_483481_484558_-	pfam07596, SBP_bac_10, Protein of unknown function (DUF1559)	NA|1447aa|down_3|NZ_LR593887.1_485359_489700_+	NF012211, tand_rpt_95, tandem-95 repeat protein	NA|1545aa|down_4|NZ_LR593887.1_489766_494401_-	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|199aa|down_5|NZ_LR593887.1_494557_495154_-	COG4566, TtrR, Response regulator [Signal transduction mechanisms]	NA|349aa|down_6|NZ_LR593887.1_495160_496207_-	COG4191, COG4191, Signal transduction histidine kinase regulating C4-dicarboxylate transport system [Signal transduction mechanisms]	NA|280aa|down_7|NZ_LR593887.1_496488_497328_+	PRK06136, PRK06136, uroporphyrinogen-III C-methyltransferase	NA|813aa|down_8|NZ_LR593887.1_497324_499763_+	COG1251, NirB, NAD(P)H-nitrite reductase [Energy production and conversion]	NA|105aa|down_9|NZ_LR593887.1_499853_500168_+	cd03530, Rieske_NirD_small_Bacillus, Small subunit of nitrite reductase (NirD) family, Rieske domain; composed of proteins similar to the Bacillus subtilis small subunit of assimilatory nitrite reductase containing a Rieske domain
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	5	576178-576411	3	CRT	no		csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Orphan	CCAGTGACACCCCCGGTG	18	1	1	576376-576393	NZ_LR593887.1_3331761-3331744	NA	5	5	Orphan	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA|121aa|up_9|NZ_LR593887.1_562263_562626_-,NA|132aa|up_8|NZ_LR593887.1_562700_563096_-,NA|228aa|up_5|NZ_LR593887.1_565121_565805_+,NA|262aa|up_3|NZ_LR593887.1_566948_567734_+,NA|965aa|up_2|NZ_LR593887.1_567730_570625_+,NA|56aa|up_0|NZ_LR593887.1_573495_573663_+,NA|412aa|down_4|NZ_LR593887.1_581313_582549_-,NA|204aa|down_5|NZ_LR593887.1_582581_583193_-	NA|121aa|up_9|NZ_LR593887.1_562263_562626_-	NA	NA|132aa|up_8|NZ_LR593887.1_562700_563096_-	NA	NA|275aa|up_7|NZ_LR593887.1_563268_564093_-	cd10030, UDG-F4_TTUDGA_SPO1dp_like, Uracil DNA glycosylase family 4, includes Thermotoga maritima TTUDGA, Bacillus phage SPO1 DNA polymerase, and similar proteins	NA|301aa|up_6|NZ_LR593887.1_564213_565116_+	cd07573, CPA, N-carbamoylputrescine amidohydrolase (CPA) (class 11 nitrilases)	NA|228aa|up_5|NZ_LR593887.1_565121_565805_+	NA	NA|389aa|up_4|NZ_LR593887.1_565785_566952_+	PRK13531, PRK13531, regulatory ATPase RavA; Provisional	NA|262aa|up_3|NZ_LR593887.1_566948_567734_+	NA	NA|965aa|up_2|NZ_LR593887.1_567730_570625_+	NA	NA|914aa|up_1|NZ_LR593887.1_570643_573385_+	sd00006, TPR, Tetratricopeptide repeat	NA|56aa|up_0|NZ_LR593887.1_573495_573663_+	NA	NA|314aa|down_0|NZ_LR593887.1_577540_578482_-	smart00797, AHS2, Allophanate hydrolase subunit 2	NA|231aa|down_1|NZ_LR593887.1_578478_579171_-	pfam03746, LamB_YcsF, LamB/YcsF family	NA|429aa|down_2|NZ_LR593887.1_579372_580659_+	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|169aa|down_3|NZ_LR593887.1_580698_581205_+	TIGR04526, predic_Ig_block, putative immunoglobulin-blocking virulence protein	NA|412aa|down_4|NZ_LR593887.1_581313_582549_-	NA	NA|204aa|down_5|NZ_LR593887.1_582581_583193_-	NA	NA|123aa|down_6|NZ_LR593887.1_583224_583593_-	pfam09996, DUF2237, Uncharacterized protein conserved in bacteria (DUF2237)	NA|317aa|down_7|NZ_LR593887.1_583611_584562_-	TIGR01172, Serine_acetyltransferase, serine O-acetyltransferase	NA|683aa|down_8|NZ_LR593887.1_586910_588959_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|143aa|down_9|NZ_LR593887.1_588897_589326_-	pfam13911, AhpC-TSA_2, AhpC/TSA antioxidant enzyme
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	6	839447-840100	3,4,4	PILER-CR,CRISPRCasFinder,CRT	no	cas6	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Unclear	GTCACAGACCTAACGAGCGCACAGAGCTCATTGAAAC,GTCACAGACCTAACGAGCGCACAGAGCTCATTGAAAC,GTCACAGACCTAACGAGCGCACAGAGCTCATTGAAAC	37,37,37	0	0	NA	NA	NA:NA:NA	7,8,8	8	Unclear	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA|619aa|up_7|NZ_LR593887.1_828548_830405_-,NA|159aa|up_3|NZ_LR593887.1_834310_834787_+,cas6|402aa|up_1|NZ_LR593887.1_837656_838862_-,NA|90aa|up_0|NZ_LR593887.1_839015_839285_+,NA|109aa|down_4|NZ_LR593887.1_847757_848084_+	NA|328aa|up_9|NZ_LR593887.1_825870_826854_-	pfam08450, SGL, SMP-30/Gluconolaconase/LRE-like region	NA|526aa|up_8|NZ_LR593887.1_826974_828552_-	TIGR02996, rpt_mate_G_obs, repeat-companion domain TIGR02996	NA|619aa|up_7|NZ_LR593887.1_828548_830405_-	NA	NA|651aa|up_6|NZ_LR593887.1_830725_832678_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|327aa|up_5|NZ_LR593887.1_832743_833724_-	pfam07596, SBP_bac_10, Protein of unknown function (DUF1559)	NA|160aa|up_4|NZ_LR593887.1_833756_834236_-	COG2005, ModE, N-terminal domain of molybdenum-binding protein [General function prediction only]	NA|159aa|up_3|NZ_LR593887.1_834310_834787_+	NA	NA|878aa|up_2|NZ_LR593887.1_834995_837629_+	TIGR03346, chaperone_ClpB, ATP-dependent chaperone ClpB	cas6|402aa|up_1|NZ_LR593887.1_837656_838862_-	NA	NA|90aa|up_0|NZ_LR593887.1_839015_839285_+	NA	NA|180aa|down_0|NZ_LR593887.1_840455_840995_-	cd03017, PRX_BCP, Peroxiredoxin (PRX) family, Bacterioferritin comigratory protein (BCP) subfamily; composed of  thioredoxin-dependent thiol peroxidases, widely expressed in pathogenic bacteria, that protect cells against toxicity from reactive oxygen species by reducing and detoxifying hydroperoxides	NA|386aa|down_1|NZ_LR593887.1_841152_842310_+	PRK06753, PRK06753, hypothetical protein; Provisional	NA|824aa|down_2|NZ_LR593887.1_842342_844814_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|752aa|down_3|NZ_LR593887.1_844851_847107_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|109aa|down_4|NZ_LR593887.1_847757_848084_+	NA	NA|1062aa|down_5|NZ_LR593887.1_848188_851374_-	cd04233, Auracyanin, Auracyanins A and B and similar proteins	NA|298aa|down_6|NZ_LR593887.1_851409_852303_-	pfam01261, AP_endonuc_2, Xylose isomerase-like TIM barrel	NA|448aa|down_7|NZ_LR593887.1_852588_853932_+	cd17353, MFS_OFA_like, Oxalate:formate antiporter (OFA) and similar proteins of the Major Facilitator Superfamily of transporters	NA|1325aa|down_8|NZ_LR593887.1_854244_858219_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|173aa|down_9|NZ_LR593887.1_858285_858804_+	PRK13291, PRK13291, putative metal-dependent hydrolase
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	7	1675079-1675617	5	CRISPRCasFinder	no	csa3	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Type I-A	TTGCAATCTTTGAAGTGGGCCAGCCCCGCATCGCT	35	0	0	NA	NA	NA	7	7	Orphan	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA|172aa|up_8|NZ_LR593887.1_1663580_1664096_+,NA|170aa|up_0|NZ_LR593887.1_1671620_1672130_-,NA|876aa|down_3|NZ_LR593887.1_1680009_1682637_+,NA|363aa|down_4|NZ_LR593887.1_1682633_1683722_+,NA|184aa|down_8|NZ_LR593887.1_1690078_1690630_-	NA|166aa|up_9|NZ_LR593887.1_1662887_1663385_-	COG0456, RimI, Acetyltransferases [General function prediction only]	NA|172aa|up_8|NZ_LR593887.1_1663580_1664096_+	NA	NA|395aa|up_7|NZ_LR593887.1_1664266_1665451_+	PRK07994, PRK07994, DNA polymerase III subunits gamma and tau; Validated	NA|224aa|up_6|NZ_LR593887.1_1665467_1666139_+	cd19366, TenA_C_BhTenA-like, TenA_C proteins similar to Bacillus halodurans TenA	NA|268aa|up_5|NZ_LR593887.1_1666153_1666957_+	PRK06427, PRK06427, bifunctional hydroxy-methylpyrimidine kinase/ hydroxy-phosphomethylpyrimidine kinase; Reviewed	NA|268aa|up_4|NZ_LR593887.1_1666944_1667748_-	pfam12146, Hydrolase_4, Serine aminopeptidase, S33	NA|481aa|up_3|NZ_LR593887.1_1667744_1669187_-	pfam13360, PQQ_2, PQQ-like domain	NA|456aa|up_2|NZ_LR593887.1_1669199_1670567_-	pfam07394, DUF1501, Protein of unknown function (DUF1501)	NA|217aa|up_1|NZ_LR593887.1_1670818_1671469_-	NF033186, internalin_K, class 1 internalin InlK	NA|170aa|up_0|NZ_LR593887.1_1671620_1672130_-	NA	NA|186aa|down_0|NZ_LR593887.1_1677468_1678026_-	TIGR02937, RNA_polymerase_sigma_factor, RNA polymerase sigma factor, sigma-70 family	NA|186aa|down_1|NZ_LR593887.1_1678519_1679077_+	PRK12519, PRK12519, RNA polymerase sigma factor; Provisional	NA|287aa|down_2|NZ_LR593887.1_1679073_1679934_+	pfam10099, RskA, Anti-sigma-K factor rskA	NA|876aa|down_3|NZ_LR593887.1_1680009_1682637_+	NA	NA|363aa|down_4|NZ_LR593887.1_1682633_1683722_+	NA	NA|1101aa|down_5|NZ_LR593887.1_1683895_1687198_-	TIGR02604, Piru_Ver_Nterm, putative membrane-bound dehydrogenase domain	NA|165aa|down_6|NZ_LR593887.1_1687549_1688044_-	pfam08714, Fae, Formaldehyde-activating enzyme (Fae)	NA|572aa|down_7|NZ_LR593887.1_1688289_1690005_-	COG0553, HepA, Superfamily II DNA/RNA helicases, SNF2 family [Transcription / DNA replication, recombination, and repair]	NA|184aa|down_8|NZ_LR593887.1_1690078_1690630_-	NA	NA|348aa|down_9|NZ_LR593887.1_1690889_1691933_-	cd14503, PTP-bact, bacterial tyrosine-protein phosphataseS similar to Neisseria NMA1982
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	8	4370104-4371665	4,6,5	PILER-CR,CRISPRCasFinder,CRT	no	cas1,cas2	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Unclear	GTCCCTTGACTCCCGAATCCGGCGAGAATTGAAAC,GTCCCTTGACTCCCGAATCCGGCGAGAATTGAAAC,GTCCCTTGACTCCCGAATCCGGCGAGAATTGAAAC	35,35,35	0	0	NA	NA	NA:NA:NA	21,22,22	22	Unclear	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA|321aa|up_9|NZ_LR593887.1_4358443_4359406_+,NA|252aa|up_8|NZ_LR593887.1_4359407_4360163_+,NA|99aa|up_4|NZ_LR593887.1_4365141_4365438_+,NA|179aa|up_3|NZ_LR593887.1_4365430_4365967_-,NA|90aa|up_2|NZ_LR593887.1_4366049_4366319_-,NA|736aa|down_7|NZ_LR593887.1_4380948_4383156_-	NA|321aa|up_9|NZ_LR593887.1_4358443_4359406_+	NA	NA|252aa|up_8|NZ_LR593887.1_4359407_4360163_+	NA	NA|632aa|up_7|NZ_LR593887.1_4360159_4362055_+	cd00865, PEBP_bact_arch, PhosphatidylEthanolamine-Binding Protein (PEBP) domain present in bacteria and archaea	NA|434aa|up_6|NZ_LR593887.1_4362165_4363467_+	cd16144, ARS_like, uncharacterized arylsulfatase subfamily	NA|485aa|up_5|NZ_LR593887.1_4363484_4364939_+	pfam16656, Pur_ac_phosph_N, Purple acid Phosphatase, N-terminal domain	NA|99aa|up_4|NZ_LR593887.1_4365141_4365438_+	NA	NA|179aa|up_3|NZ_LR593887.1_4365430_4365967_-	NA	NA|90aa|up_2|NZ_LR593887.1_4366049_4366319_-	NA	cas1|919aa|up_1|NZ_LR593887.1_4366725_4369482_+	cd09634, Cas1_I-II-III, CRISPR/Cas system-associated protein Cas1	cas2|92aa|up_0|NZ_LR593887.1_4369478_4369754_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|341aa|down_0|NZ_LR593887.1_4371959_4372982_+	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|384aa|down_1|NZ_LR593887.1_4373126_4374278_+	PRK14951, PRK14951, DNA polymerase III subunits gamma and tau; Provisional	NA|394aa|down_2|NZ_LR593887.1_4374499_4375681_+	cd02577, PSTD1, Pseudouridine synthase, a subgroup of the TruD family	NA|990aa|down_3|NZ_LR593887.1_4375782_4378752_-	pfam07583, PSCyt2, Protein of unknown function (DUF1549)	NA|113aa|down_4|NZ_LR593887.1_4378912_4379251_+	PRK10089, PRK10089, chaperone CsaA	NA|308aa|down_5|NZ_LR593887.1_4379603_4380527_+	pfam07596, SBP_bac_10, Protein of unknown function (DUF1559)	NA|62aa|down_6|NZ_LR593887.1_4380649_4380835_+	TIGR03302, OM_YfiO, outer membrane assembly lipoprotein YfiO	NA|736aa|down_7|NZ_LR593887.1_4380948_4383156_-	NA	NA|160aa|down_8|NZ_LR593887.1_4383198_4383678_-	cd15904, TSPO_MBR, Translocator protein (TSPO)/peripheral-type benzodiazepine receptor (MBR) family	NA|454aa|down_9|NZ_LR593887.1_4383693_4385055_-	pfam07394, DUF1501, Protein of unknown function (DUF1501)
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	9	4730617-4730723	7	CRISPRCasFinder	no		csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Orphan	GCTCCGCCGGGTTATGATCCCTATGC	26	0	0	NA	NA	NA	1	1	Orphan	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA|410aa|up_7|NZ_LR593887.1_4716465_4717695_-,NA|140aa|down_2|NZ_LR593887.1_4739373_4739793_+	NA|220aa|up_9|NZ_LR593887.1_4715018_4715678_-	pfam06439, DUF1080, Domain of Unknown Function (DUF1080)	NA|112aa|up_8|NZ_LR593887.1_4715846_4716182_-	COG0633, Fdx, Ferredoxin [Energy production and conversion]	NA|410aa|up_7|NZ_LR593887.1_4716465_4717695_-	NA	NA|395aa|up_6|NZ_LR593887.1_4717999_4719184_+	TIGR01730, COG0845:_Membrane-fusion_protein, RND family efflux transporter, MFP subunit	NA|1171aa|up_5|NZ_LR593887.1_4719253_4722766_+	TIGR00915, Probable_aminoglycoside_efflux_pump, The (Largely Gram-negative Bacterial) Hydrophobe/Amphiphile Efflux-1 (HAE1) Family	NA|543aa|up_4|NZ_LR593887.1_4723075_4724704_+	PRK00915, PRK00915, 2-isopropylmalate synthase; Validated	NA|625aa|up_3|NZ_LR593887.1_4725024_4726899_+	pfam13517, VCBS, Repeat domain in Vibrio, Colwellia, Bradyrhizobium and Shewanella	NA|253aa|up_2|NZ_LR593887.1_4726900_4727659_-	PRK00121, trmB, tRNA (guanine-N(7)-)-methyltransferase; Reviewed	NA|302aa|up_1|NZ_LR593887.1_4727677_4728583_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|401aa|up_0|NZ_LR593887.1_4728916_4730119_+	cd06142, RNaseD_exo, DEDDy 3'-5' exonuclease domain of Ribonuclease D and similar proteins	NA|234aa|down_0|NZ_LR593887.1_4732054_4732756_-	pfam08308, PEGA, PEGA domain	NA|1558aa|down_1|NZ_LR593887.1_4732904_4737578_-	cd00198, vWFA, Von Willebrand factor type A (vWA) domain was originally found in the blood coagulation protein von Willebrand factor (vWF)	NA|140aa|down_2|NZ_LR593887.1_4739373_4739793_+	NA	NA|467aa|down_3|NZ_LR593887.1_4739876_4741277_-	PRK07907, PRK07907, hypothetical protein; Provisional	NA|156aa|down_4|NZ_LR593887.1_4741400_4741868_+	COG4319, COG4319, Ketosteroid isomerase homolog [Function unknown]	NA|532aa|down_5|NZ_LR593887.1_4741897_4743493_+	cd03145, GAT1_cyanophycinase, Type 1 glutamine amidotransferase (GATase1)-like domain found in cyanophycinase	NA|196aa|down_6|NZ_LR593887.1_4743595_4744183_+	TIGR02999, Sig-70_X6, RNA polymerase sigma factor, TIGR02999 family	NA|323aa|down_7|NZ_LR593887.1_4744296_4745265_+	cd01562, Thr-dehyd, Threonine dehydratase: The first step in amino acid degradation is the removal of nitrogen	NA|188aa|down_8|NZ_LR593887.1_4745300_4745864_+	pfam13671, AAA_33, AAA domain	NA|132aa|down_9|NZ_LR593887.1_4745846_4746242_-	pfam00072, Response_reg, Response regulator receiver domain
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	10	5942792-5957854	8,6,5,6	CRISPRCasFinder,CRT,PILER-CR,PILER-CR	no		csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Orphan	GCTTCAATTCGGCCACAGATTTTTGTCTGTGGAAAT,GCTTCAATTCGGCCACAGATTTTTGTCTGTGGAAAT,CTTCAATTCGGCCACAGATTTTTGTCTGTGGAAAT,GCTTCAATTCGGCCACAGATTTTTGTCTGTGGAAAT	36,36,35,36	0	0	NA	NA	NA:NA:NA:NA	204,204,202,202	204	Orphan	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA|102aa|up_9|NZ_LR593887.1_5929338_5929644_+,NA|117aa|up_8|NZ_LR593887.1_5929818_5930169_+,NA|269aa|up_7|NZ_LR593887.1_5930401_5931208_+,NA|151aa|up_4|NZ_LR593887.1_5937720_5938173_+,NA|77aa|up_3|NZ_LR593887.1_5939021_5939252_+,NA|132aa|up_1|NZ_LR593887.1_5940764_5941160_-,NA|243aa|up_0|NZ_LR593887.1_5942015_5942744_+,NA|129aa|down_2|NZ_LR593887.1_5961085_5961472_-,NA|184aa|down_3|NZ_LR593887.1_5965706_5966258_+,NA|184aa|down_9|NZ_LR593887.1_5973194_5973746_-	NA|102aa|up_9|NZ_LR593887.1_5929338_5929644_+	NA	NA|117aa|up_8|NZ_LR593887.1_5929818_5930169_+	NA	NA|269aa|up_7|NZ_LR593887.1_5930401_5931208_+	NA	NA|1573aa|up_6|NZ_LR593887.1_5931506_5936225_-	pfam05048, NosD, Periplasmic copper-binding protein (NosD)	NA|297aa|up_5|NZ_LR593887.1_5936825_5937716_+	pfam07591, PT-HINT, Pretoxin HINT domain	NA|151aa|up_4|NZ_LR593887.1_5937720_5938173_+	NA	NA|77aa|up_3|NZ_LR593887.1_5939021_5939252_+	NA	NA|288aa|up_2|NZ_LR593887.1_5939267_5940131_+	pfam07591, PT-HINT, Pretoxin HINT domain	NA|132aa|up_1|NZ_LR593887.1_5940764_5941160_-	NA	NA|243aa|up_0|NZ_LR593887.1_5942015_5942744_+	NA	NA|385aa|down_0|NZ_LR593887.1_5958482_5959637_-	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|154aa|down_1|NZ_LR593887.1_5960131_5960593_-	NF033459, DksA_like, RNA polymerase-binding protein DksA	NA|129aa|down_2|NZ_LR593887.1_5961085_5961472_-	NA	NA|184aa|down_3|NZ_LR593887.1_5965706_5966258_+	NA	NA|258aa|down_4|NZ_LR593887.1_5966389_5967163_+	pfam09844, DUF2071, Uncharacterized conserved protein (COG2071)	NA|796aa|down_5|NZ_LR593887.1_5967219_5969607_-	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|563aa|down_6|NZ_LR593887.1_5969612_5971301_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|233aa|down_7|NZ_LR593887.1_5971562_5972261_-	pfam01590, GAF, GAF domain	NA|123aa|down_8|NZ_LR593887.1_5972694_5973063_-	COG0222, RplL, Ribosomal protein L7/L12 [Translation, ribosomal structure and biogenesis]	NA|184aa|down_9|NZ_LR593887.1_5973194_5973746_-	NA
GCF_901538355.1_ASM90153835v1	NZ_LR593887	Tuwongella immobilis isolate MBLW1 chromosome 1	11	6220119-6220219	9	CRISPRCasFinder	no		csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	Orphan	ATTCGCATCCGGCTTCGGCTTGGAACTCG	29	0	0	NA	NA	NA	1	1	Orphan	csa3,DinG,RT,cas6,cas3,cas8u2,cas7,cas5u,cas1,cas2,cmr1gr7,cas10,cmr3gr5,cmr4gr7,cmr5gr11,cmr6gr7,csx1,csx15,DEDDh,csb2gr5	NA|119aa|up_3|NZ_LR593887.1_6215109_6215466_-,NA|206aa|up_2|NZ_LR593887.1_6215462_6216080_-,NA|147aa|up_0|NZ_LR593887.1_6217508_6217949_+,NA|140aa|down_0|NZ_LR593887.1_6220317_6220737_+,NA|208aa|down_1|NZ_LR593887.1_6220789_6221413_-	NA|406aa|up_9|NZ_LR593887.1_6205999_6207217_-	TIGR03177, pilus_cpaB, Flp pilus assembly protein CpaB	NA|278aa|up_8|NZ_LR593887.1_6207746_6208580_-	pfam01478, Peptidase_A24, Type IV leader peptidase family	NA|64aa|up_7|NZ_LR593887.1_6208691_6208883_-	COG3847, Flp, Flp pilus assembly protein, pilin Flp [Intracellular trafficking and secretion]	NA|382aa|up_6|NZ_LR593887.1_6209033_6210179_-	cd06267, PBP1_LacI_sugar_binding-like, ligand binding domain of the LacI transcriptional regulator family belonging to the type 1 periplasmic-binding fold protein superfamily	NA|770aa|up_5|NZ_LR593887.1_6210286_6212596_-	pfam07583, PSCyt2, Protein of unknown function (DUF1549)	NA|468aa|up_4|NZ_LR593887.1_6213166_6214570_+	PRK05901, PRK05901, RNA polymerase sigma factor; Provisional	NA|119aa|up_3|NZ_LR593887.1_6215109_6215466_-	NA	NA|206aa|up_2|NZ_LR593887.1_6215462_6216080_-	NA	NA|328aa|up_1|NZ_LR593887.1_6216413_6217397_+	pfam07596, SBP_bac_10, Protein of unknown function (DUF1559)	NA|147aa|up_0|NZ_LR593887.1_6217508_6217949_+	NA	NA|140aa|down_0|NZ_LR593887.1_6220317_6220737_+	NA	NA|208aa|down_1|NZ_LR593887.1_6220789_6221413_-	NA	NA|180aa|down_2|NZ_LR593887.1_6221519_6222059_-	pfam14568, SUKH_6, SMI1-KNR4 cell-wall	NA|268aa|down_3|NZ_LR593887.1_6222377_6223181_-	pfam07591, PT-HINT, Pretoxin HINT domain	NA|228aa|down_4|NZ_LR593887.1_6223276_6223960_+	cd07506, HAD_like, uncharacterized family of the haloacid dehalogenase-like (HAD) hydrolase superfamily	NA|301aa|down_5|NZ_LR593887.1_6223988_6224891_+	cd03144, GATase1_ScBLP_like, Type 1 glutamine amidotransferase (GATase1)-like domain found in proteins similar to Saccharomyces cerevisiae biotin-apoprotein ligase (ScBLP)	NA|275aa|down_6|NZ_LR593887.1_6225007_6225832_+	COG0415, PhrB, Deoxyribodipyrimidine photolyase [DNA replication, recombination, and repair]	NA|157aa|down_7|NZ_LR593887.1_6225828_6226299_+	COG3458, COG3458, Acetyl esterase (deacetylase) [Secondary metabolites biosynthesis, transport, and catabolism]	NA|413aa|down_8|NZ_LR593887.1_6226492_6227731_+	TIGR02996, rpt_mate_G_obs, repeat-companion domain TIGR02996	NA|771aa|down_9|NZ_LR593887.1_6227811_6230124_-	TIGR02608, hypothetical_protein, delta-60 repeat domain
