assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	1	609428-609705	1	CRT	no	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Unclear	GGCGAGCGCGCTCGCGGGGG	20	0	0	NA	NA	NA	6	6	Unclear	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	cas8u1|321aa|up_7|NC_021658.1_598025_598988_-,NA|59aa|up_0|NC_021658.1_609171_609348_+,NA|362aa|down_4|NC_021658.1_619578_620664_+,NA|375aa|down_8|NC_021658.1_629696_630821_+	NA|330aa|up_9|NC_021658.1_596141_597131_-	PRK00164, moaA, GTP 3',8-cyclase MoaA	NA|249aa|up_8|NC_021658.1_597214_597961_-	COG0535, COG0535, Predicted Fe-S oxidoreductases [General function prediction only]	cas8u1|321aa|up_7|NC_021658.1_598025_598988_-	NA	cas3|1000aa|up_6|NC_021658.1_598984_601984_-	TIGR02621, CRISPR-associated_helicase_Cas3, CRISPR-associated helicase Cas3, subtype Dpsyc	csb2gr5|564aa|up_5|NC_021658.1_601976_603668_-	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	csb1gr7|426aa|up_4|NC_021658.1_603667_604945_-	pfam09617, Cas_GSU0053, CRISPR-associated protein GSU0053 (Cas_GSU0053)	cas1|668aa|up_3|NC_021658.1_605490_607494_+	cd09634, Cas1_I-II-III, CRISPR/Cas system-associated protein Cas1	cas2|97aa|up_2|NC_021658.1_607554_607845_+	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|397aa|up_1|NC_021658.1_607885_609076_-	PRK05687, fliH, flagellar assembly protein FliH	NA|59aa|up_0|NC_021658.1_609171_609348_+	NA	NA|314aa|down_0|NC_021658.1_614751_615693_-	pfam13701, DDE_Tnp_1_4, Transposase DDE domain group 1	NA|46aa|down_1|NC_021658.1_616042_616180_+	pfam11848, DUF3368, Domain of unknown function (DUF3368)	NA|568aa|down_2|NC_021658.1_616498_618202_+	COG1595, RpoE, DNA-directed RNA polymerase specialized sigma subunit, sigma24 homolog [Transcription]	NA|402aa|down_3|NC_021658.1_618198_619404_+	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|362aa|down_4|NC_021658.1_619578_620664_+	NA	NA|520aa|down_5|NC_021658.1_620715_622275_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|1640aa|down_6|NC_021658.1_623232_628152_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|338aa|down_7|NC_021658.1_628206_629220_-	cd19152, AKR_AKR15A, AKR15A family of aldo-keto reductase	NA|375aa|down_8|NC_021658.1_629696_630821_+	NA	NA|180aa|down_9|NC_021658.1_631648_632188_-	PRK14971, PRK14971, DNA polymerase III subunit gamma/tau
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	2	610407-614614	1,2,1	CRISPRCasFinder,CRT,PILER-CR	no	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Unclear	CTCTCCGCCGCTGAAAGGCGGCGGCCCCATTGAAGC,CTCTCCGCCGCTGAAAGGCGGCGGCCCCATTGAAGC,CTCTCCGCCGCTGAAAGGCGGCGGCCCCATTGAAGC	36,36,36	0	0	NA	NA	NA:NA:NA	56,57,51	57	Unclear	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	cas8u1|321aa|up_7|NC_021658.1_598025_598988_-,NA|59aa|up_0|NC_021658.1_609171_609348_+,NA|362aa|down_4|NC_021658.1_619578_620664_+,NA|375aa|down_8|NC_021658.1_629696_630821_+	NA|330aa|up_9|NC_021658.1_596141_597131_-	PRK00164, moaA, GTP 3',8-cyclase MoaA	NA|249aa|up_8|NC_021658.1_597214_597961_-	COG0535, COG0535, Predicted Fe-S oxidoreductases [General function prediction only]	cas8u1|321aa|up_7|NC_021658.1_598025_598988_-	NA	cas3|1000aa|up_6|NC_021658.1_598984_601984_-	TIGR02621, CRISPR-associated_helicase_Cas3, CRISPR-associated helicase Cas3, subtype Dpsyc	csb2gr5|564aa|up_5|NC_021658.1_601976_603668_-	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	csb1gr7|426aa|up_4|NC_021658.1_603667_604945_-	pfam09617, Cas_GSU0053, CRISPR-associated protein GSU0053 (Cas_GSU0053)	cas1|668aa|up_3|NC_021658.1_605490_607494_+	cd09634, Cas1_I-II-III, CRISPR/Cas system-associated protein Cas1	cas2|97aa|up_2|NC_021658.1_607554_607845_+	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|397aa|up_1|NC_021658.1_607885_609076_-	PRK05687, fliH, flagellar assembly protein FliH	NA|59aa|up_0|NC_021658.1_609171_609348_+	NA	NA|314aa|down_0|NC_021658.1_614751_615693_-	pfam13701, DDE_Tnp_1_4, Transposase DDE domain group 1	NA|46aa|down_1|NC_021658.1_616042_616180_+	pfam11848, DUF3368, Domain of unknown function (DUF3368)	NA|568aa|down_2|NC_021658.1_616498_618202_+	COG1595, RpoE, DNA-directed RNA polymerase specialized sigma subunit, sigma24 homolog [Transcription]	NA|402aa|down_3|NC_021658.1_618198_619404_+	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|362aa|down_4|NC_021658.1_619578_620664_+	NA	NA|520aa|down_5|NC_021658.1_620715_622275_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|1640aa|down_6|NC_021658.1_623232_628152_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|338aa|down_7|NC_021658.1_628206_629220_-	cd19152, AKR_AKR15A, AKR15A family of aldo-keto reductase	NA|375aa|down_8|NC_021658.1_629696_630821_+	NA	NA|180aa|down_9|NC_021658.1_631648_632188_-	PRK14971, PRK14971, DNA polymerase III subunit gamma/tau
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	3	675300-675412	2	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCCTGAGCCCCGCGGGCGGGAGGGCCG	27	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|173aa|up_9|NC_021658.1_658180_658699_-,NA|168aa|up_5|NC_021658.1_662664_663168_-,NA|318aa|up_1|NC_021658.1_672574_673528_-,NA|298aa|down_4|NC_021658.1_682277_683171_-,NA|86aa|down_6|NC_021658.1_683921_684179_+	NA|173aa|up_9|NC_021658.1_658180_658699_-	NA	NA|95aa|up_8|NC_021658.1_659028_659313_+	PRK14954, PRK14954, DNA polymerase III subunits gamma and tau; Provisional	NA|445aa|up_7|NC_021658.1_659309_660644_+	cd00118, LysM, Lysin Motif is a small domain involved in binding peptidoglycan	NA|551aa|up_6|NC_021658.1_660991_662644_+	sd00006, TPR, Tetratricopeptide repeat	NA|168aa|up_5|NC_021658.1_662664_663168_-	NA	NA|1007aa|up_4|NC_021658.1_664262_667283_-	COG3209, RhsA, Rhs family protein [Cell envelope biogenesis, outer membrane]	NA|118aa|up_3|NC_021658.1_667305_667659_-	PTZ00146, PTZ00146, fibrillarin; Provisional	NA|1586aa|up_2|NC_021658.1_667804_672562_-	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|318aa|up_1|NC_021658.1_672574_673528_-	NA	NA|388aa|up_0|NC_021658.1_673942_675106_+	pfam00561, Abhydrolase_1, alpha/beta hydrolase fold	NA|407aa|down_0|NC_021658.1_675729_676950_+	PRK01346, PRK01346, enhanced intracellular survival protein Eis	NA|175aa|down_1|NC_021658.1_676963_677488_+	smart00271, DnaJ, DnaJ molecular chaperone homology domain	NA|1046aa|down_2|NC_021658.1_677675_680813_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|233aa|down_3|NC_021658.1_681540_682239_-	cd02969, PRX_like1, Peroxiredoxin (PRX)-like 1 family; hypothetical proteins that show sequence similarity to PRXs	NA|298aa|down_4|NC_021658.1_682277_683171_-	NA	NA|256aa|down_5|NC_021658.1_683173_683941_-	cd03394, PAP2_like_5, PAP2_like_5 proteins	NA|86aa|down_6|NC_021658.1_683921_684179_+	NA	NA|119aa|down_7|NC_021658.1_684213_684570_-	pfam07883, Cupin_2, Cupin domain	NA|586aa|down_8|NC_021658.1_684683_686441_-	pfam13598, DUF4139, Domain of unknown function (DUF4139)	NA|774aa|down_9|NC_021658.1_686460_688782_-	pfam13598, DUF4139, Domain of unknown function (DUF4139)
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	4	2183485-2183586	3	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCGGCCGGCCGCCGCGGCTCTCGCTCCGGTGAGCGGCC	38	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|161aa|up_8|NC_021658.1_2173254_2173737_-,NA|159aa|up_4|NC_021658.1_2176453_2176930_-,NA|119aa|up_3|NC_021658.1_2176937_2177294_-,NA|314aa|up_1|NC_021658.1_2181969_2182911_+,NA|80aa|up_0|NC_021658.1_2182962_2183202_+,NA|80aa|down_8|NC_021658.1_2197014_2197254_+	NA|283aa|up_9|NC_021658.1_2172316_2173165_-	PTZ00121, PTZ00121, MAEBL; Provisional	NA|161aa|up_8|NC_021658.1_2173254_2173737_-	NA	NA|324aa|up_7|NC_021658.1_2173751_2174723_-	pfam14257, DUF4349, Domain of unknown function (DUF4349)	NA|192aa|up_6|NC_021658.1_2175043_2175619_-	TIGR00560, pgsA, CDP-diacylglycerol--glycerol-3-phosphate 3-phosphatidyltransferase	NA|145aa|up_5|NC_021658.1_2175779_2176214_-	pfam00582, Usp, Universal stress protein family	NA|159aa|up_4|NC_021658.1_2176453_2176930_-	NA	NA|119aa|up_3|NC_021658.1_2176937_2177294_-	NA	NA|1197aa|up_2|NC_021658.1_2177693_2181284_+	sd00038, Kelch, Kelch repeat	NA|314aa|up_1|NC_021658.1_2181969_2182911_+	NA	NA|80aa|up_0|NC_021658.1_2182962_2183202_+	NA	NA|603aa|down_0|NC_021658.1_2183753_2185562_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|331aa|down_1|NC_021658.1_2185664_2186657_+	pfam04015, DUF362, Domain of unknown function (DUF362)	NA|636aa|down_2|NC_021658.1_2186661_2188569_+	cd16373, DMSOR_beta_like, uncharacterized subfamily of DMSO Reductase beta subunit family	NA|385aa|down_3|NC_021658.1_2188621_2189776_+	COG4907, COG4907, Predicted membrane protein [Function unknown]	NA|578aa|down_4|NC_021658.1_2189841_2191575_-	COG4591, LolE, ABC-type transport system, involved in lipoprotein release, permease component [Cell envelope biogenesis, outer membrane]	NA|553aa|down_5|NC_021658.1_2192058_2193717_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|462aa|down_6|NC_021658.1_2193769_2195155_+	PRK13299, PRK13299, tRNA CCA-pyrophosphorylase; Provisional	NA|442aa|down_7|NC_021658.1_2195535_2196861_+	cd01477, vWA_F09G8-8_type, VWA F09G8	NA|80aa|down_8|NC_021658.1_2197014_2197254_+	NA	NA|435aa|down_9|NC_021658.1_2197241_2198546_-	PRK09228, PRK09228, guanine deaminase; Provisional
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	5	2641533-2641638	4	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCTCCTTTGCAATTGCAAGCATCGCGCCGG	30	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|376aa|up_3|NC_021658.1_2635911_2637039_+,NA|219aa|down_4|NC_021658.1_2645503_2646160_-,NA|96aa|down_8|NC_021658.1_2648840_2649128_-	NA|281aa|up_9|NC_021658.1_2629498_2630341_-	TIGR01250, Proline_iminopeptidase, proline-specific peptidase, Bacillus coagulans-type subfamily	NA|195aa|up_8|NC_021658.1_2630551_2631136_-	TIGR03885, putative_dehydrogenase_protein, probable non-F420 flavinoid oxidoreductase	NA|439aa|up_7|NC_021658.1_2631267_2632584_-	pfam04389, Peptidase_M28, Peptidase family M28	NA|481aa|up_6|NC_021658.1_2632737_2634180_-	cd00548, NrfA-like, cytochrome c nitrite reductase and similar proteins	NA|181aa|up_5|NC_021658.1_2634210_2634753_-	TIGR03153, cytochr_NrfH, cytochrome c nitrite reductase, small subunit	NA|296aa|up_4|NC_021658.1_2635015_2635903_+	pfam05721, PhyH, Phytanoyl-CoA dioxygenase (PhyH)	NA|376aa|up_3|NC_021658.1_2635911_2637039_+	NA	NA|415aa|up_2|NC_021658.1_2637052_2638297_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|403aa|up_1|NC_021658.1_2638680_2639889_+	COG2124, CypX, Cytochrome P450 [Secondary metabolites biosynthesis, transport, and catabolism]	NA|376aa|up_0|NC_021658.1_2640148_2641276_-	pfam00553, CBM_2, Cellulose binding domain	NA|132aa|down_0|NC_021658.1_2642128_2642524_+	COG3791, COG3791, Uncharacterized conserved protein [Function unknown]	NA|388aa|down_1|NC_021658.1_2642574_2643738_-	pfam09113, N-glycanase_C, Peptide-N-glycosidase F, C terminal	NA|142aa|down_2|NC_021658.1_2643817_2644243_+	cd07253, GLOD5, Human glyoxalase domain-containing protein 5 and similar proteins	NA|364aa|down_3|NC_021658.1_2644265_2645357_-	pfam12146, Hydrolase_4, Serine aminopeptidase, S33	NA|219aa|down_4|NC_021658.1_2645503_2646160_-	NA	NA|122aa|down_5|NC_021658.1_2646156_2646522_-	pfam09862, DUF2089, Protein of unknown function (DUF2089)	NA|382aa|down_6|NC_021658.1_2646673_2647819_-	pfam14099, Polysacc_lyase, Polysaccharide lyase	NA|294aa|down_7|NC_021658.1_2647939_2648821_-	cd09025, Aldose_epim_Slr1438, Aldose 1-epimerase, similar to Synechocystis Slr1438	NA|96aa|down_8|NC_021658.1_2648840_2649128_-	NA	NA|167aa|down_9|NC_021658.1_2649141_2649642_-	pfam03168, LEA_2, Late embryogenesis abundant protein
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	6	3417681-3418202	3	CRT	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GGAGCTGGTGGAGGCGGCGGAGCCGGAGCT	30	2	4	3418059-3418076|3418059-3418076|3418059-3418076|3418155-3418172	NC_021658.1_3769593-3769610|NC_021658.1_3776171-3776188|NC_021658.1_12531504-12531521|NC_021658.1_13976249-13976266	NA	7	7	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|395aa|up_4|NC_021658.1_3410262_3411447_+,NA|279aa|up_1|NC_021658.1_3413340_3414177_-,NA|251aa|down_4|NC_021658.1_3425437_3426190_-	NA|1217aa|up_9|NC_021658.1_3403296_3406947_-	COG3419, PilY1, Tfp pilus assembly protein, tip-associated adhesin PilY1 [Cell motility and secretion / Intracellular trafficking and secretion]	NA|199aa|up_8|NC_021658.1_3406963_3407560_-	COG4726, PilX, Tfp pilus assembly protein PilX [Cell motility and secretion / Intracellular trafficking and secretion]	NA|435aa|up_7|NC_021658.1_3407553_3408858_-	COG4966, PilW, Tfp pilus assembly protein PilW [Cell motility and secretion / Intracellular trafficking and secretion]	NA|202aa|up_6|NC_021658.1_3408854_3409460_-	COG4967, PilV, Tfp pilus assembly protein PilV [Cell motility and secretion / Intracellular trafficking and secretion]	NA|243aa|up_5|NC_021658.1_3409456_3410185_-	COG4970, FimT, Tfp pilus assembly protein FimT [Cell motility and secretion / Intracellular trafficking and secretion]	NA|395aa|up_4|NC_021658.1_3410262_3411447_+	NA	NA|239aa|up_3|NC_021658.1_3411567_3412284_-	pfam13616, Rotamase_3, PPIC-type PPIASE domain	NA|283aa|up_2|NC_021658.1_3412334_3413183_-	PLN02864, PLN02864, enoyl-CoA hydratase	NA|279aa|up_1|NC_021658.1_3413340_3414177_-	NA	NA|785aa|up_0|NC_021658.1_3414187_3416542_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|115aa|down_0|NC_021658.1_3420774_3421119_-	smart00530, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|165aa|down_1|NC_021658.1_3422300_3422795_+	pfam00932, LTD, Lamin Tail Domain	NA|210aa|down_2|NC_021658.1_3422995_3423625_+	pfam12728, HTH_17, Helix-turn-helix domain	NA|447aa|down_3|NC_021658.1_3423898_3425239_-	PRK11040, PRK11040, peptidase PmbA; Provisional	NA|251aa|down_4|NC_021658.1_3425437_3426190_-	NA	NA|251aa|down_5|NC_021658.1_3426470_3427223_+	COG1691, COG1691, NCAIR mutase (PurE)-related proteins [General function prediction only]	NA|459aa|down_6|NC_021658.1_3427291_3428668_+	pfam01969, DUF111, Protein of unknown function DUF111	NA|219aa|down_7|NC_021658.1_3428772_3429429_-	TIGR01068, Thioredoxin-like_protein_slr0233, thioredoxin	NA|332aa|down_8|NC_021658.1_3429609_3430605_-	COG1173, DppC, ABC-type dipeptide/oligopeptide/nickel transport systems, permease components [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|380aa|down_9|NC_021658.1_3430601_3431741_-	COG0601, DppB, ABC-type dipeptide/oligopeptide/nickel transport systems, permease components [Amino acid transport and metabolism / Inorganic ion transport and metabolism]
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	7	3465079-3465174	5	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCATCAGGACACGCCACCCGGCCACCAGGACA	32	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|382aa|up_9|NC_021658.1_3451312_3452458_+,NA|151aa|up_8|NC_021658.1_3452667_3453120_+,NA|423aa|up_2|NC_021658.1_3460870_3462139_-,NA|286aa|down_0|NC_021658.1_3465345_3466203_+,NA|211aa|down_3|NC_021658.1_3469489_3470122_-,NA|262aa|down_7|NC_021658.1_3477158_3477944_+	NA|382aa|up_9|NC_021658.1_3451312_3452458_+	NA	NA|151aa|up_8|NC_021658.1_3452667_3453120_+	NA	NA|335aa|up_7|NC_021658.1_3453141_3454146_-	sd00006, TPR, Tetratricopeptide repeat	NA|874aa|up_6|NC_021658.1_3454142_3456764_-	pfam04885, Stig1, Stigma-specific protein, Stig1	NA|464aa|up_5|NC_021658.1_3456771_3458163_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|344aa|up_4|NC_021658.1_3458503_3459535_-	COG1597, LCB5, Sphingosine kinase and enzymes related to eukaryotic diacylglycerol kinase [Lipid metabolism / General function prediction only]	NA|397aa|up_3|NC_021658.1_3459535_3460726_-	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|423aa|up_2|NC_021658.1_3460870_3462139_-	NA	NA|473aa|up_1|NC_021658.1_3462481_3463900_+	cd17486, MFS_AmpG_like, AmpG and similar transporters of the Major Facilitator Superfamily	NA|321aa|up_0|NC_021658.1_3463926_3464889_-	PRK13386, fliH, flagellar assembly protein H; Provisional	NA|286aa|down_0|NC_021658.1_3465345_3466203_+	NA	NA|494aa|down_1|NC_021658.1_3466361_3467843_+	COG0612, PqqL, Predicted Zn-dependent peptidases [General function prediction only]	NA|516aa|down_2|NC_021658.1_3467839_3469387_+	COG0612, PqqL, Predicted Zn-dependent peptidases [General function prediction only]	NA|211aa|down_3|NC_021658.1_3469489_3470122_-	NA	NA|500aa|down_4|NC_021658.1_3470167_3471667_-	PRK12323, PRK12323, DNA polymerase III subunit gamma/tau	NA|1202aa|down_5|NC_021658.1_3471996_3475602_-	COG0664, Crp, cAMP-binding proteins - catabolite gene activator and regulatory subunit of cAMP-dependent protein kinases [Signal transduction mechanisms]	NA|394aa|down_6|NC_021658.1_3475980_3477162_+	PHA00370, III, attachment protein	NA|262aa|down_7|NC_021658.1_3477158_3477944_+	NA	NA|190aa|down_8|NC_021658.1_3478050_3478620_-	COG3031, PulC, Type II secretory pathway, component PulC [Intracellular trafficking and secretion]	NA|139aa|down_9|NC_021658.1_3479118_3479535_+	cd08354, VOC_like, uncharacterized subfamily of vicinal oxygen chelate (VOC) family
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	8	3493308-3493398	6	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	TCGCGCCCGGCCGGCGGCGCCTGGGCGG	28	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|327aa|up_9|NC_021658.1_3479735_3480716_+,NA|114aa|up_7|NC_021658.1_3481724_3482066_+,NA|158aa|up_6|NC_021658.1_3482164_3482638_+,NA|61aa|up_2|NC_021658.1_3488826_3489009_-,NA	NA|327aa|up_9|NC_021658.1_3479735_3480716_+	NA	NA|96aa|up_8|NC_021658.1_3480953_3481241_+	pfam09720, Unstab_antitox, Putative addiction module component	NA|114aa|up_7|NC_021658.1_3481724_3482066_+	NA	NA|158aa|up_6|NC_021658.1_3482164_3482638_+	NA	NA|919aa|up_5|NC_021658.1_3483022_3485779_+	TIGR02987, m6_adenine_and_m5_cytosine_DNA_methyltransferase, type II restriction m6 adenine DNA methyltransferase, Alw26I/Eco31I/Esp3I family	NA|365aa|up_4|NC_021658.1_3485766_3486861_+	COG2333, ComEC, Predicted hydrolase (metallo-beta-lactamase superfamily) [General function prediction only]	NA|367aa|up_3|NC_021658.1_3486947_3488048_-	PRK07764, PRK07764, DNA polymerase III subunits gamma and tau; Validated	NA|61aa|up_2|NC_021658.1_3488826_3489009_-	NA	NA|169aa|up_1|NC_021658.1_3490334_3490841_-	cd14505, CDKN3-like, cyclin-dependent kinase inhibitor 3 and similar proteins	NA|757aa|up_0|NC_021658.1_3491005_3493276_-	cd01347, ligand_gated_channel, TonB dependent/Ligand-Gated channels are created by a monomeric 22 strand (22,24) anti-parallel beta-barrel	NA|365aa|down_0|NC_021658.1_3493715_3494810_-	pfam10009, DUF2252, Uncharacterized protein conserved in bacteria (DUF2252)	NA|503aa|down_1|NC_021658.1_3494963_3496472_-	pfam01186, Lysyl_oxidase, Lysyl oxidase	NA|156aa|down_2|NC_021658.1_3496832_3497300_+	pfam13411, MerR_1, MerR HTH family regulatory protein	NA|868aa|down_3|NC_021658.1_3497296_3499900_+	TIGR03788, marine_srt_targ, marine proteobacterial sortase target protein	NA|349aa|down_4|NC_021658.1_3499945_3500992_-	COG1360, MotB, Flagellar motor protein [Cell motility and secretion]	NA|469aa|down_5|NC_021658.1_3501273_3502680_-	cd03398, PAP2_haloperoxidase, PAP2, haloperoxidase_like subfamily	NA|365aa|down_6|NC_021658.1_3503293_3504388_-	COG0644, FixC, Dehydrogenases (flavoproteins) [Energy production and conversion]	NA|198aa|down_7|NC_021658.1_3504402_3504996_-	COG1755, COG1755, Uncharacterized protein conserved in bacteria [Function unknown]	NA|359aa|down_8|NC_021658.1_3504989_3506066_-	COG3424, BcsA, Predicted naringenin-chalcone synthase [Secondary metabolites biosynthesis, transport, and catabolism]	NA|124aa|down_9|NC_021658.1_3506272_3506644_+	COG2076, EmrE, Membrane transporters of cations and cationic drugs [Inorganic ion transport and metabolism]
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	9	3678210-3678313	7	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCGAGCTGCTCCAGGACGATCCGCTCCACGGC	32	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|68aa|up_8|NC_021658.1_3635193_3635397_+,NA|85aa|up_7|NC_021658.1_3636213_3636468_-,NA	NA|325aa|up_9|NC_021658.1_3633442_3634417_-	COG2267, PldB, Lysophospholipase [Lipid metabolism]	NA|68aa|up_8|NC_021658.1_3635193_3635397_+	NA	NA|85aa|up_7|NC_021658.1_3636213_3636468_-	NA	NA|220aa|up_6|NC_021658.1_3636717_3637377_+	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|195aa|up_5|NC_021658.1_3637910_3638495_+	cd12124, Pgbs, Protoglobins (Pgbs)	NA|308aa|up_4|NC_021658.1_3638844_3639768_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|358aa|up_3|NC_021658.1_3639727_3640801_+	COG0842, COG0842, ABC-type multidrug transport system, permease component [Defense mechanisms]	NA|352aa|up_2|NC_021658.1_3640941_3641997_+	TIGR04020, non-ribosomal_peptide_synthetase, natural product biosynthesis luciferase-like monooxygenase domain	NA|326aa|up_1|NC_021658.1_3642043_3643021_-	COG3319, COG3319, Thioesterase domains of type I polyketide synthases or non-ribosomal peptide synthetases [Secondary metabolites biosynthesis, transport, and catabolism]	NA|4608aa|up_0|NC_021658.1_3653022_3666846_-	PRK12467, PRK12467, peptide synthase; Provisional	NA|4889aa|down_0|NC_021658.1_3688176_3702843_-	COG3321, COG3321, Polyketide synthase modules and related proteins [Secondary metabolites biosynthesis, transport, and catabolism]	NA|269aa|down_1|NC_021658.1_3703818_3704625_-	COG2226, UbiE, Methylase involved in ubiquinone/menaquinone biosynthesis [Coenzyme metabolism]	NA|367aa|down_2|NC_021658.1_3705138_3706239_+	PRK14019, PRK14019, bifunctional 3,4-dihydroxy-2-butanone-4-phosphate synthase/GTP cyclohydrolase II	NA|171aa|down_3|NC_021658.1_3706352_3706865_+	COG1510, COG1510, Predicted transcriptional regulators [Transcription]	NA|291aa|down_4|NC_021658.1_3706874_3707747_+	TIGR00027, Hypothetical_protein_Rv0893c/MT0917/Mb0917c	NA|421aa|down_5|NC_021658.1_3707974_3709237_-	TIGR02232, myxo_disulf_rpt, Myxococcus cysteine-rich repeat	NA|429aa|down_6|NC_021658.1_3709466_3710753_+	cd13585, PBP2_TMBP_like, The periplasmic-binding component of ABC transport systems specific for trehalose/maltose and similar oligosaccharides; possess type 2 periplasmic binding fold	NA|270aa|down_7|NC_021658.1_3710851_3711661_+	COG1175, UgpA, ABC-type sugar transport systems, permease components [Carbohydrate transport and metabolism]	NA|256aa|down_8|NC_021658.1_3711777_3712545_+	COG0395, UgpE, ABC-type sugar transport system, permease component [Carbohydrate transport and metabolism]	NA|785aa|down_9|NC_021658.1_3712541_3714896_+	PRK10658, PRK10658, putative alpha-glucosidase; Provisional
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	10	3762660-3762973	4	CRT	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCGGAGGCAGCCAGCTGCCT	20	0	0	NA	NA	NA	7	7	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|90aa|up_9|NC_021658.1_3742788_3743058_-,NA|113aa|up_7|NC_021658.1_3747031_3747370_-,NA|295aa|up_0|NC_021658.1_3761594_3762479_-,NA|94aa|down_3|NC_021658.1_3770073_3770355_+,NA|94aa|down_7|NC_021658.1_3776651_3776933_+	NA|90aa|up_9|NC_021658.1_3742788_3743058_-	NA	NA|148aa|up_8|NC_021658.1_3745209_3745653_+	pfam13546, DDE_5, DDE superfamily endonuclease	NA|113aa|up_7|NC_021658.1_3747031_3747370_-	NA	NA|1106aa|up_6|NC_021658.1_3748639_3751957_-	pfam09826, Beta_propel, Beta propeller domain	NA|309aa|up_5|NC_021658.1_3754188_3755115_+	pfam00072, Response_reg, Response regulator receiver domain	NA|534aa|up_4|NC_021658.1_3755390_3756992_+	cd09000, GH43_SXA-like, Glycosyl hydrolase family 43, such as Selenomonas ruminantium beta-D-xylosidase SXA	NA|414aa|up_3|NC_021658.1_3757149_3758391_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|393aa|up_2|NC_021658.1_3758509_3759688_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|313aa|up_1|NC_021658.1_3760431_3761370_-	pfam10118, Metal_hydrol, Predicted metal-dependent hydrolase	NA|295aa|up_0|NC_021658.1_3761594_3762479_-	NA	NA|1011aa|down_0|NC_021658.1_3763254_3766287_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|379aa|down_1|NC_021658.1_3767292_3768429_+	pfam08308, PEGA, PEGA domain	NA|583aa|down_2|NC_021658.1_3768320_3770069_+	PRK13875, PRK13875, conjugal transfer protein TrbL; Provisional	NA|94aa|down_3|NC_021658.1_3770073_3770355_+	NA	NA|259aa|down_4|NC_021658.1_3770476_3771253_+	COG0631, PTC1, Serine/threonine protein phosphatase [Signal transduction mechanisms]	NA|893aa|down_5|NC_021658.1_3771254_3773933_+	TIGR03361, VI_Rhs_Vgr, type VI secretion system Vgr family protein	NA|327aa|down_6|NC_021658.1_3773947_3774928_+	pfam11876, DUF3396, Protein of unknown function (DUF3396)	NA|94aa|down_7|NC_021658.1_3776651_3776933_+	NA	NA|259aa|down_8|NC_021658.1_3777054_3777831_+	COG0631, PTC1, Serine/threonine protein phosphatase [Signal transduction mechanisms]	NA|92aa|down_9|NC_021658.1_3777832_3778108_+	pfam11876, DUF3396, Protein of unknown function (DUF3396)
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	11	4114756-4114862	8	CRISPRCasFinder	no	WYL	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Unclear	GCGCGTGTCCTCGTGCGCCCGCGC	24	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|414aa|up_1|NC_021658.1_4112498_4113740_+,NA|83aa|up_0|NC_021658.1_4114345_4114594_+,NA|162aa|down_3|NC_021658.1_4119015_4119501_+,NA|126aa|down_5|NC_021658.1_4120841_4121219_+	NA|343aa|up_9|NC_021658.1_4096893_4097922_+	pfam02322, Cyt_bd_oxida_II, Cytochrome bd terminal oxidase subunit II	NA|494aa|up_8|NC_021658.1_4098624_4100106_+	pfam17517, IgGFc_binding, IgGFc binding protein	NA|571aa|up_7|NC_021658.1_4100349_4102062_+	pfam13517, VCBS, Repeat domain in Vibrio, Colwellia, Bradyrhizobium and Shewanella	NA|465aa|up_6|NC_021658.1_4102546_4103941_+	sd00001, TSP3, Calcium-binding Thrombospondin type 3 (TSP3) repeat	NA|149aa|up_5|NC_021658.1_4103838_4104285_+	cd07185, OmpA_C-like, Peptidoglycan binding domains similar to the C-terminal domain of outer-membrane protein OmpA	NA|1218aa|up_4|NC_021658.1_4104644_4108298_-	COG0613, COG0613, Predicted metal-dependent phosphoesterases (PHP family) [General function prediction only]	NA|444aa|up_3|NC_021658.1_4108309_4109641_-	PRK07764, PRK07764, DNA polymerase III subunits gamma and tau; Validated	NA|549aa|up_2|NC_021658.1_4109861_4111508_+	pfam10131, PTPS_related, 6-pyruvoyl-tetrahydropterin synthase related domain; membrane protein	NA|414aa|up_1|NC_021658.1_4112498_4113740_+	NA	NA|83aa|up_0|NC_021658.1_4114345_4114594_+	NA	WYL|399aa|down_0|NC_021658.1_4115207_4116404_+	pfam13280, WYL, WYL domain	NA|462aa|down_1|NC_021658.1_4116482_4117868_-	COG1509, KamA, Lysine 2,3-aminomutase [Amino acid transport and metabolism]	NA|234aa|down_2|NC_021658.1_4118081_4118783_-	cd00254, LT-like, lytic transglycosylase(LT)-like domain	NA|162aa|down_3|NC_021658.1_4119015_4119501_+	NA	NA|343aa|down_4|NC_021658.1_4119540_4120569_-	pfam02517, Abi, CAAX protease self-immunity	NA|126aa|down_5|NC_021658.1_4120841_4121219_+	NA	NA|644aa|down_6|NC_021658.1_4121444_4123376_+	PRK05354, PRK05354, biosynthetic arginine decarboxylase	NA|244aa|down_7|NC_021658.1_4123384_4124116_+	COG2386, CcmB, ABC-type transport system involved in cytochrome c biogenesis, permease component [Posttranslational modification, protein turnover, chaperones]	NA|425aa|down_8|NC_021658.1_4124156_4125431_-	TIGR01372, sarcosine_oxidase_alpha_subunit, sarcosine oxidase, alpha subunit family, heterotetrameric form	NA|210aa|down_9|NC_021658.1_4125640_4126270_+	cd00841, MPP_YfcE, Escherichia coli YfcE and related proteins, metallophosphatase domain
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	12	4496540-4496628	9	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	TGCGCCGGGACCTCGCCGCCGCTGCT	26	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|53aa|up_1|NC_021658.1_4494493_4494652_+,NA|280aa|down_1|NC_021658.1_4497754_4498594_+,NA|161aa|down_6|NC_021658.1_4506034_4506517_+,NA|594aa|down_8|NC_021658.1_4510565_4512347_-	NA|210aa|up_9|NC_021658.1_4483237_4483867_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|328aa|up_8|NC_021658.1_4484010_4484994_+	COG1748, LYS9, Saccharopine dehydrogenase and related proteins [Amino acid transport and metabolism]	NA|321aa|up_7|NC_021658.1_4485111_4486074_-	PRK14951, PRK14951, DNA polymerase III subunits gamma and tau; Provisional	NA|744aa|up_6|NC_021658.1_4486574_4488806_+	COG0178, UvrA, Excinuclease ATPase subunit [DNA replication, recombination, and repair]	NA|342aa|up_5|NC_021658.1_4488902_4489928_-	cd19608, GH113_mannanase-like, Glycoside hydrolase family 113 beta-1,4-mannanase and similar proteins	NA|211aa|up_4|NC_021658.1_4490003_4490636_+	pfam16859, TetR_C_11, Bacterial transcriptional repressor C-terminal	NA|391aa|up_3|NC_021658.1_4490632_4491805_-	cd03311, CIMS_C_terminal_like, CIMS - Cobalamine-independent methonine synthase, or MetE, C-terminal domain_like	NA|486aa|up_2|NC_021658.1_4492245_4493703_+	TIGR04247, nitrous_oxide_maturation_protein_NosD, nitrous oxide reductase family maturation protein NosD	NA|53aa|up_1|NC_021658.1_4494493_4494652_+	NA	NA|289aa|up_0|NC_021658.1_4495256_4496123_+	cd05269, TMR_SDR_a, triphenylmethane reductase (TMR)-like proteins, NMRa-like, atypical (a) SDRs	NA|235aa|down_0|NC_021658.1_4496649_4497354_+	pfam14518, Haem_oxygenas_2, Iron-containing redox enzyme	NA|280aa|down_1|NC_021658.1_4497754_4498594_+	NA	NA|721aa|down_2|NC_021658.1_4498618_4500781_+	pfam01593, Amino_oxidase, Flavin containing amine oxidoreductase	NA|415aa|down_3|NC_021658.1_4501038_4502283_-	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|143aa|down_4|NC_021658.1_4502983_4503412_+	COG4977, COG4977, Transcriptional regulator containing an amidase domain and an AraC-type DNA-binding HTH domain [Transcription]	NA|457aa|down_5|NC_021658.1_4504326_4505697_+	pfam00264, Tyrosinase, Common central domain of tyrosinase	NA|161aa|down_6|NC_021658.1_4506034_4506517_+	NA	NA|562aa|down_7|NC_021658.1_4508409_4510095_-	cd18618, GH43_Xsa43E-like, Glycosyl hydrolase family 43, including Butyrivibrio proteoclasticus arabinofuranosidase Xsa43E	NA|594aa|down_8|NC_021658.1_4510565_4512347_-	NA	NA|420aa|down_9|NC_021658.1_4512798_4514058_+	cd13524, PBP2_Thiaminase_I, Thiaminase-I has high structural homology to the type 2 periplasmic binding proteins of active transport systems
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	13	4522725-4522810	10	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCGGGAGATCGCCGGGCGATCCCC	24	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|161aa|up_8|NC_021658.1_4506034_4506517_+,NA|594aa|up_6|NC_021658.1_4510565_4512347_-,NA|315aa|down_8|NC_021658.1_4539270_4540215_+	NA|457aa|up_9|NC_021658.1_4504326_4505697_+	pfam00264, Tyrosinase, Common central domain of tyrosinase	NA|161aa|up_8|NC_021658.1_4506034_4506517_+	NA	NA|562aa|up_7|NC_021658.1_4508409_4510095_-	cd18618, GH43_Xsa43E-like, Glycosyl hydrolase family 43, including Butyrivibrio proteoclasticus arabinofuranosidase Xsa43E	NA|594aa|up_6|NC_021658.1_4510565_4512347_-	NA	NA|420aa|up_5|NC_021658.1_4512798_4514058_+	cd13524, PBP2_Thiaminase_I, Thiaminase-I has high structural homology to the type 2 periplasmic binding proteins of active transport systems	NA|180aa|up_4|NC_021658.1_4514184_4514724_+	PTZ00146, PTZ00146, fibrillarin; Provisional	NA|155aa|up_3|NC_021658.1_4515010_4515475_-	PRK12323, PRK12323, DNA polymerase III subunit gamma/tau	NA|170aa|up_2|NC_021658.1_4515670_4516180_-	pfam06993, DUF1304, Protein of unknown function (DUF1304)	NA|1299aa|up_1|NC_021658.1_4516363_4520260_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|545aa|up_0|NC_021658.1_4520968_4522603_-	cd06548, GH18_chitinase, The GH18 (glycosyl hydrolases, family 18) type II chitinases hydrolyze chitin, an abundant polymer of N-acetylglucosamine and have been identified in bacteria, fungi, insects, plants, viruses, and protozoan parasites	NA|862aa|down_0|NC_021658.1_4522974_4525560_+	COG1080, PtsA, Phosphoenolpyruvate-protein kinase (PTS system EI component in bacteria) [Carbohydrate transport and metabolism]	NA|587aa|down_1|NC_021658.1_4525635_4527396_+	TIGR01998, N-acetylglucosamine_and_glucose_PTS, PTS system, N-acetylglucosamine-specific IIBC component	NA|366aa|down_2|NC_021658.1_4527395_4528493_+	cd00854, NagA, N-acetylglucosamine-6-phosphate deacetylase, NagA, catalyzes the hydrolysis of the N-acetyl group of N-acetyl-glucosamine-6-phosphate (GlcNAc-6-P) to glucosamine 6-phosphate and acetate	NA|337aa|down_3|NC_021658.1_4528509_4529520_+	COG2222, AgaS, Predicted phosphosugar isomerases [Cell envelope biogenesis, outer membrane]	NA|918aa|down_4|NC_021658.1_4529529_4532283_+	cd06569, GH20_Sm-chitobiase-like, The chitobiase of Serratia marcescens is a beta-N-1,4-acetylhexosaminidase with a glycosyl hydrolase family 20 (GH20) domain that hydrolyzes the beta-1,4-glycosidic linkages in oligomers derived from chitin	NA|1299aa|down_5|NC_021658.1_4532301_4536198_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|365aa|down_6|NC_021658.1_4536406_4537501_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|393aa|down_7|NC_021658.1_4537908_4539087_+	cd01159, NcnH, Naphthocyclinone hydroxylase	NA|315aa|down_8|NC_021658.1_4539270_4540215_+	NA	NA|1300aa|down_9|NC_021658.1_4540317_4544217_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	14	4698117-4698184	11	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCCGGAGGCTGCCGAGGGCCTCCCGG	26	1	1	4698143-4698158	NC_021658.1_4698184-4698199	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|108aa|up_8|NC_021658.1_4687326_4687650_-,NA|143aa|up_1|NC_021658.1_4696297_4696726_+,NA|225aa|down_0|NC_021658.1_4698311_4698986_-,NA|312aa|down_1|NC_021658.1_4699411_4700347_+,NA|126aa|down_2|NC_021658.1_4700700_4701078_+,NA|61aa|down_4|NC_021658.1_4702334_4702517_+,NA|367aa|down_9|NC_021658.1_4707027_4708128_-	NA|665aa|up_9|NC_021658.1_4684899_4686894_-	pfam12770, CHAT, CHAT domain	NA|108aa|up_8|NC_021658.1_4687326_4687650_-	NA	NA|235aa|up_7|NC_021658.1_4688488_4689193_-	cd10033, UDG_like, uncharacterized family of the uracil-DNA glycosylase superfamily	NA|208aa|up_6|NC_021658.1_4689189_4689813_-	pfam01694, Rhomboid, Rhomboid family	NA|500aa|up_5|NC_021658.1_4690147_4691647_+	cd06241, M14-like, Peptidase M14-like domain; uncharacterized subgroup	NA|151aa|up_4|NC_021658.1_4691747_4692200_+	TIGR03081, Methylmalonyl-CoA_epimerase_mitochondrial, methylmalonyl-CoA epimerase	NA|883aa|up_3|NC_021658.1_4692192_4694841_+	PRK09426, PRK09426, methylmalonyl-CoA mutase; Reviewed	NA|338aa|up_2|NC_021658.1_4694842_4695856_+	PRK09435, PRK09435, methylmalonyl Co-A mutase-associated GTPase MeaB	NA|143aa|up_1|NC_021658.1_4696297_4696726_+	NA	NA|293aa|up_0|NC_021658.1_4696873_4697752_+	pfam00457, Glyco_hydro_11, Glycosyl hydrolases family 11	NA|225aa|down_0|NC_021658.1_4698311_4698986_-	NA	NA|312aa|down_1|NC_021658.1_4699411_4700347_+	NA	NA|126aa|down_2|NC_021658.1_4700700_4701078_+	NA	NA|105aa|down_3|NC_021658.1_4701712_4702027_+	cd12399, RRM_HP0827_like, RNA recognition motif in Helicobacter pylori HP0827 protein and similar proteins	NA|61aa|down_4|NC_021658.1_4702334_4702517_+	NA	NA|396aa|down_5|NC_021658.1_4702726_4703914_+	pfam03942, DTW, DTW domain	NA|283aa|down_6|NC_021658.1_4704423_4705272_+	TIGR04052, hypothetical_protein_MettrDRAFT_3899, AZL_007920/MXAN_0976 family protein	NA|164aa|down_7|NC_021658.1_4705315_4705807_+	pfam13620, CarboxypepD_reg, Carboxypeptidase regulatory-like domain	NA|380aa|down_8|NC_021658.1_4705803_4706943_+	TIGR04039, MXAN_0977_Heme2, di-heme enzyme, MXAN_0977 family	NA|367aa|down_9|NC_021658.1_4707027_4708128_-	NA
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	15	4716152-4716246	12	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CGGGCCTGACTCGACGAGATGCC	23	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|61aa|up_9|NC_021658.1_4702334_4702517_+,NA|367aa|up_4|NC_021658.1_4707027_4708128_-,NA	NA|61aa|up_9|NC_021658.1_4702334_4702517_+	NA	NA|396aa|up_8|NC_021658.1_4702726_4703914_+	pfam03942, DTW, DTW domain	NA|283aa|up_7|NC_021658.1_4704423_4705272_+	TIGR04052, hypothetical_protein_MettrDRAFT_3899, AZL_007920/MXAN_0976 family protein	NA|164aa|up_6|NC_021658.1_4705315_4705807_+	pfam13620, CarboxypepD_reg, Carboxypeptidase regulatory-like domain	NA|380aa|up_5|NC_021658.1_4705803_4706943_+	TIGR04039, MXAN_0977_Heme2, di-heme enzyme, MXAN_0977 family	NA|367aa|up_4|NC_021658.1_4707027_4708128_-	NA	NA|796aa|up_3|NC_021658.1_4708717_4711105_+	TIGR03811, tyrosine_decarboxylase, tyrosine decarboxylase, Enterococcus type	NA|328aa|up_2|NC_021658.1_4711506_4712490_+	cd05152, MPH2', Macrolide 2'-Phosphotransferase	NA|151aa|up_1|NC_021658.1_4712586_4713039_+	PRK12678, PRK12678, transcription termination factor Rho; Provisional	NA|1012aa|up_0|NC_021658.1_4713035_4716071_+	PRK11360, PRK11360, two-component system sensor histidine kinase AtoS	NA|462aa|down_0|NC_021658.1_4716510_4717896_+	cd17369, MFS_ShiA_like, Shikimate transporter and similar proteins of the Major Facilitator Superfamily	NA|333aa|down_1|NC_021658.1_4718060_4719059_-	pfam13795, HupE_UreJ_2, HupE / UreJ protein	NA|273aa|down_2|NC_021658.1_4719055_4719874_-	pfam13145, Rotamase_2, PPIC-type PPIASE domain	NA|414aa|down_3|NC_021658.1_4720059_4721301_-	cd10967, CE4_GLA_like_6s, Putative catalytic NodB homology domain of gellan lyase and similar proteins	NA|556aa|down_4|NC_021658.1_4721723_4723391_-	pfam13385, Laminin_G_3, Concanavalin A-like lectin/glucanases superfamily	NA|664aa|down_5|NC_021658.1_4723655_4725647_-	cd05562, Peptidases_S53_like, Peptidase domain in the S53 family	NA|856aa|down_6|NC_021658.1_4725995_4728563_-	TIGR04075, Ser/Thr_phosphatase_family_protein, polynucleotide kinase-phosphatase	NA|504aa|down_7|NC_021658.1_4728559_4730071_-	TIGR04074, Methyltransferase_type_12, 3' terminal RNA ribose 2'-O-methyltransferase Hen1	NA|426aa|down_8|NC_021658.1_4730509_4731787_+	COG4305, COG4305, Endoglucanase C-terminal domain/subunit and related proteins [Carbohydrate transport and metabolism]	NA|336aa|down_9|NC_021658.1_4732201_4733209_+	cd07041, STAS_RsbR_RsbS_like, Sulphate Transporter and Anti-Sigma factor antagonist domain of the "stressosome" complex proteins RsbS and RsbR, regulators of the bacterial stress activated alternative sigma factor sigma-B by phosphorylation
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	16	4887622-4887739	13	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCATCCCGGGCGCCAGGCATCCCGGGCGCG	30	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|182aa|up_7|NC_021658.1_4877828_4878374_-,NA|335aa|up_0|NC_021658.1_4885950_4886955_-,NA	NA|1102aa|up_9|NC_021658.1_4873999_4877305_+	COG0841, AcrB, Cation/multidrug efflux pump [Defense mechanisms]	NA|130aa|up_8|NC_021658.1_4877335_4877725_-	pfam04241, DUF423, Protein of unknown function (DUF423)	NA|182aa|up_7|NC_021658.1_4877828_4878374_-	NA	NA|429aa|up_6|NC_021658.1_4878370_4879657_-	TIGR00462, genX, EF-P lysine aminoacylase GenX	NA|758aa|up_5|NC_021658.1_4879902_4882176_+	COG3227, LasB, Zinc metalloprotease (elastase) [Amino acid transport and metabolism]	NA|149aa|up_4|NC_021658.1_4882254_4882701_-	PTZ00146, PTZ00146, fibrillarin; Provisional	NA|219aa|up_3|NC_021658.1_4882745_4883402_-	TIGR00560, pgsA, CDP-diacylglycerol--glycerol-3-phosphate 3-phosphatidyltransferase	NA|566aa|up_2|NC_021658.1_4883391_4885089_-	sd00006, TPR, Tetratricopeptide repeat	NA|242aa|up_1|NC_021658.1_4885126_4885852_-	PRK00748, PRK00748, 1-(5-phosphoribosyl)-5-[(5-phosphoribosylamino)methylideneamino] imidazole-4-carboxamide isomerase; Validated	NA|335aa|up_0|NC_021658.1_4885950_4886955_-	NA	NA|377aa|down_0|NC_021658.1_4888830_4889961_-	pfam03781, FGE-sulfatase, Sulfatase-modifying factor enzyme 1	NA|727aa|down_1|NC_021658.1_4890353_4892534_+	PRK11091, PRK11091, aerobic respiration control sensor protein ArcB; Provisional	NA|487aa|down_2|NC_021658.1_4892829_4894290_+	cd07041, STAS_RsbR_RsbS_like, Sulphate Transporter and Anti-Sigma factor antagonist domain of the "stressosome" complex proteins RsbS and RsbR, regulators of the bacterial stress activated alternative sigma factor sigma-B by phosphorylation	NA|244aa|down_3|NC_021658.1_4894651_4895383_+	pfam13289, SIR2_2, SIR2-like domain	NA|181aa|down_4|NC_021658.1_4895395_4895938_+	cd00515, HAM1, NTPase/HAM1	NA|346aa|down_5|NC_021658.1_4896113_4897151_+	cd19091, AKR_PsAKR, Polaromonas Sp	NA|242aa|down_6|NC_021658.1_4897155_4897881_+	COG4359, COG4359, Uncharacterized conserved protein [Function unknown]	NA|839aa|down_7|NC_021658.1_4898709_4901226_+	pfam01804, Penicil_amidase, Penicillin amidase	NA|295aa|down_8|NC_021658.1_4902064_4902949_+	COG0631, PTC1, Serine/threonine protein phosphatase [Signal transduction mechanisms]	NA|272aa|down_9|NC_021658.1_4903140_4903956_+	pfam08282, Hydrolase_3, haloacid dehalogenase-like hydrolase
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	17	5329135-5329478	5	CRT	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CGCGNGAAGGGCAGGGCNTTGTCGGC	26	1	1	5329251-5329269	NC_021658.1_10598482-10598500	NA	7	7	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|166aa|up_8|NC_021658.1_5313630_5314128_+,NA|551aa|up_7|NC_021658.1_5314388_5316041_+,NA|99aa|up_0|NC_021658.1_5328391_5328688_+,NA|145aa|down_0|NC_021658.1_5330281_5330716_-,NA|578aa|down_7|NC_021658.1_5344037_5345771_+	NA|285aa|up_9|NC_021658.1_5312611_5313466_-	COG2207, AraC, AraC-type DNA-binding domain-containing proteins [Transcription]	NA|166aa|up_8|NC_021658.1_5313630_5314128_+	NA	NA|551aa|up_7|NC_021658.1_5314388_5316041_+	NA	NA|745aa|up_6|NC_021658.1_5316462_5318697_+	TIGR03361, VI_Rhs_Vgr, type VI secretion system Vgr family protein	NA|745aa|up_5|NC_021658.1_5318763_5320998_+	TIGR03361, VI_Rhs_Vgr, type VI secretion system Vgr family protein	NA|919aa|up_4|NC_021658.1_5321014_5323771_+	TIGR03361, VI_Rhs_Vgr, type VI secretion system Vgr family protein	NA|196aa|up_3|NC_021658.1_5323770_5324358_+	PRK07764, PRK07764, DNA polymerase III subunits gamma and tau; Validated	NA|438aa|up_2|NC_021658.1_5324802_5326116_+	pfam03080, Neprosin, Neprosin	NA|356aa|up_1|NC_021658.1_5327305_5328373_+	pfam13358, DDE_3, DDE superfamily endonuclease	NA|99aa|up_0|NC_021658.1_5328391_5328688_+	NA	NA|145aa|down_0|NC_021658.1_5330281_5330716_-	NA	NA|442aa|down_1|NC_021658.1_5331513_5332839_+	TIGR02270, hypothetical_protein_GSU3180, conserved hypothetical protein	NA|520aa|down_2|NC_021658.1_5332766_5334326_+	PRK07764, PRK07764, DNA polymerase III subunits gamma and tau; Validated	NA|246aa|down_3|NC_021658.1_5335344_5336082_-	smart00935, OmpH, Outer membrane protein (OmpH-like)	NA|1376aa|down_4|NC_021658.1_5336115_5340243_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|351aa|down_5|NC_021658.1_5340523_5341576_-	pfam01213, CAP_N, Adenylate cyclase associated (CAP) N terminal	NA|324aa|down_6|NC_021658.1_5342016_5342988_-	COG0631, PTC1, Serine/threonine protein phosphatase [Signal transduction mechanisms]	NA|578aa|down_7|NC_021658.1_5344037_5345771_+	NA	NA|963aa|down_8|NC_021658.1_5345767_5348656_+	PRK12323, PRK12323, DNA polymerase III subunit gamma/tau	NA|901aa|down_9|NC_021658.1_5348786_5351489_+	PRK05399, PRK05399, DNA mismatch repair protein MutS; Provisional
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	18	5769470-5769597	14	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	TTAGGTAGTCTAACGATCGGCTTTTCCGCTTCGACGAGGG	40	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|253aa|up_5|NC_021658.1_5763639_5764398_+,NA	NA|530aa|up_9|NC_021658.1_5758126_5759716_+	pfam13620, CarboxypepD_reg, Carboxypeptidase regulatory-like domain	NA|580aa|up_8|NC_021658.1_5759746_5761486_-	cd08509, PBP2_TmCBP_oligosaccharides_like, The substrate binding domain of a cellulose-binding protein from Thermotoga maritima contains the type 2 periplasmic binding fold	NA|306aa|up_7|NC_021658.1_5761544_5762462_+	COG1878, COG1878, Kynurenine formamidase [Amino acid transport and metabolism]	NA|322aa|up_6|NC_021658.1_5762522_5763488_-	pfam14394, DUF4423, Domain of unknown function (DUF4423)	NA|253aa|up_5|NC_021658.1_5763639_5764398_+	NA	NA|148aa|up_4|NC_021658.1_5764469_5764913_-	cd15457, NADAR, Escherichia coli swarming motility protein YbiA and related proteins	NA|376aa|up_3|NC_021658.1_5764987_5766115_-	cd06314, PBP1_tmGBP, periplasmic sugar-binding domain of Thermotoga maritima glucose-binding protein (tmGBP) and its close homologs	NA|250aa|up_2|NC_021658.1_5766438_5767188_-	smart00020, Tryp_SPc, Trypsin-like serine protease	NA|276aa|up_1|NC_021658.1_5768216_5769044_+	COG2894, MinD, Septum formation inhibitor-activating ATPase [Cell division and chromosome partitioning]	NA|105aa|up_0|NC_021658.1_5769055_5769370_+	PRK00296, minE, cell division topological specificity factor MinE; Reviewed	NA|1064aa|down_0|NC_021658.1_5770492_5773684_-	COG0553, HepA, Superfamily II DNA/RNA helicases, SNF2 family [Transcription / DNA replication, recombination, and repair]	NA|791aa|down_1|NC_021658.1_5774170_5776543_-	pfam11703, UPF0506, UPF0506	NA|321aa|down_2|NC_021658.1_5776853_5777816_+	COG3386, COG3386, Gluconolactonase [Carbohydrate transport and metabolism]	NA|229aa|down_3|NC_021658.1_5777853_5778540_-	pfam02592, Vut_1, Putative vitamin uptake transporter	NA|328aa|down_4|NC_021658.1_5778705_5779689_+	cd08964, L-asparaginase_II, Type II (periplasmic) bacterial L-asparaginase	NA|415aa|down_5|NC_021658.1_5779656_5780901_-	pfam04909, Amidohydro_2, Amidohydrolase	NA|152aa|down_6|NC_021658.1_5781064_5781520_-	COG0590, CumB, Cytosine/adenosine deaminases [Nucleotide transport and metabolism / Translation, ribosomal structure and biogenesis]	NA|350aa|down_7|NC_021658.1_5781516_5782566_-	cd13563, PBP2_SsuA_like_6, Putative substrate binding domain of sulfonate binding protein-like, a member of the type 2 periplasmic binding protein fold	NA|285aa|down_8|NC_021658.1_5782562_5783417_-	cd03293, ABC_NrtD_SsuB_transporters, ATP-binding cassette domain of the nitrate and sulfonate transporters	NA|282aa|down_9|NC_021658.1_5783413_5784259_-	COG0600, TauC, ABC-type nitrate/sulfonate/bicarbonate transport system, permease component [Inorganic ion transport and metabolism]
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	19	5840911-5841018	15	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CGGGCCGTACCCCGGCGCCGGGGC	24	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|253aa|up_8|NC_021658.1_5830675_5831434_+,NA|294aa|up_7|NC_021658.1_5831423_5832305_+,NA|344aa|up_2|NC_021658.1_5836271_5837303_+,NA	NA|182aa|up_9|NC_021658.1_5830158_5830704_+	cd02042, ParAB_family, partition proteins ParAB family	NA|253aa|up_8|NC_021658.1_5830675_5831434_+	NA	NA|294aa|up_7|NC_021658.1_5831423_5832305_+	NA	NA|442aa|up_6|NC_021658.1_5832340_5833666_-	COG3829, RocR, Transcriptional regulator containing PAS, AAA-type ATPase, and DNA-binding domains [Transcription / Signal transduction mechanisms]	NA|330aa|up_5|NC_021658.1_5833798_5834788_+	cd01949, GGDEF, Diguanylate-cyclase (DGC) or GGDEF domain	NA|195aa|up_4|NC_021658.1_5834913_5835498_+	COG4339, COG4339, Uncharacterized protein conserved in bacteria [Function unknown]	NA|248aa|up_3|NC_021658.1_5835547_5836291_-	pfam03211, Pectate_lyase, Pectate lyase	NA|344aa|up_2|NC_021658.1_5836271_5837303_+	NA	NA|357aa|up_1|NC_021658.1_5837344_5838415_-	pfam13519, VWA_2, von Willebrand factor type A domain	NA|501aa|up_0|NC_021658.1_5838564_5840067_-	pfam16208, Keratin_2_head, Keratin type II head	NA|380aa|down_0|NC_021658.1_5841644_5842784_-	cd17538, REC_D1_PleD-like, first (D1) phosphoacceptor receiver (REC) domain of response regulator PleD and similar domains	NA|354aa|down_1|NC_021658.1_5842780_5843842_-	PRK00742, PRK00742, chemotaxis-specific protein-glutamate methyltransferase CheB	NA|690aa|down_2|NC_021658.1_5843883_5845953_-	COG0643, CheA, Chemotaxis protein histidine kinase and related kinases [Cell motility and secretion / Signal transduction mechanisms]	NA|491aa|down_3|NC_021658.1_5845962_5847435_-	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|191aa|down_4|NC_021658.1_5847431_5848004_-	pfam01584, CheW, CheW-like domain	NA|520aa|down_5|NC_021658.1_5848000_5849560_-	COG1352, CheR, Methylase of chemotaxis methyl-accepting proteins [Cell motility and secretion / Signal transduction mechanisms]	NA|146aa|down_6|NC_021658.1_5849556_5849994_-	cd00732, CheW, CheW, a small regulator protein, unique to the chemotaxis signalling in prokaryotes and archea	NA|481aa|down_7|NC_021658.1_5850149_5851592_-	cd13559, PBP2_SsuA_like_3, Putative substrate binding domain of sulfonate binding protein-like, the type 2 periplasmic binding protein fold	NA|1426aa|down_8|NC_021658.1_5852074_5856352_+	PRK07726, PRK07726, DNA topoisomerase 3	NA|547aa|down_9|NC_021658.1_5856757_5858398_-	cd05819, NHL, NHL repeat unit of beta-propeller proteins
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	20	5884182-5884270	16	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CTTGCAGCCGCCCTGGCCCTTGCACTCGTTCT	32	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA,NA|378aa|down_0|NC_021658.1_5884700_5885834_+,NA|299aa|down_4|NC_021658.1_5888430_5889327_-,NA|561aa|down_5|NC_021658.1_5890431_5892114_-,NA|173aa|down_6|NC_021658.1_5892322_5892841_-,NA|287aa|down_8|NC_021658.1_5896213_5897074_-	NA|914aa|up_9|NC_021658.1_5872223_5874965_-	PRK00009, PRK00009, phosphoenolpyruvate carboxylase; Reviewed	NA|500aa|up_8|NC_021658.1_5875490_5876990_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|303aa|up_7|NC_021658.1_5876998_5877907_+	COG0583, LysR, Transcriptional regulator [Transcription]	NA|152aa|up_6|NC_021658.1_5877929_5878385_-	PRK00601, dut, dUTP diphosphatase	NA|462aa|up_5|NC_021658.1_5878435_5879821_-	cd06161, S2P-M50_SpoIVFB, SpoIVFB Site-2 protease (S2P), a zinc metalloprotease (MEROPS family M50B), regulates intramembrane proteolysis (RIP), and is involved in the pro-sigmaK pathway of bacterial spore formation	NA|291aa|up_4|NC_021658.1_5879963_5880836_+	cd00229, SGNH_hydrolase, SGNH_hydrolase, or GDSL_hydrolase, is a diverse family of lipases and esterases	NA|251aa|up_3|NC_021658.1_5880961_5881714_-	cd07989, LPLAT_AGPAT-like, Lysophospholipid Acyltransferases (LPLATs) of Glycerophospholipid Biosynthesis: AGPAT-like	NA|144aa|up_2|NC_021658.1_5881850_5882282_-	COG0432, COG0432, Uncharacterized conserved protein [Function unknown]	NA|292aa|up_1|NC_021658.1_5882291_5883167_-	pfam09836, DUF2063, Putative DNA-binding domain	NA|280aa|up_0|NC_021658.1_5883216_5884056_-	pfam05114, DUF692, Protein of unknown function (DUF692)	NA|378aa|down_0|NC_021658.1_5884700_5885834_+	NA	NA|345aa|down_1|NC_021658.1_5885814_5886849_+	PRK12323, PRK12323, DNA polymerase III subunit gamma/tau	NA|229aa|down_2|NC_021658.1_5886845_5887532_+	cd00056, ENDO3c, endonuclease III; includes endonuclease III (DNA-(apurinic or apyrimidinic site) lyase), alkylbase DNA glycosidases (Alka-family) and other DNA glycosidases	NA|302aa|down_3|NC_021658.1_5887528_5888434_-	COG0697, RhaT, Permeases of the drug/metabolite transporter (DMT) superfamily [Carbohydrate transport and metabolism / Amino acid transport and metabolism / General function prediction only]	NA|299aa|down_4|NC_021658.1_5888430_5889327_-	NA	NA|561aa|down_5|NC_021658.1_5890431_5892114_-	NA	NA|173aa|down_6|NC_021658.1_5892322_5892841_-	NA	NA|873aa|down_7|NC_021658.1_5892935_5895554_-	TIGR03480, HpnN, hopanoid biosynthesis associated RND transporter like protein HpnN	NA|287aa|down_8|NC_021658.1_5896213_5897074_-	NA	NA|283aa|down_9|NC_021658.1_5897087_5897936_-	pfam00487, FA_desaturase, Fatty acid desaturase
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	21	6104618-6105071	17	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CTTCGGCGACGCCTGCGACAATTGC	25	0	0	NA	NA	NA	6	6	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|242aa|up_0|NC_021658.1_6099642_6100368_-,NA|263aa|down_7|NC_021658.1_6116892_6117681_+,NA|162aa|down_9|NC_021658.1_6119496_6119982_+	NA|325aa|up_9|NC_021658.1_6087961_6088936_-	cd05289, MDR_like_2, alcohol dehydrogenase and quinone reductase-like medium chain degydrogenases/reductases	NA|80aa|up_8|NC_021658.1_6089207_6089447_+	COG4118, Phd, Antitoxin of toxin-antitoxin stability system [Cell division and chromosome partitioning]	NA|136aa|up_7|NC_021658.1_6089443_6089851_+	cd09872, PIN_Sll0205-like, VapC-like PIN domain of Sll0205 protein and homologs	NA|533aa|up_6|NC_021658.1_6089867_6091466_-	cd07402, MPP_GpdQ, Enterobacter aerogenes GpdQ and related proteins, metallophosphatase domain	NA|447aa|up_5|NC_021658.1_6091592_6092933_+	PRK12323, PRK12323, DNA polymerase III subunit gamma/tau	NA|328aa|up_4|NC_021658.1_6092949_6093933_-	cd19100, AKR_unchar, uncharacterized aldo-keto reductase (AKR) superfamily protein	NA|272aa|up_3|NC_021658.1_6094706_6095522_+	pfam05642, Sporozoite_P67, Sporozoite P67 surface antigen	NA|607aa|up_2|NC_021658.1_6095917_6097738_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|603aa|up_1|NC_021658.1_6097775_6099584_+	pfam08308, PEGA, PEGA domain	NA|242aa|up_0|NC_021658.1_6099642_6100368_-	NA	NA|244aa|down_0|NC_021658.1_6107175_6107907_+	PRK13875, PRK13875, conjugal transfer protein TrbL; Provisional	NA|474aa|down_1|NC_021658.1_6108067_6109489_-	pfam13546, DDE_5, DDE superfamily endonuclease	NA|629aa|down_2|NC_021658.1_6109731_6111618_+	cd07185, OmpA_C-like, Peptidoglycan binding domains similar to the C-terminal domain of outer-membrane protein OmpA	NA|491aa|down_3|NC_021658.1_6111904_6113377_+	cd07398, MPP_YbbF-LpxH, Escherichia coli YbbF/LpxH and related proteins, metallophosphatase domain	NA|258aa|down_4|NC_021658.1_6113499_6114273_+	COG0631, PTC1, Serine/threonine protein phosphatase [Signal transduction mechanisms]	NA|354aa|down_5|NC_021658.1_6114318_6115380_-	cd14656, Imelysin-like_EfeO, EfeO is a component of the EfeUOB operon	NA|411aa|down_6|NC_021658.1_6115486_6116719_-	pfam06537, DHOR, Di-haem oxidoreductase, putative peroxidase	NA|263aa|down_7|NC_021658.1_6116892_6117681_+	NA	NA|517aa|down_8|NC_021658.1_6117703_6119254_-	PTZ00146, PTZ00146, fibrillarin; Provisional	NA|162aa|down_9|NC_021658.1_6119496_6119982_+	NA
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	22	6287268-6287372	18	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GGCTGTTTCAGGTCAGCCCTCCTTTCGCG	29	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|141aa|up_8|NC_021658.1_6276111_6276534_+,NA|235aa|up_3|NC_021658.1_6282457_6283162_+,NA	NA|106aa|up_9|NC_021658.1_6275619_6275937_+	pfam08308, PEGA, PEGA domain	NA|141aa|up_8|NC_021658.1_6276111_6276534_+	NA	NA|343aa|up_7|NC_021658.1_6276530_6277559_+	COG1595, RpoE, DNA-directed RNA polymerase specialized sigma subunit, sigma24 homolog [Transcription]	NA|558aa|up_6|NC_021658.1_6277979_6279653_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|328aa|up_5|NC_021658.1_6279720_6280704_+	PRK07003, PRK07003, DNA polymerase III subunit gamma/tau	NA|458aa|up_4|NC_021658.1_6280776_6282150_+	pfam01474, DAHP_synth_2, Class-II DAHP synthetase family	NA|235aa|up_3|NC_021658.1_6282457_6283162_+	NA	NA|128aa|up_2|NC_021658.1_6283455_6283839_+	PRK00521, rbfA, 30S ribosome-binding factor RbfA	NA|236aa|up_1|NC_021658.1_6283835_6284543_+	pfam01139, RtcB, tRNA-splicing ligase RtcB	NA|871aa|up_0|NC_021658.1_6284523_6287136_-	cd07489, Peptidases_S8_5, Peptidase S8 family domain, uncharacterized subfamily 5	NA|211aa|down_0|NC_021658.1_6287533_6288166_+	pfam08241, Methyltransf_11, Methyltransferase domain	NA|321aa|down_1|NC_021658.1_6288162_6289125_+	cd05234, UDP_G4E_2_SDR_e, UDP-glucose 4 epimerase, subgroup 2, extended (e) SDRs	NA|225aa|down_2|NC_021658.1_6289175_6289850_+	cd03194, GST_C_3, C-terminal, alpha helical domain of an unknown subfamily 3 of Glutathione S-transferases	NA|583aa|down_3|NC_021658.1_6289966_6291715_+	PRK10669, PRK10669, putative cation:proton antiport protein; Provisional	NA|313aa|down_4|NC_021658.1_6291737_6292676_-	TIGR00950, Uncharacterized_inner_membrane_transporter_YicL, Carboxylate/Amino Acid/Amine Transporter	NA|292aa|down_5|NC_021658.1_6292978_6293854_+	pfam02405, MlaE, Permease MlaE	NA|286aa|down_6|NC_021658.1_6293869_6294727_+	pfam02405, MlaE, Permease MlaE	NA|247aa|down_7|NC_021658.1_6294752_6295493_-	cd03261, ABC_Org_Solvent_Resistant, ATP-binding cassette transport system involved in resistant to organic solvents	NA|341aa|down_8|NC_021658.1_6295654_6296677_+	COG1463, Ttg2C, ABC-type transport system involved in resistance to organic solvents, periplasmic component [Secondary metabolites biosynthesis, transport, and catabolism]	NA|72aa|down_9|NC_021658.1_6296795_6297011_-	cd06850, biotinyl_domain, The biotinyl-domain or biotin carboxyl carrier protein (BCCP) domain is present in all biotin-dependent enzymes, such as acetyl-CoA carboxylase, pyruvate carboxylase, propionyl-CoA carboxylase, methylcrotonyl-CoA carboxylase, geranyl-CoA carboxylase, oxaloacetate decarboxylase, methylmalonyl-CoA decarboxylase, transcarboxylase and urea amidolyase
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	23	6544700-6544812	19	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCCGCCTCAGGAAGCGCGGGCGC	23	1	1	6544768-6544789	NC_021658.1_10607772-10607793	NA	2	2	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|330aa|up_7|NC_021658.1_6534067_6535057_-,NA|296aa|down_0|NC_021658.1_6545696_6546584_-,NA|429aa|down_4|NC_021658.1_6552688_6553975_+	NA|495aa|up_9|NC_021658.1_6530774_6532259_+	PRK14900, valS, valyl-tRNA synthetase; Provisional	NA|602aa|up_8|NC_021658.1_6532265_6534071_-	pfam13231, PMT_2, Dolichyl-phosphate-mannose-protein mannosyltransferase	NA|330aa|up_7|NC_021658.1_6534067_6535057_-	NA	NA|140aa|up_6|NC_021658.1_6535281_6535701_+	pfam05866, RusA, Endodeoxyribonuclease RusA	NA|212aa|up_5|NC_021658.1_6535697_6536333_+	pfam18743, AHJR-like, REase_AHJR-like	NA|693aa|up_4|NC_021658.1_6536448_6538527_-	PLN02791, PLN02791, Nudix hydrolase homolog	NA|505aa|up_3|NC_021658.1_6538690_6540205_-	cd07398, MPP_YbbF-LpxH, Escherichia coli YbbF/LpxH and related proteins, metallophosphatase domain	NA|169aa|up_2|NC_021658.1_6540771_6541278_+	smart00994, zf-C4_ClpX, ClpX C4-type zinc finger	NA|437aa|up_1|NC_021658.1_6541413_6542724_-	PLN03138, PLN03138, Protein TOC75; Provisional	NA|418aa|up_0|NC_021658.1_6542869_6544123_-	PHA03378, PHA03378, EBNA-3B; Provisional	NA|296aa|down_0|NC_021658.1_6545696_6546584_-	NA	NA|1406aa|down_1|NC_021658.1_6547069_6551287_-	pfam12770, CHAT, CHAT domain	NA|198aa|down_2|NC_021658.1_6551441_6552035_-	cd06260, DUF820, Domain of unknown function (DUF820)	NA|155aa|down_3|NC_021658.1_6552136_6552601_-	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|429aa|down_4|NC_021658.1_6552688_6553975_+	NA	NA|163aa|down_5|NC_021658.1_6554118_6554607_+	pfam03364, Polyketide_cyc, Polyketide cyclase / dehydrase and lipid transport	NA|439aa|down_6|NC_021658.1_6554739_6556056_-	TIGR04566, hypothetical_protein_Q664_47920, outer membrane exchange protein TraA, N-terminal region	NA|966aa|down_7|NC_021658.1_6556264_6559162_-	PRK12323, PRK12323, DNA polymerase III subunit gamma/tau	NA|189aa|down_8|NC_021658.1_6559293_6559860_+	smart00702, P4Hc, Prolyl 4-hydroxylase alpha subunit homologues	NA|287aa|down_9|NC_021658.1_6559935_6560796_-	cd01409, SIRT4, SIRT4: Eukaryotic and prokaryotic group (class2) which includes human sirtuin SIRT4 and several bacterial homologs; and are members of the SIR2 family of proteins, silent information regulator 2 (Sir2) enzymes which catalyze NAD+-dependent protein/histone deacetylation
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	24	6751541-6751757	20	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CGGGTCGCCCCAACCTGGGTCGG	23	0	0	NA	NA	NA	3	3	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|162aa|up_5|NC_021658.1_6741157_6741643_-,NA	NA|291aa|up_9|NC_021658.1_6737703_6738576_-	COG2084, MmsB, 3-hydroxyisobutyrate dehydrogenase and related beta-hydroxyacid dehydrogenases [Lipid metabolism]	NA|278aa|up_8|NC_021658.1_6738782_6739616_+	COG2207, AraC, AraC-type DNA-binding domain-containing proteins [Transcription]	NA|312aa|up_7|NC_021658.1_6739625_6740561_-	TIGR02957, putative_sigma_factor, RNA polymerase sigma-70 factor, TIGR02957 family	NA|180aa|up_6|NC_021658.1_6740562_6741102_-	COG2128, COG2128, Uncharacterized conserved protein [Function unknown]	NA|162aa|up_5|NC_021658.1_6741157_6741643_-	NA	NA|517aa|up_4|NC_021658.1_6741753_6743304_+	cd10170, HSP70_NBD, Nucleotide-binding domain of the HSP70 family	NA|313aa|up_3|NC_021658.1_6743880_6744819_-	COG0679, COG0679, Predicted permeases [General function prediction only]	NA|663aa|up_2|NC_021658.1_6745197_6747186_-	COG0021, TktA, Transketolase [Carbohydrate transport and metabolism]	NA|494aa|up_1|NC_021658.1_6748043_6749525_-	cd14955, NHL_like_4, Uncharacterized NHL-repeat domain in bacterial and archaeal proteins	NA|497aa|up_0|NC_021658.1_6749753_6751244_-	cd05819, NHL, NHL repeat unit of beta-propeller proteins	NA|322aa|down_0|NC_021658.1_6751835_6752801_+	pfam07676, PD40, WD40-like Beta Propeller Repeat	NA|329aa|down_1|NC_021658.1_6753453_6754440_+	cd19920, REC_PA4781-like, phosphoacceptor receiver (REC) domain of cyclic di-GMP phosphodiesterase PA4781 and similar domains	NA|2006aa|down_2|NC_021658.1_6754501_6760519_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|378aa|down_3|NC_021658.1_6760540_6761674_-	COG1960, CaiA, Acyl-CoA dehydrogenases [Lipid metabolism]	NA|373aa|down_4|NC_021658.1_6762103_6763222_+	pfam06283, ThuA, Trehalose utilisation	NA|545aa|down_5|NC_021658.1_6763316_6764951_+	COG0154, GatA, Asp-tRNAAsn/Glu-tRNAGln amidotransferase A subunit and related amidases [Translation, ribosomal structure and biogenesis]	NA|236aa|down_6|NC_021658.1_6765059_6765767_+	pfam14234, DUF4336, Domain of unknown function (DUF4336)	NA|905aa|down_7|NC_021658.1_6765914_6768629_-	pfam14200, RicinB_lectin_2, Ricin-type beta-trefoil lectin domain-like	NA|111aa|down_8|NC_021658.1_6769618_6769951_-	PRK02237, PRK02237, YnfA family protein	NA|116aa|down_9|NC_021658.1_6770175_6770523_+	PRK02888, PRK02888, nitrous-oxide reductase; Validated
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	25	7376707-7376805	21	CRISPRCasFinder	no	DEDDh	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Unclear	TCTCGTCGGGTCTCTCGTCGGGTC	24	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|116aa|up_1|NC_021658.1_7374898_7375246_-,NA|223aa|down_2|NC_021658.1_7379226_7379895_+,NA|260aa|down_8|NC_021658.1_7386965_7387745_-	NA|858aa|up_9|NC_021658.1_7361910_7364484_-	PRK12678, PRK12678, transcription termination factor Rho; Provisional	NA|231aa|up_8|NC_021658.1_7364617_7365310_+	COG0546, Gph, Predicted phosphatases [General function prediction only]	NA|407aa|up_7|NC_021658.1_7365317_7366538_-	COG4637, COG4637, Predicted ATPase [General function prediction only]	NA|211aa|up_6|NC_021658.1_7367098_7367731_-	pfam14103, DUF4276, Domain of unknown function (DUF4276)	NA|409aa|up_5|NC_021658.1_7367717_7368944_-	COG4637, COG4637, Predicted ATPase [General function prediction only]	NA|1287aa|up_4|NC_021658.1_7368979_7372840_-	PRK06039, ileS, isoleucyl-tRNA synthetase; Reviewed	NA|198aa|up_3|NC_021658.1_7372936_7373530_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|204aa|up_2|NC_021658.1_7374256_7374868_-	cd00564, TMP_TenI, Thiamine monophosphate synthase (TMP synthase)/TenI	NA|116aa|up_1|NC_021658.1_7374898_7375246_-	NA	NA|425aa|up_0|NC_021658.1_7375325_7376600_-	cd03798, GT4_WlbH-like, Bordetella parapertussis WlbH and similar proteins	NA|413aa|down_0|NC_021658.1_7376829_7378068_-	cd03801, GT4_PimA-like, phosphatidyl-myo-inositol mannosyltransferase	NA|261aa|down_1|NC_021658.1_7378323_7379106_-	PRK00208, thiG, thiazole synthase; Reviewed	NA|223aa|down_2|NC_021658.1_7379226_7379895_+	NA	NA|287aa|down_3|NC_021658.1_7379989_7380850_+	pfam00413, Peptidase_M10, Matrixin	NA|404aa|down_4|NC_021658.1_7380846_7382058_+	cd06142, RNaseD_exo, DEDDy 3'-5' exonuclease domain of Ribonuclease D and similar proteins	NA|587aa|down_5|NC_021658.1_7382274_7384035_+	pfam00924, MS_channel, Mechanosensitive ion channel	NA|350aa|down_6|NC_021658.1_7383976_7385026_-	PLN02389, PLN02389, biotin synthase	NA|351aa|down_7|NC_021658.1_7385655_7386708_-	COG2805, PilT, Tfp pilus assembly protein, pilus retraction ATPase PilT [Cell motility and secretion / Intracellular trafficking and secretion]	NA|260aa|down_8|NC_021658.1_7386965_7387745_-	NA	NA|466aa|down_9|NC_021658.1_7387769_7389167_-	pfam01964, ThiC_Rad_SAM, Radical SAM ThiC family
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	26	7538290-7538389	22	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CGCGGCGCGCGGCGACGACGACGACGCGCCCCG	33	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|357aa|up_7|NC_021658.1_7523572_7524643_-,NA|384aa|up_6|NC_021658.1_7524657_7525809_-,NA|243aa|up_4|NC_021658.1_7528066_7528795_-,NA|423aa|down_6|NC_021658.1_7544891_7546160_+	NA|525aa|up_9|NC_021658.1_7519716_7521291_+	cd01465, vWA_subgroup, VWA subgroup: Von Willebrand factor type A (vWA) domain was originally found in the blood coagulation protein von Willebrand factor (vWF)	NA|360aa|up_8|NC_021658.1_7521655_7522735_+	pfam02618, YceG, YceG-like family	NA|357aa|up_7|NC_021658.1_7523572_7524643_-	NA	NA|384aa|up_6|NC_021658.1_7524657_7525809_-	NA	NA|755aa|up_5|NC_021658.1_7525805_7528070_-	TIGR02168, Chromosome_partition_protein_Smc, chromosome segregation protein SMC, common bacterial type	NA|243aa|up_4|NC_021658.1_7528066_7528795_-	NA	NA|220aa|up_3|NC_021658.1_7530588_7531248_+	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|205aa|up_2|NC_021658.1_7531354_7531969_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|495aa|up_1|NC_021658.1_7531997_7533482_-	pfam00999, Na_H_Exchanger, Sodium/hydrogen exchanger family	NA|435aa|up_0|NC_021658.1_7533493_7534798_-	COG0475, KefB, Kef-type K+ transport systems, membrane components [Inorganic ion transport and metabolism]	NA|387aa|down_0|NC_021658.1_7538405_7539566_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|225aa|down_1|NC_021658.1_7539556_7540231_-	COG5012, COG5012, Predicted cobalamin binding protein [General function prediction only]	NA|242aa|down_2|NC_021658.1_7540374_7541100_-	pfam01182, Glucosamine_iso, Glucosamine-6-phosphate isomerases/6-phosphogluconolactonase	NA|392aa|down_3|NC_021658.1_7541122_7542298_-	pfam10128, OpcA_G6PD_assem, Glucose-6-phosphate dehydrogenase subunit	NA|526aa|down_4|NC_021658.1_7542195_7543773_-	PRK05722, PRK05722, glucose-6-phosphate 1-dehydrogenase; Validated	NA|115aa|down_5|NC_021658.1_7544262_7544607_+	COG2442, COG2442, Uncharacterized conserved protein [Function unknown]	NA|423aa|down_6|NC_021658.1_7544891_7546160_+	NA	NA|1257aa|down_7|NC_021658.1_7546523_7550294_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|236aa|down_8|NC_021658.1_7550389_7551097_+	cd07989, LPLAT_AGPAT-like, Lysophospholipid Acyltransferases (LPLATs) of Glycerophospholipid Biosynthesis: AGPAT-like	NA|621aa|down_9|NC_021658.1_7551797_7553660_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	27	7992019-7992095	23	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CGGGCCGCGCGCGCCTTCCTGGA	23	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA,NA|81aa|down_0|NC_021658.1_7992476_7992719_+,NA|161aa|down_1|NC_021658.1_7992814_7993297_-,NA|275aa|down_6|NC_021658.1_7997317_7998142_+	NA|297aa|up_9|NC_021658.1_7974063_7974954_+	pfam03781, FGE-sulfatase, Sulfatase-modifying factor enzyme 1	NA|287aa|up_8|NC_021658.1_7975298_7976159_+	COG0668, MscS, Small-conductance mechanosensitive channel [Cell envelope biogenesis, outer membrane]	NA|271aa|up_7|NC_021658.1_7976271_7977084_+	pfam00924, MS_channel, Mechanosensitive ion channel	NA|214aa|up_6|NC_021658.1_7977170_7977812_+	PRK10119, PRK10119, putative hydrolase; Provisional	NA|278aa|up_5|NC_021658.1_7977814_7978648_-	COG0170, SEC59, Dolichol kinase [Lipid metabolism]	NA|1317aa|up_4|NC_021658.1_7979505_7983456_+	cd09596, M36, Peptidase M36 family, also known as fungalysin family	NA|220aa|up_3|NC_021658.1_7983596_7984256_+	cd03378, beta_CA_cladeC, Carbonic anhydrases (CA) are zinc-containing enzymes that catalyze the reversible hydration of carbon dioxide in a two-step mechanism in which the nucleophilic attack of a zinc-bound hydroxide ion on carbon dioxide is followed by the regeneration of an active site by ionization of the zinc-bound water molecule and removal of a proton from the active site	NA|742aa|up_2|NC_021658.1_7984317_7986543_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|674aa|up_1|NC_021658.1_7986771_7988793_-	PLN02337, PLN02337, lipoxygenase	NA|306aa|up_0|NC_021658.1_7989440_7990358_+	PRK06958, PRK06958, single-stranded DNA-binding protein; Provisional	NA|81aa|down_0|NC_021658.1_7992476_7992719_+	NA	NA|161aa|down_1|NC_021658.1_7992814_7993297_-	NA	NA|309aa|down_2|NC_021658.1_7993486_7994413_+	COG2382, Fes, Enterochelin esterase and related enzymes [Inorganic ion transport and metabolism]	NA|262aa|down_3|NC_021658.1_7994475_7995261_-	pfam06112, Herpes_capsid, Gammaherpesvirus capsid protein	NA|431aa|down_4|NC_021658.1_7995406_7996699_-	cd13970, ABC1_ADCK3, Activator of bc1 complex (ABC1) kinases, also called aarF domain containing kinase 3	NA|163aa|down_5|NC_021658.1_7996730_7997219_+	cd00002, YbaK_deacylase, This CD includes cysteinyl-tRNA(Pro) deacylases from Haemophilus influenzae and Escherichia coli and other related bacterial proteins	NA|275aa|down_6|NC_021658.1_7997317_7998142_+	NA	NA|409aa|down_7|NC_021658.1_7998341_7999568_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|174aa|down_8|NC_021658.1_7999556_8000078_-	pfam10002, DUF2243, Predicted membrane protein (DUF2243)	NA|259aa|down_9|NC_021658.1_8000323_8001100_+	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	28	8011479-8011543	24	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCTGAGCGCTCCCGGCCGGCGGCGC	25	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|275aa|up_8|NC_021658.1_7997317_7998142_+,NA|577aa|up_1|NC_021658.1_8004374_8006105_-,NA|57aa|down_3|NC_021658.1_8016557_8016728_+,NA|259aa|down_8|NC_021658.1_8025699_8026476_+	NA|163aa|up_9|NC_021658.1_7996730_7997219_+	cd00002, YbaK_deacylase, This CD includes cysteinyl-tRNA(Pro) deacylases from Haemophilus influenzae and Escherichia coli and other related bacterial proteins	NA|275aa|up_8|NC_021658.1_7997317_7998142_+	NA	NA|409aa|up_7|NC_021658.1_7998341_7999568_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|174aa|up_6|NC_021658.1_7999556_8000078_-	pfam10002, DUF2243, Predicted membrane protein (DUF2243)	NA|259aa|up_5|NC_021658.1_8000323_8001100_+	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|155aa|up_4|NC_021658.1_8001151_8001616_-	PRK12323, PRK12323, DNA polymerase III subunit gamma/tau	NA|263aa|up_3|NC_021658.1_8001745_8002534_-	PRK06172, PRK06172, SDR family oxidoreductase	NA|315aa|up_2|NC_021658.1_8003208_8004153_+	COG1196, Smc, Chromosome segregation ATPases [Cell division and chromosome partitioning]	NA|577aa|up_1|NC_021658.1_8004374_8006105_-	NA	NA|1292aa|up_0|NC_021658.1_8006157_8010033_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|227aa|down_0|NC_021658.1_8011769_8012450_+	pfam00582, Usp, Universal stress protein family	NA|444aa|down_1|NC_021658.1_8012598_8013930_-	pfam07586, HXXSHH, Protein of unknown function (DUF1552)	NA|567aa|down_2|NC_021658.1_8013939_8015640_-	pfam07631, PSD4, Protein of unknown function (DUF1592)	NA|57aa|down_3|NC_021658.1_8016557_8016728_+	NA	NA|688aa|down_4|NC_021658.1_8020743_8022807_+	TIGR03696, tRNA_nuclease_WapA, RHS repeat-associated core domain	NA|148aa|down_5|NC_021658.1_8022803_8023247_+	pfam14568, SUKH_6, SMI1-KNR4 cell-wall	NA|192aa|down_6|NC_021658.1_8023382_8023958_+	TIGR01352, Protein_TonB, TonB family C-terminal domain	NA|239aa|down_7|NC_021658.1_8024163_8024880_+	COG0810, TonB, Periplasmic protein TonB, links inner and outer membranes [Cell envelope biogenesis, outer membrane]	NA|259aa|down_8|NC_021658.1_8025699_8026476_+	NA	NA|332aa|down_9|NC_021658.1_8026777_8027773_+	PRK07003, PRK07003, DNA polymerase III subunit gamma/tau
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	29	8210044-8210153	25	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCGAGGCCCGCCTTCTCGGTTCCGCA	26	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|266aa|up_5|NC_021658.1_8202478_8203276_+,NA|240aa|up_3|NC_021658.1_8204445_8205165_+,NA|285aa|down_0|NC_021658.1_8210407_8211262_+,NA|256aa|down_1|NC_021658.1_8211301_8212069_-	NA|522aa|up_9|NC_021658.1_8197354_8198920_-	COG1538, TolC, Outer membrane protein [Cell envelope biogenesis, outer membrane / Intracellular trafficking and secretion]	NA|244aa|up_8|NC_021658.1_8198976_8199708_+	COG0745, OmpR, Response regulators consisting of a CheY-like receiver domain and a winged-helix DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|451aa|up_7|NC_021658.1_8199760_8201113_+	PRK09470, cpxA, envelope stress sensor histidine kinase CpxA	NA|408aa|up_6|NC_021658.1_8201231_8202455_+	pfam13304, AAA_21, AAA domain, putative AbiEii toxin, Type IV TA system	NA|266aa|up_5|NC_021658.1_8202478_8203276_+	NA	NA|132aa|up_4|NC_021658.1_8203391_8203787_+	COG2124, CypX, Cytochrome P450 [Secondary metabolites biosynthesis, transport, and catabolism]	NA|240aa|up_3|NC_021658.1_8204445_8205165_+	NA	NA|481aa|up_2|NC_021658.1_8205248_8206691_+	pfam10009, DUF2252, Uncharacterized protein conserved in bacteria (DUF2252)	NA|573aa|up_1|NC_021658.1_8206890_8208609_-	pfam07519, Tannase, Tannase and feruloyl esterase	NA|293aa|up_0|NC_021658.1_8208789_8209668_-	pfam05985, EutC, Ethanolamine ammonia-lyase light chain (EutC)	NA|285aa|down_0|NC_021658.1_8210407_8211262_+	NA	NA|256aa|down_1|NC_021658.1_8211301_8212069_-	NA	NA|356aa|down_2|NC_021658.1_8212796_8213864_+	cd05154, ACAD10_11_N-like, N-terminal domain of Acyl-CoA dehydrogenase (ACAD) 10 and 11, and similar proteins	NA|88aa|down_3|NC_021658.1_8213920_8214184_+	pfam13453, zf-TFIIB, Transcription factor zinc-finger	NA|94aa|down_4|NC_021658.1_8214324_8214606_+	pfam06865, DUF1255, Protein of unknown function (DUF1255)	NA|1288aa|down_5|NC_021658.1_8214887_8218751_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|300aa|down_6|NC_021658.1_8219328_8220228_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|384aa|down_7|NC_021658.1_8221193_8222345_+	COG4641, COG4641, Uncharacterized protein conserved in bacteria [Function unknown]	NA|387aa|down_8|NC_021658.1_8222427_8223588_+	COG0820, COG0820, Predicted Fe-S-cluster redox enzyme [General function prediction only]	NA|467aa|down_9|NC_021658.1_8223688_8225089_+	COG4770, COG4770, Acetyl/propionyl-CoA carboxylase, alpha subunit [Lipid metabolism]
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	30	8246902-8247007	26	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCTGCACCGCCGTCGCCCCGGCGTCCTG	28	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|164aa|up_4|NC_021658.1_8241686_8242178_-,NA|130aa|down_3|NC_021658.1_8249758_8250148_+	NA|395aa|up_9|NC_021658.1_8232768_8233953_-	PRK05382, PRK05382, chorismate synthase; Validated	NA|466aa|up_8|NC_021658.1_8234994_8236392_-	PRK06349, PRK06349, homoserine dehydrogenase; Provisional	NA|645aa|up_7|NC_021658.1_8236448_8238383_+	pfam05943, VipB, Type VI secretion protein, EvpB/VC_A0108, tail sheath	NA|483aa|up_6|NC_021658.1_8239089_8240538_+	COG0654, UbiH, 2-polyprenyl-6-methoxyphenol hydroxylase and related FAD-dependent oxidoreductases [Coenzyme metabolism / Energy production and conversion]	NA|253aa|up_5|NC_021658.1_8240799_8241558_+	cd00641, GTP_cyclohydro2, GTP cyclohydrolase II (RibA)	NA|164aa|up_4|NC_021658.1_8241686_8242178_-	NA	NA|287aa|up_3|NC_021658.1_8242504_8243365_-	cd03394, PAP2_like_5, PAP2_like_5 proteins	NA|193aa|up_2|NC_021658.1_8243392_8243971_-	pfam13305, WHG, WHG domain	NA|407aa|up_1|NC_021658.1_8244262_8245483_+	cd01159, NcnH, Naphthocyclinone hydroxylase	NA|331aa|up_0|NC_021658.1_8245707_8246700_-	cd05153, HomoserineK_II, Type II Homoserine Kinase	NA|191aa|down_0|NC_021658.1_8247448_8248021_-	COG0625, Gst, Glutathione S-transferase [Posttranslational modification, protein turnover, chaperones]	NA|224aa|down_1|NC_021658.1_8248209_8248881_-	pfam13649, Methyltransf_25, Methyltransferase domain	NA|161aa|down_2|NC_021658.1_8248892_8249375_-	pfam07080, DUF1348, Protein of unknown function (DUF1348)	NA|130aa|down_3|NC_021658.1_8249758_8250148_+	NA	NA|310aa|down_4|NC_021658.1_8250210_8251140_-	COG2220, COG2220, Predicted Zn-dependent hydrolases of the beta-lactamase fold [General function prediction only]	NA|192aa|down_5|NC_021658.1_8251315_8251891_-	pfam00440, TetR_N, Bacterial regulatory proteins, tetR family	NA|509aa|down_6|NC_021658.1_8252146_8253673_-	PHA00370, III, attachment protein	NA|338aa|down_7|NC_021658.1_8253885_8254899_-	PRK12438, PRK12438, hypothetical protein; Provisional	NA|1358aa|down_8|NC_021658.1_8254969_8259043_-	pfam13665, DUF4150, Domain of unknown function (DUF4150)	NA|339aa|down_9|NC_021658.1_8259369_8260386_+	COG0057, GapA, Glyceraldehyde-3-phosphate dehydrogenase/erythrose-4-phosphate dehydrogenase [Carbohydrate transport and metabolism]
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	31	8415642-8416722	2,27,6	PILER-CR,CRISPRCasFinder,CRT	no	csa3	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Type I-A	CTCTCCGCCGCTGAAAGGCGGCGGCCCCATTGAAGC,CTCTCCGCCGCTGAAAGGCGGCGGCCCCATTGAAGC,CTCTCCGCCGCTGAAAGGCGGCGGCCCCATTGAAGC	36,36,36	0	0	NA	NA	NA:NA:NA	14,14,14	14	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|64aa|up_3|NC_021658.1_8410238_8410430_-,NA|314aa|up_1|NC_021658.1_8411707_8412649_-,NA|61aa|down_0|NC_021658.1_8417186_8417369_+,NA|424aa|down_3|NC_021658.1_8421912_8423184_+,NA|302aa|down_4|NC_021658.1_8423264_8424170_+,NA|292aa|down_5|NC_021658.1_8424265_8425141_-	NA|233aa|up_9|NC_021658.1_8394147_8394846_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|283aa|up_8|NC_021658.1_8395159_8396008_+	TIGR03425, urea_degr_2, urea carboxylase-associated protein 2	NA|224aa|up_7|NC_021658.1_8396004_8396676_+	TIGR03424, urea_degr_1, urea carboxylase-associated protein 1	NA|527aa|up_6|NC_021658.1_8400358_8401939_+	TIGR03428, ureacarb_perm, permease, urea carboxylase system	NA|589aa|up_5|NC_021658.1_8401962_8403729_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|1929aa|up_4|NC_021658.1_8403794_8409581_-	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|64aa|up_3|NC_021658.1_8410238_8410430_-	NA	NA|217aa|up_2|NC_021658.1_8411029_8411680_+	COG2197, CitB, Response regulator containing a CheY-like receiver domain and an HTH DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|314aa|up_1|NC_021658.1_8411707_8412649_-	NA	NA|672aa|up_0|NC_021658.1_8412916_8414932_+	PRK07764, PRK07764, DNA polymerase III subunits gamma and tau; Validated	NA|61aa|down_0|NC_021658.1_8417186_8417369_+	NA	NA|196aa|down_1|NC_021658.1_8419861_8420449_+	PRK14951, PRK14951, DNA polymerase III subunits gamma and tau; Provisional	NA|326aa|down_2|NC_021658.1_8420568_8421546_-	pfam08308, PEGA, PEGA domain	NA|424aa|down_3|NC_021658.1_8421912_8423184_+	NA	NA|302aa|down_4|NC_021658.1_8423264_8424170_+	NA	NA|292aa|down_5|NC_021658.1_8424265_8425141_-	NA	NA|202aa|down_6|NC_021658.1_8425888_8426494_+	pfam08896, DUF1842, Domain of unknown function (DUF1842)	NA|492aa|down_7|NC_021658.1_8426534_8428010_+	TIGR03913, radical_SAM_domain_protein, Y_X(10)_GDL-associated radical SAM protein	NA|259aa|down_8|NC_021658.1_8428032_8428809_-	PRK06500, PRK06500, SDR family oxidoreductase	NA|316aa|down_9|NC_021658.1_8429073_8430021_+	COG4977, COG4977, Transcriptional regulator containing an amidase domain and an AraC-type DNA-binding HTH domain [Transcription]
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	32	8722041-8722151	28	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCAGGCCGAGCGCGTGGGCGACAAGGCCGAGCAGCT	36	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|276aa|up_4|NC_021658.1_8715858_8716686_-,NA	NA|284aa|up_9|NC_021658.1_8707378_8708230_-	COG0395, UgpE, ABC-type sugar transport system, permease component [Carbohydrate transport and metabolism]	NA|311aa|up_8|NC_021658.1_8708267_8709200_-	COG1175, UgpA, ABC-type sugar transport systems, permease components [Carbohydrate transport and metabolism]	NA|410aa|up_7|NC_021658.1_8709322_8710552_-	cd14750, PBP2_TMBP, The periplasmic-binding component of ABC transport systems specific for trehalose/maltose; possesses type 2 periplasmic binding fold	NA|427aa|up_6|NC_021658.1_8711899_8713180_+	COG1169, MenF, Isochorismate synthase [Coenzyme metabolism / Secondary metabolites biosynthesis, transport, and catabolism]	NA|723aa|up_5|NC_021658.1_8713364_8715533_+	PRK13566, PRK13566, anthranilate synthase component I	NA|276aa|up_4|NC_021658.1_8715858_8716686_-	NA	NA|451aa|up_3|NC_021658.1_8716847_8718200_+	PRK05370, PRK05370, argininosuccinate synthase; Validated	NA|120aa|up_2|NC_021658.1_8718453_8718813_+	pfam04020, Phage_holin_4_2, Mycobacterial 4 TMS phage holin, superfamily IV	NA|328aa|up_1|NC_021658.1_8718906_8719890_-	cd19086, AKR_AKR11C1, AKR11C family of aldo-keto reductase (AKR)	NA|595aa|up_0|NC_021658.1_8719955_8721740_-	cd03243, ABC_MutS_homologs, ATP-binding cassette domain of MutS homologs	NA|523aa|down_0|NC_021658.1_8723099_8724668_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|270aa|down_1|NC_021658.1_8725619_8726429_-	COG2226, UbiE, Methylase involved in ubiquinone/menaquinone biosynthesis [Coenzyme metabolism]	NA|354aa|down_2|NC_021658.1_8726600_8727662_-	PRK09352, PRK09352, beta-ketoacyl-ACP synthase 3	NA|209aa|down_3|NC_021658.1_8727934_8728561_-	COG0177, Nth, Predicted EndoIII-related endonuclease [DNA replication, recombination, and repair]	NA|249aa|down_4|NC_021658.1_8728569_8729316_-	COG3258, COG3258, Cytochrome c [Energy production and conversion]	NA|412aa|down_5|NC_021658.1_8729312_8730548_-	COG3391, COG3391, Uncharacterized conserved protein [Function unknown]	NA|535aa|down_6|NC_021658.1_8730816_8732421_+	TIGR03767, P_acnes_RR, metallophosphoesterase, PPA1498 family	NA|246aa|down_7|NC_021658.1_8732451_8733189_-	COG2091, Sfp, Phosphopantetheinyl transferase [Coenzyme metabolism]	NA|282aa|down_8|NC_021658.1_8733189_8734035_-	COG1409, Icc, Predicted phosphohydrolases [General function prediction only]	NA|1536aa|down_9|NC_021658.1_8734267_8738875_+	PRK11750, gltB, glutamate synthase subunit alpha; Provisional
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	33	8825266-8825396	29	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	AGCGCTCGGCCCGGTCGGAGCGC	23	1	3	8825289-8825319|8825289-8825319|8825289-8825319	NC_021658.1_3977294-3977324|NC_021658.1_3977303-3977333|NC_021658.1_3977312-3977342	NA	2	2	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|72aa|up_9|NC_021658.1_8811706_8811922_+,NA|335aa|up_3|NC_021658.1_8819845_8820850_+,NA|296aa|up_0|NC_021658.1_8823394_8824282_-,NA|131aa|down_0|NC_021658.1_8827029_8827422_+	NA|72aa|up_9|NC_021658.1_8811706_8811922_+	NA	NA|495aa|up_8|NC_021658.1_8811930_8813415_-	pfam10092, DUF2330, Uncharacterized protein conserved in bacteria (DUF2330)	NA|481aa|up_7|NC_021658.1_8813693_8815136_-	PRK05335, PRK05335, tRNA (uracil-5-)-methyltransferase Gid; Reviewed	NA|866aa|up_6|NC_021658.1_8815142_8817740_-	PRK06599, PRK06599, DNA topoisomerase I; Validated	NA|324aa|up_5|NC_021658.1_8817869_8818841_-	pfam02481, DNA_processg_A, DNA recombination-mediator protein A	NA|283aa|up_4|NC_021658.1_8818917_8819766_-	PRK14951, PRK14951, DNA polymerase III subunits gamma and tau; Provisional	NA|335aa|up_3|NC_021658.1_8819845_8820850_+	NA	NA|268aa|up_2|NC_021658.1_8820846_8821650_+	cd08563, GDPD_TtGDE_like, Glycerophosphodiester phosphodiesterase domain of Thermoanaerobacter tengcongensis and similar proteins	NA|499aa|up_1|NC_021658.1_8821734_8823231_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|296aa|up_0|NC_021658.1_8823394_8824282_-	NA	NA|131aa|down_0|NC_021658.1_8827029_8827422_+	NA	NA|917aa|down_1|NC_021658.1_8827503_8830254_-	PRK00252, alaS, alanyl-tRNA synthetase; Reviewed	NA|280aa|down_2|NC_021658.1_8830445_8831285_-	pfam13646, HEAT_2, HEAT repeats	NA|741aa|down_3|NC_021658.1_8831571_8833794_-	TIGR04551, hypothetical_protein_CAP_1272, TIGR04551 family protein	NA|712aa|down_4|NC_021658.1_8834231_8836367_+	cd07185, OmpA_C-like, Peptidoglycan binding domains similar to the C-terminal domain of outer-membrane protein OmpA	NA|264aa|down_5|NC_021658.1_8836505_8837297_+	COG1360, MotB, Flagellar motor protein [Cell motility and secretion]	NA|517aa|down_6|NC_021658.1_8837836_8839387_+	pfam13191, AAA_16, AAA ATPase domain	NA|188aa|down_7|NC_021658.1_8839450_8840014_-	COG1595, RpoE, DNA-directed RNA polymerase specialized sigma subunit, sigma24 homolog [Transcription]	NA|205aa|down_8|NC_021658.1_8840184_8840799_+	COG2020, STE14, Putative protein-S-isoprenylcysteine methyltransferase [Posttranslational modification, protein turnover, chaperones]	NA|270aa|down_9|NC_021658.1_8843309_8844119_+	pfam18742, DpnII-MboI, REase_DpnII-MboI
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	34	8908357-8908465	30	CRISPRCasFinder	no	csa3	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Type I-A	CGCGCATCGCGGTAGGCGGCGGCCGC	26	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA,NA|99aa|down_1|NC_021658.1_8909508_8909805_+,NA|249aa|down_3|NC_021658.1_8911323_8912070_+,NA|397aa|down_4|NC_021658.1_8912098_8913289_-	NA|139aa|up_9|NC_021658.1_8889241_8889658_+	COG3607, COG3607, Predicted lactoylglutathione lyase [General function prediction only]	NA|211aa|up_8|NC_021658.1_8889816_8890449_+	COG0625, Gst, Glutathione S-transferase [Posttranslational modification, protein turnover, chaperones]	NA|1851aa|up_7|NC_021658.1_8891377_8896930_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	csa3|119aa|up_6|NC_021658.1_8897018_8897375_-	cd00090, HTH_ARSR, Arsenical Resistance Operon Repressor and similar prokaryotic, metal regulated homodimeric repressors	NA|1283aa|up_5|NC_021658.1_8897495_8901344_-	TIGR02956, sensor_protein_TorS, TMAO reductase sytem sensor TorS	NA|176aa|up_4|NC_021658.1_8901645_8902173_-	PRK14997, PRK14997, LysR family transcriptional regulator; Provisional	NA|128aa|up_3|NC_021658.1_8902280_8902664_+	COG4319, COG4319, Ketosteroid isomerase homolog [Function unknown]	NA|492aa|up_2|NC_021658.1_8902705_8904181_-	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|517aa|up_1|NC_021658.1_8904177_8905728_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|564aa|up_0|NC_021658.1_8906029_8907721_+	COG0659, SUL1, Sulfate permease and related transporters (MFS superfamily) [Inorganic ion transport and metabolism]	NA|168aa|down_0|NC_021658.1_8908886_8909390_+	cd07826, SRPBCC_CalC_Aha1-like_9, Putative hydrophobic ligand-binding SRPBCC domain of an uncharacterized subgroup of CalC- and Aha1-like proteins	NA|99aa|down_1|NC_021658.1_8909508_8909805_+	NA	NA|467aa|down_2|NC_021658.1_8909801_8911202_+	pfam13175, AAA_15, AAA ATPase domain	NA|249aa|down_3|NC_021658.1_8911323_8912070_+	NA	NA|397aa|down_4|NC_021658.1_8912098_8913289_-	NA	NA|128aa|down_5|NC_021658.1_8913353_8913737_-	pfam13788, DUF4180, Domain of unknown function (DUF4180)	NA|285aa|down_6|NC_021658.1_8913875_8914730_-	pfam04951, Peptidase_M55, D-aminopeptidase	NA|311aa|down_7|NC_021658.1_8915407_8916340_-	pfam11155, DUF2935, Domain of unknown function (DUF2935)	NA|133aa|down_8|NC_021658.1_8916964_8917363_+	COG3795, COG3795, Uncharacterized protein conserved in bacteria [Function unknown]	NA|421aa|down_9|NC_021658.1_8917359_8918622_+	COG4941, COG4941, Predicted RNA polymerase sigma factor containing a TPR repeat domain [Transcription]
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	35	9128341-9128665	31	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GGCGGCGCCGGCGGCAACGGCGGC	24	0	0	NA	NA	NA	5	5	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|446aa|up_6|NC_021658.1_9111001_9112339_-,NA|372aa|up_5|NC_021658.1_9112340_9113456_-,NA|283aa|up_3|NC_021658.1_9115979_9116828_+,NA|93aa|down_0|NC_021658.1_9129310_9129589_+	NA|263aa|up_9|NC_021658.1_9106951_9107740_-	PRK08317, PRK08317, hypothetical protein; Provisional	NA|437aa|up_8|NC_021658.1_9108260_9109571_-	PRK07003, PRK07003, DNA polymerase III subunit gamma/tau	NA|148aa|up_7|NC_021658.1_9109646_9110090_+	pfam04972, BON, BON domain	NA|446aa|up_6|NC_021658.1_9111001_9112339_-	NA	NA|372aa|up_5|NC_021658.1_9112340_9113456_-	NA	NA|484aa|up_4|NC_021658.1_9113442_9114894_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|283aa|up_3|NC_021658.1_9115979_9116828_+	NA	NA|741aa|up_2|NC_021658.1_9116979_9119202_+	COG2268, COG2268, Uncharacterized protein conserved in bacteria [Function unknown]	NA|464aa|up_1|NC_021658.1_9119507_9120899_-	pfam01082, Cu2_monooxygen, Copper type II ascorbate-dependent monooxygenase, N-terminal domain	NA|537aa|up_0|NC_021658.1_9121307_9122918_-	pfam07586, HXXSHH, Protein of unknown function (DUF1552)	NA|93aa|down_0|NC_021658.1_9129310_9129589_+	NA	NA|724aa|down_1|NC_021658.1_9129783_9131955_+	cd07185, OmpA_C-like, Peptidoglycan binding domains similar to the C-terminal domain of outer-membrane protein OmpA	NA|629aa|down_2|NC_021658.1_9132181_9134068_+	COG1574, COG1574, Predicted metal-dependent hydrolase with the TIM-barrel fold [General function prediction only]	NA|312aa|down_3|NC_021658.1_9134134_9135070_+	pfam04227, Indigoidine_A, Indigoidine synthase A like protein	NA|297aa|down_4|NC_021658.1_9135066_9135957_+	cd01166, KdgK, 2-keto-3-deoxygluconate kinase (KdgK) phosphorylates 2-keto-3-deoxygluconate (KDG) to form 2-keto-3-deoxy-6-phosphogluconate (KDGP)	NA|144aa|down_5|NC_021658.1_9136184_9136616_+	cd04584, CBS_pair_AcuB_like, Two tandem repeats of the cystathionine beta-synthase (CBS pair) domains associated with the ACT domain	NA|331aa|down_6|NC_021658.1_9136612_9137605_-	COG4188, COG4188, Predicted dienelactone hydrolase [General function prediction only]	NA|261aa|down_7|NC_021658.1_9137889_9138672_+	smart00342, HTH_ARAC, helix_turn_helix, arabinose operon control protein	NA|192aa|down_8|NC_021658.1_9138712_9139288_-	TIGR04292, hypothetical_protein_PF0600, heavy-Cys/CGP-CTERM domain protein	NA|599aa|down_9|NC_021658.1_9139806_9141603_+	pfam12708, Pectate_lyase_3, Pectate lyase superfamily protein
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	36	9128740-9128910	32	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GGCGGCGCCGGCGGCAACGGCGGC	24	0	0	NA	NA	NA	3	3	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|446aa|up_6|NC_021658.1_9111001_9112339_-,NA|372aa|up_5|NC_021658.1_9112340_9113456_-,NA|283aa|up_3|NC_021658.1_9115979_9116828_+,NA|93aa|down_0|NC_021658.1_9129310_9129589_+	NA|263aa|up_9|NC_021658.1_9106951_9107740_-	PRK08317, PRK08317, hypothetical protein; Provisional	NA|437aa|up_8|NC_021658.1_9108260_9109571_-	PRK07003, PRK07003, DNA polymerase III subunit gamma/tau	NA|148aa|up_7|NC_021658.1_9109646_9110090_+	pfam04972, BON, BON domain	NA|446aa|up_6|NC_021658.1_9111001_9112339_-	NA	NA|372aa|up_5|NC_021658.1_9112340_9113456_-	NA	NA|484aa|up_4|NC_021658.1_9113442_9114894_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|283aa|up_3|NC_021658.1_9115979_9116828_+	NA	NA|741aa|up_2|NC_021658.1_9116979_9119202_+	COG2268, COG2268, Uncharacterized protein conserved in bacteria [Function unknown]	NA|464aa|up_1|NC_021658.1_9119507_9120899_-	pfam01082, Cu2_monooxygen, Copper type II ascorbate-dependent monooxygenase, N-terminal domain	NA|537aa|up_0|NC_021658.1_9121307_9122918_-	pfam07586, HXXSHH, Protein of unknown function (DUF1552)	NA|93aa|down_0|NC_021658.1_9129310_9129589_+	NA	NA|724aa|down_1|NC_021658.1_9129783_9131955_+	cd07185, OmpA_C-like, Peptidoglycan binding domains similar to the C-terminal domain of outer-membrane protein OmpA	NA|629aa|down_2|NC_021658.1_9132181_9134068_+	COG1574, COG1574, Predicted metal-dependent hydrolase with the TIM-barrel fold [General function prediction only]	NA|312aa|down_3|NC_021658.1_9134134_9135070_+	pfam04227, Indigoidine_A, Indigoidine synthase A like protein	NA|297aa|down_4|NC_021658.1_9135066_9135957_+	cd01166, KdgK, 2-keto-3-deoxygluconate kinase (KdgK) phosphorylates 2-keto-3-deoxygluconate (KDG) to form 2-keto-3-deoxy-6-phosphogluconate (KDGP)	NA|144aa|down_5|NC_021658.1_9136184_9136616_+	cd04584, CBS_pair_AcuB_like, Two tandem repeats of the cystathionine beta-synthase (CBS pair) domains associated with the ACT domain	NA|331aa|down_6|NC_021658.1_9136612_9137605_-	COG4188, COG4188, Predicted dienelactone hydrolase [General function prediction only]	NA|261aa|down_7|NC_021658.1_9137889_9138672_+	smart00342, HTH_ARAC, helix_turn_helix, arabinose operon control protein	NA|192aa|down_8|NC_021658.1_9138712_9139288_-	TIGR04292, hypothetical_protein_PF0600, heavy-Cys/CGP-CTERM domain protein	NA|599aa|down_9|NC_021658.1_9139806_9141603_+	pfam12708, Pectate_lyase_3, Pectate lyase superfamily protein
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	37	9167757-9170662	3,33,7,4	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	TCTCCGCCGCTGAAAGGCGGCGGCCCCATTGAAGC,GCTTCAATGGGGCCGCCGCCTTTCAGCGGCGGAGAG,GCTTCAATGGGGCCGCCGCCTTTCAGCGGCGGAGAG,CTCTCCGCCGCTGAAAGGCGGCGGCCCCATTGAAGC	35,36,36,36	0	0	NA	NA	NA:NA:NA:NA	37,39,39,37	39	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|72aa|up_9|NC_021658.1_9156435_9156651_+,NA|108aa|up_7|NC_021658.1_9159093_9159417_+,NA|189aa|up_6|NC_021658.1_9159707_9160274_+,NA|226aa|up_1|NC_021658.1_9165340_9166018_-,NA|348aa|up_0|NC_021658.1_9166110_9167154_-,NA|264aa|down_0|NC_021658.1_9171278_9172070_+,NA|224aa|down_8|NC_021658.1_9178750_9179422_-	NA|72aa|up_9|NC_021658.1_9156435_9156651_+	NA	NA|723aa|up_8|NC_021658.1_9156664_9158833_+	cd07484, Peptidases_S8_Thermitase_like, Peptidase S8 family domain in Thermitase-like proteins	NA|108aa|up_7|NC_021658.1_9159093_9159417_+	NA	NA|189aa|up_6|NC_021658.1_9159707_9160274_+	NA	NA|534aa|up_5|NC_021658.1_9160367_9161969_-	cd07041, STAS_RsbR_RsbS_like, Sulphate Transporter and Anti-Sigma factor antagonist domain of the "stressosome" complex proteins RsbS and RsbR, regulators of the bacterial stress activated alternative sigma factor sigma-B by phosphorylation	NA|141aa|up_4|NC_021658.1_9162297_9162720_-	pfam08837, DUF1810, Protein of unknown function (DUF1810)	NA|321aa|up_3|NC_021658.1_9162970_9163933_-	cd05292, LDH_2, A subgroup of L-lactate dehydrogenases	NA|403aa|up_2|NC_021658.1_9164083_9165292_-	pfam00924, MS_channel, Mechanosensitive ion channel	NA|226aa|up_1|NC_021658.1_9165340_9166018_-	NA	NA|348aa|up_0|NC_021658.1_9166110_9167154_-	NA	NA|264aa|down_0|NC_021658.1_9171278_9172070_+	NA	NA|149aa|down_1|NC_021658.1_9172173_9172620_+	COG1832, COG1832, Predicted CoA-binding protein [General function prediction only]	NA|388aa|down_2|NC_021658.1_9172672_9173836_+	COG4637, COG4637, Predicted ATPase [General function prediction only]	NA|141aa|down_3|NC_021658.1_9173920_9174343_-	TIGR04366, hypothetical_protein, cupin fold metalloprotein, WbuC family	NA|343aa|down_4|NC_021658.1_9174586_9175615_+	TIGR04470, hypothetical_protein_ALIPUT_00462, radical SAM mobile pair protein B	NA|260aa|down_5|NC_021658.1_9175754_9176534_+	COG5000, NtrY, Signal transduction histidine kinase involved in nitrogen fixation and metabolism regulation [Signal transduction mechanisms]	NA|153aa|down_6|NC_021658.1_9176559_9177018_+	cd07176, terB, tellurite resistance protein terB	NA|481aa|down_7|NC_021658.1_9177142_9178585_-	COG1293, COG1293, Predicted RNA-binding protein homologous to eukaryotic snRNP [Transcription]	NA|224aa|down_8|NC_021658.1_9178750_9179422_-	NA	NA|248aa|down_9|NC_021658.1_9179539_9180283_+	pfam03781, FGE-sulfatase, Sulfatase-modifying factor enzyme 1
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	38	9285648-9285732	34	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCTGACGTGGTTCAGAGATTAGGGGGGAGG	30	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|216aa|up_9|NC_021658.1_9268510_9269158_+,NA|135aa|up_8|NC_021658.1_9271530_9271935_-,NA|274aa|up_5|NC_021658.1_9274781_9275603_+,NA|306aa|up_4|NC_021658.1_9276004_9276922_-,NA|78aa|down_7|NC_021658.1_9301999_9302233_+	NA|216aa|up_9|NC_021658.1_9268510_9269158_+	NA	NA|135aa|up_8|NC_021658.1_9271530_9271935_-	NA	NA|313aa|up_7|NC_021658.1_9271873_9272812_-	cd10283, MnuA_DNase1-like, Mycoplasma pulmonis MnuA nuclease-like	NA|381aa|up_6|NC_021658.1_9273267_9274410_-	COG4637, COG4637, Predicted ATPase [General function prediction only]	NA|274aa|up_5|NC_021658.1_9274781_9275603_+	NA	NA|306aa|up_4|NC_021658.1_9276004_9276922_-	NA	NA|1293aa|up_3|NC_021658.1_9277095_9280974_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|522aa|up_2|NC_021658.1_9281152_9282718_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|260aa|up_1|NC_021658.1_9282770_9283550_-	COG4798, COG4798, Predicted methyltransferase [General function prediction only]	NA|513aa|up_0|NC_021658.1_9283991_9285530_+	PRK00260, cysS, cysteinyl-tRNA synthetase; Validated	NA|833aa|down_0|NC_021658.1_9286248_9288747_+	pfam13385, Laminin_G_3, Concanavalin A-like lectin/glucanases superfamily	NA|272aa|down_1|NC_021658.1_9289122_9289938_-	pfam00797, Acetyltransf_2, N-acetyltransferase	NA|1985aa|down_2|NC_021658.1_9290370_9296325_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|357aa|down_3|NC_021658.1_9296514_9297585_-	COG2805, PilT, Tfp pilus assembly protein, pilus retraction ATPase PilT [Cell motility and secretion / Intracellular trafficking and secretion]	NA|513aa|down_4|NC_021658.1_9297586_9299125_-	COG2805, PilT, Tfp pilus assembly protein, pilus retraction ATPase PilT [Cell motility and secretion / Intracellular trafficking and secretion]	NA|177aa|down_5|NC_021658.1_9299768_9300299_-	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|262aa|down_6|NC_021658.1_9301167_9301953_+	cd02440, AdoMet_MTases, S-adenosylmethionine-dependent methyltransferases (SAM or AdoMet-MTase), class I;  AdoMet-MTases are enzymes that use S-adenosyl-L-methionine (SAM or AdoMet) as a substrate for methyltransfer, creating the product S-adenosyl-L-homocysteine (AdoHcy)	NA|78aa|down_7|NC_021658.1_9301999_9302233_+	NA	NA|1505aa|down_8|NC_021658.1_9302901_9307416_+	cd11020, CuRO_1_CuNIR, Cupredoxin domain 1 of Copper-containing nitrite reductase	NA|609aa|down_9|NC_021658.1_9312265_9314092_+	TIGR03866, PQQ_ABC_repeats, PQQ-dependent catabolism-associated beta-propeller protein
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	39	9375468-9375594	35	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCGCTCCCCCCGAAAGCGCCGCTGCCGC	28	2	3	9375496-9375521|9375550-9375566|9375550-9375566	NC_021658.1_9375577-9375602|NC_021658.1_9387721-9387705|NC_021658.1_9825515-9825531	NA	2	2	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|152aa|up_7|NC_021658.1_9363495_9363951_+,NA|145aa|up_3|NC_021658.1_9372336_9372771_+,NA|52aa|up_2|NC_021658.1_9372816_9372972_-,NA	NA|401aa|up_9|NC_021658.1_9361074_9362277_+	COG2124, CypX, Cytochrome P450 [Secondary metabolites biosynthesis, transport, and catabolism]	NA|312aa|up_8|NC_021658.1_9362386_9363322_-	cd08422, PBP2_CrgA_like, The C-terminal substrate binding domain of LysR-type transcriptional regulator CrgA and its related homologs, contains the type 2 periplasmic binding domain	NA|152aa|up_7|NC_021658.1_9363495_9363951_+	NA	NA|497aa|up_6|NC_021658.1_9364024_9365515_-	PHA00370, III, attachment protein	NA|1803aa|up_5|NC_021658.1_9366071_9371480_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|166aa|up_4|NC_021658.1_9371494_9371992_+	pfam00072, Response_reg, Response regulator receiver domain	NA|145aa|up_3|NC_021658.1_9372336_9372771_+	NA	NA|52aa|up_2|NC_021658.1_9372816_9372972_-	NA	NA|210aa|up_1|NC_021658.1_9372952_9373582_+	COG0664, Crp, cAMP-binding proteins - catabolite gene activator and regulatory subunit of cAMP-dependent protein kinases [Signal transduction mechanisms]	NA|325aa|up_0|NC_021658.1_9373615_9374590_+	cd03141, GATase1_Hsp31_like, Type 1 glutamine amidotransferase (GATase1)-like domain found in proteins similar to Escherichia coli Hsp31 protein	NA|68aa|down_0|NC_021658.1_9375817_9376021_-	PRK09478, mglC, galactose/methyl galactoside ABC transporter permease MglC	NA|215aa|down_1|NC_021658.1_9376165_9376810_+	COG0322, UvrC, Nuclease subunit of the excinuclease complex [DNA replication, recombination, and repair]	NA|570aa|down_2|NC_021658.1_9377002_9378712_+	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|369aa|down_3|NC_021658.1_9378892_9379999_+	cd02253, DmpA, L-Aminopeptidase D-amidase/D-esterase (DmpA) family; DmpA catalyzes the release of N-terminal D and L amino acids from peptide susbtrates	NA|1997aa|down_4|NC_021658.1_9380421_9386412_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|220aa|down_5|NC_021658.1_9386557_9387217_-	pfam00300, His_Phos_1, Histidine phosphatase superfamily (branch 1)	NA|474aa|down_6|NC_021658.1_9387474_9388896_+	COG2133, COG2133, Glucose/sorbosone dehydrogenases [Carbohydrate transport and metabolism]	NA|435aa|down_7|NC_021658.1_9388864_9390169_-	cd17485, MFS_MFSD3, Major facilitator superfamily domain containing 3 protein	NA|211aa|down_8|NC_021658.1_9390168_9390801_-	PRK00767, PRK00767, transcriptional regulator BetI; Validated	NA|198aa|down_9|NC_021658.1_9390976_9391570_+	PHA00370, III, attachment protein
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	40	9436281-9436463	5	PILER-CR	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GTCGAGCGTGCCGTCGCCGTT	21	0	0	NA	NA	NA	2	2	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|89aa|up_7|NC_021658.1_9427875_9428142_+,NA|124aa|up_6|NC_021658.1_9428580_9428952_-,NA|90aa|up_5|NC_021658.1_9429038_9429308_-,NA|374aa|up_4|NC_021658.1_9429858_9430980_-,NA|371aa|up_3|NC_021658.1_9431100_9432213_-,NA|248aa|up_0|NC_021658.1_9434980_9435724_+,NA	NA|939aa|up_9|NC_021658.1_9420874_9423691_+	cd02080, P-type_ATPase_cation, P-type cation-transporting ATPase similar to Exiguobacterium aurantiacum Mna, an Na(+)-ATPase, and Synechocystis sp	NA|658aa|up_8|NC_021658.1_9423916_9425890_+	cd09619, CBM9_like_4, DOMON-like type 9 carbohydrate binding module	NA|89aa|up_7|NC_021658.1_9427875_9428142_+	NA	NA|124aa|up_6|NC_021658.1_9428580_9428952_-	NA	NA|90aa|up_5|NC_021658.1_9429038_9429308_-	NA	NA|374aa|up_4|NC_021658.1_9429858_9430980_-	NA	NA|371aa|up_3|NC_021658.1_9431100_9432213_-	NA	NA|350aa|up_2|NC_021658.1_9432243_9433293_-	sd00006, TPR, Tetratricopeptide repeat	NA|489aa|up_1|NC_021658.1_9433321_9434788_+	TIGR02937, RNA_polymerase_sigma_factor, RNA polymerase sigma factor, sigma-70 family	NA|248aa|up_0|NC_021658.1_9434980_9435724_+	NA	NA|675aa|down_0|NC_021658.1_9438114_9440139_-	cd00054, EGF_CA, Calcium-binding EGF-like domain, present in a large number of membrane-bound and extracellular (mostly animal) proteins	NA|789aa|down_1|NC_021658.1_9440780_9443147_-	pfam13191, AAA_16, AAA ATPase domain	NA|423aa|down_2|NC_021658.1_9443158_9444427_-	pfam01637, ATPase_2, ATPase domain predominantly from Archaea	NA|325aa|down_3|NC_021658.1_9444511_9445486_-	cd05300, 2-Hacid_dh_1, Putative D-isomer specific 2-hydroxyacid dehydrogenase	NA|262aa|down_4|NC_021658.1_9445497_9446283_-	cd19105, AKR_unchar, uncharacterized aldo-keto reductase (AKR) superfamily protein	NA|308aa|down_5|NC_021658.1_9446304_9447228_-	cd04301, NAT_SF, N-Acyltransferase superfamily: Various enzymes that characteristically catalyze the transfer of an acyl group to a substrate	NA|595aa|down_6|NC_021658.1_9447382_9449167_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|276aa|down_7|NC_021658.1_9449276_9450104_+	cd03293, ABC_NrtD_SsuB_transporters, ATP-binding cassette domain of the nitrate and sulfonate transporters	NA|82aa|down_8|NC_021658.1_9450234_9450480_+	pfam10047, DUF2281, Protein of unknown function (DUF2281)	NA|1091aa|down_9|NC_021658.1_9450677_9453950_+	pfam07705, CARDB, CARDB
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	41	9547647-9547787	36	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCCTCTCCCGGCGCCCACGTCGCGCTC	27	0	0	NA	NA	NA	2	2	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|492aa|up_6|NC_021658.1_9539097_9540573_+,NA|181aa|up_4|NC_021658.1_9541298_9541841_+,NA|76aa|up_3|NC_021658.1_9542135_9542363_+,NA|128aa|up_2|NC_021658.1_9543173_9543557_+,NA|182aa|up_1|NC_021658.1_9545009_9545555_+,NA|109aa|up_0|NC_021658.1_9545736_9546063_-,NA|253aa|down_0|NC_021658.1_9549055_9549814_-,NA|86aa|down_1|NC_021658.1_9550133_9550391_+	NA|103aa|up_9|NC_021658.1_9536219_9536528_-	COG1143, NuoI, Formate hydrogenlyase subunit 6/NADH:ubiquinone oxidoreductase 23 kD subunit (chain I) [Energy production and conversion]	NA|506aa|up_8|NC_021658.1_9536594_9538112_+	COG3604, FhlA, Transcriptional regulator containing GAF, AAA-type ATPase, and DNA binding domains [Transcription / Signal transduction mechanisms]	NA|309aa|up_7|NC_021658.1_9538167_9539094_-	COG3315, COG3315, O-Methyltransferase involved in polyketide biosynthesis [Secondary metabolites biosynthesis, transport, and catabolism]	NA|492aa|up_6|NC_021658.1_9539097_9540573_+	NA	NA|180aa|up_5|NC_021658.1_9540760_9541300_-	PRK14965, PRK14965, DNA polymerase III subunits gamma and tau; Provisional	NA|181aa|up_4|NC_021658.1_9541298_9541841_+	NA	NA|76aa|up_3|NC_021658.1_9542135_9542363_+	NA	NA|128aa|up_2|NC_021658.1_9543173_9543557_+	NA	NA|182aa|up_1|NC_021658.1_9545009_9545555_+	NA	NA|109aa|up_0|NC_021658.1_9545736_9546063_-	NA	NA|253aa|down_0|NC_021658.1_9549055_9549814_-	NA	NA|86aa|down_1|NC_021658.1_9550133_9550391_+	NA	NA|436aa|down_2|NC_021658.1_9552874_9554182_+	cd06828, PLPDE_III_DapDC, Type III Pyridoxal 5-phosphate (PLP)-Dependent Enzyme Diaminopimelate Decarboxylase	NA|192aa|down_3|NC_021658.1_9554261_9554837_-	smart00157, PRP, Major prion protein	NA|123aa|down_4|NC_021658.1_9555106_9555475_+	cd07245, VOC_like, uncharacterized subfamily of vicinal oxygen chelate (VOC) family	NA|924aa|down_5|NC_021658.1_9556734_9559506_-	TIGR03866, PQQ_ABC_repeats, PQQ-dependent catabolism-associated beta-propeller protein	NA|351aa|down_6|NC_021658.1_9559641_9560694_-	COG0842, COG0842, ABC-type multidrug transport system, permease component [Defense mechanisms]	NA|315aa|down_7|NC_021658.1_9560693_9561638_-	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|590aa|down_8|NC_021658.1_9561962_9563732_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|462aa|down_9|NC_021658.1_9563737_9565123_+	sd00008, TPR_YbbN, C-terminal Tetratricopeptide repeat (TPR) region of YbbN and similar motifs
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	42	9815196-9815386	37	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CTGGCTCGGGCGGCGCGAGCGCAGGGGCAGGCTCCGGCGAGGGCGGG	47	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|381aa|up_7|NC_021658.1_9796530_9797673_+,NA|510aa|up_4|NC_021658.1_9802656_9804186_+,NA|198aa|down_2|NC_021658.1_9819082_9819676_+,NA|298aa|down_5|NC_021658.1_9821241_9822135_+,NA|135aa|down_9|NC_021658.1_9827782_9828187_-	NA|213aa|up_9|NC_021658.1_9793786_9794425_-	COG3577, COG3577, Predicted aspartyl protease [General function prediction only]	NA|562aa|up_8|NC_021658.1_9794440_9796126_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|381aa|up_7|NC_021658.1_9796530_9797673_+	NA	NA|615aa|up_6|NC_021658.1_9797889_9799734_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|885aa|up_5|NC_021658.1_9799993_9802648_+	cd01347, ligand_gated_channel, TonB dependent/Ligand-Gated channels are created by a monomeric 22 strand (22,24) anti-parallel beta-barrel	NA|510aa|up_4|NC_021658.1_9802656_9804186_+	NA	NA|1214aa|up_3|NC_021658.1_9804313_9807955_+	cd07484, Peptidases_S8_Thermitase_like, Peptidase S8 family domain in Thermitase-like proteins	NA|593aa|up_2|NC_021658.1_9808058_9809837_-	pfam13229, Beta_helix, Right handed beta helix region	NA|805aa|up_1|NC_021658.1_9810425_9812840_-	pfam15902, Sortilin-Vps10, Sortilin, neurotensin receptor 3,	NA|465aa|up_0|NC_021658.1_9813577_9814972_+	smart00656, Amb_all, Amb_all domain	NA|365aa|down_0|NC_021658.1_9815389_9816484_+	pfam09492, Pec_lyase, Pectic acid lyase	NA|542aa|down_1|NC_021658.1_9816581_9818207_+	cd09002, GH43_XYL-like, Glycosyl hydrolase family 43, beta-D-xylosidase (uncharacterized)	NA|198aa|down_2|NC_021658.1_9819082_9819676_+	NA	NA|199aa|down_3|NC_021658.1_9819749_9820346_+	TIGR02937, RNA_polymerase_sigma_factor, RNA polymerase sigma factor, sigma-70 family	NA|260aa|down_4|NC_021658.1_9820395_9821175_+	PRK07003, PRK07003, DNA polymerase III subunit gamma/tau	NA|298aa|down_5|NC_021658.1_9821241_9822135_+	NA	NA|594aa|down_6|NC_021658.1_9822458_9824240_+	COG3591, COG3591, V8-like Glu-specific endopeptidase [Amino acid transport and metabolism]	NA|501aa|down_7|NC_021658.1_9824294_9825797_-	PTZ00146, PTZ00146, fibrillarin; Provisional	NA|454aa|down_8|NC_021658.1_9826034_9827396_-	cd00796, INT_Rci_Hp1_C, Shufflon-specific DNA recombinase Rci and Bacteriophage Hp1_like integrase, C-terminal catalytic domain	NA|135aa|down_9|NC_021658.1_9827782_9828187_-	NA
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	43	9915030-9915102	38	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CGCGCTCGTCCAGCGCGCGCCGC	23	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|102aa|up_8|NC_021658.1_9906313_9906619_+,NA|748aa|up_1|NC_021658.1_9912039_9914283_+,NA|387aa|down_0|NC_021658.1_9915153_9916314_-,NA|148aa|down_4|NC_021658.1_9919409_9919853_-	NA|287aa|up_9|NC_021658.1_9905304_9906165_+	cd01990, Alpha_ANH_like_I, This is a subfamily of Adenine nucleotide alpha hydrolases superfamily	NA|102aa|up_8|NC_021658.1_9906313_9906619_+	NA	NA|204aa|up_7|NC_021658.1_9906584_9907196_-	pfam11645, PDDEXK_5, PD-(D/E)XK endonuclease	NA|148aa|up_6|NC_021658.1_9907202_9907646_+	PTZ00436, PTZ00436, 60S ribosomal protein L19-like protein; Provisional	NA|282aa|up_5|NC_021658.1_9907653_9908499_-	pfam03618, Kinase-PPPase, Kinase/pyrophosphorylase	NA|367aa|up_4|NC_021658.1_9908599_9909700_-	PRK10767, PRK10767, chaperone protein DnaJ; Provisional	NA|585aa|up_3|NC_021658.1_9909752_9911507_-	cd17631, FACL_FadD13-like, fatty acyl-CoA synthetase, including FadD13	NA|135aa|up_2|NC_021658.1_9911555_9911960_+	TIGR02266, gmx_TIGR02266, Myxococcus xanthus paralogous domain TIGR02266	NA|748aa|up_1|NC_021658.1_9912039_9914283_+	NA	NA|188aa|up_0|NC_021658.1_9914448_9915012_+	cd12108, Hr-like, Hemerythrin-like domain	NA|387aa|down_0|NC_021658.1_9915153_9916314_-	NA	NA|102aa|down_1|NC_021658.1_9916387_9916693_+	pfam07238, PilZ, PilZ domain	NA|455aa|down_2|NC_021658.1_9916745_9918110_-	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|319aa|down_3|NC_021658.1_9918106_9919063_-	PRK12518, PRK12518, RNA polymerase sigma factor; Provisional	NA|148aa|down_4|NC_021658.1_9919409_9919853_-	NA	NA|284aa|down_5|NC_021658.1_9919897_9920749_+	cd09009, PNP-EcPNPII_like, purine nucleoside phosphorylases similar to human PNP and Escherichia coli PNP-II (XapA)	NA|154aa|down_6|NC_021658.1_9920745_9921207_+	TIGR01354, Cytidine_deaminase, cytidine deaminase, homotetrameric	NA|1063aa|down_7|NC_021658.1_9921246_9924435_-	TIGR02168, Chromosome_partition_protein_Smc, chromosome segregation protein SMC, common bacterial type	NA|390aa|down_8|NC_021658.1_9924638_9925808_-	TIGR02483, ATP-dependent_6-phosphofructokinase_1, phosphofructokinase	NA|495aa|down_9|NC_021658.1_9927369_9928854_-	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	44	9972876-9972953	39	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCCGAGCAGCGCCTCGCCGGGCTC	24	1	1	9972900-9972929	NC_021658.1_884978-885007	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|353aa|up_7|NC_021658.1_9965167_9966226_-,NA|220aa|up_1|NC_021658.1_9970495_9971155_+,NA|203aa|up_0|NC_021658.1_9971253_9971862_+,NA|289aa|down_1|NC_021658.1_9974455_9975322_-,NA|68aa|down_2|NC_021658.1_9976613_9976817_+	NA|123aa|up_9|NC_021658.1_9963843_9964212_+	cd07311, terB_like_1, tellurium resistance terB-like protein, subgroup 1	NA|110aa|up_8|NC_021658.1_9964753_9965083_-	PRK09209, PRK09209, ribonucleoside-diphosphate reductase subunit alpha	NA|353aa|up_7|NC_021658.1_9965167_9966226_-	NA	NA|209aa|up_6|NC_021658.1_9966301_9966928_-	pfam04002, RadC, RadC-like JAB domain	NA|217aa|up_5|NC_021658.1_9966924_9967575_-	TIGR02937, RNA_polymerase_sigma_factor, RNA polymerase sigma factor, sigma-70 family	NA|94aa|up_4|NC_021658.1_9967739_9968021_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|112aa|up_3|NC_021658.1_9968358_9968694_-	TIGR02249, Integrase/recombinase_E2_protein	NA|358aa|up_2|NC_021658.1_9969131_9970205_+	pfam18739, HEPN_Apea, Apea-like HEPN	NA|220aa|up_1|NC_021658.1_9970495_9971155_+	NA	NA|203aa|up_0|NC_021658.1_9971253_9971862_+	NA	NA|288aa|down_0|NC_021658.1_9973439_9974303_+	cd09276, Rnase_HI_RT_non_LTR, non-LTR RNase HI domain of reverse transcriptases	NA|289aa|down_1|NC_021658.1_9974455_9975322_-	NA	NA|68aa|down_2|NC_021658.1_9976613_9976817_+	NA	NA|310aa|down_3|NC_021658.1_9976817_9977747_-	COG1319, CoxM, Aerobic-type carbon monoxide dehydrogenase, middle subunit CoxM/CutM homologs [Energy production and conversion]	NA|161aa|down_4|NC_021658.1_9977743_9978226_-	COG2080, CoxS, Aerobic-type carbon monoxide dehydrogenase, small subunit CoxS/CutS homologs [Energy production and conversion]	NA|778aa|down_5|NC_021658.1_9978222_9980556_-	pfam02738, Ald_Xan_dh_C2, Molybdopterin-binding domain of aldehyde dehydrogenase	NA|213aa|down_6|NC_021658.1_9980670_9981309_-	pfam12804, NTP_transf_3, MobA-like NTP transferase domain	NA|321aa|down_7|NC_021658.1_9981305_9982268_-	COG1975, XdhC, Xanthine and CO dehydrogenases maturation factor, XdhC/CoxF family [Posttranslational modification, protein turnover, chaperones]	NA|1609aa|down_8|NC_021658.1_9982518_9987345_+	COG3950, COG3950, Predicted ATP-binding protein involved in virulence [General function prediction only]	NA|290aa|down_9|NC_021658.1_9987341_9988211_+	TIGR02646, Hypothetical_protein_SMc04429, TIGR02646 family protein
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	45	10062088-10062489	8	CRT	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	TGCCTCGTCCAGACCGTTTCCGGT	24	2	3	10062112-10062129|10062112-10062129|10062238-10062255	NC_021658.1_10113370-10113353|NC_021658.1_13449784-13449801|NC_021658.1_3144037-3144054	NA	9	9	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|161aa|up_2|NC_021658.1_10061042_10061525_+,NA|106aa|up_1|NC_021658.1_10061530_10061848_+,NA|181aa|down_1|NC_021658.1_10064247_10064790_-,NA|258aa|down_6|NC_021658.1_10069494_10070268_+,NA|245aa|down_8|NC_021658.1_10071601_10072336_-,NA|477aa|down_9|NC_021658.1_10072467_10073898_+	NA|261aa|up_9|NC_021658.1_10051241_10052024_-	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|206aa|up_8|NC_021658.1_10052573_10053191_+	PRK12513, PRK12513, RNA polymerase sigma factor; Provisional	NA|337aa|up_7|NC_021658.1_10053210_10054221_+	PRK07003, PRK07003, DNA polymerase III subunit gamma/tau	NA|166aa|up_6|NC_021658.1_10054249_10054747_-	TIGR02266, gmx_TIGR02266, Myxococcus xanthus paralogous domain TIGR02266	NA|796aa|up_5|NC_021658.1_10054876_10057264_-	COG1807, ArnT, 4-amino-4-deoxy-L-arabinose transferase and related glycosyltransferases of PMT family [Cell envelope biogenesis, outer membrane]	NA|318aa|up_4|NC_021658.1_10058215_10059169_+	PRK00089, era, GTPase Era; Reviewed	NA|594aa|up_3|NC_021658.1_10059165_10060947_+	PRK00093, PRK00093, GTP-binding protein Der; Reviewed	NA|161aa|up_2|NC_021658.1_10061042_10061525_+	NA	NA|106aa|up_1|NC_021658.1_10061530_10061848_+	NA	NA|73aa|up_0|NC_021658.1_10061844_10062063_+	PRK00093, PRK00093, GTP-binding protein Der; Reviewed	NA|408aa|down_0|NC_021658.1_10062852_10064076_-	COG0003, ArsA, Predicted ATPase involved in chromosome partitioning [Cell division and chromosome partitioning]	NA|181aa|down_1|NC_021658.1_10064247_10064790_-	NA	NA|245aa|down_2|NC_021658.1_10064861_10065596_+	COG4464, CapC, Capsular polysaccharide biosynthesis protein [Carbohydrate transport and metabolism / Cell envelope biogenesis, outer membrane]	NA|455aa|down_3|NC_021658.1_10065647_10067012_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|393aa|down_4|NC_021658.1_10067390_10068569_+	PRK09354, recA, recombinase A; Provisional	NA|168aa|down_5|NC_021658.1_10068586_10069090_+	COG2062, SixA, Phosphohistidine phosphatase SixA [Signal transduction mechanisms]	NA|258aa|down_6|NC_021658.1_10069494_10070268_+	NA	NA|329aa|down_7|NC_021658.1_10070441_10071428_+	TIGR02692, putative_tRNA_nucleotidyltransferase, tRNA adenylyltransferase	NA|245aa|down_8|NC_021658.1_10071601_10072336_-	NA	NA|477aa|down_9|NC_021658.1_10072467_10073898_+	NA
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	46	10090674-10090773	40	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GGCGCGCCCGGCGCGGCCGTCTCCG	25	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|182aa|up_1|NC_021658.1_10088739_10089285_-,NA|135aa|down_1|NC_021658.1_10095322_10095727_+,NA|309aa|down_2|NC_021658.1_10096598_10097525_+,NA|118aa|down_3|NC_021658.1_10097691_10098045_-,NA|408aa|down_9|NC_021658.1_10102761_10103985_-	NA|363aa|up_9|NC_021658.1_10079084_10080173_-	pfam14907, NTP_transf_5, Uncharacterized nucleotidyltransferase	NA|469aa|up_8|NC_021658.1_10080325_10081732_+	cd07100, ALDH_SSADH1_GabD1, Mycobacterium tuberculosis succinate-semialdehyde dehydrogenase 1-like	NA|125aa|up_7|NC_021658.1_10081750_10082125_+	pfam08818, DUF1801, Domain of unknown function (DU1801)	NA|809aa|up_6|NC_021658.1_10082167_10084594_-	cd06314, PBP1_tmGBP, periplasmic sugar-binding domain of Thermotoga maritima glucose-binding protein (tmGBP) and its close homologs	NA|326aa|up_5|NC_021658.1_10084731_10085709_+	COG0179, MhpD, 2-keto-4-pentenoate hydratase/2-oxohepta-3-ene-1,7-dioic acid hydratase (catechol pathway) [Secondary metabolites biosynthesis, transport, and catabolism]	NA|224aa|up_4|NC_021658.1_10085705_10086377_+	TIGR01262, Maleylacetoacetate_isomerase, maleylacetoacetate isomerase	NA|384aa|up_3|NC_021658.1_10086415_10087567_+	TIGR01263, 4-hydroxyphenylpyruvate_dioxygenase, 4-hydroxyphenylpyruvate dioxygenase	NA|387aa|up_2|NC_021658.1_10087566_10088727_+	COG3508, HmgA, Homogentisate 1,2-dioxygenase [Secondary metabolites biosynthesis, transport, and catabolism]	NA|182aa|up_1|NC_021658.1_10088739_10089285_-	NA	NA|368aa|up_0|NC_021658.1_10089299_10090403_-	pfam01916, DS, Deoxyhypusine synthase	NA|358aa|down_0|NC_021658.1_10093846_10094920_-	pfam01904, DUF72, Protein of unknown function DUF72	NA|135aa|down_1|NC_021658.1_10095322_10095727_+	NA	NA|309aa|down_2|NC_021658.1_10096598_10097525_+	NA	NA|118aa|down_3|NC_021658.1_10097691_10098045_-	NA	NA|130aa|down_4|NC_021658.1_10098332_10098722_-	cd12399, RRM_HP0827_like, RNA recognition motif in Helicobacter pylori HP0827 protein and similar proteins	NA|95aa|down_5|NC_021658.1_10099234_10099519_+	pfam07883, Cupin_2, Cupin domain	NA|307aa|down_6|NC_021658.1_10099500_10100421_-	PRK00281, PRK00281, undecaprenyl-diphosphate phosphatase	NA|455aa|down_7|NC_021658.1_10100472_10101837_-	COG1075, LipA, Predicted acetyltransferases and hydrolases with the alpha/beta hydrolase fold [General function prediction only]	NA|252aa|down_8|NC_021658.1_10102009_10102765_-	cd00657, Ferritin_like, Ferritin-like superfamily of diiron-containing four-helix-bundle proteins	NA|408aa|down_9|NC_021658.1_10102761_10103985_-	NA
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	47	10090890-10091091	41	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GGCGCGCCCGGCGCGGCCGTCTCCG	25	0	0	NA	NA	NA	3	3	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|182aa|up_1|NC_021658.1_10088739_10089285_-,NA|135aa|down_1|NC_021658.1_10095322_10095727_+,NA|309aa|down_2|NC_021658.1_10096598_10097525_+,NA|118aa|down_3|NC_021658.1_10097691_10098045_-,NA|408aa|down_9|NC_021658.1_10102761_10103985_-	NA|363aa|up_9|NC_021658.1_10079084_10080173_-	pfam14907, NTP_transf_5, Uncharacterized nucleotidyltransferase	NA|469aa|up_8|NC_021658.1_10080325_10081732_+	cd07100, ALDH_SSADH1_GabD1, Mycobacterium tuberculosis succinate-semialdehyde dehydrogenase 1-like	NA|125aa|up_7|NC_021658.1_10081750_10082125_+	pfam08818, DUF1801, Domain of unknown function (DU1801)	NA|809aa|up_6|NC_021658.1_10082167_10084594_-	cd06314, PBP1_tmGBP, periplasmic sugar-binding domain of Thermotoga maritima glucose-binding protein (tmGBP) and its close homologs	NA|326aa|up_5|NC_021658.1_10084731_10085709_+	COG0179, MhpD, 2-keto-4-pentenoate hydratase/2-oxohepta-3-ene-1,7-dioic acid hydratase (catechol pathway) [Secondary metabolites biosynthesis, transport, and catabolism]	NA|224aa|up_4|NC_021658.1_10085705_10086377_+	TIGR01262, Maleylacetoacetate_isomerase, maleylacetoacetate isomerase	NA|384aa|up_3|NC_021658.1_10086415_10087567_+	TIGR01263, 4-hydroxyphenylpyruvate_dioxygenase, 4-hydroxyphenylpyruvate dioxygenase	NA|387aa|up_2|NC_021658.1_10087566_10088727_+	COG3508, HmgA, Homogentisate 1,2-dioxygenase [Secondary metabolites biosynthesis, transport, and catabolism]	NA|182aa|up_1|NC_021658.1_10088739_10089285_-	NA	NA|368aa|up_0|NC_021658.1_10089299_10090403_-	pfam01916, DS, Deoxyhypusine synthase	NA|358aa|down_0|NC_021658.1_10093846_10094920_-	pfam01904, DUF72, Protein of unknown function DUF72	NA|135aa|down_1|NC_021658.1_10095322_10095727_+	NA	NA|309aa|down_2|NC_021658.1_10096598_10097525_+	NA	NA|118aa|down_3|NC_021658.1_10097691_10098045_-	NA	NA|130aa|down_4|NC_021658.1_10098332_10098722_-	cd12399, RRM_HP0827_like, RNA recognition motif in Helicobacter pylori HP0827 protein and similar proteins	NA|95aa|down_5|NC_021658.1_10099234_10099519_+	pfam07883, Cupin_2, Cupin domain	NA|307aa|down_6|NC_021658.1_10099500_10100421_-	PRK00281, PRK00281, undecaprenyl-diphosphate phosphatase	NA|455aa|down_7|NC_021658.1_10100472_10101837_-	COG1075, LipA, Predicted acetyltransferases and hydrolases with the alpha/beta hydrolase fold [General function prediction only]	NA|252aa|down_8|NC_021658.1_10102009_10102765_-	cd00657, Ferritin_like, Ferritin-like superfamily of diiron-containing four-helix-bundle proteins	NA|408aa|down_9|NC_021658.1_10102761_10103985_-	NA
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	48	10333320-10333398	42	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCGCCGTCAGGCGACCCGGAGCCCC	25	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|423aa|up_9|NC_021658.1_10321783_10323052_-,NA|271aa|up_7|NC_021658.1_10324286_10325099_-,NA|50aa|up_6|NC_021658.1_10325331_10325481_+,NA|71aa|up_5|NC_021658.1_10326048_10326261_+,NA	NA|423aa|up_9|NC_021658.1_10321783_10323052_-	NA	NA|41aa|up_8|NC_021658.1_10323155_10323278_-	COG0606, COG0606, Predicted ATPase with chaperone activity [Posttranslational modification, protein turnover, chaperones]	NA|271aa|up_7|NC_021658.1_10324286_10325099_-	NA	NA|50aa|up_6|NC_021658.1_10325331_10325481_+	NA	NA|71aa|up_5|NC_021658.1_10326048_10326261_+	NA	NA|456aa|up_4|NC_021658.1_10326288_10327656_+	PRK00451, PRK00451, aminomethyl-transferring glycine dehydrogenase subunit GcvPA	NA|494aa|up_3|NC_021658.1_10327652_10329134_+	PRK04366, PRK04366, aminomethyl-transferring glycine dehydrogenase subunit GcvPB	NA|343aa|up_2|NC_021658.1_10329235_10330264_-	cd02197, HypE, HypE (Hydrogenase expression/formation protein)	NA|370aa|up_1|NC_021658.1_10330260_10331370_-	PRK15062, PRK15062, hydrogenase isoenzymes formation protein HypD; Provisional	NA|85aa|up_0|NC_021658.1_10331366_10331621_-	pfam01455, HupF_HypC, HupF/HypC family	NA|114aa|down_0|NC_021658.1_10334001_10334343_-	pfam01155, HypA, Hydrogenase/urease nickel incorporation, metallochaperone, hypA	NA|151aa|down_1|NC_021658.1_10334347_10334800_-	cd00518, H2MP, Hydrogenase specific C-terminal endopeptidases, also called Hydrogen Maturation Proteases (H2MP)	NA|437aa|down_2|NC_021658.1_10334796_10336107_-	COG3259, FrhA, Coenzyme F420-reducing hydrogenase, alpha subunit [Energy production and conversion]	NA|259aa|down_3|NC_021658.1_10336096_10336873_-	COG1941, FrhG, Coenzyme F420-reducing hydrogenase, gamma subunit [Energy production and conversion]	NA|281aa|down_4|NC_021658.1_10336878_10337721_-	cd06221, sulfite_reductase_like, Anaerobic sulfite reductase contains an FAD and NADPH binding module with structural similarity to ferredoxin reductase and sequence similarity to dihydroorotate dehydrogenases	NA|159aa|down_5|NC_021658.1_10337801_10338278_-	cd00038, CAP_ED, effector domain of the CAP family of transcription factors; members include CAP (or cAMP receptor protein (CRP)), which binds cAMP, FNR (fumarate and nitrate reduction), which uses an iron-sulfur cluster to sense oxygen) and CooA, a heme containing CO sensor	NA|405aa|down_6|NC_021658.1_10338284_10339499_-	pfam17179, Fer4_22, 4Fe-4S dicluster domain	NA|82aa|down_7|NC_021658.1_10339826_10340072_+	pfam04023, FeoA, FeoA domain	NA|416aa|down_8|NC_021658.1_10340816_10342064_+	COG0370, FeoB, Fe2+ transport system protein B [Inorganic ion transport and metabolism]	NA|777aa|down_9|NC_021658.1_10342205_10344536_+	PRK06464, PRK06464, phosphoenolpyruvate synthase; Validated
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	49	10533993-10534088	43	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CGGCCCCTGCCAGAGCGCCCAGGG	24	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA,NA|184aa|down_8|NC_021658.1_10546422_10546974_-,NA|193aa|down_9|NC_021658.1_10547084_10547663_-	NA|610aa|up_9|NC_021658.1_10520363_10522193_-	COG0644, FixC, Dehydrogenases (flavoproteins) [Energy production and conversion]	NA|446aa|up_8|NC_021658.1_10522204_10523542_-	TIGR02946, Putative_diacyglycerol_O-acyltransferase_Mb3115, acyltransferase, WS/DGAT/MGAT	NA|313aa|up_7|NC_021658.1_10523742_10524681_+	cd08417, PBP2_Nitroaromatics_like, The C-terminal substrate binding domain of LysR-type transcriptional regulators that involved in the catabolism of nitroaromatic/naphthalene compounds and that of related regulators; contains the type 2 periplasmic binding fold	NA|792aa|up_6|NC_021658.1_10524739_10527115_-	TIGR02515, Putative_DNA_transport_protein_HofQ, type IV pilus secretin (or competence protein) PilQ	NA|214aa|up_5|NC_021658.1_10527203_10527845_-	pfam04351, PilP, Pilus assembly protein, PilP	NA|213aa|up_4|NC_021658.1_10527841_10528480_-	pfam04350, PilO, Pilus assembly protein, PilO	NA|215aa|up_3|NC_021658.1_10528479_10529124_-	COG3166, PilN, Tfp pilus assembly protein PilN [Cell motility and secretion / Intracellular trafficking and secretion]	NA|354aa|up_2|NC_021658.1_10529120_10530182_-	pfam11104, PilM_2, Type IV pilus assembly protein PilM;	NA|371aa|up_1|NC_021658.1_10530532_10531645_+	COG3108, COG3108, Uncharacterized protein conserved in bacteria [Function unknown]	NA|326aa|up_0|NC_021658.1_10531770_10532748_+	TIGR02479, RNA_polymerase_sigma_factor_WhiG, RNA polymerase sigma factor, FliA/WhiG family	NA|461aa|down_0|NC_021658.1_10535608_10536991_-	pfam05853, BKACE, beta-keto acid cleavage enzyme	NA|278aa|down_1|NC_021658.1_10537049_10537883_+	cd00475, Cis_IPPS, Cis (Z)-Isoprenyl Diphosphate Synthases	NA|267aa|down_2|NC_021658.1_10537907_10538708_+	pfam01148, CTP_transf_1, Cytidylyltransferase family	NA|442aa|down_3|NC_021658.1_10538873_10540199_+	COG0334, GdhA, Glutamate dehydrogenase/leucine dehydrogenase [Amino acid transport and metabolism]	NA|365aa|down_4|NC_021658.1_10540274_10541369_-	PRK12282, PRK12282, tryptophanyl-tRNA synthetase II; Reviewed	NA|578aa|down_5|NC_021658.1_10541520_10543254_+	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|652aa|down_6|NC_021658.1_10543307_10545263_+	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|334aa|down_7|NC_021658.1_10545344_10546346_-	COG0354, COG0354, Predicted aminomethyltransferase related to GcvT [General function prediction only]	NA|184aa|down_8|NC_021658.1_10546422_10546974_-	NA	NA|193aa|down_9|NC_021658.1_10547084_10547663_-	NA
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	50	10765963-10766259	9	CRT	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCCGCCTTCTCCGGCNCN	18	0	0	NA	NA	NA	6	6	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|279aa|up_6|NC_021658.1_10757980_10758817_+,NA|99aa|up_3|NC_021658.1_10760383_10760680_-,NA|252aa|down_0|NC_021658.1_10768219_10768975_+,NA|157aa|down_1|NC_021658.1_10768971_10769442_+,NA|273aa|down_8|NC_021658.1_10778022_10778841_+	NA|311aa|up_9|NC_021658.1_10754770_10755703_+	cd06124, cupin_NimR-like_N, AraC/XylS family transcriptional regulators similar to NimR, N-terminal cupin domain	NA|294aa|up_8|NC_021658.1_10755788_10756670_-	COG1360, MotB, Flagellar motor protein [Cell motility and secretion]	NA|339aa|up_7|NC_021658.1_10756938_10757955_+	COG0473, LeuB, Isocitrate/isopropylmalate dehydrogenase [Amino acid transport and metabolism]	NA|279aa|up_6|NC_021658.1_10757980_10758817_+	NA	NA|248aa|up_5|NC_021658.1_10758864_10759608_-	pfam01213, CAP_N, Adenylate cyclase associated (CAP) N terminal	NA|172aa|up_4|NC_021658.1_10759604_10760120_-	COG2840, COG2840, Uncharacterized protein conserved in bacteria [Function unknown]	NA|99aa|up_3|NC_021658.1_10760383_10760680_-	NA	NA|156aa|up_2|NC_021658.1_10760868_10761336_-	PTZ00449, PTZ00449, 104 kDa microneme/rhoptry antigen; Provisional	NA|922aa|up_1|NC_021658.1_10762093_10764859_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|183aa|up_0|NC_021658.1_10765385_10765934_-	cd03424, ADPRase_NUDT5, ADP-ribose pyrophosphatase (ADPRase) catalyzes the hydrolysis of ADP-ribose and a variety of additional ADP-sugar conjugates to AMP and ribose-5-phosphate	NA|252aa|down_0|NC_021658.1_10768219_10768975_+	NA	NA|157aa|down_1|NC_021658.1_10768971_10769442_+	NA	NA|150aa|down_2|NC_021658.1_10769444_10769894_+	PRK05273, PRK05273, D-tyrosyl-tRNA(Tyr) deacylase; Provisional	NA|327aa|down_3|NC_021658.1_10769964_10770945_+	COG1893, ApbA, Ketopantoate reductase [Coenzyme metabolism]	NA|333aa|down_4|NC_021658.1_10771001_10772000_-	TIGR00557, pdxA, 4-hydroxythreonine-4-phosphate dehydrogenase	NA|314aa|down_5|NC_021658.1_10772107_10773049_-	COG0745, OmpR, Response regulators consisting of a CheY-like receiver domain and a winged-helix DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|482aa|down_6|NC_021658.1_10773156_10774602_-	PRK10735, tldD, protease TldD; Provisional	NA|919aa|down_7|NC_021658.1_10775167_10777924_+	TIGR02917, TPR_domain_protein, putative PEP-CTERM system TPR-repeat lipoprotein	NA|273aa|down_8|NC_021658.1_10778022_10778841_+	NA	NA|386aa|down_9|NC_021658.1_10778828_10779986_-	cd06578, HemD, Uroporphyrinogen-III synthase (HemD) catalyzes the asymmetrical cyclization of tetrapyrrole (linear) to uroporphyrinogen-III, the fourth step in the biosynthesis of heme
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	51	11366810-11366899	44	CRISPRCasFinder	no	csa3	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Type I-A	GTGAGCGAGCGCAGCGGCGAGAG	23	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|162aa|up_4|NC_021658.1_11355930_11356416_+,NA|494aa|up_0|NC_021658.1_11364873_11366355_-,NA|213aa|down_1|NC_021658.1_11370881_11371520_-,NA|225aa|down_2|NC_021658.1_11371723_11372398_+,NA|353aa|down_3|NC_021658.1_11372460_11373519_+,NA|131aa|down_4|NC_021658.1_11373673_11374066_+,NA|392aa|down_5|NC_021658.1_11374131_11375307_+,NA|163aa|down_6|NC_021658.1_11375276_11375765_-,NA|139aa|down_7|NC_021658.1_11375752_11376169_-,NA|325aa|down_9|NC_021658.1_11377607_11378582_-	NA|400aa|up_9|NC_021658.1_11347967_11349167_+	pfam00457, Glyco_hydro_11, Glycosyl hydrolases family 11	NA|201aa|up_8|NC_021658.1_11349744_11350347_-	pfam00457, Glyco_hydro_11, Glycosyl hydrolases family 11	NA|236aa|up_7|NC_021658.1_11351185_11351893_-	PRK11752, PRK11752, putative S-transferase; Provisional	NA|802aa|up_6|NC_021658.1_11352222_11354628_+	cd11339, AmyAc_bac_CMD_like_2, Alpha amylase catalytic domain found in bacterial cyclomaltodextrinases and related proteins	NA|341aa|up_5|NC_021658.1_11354695_11355718_-	COG2130, COG2130, Putative NADP-dependent oxidoreductases [General function prediction only]	NA|162aa|up_4|NC_021658.1_11355930_11356416_+	NA	NA|1358aa|up_3|NC_021658.1_11356551_11360625_+	sd00038, Kelch, Kelch repeat	NA|346aa|up_2|NC_021658.1_11361342_11362380_-	PRK01372, ddl, D-alanine--D-alanine ligase; Reviewed	NA|530aa|up_1|NC_021658.1_11363268_11364858_+	PRK03180, ligB, ATP-dependent DNA ligase; Reviewed	NA|494aa|up_0|NC_021658.1_11364873_11366355_-	NA	NA|942aa|down_0|NC_021658.1_11367971_11370797_-	COG3903, COG3903, Predicted ATPase [General function prediction only]	NA|213aa|down_1|NC_021658.1_11370881_11371520_-	NA	NA|225aa|down_2|NC_021658.1_11371723_11372398_+	NA	NA|353aa|down_3|NC_021658.1_11372460_11373519_+	NA	NA|131aa|down_4|NC_021658.1_11373673_11374066_+	NA	NA|392aa|down_5|NC_021658.1_11374131_11375307_+	NA	NA|163aa|down_6|NC_021658.1_11375276_11375765_-	NA	NA|139aa|down_7|NC_021658.1_11375752_11376169_-	NA	NA|454aa|down_8|NC_021658.1_11376192_11377554_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|325aa|down_9|NC_021658.1_11377607_11378582_-	NA
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	52	11367008-11367144	45	CRISPRCasFinder	no	csa3	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Type I-A	GTGAGCGAGCGCAGCGGCGAGAG	23	0	0	NA	NA	NA	2	2	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|162aa|up_4|NC_021658.1_11355930_11356416_+,NA|494aa|up_0|NC_021658.1_11364873_11366355_-,NA|213aa|down_1|NC_021658.1_11370881_11371520_-,NA|225aa|down_2|NC_021658.1_11371723_11372398_+,NA|353aa|down_3|NC_021658.1_11372460_11373519_+,NA|131aa|down_4|NC_021658.1_11373673_11374066_+,NA|392aa|down_5|NC_021658.1_11374131_11375307_+,NA|163aa|down_6|NC_021658.1_11375276_11375765_-,NA|139aa|down_7|NC_021658.1_11375752_11376169_-,NA|325aa|down_9|NC_021658.1_11377607_11378582_-	NA|400aa|up_9|NC_021658.1_11347967_11349167_+	pfam00457, Glyco_hydro_11, Glycosyl hydrolases family 11	NA|201aa|up_8|NC_021658.1_11349744_11350347_-	pfam00457, Glyco_hydro_11, Glycosyl hydrolases family 11	NA|236aa|up_7|NC_021658.1_11351185_11351893_-	PRK11752, PRK11752, putative S-transferase; Provisional	NA|802aa|up_6|NC_021658.1_11352222_11354628_+	cd11339, AmyAc_bac_CMD_like_2, Alpha amylase catalytic domain found in bacterial cyclomaltodextrinases and related proteins	NA|341aa|up_5|NC_021658.1_11354695_11355718_-	COG2130, COG2130, Putative NADP-dependent oxidoreductases [General function prediction only]	NA|162aa|up_4|NC_021658.1_11355930_11356416_+	NA	NA|1358aa|up_3|NC_021658.1_11356551_11360625_+	sd00038, Kelch, Kelch repeat	NA|346aa|up_2|NC_021658.1_11361342_11362380_-	PRK01372, ddl, D-alanine--D-alanine ligase; Reviewed	NA|530aa|up_1|NC_021658.1_11363268_11364858_+	PRK03180, ligB, ATP-dependent DNA ligase; Reviewed	NA|494aa|up_0|NC_021658.1_11364873_11366355_-	NA	NA|942aa|down_0|NC_021658.1_11367971_11370797_-	COG3903, COG3903, Predicted ATPase [General function prediction only]	NA|213aa|down_1|NC_021658.1_11370881_11371520_-	NA	NA|225aa|down_2|NC_021658.1_11371723_11372398_+	NA	NA|353aa|down_3|NC_021658.1_11372460_11373519_+	NA	NA|131aa|down_4|NC_021658.1_11373673_11374066_+	NA	NA|392aa|down_5|NC_021658.1_11374131_11375307_+	NA	NA|163aa|down_6|NC_021658.1_11375276_11375765_-	NA	NA|139aa|down_7|NC_021658.1_11375752_11376169_-	NA	NA|454aa|down_8|NC_021658.1_11376192_11377554_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|325aa|down_9|NC_021658.1_11377607_11378582_-	NA
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	53	11465309-11465423	46	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CCCGAGGGGAAGCGCGGCGGCCCCTCGC	28	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|95aa|up_4|NC_021658.1_11459734_11460019_-,NA|311aa|up_1|NC_021658.1_11462727_11463660_+,NA	NA|565aa|up_9|NC_021658.1_11451797_11453492_+	COG0433, COG0433,  HerA helicase [Replication, recombination, and repair]	NA|199aa|up_8|NC_021658.1_11453534_11454131_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|540aa|up_7|NC_021658.1_11454514_11456134_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|533aa|up_6|NC_021658.1_11456326_11457925_-	pfam10011, DUF2254, Predicted membrane protein (DUF2254)	NA|372aa|up_5|NC_021658.1_11458046_11459162_-	PRK12323, PRK12323, DNA polymerase III subunit gamma/tau	NA|95aa|up_4|NC_021658.1_11459734_11460019_-	NA	NA|212aa|up_3|NC_021658.1_11460586_11461222_+	sd00006, TPR, Tetratricopeptide repeat	NA|475aa|up_2|NC_021658.1_11461286_11462711_+	PRK00293, dipZ, thiol:disulfide interchange protein precursor; Provisional	NA|311aa|up_1|NC_021658.1_11462727_11463660_+	NA	NA|336aa|up_0|NC_021658.1_11463669_11464677_-	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|312aa|down_0|NC_021658.1_11467243_11468179_-	PRK05627, PRK05627, bifunctional riboflavin kinase/FAD synthetase	NA|315aa|down_1|NC_021658.1_11468433_11469378_+	PRK01259, PRK01259, ribose-phosphate diphosphokinase	NA|229aa|down_2|NC_021658.1_11469592_11470279_+	PRK05618, PRK05618, 50S ribosomal protein L25/general stress protein Ctc; Reviewed	NA|224aa|down_3|NC_021658.1_11470417_11471089_+	PRK05426, PRK05426, peptidyl-tRNA hydrolase; Provisional	NA|180aa|down_4|NC_021658.1_11471201_11471741_+	cd00473, bS6, Bacterial ribosomal protein S6	NA|107aa|down_5|NC_021658.1_11471743_11472064_+	PRK00391, rpsR, 30S ribosomal protein S18; Reviewed	NA|151aa|down_6|NC_021658.1_11472074_11472527_+	PRK00137, rplI, 50S ribosomal protein L9; Reviewed	NA|327aa|down_7|NC_021658.1_11472602_11473583_-	cd01167, bac_FRK, Fructokinases (FRKs) mainly from bacteria and plants are enzymes with high specificity for fructose, as are all FRKs, but they catalyzes the conversion of fructose to fructose-6-phosphate, which is an entry point into glycolysis via conversion into glucose-6-phosphate	NA|501aa|down_8|NC_021658.1_11474004_11475507_+	TIGR00665, DnaB, replicative DNA helicase	NA|129aa|down_9|NC_021658.1_11475731_11476118_+	TIGR03340, phn_DUF6, phosphonate utilization associated putative membrane protein
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	54	11531270-11531382	47	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCGTCTGCTCGTTGTTCGACGCGAAGC	27	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|59aa|up_4|NC_021658.1_11526251_11526428_-,NA|144aa|down_4|NC_021658.1_11549682_11550114_-	NA|186aa|up_9|NC_021658.1_11516650_11517208_+	cd05381, CAP_PR-1, CAP (cysteine-rich secretory proteins, antigen 5, and pathogenesis-related 1 proteins) domain of pathogenesis-related protein 1 (PR-1) family proteins	NA|395aa|up_8|NC_021658.1_11517295_11518480_+	cd00567, ACAD, Acyl-CoA dehydrogenase	NA|685aa|up_7|NC_021658.1_11518631_11520686_+	cd06456, M3A_DCP, Peptidase family M3, dipeptidyl carboxypeptidase (DCP)	NA|626aa|up_6|NC_021658.1_11521183_11523061_+	pfam08308, PEGA, PEGA domain	NA|632aa|up_5|NC_021658.1_11523198_11525094_-	TIGR04247, nitrous_oxide_maturation_protein_NosD, nitrous oxide reductase family maturation protein NosD	NA|59aa|up_4|NC_021658.1_11526251_11526428_-	NA	NA|110aa|up_3|NC_021658.1_11526582_11526912_+	pfam07238, PilZ, PilZ domain	NA|847aa|up_2|NC_021658.1_11527235_11529776_-	COG3202, COG3202, ATP/ADP translocase [Energy production and conversion]	NA|202aa|up_1|NC_021658.1_11529786_11530392_-	TIGR02727, Uncharacterized_protein_YqgN, 5,10-methenyltetrahydrofolate synthetase	NA|150aa|up_0|NC_021658.1_11530733_11531183_+	PRK00567, mscL, large-conductance mechanosensitive channel protein MscL	NA|807aa|down_0|NC_021658.1_11540354_11542775_-	pfam03534, SpvB, Salmonella virulence plasmid 65kDa B protein	NA|269aa|down_1|NC_021658.1_11543302_11544109_+	CHL00019, atpF, ATP synthase CF0 B subunit	NA|1125aa|down_2|NC_021658.1_11544811_11548186_-	pfam13517, VCBS, Repeat domain in Vibrio, Colwellia, Bradyrhizobium and Shewanella	NA|467aa|down_3|NC_021658.1_11548185_11549586_-	pfam08308, PEGA, PEGA domain	NA|144aa|down_4|NC_021658.1_11549682_11550114_-	NA	NA|1239aa|down_5|NC_021658.1_11550170_11553887_-	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|664aa|down_6|NC_021658.1_11553883_11555875_-	pfam12770, CHAT, CHAT domain	NA|510aa|down_7|NC_021658.1_11556129_11557659_+	pfam08308, PEGA, PEGA domain	NA|807aa|down_8|NC_021658.1_11558069_11560490_+	pfam13517, VCBS, Repeat domain in Vibrio, Colwellia, Bradyrhizobium and Shewanella	NA|569aa|down_9|NC_021658.1_11560963_11562670_+	cd07302, CHD, cyclase homology domain
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	55	11695354-11695462	48	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GGGCTCCGTCGGGACCGTGGGCTCCGT	27	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|74aa|up_9|NC_021658.1_11684897_11685119_+,NA|267aa|up_8|NC_021658.1_11685136_11685937_+,NA|222aa|up_6|NC_021658.1_11688159_11688825_+,NA|281aa|up_1|NC_021658.1_11691902_11692745_-,NA|136aa|down_0|NC_021658.1_11698139_11698547_+,NA|58aa|down_6|NC_021658.1_11706749_11706923_-	NA|74aa|up_9|NC_021658.1_11684897_11685119_+	NA	NA|267aa|up_8|NC_021658.1_11685136_11685937_+	NA	NA|417aa|up_7|NC_021658.1_11686428_11687679_-	PTZ00146, PTZ00146, fibrillarin; Provisional	NA|222aa|up_6|NC_021658.1_11688159_11688825_+	NA	NA|336aa|up_5|NC_021658.1_11688905_11689913_+	TIGR02937, RNA_polymerase_sigma_factor, RNA polymerase sigma factor, sigma-70 family	NA|181aa|up_4|NC_021658.1_11689984_11690527_+	TIGR02937, RNA_polymerase_sigma_factor, RNA polymerase sigma factor, sigma-70 family	NA|106aa|up_3|NC_021658.1_11690628_11690946_+	COG1359, COG1359, Uncharacterized conserved protein [Function unknown]	NA|301aa|up_2|NC_021658.1_11690926_11691829_-	cd05466, PBP2_LTTR_substrate, The substrate binding domain of LysR-type transcriptional regulators (LTTRs), a member of the type 2 periplasmic binding fold protein superfamily	NA|281aa|up_1|NC_021658.1_11691902_11692745_-	NA	NA|769aa|up_0|NC_021658.1_11693014_11695321_-	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|136aa|down_0|NC_021658.1_11698139_11698547_+	NA	NA|293aa|down_1|NC_021658.1_11698791_11699670_-	pfam13385, Laminin_G_3, Concanavalin A-like lectin/glucanases superfamily	NA|653aa|down_2|NC_021658.1_11700241_11702200_+	TIGR04247, nitrous_oxide_maturation_protein_NosD, nitrous oxide reductase family maturation protein NosD	NA|286aa|down_3|NC_021658.1_11702282_11703140_-	TIGR02069, cyanophycinase, cyanophycinase	NA|895aa|down_4|NC_021658.1_11703164_11705849_-	PRK14016, PRK14016, cyanophycin synthetase; Provisional	NA|270aa|down_5|NC_021658.1_11705873_11706683_-	TIGR02069, cyanophycinase, cyanophycinase	NA|58aa|down_6|NC_021658.1_11706749_11706923_-	NA	NA|1040aa|down_7|NC_021658.1_11707404_11710524_-	smart00382, AAA, ATPases associated with a variety of cellular activities	NA|291aa|down_8|NC_021658.1_11711048_11711921_-	COG0266, Nei, Formamidopyrimidine-DNA glycosylase [DNA replication, recombination, and repair]	NA|921aa|down_9|NC_021658.1_11711999_11714762_-	pfam00520, Ion_trans, Ion transport protein
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	56	12553389-12553489	49	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CTACCGCGGCACGGCAGAGAGCTACCGCCGGCACGG	36	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|161aa|up_4|NC_021658.1_12544290_12544773_+,NA|114aa|up_3|NC_021658.1_12546301_12546643_+,NA|126aa|up_2|NC_021658.1_12549142_12549520_+,NA|295aa|up_1|NC_021658.1_12549607_12550492_+,NA|53aa|down_0|NC_021658.1_12556453_12556612_+,NA|56aa|down_1|NC_021658.1_12556892_12557060_-,NA|233aa|down_2|NC_021658.1_12557074_12557773_+,NA|424aa|down_8|NC_021658.1_12565397_12566669_-	NA|283aa|up_9|NC_021658.1_12532864_12533713_+	cd03023, DsbA_Com1_like, DsbA family, Com1-like subfamily; composed of proteins similar to Com1, a 27-kDa outer membrane-associated immunoreactive protein originally found in both acute and chronic disease strains of the pathogenic bacteria Coxiella burnetti	NA|306aa|up_8|NC_021658.1_12533717_12534635_-	cd05374, 17beta-HSD-like_SDR_c, 17beta hydroxysteroid dehydrogenase-like, classical (c) SDRs	NA|371aa|up_7|NC_021658.1_12535851_12536964_-	PLN03138, PLN03138, Protein TOC75; Provisional	NA|209aa|up_6|NC_021658.1_12539733_12540360_+	pfam00457, Glyco_hydro_11, Glycosyl hydrolases family 11	NA|211aa|up_5|NC_021658.1_12540508_12541141_-	COG0625, Gst, Glutathione S-transferase [Posttranslational modification, protein turnover, chaperones]	NA|161aa|up_4|NC_021658.1_12544290_12544773_+	NA	NA|114aa|up_3|NC_021658.1_12546301_12546643_+	NA	NA|126aa|up_2|NC_021658.1_12549142_12549520_+	NA	NA|295aa|up_1|NC_021658.1_12549607_12550492_+	NA	NA|767aa|up_0|NC_021658.1_12550927_12553228_-	cd18805, SF2_C_suv3, C-terminal helicase domain of ATP-dependent RNA helicase	NA|53aa|down_0|NC_021658.1_12556453_12556612_+	NA	NA|56aa|down_1|NC_021658.1_12556892_12557060_-	NA	NA|233aa|down_2|NC_021658.1_12557074_12557773_+	NA	NA|303aa|down_3|NC_021658.1_12557956_12558865_-	cd19100, AKR_unchar, uncharacterized aldo-keto reductase (AKR) superfamily protein	NA|470aa|down_4|NC_021658.1_12559163_12560573_-	pfam07586, HXXSHH, Protein of unknown function (DUF1552)	NA|575aa|down_5|NC_021658.1_12560569_12562294_-	pfam07631, PSD4, Protein of unknown function (DUF1592)	NA|304aa|down_6|NC_021658.1_12562559_12563471_-	pfam00014, Kunitz_BPTI, Kunitz/Bovine pancreatic trypsin inhibitor domain	NA|564aa|down_7|NC_021658.1_12563576_12565268_-	cd00144, MPP_PPP_family, phosphoprotein phosphatases of the metallophosphatase superfamily, metallophosphatase domain	NA|424aa|down_8|NC_021658.1_12565397_12566669_-	NA	NA|456aa|down_9|NC_021658.1_12566665_12568033_-	pfam07394, DUF1501, Protein of unknown function (DUF1501)
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	57	12646297-12646447	50	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCCGCACCGCTCGTCGGACCGGCAGTCGGCGCTGCAGCCGTCGCCGTCC	49	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|319aa|up_8|NC_021658.1_12634422_12635379_-,NA|121aa|up_5|NC_021658.1_12637765_12638128_+,NA	NA|307aa|up_9|NC_021658.1_12633109_12634030_-	COG1943, COG1943, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|319aa|up_8|NC_021658.1_12634422_12635379_-	NA	NA|350aa|up_7|NC_021658.1_12635534_12636584_-	cd08417, PBP2_Nitroaromatics_like, The C-terminal substrate binding domain of LysR-type transcriptional regulators that involved in the catabolism of nitroaromatic/naphthalene compounds and that of related regulators; contains the type 2 periplasmic binding fold	NA|107aa|up_6|NC_021658.1_12636619_12636940_+	pfam03992, ABM, Antibiotic biosynthesis monooxygenase	NA|121aa|up_5|NC_021658.1_12637765_12638128_+	NA	NA|488aa|up_4|NC_021658.1_12638439_12639903_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|462aa|up_3|NC_021658.1_12639899_12641285_+	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|233aa|up_2|NC_021658.1_12641485_12642184_+	pfam03682, UPF0158, Uncharacterized protein family (UPF0158)	NA|336aa|up_1|NC_021658.1_12642252_12643260_-	TIGR00367, Uncharacterized_membrane_protein_MJ0091, K+-dependent Na+/Ca+ exchanger related-protein	NA|320aa|up_0|NC_021658.1_12643354_12644314_-	pfam08308, PEGA, PEGA domain	NA|414aa|down_0|NC_021658.1_12647010_12648252_+	pfam05762, VWA_CoxE, VWA domain containing CoxE-like protein	NA|730aa|down_1|NC_021658.1_12649099_12651289_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|147aa|down_2|NC_021658.1_12655831_12656272_-	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|141aa|down_3|NC_021658.1_12658201_12658624_-	COG1733, COG1733, Predicted transcriptional regulators [Transcription]	NA|990aa|down_4|NC_021658.1_12659047_12662017_+	pfam13646, HEAT_2, HEAT repeats	NA|141aa|down_5|NC_021658.1_12662132_12662555_-	cd17557, REC_Rcp-like, phosphoacceptor receiver (REC) domain of cyanobacterial phytochrome response regulator Rcp and similar domains	NA|965aa|down_6|NC_021658.1_12662832_12665727_-	COG4251, COG4251, Bacteriophytochrome (light-regulated signal transduction histidine kinase) [Signal transduction mechanisms]	NA|223aa|down_7|NC_021658.1_12666302_12666971_-	PRK14951, PRK14951, DNA polymerase III subunits gamma and tau; Provisional	NA|228aa|down_8|NC_021658.1_12666921_12667605_-	PHA02518, PHA02518, ParA-like protein; Provisional	NA|355aa|down_9|NC_021658.1_12668380_12669445_+	pfam12770, CHAT, CHAT domain
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	58	12836833-12836921	51	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GGACAGGACAGCGCTCCTCCTCGGCAGGC	29	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA,NA	NA|98aa|up_9|NC_021658.1_12820496_12820790_+	cd03418, GRX_GRXb_1_3_like, Glutaredoxin (GRX) family, GRX bacterial class 1 and 3 (b_1_3)-like subfamily; composed of bacterial GRXs, approximately 10 kDa in size, and proteins containing a GRX or GRX-like domain	NA|568aa|up_8|NC_021658.1_12820983_12822687_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|375aa|up_7|NC_021658.1_12822802_12823927_+	TIGR02031, Magnesium-chelatase_67_kDa_subunit, magnesium chelatase ATPase subunit D	NA|656aa|up_6|NC_021658.1_12824092_12826060_+	PRK00174, PRK00174, acetyl-CoA synthetase; Provisional	NA|518aa|up_5|NC_021658.1_12826312_12827866_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|560aa|up_4|NC_021658.1_12827924_12829604_-	PRK11360, PRK11360, two-component system sensor histidine kinase AtoS	NA|362aa|up_3|NC_021658.1_12829600_12830686_-	COG0247, GlpC, Fe-S oxidoreductase [Energy production and conversion]	NA|701aa|up_2|NC_021658.1_12830735_12832838_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|416aa|up_1|NC_021658.1_12832954_12834202_-	PRK09376, rho, transcription termination factor Rho; Provisional	NA|93aa|up_0|NC_021658.1_12834589_12834868_+	COG1254, AcyP, Acylphosphatases [Energy production and conversion]	NA|173aa|down_0|NC_021658.1_12837317_12837836_-	PRK05591, rplQ, 50S ribosomal protein L17; Validated	NA|347aa|down_1|NC_021658.1_12837856_12838897_-	PRK05182, PRK05182, DNA-directed RNA polymerase subunit alpha; Provisional	NA|210aa|down_2|NC_021658.1_12839105_12839735_-	PRK05327, rpsD, 30S ribosomal protein S4; Validated	NA|137aa|down_3|NC_021658.1_12839746_12840157_-	PRK05309, PRK05309, 30S ribosomal protein S11; Validated	NA|127aa|down_4|NC_021658.1_12840177_12840558_-	PRK05179, rpsM, 30S ribosomal protein S13; Validated	NA|39aa|down_5|NC_021658.1_12840601_12840718_-	PRK00465, rpmJ, 50S ribosomal protein L36; Reviewed	NA|84aa|down_6|NC_021658.1_12840749_12841001_-	PRK00276, infA, translation initiation factor IF-1; Validated	NA|214aa|down_7|NC_021658.1_12840997_12841639_-	PRK00279, adk, adenylate kinase; Reviewed	NA|443aa|down_8|NC_021658.1_12841649_12842978_-	PRK09204, secY, preprotein translocase subunit SecY; Reviewed	NA|164aa|down_9|NC_021658.1_12843022_12843514_-	PRK05592, rplO, 50S ribosomal protein L15; Reviewed
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	59	12863887-12863963	52	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GATCGCGCCCGCCGGCGCCGTGAGG	25	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|99aa|up_1|NC_021658.1_12862997_12863294_+,NA|61aa|up_0|NC_021658.1_12863636_12863819_+,NA|167aa|down_0|NC_021658.1_12864018_12864519_-,NA|60aa|down_3|NC_021658.1_12868618_12868798_+	NA|113aa|up_9|NC_021658.1_12849200_12849539_-	PRK00565, rplV, 50S ribosomal protein L22; Reviewed	NA|245aa|up_8|NC_021658.1_12850197_12850932_+	PTZ00146, PTZ00146, fibrillarin; Provisional	NA|299aa|up_7|NC_021658.1_12851253_12852150_+	pfam03781, FGE-sulfatase, Sulfatase-modifying factor enzyme 1	NA|475aa|up_6|NC_021658.1_12852379_12853804_+	PRK12323, PRK12323, DNA polymerase III subunit gamma/tau	NA|175aa|up_5|NC_021658.1_12853896_12854421_-	PLN03237, PLN03237, DNA topoisomerase 2; Provisional	NA|222aa|up_4|NC_021658.1_12855908_12856574_+	COG2226, UbiE, Methylase involved in ubiquinone/menaquinone biosynthesis [Coenzyme metabolism]	NA|569aa|up_3|NC_021658.1_12859351_12861058_+	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|427aa|up_2|NC_021658.1_12861236_12862517_+	COG0768, FtsI, Cell division protein FtsI/penicillin-binding protein 2 [Cell envelope biogenesis, outer membrane]	NA|99aa|up_1|NC_021658.1_12862997_12863294_+	NA	NA|61aa|up_0|NC_021658.1_12863636_12863819_+	NA	NA|167aa|down_0|NC_021658.1_12864018_12864519_-	NA	NA|1019aa|down_1|NC_021658.1_12864578_12867635_-	COG0823, TolB, Periplasmic component of the Tol biopolymer transport system [Intracellular trafficking and secretion]	NA|225aa|down_2|NC_021658.1_12867659_12868334_-	PRK07994, PRK07994, DNA polymerase III subunits gamma and tau; Validated	NA|60aa|down_3|NC_021658.1_12868618_12868798_+	NA	NA|311aa|down_4|NC_021658.1_12868892_12869825_-	COG0223, Fmt, Methionyl-tRNA formyltransferase [Translation, ribosomal structure and biogenesis]	NA|277aa|down_5|NC_021658.1_12869845_12870676_+	COG2884, FtsE, Predicted ATPase involved in cell division [Cell division and chromosome partitioning]	NA|298aa|down_6|NC_021658.1_12870722_12871616_+	COG2177, FtsX, Cell division protein [Cell division and chromosome partitioning]	NA|334aa|down_7|NC_021658.1_12871612_12872614_+	COG4942, COG4942, Membrane-bound metallopeptidase [Cell division and chromosome partitioning]	NA|258aa|down_8|NC_021658.1_12872705_12873479_+	PRK00173, rph, ribonuclease PH; Reviewed	NA|208aa|down_9|NC_021658.1_12873475_12874099_+	PRK00120, PRK00120, dITP/XTP pyrophosphatase; Reviewed
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	60	12914976-12915078	53	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CGTCGCAGAGCGGCGGTCACCCGCACAG	28	1	1	12915004-12915050	NC_021658.1_2165184-2165138	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|290aa|up_4|NC_021658.1_12907567_12908437_+,NA|116aa|up_3|NC_021658.1_12908960_12909308_+,NA|87aa|up_1|NC_021658.1_12913496_12913757_+,NA|92aa|down_7|NC_021658.1_12924324_12924600_-	NA|381aa|up_9|NC_021658.1_12901237_12902380_+	PRK14951, PRK14951, DNA polymerase III subunits gamma and tau; Provisional	NA|329aa|up_8|NC_021658.1_12902712_12903699_+	pfam08308, PEGA, PEGA domain	NA|543aa|up_7|NC_021658.1_12903728_12905357_+	PRK13875, PRK13875, conjugal transfer protein TrbL; Provisional	NA|399aa|up_6|NC_021658.1_12905418_12906615_-	TIGR02937, RNA_polymerase_sigma_factor, RNA polymerase sigma factor, sigma-70 family	NA|112aa|up_5|NC_021658.1_12906972_12907308_+	cd05403, NT_KNTase_like, Nucleotidyltransferase (NT) domain of Staphylococcus aureus kanamycin nucleotidyltransferase, and similar proteins	NA|290aa|up_4|NC_021658.1_12907567_12908437_+	NA	NA|116aa|up_3|NC_021658.1_12908960_12909308_+	NA	NA|1300aa|up_2|NC_021658.1_12909304_12913204_+	pfam12770, CHAT, CHAT domain	NA|87aa|up_1|NC_021658.1_12913496_12913757_+	NA	NA|340aa|up_0|NC_021658.1_12913887_12914907_+	COG1192, Soj, ATPases involved in chromosome partitioning [Cell division and chromosome partitioning]	NA|309aa|down_0|NC_021658.1_12915180_12916107_-	COG0240, GpsA, Glycerol-3-phosphate dehydrogenase [Energy production and conversion]	NA|595aa|down_1|NC_021658.1_12916103_12917888_-	cd07993, LPLAT_DHAPAT-like, Lysophospholipid Acyltransferases (LPLATs) of Glycerophospholipid Biosynthesis: GPAT-like	NA|252aa|down_2|NC_021658.1_12917953_12918709_-	TIGR03413, GSH_gloB, hydroxyacylglutathione hydrolase	NA|335aa|down_3|NC_021658.1_12918876_12919881_+	pfam01351, RNase_HII, Ribonuclease HII	NA|385aa|down_4|NC_021658.1_12919985_12921140_+	PRK05550, PRK05550, bifunctional methionine sulfoxide reductase B/A protein; Provisional	NA|469aa|down_5|NC_021658.1_12921456_12922863_-	PRK06416, PRK06416, dihydrolipoamide dehydrogenase; Reviewed	NA|362aa|down_6|NC_021658.1_12923026_12924112_-	TIGR03181, PDH_E1_alph_x, pyruvate dehydrogenase E1 component, alpha subunit	NA|92aa|down_7|NC_021658.1_12924324_12924600_-	NA	NA|205aa|down_8|NC_021658.1_12924708_12925323_-	pfam13664, DUF4149, Domain of unknown function (DUF4149)	NA|349aa|down_9|NC_021658.1_12925319_12926366_-	COG1413, COG1413, FOG: HEAT repeat [Energy production and conversion]
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	61	13327224-13327304	54	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CTTCTCGGCGATCGTGCCCGCGCG	24	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|608aa|up_3|NC_021658.1_13320093_13321917_+,NA|229aa|up_2|NC_021658.1_13322459_13323146_+,NA|88aa|up_1|NC_021658.1_13323325_13323589_-,NA|262aa|down_6|NC_021658.1_13334782_13335568_+,NA|205aa|down_7|NC_021658.1_13335649_13336264_-	NA|734aa|up_9|NC_021658.1_13308710_13310912_-	PRK11360, PRK11360, two-component system sensor histidine kinase AtoS	NA|434aa|up_8|NC_021658.1_13310917_13312219_-	PRK05431, PRK05431, seryl-tRNA synthetase; Provisional	NA|918aa|up_7|NC_021658.1_13312354_13315108_-	PRK09277, PRK09277, aconitate hydratase AcnA	NA|292aa|up_6|NC_021658.1_13315169_13316045_+	pfam02586, SRAP, SOS response associated peptidase (SRAP)	NA|263aa|up_5|NC_021658.1_13316346_13317135_-	pfam01814, Hemerythrin, Hemerythrin HHE cation binding domain	NA|769aa|up_4|NC_021658.1_13317563_13319870_-	cd16148, sulfatase_like, uncharacterized sulfatase subfamily	NA|608aa|up_3|NC_021658.1_13320093_13321917_+	NA	NA|229aa|up_2|NC_021658.1_13322459_13323146_+	NA	NA|88aa|up_1|NC_021658.1_13323325_13323589_-	NA	NA|1148aa|up_0|NC_021658.1_13323721_13327165_-	cd17574, REC_OmpR, phosphoacceptor receiver (REC) domain of OmpR family response regulators	NA|364aa|down_0|NC_021658.1_13327332_13328424_-	COG0473, LeuB, Isocitrate/isopropylmalate dehydrogenase [Amino acid transport and metabolism]	NA|371aa|down_1|NC_021658.1_13328441_13329554_-	cd05305, L-AlaDH, Alanine dehydrogenase NAD-binding and catalytic domains	NA|540aa|down_2|NC_021658.1_13329713_13331333_-	pfam14332, DUF4388, Domain of unknown function (DUF4388)	NA|629aa|down_3|NC_021658.1_13331369_13333256_-	cd01949, GGDEF, Diguanylate-cyclase (DGC) or GGDEF domain	NA|269aa|down_4|NC_021658.1_13333252_13334059_-	PRK00450, dapF, diaminopimelate epimerase; Provisional	NA|113aa|down_5|NC_021658.1_13334055_13334394_-	pfam02594, DUF167, Uncharacterized ACR, YggU family COG1872	NA|262aa|down_6|NC_021658.1_13334782_13335568_+	NA	NA|205aa|down_7|NC_021658.1_13335649_13336264_-	NA	NA|110aa|down_8|NC_021658.1_13336577_13336907_+	pfam05164, ZapA, Cell division protein ZapA	NA|371aa|down_9|NC_021658.1_13337021_13338134_+	PRK05958, PRK05958, 8-amino-7-oxononanoate synthase; Reviewed
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	62	14280562-14280706	55	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GACGGGCGACGGGTGCGGCGCGAGCTGCCGGTGGGAGGTCTGCGGCAACGCG	52	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|261aa|up_9|NC_021658.1_14265189_14265972_+,NA|193aa|up_7|NC_021658.1_14267154_14267733_-,NA|222aa|up_2|NC_021658.1_14276540_14277206_+,NA|367aa|up_1|NC_021658.1_14277130_14278231_+,NA|191aa|down_7|NC_021658.1_14296306_14296879_+	NA|261aa|up_9|NC_021658.1_14265189_14265972_+	NA	NA|361aa|up_8|NC_021658.1_14266029_14267112_-	PRK02731, PRK02731, histidinol-phosphate aminotransferase; Validated	NA|193aa|up_7|NC_021658.1_14267154_14267733_-	NA	NA|371aa|up_6|NC_021658.1_14267729_14268842_-	pfam13304, AAA_21, AAA domain, putative AbiEii toxin, Type IV TA system	NA|1320aa|up_5|NC_021658.1_14269439_14273399_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|457aa|up_4|NC_021658.1_14273710_14275081_+	COG1541, PaaK, Coenzyme F390 synthetase [Coenzyme metabolism]	NA|397aa|up_3|NC_021658.1_14275077_14276268_+	cd03807, GT4_WbnK-like, Shigella dysenteriae WbnK and similar proteins	NA|222aa|up_2|NC_021658.1_14276540_14277206_+	NA	NA|367aa|up_1|NC_021658.1_14277130_14278231_+	NA	NA|451aa|up_0|NC_021658.1_14278422_14279775_-	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|1020aa|down_0|NC_021658.1_14282822_14285882_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|318aa|down_1|NC_021658.1_14285966_14286920_+	sd00006, TPR, Tetratricopeptide repeat	NA|394aa|down_2|NC_021658.1_14286954_14288136_-	TIGR04211, hypothetical_protein, SH3 domain protein	NA|746aa|down_3|NC_021658.1_14288393_14290631_+	cd06267, PBP1_LacI_sugar_binding-like, ligand binding domain of the LacI transcriptional regulator family belonging to the type 1 periplasmic-binding fold protein superfamily	NA|345aa|down_4|NC_021658.1_14290978_14292013_+	pfam03022, MRJP, Major royal jelly protein	NA|314aa|down_5|NC_021658.1_14291970_14292912_-	cd08422, PBP2_CrgA_like, The C-terminal substrate binding domain of LysR-type transcriptional regulator CrgA and its related homologs, contains the type 2 periplasmic binding domain	NA|250aa|down_6|NC_021658.1_14293934_14294684_-	PRK06172, PRK06172, SDR family oxidoreductase	NA|191aa|down_7|NC_021658.1_14296306_14296879_+	NA	NA|314aa|down_8|NC_021658.1_14297017_14297959_-	cd16283, RomA-like_MBL-fold, Enterobacter cloacae RomA and related proteins; MBL-fold metallo hydrolase domain	NA|245aa|down_9|NC_021658.1_14297963_14298698_-	PLN00042, PLN00042, photosystem II oxygen-evolving enhancer protein 2; Provisional
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	63	14281905-14282075	6	PILER-CR	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	CGAGCATCGCGCATTACGACGGCAGCTCCTGGACAT	36	0	0	NA	NA	NA	2	2	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|261aa|up_9|NC_021658.1_14265189_14265972_+,NA|193aa|up_7|NC_021658.1_14267154_14267733_-,NA|222aa|up_2|NC_021658.1_14276540_14277206_+,NA|367aa|up_1|NC_021658.1_14277130_14278231_+,NA|191aa|down_7|NC_021658.1_14296306_14296879_+	NA|261aa|up_9|NC_021658.1_14265189_14265972_+	NA	NA|361aa|up_8|NC_021658.1_14266029_14267112_-	PRK02731, PRK02731, histidinol-phosphate aminotransferase; Validated	NA|193aa|up_7|NC_021658.1_14267154_14267733_-	NA	NA|371aa|up_6|NC_021658.1_14267729_14268842_-	pfam13304, AAA_21, AAA domain, putative AbiEii toxin, Type IV TA system	NA|1320aa|up_5|NC_021658.1_14269439_14273399_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|457aa|up_4|NC_021658.1_14273710_14275081_+	COG1541, PaaK, Coenzyme F390 synthetase [Coenzyme metabolism]	NA|397aa|up_3|NC_021658.1_14275077_14276268_+	cd03807, GT4_WbnK-like, Shigella dysenteriae WbnK and similar proteins	NA|222aa|up_2|NC_021658.1_14276540_14277206_+	NA	NA|367aa|up_1|NC_021658.1_14277130_14278231_+	NA	NA|451aa|up_0|NC_021658.1_14278422_14279775_-	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|1020aa|down_0|NC_021658.1_14282822_14285882_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|318aa|down_1|NC_021658.1_14285966_14286920_+	sd00006, TPR, Tetratricopeptide repeat	NA|394aa|down_2|NC_021658.1_14286954_14288136_-	TIGR04211, hypothetical_protein, SH3 domain protein	NA|746aa|down_3|NC_021658.1_14288393_14290631_+	cd06267, PBP1_LacI_sugar_binding-like, ligand binding domain of the LacI transcriptional regulator family belonging to the type 1 periplasmic-binding fold protein superfamily	NA|345aa|down_4|NC_021658.1_14290978_14292013_+	pfam03022, MRJP, Major royal jelly protein	NA|314aa|down_5|NC_021658.1_14291970_14292912_-	cd08422, PBP2_CrgA_like, The C-terminal substrate binding domain of LysR-type transcriptional regulator CrgA and its related homologs, contains the type 2 periplasmic binding domain	NA|250aa|down_6|NC_021658.1_14293934_14294684_-	PRK06172, PRK06172, SDR family oxidoreductase	NA|191aa|down_7|NC_021658.1_14296306_14296879_+	NA	NA|314aa|down_8|NC_021658.1_14297017_14297959_-	cd16283, RomA-like_MBL-fold, Enterobacter cloacae RomA and related proteins; MBL-fold metallo hydrolase domain	NA|245aa|down_9|NC_021658.1_14297963_14298698_-	PLN00042, PLN00042, photosystem II oxygen-evolving enhancer protein 2; Provisional
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	64	14326570-14326669	56	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GGCATACTAACTTGCTTGTGGCC	23	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|123aa|up_4|NC_021658.1_14321166_14321535_+,NA|229aa|up_2|NC_021658.1_14323547_14324234_+,NA	NA|195aa|up_9|NC_021658.1_14315583_14316168_-	TIGR02246, hypothetical_protein, conserved hypothetical protein	NA|342aa|up_8|NC_021658.1_14316262_14317288_-	cd19091, AKR_PsAKR, Polaromonas Sp	NA|409aa|up_7|NC_021658.1_14318234_14319461_+	pfam00150, Cellulase, Cellulase (glycosyl hydrolase family 5)	NA|195aa|up_6|NC_021658.1_14319542_14320127_-	PRK00517, prmA, 50S ribosomal protein L11 methyltransferase	NA|224aa|up_5|NC_021658.1_14320170_14320842_-	pfam14124, DUF4291, Domain of unknown function (DUF4291)	NA|123aa|up_4|NC_021658.1_14321166_14321535_+	NA	NA|441aa|up_3|NC_021658.1_14321763_14323086_+	cd07209, Pat_hypo_Ecoli_Z1214_like, Hypothetical patatin similar to Z1214 protein of Escherichia coli	NA|229aa|up_2|NC_021658.1_14323547_14324234_+	NA	NA|442aa|up_1|NC_021658.1_14324261_14325587_+	cd00190, Tryp_SPc, Trypsin-like serine protease; Many of these are synthesized as inactive precursor zymogens that are cleaved during limited proteolysis to generate their active forms	NA|310aa|up_0|NC_021658.1_14325597_14326527_+	cd03392, PAP2_like_2, PAP2_like_2 proteins	NA|70aa|down_0|NC_021658.1_14326740_14326950_+	TIGR00638, Probable_molybdenum-pterin-binding_protein, molybdenum-pterin binding domain	NA|507aa|down_1|NC_021658.1_14326992_14328513_-	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|1309aa|down_2|NC_021658.1_14329090_14333017_+	TIGR02148, ORFveg106_random, fibro-slime domain	NA|635aa|down_3|NC_021658.1_14333062_14334967_-	COG5000, NtrY, Signal transduction histidine kinase involved in nitrogen fixation and metabolism regulation [Signal transduction mechanisms]	NA|670aa|down_4|NC_021658.1_14335223_14337233_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|344aa|down_5|NC_021658.1_14337267_14338299_+	cd00060, FHA, Forkhead associated domain (FHA); found in eukaryotic and prokaryotic proteins	NA|155aa|down_6|NC_021658.1_14338354_14338819_+	cd02232, cupin_ARD, acireductone dioxygenase (ARD), cupin domain	NA|123aa|down_7|NC_021658.1_14338833_14339202_+	cd02214, cupin_MJ1618, Methanocaldococcus jannaschii MJ1618 and related proteins, cupin domain	NA|388aa|down_8|NC_021658.1_14339456_14340620_+	smart00903, Flavin_Reduct, Flavin reductase like domain	NA|304aa|down_9|NC_021658.1_14340671_14341583_-	PRK08645, PRK08645, bifunctional homocysteine S-methyltransferase/5,10-methylenetetrahydrofolate reductase protein; Reviewed
GCF_000418325.1_ASM41832v1	NC_021658	Sorangium cellulosum So0157-2, complete sequence	65	14564502-14564596	57	CRISPRCasFinder	no		cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	Orphan	GCGGCGTGCGATGATCGGCGCGC	23	0	0	NA	NA	NA	1	1	Orphan	cas8u1,cas3,csb2gr5,csb1gr7,cas1,cas2,csa3,RT,DEDDh,WYL,DinG,PD-DExK,cas6	NA|110aa|up_5|NC_021658.1_14556578_14556908_+,NA|412aa|up_3|NC_021658.1_14559276_14560512_-,NA	NA|337aa|up_9|NC_021658.1_14550695_14551706_+	pfam01590, GAF, GAF domain	NA|902aa|up_8|NC_021658.1_14551750_14554456_+	TIGR03361, VI_Rhs_Vgr, type VI secretion system Vgr family protein	NA|145aa|up_7|NC_021658.1_14554519_14554954_+	pfam08786, DcrB, DcrB	NA|533aa|up_6|NC_021658.1_14554968_14556567_+	cd14742, PAAR_RHS, proline-alanine-alanine-arginine (PAAR) domain, also containing C-terminal Rearrangement hotspot (Rhs) extensions	NA|110aa|up_5|NC_021658.1_14556578_14556908_+	NA	NA|767aa|up_4|NC_021658.1_14556935_14559236_-	pfam09937, DUF2169, Uncharacterized protein conserved in bacteria (DUF2169)	NA|412aa|up_3|NC_021658.1_14559276_14560512_-	NA	NA|451aa|up_2|NC_021658.1_14560569_14561922_+	TIGR03329, Phn_aa_oxid, putative aminophosphonate oxidoreductase	NA|362aa|up_1|NC_021658.1_14561984_14563070_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|448aa|up_0|NC_021658.1_14563124_14564468_+	PLN02569, PLN02569, threonine synthase	NA|644aa|down_0|NC_021658.1_14564633_14566565_+	COG4191, COG4191, Signal transduction histidine kinase regulating C4-dicarboxylate transport system [Signal transduction mechanisms]	NA|615aa|down_1|NC_021658.1_14566607_14568452_-	cd07041, STAS_RsbR_RsbS_like, Sulphate Transporter and Anti-Sigma factor antagonist domain of the "stressosome" complex proteins RsbS and RsbR, regulators of the bacterial stress activated alternative sigma factor sigma-B by phosphorylation	NA|433aa|down_2|NC_021658.1_14568544_14569843_-	TIGR04411, hypothetical_protein, type II secretion system protein N, Leptospira/Geobacter-type	NA|201aa|down_3|NC_021658.1_14569839_14570442_-	pfam04612, T2SSM, Type II secretion system (T2SS), protein M	NA|505aa|down_4|NC_021658.1_14570438_14571953_-	COG4972, PilM, Tfp pilus assembly protein, ATPase PilM [Cell motility and secretion / Intracellular trafficking and secretion]	NA|501aa|down_5|NC_021658.1_14571980_14573483_-	pfam03934, T2SSK, Type II secretion system (T2SS), protein K	NA|240aa|down_6|NC_021658.1_14573486_14574206_-	COG4795, PulJ, Type II secretory pathway, component PulJ [Intracellular trafficking and secretion]	NA|226aa|down_7|NC_021658.1_14574202_14574880_-	COG2165, PulG, Type II secretory pathway, pseudopilin PulG [Cell motility and secretion / Intracellular trafficking and secretion]	NA|234aa|down_8|NC_021658.1_14574879_14575581_-	COG4970, FimT, Tfp pilus assembly protein FimT [Cell motility and secretion / Intracellular trafficking and secretion]	NA|135aa|down_9|NC_021658.1_14575603_14576008_-	TIGR01710, Type_II_secretion_system_protein_G, type II secretion system protein G
