assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	1	179434-179508	1	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	ATACTGTAACTCCTCCTGTCTTAG	24	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|309aa|up_3|NZ_AP018255.1_172846_173773_-,NA|271aa|down_5|NZ_AP018255.1_187765_188578_-,NA|243aa|down_6|NZ_AP018255.1_188612_189341_-	NA|404aa|up_9|NZ_AP018255.1_164741_165953_+	pfam07995, GSDH, Glucose / Sorbosone dehydrogenase	NA|302aa|up_8|NZ_AP018255.1_165961_166867_+	PRK05184, PRK05184, pyrroloquinoline quinone biosynthesis protein PqqB; Provisional	NA|238aa|up_7|NZ_AP018255.1_166964_167678_+	PRK05157, PRK05157, pyrroloquinoline quinone biosynthesis protein PqqC; Provisional	NA|94aa|up_6|NZ_AP018255.1_167954_168236_+	TIGR03859, PQQ_PqqD, coenzyme PQQ biosynthesis protein PqqD	NA|366aa|up_5|NZ_AP018255.1_168329_169427_+	PRK05301, PRK05301, pyrroloquinoline quinone biosynthesis protein PqqE; Provisional	NA|1021aa|up_4|NZ_AP018255.1_169667_172730_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|309aa|up_3|NZ_AP018255.1_172846_173773_-	NA	NA|524aa|up_2|NZ_AP018255.1_173827_175399_-	TIGR00711, Uncharacterized_MFS-type_transporter_YhcA, drug resistance transporter, EmrB/QacA subfamily	NA|154aa|up_1|NZ_AP018255.1_175474_175936_+	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|563aa|up_0|NZ_AP018255.1_176504_178193_+	COG2831, FhaC, Hemolysin activation/secretion protein [Intracellular trafficking and secretion]	NA|237aa|down_0|NZ_AP018255.1_182643_183354_-	sd00006, TPR, Tetratricopeptide repeat	NA|351aa|down_1|NZ_AP018255.1_183628_184681_-	cd00707, Pancreat_lipase_like, Pancreatic lipase-like enzymes	NA|463aa|down_2|NZ_AP018255.1_184929_186318_+	pfam05685, Uma2, Putative restriction endonuclease	NA|234aa|down_3|NZ_AP018255.1_186419_187121_+	pfam13646, HEAT_2, HEAT repeats	NA|195aa|down_4|NZ_AP018255.1_187149_187734_-	pfam09346, SMI1_KNR4, SMI1 / KNR4 family (SUKH-1)	NA|271aa|down_5|NZ_AP018255.1_187765_188578_-	NA	NA|243aa|down_6|NZ_AP018255.1_188612_189341_-	NA	NA|134aa|down_7|NZ_AP018255.1_190539_190941_-	pfam13826, DUF4188, Domain of unknown function (DUF4188)	NA|768aa|down_8|NZ_AP018255.1_191343_193647_-	cd06160, S2P-M50_like_2, Uncharacterized homologs of Site-2 protease (S2P), zinc metalloproteases (MEROPS family M50) which cleave transmembrane domains of substrate proteins, regulating intramembrane proteolysis (RIP) of diverse signal transduction mechanisms	NA|223aa|down_9|NZ_AP018255.1_194104_194773_-	COG4340, COG4340, Uncharacterized protein conserved in bacteria [Function unknown]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	2	378345-378423	2	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	ATAATTTCACTTTATCCGCGACAAAT	26	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|134aa|up_0|NZ_AP018255.1_376396_376798_-,NA|83aa|down_6|NZ_AP018255.1_386022_386271_+	NA|301aa|up_9|NZ_AP018255.1_366998_367901_-	pfam00395, SLH, S-layer homology domain	NA|339aa|up_8|NZ_AP018255.1_368205_369222_+	COG0628, yhhT, Predicted permease, member of the PurR regulon [General function prediction only]	NA|186aa|up_7|NZ_AP018255.1_369708_370266_-	COG3247, HdeD, Uncharacterized conserved protein [Function unknown]	NA|254aa|up_6|NZ_AP018255.1_370301_371063_-	PRK12829, PRK12829, short chain dehydrogenase; Provisional	NA|451aa|up_5|NZ_AP018255.1_371088_372441_-	pfam00067, p450, Cytochrome P450	NA|193aa|up_4|NZ_AP018255.1_372476_373055_-	pfam03358, FMN_red, NADPH-dependent FMN reductase	NA|304aa|up_3|NZ_AP018255.1_373142_374054_-	COG3861, COG3861, Uncharacterized protein conserved in bacteria [Function unknown]	NA|190aa|up_2|NZ_AP018255.1_374446_375016_+	pfam12263, DUF3611, Protein of unknown function (DUF3611)	NA|341aa|up_1|NZ_AP018255.1_375039_376062_+	COG0628, yhhT, Predicted permease, member of the PurR regulon [General function prediction only]	NA|134aa|up_0|NZ_AP018255.1_376396_376798_-	NA	NA|160aa|down_0|NZ_AP018255.1_378758_379238_+	COG5637, COG5637, Predicted integral membrane protein [Function unknown]	NA|390aa|down_1|NZ_AP018255.1_379243_380413_+	cd08283, FDH_like_1, Glutathione-dependent formaldehyde dehydrogenase related proteins, child 1	NA|393aa|down_2|NZ_AP018255.1_380533_381712_+	cd08283, FDH_like_1, Glutathione-dependent formaldehyde dehydrogenase related proteins, child 1	NA|188aa|down_3|NZ_AP018255.1_381765_382329_+	cd03134, GATase1_PfpI_like, A type 1 glutamine amidotransferase (GATase1)-like domain found in PfpI from Pyrococcus furiosus	NA|280aa|down_4|NZ_AP018255.1_382359_383199_+	cd19138, AKR_YeaE, Escherichia coli YeaE and similar proteins	NA|301aa|down_5|NZ_AP018255.1_385070_385973_+	cd07385, MPP_YkuE_C, Bacillus subtilis YkuE and related proteins, C-terminal metallophosphatase domain	NA|83aa|down_6|NZ_AP018255.1_386022_386271_+	NA	NA|129aa|down_7|NZ_AP018255.1_386334_386721_+	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|274aa|down_8|NZ_AP018255.1_386772_387594_+	cd07363, 45_DOPA_Dioxygenase, The Class III extradiol dioxygenase, 4,5-DOPA Dioxygenase, catalyzes the incorporation of both atoms of molecular oxygen into 4,5-dihydroxy-phenylalanine	NA|1213aa|down_9|NZ_AP018255.1_388545_392184_+	COG4449, COG4449, Predicted protease of the Abi (CAAX) family [General function prediction only]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	3	785979-786109	3	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	ATTACAATCAATCAAAGTAACGAGAAATTAAACTGCTT	38	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|106aa|up_5|NZ_AP018255.1_777279_777597_-,NA|64aa|down_1|NZ_AP018255.1_790506_790698_+,NA|71aa|down_4|NZ_AP018255.1_792873_793086_-,NA|69aa|down_5|NZ_AP018255.1_793082_793289_-,NA|61aa|down_8|NZ_AP018255.1_794249_794432_-,NA|137aa|down_9|NZ_AP018255.1_795554_795965_-	NA|122aa|up_9|NZ_AP018255.1_774032_774398_-	smart00823, PKS_PP, Phosphopantetheine attachment site	NA|191aa|up_8|NZ_AP018255.1_774544_775117_-	PRK00889, PRK00889, adenylylsulfate kinase; Provisional	NA|230aa|up_7|NZ_AP018255.1_775268_775958_-	cd03023, DsbA_Com1_like, DsbA family, Com1-like subfamily; composed of proteins similar to Com1, a 27-kDa outer membrane-associated immunoreactive protein originally found in both acute and chronic disease strains of the pathogenic bacteria Coxiella burnetti	NA|85aa|up_6|NZ_AP018255.1_776258_776513_-	pfam12151, MVL, Mannan-binding protein	NA|106aa|up_5|NZ_AP018255.1_777279_777597_-	NA	NA|85aa|up_4|NZ_AP018255.1_778459_778714_-	pfam12151, MVL, Mannan-binding protein	NA|171aa|up_3|NZ_AP018255.1_779533_780046_-	COG2207, AraC, AraC-type DNA-binding domain-containing proteins [Transcription]	NA|573aa|up_2|NZ_AP018255.1_780660_782379_-	cd09912, DLP_2, Dynamin-like protein including dynamins, mitofusins, and guanylate-binding proteins	NA|411aa|up_1|NZ_AP018255.1_782777_784010_-	COG0265, DegQ, Trypsin-like serine proteases, typically periplasmic, contain C-terminal PDZ domain [Posttranslational modification, protein turnover, chaperones]	NA|429aa|up_0|NZ_AP018255.1_784545_785832_-	pfam14516, AAA_35, AAA-like domain	NA|1228aa|down_0|NZ_AP018255.1_786153_789837_+	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|64aa|down_1|NZ_AP018255.1_790506_790698_+	NA	NA|170aa|down_2|NZ_AP018255.1_790993_791503_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|199aa|down_3|NZ_AP018255.1_792246_792843_+	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|71aa|down_4|NZ_AP018255.1_792873_793086_-	NA	NA|69aa|down_5|NZ_AP018255.1_793082_793289_-	NA	NA|138aa|down_6|NZ_AP018255.1_793476_793890_+	pfam08814, XisH, XisH protein	NA|112aa|down_7|NZ_AP018255.1_793877_794213_+	cd16382, XisI-like, XisI is FdxN element excision controlling factor protein	NA|61aa|down_8|NZ_AP018255.1_794249_794432_-	NA	NA|137aa|down_9|NZ_AP018255.1_795554_795965_-	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	4	1797091-1797170	4	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	ATTGTCGGTTGAGGAGTAGGTTCCGG	26	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA,NA|243aa|down_4|NZ_AP018255.1_1801945_1802674_-,NA|482aa|down_7|NZ_AP018255.1_1806720_1808166_-,NA|66aa|down_8|NZ_AP018255.1_1808202_1808400_-	NA|469aa|up_9|NZ_AP018255.1_1785136_1786543_-	pfam04932, Wzy_C, O-Antigen ligase	NA|674aa|up_8|NZ_AP018255.1_1786557_1788579_-	cd05387, BY-kinase, bacterial tyrosine-kinase	NA|166aa|up_7|NZ_AP018255.1_1788653_1789151_-	COG5017, COG5017, Uncharacterized conserved protein [Function unknown]	NA|149aa|up_6|NZ_AP018255.1_1789198_1789645_-	pfam08660, Alg14, Oligosaccharide biosynthesis protein Alg14 like	NA|256aa|up_5|NZ_AP018255.1_1790691_1791459_+	pfam13489, Methyltransf_23, Methyltransferase domain	NA|353aa|up_4|NZ_AP018255.1_1791458_1792517_+	cd10918, CE4_NodB_like_5s_6s, Putative catalytic NodB homology domain of PgaB, IcaB, and similar proteins which consist of a deformed (beta/alpha)8 barrel fold with 5- or 6-strands	NA|310aa|up_3|NZ_AP018255.1_1792574_1793504_+	pfam00535, Glycos_transf_2, Glycosyl transferase family 2	NA|365aa|up_2|NZ_AP018255.1_1793524_1794619_+	cd04195, GT2_AmsE_like, GT2_AmsE_like is involved in exopolysaccharide amylovora biosynthesis	NA|310aa|up_1|NZ_AP018255.1_1794698_1795628_+	cd00761, Glyco_tranf_GTA_type, Glycosyltransferase family A (GT-A) includes diverse families of glycosyl transferases with a common GT-A type structural fold	NA|338aa|up_0|NZ_AP018255.1_1795667_1796681_+	cd05256, UDP_AE_SDR_e, UDP-N-acetylglucosamine 4-epimerase, extended (e) SDRs	NA|301aa|down_0|NZ_AP018255.1_1797669_1798572_+	cd07378, MPP_ACP5, Homo sapiens acid phosphatase 5 and related proteins, metallophosphatase domain	NA|398aa|down_1|NZ_AP018255.1_1798660_1799854_-	pfam07787, TMEM43, Transmembrane protein 43	NA|149aa|down_2|NZ_AP018255.1_1800038_1800485_+	COG4446, COG4446, Uncharacterized protein conserved in bacteria [Function unknown]	NA|313aa|down_3|NZ_AP018255.1_1800770_1801709_+	pfam07602, DUF1565, Protein of unknown function (DUF1565)	NA|243aa|down_4|NZ_AP018255.1_1801945_1802674_-	NA	NA|800aa|down_5|NZ_AP018255.1_1802666_1805066_-	pfam12770, CHAT, CHAT domain	NA|444aa|down_6|NZ_AP018255.1_1805191_1806523_-	pfam08852, DUF1822, Protein of unknown function (DUF1822)	NA|482aa|down_7|NZ_AP018255.1_1806720_1808166_-	NA	NA|66aa|down_8|NZ_AP018255.1_1808202_1808400_-	NA	NA|246aa|down_9|NZ_AP018255.1_1808390_1809128_-	cd03295, ABC_OpuCA_Osmoprotection, ATP-binding cassette domain of the osmoprotectant transporter
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	5	1951606-1951697	5	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	ACTAGCTTCGTTTGAAATCGTTA	23	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|112aa|up_7|NZ_AP018255.1_1943181_1943517_+,NA|117aa|up_6|NZ_AP018255.1_1943516_1943867_+,NA|64aa|up_5|NZ_AP018255.1_1943899_1944091_+,NA|70aa|down_1|NZ_AP018255.1_1952103_1952313_+,NA|111aa|down_2|NZ_AP018255.1_1952302_1952635_+,NA|130aa|down_6|NZ_AP018255.1_1957046_1957436_-,NA|95aa|down_7|NZ_AP018255.1_1957432_1957717_-,NA|139aa|down_9|NZ_AP018255.1_1959775_1960192_+	NA|691aa|up_9|NZ_AP018255.1_1940364_1942437_+	TIGR03185, DNA_S_dndD, DNA sulfur modification protein DndD	NA|158aa|up_8|NZ_AP018255.1_1942579_1943053_+	TIGR04062, hypothetical_protein_CY0110_29519, dnd system-associated protein 4	NA|112aa|up_7|NZ_AP018255.1_1943181_1943517_+	NA	NA|117aa|up_6|NZ_AP018255.1_1943516_1943867_+	NA	NA|64aa|up_5|NZ_AP018255.1_1943899_1944091_+	NA	NA|321aa|up_4|NZ_AP018255.1_1944160_1945123_+	COG3440, COG3440, Predicted restriction endonuclease [Defense mechanisms]	NA|532aa|up_3|NZ_AP018255.1_1945135_1946731_-	TIGR03187, hypothetical_protein, DGQHR domain	NA|540aa|up_2|NZ_AP018255.1_1946952_1948572_+	PRK06850, PRK06850, hypothetical protein; Provisional	NA|662aa|up_1|NZ_AP018255.1_1948679_1950665_+	TIGR03185, DNA_S_dndD, DNA sulfur modification protein DndD	NA|150aa|up_0|NZ_AP018255.1_1951134_1951584_+	COG3600, GepA, Uncharacterized phage-associated protein [Function unknown]	NA|128aa|down_0|NZ_AP018255.1_1951717_1952101_+	pfam08870, DndE, DNA sulphur modification protein DndE	NA|70aa|down_1|NZ_AP018255.1_1952103_1952313_+	NA	NA|111aa|down_2|NZ_AP018255.1_1952302_1952635_+	NA	NA|448aa|down_3|NZ_AP018255.1_1952795_1954139_-	cd16414, dndB_like, DNA-sulfur modification-associated domain	NA|191aa|down_4|NZ_AP018255.1_1954700_1955273_-	cd06260, DUF820, Domain of unknown function (DUF820)	NA|486aa|down_5|NZ_AP018255.1_1955511_1956969_+	TIGR04096, conserved_hypothetical_protein, DNA phosphorothioation-associated putative methyltransferase	NA|130aa|down_6|NZ_AP018255.1_1957046_1957436_-	NA	NA|95aa|down_7|NZ_AP018255.1_1957432_1957717_-	NA	NA|508aa|down_8|NZ_AP018255.1_1958232_1959756_+	cd17486, MFS_AmpG_like, AmpG and similar transporters of the Major Facilitator Superfamily	NA|139aa|down_9|NZ_AP018255.1_1959775_1960192_+	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	6	2289510-2289610	6	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	GTAAATAATGAAAAATTTAGGTGAACCCGC	30	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|305aa|up_6|NZ_AP018255.1_2280002_2280917_-,NA|163aa|up_2|NZ_AP018255.1_2286659_2287148_-,NA|79aa|down_1|NZ_AP018255.1_2291263_2291500_-,NA|330aa|down_2|NZ_AP018255.1_2291533_2292523_-,NA|99aa|down_6|NZ_AP018255.1_2295808_2296105_-,NA|74aa|down_7|NZ_AP018255.1_2296542_2296764_-	NA|261aa|up_9|NZ_AP018255.1_2276736_2277519_-	COG1127, Ttg2A, ABC-type transport system involved in resistance to organic solvents, ATPase component [Secondary metabolites biosynthesis, transport, and catabolism]	NA|505aa|up_8|NZ_AP018255.1_2277615_2279130_+	TIGR02730, Carotenoid_isomerase, carotene isomerase	NA|202aa|up_7|NZ_AP018255.1_2279241_2279847_-	cd06260, DUF820, Domain of unknown function (DUF820)	NA|305aa|up_6|NZ_AP018255.1_2280002_2280917_-	NA	NA|720aa|up_5|NZ_AP018255.1_2281151_2283311_+	COG0514, RecQ, Superfamily II DNA helicase [DNA replication, recombination, and repair]	NA|180aa|up_4|NZ_AP018255.1_2283286_2283826_+	pfam13673, Acetyltransf_10, Acetyltransferase (GNAT) domain	NA|149aa|up_3|NZ_AP018255.1_2286036_2286483_+	pfam11068, YlqD, YlqD protein	NA|163aa|up_2|NZ_AP018255.1_2286659_2287148_-	NA	NA|434aa|up_1|NZ_AP018255.1_2287386_2288688_+	PRK11856, PRK11856, branched-chain alpha-keto acid dehydrogenase subunit E2; Reviewed	NA|196aa|up_0|NZ_AP018255.1_2288883_2289471_-	pfam13785, DUF4178, Domain of unknown function (DUF4178)	NA|523aa|down_0|NZ_AP018255.1_2289612_2291181_-	PRK03612, PRK03612, polyamine aminopropyltransferase	NA|79aa|down_1|NZ_AP018255.1_2291263_2291500_-	NA	NA|330aa|down_2|NZ_AP018255.1_2291533_2292523_-	NA	NA|109aa|down_3|NZ_AP018255.1_2292920_2293247_+	COG2442, COG2442, Uncharacterized conserved protein [Function unknown]	NA|111aa|down_4|NZ_AP018255.1_2293250_2293583_+	pfam18480, DUF5615, Domain of unknown function (DUF5615)	NA|142aa|down_5|NZ_AP018255.1_2295386_2295812_-	cd09881, PIN_VapC4-5_FitB-like, VapC-like PIN domain of Mycobacterium tuberculosis VapC4 and VapC5, and Neisseria gonorrhoeae FitB and related proteins	NA|99aa|down_6|NZ_AP018255.1_2295808_2296105_-	NA	NA|74aa|down_7|NZ_AP018255.1_2296542_2296764_-	NA	NA|178aa|down_8|NZ_AP018255.1_2297030_2297564_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|191aa|down_9|NZ_AP018255.1_2297585_2298158_+	COG2020, STE14, Putative protein-S-isoprenylcysteine methyltransferase [Posttranslational modification, protein turnover, chaperones]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	7	2521964-2522039	7	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	CTACGCTACGGGAAAACTCCGTTTA	25	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|67aa|up_5|NZ_AP018255.1_2516119_2516320_-,NA|63aa|up_3|NZ_AP018255.1_2517588_2517777_-,NA|96aa|down_5|NZ_AP018255.1_2529999_2530287_+,NA|73aa|down_9|NZ_AP018255.1_2533591_2533810_+	NA|143aa|up_9|NZ_AP018255.1_2513146_2513575_-	cd04688, Nudix_Hydrolase_29, Members of the Nudix hydrolase superfamily catalyze the hydrolysis of NUcleoside DIphosphates linked to other moieties, X	NA|151aa|up_8|NZ_AP018255.1_2513602_2514055_-	pfam12049, DUF3531, Protein of unknown function (DUF3531)	NA|312aa|up_7|NZ_AP018255.1_2514114_2515050_-	TIGR02917, TPR_domain_protein, putative PEP-CTERM system TPR-repeat lipoprotein	NA|225aa|up_6|NZ_AP018255.1_2515371_2516046_+	COG1122, CbiO, ABC-type cobalt transport system, ATPase component [Inorganic ion transport and metabolism]	NA|67aa|up_5|NZ_AP018255.1_2516119_2516320_-	NA	NA|245aa|up_4|NZ_AP018255.1_2516703_2517438_+	PRK02816, PRK02816, phycocyanobilin:ferredoxin oxidoreductase; Validated	NA|63aa|up_3|NZ_AP018255.1_2517588_2517777_-	NA	NA|473aa|up_2|NZ_AP018255.1_2518226_2519645_+	TIGR02971, devB-like_secretion_protein, ABC exporter membrane fusion protein, DevB family	NA|385aa|up_1|NZ_AP018255.1_2519942_2521097_+	TIGR01185, membrane_spanning_subunit, DevC protein	NA|246aa|up_0|NZ_AP018255.1_2521210_2521948_+	TIGR02982, heterocyst_DevA, ABC exporter ATP-binding subunit, DevA family	NA|259aa|down_0|NZ_AP018255.1_2523145_2523922_+	COG0561, Cof, Predicted hydrolases of the HAD superfamily [General function prediction only]	NA|443aa|down_1|NZ_AP018255.1_2523942_2525271_-	COG1253, TlyC, Hemolysins and related proteins containing CBS domains [General function prediction only]	NA|1195aa|down_2|NZ_AP018255.1_2525497_2529082_+	COG1197, Mfd, Transcription-repair coupling factor (superfamily II helicase) [DNA replication, recombination, and repair / Transcription]	NA|54aa|down_3|NZ_AP018255.1_2529387_2529549_-	pfam15919, HicB_lk_antitox, HicB_like antitoxin of bacterial toxin-antitoxin system	NA|68aa|down_4|NZ_AP018255.1_2529703_2529907_+	COG1598, COG1598, Predicted nuclease of the RNAse H fold, HicB family [General    function prediction only]	NA|96aa|down_5|NZ_AP018255.1_2529999_2530287_+	NA	NA|397aa|down_6|NZ_AP018255.1_2530392_2531583_-	COG0654, UbiH, 2-polyprenyl-6-methoxyphenol hydroxylase and related FAD-dependent oxidoreductases [Coenzyme metabolism / Energy production and conversion]	NA|120aa|down_7|NZ_AP018255.1_2532345_2532705_+	pfam06967, Mo-nitro_C, Mo-dependent nitrogenase C-terminus	NA|248aa|down_8|NZ_AP018255.1_2532778_2533522_+	COG1402, COG1402, Uncharacterized protein, putative amidase [General function prediction only]	NA|73aa|down_9|NZ_AP018255.1_2533591_2533810_+	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	8	2638139-2638235	8	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	TGTTCACGAAACCAGTAGTACCAAGTGGCGCC	32	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|309aa|up_5|NZ_AP018255.1_2625271_2626198_-,NA|60aa|down_5|NZ_AP018255.1_2643692_2643872_+	NA|259aa|up_9|NZ_AP018255.1_2620468_2621245_+	pfam01738, DLH, Dienelactone hydrolase family	NA|300aa|up_8|NZ_AP018255.1_2621314_2622214_+	COG0539, RpsA, Ribosomal protein S1 [Translation, ribosomal structure and biogenesis]	NA|301aa|up_7|NZ_AP018255.1_2622869_2623772_-	TIGR04168, Ser/Thr_protein_phosphatase_family_protein, TIGR04168 family protein	NA|325aa|up_6|NZ_AP018255.1_2624017_2624992_+	PRK09375, PRK09375, quinolinate synthase NadA	NA|309aa|up_5|NZ_AP018255.1_2625271_2626198_-	NA	NA|300aa|up_4|NZ_AP018255.1_2632190_2633090_+	PRK09348, glyQ, glycyl-tRNA synthetase subunit alpha; Validated	NA|161aa|up_3|NZ_AP018255.1_2633151_2633634_+	pfam13301, DUF4079, Protein of unknown function (DUF4079)	NA|788aa|up_2|NZ_AP018255.1_2633753_2636117_+	pfam03772, Competence, Competence protein	NA|382aa|up_1|NZ_AP018255.1_2636474_2637620_+	smart00854, PGA_cap, Bacterial capsule synthesis protein PGA_cap	NA|121aa|up_0|NZ_AP018255.1_2637723_2638086_+	pfam16156, DUF4864, Domain of unknown function (DUF4864)	NA|281aa|down_0|NZ_AP018255.1_2638505_2639348_-	COG1606, COG1606, ATP-utilizing enzymes of the PP-loop superfamily [General function prediction only]	NA|589aa|down_1|NZ_AP018255.1_2639385_2641152_-	TIGR02956, sensor_protein_TorS, TMAO reductase sytem sensor TorS	NA|45aa|down_2|NZ_AP018255.1_2641741_2641876_-	pfam08078, PsaX, PsaX family	NA|290aa|down_3|NZ_AP018255.1_2641973_2642843_-	PRK12928, PRK12928, lipoyl synthase; Provisional	NA|196aa|down_4|NZ_AP018255.1_2643032_2643620_+	cd00156, REC, phosphoacceptor receiver (REC) domain of response regulators (RRs) and pseudo response regulators (PRRs)	NA|60aa|down_5|NZ_AP018255.1_2643692_2643872_+	NA	NA|1876aa|down_6|NZ_AP018255.1_2643883_2649511_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|362aa|down_7|NZ_AP018255.1_2649775_2650861_-	pfam00891, Methyltransf_2, O-methyltransferase	NA|291aa|down_8|NZ_AP018255.1_2650934_2651807_-	COG0657, Aes, Esterase/lipase [Lipid metabolism]	NA|501aa|down_9|NZ_AP018255.1_2651793_2653296_-	pfam00743, FMO-like, Flavin-binding monooxygenase-like
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	9	3433638-3433743	9	CRISPRCasFinder	no	PD-DExK	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	TAGTAAAGTTTCCAAACCGGGAGTACAA	28	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|90aa|up_9|NZ_AP018255.1_3421027_3421297_+,NA|260aa|up_5|NZ_AP018255.1_3425033_3425813_-,NA|78aa|up_1|NZ_AP018255.1_3429088_3429322_-,NA|142aa|down_1|NZ_AP018255.1_3435210_3435636_-,PD-DExK|209aa|down_8|NZ_AP018255.1_3445997_3446624_+,NA|131aa|down_9|NZ_AP018255.1_3447008_3447401_+	NA|90aa|up_9|NZ_AP018255.1_3421027_3421297_+	NA	NA|430aa|up_8|NZ_AP018255.1_3421616_3422906_+	PRK02862, glgC, glucose-1-phosphate adenylyltransferase; Provisional	NA|335aa|up_7|NZ_AP018255.1_3423206_3424211_+	PRK14299, PRK14299, chaperone protein DnaJ; Provisional	NA|237aa|up_6|NZ_AP018255.1_3424348_3425059_-	pfam01816, LRV, Leucine rich repeat variant	NA|260aa|up_5|NZ_AP018255.1_3425033_3425813_-	NA	NA|271aa|up_4|NZ_AP018255.1_3426164_3426977_-	cd14852, LD-carboxypeptidase, L,D-carboxypeptidase DacB and LdcB, and related proteins	NA|307aa|up_3|NZ_AP018255.1_3427093_3428014_+	COG0679, COG0679, Predicted permeases [General function prediction only]	NA|141aa|up_2|NZ_AP018255.1_3428290_3428713_+	PRK02770, PRK02770, adenosylmethionine decarboxylase	NA|78aa|up_1|NZ_AP018255.1_3429088_3429322_-	NA	NA|419aa|up_0|NZ_AP018255.1_3430453_3431710_+	cd03398, PAP2_haloperoxidase, PAP2, haloperoxidase_like subfamily	NA|172aa|down_0|NZ_AP018255.1_3434241_3434757_+	pfam01471, PG_binding_1, Putative peptidoglycan binding domain	NA|142aa|down_1|NZ_AP018255.1_3435210_3435636_-	NA	NA|274aa|down_2|NZ_AP018255.1_3436683_3437505_-	COG3315, COG3315, O-Methyltransferase involved in polyketide biosynthesis [Secondary metabolites biosynthesis, transport, and catabolism]	NA|491aa|down_3|NZ_AP018255.1_3437497_3438970_-	COG3670, COG3670, Lignostilbene-alpha,beta-dioxygenase and related enzymes [Secondary metabolites biosynthesis, transport, and catabolism]	NA|496aa|down_4|NZ_AP018255.1_3439076_3440564_+	TIGR02734, Phytoene_desaturase_lycopene-forming, phytoene desaturase	NA|463aa|down_5|NZ_AP018255.1_3440591_3441980_+	cd07136, ALDH_YwdH-P39616, Bacillus subtilis aldehyde dehydrogenase ywdH-like	NA|346aa|down_6|NZ_AP018255.1_3442183_3443221_-	cd05288, PGDH, Prostaglandin dehydrogenases	NA|140aa|down_7|NZ_AP018255.1_3443340_3443760_-	pfam01797, Y1_Tnp, Transposase IS200 like	PD-DExK|209aa|down_8|NZ_AP018255.1_3445997_3446624_+	NA	NA|131aa|down_9|NZ_AP018255.1_3447008_3447401_+	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	10	3563535-3563640	10	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	GAACGAGTACTACTGGTTAACTCAAC	26	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|74aa|up_7|NZ_AP018255.1_3555512_3555734_-,NA|158aa|up_3|NZ_AP018255.1_3560616_3561090_+,NA|165aa|down_0|NZ_AP018255.1_3564245_3564740_-,NA|148aa|down_3|NZ_AP018255.1_3565927_3566371_-,NA|76aa|down_6|NZ_AP018255.1_3568955_3569183_+,NA|273aa|down_9|NZ_AP018255.1_3571912_3572731_-	NA|167aa|up_9|NZ_AP018255.1_3552265_3552766_-	cd00060, FHA, Forkhead associated domain (FHA); found in eukaryotic and prokaryotic proteins	NA|800aa|up_8|NZ_AP018255.1_3553003_3555403_-	cd02094, P-type_ATPase_Cu-like, P-type heavy metal-transporting ATPase, similar to human copper-transporting ATPases, ATP7A and ATP7B	NA|74aa|up_7|NZ_AP018255.1_3555512_3555734_-	NA	NA|92aa|up_6|NZ_AP018255.1_3555825_3556101_-	COG2314, XynA, Predicted membrane protein [Function unknown]	NA|519aa|up_5|NZ_AP018255.1_3557072_3558629_-	COG1266, COG1266, Predicted metal-dependent membrane protease [General function prediction only]	NA|588aa|up_4|NZ_AP018255.1_3558799_3560563_+	cd11646, Precorrin_3B_C17_MT, Precorrin-3B C(17)-methyltransferase (also named CobJ or CbiH)	NA|158aa|up_3|NZ_AP018255.1_3560616_3561090_+	NA	NA|237aa|up_2|NZ_AP018255.1_3561165_3561876_+	COG2249, MdaB, Putative NADPH-quinone reductase (modulator of drug activity B) [General function prediction only]	NA|213aa|up_1|NZ_AP018255.1_3561902_3562541_+	PRK00698, tmk, thymidylate kinase; Validated	NA|316aa|up_0|NZ_AP018255.1_3562537_3563485_+	PRK07399, PRK07399, DNA polymerase III subunit delta'; Validated	NA|165aa|down_0|NZ_AP018255.1_3564245_3564740_-	NA	NA|185aa|down_1|NZ_AP018255.1_3564847_3565402_-	cd03017, PRX_BCP, Peroxiredoxin (PRX) family, Bacterioferritin comigratory protein (BCP) subfamily; composed of  thioredoxin-dependent thiol peroxidases, widely expressed in pathogenic bacteria, that protect cells against toxicity from reactive oxygen species by reducing and detoxifying hydroperoxides	NA|73aa|down_2|NZ_AP018255.1_3565560_3565779_-	pfam11347, DUF3148, Protein of unknown function (DUF3148)	NA|148aa|down_3|NZ_AP018255.1_3565927_3566371_-	NA	NA|399aa|down_4|NZ_AP018255.1_3566851_3568048_+	COG4585, COG4585, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|241aa|down_5|NZ_AP018255.1_3568129_3568852_+	pfam05721, PhyH, Phytanoyl-CoA dioxygenase (PhyH)	NA|76aa|down_6|NZ_AP018255.1_3568955_3569183_+	NA	NA|339aa|down_7|NZ_AP018255.1_3569226_3570243_-	COG1294, AppB, Cytochrome bd-type quinol oxidase, subunit 2 [Energy production and conversion]	NA|480aa|down_8|NZ_AP018255.1_3570343_3571783_-	pfam01654, Cyt_bd_oxida_I, Cytochrome bd terminal oxidase subunit I	NA|273aa|down_9|NZ_AP018255.1_3571912_3572731_-	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	11	3676348-3676464	11	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	AGTTGCAAATAATCCTGGTTGAA	23	1	1	3676411-3676441	NZ_AP018255.1_3672830-3672800	NA	2	2	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|217aa|up_8|NZ_AP018255.1_3664042_3664693_-,NA|356aa|up_7|NZ_AP018255.1_3665216_3666283_-,NA|505aa|up_4|NZ_AP018255.1_3669487_3671002_+,NA	NA|343aa|up_9|NZ_AP018255.1_3661665_3662694_+	cd13919, CuRO_HCO_II_like_5, Uncharacterized subfamily with similarity to Heme-copper oxidase subunit II cupredoxin domain	NA|217aa|up_8|NZ_AP018255.1_3664042_3664693_-	NA	NA|356aa|up_7|NZ_AP018255.1_3665216_3666283_-	NA	NA|524aa|up_6|NZ_AP018255.1_3667187_3668759_+	COG0464, SpoVK, ATPases of the AAA+ class [Posttranslational modification, protein turnover, chaperones]	NA|80aa|up_5|NZ_AP018255.1_3668790_3669030_-	pfam13443, HTH_26, Cro/C1-type HTH DNA-binding domain	NA|505aa|up_4|NZ_AP018255.1_3669487_3671002_+	NA	NA|140aa|up_3|NZ_AP018255.1_3671097_3671517_-	cd09881, PIN_VapC4-5_FitB-like, VapC-like PIN domain of Mycobacterium tuberculosis VapC4 and VapC5, and Neisseria gonorrhoeae FitB and related proteins	NA|118aa|up_2|NZ_AP018255.1_3671513_3671867_-	COG1598, COG1598, Predicted nuclease of the RNAse H fold, HicB family [General    function prediction only]	NA|542aa|up_1|NZ_AP018255.1_3673724_3675350_+	pfam00665, rve, Integrase core domain	NA|324aa|up_0|NZ_AP018255.1_3675339_3676311_+	COG3267, ExeA, Type II secretory pathway, component ExeA (predicted ATPase) [Intracellular trafficking and secretion]	NA|394aa|down_0|NZ_AP018255.1_3676507_3677689_-	pfam06468, Spond_N, Spondin_N	NA|369aa|down_1|NZ_AP018255.1_3678030_3679137_-	smart00457, MACPF, membrane-attack complex / perforin	NA|114aa|down_2|NZ_AP018255.1_3679698_3680040_-	cd02949, TRX_NTR, TRX domain, novel NADPH thioredoxin reductase (NTR) family; composed of fusion proteins found only in oxygenic photosynthetic organisms containing both TRX and NTR domains	NA|284aa|down_3|NZ_AP018255.1_3680103_3680955_-	pfam02683, DsbD, Cytochrome C biogenesis protein transmembrane region	NA|186aa|down_4|NZ_AP018255.1_3680985_3681543_-	COG0526, TrxA, Thiol-disulfide isomerase and thioredoxins [Posttranslational modification, protein turnover, chaperones / Energy production and conversion]	NA|640aa|down_5|NZ_AP018255.1_3682013_3683933_+	pfam08548, Peptidase_M10_C, Peptidase M10 serralysin C terminal	NA|201aa|down_6|NZ_AP018255.1_3684846_3685449_+	PRK12519, PRK12519, RNA polymerase sigma factor; Provisional	NA|273aa|down_7|NZ_AP018255.1_3685441_3686260_+	pfam10099, RskA, Anti-sigma-K factor rskA	NA|211aa|down_8|NZ_AP018255.1_3686271_3686904_+	COG5553, COG5553, Predicted metal-dependent enzyme of the double-stranded beta helix superfamily [General function prediction only]	NA|613aa|down_9|NZ_AP018255.1_3686882_3688721_-	COG0745, OmpR, Response regulators consisting of a CheY-like receiver domain and a winged-helix DNA-binding domain [Signal transduction mechanisms / Transcription]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	12	3740258-3740861	1	CRT	no	WYL,cas8b5,cas7,cas5,cas3,cas6,cas4,cas1,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	TTGTTAGTACTGTTTTNGGG	20	6	34	3740367-3740392|3740457-3740482|3740547-3740572|3740547-3740572|3740547-3740572|3740547-3740572|3740547-3740572|3740547-3740572|3740547-3740572|3740547-3740572|3740637-3740662|3740637-3740662|3740637-3740662|3740637-3740662|3740637-3740662|3740637-3740662|3740637-3740662|3740637-3740662|3740727-3740752|3740727-3740752|3740727-3740752|3740727-3740752|3740727-3740752|3740727-3740752|3740727-3740752|3740727-3740752|3740817-3740842|3740817-3740842|3740817-3740842|3740817-3740842|3740817-3740842|3740817-3740842|3740817-3740842|3740817-3740842	NZ_AP018255.1_3740861-3740886|NZ_AP018255.1_5016321-5016346|NZ_AP018255.1_6208239-6208214|NZ_AP018255.1_6392721-6392696|NZ_AP018255.1_10097268-10097243|NZ_AP018255.1_2973132-2973157|NZ_AP018255.1_4230681-4230706|NZ_AP018255.1_5016322-5016347|NZ_AP018255.1_6795392-6795417|NZ_AP018255.1_10086194-10086219|NZ_AP018255.1_6208239-6208214|NZ_AP018255.1_6392721-6392696|NZ_AP018255.1_10097268-10097243|NZ_AP018255.1_2973132-2973157|NZ_AP018255.1_4230681-4230706|NZ_AP018255.1_5016322-5016347|NZ_AP018255.1_6795392-6795417|NZ_AP018255.1_10086194-10086219|NZ_AP018255.1_6208239-6208214|NZ_AP018255.1_6392721-6392696|NZ_AP018255.1_10097268-10097243|NZ_AP018255.1_2973132-2973157|NZ_AP018255.1_4230681-4230706|NZ_AP018255.1_5016322-5016347|NZ_AP018255.1_6795392-6795417|NZ_AP018255.1_10086194-10086219|NZ_AP018255.1_6208239-6208214|NZ_AP018255.1_6392721-6392696|NZ_AP018255.1_10097268-10097243|NZ_AP018255.1_2973132-2973157|NZ_AP018255.1_4230681-4230706|NZ_AP018255.1_5016322-5016347|NZ_AP018255.1_6795392-6795417|NZ_AP018255.1_10086194-10086219	NA	13	13	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA,cas8b5|827aa|down_5|NZ_AP018255.1_3750473_3752954_+,cas7|298aa|down_6|NZ_AP018255.1_3752956_3753850_+,cas5|276aa|down_7|NZ_AP018255.1_3753884_3754712_+	NA|201aa|up_9|NZ_AP018255.1_3732569_3733172_-	cd04630, CBS_pair_bac, Two tandem repeats of the cystathionine beta-synthase (CBS pair) domains present in bacteria	NA|420aa|up_8|NZ_AP018255.1_3734252_3735512_+	cd08199, EEVS, 2-epi-5-epi-valiolone synthase (EEVS)	NA|313aa|up_7|NZ_AP018255.1_3735562_3736501_-	PRK04375, PRK04375, protoheme IX farnesyltransferase; Provisional	NA|100aa|up_6|NZ_AP018255.1_3737052_3737352_-	CHL00134, petF, ferredoxin; Validated	NA|125aa|up_5|NZ_AP018255.1_3737470_3737845_-	TIGR00049, Uncharacterized_protein_in_nifU_5'region, Iron-sulfur cluster assembly accessory protein	NA|268aa|up_4|NZ_AP018255.1_3737926_3738730_-	cd00757, ThiF_MoeB_HesA_family, ThiF_MoeB_HesA	NA|106aa|up_3|NZ_AP018255.1_3738740_3739058_-	PRK14102, nifW, nitrogenase-stabilizing/protective protein NifW	NA|72aa|up_2|NZ_AP018255.1_3739054_3739270_-	pfam05082, Rop-like, Rop-like	NA|159aa|up_1|NZ_AP018255.1_3739316_3739793_-	pfam03270, DUF269, Protein of unknown function, DUF269	NA|138aa|up_0|NZ_AP018255.1_3739789_3740203_-	TIGR02663, Protein_NifX, nitrogen fixation protein NifX	NA|440aa|down_0|NZ_AP018255.1_3740902_3742222_-	PRK14476, PRK14476, nitrogenase molybdenum-cofactor biosynthesis protein NifN; Provisional	NA|478aa|down_1|NZ_AP018255.1_3742397_3743831_-	PRK14477, PRK14477, bifunctional nitrogenase molybdenum-cofactor biosynthesis protein NifE/NifN; Provisional	NA|517aa|down_2|NZ_AP018255.1_3744500_3746051_+	smart00857, Resolvase, Resolvase, N terminal domain	NA|79aa|down_3|NZ_AP018255.1_3746310_3746547_+	COG2442, COG2442, Uncharacterized conserved protein [Function unknown]	WYL|287aa|down_4|NZ_AP018255.1_3749401_3750262_-	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	cas8b5|827aa|down_5|NZ_AP018255.1_3750473_3752954_+	NA	cas7|298aa|down_6|NZ_AP018255.1_3752956_3753850_+	NA	cas5|276aa|down_7|NZ_AP018255.1_3753884_3754712_+	NA	cas3|900aa|down_8|NZ_AP018255.1_3754704_3757404_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas6|281aa|down_9|NZ_AP018255.1_3757460_3758303_+	COG5551, COG5551, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	13	3742230-3742315	12	CRISPRCasFinder	no	WYL,cas8b5,cas7,cas5,cas3,cas6,cas4,cas1,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	ATTAGGAGTGATGAGTGCTGAGT	23	0	0	NA	NA	NA	1	1	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|99aa|up_1|NZ_AP018255.1_3740202_3740499_+,cas8b5|827aa|down_4|NZ_AP018255.1_3750473_3752954_+,cas7|298aa|down_5|NZ_AP018255.1_3752956_3753850_+,cas5|276aa|down_6|NZ_AP018255.1_3753884_3754712_+	NA|313aa|up_9|NZ_AP018255.1_3735562_3736501_-	PRK04375, PRK04375, protoheme IX farnesyltransferase; Provisional	NA|100aa|up_8|NZ_AP018255.1_3737052_3737352_-	CHL00134, petF, ferredoxin; Validated	NA|125aa|up_7|NZ_AP018255.1_3737470_3737845_-	TIGR00049, Uncharacterized_protein_in_nifU_5'region, Iron-sulfur cluster assembly accessory protein	NA|268aa|up_6|NZ_AP018255.1_3737926_3738730_-	cd00757, ThiF_MoeB_HesA_family, ThiF_MoeB_HesA	NA|106aa|up_5|NZ_AP018255.1_3738740_3739058_-	PRK14102, nifW, nitrogenase-stabilizing/protective protein NifW	NA|72aa|up_4|NZ_AP018255.1_3739054_3739270_-	pfam05082, Rop-like, Rop-like	NA|159aa|up_3|NZ_AP018255.1_3739316_3739793_-	pfam03270, DUF269, Protein of unknown function, DUF269	NA|138aa|up_2|NZ_AP018255.1_3739789_3740203_-	TIGR02663, Protein_NifX, nitrogen fixation protein NifX	NA|99aa|up_1|NZ_AP018255.1_3740202_3740499_+	NA	NA|440aa|up_0|NZ_AP018255.1_3740902_3742222_-	PRK14476, PRK14476, nitrogenase molybdenum-cofactor biosynthesis protein NifN; Provisional	NA|478aa|down_0|NZ_AP018255.1_3742397_3743831_-	PRK14477, PRK14477, bifunctional nitrogenase molybdenum-cofactor biosynthesis protein NifE/NifN; Provisional	NA|517aa|down_1|NZ_AP018255.1_3744500_3746051_+	smart00857, Resolvase, Resolvase, N terminal domain	NA|79aa|down_2|NZ_AP018255.1_3746310_3746547_+	COG2442, COG2442, Uncharacterized conserved protein [Function unknown]	WYL|287aa|down_3|NZ_AP018255.1_3749401_3750262_-	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	cas8b5|827aa|down_4|NZ_AP018255.1_3750473_3752954_+	NA	cas7|298aa|down_5|NZ_AP018255.1_3752956_3753850_+	NA	cas5|276aa|down_6|NZ_AP018255.1_3753884_3754712_+	NA	cas3|900aa|down_7|NZ_AP018255.1_3754704_3757404_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas6|281aa|down_8|NZ_AP018255.1_3757460_3758303_+	COG5551, COG5551, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	cas4|195aa|down_9|NZ_AP018255.1_3758351_3758936_+	cd09637, Cas4_I-A_I-B_I-C_I-D_II-B, CRISPR/Cas system-associated protein Cas4
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	14	3747151-3748842	1,13,2	PILER-CR,CRISPRCasFinder,CRT	no	WYL,cas8b5,cas7,cas5,cas3,cas6,cas4,cas1,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	ATTGCAATTTAAAATAATCCCTAACAGGGA----------TTGAAAC,ATTGCAATTTAAAATAATCCCTAACAGGGATTGAAAC,ATTGCAATTTAAAATAATCCCTAACAGGGATTGAAAC	47,37,37	0	0	NA	NA	NA:I-D,II-B:I-D,II-B	22,23,23	23	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|99aa|up_4|NZ_AP018255.1_3740202_3740499_+,cas8b5|827aa|down_1|NZ_AP018255.1_3750473_3752954_+,cas7|298aa|down_2|NZ_AP018255.1_3752956_3753850_+,cas5|276aa|down_3|NZ_AP018255.1_3753884_3754712_+	NA|268aa|up_9|NZ_AP018255.1_3737926_3738730_-	cd00757, ThiF_MoeB_HesA_family, ThiF_MoeB_HesA	NA|106aa|up_8|NZ_AP018255.1_3738740_3739058_-	PRK14102, nifW, nitrogenase-stabilizing/protective protein NifW	NA|72aa|up_7|NZ_AP018255.1_3739054_3739270_-	pfam05082, Rop-like, Rop-like	NA|159aa|up_6|NZ_AP018255.1_3739316_3739793_-	pfam03270, DUF269, Protein of unknown function, DUF269	NA|138aa|up_5|NZ_AP018255.1_3739789_3740203_-	TIGR02663, Protein_NifX, nitrogen fixation protein NifX	NA|99aa|up_4|NZ_AP018255.1_3740202_3740499_+	NA	NA|440aa|up_3|NZ_AP018255.1_3740902_3742222_-	PRK14476, PRK14476, nitrogenase molybdenum-cofactor biosynthesis protein NifN; Provisional	NA|478aa|up_2|NZ_AP018255.1_3742397_3743831_-	PRK14477, PRK14477, bifunctional nitrogenase molybdenum-cofactor biosynthesis protein NifE/NifN; Provisional	NA|517aa|up_1|NZ_AP018255.1_3744500_3746051_+	smart00857, Resolvase, Resolvase, N terminal domain	NA|79aa|up_0|NZ_AP018255.1_3746310_3746547_+	COG2442, COG2442, Uncharacterized conserved protein [Function unknown]	WYL|287aa|down_0|NZ_AP018255.1_3749401_3750262_-	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	cas8b5|827aa|down_1|NZ_AP018255.1_3750473_3752954_+	NA	cas7|298aa|down_2|NZ_AP018255.1_3752956_3753850_+	NA	cas5|276aa|down_3|NZ_AP018255.1_3753884_3754712_+	NA	cas3|900aa|down_4|NZ_AP018255.1_3754704_3757404_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas6|281aa|down_5|NZ_AP018255.1_3757460_3758303_+	COG5551, COG5551, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	cas4|195aa|down_6|NZ_AP018255.1_3758351_3758936_+	cd09637, Cas4_I-A_I-B_I-C_I-D_II-B, CRISPR/Cas system-associated protein Cas4	cas1|335aa|down_7|NZ_AP018255.1_3759027_3760032_+	TIGR04093, hypothetical_protein_L8106_25395, CRISPR-associated endonuclease Cas1, subtype CYANO	cas2|91aa|down_8|NZ_AP018255.1_3760084_3760357_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|151aa|down_9|NZ_AP018255.1_3764286_3764739_+	pfam18765, Polbeta, Polymerase beta, Nucleotidyltransferase
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	15	3760621-3764240	2,14,3	PILER-CR,CRISPRCasFinder,CRT	no	WYL,cas8b5,cas7,cas5,cas3,cas6,cas4,cas1,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	ATTGCAATTTCAAATAATCCCTACCAGGGA----------TTGAAAC,ATTGCAATTTCAAATAATCCCTACCAGGGATTGAAAC,ATTGCAATTTCAAATAATCCCTACCAGGGATTGAAACN	47,37,38	0	0	NA	NA	NA:I-D,II-B:I-D,II-B	49,49,50	50	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	cas8b5|827aa|up_7|NZ_AP018255.1_3750473_3752954_+,cas7|298aa|up_6|NZ_AP018255.1_3752956_3753850_+,cas5|276aa|up_5|NZ_AP018255.1_3753884_3754712_+,NA|126aa|down_3|NZ_AP018255.1_3768939_3769317_+	NA|79aa|up_9|NZ_AP018255.1_3746310_3746547_+	COG2442, COG2442, Uncharacterized conserved protein [Function unknown]	WYL|287aa|up_8|NZ_AP018255.1_3749401_3750262_-	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	cas8b5|827aa|up_7|NZ_AP018255.1_3750473_3752954_+	NA	cas7|298aa|up_6|NZ_AP018255.1_3752956_3753850_+	NA	cas5|276aa|up_5|NZ_AP018255.1_3753884_3754712_+	NA	cas3|900aa|up_4|NZ_AP018255.1_3754704_3757404_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas6|281aa|up_3|NZ_AP018255.1_3757460_3758303_+	COG5551, COG5551, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	cas4|195aa|up_2|NZ_AP018255.1_3758351_3758936_+	cd09637, Cas4_I-A_I-B_I-C_I-D_II-B, CRISPR/Cas system-associated protein Cas4	cas1|335aa|up_1|NZ_AP018255.1_3759027_3760032_+	TIGR04093, hypothetical_protein_L8106_25395, CRISPR-associated endonuclease Cas1, subtype CYANO	cas2|91aa|up_0|NZ_AP018255.1_3760084_3760357_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|151aa|down_0|NZ_AP018255.1_3764286_3764739_+	pfam18765, Polbeta, Polymerase beta, Nucleotidyltransferase	NA|148aa|down_1|NZ_AP018255.1_3764748_3765192_+	pfam01934, DUF86, Protein of unknown function DUF86	NA|1042aa|down_2|NZ_AP018255.1_3765398_3768524_-	pfam12770, CHAT, CHAT domain	NA|126aa|down_3|NZ_AP018255.1_3768939_3769317_+	NA	NA|697aa|down_4|NZ_AP018255.1_3770009_3772100_+	PRK00007, PRK00007, elongation factor G; Reviewed	NA|584aa|down_5|NZ_AP018255.1_3772247_3773999_+	COG4928, COG4928, Predicted P-loop ATPase [General function prediction only]	NA|496aa|down_6|NZ_AP018255.1_3775800_3777288_-	TIGR01282, Nitrogenase_molybdenum-iron_protein_alpha_chain, nitrogenase molybdenum-iron protein alpha chain	NA|104aa|down_7|NZ_AP018255.1_3778835_3779147_-	COG3668, ParE, Plasmid stabilization system protein [General function prediction only]	NA|104aa|down_8|NZ_AP018255.1_3779139_3779451_-	TIGR02606, Antitoxin_ParD, putative addiction module antidote protein, CC2985 family	NA|251aa|down_9|NZ_AP018255.1_3780321_3781074_-	pfam13649, Methyltransf_25, Methyltransferase domain
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	16	4178141-4178233	15	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	ATAATGGCGCCAATTAATCCTAAAACCA	28	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|307aa|up_8|NZ_AP018255.1_4168647_4169568_-,NA|154aa|up_3|NZ_AP018255.1_4174323_4174785_+,NA|122aa|up_1|NZ_AP018255.1_4175990_4176356_+,NA|65aa|down_3|NZ_AP018255.1_4181898_4182093_-	NA|448aa|up_9|NZ_AP018255.1_4167307_4168651_-	pfam14065, DUF4255, Protein of unknown function (DUF4255)	NA|307aa|up_8|NZ_AP018255.1_4168647_4169568_-	NA	NA|242aa|up_7|NZ_AP018255.1_4169564_4170290_-	PHA02611, 51, baseplate hub assembly protein; Provisional	NA|176aa|up_6|NZ_AP018255.1_4170303_4170831_-	pfam06841, Phage_T4_gp19, T4-like virus tail tube protein gp19	NA|600aa|up_5|NZ_AP018255.1_4170937_4172737_-	COG3497, COG3497, Phage tail sheath protein FI [General function prediction only]	NA|282aa|up_4|NZ_AP018255.1_4173138_4173984_+	pfam14436, EndoU_bacteria, Bacterial EndoU nuclease	NA|154aa|up_3|NZ_AP018255.1_4174323_4174785_+	NA	NA|247aa|up_2|NZ_AP018255.1_4174797_4175538_+	cd00737, lyz_endolysin_autolysin, endolysin and autolysin	NA|122aa|up_1|NZ_AP018255.1_4175990_4176356_+	NA	NA|467aa|up_0|NZ_AP018255.1_4176383_4177784_-	COG0154, GatA, Asp-tRNAAsn/Glu-tRNAGln amidotransferase A subunit and related amidases [Translation, ribosomal structure and biogenesis]	NA|453aa|down_0|NZ_AP018255.1_4178398_4179757_-	PRK02507, PRK02507, proton extrusion protein PcxA; Provisional	NA|223aa|down_1|NZ_AP018255.1_4179948_4180617_-	cd00884, beta_CA_cladeB, Carbonic anhydrases (CA) are zinc-containing enzymes that catalyze the reversible hydration of carbon dioxide in a two-step mechanism in which the nucleophilic attack of a zinc-bound hydroxide ion on carbon dioxide is followed by the regeneration of an active site by ionization of the zinc-bound water molecule and removal of a proton from the active site	NA|188aa|down_2|NZ_AP018255.1_4180945_4181509_-	pfam01980, UPF0066, Uncharacterized protein family UPF0066	NA|65aa|down_3|NZ_AP018255.1_4181898_4182093_-	NA	NA|379aa|down_4|NZ_AP018255.1_4182270_4183407_-	PRK06753, PRK06753, hypothetical protein; Provisional	NA|216aa|down_5|NZ_AP018255.1_4183592_4184240_+	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|407aa|down_6|NZ_AP018255.1_4184264_4185485_-	pfam05626, DUF790, Protein of unknown function (DUF790)	NA|101aa|down_7|NZ_AP018255.1_4185809_4186112_+	pfam08681, DUF1778, Protein of unknown function (DUF1778)	NA|173aa|down_8|NZ_AP018255.1_4186095_4186614_+	pfam13508, Acetyltransf_7, Acetyltransferase (GNAT) domain	NA|515aa|down_9|NZ_AP018255.1_4186717_4188262_-	COG1061, SSL2, DNA or RNA helicases of superfamily II [Transcription / DNA replication, recombination, and repair]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	17	5414458-5414867	3,16,4	PILER-CR,CRISPRCasFinder,CRT	no	cas14k,PD-DExK,cas3,cas8a4,cas7,cas5,cas6,cas4,cas1,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	CTTGAAACCTTACGAATCCCGTCTTCGGGACTGAAAC,CTTGAAACCTTACGAATCCCGTCTTCGGGACTGAAAC,CTTGAAACCTTACGAATCCCGTCTTCGGGACTGAAAC	37,37,37	0	0	NA	NA	NA:NA:NA	4,5,5	5	TypeV	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|268aa|up_9|NZ_AP018255.1_5402281_5403085_-,NA|64aa|up_8|NZ_AP018255.1_5403163_5403355_-,NA|251aa|up_6|NZ_AP018255.1_5405966_5406719_-,PD-DExK|207aa|up_4|NZ_AP018255.1_5409286_5409907_+,NA|75aa|down_0|NZ_AP018255.1_5415271_5415496_-,NA|65aa|down_1|NZ_AP018255.1_5415645_5415840_+,NA|106aa|down_2|NZ_AP018255.1_5415897_5416215_+,cas8a4|590aa|down_4|NZ_AP018255.1_5416745_5418515_+,cas5|211aa|down_6|NZ_AP018255.1_5419771_5420404_+	NA|268aa|up_9|NZ_AP018255.1_5402281_5403085_-	NA	NA|64aa|up_8|NZ_AP018255.1_5403163_5403355_-	NA	NA|689aa|up_7|NZ_AP018255.1_5403879_5405946_-	COG1770, PtrB, Protease II [Amino acid transport and metabolism]	NA|251aa|up_6|NZ_AP018255.1_5405966_5406719_-	NA	NA|596aa|up_5|NZ_AP018255.1_5406898_5408686_+	PRK00476, aspS, aspartyl-tRNA synthetase; Validated	PD-DExK|207aa|up_4|NZ_AP018255.1_5409286_5409907_+	NA	NA|94aa|up_3|NZ_AP018255.1_5409977_5410259_+	pfam01457, Peptidase_M8, Leishmanolysin	NA|301aa|up_2|NZ_AP018255.1_5410352_5411255_-	pfam14261, DUF4351, Domain of unknown function (DUF4351)	cas3|205aa|up_1|NZ_AP018255.1_5411436_5412051_+	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	cas3|683aa|up_0|NZ_AP018255.1_5412158_5414207_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	NA|75aa|down_0|NZ_AP018255.1_5415271_5415496_-	NA	NA|65aa|down_1|NZ_AP018255.1_5415645_5415840_+	NA	NA|106aa|down_2|NZ_AP018255.1_5415897_5416215_+	NA	NA|74aa|down_3|NZ_AP018255.1_5416289_5416511_-	COG1598, COG1598, Predicted nuclease of the RNAse H fold, HicB family [General    function prediction only]	cas8a4|590aa|down_4|NZ_AP018255.1_5416745_5418515_+	NA	cas7|315aa|down_5|NZ_AP018255.1_5418598_5419543_+	pfam01905, DevR, CRISPR-associated negative auto-regulator DevR/Csa2	cas5|211aa|down_6|NZ_AP018255.1_5419771_5420404_+	NA	cas6|336aa|down_7|NZ_AP018255.1_5420381_5421389_+	pfam10040, CRISPR_Cas6, CRISPR-associated endoribonuclease Cas6	cas4|198aa|down_8|NZ_AP018255.1_5421564_5422158_+	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	cas1|326aa|down_9|NZ_AP018255.1_5422165_5423143_+	TIGR04093, hypothetical_protein_L8106_25395, CRISPR-associated endonuclease Cas1, subtype CYANO
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	18	5423750-5424947	4,17,5	PILER-CR,CRISPRCasFinder,CRT	no	PD-DExK,cas3,cas8a4,cas7,cas5,cas6,cas4,cas1,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	CTTTAAACTTTACGAATCCCGTTATCGGGACTGAAAC,CTTTAAACTTTACGAATCCCGTTATCGGGACTGAAAC,CTTTAAACTTTACGAATCCCGTTATCGGGACTGAAAC	37,37,37	0	0	NA	NA	NA:NA:NA	16,16,16	16	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|65aa|up_9|NZ_AP018255.1_5415645_5415840_+,NA|106aa|up_8|NZ_AP018255.1_5415897_5416215_+,cas8a4|590aa|up_6|NZ_AP018255.1_5416745_5418515_+,cas5|211aa|up_4|NZ_AP018255.1_5419771_5420404_+,NA|95aa|down_3|NZ_AP018255.1_5427547_5427832_-,NA|78aa|down_4|NZ_AP018255.1_5427872_5428106_+	NA|65aa|up_9|NZ_AP018255.1_5415645_5415840_+	NA	NA|106aa|up_8|NZ_AP018255.1_5415897_5416215_+	NA	NA|74aa|up_7|NZ_AP018255.1_5416289_5416511_-	COG1598, COG1598, Predicted nuclease of the RNAse H fold, HicB family [General    function prediction only]	cas8a4|590aa|up_6|NZ_AP018255.1_5416745_5418515_+	NA	cas7|315aa|up_5|NZ_AP018255.1_5418598_5419543_+	pfam01905, DevR, CRISPR-associated negative auto-regulator DevR/Csa2	cas5|211aa|up_4|NZ_AP018255.1_5419771_5420404_+	NA	cas6|336aa|up_3|NZ_AP018255.1_5420381_5421389_+	pfam10040, CRISPR_Cas6, CRISPR-associated endoribonuclease Cas6	cas4|198aa|up_2|NZ_AP018255.1_5421564_5422158_+	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	cas1|326aa|up_1|NZ_AP018255.1_5422165_5423143_+	TIGR04093, hypothetical_protein_L8106_25395, CRISPR-associated endonuclease Cas1, subtype CYANO	cas2|98aa|up_0|NZ_AP018255.1_5423235_5423529_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|143aa|down_0|NZ_AP018255.1_5425232_5425661_+	COG0071, IbpA, Molecular chaperone (small heat shock protein) [Posttranslational modification, protein turnover, chaperones]	NA|127aa|down_1|NZ_AP018255.1_5425890_5426271_+	pfam10990, DUF2809, Protein of unknown function (DUF2809)	NA|321aa|down_2|NZ_AP018255.1_5426457_5427420_+	cd19100, AKR_unchar, uncharacterized aldo-keto reductase (AKR) superfamily protein	NA|95aa|down_3|NZ_AP018255.1_5427547_5427832_-	NA	NA|78aa|down_4|NZ_AP018255.1_5427872_5428106_+	NA	NA|143aa|down_5|NZ_AP018255.1_5428102_5428531_+	COG0071, IbpA, Molecular chaperone (small heat shock protein) [Posttranslational modification, protein turnover, chaperones]	NA|333aa|down_6|NZ_AP018255.1_5428849_5429848_-	COG0435, ECM4, Predicted glutathione S-transferase [Posttranslational modification, protein turnover, chaperones]	NA|707aa|down_7|NZ_AP018255.1_5430078_5432199_+	COG4232, COG4232, Thiol:disulfide interchange protein [Posttranslational modification, protein turnover, chaperones / Energy production and conversion]	NA|239aa|down_8|NZ_AP018255.1_5432319_5433036_+	cd02969, PRX_like1, Peroxiredoxin (PRX)-like 1 family; hypothetical proteins that show sequence similarity to PRXs	NA|97aa|down_9|NZ_AP018255.1_5433138_5433429_-	PRK00034, gatC, Asp-tRNA(Asn)/Glu-tRNA(Gln) amidotransferase subunit GatC
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	19	5554286-5554429	18	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	TATTATCATGATTTTTTTCAGGTTGTGAAAGATATAAATTGCCACTATCATTAA	54	0	0	NA	NA	NA	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|533aa|up_7|NZ_AP018255.1_5540699_5542298_-,NA|344aa|down_1|NZ_AP018255.1_5558541_5559573_-,NA|579aa|down_2|NZ_AP018255.1_5560025_5561762_+,NA|125aa|down_3|NZ_AP018255.1_5561875_5562250_+,NA|125aa|down_7|NZ_AP018255.1_5567161_5567536_+,NA|89aa|down_8|NZ_AP018255.1_5568028_5568295_-	NA|525aa|up_9|NZ_AP018255.1_5532337_5533912_-	cd07378, MPP_ACP5, Homo sapiens acid phosphatase 5 and related proteins, metallophosphatase domain	NA|316aa|up_8|NZ_AP018255.1_5534015_5534963_+	pfam09992, NAGPA, Phosphodiester glycosidase	NA|533aa|up_7|NZ_AP018255.1_5540699_5542298_-	NA	NA|305aa|up_6|NZ_AP018255.1_5542391_5543306_-	PLN02679, PLN02679, hydrolase, alpha/beta fold family protein	NA|178aa|up_5|NZ_AP018255.1_5543792_5544326_+	PRK00028, infC, translation initiation factor IF-3; Reviewed	NA|1009aa|up_4|NZ_AP018255.1_5544519_5547546_+	pfam03219, TLC, TLC ATP/ADP transporter	NA|147aa|up_3|NZ_AP018255.1_5547567_5548008_+	cd00038, CAP_ED, effector domain of the CAP family of transcription factors; members include CAP (or cAMP receptor protein (CRP)), which binds cAMP, FNR (fumarate and nitrate reduction), which uses an iron-sulfur cluster to sense oxygen) and CooA, a heme containing CO sensor	NA|298aa|up_2|NZ_AP018255.1_5548331_5549225_-	pfam13191, AAA_16, AAA ATPase domain	NA|740aa|up_1|NZ_AP018255.1_5549227_5551447_-	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|782aa|up_0|NZ_AP018255.1_5551443_5553789_-	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|527aa|down_0|NZ_AP018255.1_5556845_5558426_-	pfam05729, NACHT, NACHT domain	NA|344aa|down_1|NZ_AP018255.1_5558541_5559573_-	NA	NA|579aa|down_2|NZ_AP018255.1_5560025_5561762_+	NA	NA|125aa|down_3|NZ_AP018255.1_5561875_5562250_+	NA	NA|1136aa|down_4|NZ_AP018255.1_5562286_5565694_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|161aa|down_5|NZ_AP018255.1_5565734_5566217_+	cd02236, cupin_CV2614-like, Chromobacterium violaceum CV2614 and related proteins, cupin domain	NA|176aa|down_6|NZ_AP018255.1_5566417_5566945_+	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|125aa|down_7|NZ_AP018255.1_5567161_5567536_+	NA	NA|89aa|down_8|NZ_AP018255.1_5568028_5568295_-	NA	NA|237aa|down_9|NZ_AP018255.1_5568684_5569395_-	COG1592, COG1592, Rubrerythrin [Energy production and conversion]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	20	5741953-5744730	5,19,6	PILER-CR,CRISPRCasFinder,CRT	no	cas6,PD-DExK,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	ATTGAAATTTAAAATAATCCCTTTAAGGGA----------TTGAAAC,GTTTCAATCCCTTAAAGGGATTATTTTAAATTTCAAT,GTTTCAATCCCTTAAAGGGATTATTTTAAATTTCAAT	47,37,37	0	0	NA	NA	NA:NA:NA	38,38,38	38	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|310aa|up_1|NZ_AP018255.1_5740526_5741456_+,NA|144aa|up_0|NZ_AP018255.1_5741462_5741894_+,NA	NA|227aa|up_9|NZ_AP018255.1_5728282_5728963_+	cd01012, YcaC_related, YcaC related amidohydrolases; E	NA|213aa|up_8|NZ_AP018255.1_5729899_5730538_+	cd04726, KGPDC_HPS, 3-Keto-L-gulonate 6-phosphate decarboxylase (KGPDC) and D-arabino-3-hexulose-6-phosphate synthase (HPS)	NA|664aa|up_7|NZ_AP018255.1_5731250_5733242_+	TIGR02956, sensor_protein_TorS, TMAO reductase sytem sensor TorS	NA|193aa|up_6|NZ_AP018255.1_5736290_5736869_-	cd16913, YkuD_like, L,D-transpeptidases/carboxypeptidases similar to Bacillus YkuD	NA|163aa|up_5|NZ_AP018255.1_5737077_5737566_+	TIGR04110, hypothetical_protein_VSWAT3_12502, heme utilization protein HutZ	NA|308aa|up_4|NZ_AP018255.1_5737794_5738718_+	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|198aa|up_3|NZ_AP018255.1_5738812_5739406_+	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|209aa|up_2|NZ_AP018255.1_5739402_5740029_+	COG2197, CitB, Response regulator containing a CheY-like receiver domain and an HTH DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|310aa|up_1|NZ_AP018255.1_5740526_5741456_+	NA	NA|144aa|up_0|NZ_AP018255.1_5741462_5741894_+	NA	NA|504aa|down_0|NZ_AP018255.1_5745339_5746851_-	TIGR01766, Putative_transposase_MJ0751, transposase, IS605 OrfB family, central region	cas6|241aa|down_1|NZ_AP018255.1_5747179_5747902_-	COG5551, COG5551, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	PD-DExK|340aa|down_2|NZ_AP018255.1_5747965_5748985_-	pfam06250, DUF1016, Protein of unknown function (DUF1016)	cas2|42aa|down_3|NZ_AP018255.1_5753953_5754079_-	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|256aa|down_4|NZ_AP018255.1_5754336_5755104_+	COG4636, Uma2, Endonuclease, Uma2 family (restriction endonuclease fold) [General function prediction only]	NA|116aa|down_5|NZ_AP018255.1_5755314_5755662_+	PRK09652, PRK09652, RNA polymerase sigma factor RpoE; Provisional	NA|638aa|down_6|NZ_AP018255.1_5755695_5757609_-	PRK05899, PRK05899, transketolase; Reviewed	NA|255aa|down_7|NZ_AP018255.1_5757739_5758504_+	COG1349, GlpR, Transcriptional regulators of sugar metabolism [Transcription / Carbohydrate transport and metabolism]	NA|252aa|down_8|NZ_AP018255.1_5758935_5759691_+	COG4627, COG4627, Uncharacterized protein conserved in bacteria [Function unknown]	NA|182aa|down_9|NZ_AP018255.1_5760330_5760876_-	PRK08118, PRK08118, DNA topology modulation protein
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	21	5749233-5753691	6,20,7,7	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas6,PD-DExK,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	GTTTC----AATCCCTAAAAGGGATTTTATAAAGTTTAAAC,GTTTCAATCCCTAAAAGGGATTTTATAAAGTTTAAAC,GTTTCAATCCCTAAAAGGGATTTTATAAAGTTTAAAC,GTTTC----AATCCCTAAAAGGGATTTTATAAAGTTTAAAC	41,37,37,41	0	0	NA	NA	NA:I-D,II-B:I-D,II-B	59,61,61,59	61	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|310aa|up_4|NZ_AP018255.1_5740526_5741456_+,NA|144aa|up_3|NZ_AP018255.1_5741462_5741894_+,NA|172aa|down_9|NZ_AP018255.1_5763868_5764384_+	NA|193aa|up_9|NZ_AP018255.1_5736290_5736869_-	cd16913, YkuD_like, L,D-transpeptidases/carboxypeptidases similar to Bacillus YkuD	NA|163aa|up_8|NZ_AP018255.1_5737077_5737566_+	TIGR04110, hypothetical_protein_VSWAT3_12502, heme utilization protein HutZ	NA|308aa|up_7|NZ_AP018255.1_5737794_5738718_+	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|198aa|up_6|NZ_AP018255.1_5738812_5739406_+	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|209aa|up_5|NZ_AP018255.1_5739402_5740029_+	COG2197, CitB, Response regulator containing a CheY-like receiver domain and an HTH DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|310aa|up_4|NZ_AP018255.1_5740526_5741456_+	NA	NA|144aa|up_3|NZ_AP018255.1_5741462_5741894_+	NA	NA|504aa|up_2|NZ_AP018255.1_5745339_5746851_-	TIGR01766, Putative_transposase_MJ0751, transposase, IS605 OrfB family, central region	cas6|241aa|up_1|NZ_AP018255.1_5747179_5747902_-	COG5551, COG5551, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	PD-DExK|340aa|up_0|NZ_AP018255.1_5747965_5748985_-	pfam06250, DUF1016, Protein of unknown function (DUF1016)	cas2|42aa|down_0|NZ_AP018255.1_5753953_5754079_-	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|256aa|down_1|NZ_AP018255.1_5754336_5755104_+	COG4636, Uma2, Endonuclease, Uma2 family (restriction endonuclease fold) [General function prediction only]	NA|116aa|down_2|NZ_AP018255.1_5755314_5755662_+	PRK09652, PRK09652, RNA polymerase sigma factor RpoE; Provisional	NA|638aa|down_3|NZ_AP018255.1_5755695_5757609_-	PRK05899, PRK05899, transketolase; Reviewed	NA|255aa|down_4|NZ_AP018255.1_5757739_5758504_+	COG1349, GlpR, Transcriptional regulators of sugar metabolism [Transcription / Carbohydrate transport and metabolism]	NA|252aa|down_5|NZ_AP018255.1_5758935_5759691_+	COG4627, COG4627, Uncharacterized protein conserved in bacteria [Function unknown]	NA|182aa|down_6|NZ_AP018255.1_5760330_5760876_-	PRK08118, PRK08118, DNA topology modulation protein	NA|554aa|down_7|NZ_AP018255.1_5761096_5762758_-	COG1807, ArnT, 4-amino-4-deoxy-L-arabinose transferase and related glycosyltransferases of PMT family [Cell envelope biogenesis, outer membrane]	NA|215aa|down_8|NZ_AP018255.1_5762949_5763594_+	pfam08241, Methyltransf_11, Methyltransferase domain	NA|172aa|down_9|NZ_AP018255.1_5763868_5764384_+	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	22	5945704-5945784	21	CRISPRCasFinder	no	cas14j	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	ATTCTTTACCAGGATATAGATAAACC	26	0	0	NA	NA	N:A	1	1	TypeV	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|66aa|up_6|NZ_AP018255.1_5936918_5937116_-,NA|70aa|down_0|NZ_AP018255.1_5945863_5946073_-,NA|475aa|down_3|NZ_AP018255.1_5950266_5951691_-,NA|223aa|down_5|NZ_AP018255.1_5953058_5953727_-	NA|224aa|up_9|NZ_AP018255.1_5934095_5934767_-	pfam09366, DUF1997, Protein of unknown function (DUF1997)	NA|220aa|up_8|NZ_AP018255.1_5934945_5935605_+	PLN00141, PLN00141, Tic62-NAD(P)-related group II protein; Provisional	NA|282aa|up_7|NZ_AP018255.1_5935741_5936587_+	TIGR02821, S-formylglutathione_hydrolase, S-formylglutathione hydrolase	NA|66aa|up_6|NZ_AP018255.1_5936918_5937116_-	NA	NA|449aa|up_5|NZ_AP018255.1_5937430_5938777_-	PRK01077, PRK01077, cobyrinate a,c-diamide synthase	NA|458aa|up_4|NZ_AP018255.1_5938960_5940334_-	COG3429, COG3429, Glucose-6-P dehydrogenase subunit [Carbohydrate transport and metabolism]	NA|510aa|up_3|NZ_AP018255.1_5940557_5942087_-	PRK05722, PRK05722, glucose-6-phosphate 1-dehydrogenase; Validated	NA|382aa|up_2|NZ_AP018255.1_5942153_5943299_-	PRK03343, PRK03343, transaldolase; Validated	NA|350aa|up_1|NZ_AP018255.1_5943431_5944481_-	PRK09293, PRK09293, class 1 fructose-bisphosphatase	NA|104aa|up_0|NZ_AP018255.1_5944784_5945096_-	cd12399, RRM_HP0827_like, RNA recognition motif in Helicobacter pylori HP0827 protein and similar proteins	NA|70aa|down_0|NZ_AP018255.1_5945863_5946073_-	NA	NA|397aa|down_1|NZ_AP018255.1_5946182_5947373_-	COG1262, COG1262, Uncharacterized conserved protein [Function unknown]	NA|328aa|down_2|NZ_AP018255.1_5949286_5950270_-	COG0714, COG0714, MoxR-like ATPases [General function prediction only]	NA|475aa|down_3|NZ_AP018255.1_5950266_5951691_-	NA	NA|364aa|down_4|NZ_AP018255.1_5951893_5952985_-	pfam13365, Trypsin_2, Trypsin-like peptidase domain	NA|223aa|down_5|NZ_AP018255.1_5953058_5953727_-	NA	NA|766aa|down_6|NZ_AP018255.1_5954349_5956647_-	TIGR02505, RTPR, ribonucleoside-triphosphate reductase, adenosylcobalamin-dependent	NA|194aa|down_7|NZ_AP018255.1_5956789_5957371_+	TIGR04026, hypothetical_protein, PPOX class probable FMN-dependent enzyme, alr4036 family	NA|177aa|down_8|NZ_AP018255.1_5957635_5958166_+	pfam07884, VKOR, Vitamin K epoxide reductase family	NA|188aa|down_9|NZ_AP018255.1_5958552_5959116_-	COG4636, Uma2, Endonuclease, Uma2 family (restriction endonuclease fold) [General function prediction only]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	23	6276543-6276661	22	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	TCCGGTTGTTTACCAGGATGTAGGTAAACCCGCCCGTACAG	41	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|61aa|up_9|NZ_AP018255.1_6263006_6263189_+,NA|87aa|down_1|NZ_AP018255.1_6277756_6278017_+,NA|62aa|down_5|NZ_AP018255.1_6280850_6281036_+,NA|196aa|down_8|NZ_AP018255.1_6283867_6284455_+,NA|115aa|down_9|NZ_AP018255.1_6284921_6285266_-	NA|61aa|up_9|NZ_AP018255.1_6263006_6263189_+	NA	NA|206aa|up_8|NZ_AP018255.1_6263560_6264178_+	COG1182, AcpD, Acyl carrier protein phosphodiesterase [Lipid metabolism]	NA|929aa|up_7|NZ_AP018255.1_6264451_6267238_-	COG2274, SunT, ABC-type bacteriocin/lantibiotic exporters, contain an N-terminal double-glycine peptidase domain [Defense mechanisms]	NA|253aa|up_6|NZ_AP018255.1_6267186_6267945_-	TIGR04500, PpiC_rel_mature, putative peptide maturation system protein	NA|257aa|up_5|NZ_AP018255.1_6268211_6268982_-	COG1836, COG1836, Predicted membrane protein [Function unknown]	NA|649aa|up_4|NZ_AP018255.1_6269332_6271279_+	cd07484, Peptidases_S8_Thermitase_like, Peptidase S8 family domain in Thermitase-like proteins	NA|66aa|up_3|NZ_AP018255.1_6271364_6271562_+	TIGR00927, retinal_rod, K+-dependent Na+/Ca+ exchanger	NA|486aa|up_2|NZ_AP018255.1_6271768_6273226_+	cd00044, CysPc, Calpains, domains IIa, IIb; calcium-dependent cytoplasmic cysteine proteinases, papain-like	NA|473aa|up_1|NZ_AP018255.1_6273463_6274882_+	cd07484, Peptidases_S8_Thermitase_like, Peptidase S8 family domain in Thermitase-like proteins	NA|499aa|up_0|NZ_AP018255.1_6274945_6276442_-	TIGR01843, Hemolysin_secretion_protein_D_plasmid, type I secretion membrane fusion protein, HlyD family	NA|292aa|down_0|NZ_AP018255.1_6276733_6277609_-	cd05243, SDR_a5, atypical (a) SDRs, subgroup 5	NA|87aa|down_1|NZ_AP018255.1_6277756_6278017_+	NA	NA|146aa|down_2|NZ_AP018255.1_6278009_6278447_+	cd09873, PIN_Pae0151-like, VapC-like PIN domain of the Pyrobaculum aerophilum Pae0151 and Pae2754 proteins and homologs	NA|261aa|down_3|NZ_AP018255.1_6278449_6279232_-	cd09086, ExoIII-like_AP-endo, Escherichia coli exonuclease III (ExoIII) and Neisseria meningitides NExo-like subfamily of the ExoIII family purinic/apyrimidinic (AP) endonucleases	NA|357aa|down_4|NZ_AP018255.1_6279713_6280784_+	cd03802, GT4_AviGT4-like, UDP-Glc:tetrahydrobiopterin alpha-glucosyltransferase and similar proteins	NA|62aa|down_5|NZ_AP018255.1_6280850_6281036_+	NA	NA|342aa|down_6|NZ_AP018255.1_6281347_6282373_+	cd08235, iditol_2_DH_like, L-iditol 2-dehydrogenase	NA|354aa|down_7|NZ_AP018255.1_6282516_6283578_+	cd06257, DnaJ, DnaJ domain or J-domain	NA|196aa|down_8|NZ_AP018255.1_6283867_6284455_+	NA	NA|115aa|down_9|NZ_AP018255.1_6284921_6285266_-	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	24	6291122-6291211	23	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	GGATTTTCCTAGAGGATATATTTG	24	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|196aa|up_7|NZ_AP018255.1_6283867_6284455_+,NA|115aa|up_6|NZ_AP018255.1_6284921_6285266_-,NA|164aa|down_0|NZ_AP018255.1_6291275_6291767_-,NA|63aa|down_1|NZ_AP018255.1_6291756_6291945_-,NA|400aa|down_9|NZ_AP018255.1_6301108_6302308_-	NA|342aa|up_9|NZ_AP018255.1_6281347_6282373_+	cd08235, iditol_2_DH_like, L-iditol 2-dehydrogenase	NA|354aa|up_8|NZ_AP018255.1_6282516_6283578_+	cd06257, DnaJ, DnaJ domain or J-domain	NA|196aa|up_7|NZ_AP018255.1_6283867_6284455_+	NA	NA|115aa|up_6|NZ_AP018255.1_6284921_6285266_-	NA	NA|264aa|up_5|NZ_AP018255.1_6285367_6286159_-	COG1842, PspA, Phage shock protein A (IM30), suppresses sigma54-dependent transcription [Transcription / Signal transduction mechanisms]	NA|225aa|up_4|NZ_AP018255.1_6286342_6287017_-	COG1842, PspA, Phage shock protein A (IM30), suppresses sigma54-dependent transcription [Transcription / Signal transduction mechanisms]	NA|423aa|up_3|NZ_AP018255.1_6287227_6288496_-	TIGR04526, predic_Ig_block, putative immunoglobulin-blocking virulence protein	NA|183aa|up_2|NZ_AP018255.1_6288632_6289181_+	COG5512, COG5512, Zn-ribbon-containing, possibly RNA-binding protein and truncated derivatives [General function prediction only]	NA|99aa|up_1|NZ_AP018255.1_6289547_6289844_+	pfam13867, SAP30_Sin3_bdg, Sin3 binding region of histone deacetylase complex subunit SAP30	NA|278aa|up_0|NZ_AP018255.1_6289999_6290833_-	PRK07396, PRK07396, dihydroxynaphthoic acid synthetase; Validated	NA|164aa|down_0|NZ_AP018255.1_6291275_6291767_-	NA	NA|63aa|down_1|NZ_AP018255.1_6291756_6291945_-	NA	NA|239aa|down_2|NZ_AP018255.1_6292223_6292940_+	pfam13649, Methyltransf_25, Methyltransferase domain	NA|568aa|down_3|NZ_AP018255.1_6293102_6294806_-	PRK07449, PRK07449, 2-succinyl-5-enolpyruvyl-6-hydroxy-3-cyclohexene-1-carboxylate synthase; Validated	NA|121aa|down_4|NZ_AP018255.1_6294916_6295279_+	pfam02152, FolB, Dihydroneopterin aldolase	NA|428aa|down_5|NZ_AP018255.1_6295779_6297063_+	PRK09776, PRK09776, putative diguanylate cyclase; Provisional	NA|636aa|down_6|NZ_AP018255.1_6297083_6298991_-	pfam11832, DUF3352, Protein of unknown function (DUF3352)	NA|392aa|down_7|NZ_AP018255.1_6299266_6300442_-	COG3621, COG3621, Patatin [General function prediction only]	NA|126aa|down_8|NZ_AP018255.1_6300558_6300936_-	pfam11535, Calci_bind_CcbP, Calcium binding	NA|400aa|down_9|NZ_AP018255.1_6301108_6302308_-	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	25	6651273-6651348	24	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	ACTCAGCACGAGCGCACGAGCGCAC	25	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|256aa|up_0|NZ_AP018255.1_6650286_6651054_-,NA	NA|478aa|up_9|NZ_AP018255.1_6638710_6640144_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|295aa|up_8|NZ_AP018255.1_6640363_6641248_+	cd13653, PBP2_phosphate_like_1, Substrate binding domain of putative ABC-type phosphate transporter, a member of the type 2 periplasmic binding fold superfamily	NA|212aa|up_7|NZ_AP018255.1_6641290_6641926_+	cd07989, LPLAT_AGPAT-like, Lysophospholipid Acyltransferases (LPLATs) of Glycerophospholipid Biosynthesis: AGPAT-like	NA|348aa|up_6|NZ_AP018255.1_6642486_6643530_+	COG0628, yhhT, Predicted permease, member of the PurR regulon [General function prediction only]	NA|96aa|up_5|NZ_AP018255.1_6643623_6643911_+	COG5626, COG5626, Uncharacterized small conserved protein [Function unknown]	NA|170aa|up_4|NZ_AP018255.1_6643923_6644433_-	cd06259, YdcF-like, YdcF-like	NA|367aa|up_3|NZ_AP018255.1_6645171_6646272_-	pfam14249, Tocopherol_cycl, Tocopherol cyclase	NA|868aa|up_2|NZ_AP018255.1_6646416_6649020_+	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|202aa|up_1|NZ_AP018255.1_6649059_6649665_+	COG0484, DnaJ, DnaJ-class molecular chaperone with C-terminal Zn finger domain [Posttranslational modification, protein turnover, chaperones]	NA|256aa|up_0|NZ_AP018255.1_6650286_6651054_-	NA	NA|420aa|down_0|NZ_AP018255.1_6651429_6652689_+	PRK07364, PRK07364, FAD-dependent hydroxylase	NA|755aa|down_1|NZ_AP018255.1_6653041_6655306_+	COG4191, COG4191, Signal transduction histidine kinase regulating C4-dicarboxylate transport system [Signal transduction mechanisms]	NA|259aa|down_2|NZ_AP018255.1_6655306_6656083_-	cd08826, SPFH_eoslipins_u1, Uncharacterized prokaryotic subgroup of the stomatin-like proteins (slipins) family; belonging to the SPFH (stomatin, prohibitin, flotillin, and HflK/C) superfamily	NA|766aa|down_3|NZ_AP018255.1_6656330_6658628_+	cd13401, Slt70-like, 70kDa soluble lytic transglycosylase (Slt70) and similar proteins	NA|908aa|down_4|NZ_AP018255.1_6658920_6661644_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|275aa|down_5|NZ_AP018255.1_6661764_6662589_-	pfam18299, R2K_2, ATP-grasp domain, R2K clade family 2	NA|193aa|down_6|NZ_AP018255.1_6662788_6663367_+	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|535aa|down_7|NZ_AP018255.1_6663777_6665382_-	PRK00915, PRK00915, 2-isopropylmalate synthase; Validated	NA|175aa|down_8|NZ_AP018255.1_6665479_6666004_-	cd10911, PIN_LabA, PIN domain of Synechococcus elongatus LabA (low-amplitude and bright) and related proteins	NA|778aa|down_9|NZ_AP018255.1_6666844_6669178_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	26	6901980-6902092	25	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	ATGAAGCTGCAAATAATTAAATCCCCCCCTGCCCCC	36	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|318aa|up_9|NZ_AP018255.1_6873563_6874517_+,NA|77aa|up_4|NZ_AP018255.1_6884926_6885157_+,NA|83aa|up_3|NZ_AP018255.1_6886531_6886780_+,NA|62aa|up_2|NZ_AP018255.1_6891181_6891367_+,NA|158aa|down_5|NZ_AP018255.1_6910975_6911449_+,NA|114aa|down_6|NZ_AP018255.1_6911789_6912131_+,NA|139aa|down_9|NZ_AP018255.1_6920525_6920942_+	NA|318aa|up_9|NZ_AP018255.1_6873563_6874517_+	NA	NA|409aa|up_8|NZ_AP018255.1_6874448_6875675_-	pfam00145, DNA_methylase, C-5 cytosine-specific DNA methylase	NA|427aa|up_7|NZ_AP018255.1_6875825_6877106_-	cd06173, MFS_MefA_like, Macrolide efflux protein A and similar proteins of the Major Facilitator Superfamily of transporters	NA|1391aa|up_6|NZ_AP018255.1_6877125_6881298_-	PRK12467, PRK12467, peptide synthase; Provisional	NA|1136aa|up_5|NZ_AP018255.1_6881294_6884702_-	PRK12467, PRK12467, peptide synthase; Provisional	NA|77aa|up_4|NZ_AP018255.1_6884926_6885157_+	NA	NA|83aa|up_3|NZ_AP018255.1_6886531_6886780_+	NA	NA|62aa|up_2|NZ_AP018255.1_6891181_6891367_+	NA	NA|107aa|up_1|NZ_AP018255.1_6896161_6896482_+	pfam13476, AAA_23, AAA domain	NA|1365aa|up_0|NZ_AP018255.1_6897339_6901434_-	pfam03160, Calx-beta, Calx-beta domain	NA|1695aa|down_0|NZ_AP018255.1_6902226_6907311_-	PRK12467, PRK12467, peptide synthase; Provisional	NA|170aa|down_1|NZ_AP018255.1_6907382_6907892_-	cd19531, LCL_NRPS-like, LCL-type Condensation (C) domain of non-ribosomal peptide synthetases(NRPSs) and similar domains including the C-domain of SgcC5, a free-standing NRPS with both ester- and amide- bond forming activity	NA|344aa|down_2|NZ_AP018255.1_6908027_6909059_-	TIGR03944, ornithine_cyclodeaminase, 2,3-diaminopropionate biosynthesis protein SbnB	NA|335aa|down_3|NZ_AP018255.1_6909154_6910159_-	TIGR03945, cysteine_synthase, 2,3-diaminopropionate biosynthesis protein SbnA	NA|81aa|down_4|NZ_AP018255.1_6910749_6910992_+	pfam04255, DUF433, Protein of unknown function (DUF433)	NA|158aa|down_5|NZ_AP018255.1_6910975_6911449_+	NA	NA|114aa|down_6|NZ_AP018255.1_6911789_6912131_+	NA	NA|1091aa|down_7|NZ_AP018255.1_6912153_6915426_-	cd05930, A_NRPS, The adenylation domain of nonribosomal peptide synthetases (NRPS)	NA|1119aa|down_8|NZ_AP018255.1_6917066_6920423_-	PRK12467, PRK12467, peptide synthase; Provisional	NA|139aa|down_9|NZ_AP018255.1_6920525_6920942_+	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	27	7005478-7005581	26	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	GGTTCACGAAATATGAGCGCACCGTT	26	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|157aa|up_8|NZ_AP018255.1_6996531_6997002_-,NA|397aa|up_7|NZ_AP018255.1_6997214_6998405_+,NA|325aa|up_6|NZ_AP018255.1_6998397_6999372_+,NA|240aa|down_2|NZ_AP018255.1_7007913_7008633_-,NA|127aa|down_9|NZ_AP018255.1_7014507_7014888_-	NA|323aa|up_9|NZ_AP018255.1_6995403_6996372_+	TIGR02749, Prenyl_transferase, solanesyl diphosphate synthase	NA|157aa|up_8|NZ_AP018255.1_6996531_6997002_-	NA	NA|397aa|up_7|NZ_AP018255.1_6997214_6998405_+	NA	NA|325aa|up_6|NZ_AP018255.1_6998397_6999372_+	NA	NA|774aa|up_5|NZ_AP018255.1_6999598_7001920_+	COG1305, COG1305, Transglutaminase-like enzymes, putative cysteine proteases [Amino acid transport and metabolism]	NA|89aa|up_4|NZ_AP018255.1_7002418_7002685_+	PRK04323, PRK04323, hypothetical protein; Provisional	NA|206aa|up_3|NZ_AP018255.1_7002881_7003499_+	PRK00300, gmk, guanylate kinase; Provisional	NA|173aa|up_2|NZ_AP018255.1_7003575_7004094_-	pfam02605, PsaL, Photosystem I reaction centre subunit XI	NA|45aa|up_1|NZ_AP018255.1_7004430_7004565_-	PRK02733, PRK02733, photosystem I reaction center subunit IX; Provisional	NA|165aa|up_0|NZ_AP018255.1_7004679_7005174_-	CHL00132, psaF, photosystem I subunit III; Validated	NA|346aa|down_0|NZ_AP018255.1_7005663_7006701_+	PRK09604, PRK09604, tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex transferase subunit TsaD	NA|310aa|down_1|NZ_AP018255.1_7006835_7007765_-	COG0596, MhpC, Predicted hydrolases or acyltransferases (alpha/beta hydrolase superfamily) [General function prediction only]	NA|240aa|down_2|NZ_AP018255.1_7007913_7008633_-	NA	NA|183aa|down_3|NZ_AP018255.1_7008923_7009472_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|275aa|down_4|NZ_AP018255.1_7010224_7011049_+	TIGR00995, Tic22-like_protein, chloroplast protein import component, Tic22 family	NA|302aa|down_5|NZ_AP018255.1_7011184_7012090_+	PRK09328, PRK09328, N5-glutamine S-adenosyl-L-methionine-dependent methyltransferase; Provisional	NA|198aa|down_6|NZ_AP018255.1_7012256_7012850_+	COG0009, SUA5, Putative translation factor (SUA5) [Translation, ribosomal structure and biogenesis]	NA|315aa|down_7|NZ_AP018255.1_7012987_7013932_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|156aa|down_8|NZ_AP018255.1_7013882_7014350_-	pfam13508, Acetyltransf_7, Acetyltransferase (GNAT) domain	NA|127aa|down_9|NZ_AP018255.1_7014507_7014888_-	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	28	7117837-7117932	27	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	TGGTTAATTTTCCGCTTAGGATATATTTGTATCT	34	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|60aa|up_7|NZ_AP018255.1_7110896_7111076_+,NA|164aa|up_6|NZ_AP018255.1_7111258_7111750_+,NA|180aa|up_5|NZ_AP018255.1_7111788_7112328_+,NA|210aa|down_0|NZ_AP018255.1_7118039_7118669_-	NA|214aa|up_9|NZ_AP018255.1_7107150_7107792_-	pfam11780, DUF3318, Protein of unknown function (DUF3318)	NA|627aa|up_8|NZ_AP018255.1_7107998_7109879_+	PRK00558, uvrC, excinuclease ABC subunit UvrC	NA|60aa|up_7|NZ_AP018255.1_7110896_7111076_+	NA	NA|164aa|up_6|NZ_AP018255.1_7111258_7111750_+	NA	NA|180aa|up_5|NZ_AP018255.1_7111788_7112328_+	NA	NA|325aa|up_4|NZ_AP018255.1_7112544_7113519_-	cd01339, LDH-like_MDH, L-lactate dehydrogenase-like malate dehydrogenase proteins	NA|225aa|up_3|NZ_AP018255.1_7113600_7114275_-	TIGR02252, Rhythmically_expressed_gene_2_protein, REG-2-like, HAD superfamily (subfamily IA) hydrolase	NA|262aa|up_2|NZ_AP018255.1_7114425_7115211_-	pfam13267, DUF4058, Protein of unknown function (DUF4058)	NA|397aa|up_1|NZ_AP018255.1_7115433_7116624_-	COG1252, Ndh, NADH dehydrogenase, FAD-containing subunit [Energy production and conversion]	NA|188aa|up_0|NZ_AP018255.1_7116675_7117239_-	pfam13523, Acetyltransf_8, Acetyltransferase (GNAT) domain	NA|210aa|down_0|NZ_AP018255.1_7118039_7118669_-	NA	NA|541aa|down_1|NZ_AP018255.1_7119131_7120754_-	cd09173, PLDc_Nuc_like_unchar1_2, Putative catalytic domain, repeat 2, of uncharacterized hypothetical proteins similar to Nuc, an endonuclease from Salmonella typhimurium	NA|319aa|down_2|NZ_AP018255.1_7120871_7121828_-	PRK04375, PRK04375, protoheme IX farnesyltransferase; Provisional	NA|312aa|down_3|NZ_AP018255.1_7121880_7122816_-	COG1612, CtaA, Uncharacterized protein required for cytochrome oxidase assembly [Posttranslational modification, protein turnover, chaperones]	NA|362aa|down_4|NZ_AP018255.1_7123286_7124372_+	cd13919, CuRO_HCO_II_like_5, Uncharacterized subfamily with similarity to Heme-copper oxidase subunit II cupredoxin domain	NA|581aa|down_5|NZ_AP018255.1_7124460_7126203_+	TIGR02891, Probable_cytochrome_c_oxidase_subunit_1-beta, cytochrome c oxidase, subunit I	NA|208aa|down_6|NZ_AP018255.1_7126294_7126918_+	COG1845, CyoC, Heme/copper-type cytochrome/quinol oxidase, subunit 3 [Energy production and conversion]	NA|142aa|down_7|NZ_AP018255.1_7132100_7132526_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|764aa|down_8|NZ_AP018255.1_7133143_7135435_+	cd00306, Peptidases_S8_S53, Peptidase domain in the S8 and S53 families	NA|144aa|down_9|NZ_AP018255.1_7135644_7136076_-	pfam13975, gag-asp_proteas, gag-polyprotein putative aspartyl protease
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	29	7229677-7229778	28	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	GTAAACCCGCCCGTACAAAAGAGGCGCGT	29	1	1	7229706-7229749	NZ_AP018255.1_7283380-7283423	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|102aa|up_6|NZ_AP018255.1_7222464_7222770_+,NA|94aa|up_1|NZ_AP018255.1_7228168_7228450_-,NA	NA|165aa|up_9|NZ_AP018255.1_7218419_7218914_-	COG2172, RsbW, Anti-sigma regulatory factor (Ser/Thr protein kinase) [Signal transduction mechanisms]	NA|456aa|up_8|NZ_AP018255.1_7219423_7220791_-	COG2265, TrmA, SAM-dependent methyltransferases related to tRNA (uracil-5-)-methyltransferase [Translation, ribosomal structure and biogenesis]	NA|162aa|up_7|NZ_AP018255.1_7220922_7221408_+	cd12125, APC_alpha, Allophycocyanin alpha subunit of the phycobilisome core	NA|102aa|up_6|NZ_AP018255.1_7222464_7222770_+	NA	NA|88aa|up_5|NZ_AP018255.1_7222756_7223020_+	COG3654, Doc, Prophage maintenance system killer protein [General function prediction only]	NA|786aa|up_4|NZ_AP018255.1_7223290_7225648_+	PRK01213, PRK01213, phosphoribosylformylglycinamidine synthase subunit PurL	NA|498aa|up_3|NZ_AP018255.1_7225934_7227428_+	PRK07349, PRK07349, amidophosphoribosyltransferase; Provisional	NA|101aa|up_2|NZ_AP018255.1_7227691_7227994_-	cd12399, RRM_HP0827_like, RNA recognition motif in Helicobacter pylori HP0827 protein and similar proteins	NA|94aa|up_1|NZ_AP018255.1_7228168_7228450_-	NA	NA|349aa|up_0|NZ_AP018255.1_7228557_7229604_-	COG0601, DppB, ABC-type dipeptide/oligopeptide/nickel transport systems, permease components [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|173aa|down_0|NZ_AP018255.1_7229807_7230326_-	PRK02304, PRK02304, adenine phosphoribosyltransferase; Provisional	NA|209aa|down_1|NZ_AP018255.1_7230759_7231386_+	pfam11237, DUF3038, Protein of unknown function (DUF3038)	NA|501aa|down_2|NZ_AP018255.1_7231390_7232893_+	pfam14233, DUF4335, Domain of unknown function (DUF4335)	NA|756aa|down_3|NZ_AP018255.1_7232984_7235252_-	COG0744, MrcB, Membrane carboxypeptidase (penicillin-binding protein) [Cell envelope biogenesis, outer membrane]	NA|330aa|down_4|NZ_AP018255.1_7235751_7236741_+	PHA03247, PHA03247, large tegument protein UL36; Provisional	NA|158aa|down_5|NZ_AP018255.1_7236838_7237312_-	PRK00376, lspA, lipoprotein signal peptidase	NA|196aa|down_6|NZ_AP018255.1_7237349_7237937_-	COG1268, BioY, Uncharacterized conserved protein [General function prediction only]	NA|399aa|down_7|NZ_AP018255.1_7238403_7239600_+	TIGR00975, precursor_PBP-3_PstS-3_Antigen_Ag88	NA|317aa|down_8|NZ_AP018255.1_7239718_7240669_+	COG0573, PstC, ABC-type phosphate transport system, permease component [Inorganic ion transport and metabolism]	NA|307aa|down_9|NZ_AP018255.1_7240694_7241615_+	COG0581, PstA, ABC-type phosphate transport system, permease component [Inorganic ion transport and metabolism]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	30	7870357-7870445	29	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	TATCCTCGCTTGAATAAGTGGCGCCCG	27	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|216aa|up_9|NZ_AP018255.1_7853609_7854257_-,NA|114aa|up_0|NZ_AP018255.1_7869902_7870244_-,NA|442aa|down_0|NZ_AP018255.1_7870686_7872012_+,NA|173aa|down_2|NZ_AP018255.1_7873294_7873813_+,NA|187aa|down_3|NZ_AP018255.1_7873877_7874438_+,NA|401aa|down_6|NZ_AP018255.1_7877072_7878275_+	NA|216aa|up_9|NZ_AP018255.1_7853609_7854257_-	NA	NA|551aa|up_8|NZ_AP018255.1_7854385_7856038_-	pfam17210, SdrD_B, SdrD B-like domain	NA|540aa|up_7|NZ_AP018255.1_7856196_7857816_-	pfam17210, SdrD_B, SdrD B-like domain	NA|772aa|up_6|NZ_AP018255.1_7857914_7860230_-	cd07185, OmpA_C-like, Peptidoglycan binding domains similar to the C-terminal domain of outer-membrane protein OmpA	NA|323aa|up_5|NZ_AP018255.1_7864630_7865599_-	TIGR04226, Fimbrial_subunit_type_2, fimbrial isopeptide formation D2 domain	NA|216aa|up_4|NZ_AP018255.1_7867082_7867730_-	TIGR02894, DNA_bind_RsfA, transcription factor, RsfA family	NA|266aa|up_3|NZ_AP018255.1_7868000_7868798_-	PLN02591, PLN02591, tryptophan synthase	NA|103aa|up_2|NZ_AP018255.1_7868840_7869149_-	pfam11460, DUF3007, Protein of unknown function (DUF3007)	NA|71aa|up_1|NZ_AP018255.1_7869196_7869409_-	pfam10716, NdhL, NADH dehydrogenase transmembrane subunit	NA|114aa|up_0|NZ_AP018255.1_7869902_7870244_-	NA	NA|442aa|down_0|NZ_AP018255.1_7870686_7872012_+	NA	NA|310aa|down_1|NZ_AP018255.1_7872094_7873024_-	COG0392, COG0392, Predicted integral membrane protein [Function unknown]	NA|173aa|down_2|NZ_AP018255.1_7873294_7873813_+	NA	NA|187aa|down_3|NZ_AP018255.1_7873877_7874438_+	NA	NA|417aa|down_4|NZ_AP018255.1_7874533_7875784_-	PRK04194, PRK04194, nickel pincer cofactor biosynthesis protein LarC	NA|213aa|down_5|NZ_AP018255.1_7875825_7876464_+	TIGR00057, Putative_threonylcarbamoyl-AMP_synthase, tRNA threonylcarbamoyl adenosine modification protein, Sua5/YciO/YrdC/YwlC family	NA|401aa|down_6|NZ_AP018255.1_7877072_7878275_+	NA	NA|69aa|down_7|NZ_AP018255.1_7878685_7878892_+	pfam05421, DUF751, Protein of unknown function (DUF751)	NA|129aa|down_8|NZ_AP018255.1_7878932_7879319_+	PRK00521, rbfA, 30S ribosome-binding factor RbfA	NA|79aa|down_9|NZ_AP018255.1_7880045_7880282_+	pfam14217, DUF4327, Domain of unknown function (DUF4327)
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	31	8345459-8345546	30	CRISPRCasFinder	no	PD-DExK,Cas14u_CAS-V	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	ATCCTCACTTGAAGGAAGGCGCCGTT	26	0	0	NA	NA	N:A	1	1	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|130aa|up_8|NZ_AP018255.1_8337380_8337770_+,PD-DExK|122aa|up_4|NZ_AP018255.1_8341153_8341519_-,NA|123aa|up_2|NZ_AP018255.1_8342965_8343334_+,NA|72aa|down_7|NZ_AP018255.1_8356894_8357110_-,Cas14u_CAS-V|540aa|down_8|NZ_AP018255.1_8357813_8359433_-	NA|454aa|up_9|NZ_AP018255.1_8335988_8337350_+	cd07490, Peptidases_S8_6, Peptidase S8 family domain, uncharacterized subfamily 6	NA|130aa|up_8|NZ_AP018255.1_8337380_8337770_+	NA	NA|379aa|up_7|NZ_AP018255.1_8338156_8339293_-	COG0665, DadA, Glycine/D-amino acid oxidases (deaminating) [Amino acid transport and metabolism]	NA|291aa|up_6|NZ_AP018255.1_8339496_8340369_-	COG3491, PcbC, Isopenicillin N synthase and related dioxygenases [General function prediction only]	NA|169aa|up_5|NZ_AP018255.1_8340472_8340979_+	pfam13508, Acetyltransf_7, Acetyltransferase (GNAT) domain	PD-DExK|122aa|up_4|NZ_AP018255.1_8341153_8341519_-	NA	NA|364aa|up_3|NZ_AP018255.1_8341612_8342704_-	PRK09601, PRK09601, redox-regulated ATPase YchF	NA|123aa|up_2|NZ_AP018255.1_8342965_8343334_+	NA	NA|69aa|up_1|NZ_AP018255.1_8343641_8343848_-	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|496aa|up_0|NZ_AP018255.1_8343966_8345454_+	COG1982, LdcC, Arginine/lysine/ornithine decarboxylases [Amino acid transport and metabolism]	NA|419aa|down_0|NZ_AP018255.1_8345667_8346924_+	COG2124, CypX, Cytochrome P450 [Secondary metabolites biosynthesis, transport, and catabolism]	NA|1808aa|down_1|NZ_AP018255.1_8347047_8352471_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|245aa|down_2|NZ_AP018255.1_8352601_8353336_-	cd03378, beta_CA_cladeC, Carbonic anhydrases (CA) are zinc-containing enzymes that catalyze the reversible hydration of carbon dioxide in a two-step mechanism in which the nucleophilic attack of a zinc-bound hydroxide ion on carbon dioxide is followed by the regeneration of an active site by ionization of the zinc-bound water molecule and removal of a proton from the active site	NA|207aa|down_3|NZ_AP018255.1_8353750_8354371_-	cd19368, TenA_C_AtTH2-like, TenA_C family similar to the N-terminal TenA_C domain of Arabidopsis thaliana thiamine requiring 2	NA|257aa|down_4|NZ_AP018255.1_8354465_8355236_-	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|191aa|down_5|NZ_AP018255.1_8355710_8356283_-	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|151aa|down_6|NZ_AP018255.1_8356349_8356802_-	COG2149, COG2149, Predicted membrane protein [Function unknown]	NA|72aa|down_7|NZ_AP018255.1_8356894_8357110_-	NA	Cas14u_CAS-V|540aa|down_8|NZ_AP018255.1_8357813_8359433_-	NA	NA|1051aa|down_9|NZ_AP018255.1_8360134_8363287_-	COG0419, SbcC, ATPase involved in DNA repair [DNA replication, recombination, and repair]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	32	8355847-8355930	31	CRISPRCasFinder	no	PD-DExK,Cas14u_CAS-V	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	GCAAGGTTTGCTCCACCCATATTG	24	0	0	NA	NA	N:A	1	1	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	PD-DExK|122aa|up_9|NZ_AP018255.1_8341153_8341519_-,NA|123aa|up_7|NZ_AP018255.1_8342965_8343334_+,NA|72aa|down_1|NZ_AP018255.1_8356894_8357110_-,Cas14u_CAS-V|540aa|down_2|NZ_AP018255.1_8357813_8359433_-,NA|134aa|down_7|NZ_AP018255.1_8367137_8367539_+	PD-DExK|122aa|up_9|NZ_AP018255.1_8341153_8341519_-	NA	NA|364aa|up_8|NZ_AP018255.1_8341612_8342704_-	PRK09601, PRK09601, redox-regulated ATPase YchF	NA|123aa|up_7|NZ_AP018255.1_8342965_8343334_+	NA	NA|69aa|up_6|NZ_AP018255.1_8343641_8343848_-	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|496aa|up_5|NZ_AP018255.1_8343966_8345454_+	COG1982, LdcC, Arginine/lysine/ornithine decarboxylases [Amino acid transport and metabolism]	NA|419aa|up_4|NZ_AP018255.1_8345667_8346924_+	COG2124, CypX, Cytochrome P450 [Secondary metabolites biosynthesis, transport, and catabolism]	NA|1808aa|up_3|NZ_AP018255.1_8347047_8352471_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|245aa|up_2|NZ_AP018255.1_8352601_8353336_-	cd03378, beta_CA_cladeC, Carbonic anhydrases (CA) are zinc-containing enzymes that catalyze the reversible hydration of carbon dioxide in a two-step mechanism in which the nucleophilic attack of a zinc-bound hydroxide ion on carbon dioxide is followed by the regeneration of an active site by ionization of the zinc-bound water molecule and removal of a proton from the active site	NA|207aa|up_1|NZ_AP018255.1_8353750_8354371_-	cd19368, TenA_C_AtTH2-like, TenA_C family similar to the N-terminal TenA_C domain of Arabidopsis thaliana thiamine requiring 2	NA|257aa|up_0|NZ_AP018255.1_8354465_8355236_-	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|151aa|down_0|NZ_AP018255.1_8356349_8356802_-	COG2149, COG2149, Predicted membrane protein [Function unknown]	NA|72aa|down_1|NZ_AP018255.1_8356894_8357110_-	NA	Cas14u_CAS-V|540aa|down_2|NZ_AP018255.1_8357813_8359433_-	NA	NA|1051aa|down_3|NZ_AP018255.1_8360134_8363287_-	COG0419, SbcC, ATPase involved in DNA repair [DNA replication, recombination, and repair]	NA|656aa|down_4|NZ_AP018255.1_8363762_8365730_+	pfam11181, YflT, Heat induced stress protein YflT	NA|156aa|down_5|NZ_AP018255.1_8365839_8366307_+	pfam04972, BON, BON domain	NA|153aa|down_6|NZ_AP018255.1_8366445_8366904_+	pfam14159, CAAD, CAAD domains of cyanobacterial aminoacyl-tRNA synthetase	NA|134aa|down_7|NZ_AP018255.1_8367137_8367539_+	NA	NA|524aa|down_8|NZ_AP018255.1_8367608_8369180_-	cd07378, MPP_ACP5, Homo sapiens acid phosphatase 5 and related proteins, metallophosphatase domain	NA|319aa|down_9|NZ_AP018255.1_8369258_8370215_-	PRK00861, PRK00861, putative lipid kinase; Reviewed
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	33	9147454-9147558	32	CRISPRCasFinder	no	cas6	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	GTTACCAGACCCAGAATTTTCAGGGTCTGGTGAC	34	0	0	NA	NA	N:A	1	1	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|102aa|up_8|NZ_AP018255.1_9137154_9137460_+,NA|103aa|up_6|NZ_AP018255.1_9141316_9141625_+,NA|225aa|up_5|NZ_AP018255.1_9141831_9142506_+,NA|77aa|up_3|NZ_AP018255.1_9143671_9143902_+,NA|373aa|up_1|NZ_AP018255.1_9145383_9146502_-,NA|330aa|down_0|NZ_AP018255.1_9148139_9149129_+	NA|144aa|up_9|NZ_AP018255.1_9136726_9137158_+	COG4683, COG4683, Uncharacterized protein conserved in bacteria [Function unknown]	NA|102aa|up_8|NZ_AP018255.1_9137154_9137460_+	NA	NA|1188aa|up_7|NZ_AP018255.1_9137612_9141176_-	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|103aa|up_6|NZ_AP018255.1_9141316_9141625_+	NA	NA|225aa|up_5|NZ_AP018255.1_9141831_9142506_+	NA	NA|204aa|up_4|NZ_AP018255.1_9142793_9143405_+	cd01457, vWA_ORF176_type, VWA ORF176 type: Von Willebrand factor type A (vWA) domain was originally found in the blood coagulation protein von Willebrand factor (vWF)	NA|77aa|up_3|NZ_AP018255.1_9143671_9143902_+	NA	NA|425aa|up_2|NZ_AP018255.1_9144017_9145292_+	pfam12770, CHAT, CHAT domain	NA|373aa|up_1|NZ_AP018255.1_9145383_9146502_-	NA	NA|93aa|up_0|NZ_AP018255.1_9147116_9147395_+	TIGR04532, polyketide_synthase, iterative type I PKS product template domain	NA|330aa|down_0|NZ_AP018255.1_9148139_9149129_+	NA	NA|402aa|down_1|NZ_AP018255.1_9150087_9151293_-	COG4637, COG4637, Predicted ATPase [General function prediction only]	NA|682aa|down_2|NZ_AP018255.1_9151635_9153681_-	PRK07956, ligA, NAD-dependent DNA ligase LigA; Validated	NA|353aa|down_3|NZ_AP018255.1_9153899_9154958_-	smart00327, VWA, von Willebrand factor (vWF) type A domain	NA|461aa|down_4|NZ_AP018255.1_9155475_9156858_-	cd19920, REC_PA4781-like, phosphoacceptor receiver (REC) domain of cyclic di-GMP phosphodiesterase PA4781 and similar domains	NA|783aa|down_5|NZ_AP018255.1_9156906_9159255_-	TIGR02956, sensor_protein_TorS, TMAO reductase sytem sensor TorS	NA|417aa|down_6|NZ_AP018255.1_9159484_9160735_+	PRK09230, PRK09230, cytosine deaminase; Provisional	NA|503aa|down_7|NZ_AP018255.1_9161186_9162695_-	pfam17380, DUF5401, Family of unknown function (DUF5401)	NA|1143aa|down_8|NZ_AP018255.1_9162738_9166167_-	cd07302, CHD, cyclase homology domain	NA|198aa|down_9|NZ_AP018255.1_9166820_9167414_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	34	9201505-9201745	33,8	CRISPRCasFinder,PILER-CR	no	cas6,cas3,cas8b3,cas7,cas5,cas1,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	GTGATCAACACCTTACGGTATCTA,GTGATCAACACCTTACGGTATCTAA	24,25	0	0	NA	NA	N:A	3,2	3	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|163aa|up_8|NZ_AP018255.1_9186862_9187351_+,NA|168aa|up_6|NZ_AP018255.1_9188809_9189313_+,NA|86aa|up_0|NZ_AP018255.1_9199260_9199518_-,NA|102aa|down_5|NZ_AP018255.1_9209801_9210107_-,NA|92aa|down_6|NZ_AP018255.1_9210629_9210905_+,NA|92aa|down_9|NZ_AP018255.1_9214489_9214765_-	NA|305aa|up_9|NZ_AP018255.1_9185745_9186660_+	pfam01636, APH, Phosphotransferase enzyme family	NA|163aa|up_8|NZ_AP018255.1_9186862_9187351_+	NA	NA|128aa|up_7|NZ_AP018255.1_9187888_9188272_+	cd08359, VOC_like, uncharacterized subfamily of vicinal oxygen chelate (VOC) family	NA|168aa|up_6|NZ_AP018255.1_9188809_9189313_+	NA	NA|371aa|up_5|NZ_AP018255.1_9192557_9193670_-	pfam00144, Beta-lactamase, Beta-lactamase	NA|116aa|up_4|NZ_AP018255.1_9193701_9194049_-	pfam12680, SnoaL_2, SnoaL-like domain	NA|64aa|up_3|NZ_AP018255.1_9194121_9194313_-	pfam00892, EamA, EamA-like transporter family	NA|452aa|up_2|NZ_AP018255.1_9194418_9195774_+	TIGR01730, COG0845:_Membrane-fusion_protein, RND family efflux transporter, MFP subunit	NA|1055aa|up_1|NZ_AP018255.1_9195834_9198999_+	COG0841, AcrB, Cation/multidrug efflux pump [Defense mechanisms]	NA|86aa|up_0|NZ_AP018255.1_9199260_9199518_-	NA	cas6|238aa|down_0|NZ_AP018255.1_9202224_9202938_+	pfam09559, Cas6, Cas6 Crispr	cas3|809aa|down_1|NZ_AP018255.1_9202967_9205394_+	cd09639, Cas3_I, CRISPR/Cas system-associated protein Cas3	cas8b3|523aa|down_2|NZ_AP018255.1_9205384_9206953_+	TIGR03485, hypothetical_protein_L8106_30105, CRISPR-associated protein Cas8a1/Csx13, MYXAN subtype	cas7|312aa|down_3|NZ_AP018255.1_9207020_9207956_+	cd09687, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	cas5|221aa|down_4|NZ_AP018255.1_9207952_9208615_+	cd09688, Cas5_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas5	NA|102aa|down_5|NZ_AP018255.1_9209801_9210107_-	NA	NA|92aa|down_6|NZ_AP018255.1_9210629_9210905_+	NA	cas1|555aa|down_7|NZ_AP018255.1_9210934_9212599_+	TIGR03983, hypothetical_protein_LA3181, CRISPR-associated endonuclease Cas1, subtype MYXAN	cas2|98aa|down_8|NZ_AP018255.1_9212615_9212909_+	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|92aa|down_9|NZ_AP018255.1_9214489_9214765_-	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	35	9208975-9210597	34,8,35	CRISPRCasFinder,CRT,CRISPRCasFinder	no	cas6,cas3,cas8b3,cas7,cas5,cas1,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	GTGTTTTAACCTTAGATGTCGAAAGGCGTTGAGCAT,GTGTTTTAACCTTAGATGTCGNNAAGGCGTTGAGCA,GTGTTTTAACCTTAGATGTCGAAAGGCGTTGAGCAT	36,36,36	0	0	NA	NA	N:A	20,21,20	21	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|86aa|up_5|NZ_AP018255.1_9199260_9199518_-,NA|92aa|down_0|NZ_AP018255.1_9210629_9210905_+,NA|92aa|down_3|NZ_AP018255.1_9214489_9214765_-,NA|82aa|down_4|NZ_AP018255.1_9214951_9215197_-,NA|62aa|down_5|NZ_AP018255.1_9215379_9215565_+,NA|280aa|down_6|NZ_AP018255.1_9215651_9216491_-,NA|513aa|down_7|NZ_AP018255.1_9216623_9218162_-	NA|116aa|up_9|NZ_AP018255.1_9193701_9194049_-	pfam12680, SnoaL_2, SnoaL-like domain	NA|64aa|up_8|NZ_AP018255.1_9194121_9194313_-	pfam00892, EamA, EamA-like transporter family	NA|452aa|up_7|NZ_AP018255.1_9194418_9195774_+	TIGR01730, COG0845:_Membrane-fusion_protein, RND family efflux transporter, MFP subunit	NA|1055aa|up_6|NZ_AP018255.1_9195834_9198999_+	COG0841, AcrB, Cation/multidrug efflux pump [Defense mechanisms]	NA|86aa|up_5|NZ_AP018255.1_9199260_9199518_-	NA	cas6|238aa|up_4|NZ_AP018255.1_9202224_9202938_+	pfam09559, Cas6, Cas6 Crispr	cas3|809aa|up_3|NZ_AP018255.1_9202967_9205394_+	cd09639, Cas3_I, CRISPR/Cas system-associated protein Cas3	cas8b3|523aa|up_2|NZ_AP018255.1_9205384_9206953_+	TIGR03485, hypothetical_protein_L8106_30105, CRISPR-associated protein Cas8a1/Csx13, MYXAN subtype	cas7|312aa|up_1|NZ_AP018255.1_9207020_9207956_+	cd09687, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	cas5|221aa|up_0|NZ_AP018255.1_9207952_9208615_+	cd09688, Cas5_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas5	NA|92aa|down_0|NZ_AP018255.1_9210629_9210905_+	NA	cas1|555aa|down_1|NZ_AP018255.1_9210934_9212599_+	TIGR03983, hypothetical_protein_LA3181, CRISPR-associated endonuclease Cas1, subtype MYXAN	cas2|98aa|down_2|NZ_AP018255.1_9212615_9212909_+	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|92aa|down_3|NZ_AP018255.1_9214489_9214765_-	NA	NA|82aa|down_4|NZ_AP018255.1_9214951_9215197_-	NA	NA|62aa|down_5|NZ_AP018255.1_9215379_9215565_+	NA	NA|280aa|down_6|NZ_AP018255.1_9215651_9216491_-	NA	NA|513aa|down_7|NZ_AP018255.1_9216623_9218162_-	NA	NA|268aa|down_8|NZ_AP018255.1_9218532_9219336_+	COG4242, CphB, Cyanophycinase and related exopeptidases [Secondary metabolites biosynthesis, transport, and catabolism / Inorganic ion transport and metabolism]	NA|394aa|down_9|NZ_AP018255.1_9219447_9220629_-	COG2267, PldB, Lysophospholipase [Lipid metabolism]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	36	9213083-9214485	9,9,36	CRT,PILER-CR,CRISPRCasFinder	no	cas6,cas3,cas8b3,cas7,cas5,cas1,cas2	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	GTGCTGTAACCTTAGATGTCGTAAGGCGTTGAGCAG,GTGCTGTAACCTTAGATGTCGTAAGGCGTTGAGCAG,GTGCTGTAACCTTAGATGTCGTAAGGCGTTGAGCAG	36,36,36	0	0	NA	NA	N:A	19,17,18	19	Unclear	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|86aa|up_9|NZ_AP018255.1_9199260_9199518_-,NA|102aa|up_3|NZ_AP018255.1_9209801_9210107_-,NA|92aa|up_2|NZ_AP018255.1_9210629_9210905_+,NA|92aa|down_0|NZ_AP018255.1_9214489_9214765_-,NA|82aa|down_1|NZ_AP018255.1_9214951_9215197_-,NA|62aa|down_2|NZ_AP018255.1_9215379_9215565_+,NA|280aa|down_3|NZ_AP018255.1_9215651_9216491_-,NA|513aa|down_4|NZ_AP018255.1_9216623_9218162_-,NA|81aa|down_8|NZ_AP018255.1_9221070_9221313_+,NA|133aa|down_9|NZ_AP018255.1_9223314_9223713_-	NA|86aa|up_9|NZ_AP018255.1_9199260_9199518_-	NA	cas6|238aa|up_8|NZ_AP018255.1_9202224_9202938_+	pfam09559, Cas6, Cas6 Crispr	cas3|809aa|up_7|NZ_AP018255.1_9202967_9205394_+	cd09639, Cas3_I, CRISPR/Cas system-associated protein Cas3	cas8b3|523aa|up_6|NZ_AP018255.1_9205384_9206953_+	TIGR03485, hypothetical_protein_L8106_30105, CRISPR-associated protein Cas8a1/Csx13, MYXAN subtype	cas7|312aa|up_5|NZ_AP018255.1_9207020_9207956_+	cd09687, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	cas5|221aa|up_4|NZ_AP018255.1_9207952_9208615_+	cd09688, Cas5_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas5	NA|102aa|up_3|NZ_AP018255.1_9209801_9210107_-	NA	NA|92aa|up_2|NZ_AP018255.1_9210629_9210905_+	NA	cas1|555aa|up_1|NZ_AP018255.1_9210934_9212599_+	TIGR03983, hypothetical_protein_LA3181, CRISPR-associated endonuclease Cas1, subtype MYXAN	cas2|98aa|up_0|NZ_AP018255.1_9212615_9212909_+	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|92aa|down_0|NZ_AP018255.1_9214489_9214765_-	NA	NA|82aa|down_1|NZ_AP018255.1_9214951_9215197_-	NA	NA|62aa|down_2|NZ_AP018255.1_9215379_9215565_+	NA	NA|280aa|down_3|NZ_AP018255.1_9215651_9216491_-	NA	NA|513aa|down_4|NZ_AP018255.1_9216623_9218162_-	NA	NA|268aa|down_5|NZ_AP018255.1_9218532_9219336_+	COG4242, CphB, Cyanophycinase and related exopeptidases [Secondary metabolites biosynthesis, transport, and catabolism / Inorganic ion transport and metabolism]	NA|394aa|down_6|NZ_AP018255.1_9219447_9220629_-	COG2267, PldB, Lysophospholipase [Lipid metabolism]	NA|100aa|down_7|NZ_AP018255.1_9220774_9221074_+	COG2026, RelE, Cytotoxic translational repressor of toxin-antitoxin stability system [Translation, ribosomal structure and biogenesis / Cell division and chromosome partitioning]	NA|81aa|down_8|NZ_AP018255.1_9221070_9221313_+	NA	NA|133aa|down_9|NZ_AP018255.1_9223314_9223713_-	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	37	9705864-9705948	37	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	AGTGCTGAGTCAAGAAACAGTGCTGAGT	28	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|97aa|up_9|NZ_AP018255.1_9692528_9692819_+,NA|188aa|up_8|NZ_AP018255.1_9693067_9693631_+,NA|67aa|up_6|NZ_AP018255.1_9697993_9698194_-,NA|126aa|up_5|NZ_AP018255.1_9698356_9698734_-,NA|115aa|up_3|NZ_AP018255.1_9700825_9701170_+,NA|156aa|up_1|NZ_AP018255.1_9701974_9702442_+,NA|214aa|up_0|NZ_AP018255.1_9702564_9703206_-,NA|143aa|down_2|NZ_AP018255.1_9709625_9710054_-,NA|100aa|down_8|NZ_AP018255.1_9717069_9717369_-	NA|97aa|up_9|NZ_AP018255.1_9692528_9692819_+	NA	NA|188aa|up_8|NZ_AP018255.1_9693067_9693631_+	NA	NA|419aa|up_7|NZ_AP018255.1_9696563_9697820_-	smart00812, Alpha_L_fucos, Alpha-L-fucosidase	NA|67aa|up_6|NZ_AP018255.1_9697993_9698194_-	NA	NA|126aa|up_5|NZ_AP018255.1_9698356_9698734_-	NA	NA|605aa|up_4|NZ_AP018255.1_9698782_9700597_-	sd00006, TPR, Tetratricopeptide repeat	NA|115aa|up_3|NZ_AP018255.1_9700825_9701170_+	NA	NA|248aa|up_2|NZ_AP018255.1_9701192_9701936_+	PRK14831, PRK14831, undecaprenyl pyrophosphate synthase; Provisional	NA|156aa|up_1|NZ_AP018255.1_9701974_9702442_+	NA	NA|214aa|up_0|NZ_AP018255.1_9702564_9703206_-	NA	NA|88aa|down_0|NZ_AP018255.1_9708218_9708482_-	pfam00030, Crystall, Beta/Gamma crystallin	NA|143aa|down_1|NZ_AP018255.1_9708595_9709024_-	pfam06271, RDD, RDD family	NA|143aa|down_2|NZ_AP018255.1_9709625_9710054_-	NA	NA|74aa|down_3|NZ_AP018255.1_9710495_9710717_+	pfam13443, HTH_26, Cro/C1-type HTH DNA-binding domain	NA|314aa|down_4|NZ_AP018255.1_9711212_9712154_-	pfam11051, Mannosyl_trans3, Mannosyltransferase putative	NA|335aa|down_5|NZ_AP018255.1_9712158_9713163_-	cd04194, GT8_A4GalT_like, A4GalT_like proteins catalyze the addition of galactose or glucose residues to the lipooligosaccharide (LOS) or lipopolysaccharide (LPS) of the bacterial cell surface	NA|782aa|down_6|NZ_AP018255.1_9713391_9715737_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|392aa|down_7|NZ_AP018255.1_9715808_9716984_-	cd03801, GT4_PimA-like, phosphatidyl-myo-inositol mannosyltransferase	NA|100aa|down_8|NZ_AP018255.1_9717069_9717369_-	NA	NA|364aa|down_9|NZ_AP018255.1_9717582_9718674_-	cd03813, GT4-like, glycosyltransferase family 4 proteins
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	38	9775374-9775461	38	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	GAAATTGATGTGAACCCACCCGTACTAT	28	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|64aa|up_2|NZ_AP018255.1_9770772_9770964_-,NA|225aa|down_6|NZ_AP018255.1_9784219_9784894_+,NA|247aa|down_7|NZ_AP018255.1_9785432_9786173_+,NA|116aa|down_8|NZ_AP018255.1_9786217_9786565_+	NA|258aa|up_9|NZ_AP018255.1_9760774_9761548_-	PRK00311, panB, 3-methyl-2-oxobutanoate hydroxymethyltransferase; Reviewed	NA|355aa|up_8|NZ_AP018255.1_9761863_9762928_-	COG3292, COG3292, Predicted periplasmic ligand-binding sensor domain [Signal transduction mechanisms]	NA|477aa|up_7|NZ_AP018255.1_9763666_9765097_+	CHL00040, rbcL, ribulose-1,5-bisphosphate carboxylase/oxygenase large subunit	NA|133aa|up_6|NZ_AP018255.1_9765287_9765686_+	pfam02341, RcbX, RbcX protein	NA|117aa|up_5|NZ_AP018255.1_9765744_9766095_+	pfam00101, RuBisCO_small, Ribulose bisphosphate carboxylase, small chain	NA|207aa|up_4|NZ_AP018255.1_9766397_9767018_+	cd01835, SGNH_hydrolase_like_3, SGNH_hydrolase subfamily	NA|114aa|up_3|NZ_AP018255.1_9770197_9770539_+	cd16382, XisI-like, XisI is FdxN element excision controlling factor protein	NA|64aa|up_2|NZ_AP018255.1_9770772_9770964_-	NA	NA|843aa|up_1|NZ_AP018255.1_9771454_9773983_+	cd05805, MPG1_transferase, GTP-mannose-1-phosphate guanyltransferase (MPG1 transferase), also known as GDP-mannose pyrophosphorylase, is a bifunctional enzyme with both phosphomannose isomerase (PMI) activity and GDP-mannose phosphorylase (GMP) activity	NA|397aa|up_0|NZ_AP018255.1_9774175_9775366_+	PRK04149, sat, sulfate adenylyltransferase; Reviewed	NA|706aa|down_0|NZ_AP018255.1_9775640_9777758_+	pfam00656, Peptidase_C14, Caspase domain	NA|291aa|down_1|NZ_AP018255.1_9777800_9778673_-	PRK07432, PRK07432, S-methyl-5'-thioadenosine phosphorylase	NA|620aa|down_2|NZ_AP018255.1_9779148_9781008_+	cd01948, EAL, EAL domain	NA|253aa|down_3|NZ_AP018255.1_9780979_9781738_-	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|213aa|down_4|NZ_AP018255.1_9781860_9782499_-	cd07051, BMC_like_1_repeat1, Bacterial Micro-Compartment (BMC)-like domain 1 repeat 1	NA|493aa|down_5|NZ_AP018255.1_9782660_9784139_+	TIGR02881, Stage_V_sporulation_protein_K, stage V sporulation protein K	NA|225aa|down_6|NZ_AP018255.1_9784219_9784894_+	NA	NA|247aa|down_7|NZ_AP018255.1_9785432_9786173_+	NA	NA|116aa|down_8|NZ_AP018255.1_9786217_9786565_+	NA	NA|420aa|down_9|NZ_AP018255.1_9787133_9788393_-	TIGR02779, NHEJ_ligase_lig, DNA ligase D, ligase domain
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	39	10109837-10109950	39	CRISPRCasFinder	no	RT	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	AAATGTGAACCGTGGTTCACAAATACA	27	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|100aa|up_9|NZ_AP018255.1_10098388_10098688_+,NA|62aa|up_3|NZ_AP018255.1_10105968_10106154_-,NA|149aa|up_0|NZ_AP018255.1_10109302_10109749_+,NA|164aa|down_0|NZ_AP018255.1_10109968_10110460_-,NA|120aa|down_1|NZ_AP018255.1_10110605_10110965_-,NA|115aa|down_2|NZ_AP018255.1_10111221_10111566_-	NA|100aa|up_9|NZ_AP018255.1_10098388_10098688_+	NA	NA|433aa|up_8|NZ_AP018255.1_10098795_10100094_-	PRK00062, PRK00062, glutamate-1-semialdehyde 2,1-aminomutase	NA|62aa|up_7|NZ_AP018255.1_10100202_10100388_+	COG4572, ChaB, Putative cation transport regulator [General function prediction only]	NA|216aa|up_6|NZ_AP018255.1_10100510_10101158_+	PRK02759, PRK02759, bifunctional phosphoribosyl-AMP cyclohydrolase/phosphoribosyl-ATP diphosphatase HisIE	RT|305aa|up_5|NZ_AP018255.1_10101781_10102696_-	TIGR04416, hypothetical_protein, group II intron reverse transcriptase/maturase	RT|595aa|up_4|NZ_AP018255.1_10102832_10104617_-	cd01651, RT_G2_intron, RT_G2_intron: Reverse transcriptases (RTs) with group II intron origin	NA|62aa|up_3|NZ_AP018255.1_10105968_10106154_-	NA	NA|122aa|up_2|NZ_AP018255.1_10106860_10107226_+	pfam01797, Y1_Tnp, Transposase IS200 like	NA|444aa|up_1|NZ_AP018255.1_10107589_10108921_+	COG2821, MltA, Membrane-bound lytic murein transglycosylase [Cell envelope biogenesis, outer membrane]	NA|149aa|up_0|NZ_AP018255.1_10109302_10109749_+	NA	NA|164aa|down_0|NZ_AP018255.1_10109968_10110460_-	NA	NA|120aa|down_1|NZ_AP018255.1_10110605_10110965_-	NA	NA|115aa|down_2|NZ_AP018255.1_10111221_10111566_-	NA	NA|114aa|down_3|NZ_AP018255.1_10111740_10112082_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|220aa|down_4|NZ_AP018255.1_10112184_10112844_-	cd10917, CE4_NodB_like_6s_7s, Catalytic NodB homology domain of rhizobial NodB-like proteins	NA|1056aa|down_5|NZ_AP018255.1_10113107_10116275_+	cd02080, P-type_ATPase_cation, P-type cation-transporting ATPase similar to Exiguobacterium aurantiacum Mna, an Na(+)-ATPase, and Synechocystis sp	NA|103aa|down_6|NZ_AP018255.1_10116568_10116877_+	pfam09907, HigB_toxin, HigB_toxin, RelE-like toxic component of a toxin-antitoxin system	NA|144aa|down_7|NZ_AP018255.1_10116968_10117400_+	COG5499, COG5499, Predicted transcription regulator containing HTH domain [Transcription]	NA|97aa|down_8|NZ_AP018255.1_10118303_10118594_+	COG1669, COG1669, Predicted nucleotidyltransferases [General function prediction only]	NA|116aa|down_9|NZ_AP018255.1_10118583_10118931_+	COG2361, COG2361, Uncharacterized conserved protein [Function unknown]
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	40	10220432-10220524	40	CRISPRCasFinder	no	cas14j	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Unclear	GCGTCACGCACCGGCTTAAAATTGTGACT	29	0	0	NA	NA	N:A	1	1	TypeV	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|134aa|up_7|NZ_AP018255.1_10212515_10212917_-,NA|62aa|up_6|NZ_AP018255.1_10213632_10213818_+,NA|114aa|up_2|NZ_AP018255.1_10218171_10218513_+,NA|61aa|up_1|NZ_AP018255.1_10218577_10218760_-,NA|75aa|down_3|NZ_AP018255.1_10223953_10224178_-,NA|81aa|down_4|NZ_AP018255.1_10224465_10224708_-,NA|218aa|down_7|NZ_AP018255.1_10226082_10226736_-	NA|575aa|up_9|NZ_AP018255.1_10208850_10210575_-	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|488aa|up_8|NZ_AP018255.1_10210991_10212455_+	cd11338, AmyAc_CMD, Alpha amylase catalytic domain found in cyclomaltodextrinases and related proteins	NA|134aa|up_7|NZ_AP018255.1_10212515_10212917_-	NA	NA|62aa|up_6|NZ_AP018255.1_10213632_10213818_+	NA	NA|361aa|up_5|NZ_AP018255.1_10213876_10214959_-	PRK09250, PRK09250, class I fructose-bisphosphate aldolase	NA|80aa|up_4|NZ_AP018255.1_10215771_10216011_-	pfam01797, Y1_Tnp, Transposase IS200 like	cas14j|558aa|up_3|NZ_AP018255.1_10216071_10217745_+	COG0675, COG0675, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|114aa|up_2|NZ_AP018255.1_10218171_10218513_+	NA	NA|61aa|up_1|NZ_AP018255.1_10218577_10218760_-	NA	NA|391aa|up_0|NZ_AP018255.1_10219167_10220340_-	pfam00144, Beta-lactamase, Beta-lactamase	NA|32aa|down_0|NZ_AP018255.1_10220897_10220993_+	pfam02634, FdhD-NarQ, FdhD/NarQ family	NA|515aa|down_1|NZ_AP018255.1_10221393_10222938_+	pfam00743, FMO-like, Flavin-binding monooxygenase-like	NA|213aa|down_2|NZ_AP018255.1_10223267_10223906_-	pfam14124, DUF4291, Domain of unknown function (DUF4291)	NA|75aa|down_3|NZ_AP018255.1_10223953_10224178_-	NA	NA|81aa|down_4|NZ_AP018255.1_10224465_10224708_-	NA	NA|249aa|down_5|NZ_AP018255.1_10224904_10225651_+	cd10001, HDAC_classII_APAH, Histone deacetylase class IIa	NA|108aa|down_6|NZ_AP018255.1_10225753_10226077_+	cd10001, HDAC_classII_APAH, Histone deacetylase class IIa	NA|218aa|down_7|NZ_AP018255.1_10226082_10226736_-	NA	NA|124aa|down_8|NZ_AP018255.1_10226909_10227281_+	cd07264, VOC_like, uncharacterized subfamily of vicinal oxygen chelate (VOC) family	NA|299aa|down_9|NZ_AP018255.1_10227369_10228266_+	PRK09563, rbgA, GTPase YlqF; Reviewed
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	41	10389858-10390189	10	PILER-CR	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	TGTTCGCTGTGAAGTTGCCA	20	0	0	NA	NA	N:A	4	4	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|216aa|up_9|NZ_AP018255.1_10381997_10382645_-,NA|109aa|up_5|NZ_AP018255.1_10385292_10385619_-,NA|102aa|up_4|NZ_AP018255.1_10385874_10386180_-,NA|74aa|up_2|NZ_AP018255.1_10386903_10387125_+,NA|118aa|down_0|NZ_AP018255.1_10390194_10390548_-,NA|186aa|down_1|NZ_AP018255.1_10390755_10391313_-,NA|117aa|down_7|NZ_AP018255.1_10398205_10398556_+,NA|187aa|down_8|NZ_AP018255.1_10398669_10399230_+,NA|67aa|down_9|NZ_AP018255.1_10399297_10399498_-	NA|216aa|up_9|NZ_AP018255.1_10381997_10382645_-	NA	NA|88aa|up_8|NZ_AP018255.1_10383065_10383329_-	COG2197, CitB, Response regulator containing a CheY-like receiver domain and an HTH DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|323aa|up_7|NZ_AP018255.1_10383635_10384604_+	cd01167, bac_FRK, Fructokinases (FRKs) mainly from bacteria and plants are enzymes with high specificity for fructose, as are all FRKs, but they catalyzes the conversion of fructose to fructose-6-phosphate, which is an entry point into glycolysis via conversion into glucose-6-phosphate	NA|130aa|up_6|NZ_AP018255.1_10384858_10385248_+	cd02980, TRX_Fd_family, Thioredoxin (TRX)-like [2Fe-2S] Ferredoxin (Fd) family; composed of [2Fe-2S] Fds with a TRX fold (TRX-like Fds) and proteins containing domains similar to TRX-like Fd including formate dehydrogenases, NAD-reducing hydrogenases and the subunit E of NADH:ubiquinone oxidoreductase (NuoE)	NA|109aa|up_5|NZ_AP018255.1_10385292_10385619_-	NA	NA|102aa|up_4|NZ_AP018255.1_10385874_10386180_-	NA	NA|156aa|up_3|NZ_AP018255.1_10386223_10386691_-	COG3265, GntK, Gluconate kinase [Carbohydrate transport and metabolism]	NA|74aa|up_2|NZ_AP018255.1_10386903_10387125_+	NA	NA|471aa|up_1|NZ_AP018255.1_10387361_10388774_+	smart00563, PlsC, Phosphate acyltransferases	NA|161aa|up_0|NZ_AP018255.1_10388824_10389307_-	cd17036, T3SC_YbjN-like_1, T110839 is structurally similar to type III secretion system chaperones and YbjN family proteins	NA|118aa|down_0|NZ_AP018255.1_10390194_10390548_-	NA	NA|186aa|down_1|NZ_AP018255.1_10390755_10391313_-	NA	NA|373aa|down_2|NZ_AP018255.1_10391299_10392418_-	pfam13304, AAA_21, AAA domain, putative AbiEii toxin, Type IV TA system	NA|354aa|down_3|NZ_AP018255.1_10393542_10394604_+	COG4638, HcaE, Phenylpropionate dioxygenase and related ring-hydroxylating dioxygenases, large terminal subunit [Inorganic ion transport and metabolism / General function prediction only]	NA|343aa|down_4|NZ_AP018255.1_10394695_10395724_-	pfam10017, Methyltransf_33, Histidine-specific methyltransferase, SAM-dependent	NA|414aa|down_5|NZ_AP018255.1_10395940_10397182_-	TIGR03440, egtB_TIGR03440, ergothioneine biosynthesis protein EgtB	NA|288aa|down_6|NZ_AP018255.1_10397156_10398020_-	TIGR03442, TIGR03442, ergothioneine biosynthesis protein EgtC	NA|117aa|down_7|NZ_AP018255.1_10398205_10398556_+	NA	NA|187aa|down_8|NZ_AP018255.1_10398669_10399230_+	NA	NA|67aa|down_9|NZ_AP018255.1_10399297_10399498_-	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	42	10702223-10702313	41	CRISPRCasFinder	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	AGTGCGCTCGTGCGCTCGTGCTGAGT	26	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA,NA|134aa|down_0|NZ_AP018255.1_10702485_10702887_+,NA|419aa|down_2|NZ_AP018255.1_10703386_10704643_-,NA|112aa|down_6|NZ_AP018255.1_10709037_10709373_+,NA|151aa|down_9|NZ_AP018255.1_10711282_10711735_+	NA|363aa|up_9|NZ_AP018255.1_10681779_10682868_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|483aa|up_8|NZ_AP018255.1_10682895_10684344_-	PRK09302, PRK09302, circadian clock protein KaiC; Reviewed	NA|1060aa|up_7|NZ_AP018255.1_10687483_10690663_-	COG0643, CheA, Chemotaxis protein histidine kinase and related kinases [Cell motility and secretion / Signal transduction mechanisms]	NA|924aa|up_6|NZ_AP018255.1_10691034_10693806_-	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|166aa|up_5|NZ_AP018255.1_10693999_10694497_-	COG0835, CheW, Chemotaxis signal transduction protein [Cell motility and secretion / Signal transduction mechanisms]	NA|126aa|up_4|NZ_AP018255.1_10694503_10694881_-	cd17538, REC_D1_PleD-like, first (D1) phosphoacceptor receiver (REC) domain of response regulator PleD and similar domains	NA|366aa|up_3|NZ_AP018255.1_10694985_10696083_-	cd17602, REC_PatA-like, phosphoacceptor receiver (REC) domain of PatA and similar domains	NA|394aa|up_2|NZ_AP018255.1_10697123_10698305_-	PRK00053, alr, alanine racemase; Reviewed	NA|166aa|up_1|NZ_AP018255.1_10698766_10699264_+	COG1403, McrA, Restriction endonuclease [Defense mechanisms]	NA|423aa|up_0|NZ_AP018255.1_10699687_10700956_+	COG0618, COG0618, Exopolyphosphatase-related proteins [General function prediction only]	NA|134aa|down_0|NZ_AP018255.1_10702485_10702887_+	NA	NA|140aa|down_1|NZ_AP018255.1_10702886_10703306_+	cd00085, HNHc, HNH nucleases; HNH endonuclease signature which is found in viral, prokaryotic, and eukaryotic proteins	NA|419aa|down_2|NZ_AP018255.1_10703386_10704643_-	NA	NA|108aa|down_3|NZ_AP018255.1_10704814_10705138_-	PRK13564, PRK13564, anthranilate synthase component 1	NA|754aa|down_4|NZ_AP018255.1_10705564_10707826_-	cd05387, BY-kinase, bacterial tyrosine-kinase	NA|84aa|down_5|NZ_AP018255.1_10708567_10708819_+	pfam13692, Glyco_trans_1_4, Glycosyl transferases group 1	NA|112aa|down_6|NZ_AP018255.1_10709037_10709373_+	NA	NA|417aa|down_7|NZ_AP018255.1_10709397_10710648_-	TIGR00275, TIGR00275, flavoprotein, HI0933 family	NA|55aa|down_8|NZ_AP018255.1_10710755_10710920_-	cd00730, rubredoxin, Rubredoxin; nonheme iron binding domains containing a [Fe(SCys)4] center	NA|151aa|down_9|NZ_AP018255.1_10711282_10711735_+	NA
GCF_002368455.1_ASM236845v1	NZ_AP018255	Calothrix sp. NIES-4071 DNA, complete genome	43	10949304-10949461	11	PILER-CR	no		cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2	Orphan	ATTACTACCACCACCACCACCACCAT	26	0	0	NA	NA	N:A	2	2	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA,NA|839aa|down_2|NZ_AP018255.1_10956291_10958808_-,NA|270aa|down_9|NZ_AP018255.1_10967088_10967898_+	NA|150aa|up_9|NZ_AP018255.1_10935217_10935667_-	cd17557, REC_Rcp-like, phosphoacceptor receiver (REC) domain of cyanobacterial phytochrome response regulator Rcp and similar domains	NA|473aa|up_8|NZ_AP018255.1_10935663_10937082_-	COG4251, COG4251, Bacteriophytochrome (light-regulated signal transduction histidine kinase) [Signal transduction mechanisms]	NA|416aa|up_7|NZ_AP018255.1_10937715_10938963_-	COG1223, COG1223, Predicted ATPase (AAA+ superfamily) [General function prediction only]	NA|49aa|up_6|NZ_AP018255.1_10940434_10940581_+	PRK02106, PRK02106, choline dehydrogenase; Validated	NA|36aa|up_5|NZ_AP018255.1_10940605_10940713_+	PRK02106, PRK02106, choline dehydrogenase; Validated	NA|852aa|up_4|NZ_AP018255.1_10940680_10943236_-	pfam05860, Haemagg_act, haemagglutination activity domain	NA|144aa|up_3|NZ_AP018255.1_10943272_10943704_-	COG0654, UbiH, 2-polyprenyl-6-methoxyphenol hydroxylase and related FAD-dependent oxidoreductases [Coenzyme metabolism / Energy production and conversion]	NA|640aa|up_2|NZ_AP018255.1_10943889_10945809_-	cd17640, LC_FACS_like, Long-chain fatty acid CoA synthetase	NA|114aa|up_1|NZ_AP018255.1_10946440_10946782_-	pfam18480, DUF5615, Domain of unknown function (DUF5615)	NA|109aa|up_0|NZ_AP018255.1_10946781_10947108_-	COG2442, COG2442, Uncharacterized conserved protein [Function unknown]	NA|483aa|down_0|NZ_AP018255.1_10954052_10955501_-	TIGR01451, unnamed_protein_product, conserved repeat domain	NA|190aa|down_1|NZ_AP018255.1_10955635_10956205_-	COG4719, COG4719, Uncharacterized protein conserved in bacteria [Function unknown]	NA|839aa|down_2|NZ_AP018255.1_10956291_10958808_-	NA	NA|193aa|down_3|NZ_AP018255.1_10959727_10960306_-	cd04496, SSB_OBF, SSB_OBF: A subfamily of OB folds similar to the OB fold of ssDNA-binding protein (SSB)	NA|437aa|down_4|NZ_AP018255.1_10960752_10962063_+	PRK11650, ugpC, sn-glycerol-3-phosphate ABC transporter ATP-binding protein UgpC	NA|356aa|down_5|NZ_AP018255.1_10962187_10963255_-	COG0435, ECM4, Predicted glutathione S-transferase [Posttranslational modification, protein turnover, chaperones]	NA|77aa|down_6|NZ_AP018255.1_10964052_10964283_+	COG1598, COG1598, Predicted nuclease of the RNAse H fold, HicB family [General    function prediction only]	NA|192aa|down_7|NZ_AP018255.1_10964763_10965339_-	COG1463, Ttg2C, ABC-type transport system involved in resistance to organic solvents, periplasmic component [Secondary metabolites biosynthesis, transport, and catabolism]	NA|351aa|down_8|NZ_AP018255.1_10965738_10966791_-	PRK00143, mnmA, tRNA-specific 2-thiouridylase MnmA; Reviewed	NA|270aa|down_9|NZ_AP018255.1_10967088_10967898_+	NA
GCF_002368455.1_ASM236845v1	NZ_AP018257	Calothrix sp. NIES-4071 plasmid plasmid2 DNA, complete genome	1	137285-137382	1	CRISPRCasFinder	no		RT,Cas9_archaeal,c2c10_CAS-V-U3	Orphan	GGCTACACCAAAAGGTATAGAAAAAC	26	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|283aa|up_9|NZ_AP018257.1_126071_126920_+,NA|333aa|up_5|NZ_AP018257.1_132534_133533_-,NA|94aa|up_4|NZ_AP018257.1_133923_134205_+,NA|115aa|up_3|NZ_AP018257.1_134373_134718_-,NA|72aa|up_0|NZ_AP018257.1_136841_137057_+,NA|115aa|down_1|NZ_AP018257.1_138878_139223_-,NA|103aa|down_2|NZ_AP018257.1_140120_140429_-,NA|118aa|down_7|NZ_AP018257.1_144389_144743_-,NA|81aa|down_8|NZ_AP018257.1_145076_145319_-,NA|87aa|down_9|NZ_AP018257.1_145512_145773_+	NA|283aa|up_9|NZ_AP018257.1_126071_126920_+	NA	NA|70aa|up_8|NZ_AP018257.1_127000_127210_-	pfam05860, Haemagg_act, haemagglutination activity domain	NA|651aa|up_7|NZ_AP018257.1_128881_130834_+	COG3349, COG3349, Uncharacterized conserved protein [Function unknown]	NA|478aa|up_6|NZ_AP018257.1_130963_132397_+	COG3670, COG3670, Lignostilbene-alpha,beta-dioxygenase and related enzymes [Secondary metabolites biosynthesis, transport, and catabolism]	NA|333aa|up_5|NZ_AP018257.1_132534_133533_-	NA	NA|94aa|up_4|NZ_AP018257.1_133923_134205_+	NA	NA|115aa|up_3|NZ_AP018257.1_134373_134718_-	NA	NA|81aa|up_2|NZ_AP018257.1_134751_134994_-	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|421aa|up_1|NZ_AP018257.1_135423_136686_+	PRK12705, PRK12705, hypothetical protein; Provisional	NA|72aa|up_0|NZ_AP018257.1_136841_137057_+	NA	NA|166aa|down_0|NZ_AP018257.1_137556_138054_-	COG1525, COG1525, Micrococcal nuclease (thermonuclease) homologs [DNA replication, recombination, and repair]	NA|115aa|down_1|NZ_AP018257.1_138878_139223_-	NA	NA|103aa|down_2|NZ_AP018257.1_140120_140429_-	NA	NA|130aa|down_3|NZ_AP018257.1_140644_141034_-	pfam13730, HTH_36, Helix-turn-helix domain	NA|260aa|down_4|NZ_AP018257.1_141304_142084_+	cd09279, RNase_HI_like, RNAse HI family that includes archaeal, some bacterial as well as plant RNase HI	NA|297aa|down_5|NZ_AP018257.1_142527_143418_+	COG4469, CoiA, Competence protein CoiA-like family, contains a predicted nuclease    domain [General function prediction only]	NA|151aa|down_6|NZ_AP018257.1_143753_144206_-	PRK04654, PRK04654, sec-independent translocase; Provisional	NA|118aa|down_7|NZ_AP018257.1_144389_144743_-	NA	NA|81aa|down_8|NZ_AP018257.1_145076_145319_-	NA	NA|87aa|down_9|NZ_AP018257.1_145512_145773_+	NA
GCF_002368455.1_ASM236845v1	NZ_AP018257	Calothrix sp. NIES-4071 plasmid plasmid2 DNA, complete genome	2	155031-155161	2	CRISPRCasFinder	no		RT,Cas9_archaeal,c2c10_CAS-V-U3	Orphan	ATACAGCGGTACTTATCCTAACTGCGTGGCGCCTCCTCCACCAC	44	0	0	NA	NA	N:A	1	1	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|81aa|up_9|NZ_AP018257.1_145076_145319_-,NA|87aa|up_8|NZ_AP018257.1_145512_145773_+,NA|270aa|up_7|NZ_AP018257.1_145843_146653_+,NA|337aa|up_6|NZ_AP018257.1_146976_147987_+,NA|111aa|up_4|NZ_AP018257.1_150843_151176_+,NA|232aa|up_3|NZ_AP018257.1_151361_152057_-,NA|200aa|up_1|NZ_AP018257.1_152799_153399_-,NA|207aa|up_0|NZ_AP018257.1_153513_154134_+,NA|218aa|down_0|NZ_AP018257.1_155389_156043_+,NA|105aa|down_2|NZ_AP018257.1_158614_158929_-,NA|353aa|down_3|NZ_AP018257.1_160001_161060_-,NA|136aa|down_6|NZ_AP018257.1_167199_167607_+,NA|311aa|down_7|NZ_AP018257.1_168009_168942_+,NA|227aa|down_9|NZ_AP018257.1_169790_170471_-	NA|81aa|up_9|NZ_AP018257.1_145076_145319_-	NA	NA|87aa|up_8|NZ_AP018257.1_145512_145773_+	NA	NA|270aa|up_7|NZ_AP018257.1_145843_146653_+	NA	NA|337aa|up_6|NZ_AP018257.1_146976_147987_+	NA	NA|655aa|up_5|NZ_AP018257.1_148502_150467_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|111aa|up_4|NZ_AP018257.1_150843_151176_+	NA	NA|232aa|up_3|NZ_AP018257.1_151361_152057_-	NA	NA|185aa|up_2|NZ_AP018257.1_152273_152828_-	COG1525, COG1525, Micrococcal nuclease (thermonuclease) homologs [DNA replication, recombination, and repair]	NA|200aa|up_1|NZ_AP018257.1_152799_153399_-	NA	NA|207aa|up_0|NZ_AP018257.1_153513_154134_+	NA	NA|218aa|down_0|NZ_AP018257.1_155389_156043_+	NA	NA|74aa|down_1|NZ_AP018257.1_156105_156327_-	pfam13443, HTH_26, Cro/C1-type HTH DNA-binding domain	NA|105aa|down_2|NZ_AP018257.1_158614_158929_-	NA	NA|353aa|down_3|NZ_AP018257.1_160001_161060_-	NA	NA|1267aa|down_4|NZ_AP018257.1_161799_165600_+	pfam12770, CHAT, CHAT domain	NA|515aa|down_5|NZ_AP018257.1_165619_167164_+	pfam12770, CHAT, CHAT domain	NA|136aa|down_6|NZ_AP018257.1_167199_167607_+	NA	NA|311aa|down_7|NZ_AP018257.1_168009_168942_+	NA	NA|107aa|down_8|NZ_AP018257.1_169365_169686_+	pfam12770, CHAT, CHAT domain	NA|227aa|down_9|NZ_AP018257.1_169790_170471_-	NA
GCF_002368455.1_ASM236845v1	NZ_AP018257	Calothrix sp. NIES-4071 plasmid plasmid2 DNA, complete genome	3	180982-181701	3,1,1	CRISPRCasFinder,CRT,PILER-CR	no		RT,Cas9_archaeal,c2c10_CAS-V-U3	Orphan	GTCACATTCTTTACTTACCCCTCACGGGGACGGAAAC,GTCACATTCTTTACTTACCCCTCACGGGGACGGAAACN,TCACATTCTTTACTTACCCCTCACGGGGACGGAAAC	37,38,36	0	0	NA	NA	N:A	8,9,8	9	Orphan	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|227aa|up_8|NZ_AP018257.1_169790_170471_-,NA|79aa|up_5|NZ_AP018257.1_174094_174331_+,NA|103aa|up_3|NZ_AP018257.1_175931_176240_+,NA|129aa|up_2|NZ_AP018257.1_176544_176931_-,NA|248aa|up_1|NZ_AP018257.1_177389_178133_+,NA|254aa|down_0|NZ_AP018257.1_182123_182885_-,NA|242aa|down_3|NZ_AP018257.1_185421_186147_-,NA|111aa|down_8|NZ_AP018257.1_191402_191735_-	NA|107aa|up_9|NZ_AP018257.1_169365_169686_+	pfam12770, CHAT, CHAT domain	NA|227aa|up_8|NZ_AP018257.1_169790_170471_-	NA	NA|623aa|up_7|NZ_AP018257.1_170557_172426_-	COG1061, SSL2, DNA or RNA helicases of superfamily II [Transcription / DNA replication, recombination, and repair]	NA|453aa|up_6|NZ_AP018257.1_172468_173827_-	PRK11281, PRK11281, mechanosensitive channel MscK	NA|79aa|up_5|NZ_AP018257.1_174094_174331_+	NA	NA|129aa|up_4|NZ_AP018257.1_174358_174745_-	pfam13508, Acetyltransf_7, Acetyltransferase (GNAT) domain	NA|103aa|up_3|NZ_AP018257.1_175931_176240_+	NA	NA|129aa|up_2|NZ_AP018257.1_176544_176931_-	NA	NA|248aa|up_1|NZ_AP018257.1_177389_178133_+	NA	NA|540aa|up_0|NZ_AP018257.1_178418_180038_-	pfam01593, Amino_oxidase, Flavin containing amine oxidoreductase	NA|254aa|down_0|NZ_AP018257.1_182123_182885_-	NA	NA|306aa|down_1|NZ_AP018257.1_183019_183937_-	cd00315, Cyt_C5_DNA_methylase, Cytosine-C5 specific DNA methylases; Methyl transfer reactions play an important role in many aspects of biology	NA|471aa|down_2|NZ_AP018257.1_183967_185380_-	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|242aa|down_3|NZ_AP018257.1_185421_186147_-	NA	NA|416aa|down_4|NZ_AP018257.1_186382_187630_-	COG1196, Smc, Chromosome segregation ATPases [Cell division and chromosome partitioning]	NA|340aa|down_5|NZ_AP018257.1_187635_188655_-	pfam04307, YdjM, LexA-binding, inner membrane-associated putative hydrolase	NA|256aa|down_6|NZ_AP018257.1_188660_189428_-	cd00009, AAA, The AAA+ (ATPases Associated with a wide variety of cellular Activities) superfamily represents an ancient group of ATPases belonging to the ASCE (for additional strand, catalytic E) division of the P-loop NTPase fold	NA|223aa|down_7|NZ_AP018257.1_189586_190255_-	pfam11740, KfrA_N, Plasmid replication region DNA-binding N-term	NA|111aa|down_8|NZ_AP018257.1_191402_191735_-	NA	NA|197aa|down_9|NZ_AP018257.1_191731_192322_-	cd02042, ParAB_family, partition proteins ParAB family
GCF_002368455.1_ASM236845v1	NZ_AP018257	Calothrix sp. NIES-4071 plasmid plasmid2 DNA, complete genome	4	324571-324667	4	CRISPRCasFinder	no	c2c10_CAS-V-U3	RT,Cas9_archaeal,c2c10_CAS-V-U3	Type V-U3	AAAGGAATTGAGGATTGAAACGA	23	0	0	NA	NA	N:A	1	1	TypeV-U3	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|223aa|up_9|NZ_AP018257.1_313849_314518_+,NA|93aa|up_8|NZ_AP018257.1_314843_315122_+,NA|85aa|up_7|NZ_AP018257.1_315179_315434_+,NA|99aa|up_3|NZ_AP018257.1_318756_319053_-,NA|192aa|up_0|NZ_AP018257.1_323818_324394_-,NA|112aa|down_1|NZ_AP018257.1_325846_326182_+,NA|69aa|down_2|NZ_AP018257.1_326273_326480_-,NA|265aa|down_5|NZ_AP018257.1_327496_328291_-,NA|445aa|down_6|NZ_AP018257.1_328541_329876_+,NA|175aa|down_7|NZ_AP018257.1_330110_330635_+,NA|111aa|down_9|NZ_AP018257.1_333607_333940_+	NA|223aa|up_9|NZ_AP018257.1_313849_314518_+	NA	NA|93aa|up_8|NZ_AP018257.1_314843_315122_+	NA	NA|85aa|up_7|NZ_AP018257.1_315179_315434_+	NA	c2c10_CAS-V-U3|517aa|up_6|NZ_AP018257.1_316024_317575_+	pfam07282, OrfB_Zn_ribbon, Putative transposase DNA-binding domain	NA|135aa|up_5|NZ_AP018257.1_317882_318287_-	pfam11284, DUF3085, Protein of unknown function (DUF3085)	NA|108aa|up_4|NZ_AP018257.1_318427_318751_+	pfam07444, Ycf66_N, Ycf66 protein N-terminus	NA|99aa|up_3|NZ_AP018257.1_318756_319053_-	NA	NA|347aa|up_2|NZ_AP018257.1_319330_320371_+	pfam13395, HNH_4, HNH endonuclease	NA|1074aa|up_1|NZ_AP018257.1_320386_323608_-	pfam05860, Haemagg_act, haemagglutination activity domain	NA|192aa|up_0|NZ_AP018257.1_323818_324394_-	NA	NA|324aa|down_0|NZ_AP018257.1_324821_325793_+	COG3440, COG3440, Predicted restriction endonuclease [Defense mechanisms]	NA|112aa|down_1|NZ_AP018257.1_325846_326182_+	NA	NA|69aa|down_2|NZ_AP018257.1_326273_326480_-	NA	NA|119aa|down_3|NZ_AP018257.1_326577_326934_+	pfam14534, DUF4440, Domain of unknown function (DUF4440)	NA|141aa|down_4|NZ_AP018257.1_327063_327486_-	pfam04343, DUF488, Protein of unknown function, DUF488	NA|265aa|down_5|NZ_AP018257.1_327496_328291_-	NA	NA|445aa|down_6|NZ_AP018257.1_328541_329876_+	NA	NA|175aa|down_7|NZ_AP018257.1_330110_330635_+	NA	NA|520aa|down_8|NZ_AP018257.1_331877_333437_+	COG2303, BetA, Choline dehydrogenase and related flavoproteins [Amino acid transport and metabolism]	NA|111aa|down_9|NZ_AP018257.1_333607_333940_+	NA
GCF_002368455.1_ASM236845v1	NZ_AP018256	Calothrix sp. NIES-4071 plasmid plasmid1 DNA, complete genome	1	108378-108626	1,1	CRISPRCasFinder,CRT	no	TnpB_regular.1,csa3	csa3,TnpB_regular.1,cas3,Cas9_archaeal	Type I-A	TTTCAAACCACCCATAGCTGGAATGGTTATTGAAAC,CCATAGCTGGAATGGTTATTGAAACT	36,26	0	0	NA	NA	N:A	2,3	3	TypeI-A	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|265aa|up_9|NZ_AP018256.1_97290_98085_+,NA|205aa|up_8|NZ_AP018256.1_98216_98831_-,NA|225aa|up_6|NZ_AP018256.1_99865_100540_-,NA|184aa|up_5|NZ_AP018256.1_100665_101217_-,NA|157aa|up_4|NZ_AP018256.1_101282_101753_-,NA|324aa|up_1|NZ_AP018256.1_105492_106464_-,NA|209aa|up_0|NZ_AP018256.1_107168_107795_-,NA|77aa|down_0|NZ_AP018256.1_108747_108978_-,NA|87aa|down_2|NZ_AP018256.1_110933_111194_-	NA|265aa|up_9|NZ_AP018256.1_97290_98085_+	NA	NA|205aa|up_8|NZ_AP018256.1_98216_98831_-	NA	NA|169aa|up_7|NZ_AP018256.1_99387_99894_-	pfam07929, PRiA4_ORF3, Plasmid pRiA4b ORF-3-like protein	NA|225aa|up_6|NZ_AP018256.1_99865_100540_-	NA	NA|184aa|up_5|NZ_AP018256.1_100665_101217_-	NA	NA|157aa|up_4|NZ_AP018256.1_101282_101753_-	NA	TnpB_regular.1|508aa|up_3|NZ_AP018256.1_102431_103955_-	pfam07282, OrfB_Zn_ribbon, Putative transposase DNA-binding domain	NA|318aa|up_2|NZ_AP018256.1_104378_105332_-	cd00315, Cyt_C5_DNA_methylase, Cytosine-C5 specific DNA methylases; Methyl transfer reactions play an important role in many aspects of biology	NA|324aa|up_1|NZ_AP018256.1_105492_106464_-	NA	NA|209aa|up_0|NZ_AP018256.1_107168_107795_-	NA	NA|77aa|down_0|NZ_AP018256.1_108747_108978_-	NA	NA|223aa|down_1|NZ_AP018256.1_110218_110887_-	TIGR02690, arsenical_resistance_protein_ArsH_putative, arsenical resistance protein ArsH	NA|87aa|down_2|NZ_AP018256.1_110933_111194_-	NA	NA|350aa|down_3|NZ_AP018256.1_111325_112375_-	cd13654, PBP2_phosphate_like_2, Substrate binding domain of putative ABC-type phosphate transporter, a member of the type 2 periplasmic binding fold superfamily	NA|336aa|down_4|NZ_AP018256.1_112700_113708_+	PRK08955, PRK08955, glyceraldehyde-3-phosphate dehydrogenase; Validated	NA|420aa|down_5|NZ_AP018256.1_113731_114991_+	cd17325, MFS_MdtG_SLC18_like, bacterial MdtG-like and eukaryotic solute carrier 18 (SLC18) family of the Major Facilitator Superfamily of transporters	NA|211aa|down_6|NZ_AP018256.1_115245_115878_-	cd00333, MIP, Major intrinsic protein (MIP) superfamily	NA|153aa|down_7|NZ_AP018256.1_116252_116711_+	cd14504, DUSP23, dual specificity phosphatase 23	NA|391aa|down_8|NZ_AP018256.1_116777_117950_+	cd17370, MFS_MJ1317_like, MJ1317 and similar transporters of the Major Facilitator Superfamily	NA|132aa|down_9|NZ_AP018256.1_118039_118435_-	TIGR02689, arsenate_reductase, arsenate reductase, glutathione/glutaredoxin type
GCF_002368455.1_ASM236845v1	NZ_AP018256	Calothrix sp. NIES-4071 plasmid plasmid1 DNA, complete genome	2	242561-242667	2	CRISPRCasFinder	no	Cas9_archaeal	csa3,TnpB_regular.1,cas3,Cas9_archaeal	Type II-A, Type II-B, or Type II-C?	AGTTGGCGCCAATTTTGGAGTAGATT	26	0	0	NA	NA	N:A	1	1	TypeII-A,TypeII-B,orTypeII-C?	cas14k,RT,DEDDh,csa3,PD-DExK,cas3,Cas14b_CAS-V-F,WYL,cas8b5,cas7,cas5,cas6,cas4,cas1,cas2,c2c9_V-U4,TnpB_regular.1,cas8a4,cas14j,DinG,Cas14u_CAS-V,c2c10_CAS-V-U3,cas8b3,c2c8_V-U2,Cas9_archaeal	NA|254aa|up_9|NZ_AP018256.1_228595_229357_+,NA|294aa|up_8|NZ_AP018256.1_229912_230794_+,NA|134aa|up_7|NZ_AP018256.1_232396_232798_+,NA|95aa|up_6|NZ_AP018256.1_235107_235392_+,NA|63aa|up_1|NZ_AP018256.1_241387_241576_-,NA|118aa|up_0|NZ_AP018256.1_241687_242041_-,NA|73aa|down_1|NZ_AP018256.1_245440_245659_-,NA|62aa|down_3|NZ_AP018256.1_246366_246552_-,NA|145aa|down_5|NZ_AP018256.1_251374_251809_-,NA|178aa|down_7|NZ_AP018256.1_253005_253539_-,NA|310aa|down_9|NZ_AP018256.1_255195_256125_+	NA|254aa|up_9|NZ_AP018256.1_228595_229357_+	NA	NA|294aa|up_8|NZ_AP018256.1_229912_230794_+	NA	NA|134aa|up_7|NZ_AP018256.1_232396_232798_+	NA	NA|95aa|up_6|NZ_AP018256.1_235107_235392_+	NA	NA|132aa|up_5|NZ_AP018256.1_235462_235858_+	TIGR03976, hypothetical_protein, His-Xaa-Ser system protein HxsD	NA|483aa|up_4|NZ_AP018256.1_235913_237362_+	TIGR03978, paired_radical_SAM_protein_1, His-Xaa-Ser system radical SAM maturase HxsB	NA|401aa|up_3|NZ_AP018256.1_237381_238584_+	TIGR03977, radical_SAM_domain_protein, His-Xaa-Ser system radical SAM maturase HxsC	NA|243aa|up_2|NZ_AP018256.1_238745_239474_+	TIGR03979, His_Ser_Rich, His-Xaa-Ser repeat protein HxsA	NA|63aa|up_1|NZ_AP018256.1_241387_241576_-	NA	NA|118aa|up_0|NZ_AP018256.1_241687_242041_-	NA	NA|236aa|down_0|NZ_AP018256.1_243088_243796_+	smart00318, SNc, Staphylococcal nuclease homologues	NA|73aa|down_1|NZ_AP018256.1_245440_245659_-	NA	NA|234aa|down_2|NZ_AP018256.1_245714_246416_-	cd10170, HSP70_NBD, Nucleotide-binding domain of the HSP70 family	NA|62aa|down_3|NZ_AP018256.1_246366_246552_-	NA	NA|1408aa|down_4|NZ_AP018256.1_247062_251286_+	TIGR01901, Heme/hemopexin-binding_protein, filamentous hemagglutinin family N-terminal domain	NA|145aa|down_5|NZ_AP018256.1_251374_251809_-	NA	NA|170aa|down_6|NZ_AP018256.1_252296_252806_-	COG3409, COG3409, Putative peptidoglycan-binding domain-containing protein [Cell envelope biogenesis, outer membrane]	NA|178aa|down_7|NZ_AP018256.1_253005_253539_-	NA	NA|342aa|down_8|NZ_AP018256.1_254015_255041_-	COG1637, COG1637, Predicted nuclease of the RecB family [DNA replication, recombination, and repair]	NA|310aa|down_9|NZ_AP018256.1_255195_256125_+	NA
