assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_003231115.1_ASM323111v1	NZ_CP029492	Escherichia coli strain HS30-1 chromosome, complete genome	1	958658-959174	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	Orphan	GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	7,8,8	8	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	NA|47aa|up_1|NZ_CP029492.1_957367_957508_-,NA	NA|919aa|up_9|NZ_CP029492.1_945251_948008_-	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional	NA|434aa|up_8|NZ_CP029492.1_948064_949366_+	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|745aa|up_7|NZ_CP029492.1_949413_951648_+	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|83aa|up_6|NZ_CP029492.1_951725_951974_+	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|112aa|up_5|NZ_CP029492.1_951973_952309_+	PRK09907, PRK09907, endoribonuclease MazF	NA|264aa|up_4|NZ_CP029492.1_952379_953171_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_3|NZ_CP029492.1_953398_955036_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_2|NZ_CP029492.1_955123_956422_+	PRK00077, eno, enolase; Provisional	NA|47aa|up_1|NZ_CP029492.1_957367_957508_-	NA	NA|224aa|up_0|NZ_CP029492.1_957646_958318_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|493aa|down_0|NZ_CP029492.1_959812_961291_-	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|426aa|down_1|NZ_CP029492.1_961317_962595_-	cd06174, MFS, Major Facilitator Superfamily	NA|262aa|down_2|NZ_CP029492.1_962913_963699_+	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|485aa|down_3|NZ_CP029492.1_963768_965223_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|470aa|down_4|NZ_CP029492.1_965244_966654_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|260aa|down_5|NZ_CP029492.1_966631_967411_+	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|287aa|down_6|NZ_CP029492.1_967407_968268_+	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|192aa|down_7|NZ_CP029492.1_968415_968991_-	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|87aa|down_8|NZ_CP029492.1_969007_969268_-	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|424aa|down_9|NZ_CP029492.1_969258_970530_-	PRK10015, PRK10015, oxidoreductase; Provisional
GCF_003231115.1_ASM323111v1	NZ_CP029492	Escherichia coli strain HS30-1 chromosome, complete genome	2	987002-987399	2,2,2	CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	Type I-E	GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG,TGTGTTCCCCGCGCCAGCGGGGATAAACCGGGT	29,29,33	0	0	NA	NA	I-E:I-E:I-E	6,6,2	6	TypeI-E	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	NA,NA	NA|51aa|up_9|NZ_CP029492.1_975873_976026_+	pfam01848, HOK_GEF, Hok/gef family	NA|371aa|up_8|NZ_CP029492.1_976218_977331_-	pfam01609, DDE_Tnp_1, Transposase DDE domain	cas3|900aa|up_7|NZ_CP029492.1_978346_981046_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas8e|521aa|up_6|NZ_CP029492.1_981143_982706_+	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cse2gr11|179aa|up_5|NZ_CP029492.1_982702_983239_+	TIGR02548, CRISPR_system_Cascade_subunit_CasB, CRISPR type I-E/ECOLI-associated protein CasB/Cse2	cas7|352aa|up_4|NZ_CP029492.1_983250_984306_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|249aa|up_3|NZ_CP029492.1_984316_985063_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|217aa|up_2|NZ_CP029492.1_985044_985695_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas1|308aa|up_1|NZ_CP029492.1_985691_986615_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|98aa|up_0|NZ_CP029492.1_986611_986905_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|346aa|down_0|NZ_CP029492.1_987477_988515_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|NZ_CP029492.1_988766_989675_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|476aa|down_2|NZ_CP029492.1_989676_991104_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|NZ_CP029492.1_991103_991709_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|108aa|down_4|NZ_CP029492.1_991758_992082_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|NZ_CP029492.1_992275_992587_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|NZ_CP029492.1_992605_993316_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|NZ_CP029492.1_993315_993795_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|NZ_CP029492.1_993791_994841_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|NZ_CP029492.1_994821_995583_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCF_003231115.1_ASM323111v1	NZ_CP029492	Escherichia coli strain HS30-1 chromosome, complete genome	3	1469842-1469959	3	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	Orphan	CCGAGCCGTAGGCCGGATAAGGCGTTCACGC	31	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	NA,NA	NA|62aa|up_9|NZ_CP029492.1_1459127_1459313_-	PRK09956, PRK09956, ISNCY family transposase	NA|300aa|up_8|NZ_CP029492.1_1459325_1460225_-	PRK09956, PRK09956, ISNCY family transposase	NA|397aa|up_7|NZ_CP029492.1_1460417_1461608_-	TIGR03379, glycerol3P_GlpC, glycerol-3-phosphate dehydrogenase, anaerobic, C subunit	NA|420aa|up_6|NZ_CP029492.1_1461604_1462864_-	COG3075, GlpB, Anaerobic glycerol-3-phosphate dehydrogenase [Amino acid transport and metabolism]	NA|543aa|up_5|NZ_CP029492.1_1462853_1464482_-	PRK11101, glpA, anaerobic glycerol-3-phosphate dehydrogenase subunit A	NA|453aa|up_4|NZ_CP029492.1_1464754_1466113_+	PRK11273, glpT, glycerol-3-phosphate transporter	NA|359aa|up_3|NZ_CP029492.1_1466117_1467194_+	PRK11143, glpQ, glycerophosphodiester phosphodiesterase; Provisional	NA|217aa|up_2|NZ_CP029492.1_1467656_1468307_+	PRK09902, PRK09902, lipopolysaccharide kinase InaA	NA|85aa|up_1|NZ_CP029492.1_1468360_1468615_-	PRK10713, PRK10713, 2Fe-2S ferredoxin-like protein	NA|377aa|up_0|NZ_CP029492.1_1468614_1469745_-	PRK09101, nrdB, ribonucleotide-diphosphate reductase subunit beta; Reviewed	NA|762aa|down_0|NZ_CP029492.1_1469978_1472264_-	PRK09103, PRK09103, ribonucleoside-diphosphate reductase subunit alpha	NA|1251aa|down_1|NZ_CP029492.1_1472959_1476712_+	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|241aa|down_2|NZ_CP029492.1_1476839_1477562_-	PRK05134, PRK05134, bifunctional 2-polyprenyl-6-hydroxyphenol methylase/3-demethylubiquinol 3-O-methyltransferase UbiG	NA|876aa|down_3|NZ_CP029492.1_1477708_1480336_+	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|563aa|down_4|NZ_CP029492.1_1480484_1482173_+	COG4685, COG4685, Uncharacterized protein conserved in bacteria [Function unknown]	NA|208aa|down_5|NZ_CP029492.1_1482169_1482793_+	COG3234, COG3234, Uncharacterized protein conserved in bacteria [Function unknown]	NA|1465aa|down_6|NZ_CP029492.1_1482936_1487331_+	COG2373, COG2373, Large extracellular alpha-helical protein [General function prediction only]	NA|550aa|down_7|NZ_CP029492.1_1487331_1488981_+	COG5445, COG5445, Predicted secreted protein [Function unknown]	NA|252aa|down_8|NZ_CP029492.1_1489005_1489761_+	COG4676, COG4676, Uncharacterized protein conserved in bacteria [Function unknown]	NA|395aa|down_9|NZ_CP029492.1_1489834_1491019_-	PRK05790, PRK05790, putative acyltransferase; Provisional
GCF_003231115.1_ASM323111v1	NZ_CP029492	Escherichia coli strain HS30-1 chromosome, complete genome	4	2061680-2061803	4	CRISPRCasFinder	no	DEDDh	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	NA,NA|30aa|down_7|NZ_CP029492.1_2070699_2070789_+	NA|471aa|up_9|NZ_CP029492.1_2050062_2051475_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|NZ_CP029492.1_2052031_2052241_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|NZ_CP029492.1_2052695_2053322_+	PRK09898, PRK09898, ferredoxin-like protein	NA|325aa|up_6|NZ_CP029492.1_2054491_2055466_+	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|213aa|up_5|NZ_CP029492.1_2056529_2057168_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|NZ_CP029492.1_2057231_2057900_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|NZ_CP029492.1_2057896_2058682_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|271aa|up_2|NZ_CP029492.1_2058685_2059498_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|535aa|up_1|NZ_CP029492.1_2059509_2061114_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|102aa|up_0|NZ_CP029492.1_2061239_2061545_-	PRK11118, PRK11118, putative monooxygenase; Provisional	NA|419aa|down_0|NZ_CP029492.1_2062117_2063374_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|NZ_CP029492.1_2063414_2064788_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|214aa|down_2|NZ_CP029492.1_2065002_2065644_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|NZ_CP029492.1_2065683_2066832_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|NZ_CP029492.1_2067122_2068334_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|NZ_CP029492.1_2068446_2069379_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|NZ_CP029492.1_2069375_2070401_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|30aa|down_7|NZ_CP029492.1_2070699_2070789_+	NA	NA|390aa|down_8|NZ_CP029492.1_2070954_2072124_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|194aa|down_9|NZ_CP029492.1_2072358_2072940_-	PRK10543, PRK10543, superoxide dismutase [Fe]
GCF_003231115.1_ASM323111v1	NZ_CP029492	Escherichia coli strain HS30-1 chromosome, complete genome	5	2689297-2689388	5	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	Orphan	CCACCTTTTTTACCTGCTTCAGATGC	26	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	NA|70aa|up_8|NZ_CP029492.1_2678372_2678582_-,NA	NA|503aa|up_9|NZ_CP029492.1_2676705_2678214_-	PRK15419, PRK15419, sodium/proline symporter PutP	NA|70aa|up_8|NZ_CP029492.1_2678372_2678582_-	NA	NA|1321aa|up_7|NZ_CP029492.1_2678636_2682599_+	PRK11809, putA, trifunctional transcriptional regulator/proline dehydrogenase/pyrroline-5-carboxylate dehydrogenase; Reviewed	NA|213aa|up_6|NZ_CP029492.1_2682638_2683277_-	PRK15008, PRK15008, HTH-type transcriptional regulator RutR; Provisional	NA|364aa|up_5|NZ_CP029492.1_2683564_2684656_+	TIGR03612, RutA, pyrimidine utilization protein A	NA|231aa|up_4|NZ_CP029492.1_2684655_2685348_+	TIGR03614, RutB, pyrimidine utilization protein B	NA|129aa|up_3|NZ_CP029492.1_2685359_2685746_+	TIGR03610, RutC, pyrimidine utilization protein C	NA|197aa|up_2|NZ_CP029492.1_2686563_2687154_+	PRK05365, PRK05365, malonic semialdehyde reductase; Provisional	NA|165aa|up_1|NZ_CP029492.1_2687164_2687659_+	TIGR03615, flavoprotein_oxidoreductase, pyrimidine utilization flavin reductase protein F	NA|443aa|up_0|NZ_CP029492.1_2687679_2689008_+	TIGR03616, Putative_pyrimidine_permease_RutG, pyrimidine utilization transport protein G	NA|199aa|down_0|NZ_CP029492.1_2689811_2690408_+	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|76aa|down_1|NZ_CP029492.1_2690428_2690656_+	PRK10174, PRK10174, hypothetical protein; Provisional	NA|414aa|down_2|NZ_CP029492.1_2690693_2691935_-	PRK10173, PRK10173, glucose-1-phosphatase/inositol phosphatase; Provisional	NA|307aa|down_3|NZ_CP029492.1_2693743_2694664_+	PRK10266, PRK10266, curved DNA-binding protein	NA|102aa|down_4|NZ_CP029492.1_2694663_2694969_+	PRK10265, PRK10265, chaperone modulator CbpM	NA|200aa|down_5|NZ_CP029492.1_2695120_2695720_-	PRK04976, torD, chaperone protein TorD; Validated	NA|849aa|down_6|NZ_CP029492.1_2695716_2698263_-	PRK15102, PRK15102, trimethylamine-N-oxide reductase TorA	NA|391aa|down_7|NZ_CP029492.1_2698262_2699435_-	PRK15032, PRK15032, pentaheme c-type cytochrome TorC	NA|231aa|down_8|NZ_CP029492.1_2699564_2700257_+	PRK10766, PRK10766, two-component system response regulator TorR	NA|343aa|down_9|NZ_CP029492.1_2700229_2701258_-	PRK10936, PRK10936, TMAO reductase system periplasmic protein TorT; Provisional
GCF_003231115.1_ASM323111v1	NZ_CP029492	Escherichia coli strain HS30-1 chromosome, complete genome	6	2826965-2827170	6,3,3	CRISPRCasFinder,CRT,PILER-CR	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	Orphan	TTTCTAAGCTGCCTGTACGGCAGTGAAC,TTTCTAAGCTGCCTGTACGGCAGTGAAC,TTTCTAAGCTGCCTGTACGGCAGTGAACG	28,28,29	0	0	NA	NA	I-F:I-F:I-F	3,3,2	3	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	NA,NA	NA|431aa|up_9|NZ_CP029492.1_2812088_2813381_-	PRK05431, PRK05431, seryl-tRNA synthetase; Provisional	NA|448aa|up_8|NZ_CP029492.1_2813471_2814815_-	PRK13342, PRK13342, recombination factor protein RarA; Reviewed	NA|204aa|up_7|NZ_CP029492.1_2814825_2815437_-	TIGR00547, Outer-membrane_lipoprotein_carrier_protein, periplasmic chaperone LolA	NA|1330aa|up_6|NZ_CP029492.1_2815591_2819581_-	PRK10263, PRK10263, DNA translocase FtsK; Provisional	NA|165aa|up_5|NZ_CP029492.1_2819715_2820210_-	PRK11169, PRK11169, leucine-responsive transcriptional regulator Lrp	NA|322aa|up_4|NZ_CP029492.1_2820754_2821720_+	PRK10262, PRK10262, thioredoxin reductase; Provisional	NA|589aa|up_3|NZ_CP029492.1_2821842_2823609_+	PRK11174, PRK11174, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|574aa|up_2|NZ_CP029492.1_2823609_2825331_+	PRK11160, PRK11160, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|235aa|up_1|NZ_CP029492.1_2825372_2826077_+	PRK00301, aat, leucyl/phenylalanyl-tRNA--protein transferase; Reviewed	NA|73aa|up_0|NZ_CP029492.1_2826361_2826580_+	PRK00276, infA, translation initiation factor IF-1; Validated	NA|759aa|down_0|NZ_CP029492.1_2827380_2829657_-	PRK11034, clpA, ATP-dependent Clp protease ATP-binding subunit; Provisional	NA|107aa|down_1|NZ_CP029492.1_2829687_2830008_-	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|75aa|down_2|NZ_CP029492.1_2830330_2830555_+	PRK09937, PRK09937, cold shock-like protein CspD	NA|649aa|down_3|NZ_CP029492.1_2830627_2832574_-	PRK10535, PRK10535, macrolide ABC transporter ATP-binding protein/permease MacB	NA|372aa|down_4|NZ_CP029492.1_2832570_2833686_-	PRK11578, PRK11578, macrolide transporter subunit MacA; Provisional	NA|319aa|down_5|NZ_CP029492.1_2833836_2834793_+	COG2990, VirK, Uncharacterized protein conserved in bacteria [Function unknown]	NA|553aa|down_6|NZ_CP029492.1_2834789_2836448_-	COG3593, COG3593, Predicted ATP-dependent endonuclease of the OLD family [DNA replication, recombination, and repair]	NA|232aa|down_7|NZ_CP029492.1_2836872_2837568_+	PRK05420, PRK05420, aquaporin Z; Provisional	NA|300aa|down_8|NZ_CP029492.1_2838062_2838962_+	COG2431, COG2431, Predicted membrane protein [Function unknown]	NA|551aa|down_9|NZ_CP029492.1_2839105_2840758_+	PRK05290, PRK05290, hybrid cluster protein; Provisional
GCF_003231115.1_ASM323111v1	NZ_CP029492	Escherichia coli strain HS30-1 chromosome, complete genome	7	2994709-2994853	7	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	Orphan	GTAGGTCGGATAAGATGCGCAAGCATCGCATCCGACAATAAGTGCCGGATGC	52	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	NA|193aa|up_7|NZ_CP029492.1_2989381_2989960_-,NA	NA|415aa|up_9|NZ_CP029492.1_2987526_2988771_+	cd01713, PAPS_reductase, This domain is found in phosphoadenosine phosphosulphate (PAPS) reductase enzymes or PAPS sulphotransferase	NA|201aa|up_8|NZ_CP029492.1_2988782_2989385_-	pfam13649, Methyltransf_25, Methyltransferase domain	NA|193aa|up_7|NZ_CP029492.1_2989381_2989960_-	NA	NA|74aa|up_6|NZ_CP029492.1_2990329_2990551_+	PHA00080, PHA00080, DksA-like zinc finger domain containing protein	NA|124aa|up_5|NZ_CP029492.1_2990547_2990919_+	pfam13935, Ead_Ea22, Ead/Ea22-like protein	NA|218aa|up_4|NZ_CP029492.1_2990915_2991569_+	pfam04447, DUF550, Protein of unknown function (DUF550)	NA|60aa|up_3|NZ_CP029492.1_2991665_2991845_+	PHA00626, PHA00626, hypothetical protein	NA|73aa|up_2|NZ_CP029492.1_2991958_2992177_+	pfam07825, Exc, Excisionase-like protein	NA|357aa|up_1|NZ_CP029492.1_2992154_2993225_+	cd00800, INT_Lambda_C, C-terminal catalytic domain of Lambda integrase, a tyrosine-based site-specific recombinase	NA|428aa|up_0|NZ_CP029492.1_2993359_2994643_+	PRK10531, PRK10531, putative acyl-CoA thioester hydrolase	NA|754aa|down_0|NZ_CP029492.1_2994876_2997138_-	PRK11413, PRK11413, putative hydratase; Provisional	NA|478aa|down_1|NZ_CP029492.1_2997320_2998754_-	pfam00939, Na_sulph_symp, Sodium:sulfate symporter transmembrane region	NA|351aa|down_2|NZ_CP029492.1_2998829_2999882_-	NF033377, OMA_tautomer, 4-oxalomesaconate tautomerase	NA|318aa|down_3|NZ_CP029492.1_3000065_3001019_+	cd08440, PBP2_LTTR_like_4, TThe C-terminal substrate binding domain of an uncharacterized LysR-type transcriptional regulator, contains the type 2 periplasmic binding fold	NA|332aa|down_4|NZ_CP029492.1_3001059_3002055_-	PRK11028, PRK11028, 6-phosphogluconolactonase; Provisional	NA|273aa|down_5|NZ_CP029492.1_3002209_3003028_+	PRK10530, PRK10530, pyridoxal phosphate (PLP) phosphatase; Provisional	NA|353aa|down_6|NZ_CP029492.1_3003028_3004087_-	PRK11144, modC, molybdenum ABC transporter ATP-binding protein ModC	NA|230aa|down_7|NZ_CP029492.1_3004089_3004779_-	PRK09421, modB, molybdate ABC transporter permease subunit	NA|258aa|down_8|NZ_CP029492.1_3004778_3005552_-	PRK10677, modA, molybdate transporter periplasmic protein; Provisional	NA|50aa|down_9|NZ_CP029492.1_3005718_3005868_-	pfam10766, AcrZ, Multidrug efflux pump-associated protein AcrZ
GCF_003231115.1_ASM323111v1	NZ_CP029492	Escherichia coli strain HS30-1 chromosome, complete genome	8	3223455-3223551	8	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	Orphan	TTGTAGGCCTGATAAGATGCGTCAAGC	27	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	NA,NA	NA|172aa|up_9|NZ_CP029492.1_3212667_3213183_-	PRK09934, PRK09934, fimbriae assembly protein	NA|40aa|up_8|NZ_CP029492.1_3214827_3214947_-	PRK15199, fimH, type 1 fimbrin D-mannose specific adhesin FimH	NA|289aa|up_7|NZ_CP029492.1_3217175_3218042_+	PRK10792, PRK10792, bifunctional methylenetetrahydrofolate dehydrogenase/methenyltetrahydrofolate cyclohydrolase FolD	NA|71aa|up_6|NZ_CP029492.1_3218043_3218256_+	PRK11507, PRK11507, ribosome-associated protein YbcJ	NA|174aa|up_5|NZ_CP029492.1_3218363_3218885_+	COG1988, COG1988, Predicted membrane-bound metal-dependent hydrolases [General function prediction only]	NA|462aa|up_4|NZ_CP029492.1_3218920_3220306_-	PRK00260, cysS, cysteinyl-tRNA synthetase; Validated	NA|165aa|up_3|NZ_CP029492.1_3220479_3220974_+	PRK10791, PRK10791, peptidylprolyl isomerase B	NA|241aa|up_2|NZ_CP029492.1_3220976_3221699_+	PRK05340, PRK05340, UDP-2,3-diacylglucosamine hydrolase; Provisional	NA|170aa|up_1|NZ_CP029492.1_3221816_3222326_+	COG0041, PurE, Phosphoribosylcarboxyaminoimidazole (NCAIR) mutase [Nucleotide transport and metabolism]	NA|356aa|up_0|NZ_CP029492.1_3222322_3223390_+	PRK06019, PRK06019, phosphoribosylaminoimidazole carboxylase ATPase subunit; Reviewed	NA|298aa|down_0|NZ_CP029492.1_3223584_3224478_-	PRK09411, PRK09411, carbamate kinase; Reviewed	NA|272aa|down_1|NZ_CP029492.1_3224474_3225290_-	pfam11392, DUF2877, Protein of unknown function (DUF2877)	NA|420aa|down_2|NZ_CP029492.1_3225300_3226560_-	pfam06545, DUF1116, Protein of unknown function (DUF1116)	NA|556aa|down_3|NZ_CP029492.1_3226569_3228237_-	PRK06091, PRK06091, membrane protein FdrA; Validated	NA|90aa|down_4|NZ_CP029492.1_3228348_3228618_+	TIGR03176, AllC, allantoate amidohydrolase	NA|262aa|down_5|NZ_CP029492.1_3228628_3229414_+	TIGR03214, ura-cupin, putative allantoin catabolism protein	NA|382aa|down_6|NZ_CP029492.1_3229641_3230787_-	PRK09932, PRK09932, glycerate 3-kinase	NA|434aa|down_7|NZ_CP029492.1_3230808_3232110_-	PRK11412, PRK11412, uracil/xanthine transporter	NA|485aa|down_8|NZ_CP029492.1_3233580_3235035_-	PRK11375, PRK11375, putative allantoin permease	NA|293aa|down_9|NZ_CP029492.1_3235980_3236859_-	PRK15059, PRK15059, 2-hydroxy-3-oxopropionate reductase
GCF_003231115.1_ASM323111v1	NZ_CP029492	Escherichia coli strain HS30-1 chromosome, complete genome	9	3365146-3365290	9	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	Orphan	TTTTGCAGGCCTGATAAGACGCGGCAAGCGTCGCATCAGGCAT	43	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	NA,NA|28aa|down_2|NZ_CP029492.1_3367335_3367419_-	NA|357aa|up_9|NZ_CP029492.1_3349212_3350283_-	PRK00147, queA, S-adenosylmethionine:tRNA ribosyltransferase-isomerase; Provisional	NA|194aa|up_8|NZ_CP029492.1_3350375_3350957_+	PRK10045, PRK10045, ACP phosphodiesterase	NA|606aa|up_7|NZ_CP029492.1_3350961_3352779_-	PRK10785, PRK10785, maltodextrin glucosidase; Provisional	NA|458aa|up_6|NZ_CP029492.1_3352934_3354308_-	PRK10580, proY, putative proline-specific permease; Provisional	NA|440aa|up_5|NZ_CP029492.1_3354383_3355703_-	PRK15433, PRK15433, branched-chain amino acid transporter carrier protein BrnQ	NA|325aa|up_4|NZ_CP029492.1_3356136_3357111_-	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|230aa|up_3|NZ_CP029492.1_3358534_3359224_-	PRK10161, PRK10161, phosphate response regulator transcription factor PhoB	NA|401aa|up_2|NZ_CP029492.1_3359413_3360616_+	PRK10966, PRK10966, exonuclease subunit SbcD; Provisional	NA|1049aa|up_1|NZ_CP029492.1_3360612_3363759_+	PRK10246, PRK10246, exonuclease subunit SbcC; Provisional	NA|395aa|up_0|NZ_CP029492.1_3363884_3365069_+	PRK10091, PRK10091, MFS transport protein AraJ; Provisional	NA|303aa|down_0|NZ_CP029492.1_3365313_3366222_-	PRK09557, PRK09557, fructokinase; Reviewed	NA|304aa|down_1|NZ_CP029492.1_3366346_3367258_+	PRK00321, rdgC, recombination associated protein; Reviewed	NA|28aa|down_2|NZ_CP029492.1_3367335_3367419_-	NA	NA|95aa|down_3|NZ_CP029492.1_3367904_3368189_-	PRK10579, PRK10579, pyrimidine/purine nucleoside phosphorylase	NA|226aa|down_4|NZ_CP029492.1_3368260_3368938_-	PRK10481, PRK10481, hypothetical protein; Provisional	NA|64aa|down_5|NZ_CP029492.1_3369195_3369387_-	PRK10380, PRK10380, hypothetical protein; Provisional	NA|175aa|down_6|NZ_CP029492.1_3369436_3369961_-	PRK03731, aroL, shikimate kinase AroL	NA|153aa|down_7|NZ_CP029492.1_3370143_3370602_-	PRK00124, PRK00124, YaiI/YqxD family protein	NA|270aa|down_8|NZ_CP029492.1_3370721_3371531_+	PRK11880, PRK11880, pyrroline-5-carboxylate reductase; Reviewed	NA|372aa|down_9|NZ_CP029492.1_3371547_3372663_-	PRK10245, adrA, diguanylate cyclase AdrA; Provisional
GCF_003231115.1_ASM323111v1	NZ_CP029492	Escherichia coli strain HS30-1 chromosome, complete genome	10	3703780-3703921	10	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	Orphan	GCTGGAGAGCAACCGTAGGCCGGATAAGATGCGCCAGCATCGCATCCGGCGA	52	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG,c2c9_V-U4,RT	NA,NA	NA|96aa|up_9|NZ_CP029492.1_3692771_3693059_-	PRK15449, PRK15449, ferredoxin-like protein FixX; Provisional	NA|429aa|up_8|NZ_CP029492.1_3693055_3694342_-	PRK10157, PRK10157, putative oxidoreductase FixC; Provisional	NA|314aa|up_7|NZ_CP029492.1_3694392_3695334_-	PRK03363, fixB, electron transfer flavoprotein subunit alpha/FixB family protein	NA|257aa|up_6|NZ_CP029492.1_3695348_3696119_-	PRK03359, PRK03359, putative electron transfer flavoprotein FixA; Reviewed	NA|505aa|up_5|NZ_CP029492.1_3696591_3698106_+	PRK03356, PRK03356, L-carnitine/gamma-butyrobetaine antiport BCCT transporter	NA|381aa|up_4|NZ_CP029492.1_3698136_3699279_+	PRK03354, PRK03354, crotonobetainyl-CoA dehydrogenase; Validated	NA|406aa|up_3|NZ_CP029492.1_3699407_3700625_+	PRK03525, PRK03525, L-carnitine CoA-transferase	NA|518aa|up_2|NZ_CP029492.1_3700698_3702252_+	PRK08008, caiC, putative crotonobetaine/carnitine-CoA ligase; Validated	NA|262aa|up_1|NZ_CP029492.1_3702360_3703146_+	PRK03580, PRK03580, crotonobetainyl-CoA hydratase	NA|197aa|up_0|NZ_CP029492.1_3703151_3703742_+	PRK13627, PRK13627, carnitine operon protein CaiE; Provisional	NA|132aa|down_0|NZ_CP029492.1_3703950_3704346_-	PRK11476, PRK11476, carnitine metabolism transcriptional regulator CaiF	NA|1074aa|down_1|NZ_CP029492.1_3704607_3707829_-	PRK05294, carB, carbamoyl-phosphate synthase large subunit	NA|383aa|down_2|NZ_CP029492.1_3707846_3708995_-	PRK12564, PRK12564, carbamoyl-phosphate synthase small subunit	NA|274aa|down_3|NZ_CP029492.1_3709450_3710272_-	COG0289, DapB, Dihydrodipicolinate reductase [Amino acid transport and metabolism]	NA|305aa|down_4|NZ_CP029492.1_3710438_3711353_-	PRK10768, PRK10768, ribonucleoside hydrolase RihC; Provisional	NA|317aa|down_5|NZ_CP029492.1_3711418_3712369_-	PRK01045, ispH, 4-hydroxy-3-methylbut-2-enyl diphosphate reductase; Reviewed	NA|150aa|down_6|NZ_CP029492.1_3712370_3712820_-	PRK15095, PRK15095, FKBP-type peptidyl-prolyl cis-trans isomerase; Provisional	NA|165aa|down_7|NZ_CP029492.1_3712944_3713439_-	PRK00376, lspA, lipoprotein signal peptidase	NA|939aa|down_8|NZ_CP029492.1_3713438_3716255_-	PRK05743, ileS, isoleucyl-tRNA synthetase; Reviewed	NA|314aa|down_9|NZ_CP029492.1_3716297_3717239_-	PRK05627, PRK05627, bifunctional riboflavin kinase/FAD synthetase
