assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_003204155.1_ASM320415v1	NZ_CP029741	Escherichia coli strain AR_0085 chromosome, complete genome	1	259663-259796	1	CRISPRCasFinder	no		WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	Orphan	TGCCTGATGCGACGCTGGCGCGTCTTATCAGGCCTACA	38	0	0	NA	NA	NA	1	1	Orphan	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA,NA	NA|336aa|up_9|NZ_CP029741.1_247625_248633_-	cd05247, UDP_G4E_1_SDR_e, UDP-glucose 4 epimerase, subgroup 1, extended (e) SDRs	NA|382aa|up_8|NZ_CP029741.1_248649_249795_-	cd03801, GT4_PimA-like, phosphatidyl-myo-inositol mannosyltransferase	NA|344aa|up_7|NZ_CP029741.1_249781_250813_-	cd03801, GT4_PimA-like, phosphatidyl-myo-inositol mannosyltransferase	NA|287aa|up_6|NZ_CP029741.1_250809_251670_-	pfam00535, Glycos_transf_2, Glycosyl transferase family 2	NA|448aa|up_5|NZ_CP029741.1_251675_253019_-	pfam14296, O-ag_pol_Wzy, O-antigen polysaccharide polymerase Wzy	NA|419aa|up_4|NZ_CP029741.1_253018_254275_-	cd13128, MATE_Wzx_like, Wzx, a subfamily of the multidrug and toxic compound extrusion (MATE)-like proteins	NA|298aa|up_3|NZ_CP029741.1_254631_255525_-	PRK10122, PRK10122, UTP--glucose-1-phosphate uridylyltransferase GalF	NA|465aa|up_2|NZ_CP029741.1_255699_257094_-	PRK10123, wcaM, putative colanic acid biosynthesis protein; Provisional	NA|407aa|up_1|NZ_CP029741.1_257104_258325_-	TIGR04005, wcaL, colanic acid biosynthesis glycosyltransferase WcaL	NA|427aa|up_0|NZ_CP029741.1_258321_259602_-	TIGR04006, wcaK, colanic acid biosynthesis pyruvyl transferase WcaK	NA|493aa|down_0|NZ_CP029741.1_259877_261356_-	PRK10459, PRK10459, MOP flippase family protein	NA|465aa|down_1|NZ_CP029741.1_261357_262752_-	PRK10124, PRK10124, putative UDP-glucose lipid carrier transferase; Provisional	NA|457aa|down_2|NZ_CP029741.1_262806_264177_-	PRK15414, PRK15414, phosphomannomutase	NA|479aa|down_3|NZ_CP029741.1_264457_265894_-	PRK15460, cpsB, mannose-1-phosphate guanyltransferase; Provisional	NA|408aa|down_4|NZ_CP029741.1_265896_267120_-	TIGR04007, wcaI, colanic acid biosynthesis glycosyl transferase WcaI	NA|160aa|down_5|NZ_CP029741.1_267116_267596_-	PRK15434, PRK15434, GDP-mannose mannosyl hydrolase	NA|322aa|down_6|NZ_CP029741.1_267598_268564_-	cd05239, GDP_FS_SDR_e, GDP-fucose synthetase, extended (e) SDRs	NA|374aa|down_7|NZ_CP029741.1_268566_269688_-	COG1089, Gmd, GDP-D-mannose dehydratase [Cell envelope biogenesis, outer membrane]	NA|183aa|down_8|NZ_CP029741.1_269715_270264_-	TIGR04008, WcaF, colanic acid biosynthesis acetyltransferase WcaF	NA|249aa|down_9|NZ_CP029741.1_270279_271026_-	PRK10063, PRK10063, colanic acid biosynthesis glycosyltransferase WcaE
GCF_003204155.1_ASM320415v1	NZ_CP029741	Escherichia coli strain AR_0085 chromosome, complete genome	2	264322-264456	2	CRISPRCasFinder	no		WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	Orphan	GGATAAGGCGTTCACGCCGCATCCGACAAACAGCGCCTGATGCGACG	47	0	0	NA	NA	NA	1	1	Orphan	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA,NA	NA|287aa|up_9|NZ_CP029741.1_250809_251670_-	pfam00535, Glycos_transf_2, Glycosyl transferase family 2	NA|448aa|up_8|NZ_CP029741.1_251675_253019_-	pfam14296, O-ag_pol_Wzy, O-antigen polysaccharide polymerase Wzy	NA|419aa|up_7|NZ_CP029741.1_253018_254275_-	cd13128, MATE_Wzx_like, Wzx, a subfamily of the multidrug and toxic compound extrusion (MATE)-like proteins	NA|298aa|up_6|NZ_CP029741.1_254631_255525_-	PRK10122, PRK10122, UTP--glucose-1-phosphate uridylyltransferase GalF	NA|465aa|up_5|NZ_CP029741.1_255699_257094_-	PRK10123, wcaM, putative colanic acid biosynthesis protein; Provisional	NA|407aa|up_4|NZ_CP029741.1_257104_258325_-	TIGR04005, wcaL, colanic acid biosynthesis glycosyltransferase WcaL	NA|427aa|up_3|NZ_CP029741.1_258321_259602_-	TIGR04006, wcaK, colanic acid biosynthesis pyruvyl transferase WcaK	NA|493aa|up_2|NZ_CP029741.1_259877_261356_-	PRK10459, PRK10459, MOP flippase family protein	NA|465aa|up_1|NZ_CP029741.1_261357_262752_-	PRK10124, PRK10124, putative UDP-glucose lipid carrier transferase; Provisional	NA|457aa|up_0|NZ_CP029741.1_262806_264177_-	PRK15414, PRK15414, phosphomannomutase	NA|479aa|down_0|NZ_CP029741.1_264457_265894_-	PRK15460, cpsB, mannose-1-phosphate guanyltransferase; Provisional	NA|408aa|down_1|NZ_CP029741.1_265896_267120_-	TIGR04007, wcaI, colanic acid biosynthesis glycosyl transferase WcaI	NA|160aa|down_2|NZ_CP029741.1_267116_267596_-	PRK15434, PRK15434, GDP-mannose mannosyl hydrolase	NA|322aa|down_3|NZ_CP029741.1_267598_268564_-	cd05239, GDP_FS_SDR_e, GDP-fucose synthetase, extended (e) SDRs	NA|374aa|down_4|NZ_CP029741.1_268566_269688_-	COG1089, Gmd, GDP-D-mannose dehydratase [Cell envelope biogenesis, outer membrane]	NA|183aa|down_5|NZ_CP029741.1_269715_270264_-	TIGR04008, WcaF, colanic acid biosynthesis acetyltransferase WcaF	NA|249aa|down_6|NZ_CP029741.1_270279_271026_-	PRK10063, PRK10063, colanic acid biosynthesis glycosyltransferase WcaE	NA|406aa|down_7|NZ_CP029741.1_271036_272254_-	TIGR04010, WcaD, putative colanic acid polymerase WcaD	NA|406aa|down_8|NZ_CP029741.1_272228_273446_-	TIGR04015, WcaC, colanic acid biosynthesis glycosyl transferase WcaC	NA|163aa|down_9|NZ_CP029741.1_273442_273931_-	PRK10191, PRK10191, putative acyl transferase; Provisional
GCF_003204155.1_ASM320415v1	NZ_CP029741	Escherichia coli strain AR_0085 chromosome, complete genome	3	491989-492115	3	CRISPRCasFinder	no		WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	Orphan	TTTGTAGGCCTGATAAGACGCGCCAGCGTCGCATCAGGC	39	0	0	NA	NA	NA	1	1	Orphan	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA,NA	NA|395aa|up_9|NZ_CP029741.1_470896_472081_+	PRK05790, PRK05790, putative acyltransferase; Provisional	NA|259aa|up_8|NZ_CP029741.1_472154_472931_-	COG4676, COG4676, Uncharacterized protein conserved in bacteria [Function unknown]	NA|550aa|up_7|NZ_CP029741.1_472935_474585_-	COG5445, COG5445, Predicted secreted protein [Function unknown]	NA|1465aa|up_6|NZ_CP029741.1_474585_478980_-	COG2373, COG2373, Large extracellular alpha-helical protein [General function prediction only]	NA|208aa|up_5|NZ_CP029741.1_479123_479747_-	COG3234, COG3234, Uncharacterized protein conserved in bacteria [Function unknown]	NA|563aa|up_4|NZ_CP029741.1_479743_481432_-	COG4685, COG4685, Uncharacterized protein conserved in bacteria [Function unknown]	NA|876aa|up_3|NZ_CP029741.1_481580_484208_-	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|241aa|up_2|NZ_CP029741.1_484354_485077_+	PRK05134, PRK05134, bifunctional 2-polyprenyl-6-hydroxyphenol methylase/3-demethylubiquinol 3-O-methyltransferase UbiG	NA|1251aa|up_1|NZ_CP029741.1_485204_488957_-	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|762aa|up_0|NZ_CP029741.1_489652_491938_+	PRK09103, PRK09103, ribonucleoside-diphosphate reductase subunit alpha	NA|377aa|down_0|NZ_CP029741.1_492171_493302_+	PRK09101, nrdB, ribonucleotide-diphosphate reductase subunit beta; Reviewed	NA|85aa|down_1|NZ_CP029741.1_493301_493556_+	PRK10713, PRK10713, 2Fe-2S ferredoxin-like protein	NA|217aa|down_2|NZ_CP029741.1_493609_494260_-	PRK09902, PRK09902, lipopolysaccharide kinase InaA	NA|359aa|down_3|NZ_CP029741.1_494722_495799_-	PRK11143, glpQ, glycerophosphodiester phosphodiesterase; Provisional	NA|453aa|down_4|NZ_CP029741.1_495803_497162_-	PRK11273, glpT, glycerol-3-phosphate transporter	NA|543aa|down_5|NZ_CP029741.1_497434_499063_+	PRK11101, glpA, anaerobic glycerol-3-phosphate dehydrogenase subunit A	NA|420aa|down_6|NZ_CP029741.1_499052_500312_+	COG3075, GlpB, Anaerobic glycerol-3-phosphate dehydrogenase [Amino acid transport and metabolism]	NA|397aa|down_7|NZ_CP029741.1_500308_501499_+	TIGR03379, glycerol3P_GlpC, glycerol-3-phosphate dehydrogenase, anaerobic, C subunit	NA|300aa|down_8|NZ_CP029741.1_501691_502591_+	PRK09956, PRK09956, ISNCY family transposase	NA|62aa|down_9|NZ_CP029741.1_502603_502789_+	PRK09956, PRK09956, ISNCY family transposase
GCF_003204155.1_ASM320415v1	NZ_CP029741	Escherichia coli strain AR_0085 chromosome, complete genome	4	980624-980768	4	CRISPRCasFinder	no	csa3	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	Type I-A	CACAATGCCTGATGCGACGCTGGAGCGTCTTATCATGCCTACAAA	45	0	0	NA	NA	NA	1	1	Orphan	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA,NA|34aa|down_3|NZ_CP029741.1_983255_983357_-	NA|150aa|up_9|NZ_CP029741.1_971614_972064_+	pfam06610, AlaE, L-alanine exporter	NA|115aa|up_8|NZ_CP029741.1_972100_972445_-	PRK10556, PRK10556, hypothetical protein; Provisional	NA|110aa|up_7|NZ_CP029741.1_972596_972926_+	PRK10132, PRK10132, hypothetical protein; Provisional	NA|82aa|up_6|NZ_CP029741.1_973173_973419_+	PRK10329, PRK10329, glutaredoxin-like protein NrdH	NA|137aa|up_5|NZ_CP029741.1_973415_973826_+	PRK03600, nrdI, class Ib ribonucleoside-diphosphate reductase assembly flavoprotein NrdI	NA|715aa|up_4|NZ_CP029741.1_973798_975943_+	PRK08188, PRK08188, ribonucleotide-diphosphate reductase subunit alpha; Validated	NA|320aa|up_3|NZ_CP029741.1_975952_976912_+	TIGR04171, ribonucleotide-diphosphate_reductase_subunit_beta, ribonucleoside-diphosphate reductase, class 1b, beta subunit	NA|401aa|up_2|NZ_CP029741.1_977265_978468_+	PRK10070, PRK10070, proline/glycine betaine ABC transporter ATP-binding protein ProV	NA|355aa|up_1|NZ_CP029741.1_978460_979525_+	PRK10952, PRK10952, proline/glycine betaine ABC transporter permease ProW	NA|331aa|up_0|NZ_CP029741.1_979582_980575_+	PRK11119, proX, proline/glycine betaine ABC transporter substrate-binding protein ProX	NA|395aa|down_0|NZ_CP029741.1_980866_982051_+	cd17324, MFS_NepI_like, Purine ribonucleoside efflux pump NepI and similar transporters of the Major Facilitator Superfamily	NA|246aa|down_1|NZ_CP029741.1_982174_982912_+	COG1296, AzlC, Predicted branched-chain amino acid permease (azaleucine resistance) [Amino acid transport and metabolism]	NA|112aa|down_2|NZ_CP029741.1_982901_983237_+	PRK10408, PRK10408, L-valine transporter subunit YgaH	NA|34aa|down_3|NZ_CP029741.1_983255_983357_-	NA	NA|177aa|down_4|NZ_CP029741.1_983327_983858_+	PRK10870, PRK10870, transcriptional repressor MprA; Provisional	NA|391aa|down_5|NZ_CP029741.1_983984_985157_+	PRK15136, PRK15136, multidrug efflux MFS transporter periplasmic adaptor subunit EmrA	NA|513aa|down_6|NZ_CP029741.1_985173_986712_+	TIGR00711, Uncharacterized_MFS-type_transporter_YhcA, drug resistance transporter, EmrB/QacA subfamily	NA|172aa|down_7|NZ_CP029741.1_986775_987291_-	PRK02260, PRK02260, S-ribosylhomocysteine lyase	NA|519aa|down_8|NZ_CP029741.1_987440_988997_-	PRK02107, PRK02107, glutamate--cysteine ligase; Provisional	NA|143aa|down_9|NZ_CP029741.1_989069_989498_-	COG1238, COG1238, Predicted membrane protein [Function unknown]
GCF_003204155.1_ASM320415v1	NZ_CP029741	Escherichia coli strain AR_0085 chromosome, complete genome	5	1051512-1052516	5,1,1	CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	Type I-E	CGGTTTATCCCCGCTGGCGCGGGGAACTC,CGGTTTATCCCCGCTGGCGCGGGGAACTC,CGGTTTATCCCCGCTGGCGCGGGGAACTC	29,29,29	0	0	NA	NA	I-E:I-E:I-E	16,16,14	16	TypeI-E	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA,NA	NA|254aa|up_9|NZ_CP029741.1_1043385_1044147_-	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional	NA|350aa|up_8|NZ_CP029741.1_1044127_1045177_-	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|160aa|up_7|NZ_CP029741.1_1045173_1045653_-	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|237aa|up_6|NZ_CP029741.1_1045652_1046363_-	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|104aa|up_5|NZ_CP029741.1_1046381_1046693_-	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|108aa|up_4|NZ_CP029741.1_1046886_1047210_-	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|202aa|up_3|NZ_CP029741.1_1047259_1047865_-	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|476aa|up_2|NZ_CP029741.1_1047864_1049292_-	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|303aa|up_1|NZ_CP029741.1_1049293_1050202_-	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|346aa|up_0|NZ_CP029741.1_1050453_1051491_+	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	cas2|95aa|down_0|NZ_CP029741.1_1052621_1052906_-	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	cas1|306aa|down_1|NZ_CP029741.1_1052907_1053825_-	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas6e|200aa|down_2|NZ_CP029741.1_1053840_1054440_-	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas5|225aa|down_3|NZ_CP029741.1_1054426_1055101_-	TIGR01868, hypothetical_protein, CRISPR-associated protein Cas5/CasD, subtype I-E/ECOLI	cas7|364aa|down_4|NZ_CP029741.1_1055103_1056195_-	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cse2gr11|161aa|down_5|NZ_CP029741.1_1056207_1056690_-	cd09670, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas8e|451aa|down_6|NZ_CP029741.1_1056838_1058191_-	PRK09693, PRK09693, Cascade antiviral complex protein; Validated	NA|245aa|down_7|NZ_CP029741.1_1061629_1062364_-	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|571aa|down_8|NZ_CP029741.1_1062437_1064150_-	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit	NA|600aa|down_9|NZ_CP029741.1_1064149_1065949_-	PRK10953, cysJ, NADPH-dependent assimilatory sulfite reductase flavoprotein subunit
GCF_003204155.1_ASM320415v1	NZ_CP029741	Escherichia coli strain AR_0085 chromosome, complete genome	6	1078065-1078886	6,2,2	CRISPRCasFinder,CRT,PILER-CR	no		WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	Orphan	CGGTTTATCCCCGCTGGCGCGGGGAACAC,CGGTTTATCCCCGCTGGCGCGGGGAACAC,CGGTTTATCCCCGCTGGCGCGGGGAACAC	29,29,29	0	0	NA	NA	I-E:I-E:I-E	13,13,12	13	Orphan	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA,NA	NA|424aa|up_9|NZ_CP029741.1_1066707_1067979_+	PRK10015, PRK10015, oxidoreductase; Provisional	NA|87aa|up_8|NZ_CP029741.1_1067969_1068230_+	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|192aa|up_7|NZ_CP029741.1_1068246_1068822_+	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|298aa|up_6|NZ_CP029741.1_1068969_1069863_-	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|260aa|up_5|NZ_CP029741.1_1069826_1070606_-	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|470aa|up_4|NZ_CP029741.1_1070583_1071993_-	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|485aa|up_3|NZ_CP029741.1_1072014_1073469_-	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|262aa|up_2|NZ_CP029741.1_1073538_1074324_-	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|426aa|up_1|NZ_CP029741.1_1074643_1075921_+	cd06174, MFS, Major Facilitator Superfamily	NA|493aa|up_0|NZ_CP029741.1_1075947_1077426_+	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|224aa|down_0|NZ_CP029741.1_1079225_1079897_-	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|291aa|down_1|NZ_CP029741.1_1080190_1081063_+	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|433aa|down_2|NZ_CP029741.1_1081122_1082421_-	PRK00077, eno, enolase; Provisional	NA|546aa|down_3|NZ_CP029741.1_1082508_1084146_-	PRK05380, pyrG, CTP synthetase; Validated	NA|264aa|down_4|NZ_CP029741.1_1084373_1085165_-	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|112aa|down_5|NZ_CP029741.1_1085235_1085571_-	PRK09907, PRK09907, endoribonuclease MazF	NA|83aa|down_6|NZ_CP029741.1_1085570_1085819_-	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|745aa|down_7|NZ_CP029741.1_1085896_1088131_-	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|434aa|down_8|NZ_CP029741.1_1088178_1089480_-	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|919aa|down_9|NZ_CP029741.1_1089536_1092293_+	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional
GCF_003204155.1_ASM320415v1	NZ_CP029741	Escherichia coli strain AR_0085 chromosome, complete genome	7	2836127-2836276	7	CRISPRCasFinder	no		WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	Orphan	TGAACGCCTTATCCGACCTACACAGCACTGAACTCGTAGGCCTGATAAGACGCG	54	0	0	NA	NA	NA	1	1	Orphan	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA|65aa|up_8|NZ_CP029741.1_2826395_2826590_+,NA	NA|660aa|up_9|NZ_CP029741.1_2824365_2826345_+	COG3211, PhoX, Predicted phosphatase [General function prediction only]	NA|65aa|up_8|NZ_CP029741.1_2826395_2826590_+	NA	NA|60aa|up_7|NZ_CP029741.1_2826637_2826817_+	COG1178, ThiP, ABC-type Fe3+ transport system, permease component [Inorganic ion transport and metabolism]	NA|116aa|up_6|NZ_CP029741.1_2826813_2827161_+	pfam13683, rve_3, Integrase core domain	NA|254aa|up_5|NZ_CP029741.1_2827671_2828433_+	COG3637, COG3637, Opacity protein and related surface antigens [Cell envelope biogenesis, outer membrane]	NA|403aa|up_4|NZ_CP029741.1_2828502_2829711_+	pfam01609, DDE_Tnp_1, Transposase DDE domain	NA|501aa|up_3|NZ_CP029741.1_2830466_2831969_+	pfam05872, DUF853, Bacterial protein of unknown function (DUF853)	NA|361aa|up_2|NZ_CP029741.1_2832129_2833212_-	PRK15071, PRK15071, lipopolysaccharide ABC transporter permease; Provisional	NA|367aa|up_1|NZ_CP029741.1_2833211_2834312_-	PRK15120, PRK15120, lipopolysaccharide ABC transporter permease LptF; Provisional	NA|504aa|up_0|NZ_CP029741.1_2834578_2836090_+	PRK00913, PRK00913, multifunctional aminopeptidase A; Provisional	NA|148aa|down_0|NZ_CP029741.1_2836443_2836887_+	PRK05728, PRK05728, DNA polymerase III subunit chi; Validated	NA|952aa|down_1|NZ_CP029741.1_2836886_2839742_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|399aa|down_2|NZ_CP029741.1_2839795_2840992_-	COG4269, COG4269, Predicted membrane protein [Function unknown]	NA|168aa|down_3|NZ_CP029741.1_2841184_2841688_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|139aa|down_4|NZ_CP029741.1_2841733_2842150_-	PRK11191, PRK11191, ribonuclease E inhibitor RraB	NA|335aa|down_5|NZ_CP029741.1_2842311_2843316_+	PRK03515, PRK03515, ornithine carbamoyltransferase subunit I; Provisional	NA|151aa|down_6|NZ_CP029741.1_2845163_2845616_-	COG2731, EbgC, Beta-galactosidase, beta subunit [Carbohydrate transport and metabolism]	NA|198aa|down_7|NZ_CP029741.1_2845760_2846354_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|238aa|down_8|NZ_CP029741.1_2846424_2847138_+	PRK12742, PRK12742, SDR family oxidoreductase	NA|132aa|down_9|NZ_CP029741.1_2847268_2847664_+	cd02198, YjgH_like, YjgH belongs to a large family of YjgF/YER057c/UK114-like proteins present in bacteria, archaea, and eukaryotes with no definitive function
GCF_003204155.1_ASM320415v1	NZ_CP029741	Escherichia coli strain AR_0085 chromosome, complete genome	8	3618463-3618609	8	CRISPRCasFinder	no		WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	Orphan	TCCGGCCTACGGATGGCGCGAGAATTTGTAGGCCTGATAAGACGCG	46	0	0	NA	NA	NA	1	1	Orphan	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA,NA	NA|361aa|up_9|NZ_CP029741.1_3608112_3609195_-	PRK09526, lacI, lac repressor; Reviewed	NA|318aa|up_8|NZ_CP029741.1_3609231_3610185_-	COG4977, COG4977, Transcriptional regulator containing an amidase domain and an AraC-type DNA-binding HTH domain [Transcription]	NA|259aa|up_7|NZ_CP029741.1_3610204_3610981_-	COG2220, COG2220, Predicted Zn-dependent hydrolases of the beta-lactamase fold [General function prediction only]	NA|316aa|up_6|NZ_CP029741.1_3611095_3612043_-	PRK09834, PRK09834, DNA-binding transcriptional regulator	NA|555aa|up_5|NZ_CP029741.1_3612119_3613784_+	PRK06183, mhpA, bifunctional 3-(3-hydroxy-phenyl)propionate/3-hydroxycinnamic acid hydroxylase	NA|315aa|up_4|NZ_CP029741.1_3613785_3614730_+	cd07365, MhpB_like, Subunit B of the Class III Extradiol ring-cleavage dioxygenase, 2,3-dihydroxyphenylpropionate 1,2-dioxygenase (MhpB), which catalyzes the oxidization and subsequent ring-opening of 2,3-dihydroxyphenylpropionate	NA|289aa|up_3|NZ_CP029741.1_3614747_3615614_+	TIGR03343, 2-hydroxy-6-oxo-6-phenylhexa-24-dienoate_hydrolase, 2-hydroxy-6-oxo-6-phenylhexa-2,4-dienoate hydrolase	NA|270aa|up_2|NZ_CP029741.1_3615623_3616433_+	PRK11342, mhpD, 2-keto-4-pentenoate hydratase; Provisional	NA|317aa|up_1|NZ_CP029741.1_3616429_3617380_+	PRK08300, PRK08300, acetaldehyde dehydrogenase; Validated	NA|338aa|up_0|NZ_CP029741.1_3617376_3618390_+	PRK08195, PRK08195, 4-hyroxy-2-oxovalerate/4-hydroxy-2-oxopentanoic acid aldolase,; Validated	NA|404aa|down_0|NZ_CP029741.1_3618767_3619979_+	PRK11551, PRK11551, putative 3-hydroxyphenylpropionic transporter MhpT; Provisional	NA|180aa|down_1|NZ_CP029741.1_3620080_3620620_+	COG3122, COG3122, Uncharacterized protein conserved in bacteria [Function unknown]	NA|278aa|down_2|NZ_CP029741.1_3620845_3621679_-	TIGR02821, S-formylglutathione_hydrolase, S-formylglutathione hydrolase	NA|370aa|down_3|NZ_CP029741.1_3621771_3622881_-	cd08300, alcohol_DH_class_III, class III alcohol dehydrogenases	NA|92aa|down_4|NZ_CP029741.1_3622915_3623191_-	PRK11352, PRK11352, formaldehyde-responsive transcriptional repressor FrmR	NA|258aa|down_5|NZ_CP029741.1_3623376_3624150_-	TIGR04390, hypothetical_protein, outer membrane protein, YaiO family	NA|81aa|down_6|NZ_CP029741.1_3625267_3625510_-	TIGR03991, alt_bact_glmU, UDP-N-acetylglucosamine diphosphorylase/glucosamine-1-phosphate N-acetyltransferase	NA|399aa|down_7|NZ_CP029741.1_3625487_3626684_-	COG1215, COG1215, Glycosyltransferases, probably involved in cell wall biogenesis [Cell envelope biogenesis, outer membrane]	NA|224aa|down_8|NZ_CP029741.1_3626693_3627365_-	COG2120, COG2120, Uncharacterized proteins, LmbE homologs [Function unknown]	NA|321aa|down_9|NZ_CP029741.1_3627980_3628943_+	PRK11480, tauA, taurine transporter substrate binding subunit; Provisional
GCF_003204155.1_ASM320415v1	NZ_CP029741	Escherichia coli strain AR_0085 chromosome, complete genome	9	3653956-3654100	9	CRISPRCasFinder	no		WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	Orphan	ATGCCTGATGCGACGCTTGCCGCGTCTTATCAGGCCTACAAAA	43	0	0	NA	NA	NA	1	1	Orphan	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA|28aa|up_2|NZ_CP029741.1_3651826_3651910_+,NA	NA|372aa|up_9|NZ_CP029741.1_3646582_3647698_+	PRK10245, adrA, diguanylate cyclase AdrA; Provisional	NA|270aa|up_8|NZ_CP029741.1_3647714_3648524_-	PRK11880, PRK11880, pyrroline-5-carboxylate reductase; Reviewed	NA|155aa|up_7|NZ_CP029741.1_3648643_3649108_+	PRK00124, PRK00124, YaiI/YqxD family protein	NA|175aa|up_6|NZ_CP029741.1_3649284_3649809_+	PRK03731, aroL, shikimate kinase AroL	NA|64aa|up_5|NZ_CP029741.1_3649858_3650050_+	PRK10380, PRK10380, hypothetical protein; Provisional	NA|226aa|up_4|NZ_CP029741.1_3650307_3650985_+	PRK10481, PRK10481, hypothetical protein; Provisional	NA|95aa|up_3|NZ_CP029741.1_3651056_3651341_+	PRK10579, PRK10579, pyrimidine/purine nucleoside phosphorylase	NA|28aa|up_2|NZ_CP029741.1_3651826_3651910_+	NA	NA|304aa|up_1|NZ_CP029741.1_3651987_3652899_-	COG2974, RdgC, DNA recombination-dependent growth factor C [DNA replication, recombination, and repair]	NA|303aa|up_0|NZ_CP029741.1_3653023_3653932_+	PRK09557, PRK09557, fructokinase; Reviewed	NA|395aa|down_0|NZ_CP029741.1_3654176_3655361_-	PRK10091, PRK10091, MFS transport protein AraJ; Provisional	NA|1049aa|down_1|NZ_CP029741.1_3655486_3658633_-	PRK10246, PRK10246, exonuclease subunit SbcC; Provisional	NA|401aa|down_2|NZ_CP029741.1_3658629_3659832_-	PRK10966, PRK10966, exonuclease subunit SbcD; Provisional	NA|230aa|down_3|NZ_CP029741.1_3660021_3660711_+	PRK10161, PRK10161, phosphate response regulator transcription factor PhoB	NA|432aa|down_4|NZ_CP029741.1_3660768_3662064_+	PRK11006, phoR, phosphate regulon sensor histidine kinase PhoR	NA|440aa|down_5|NZ_CP029741.1_3662470_3663790_+	PRK15433, PRK15433, branched-chain amino acid transporter carrier protein BrnQ	NA|458aa|down_6|NZ_CP029741.1_3663865_3665239_+	PRK10580, proY, putative proline-specific permease; Provisional	NA|606aa|down_7|NZ_CP029741.1_3665394_3667212_+	PRK10785, PRK10785, maltodextrin glucosidase; Provisional	NA|194aa|down_8|NZ_CP029741.1_3667216_3667798_-	PRK10045, PRK10045, ACP phosphodiesterase	NA|357aa|down_9|NZ_CP029741.1_3667890_3668961_+	PRK00147, queA, S-adenosylmethionine:tRNA ribosyltransferase-isomerase; Provisional
GCF_003204155.1_ASM320415v1	NZ_CP029741	Escherichia coli strain AR_0085 chromosome, complete genome	10	3805319-3805415	10	CRISPRCasFinder	no		WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	Orphan	GCTTGACGCGTCTTATCAGGCCTACAA	27	0	0	NA	NA	NA	1	1	Orphan	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA|69aa|up_9|NZ_CP029741.1_3795634_3795841_+,NA|138aa|up_6|NZ_CP029741.1_3797255_3797669_+,NA|94aa|up_4|NZ_CP029741.1_3798565_3798847_+,NA	NA|69aa|up_9|NZ_CP029741.1_3795634_3795841_+	NA	NA|352aa|up_8|NZ_CP029741.1_3795840_3796896_+	pfam03864, Phage_cap_E, Phage major capsid protein E	NA|112aa|up_7|NZ_CP029741.1_3796907_3797243_+	pfam02924, HDPD, Bacteriophage lambda head decoration protein D	NA|138aa|up_6|NZ_CP029741.1_3797255_3797669_+	NA	NA|147aa|up_5|NZ_CP029741.1_3797831_3798272_+	TIGR02257, Aerobic_cobaltochelatase_subunit_CobN, cobaltochelatase, CobN subunit	NA|94aa|up_4|NZ_CP029741.1_3798565_3798847_+	NA	NA|412aa|up_3|NZ_CP029741.1_3799280_3800516_-	TIGR03176, AllC, allantoate amidohydrolase	NA|350aa|up_2|NZ_CP029741.1_3800537_3801587_-	PRK15025, PRK15025, ureidoglycolate dehydrogenase; Provisional	NA|272aa|up_1|NZ_CP029741.1_3803579_3804395_+	pfam11392, DUF2877, Protein of unknown function (DUF2877)	NA|298aa|up_0|NZ_CP029741.1_3804391_3805285_+	PRK09411, PRK09411, carbamate kinase; Reviewed	NA|356aa|down_0|NZ_CP029741.1_3805479_3806547_-	PRK06019, PRK06019, phosphoribosylaminoimidazole carboxylase ATPase subunit; Reviewed	NA|170aa|down_1|NZ_CP029741.1_3806543_3807053_-	COG0041, PurE, Phosphoribosylcarboxyaminoimidazole (NCAIR) mutase [Nucleotide transport and metabolism]	NA|241aa|down_2|NZ_CP029741.1_3807170_3807893_-	PRK05340, PRK05340, UDP-2,3-diacylglucosamine hydrolase; Provisional	NA|165aa|down_3|NZ_CP029741.1_3807895_3808390_-	PRK10791, PRK10791, peptidylprolyl isomerase B	NA|462aa|down_4|NZ_CP029741.1_3808563_3809949_+	PRK00260, cysS, cysteinyl-tRNA synthetase; Validated	NA|174aa|down_5|NZ_CP029741.1_3809984_3810506_-	COG1988, COG1988, Predicted membrane-bound metal-dependent hydrolases [General function prediction only]	NA|71aa|down_6|NZ_CP029741.1_3810613_3810826_-	PRK11507, PRK11507, ribosome-associated protein YbcJ	NA|289aa|down_7|NZ_CP029741.1_3810827_3811694_-	PRK10792, PRK10792, bifunctional methylenetetrahydrofolate dehydrogenase/methenyltetrahydrofolate cyclohydrolase FolD	NA|181aa|down_8|NZ_CP029741.1_3812164_3812707_+	PRK15194, PRK15194, type 1 fimbrial protein subunit FimA	NA|231aa|down_9|NZ_CP029741.1_3812926_3813619_+	PRK15195, PRK15195, molecular chaperone FimC
GCF_003204155.1_ASM320415v1	NZ_CP029743	Escherichia coli strain AR_0085 plasmid unnamed2, complete sequence	1	51649-51834	1	PILER-CR	no		csa3,DEDDh	Orphan	TTTGATATGTGGGAACGCTGCACGAT	26	0	0	NA	NA	NA	2	2	Orphan	WYL,c2c9_V-U4,DEDDh,cas3,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,PD-DExK,DinG	NA|203aa|up_8|NZ_CP029743.1_44422_45031_+,NA|184aa|up_7|NZ_CP029743.1_45027_45579_+,NA|98aa|up_4|NZ_CP029743.1_47382_47676_-,NA|180aa|up_2|NZ_CP029743.1_49174_49714_+,NA|96aa|up_1|NZ_CP029743.1_49718_50006_+,NA|367aa|up_0|NZ_CP029743.1_49990_51091_+,NA|55aa|down_0|NZ_CP029743.1_51876_52041_+,NA|145aa|down_1|NZ_CP029743.1_52127_52562_-,NA|43aa|down_3|NZ_CP029743.1_53838_53967_+,NA|203aa|down_4|NZ_CP029743.1_53963_54572_+,NA|174aa|down_5|NZ_CP029743.1_54576_55098_+,NA|174aa|down_6|NZ_CP029743.1_55100_55622_+,NA|158aa|down_7|NZ_CP029743.1_55718_56192_+,NA|98aa|down_8|NZ_CP029743.1_56202_56496_+,NA|285aa|down_9|NZ_CP029743.1_56500_57355_+	NA|178aa|up_9|NZ_CP029743.1_43878_44412_+	cd13400, LT_IagB-like, Escherichia coli invasion protein IagB and similar proteins	NA|203aa|up_8|NZ_CP029743.1_44422_45031_+	NA	NA|184aa|up_7|NZ_CP029743.1_45027_45579_+	NA	NA|403aa|up_6|NZ_CP029743.1_45668_46877_+	COG3328, COG3328, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|140aa|up_5|NZ_CP029743.1_46961_47381_-	PRK00247, PRK00247, putative inner membrane protein translocase component YidC; Validated	NA|98aa|up_4|NZ_CP029743.1_47382_47676_-	NA	NA|328aa|up_3|NZ_CP029743.1_47692_48676_-	cd10227, ParM_like, Plasmid segregation protein ParM and similar proteins	NA|180aa|up_2|NZ_CP029743.1_49174_49714_+	NA	NA|96aa|up_1|NZ_CP029743.1_49718_50006_+	NA	NA|367aa|up_0|NZ_CP029743.1_49990_51091_+	NA	NA|55aa|down_0|NZ_CP029743.1_51876_52041_+	NA	NA|145aa|down_1|NZ_CP029743.1_52127_52562_-	NA	NA|372aa|down_2|NZ_CP029743.1_52579_53695_-	cd01713, PAPS_reductase, This domain is found in phosphoadenosine phosphosulphate (PAPS) reductase enzymes or PAPS sulphotransferase	NA|43aa|down_3|NZ_CP029743.1_53838_53967_+	NA	NA|203aa|down_4|NZ_CP029743.1_53963_54572_+	NA	NA|174aa|down_5|NZ_CP029743.1_54576_55098_+	NA	NA|174aa|down_6|NZ_CP029743.1_55100_55622_+	NA	NA|158aa|down_7|NZ_CP029743.1_55718_56192_+	NA	NA|98aa|down_8|NZ_CP029743.1_56202_56496_+	NA	NA|285aa|down_9|NZ_CP029743.1_56500_57355_+	NA
