assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_003095635.1_ASM309563v1	NZ_CP029164	Escherichia coli strain 104 chromosome, complete genome	1	136157-136296	1	CRISPRCasFinder	no		DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	Orphan	TGTTATTGTCGGATGCGGCGTGAACGCCTTATCCGACCTACACA	44	0	0	NA	NA	NA	1	1	Orphan	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	NA,NA	NA|340aa|up_9|NZ_CP029164.1_124367_125387_+	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)	NA|188aa|up_8|NZ_CP029164.1_125390_125954_-	PRK09825, idnK, gluconokinase	NA|344aa|up_7|NZ_CP029164.1_126170_127202_+	PRK09880, PRK09880, L-idonate 5-dehydrogenase; Provisional	NA|255aa|up_6|NZ_CP029164.1_127225_127990_+	PRK08085, PRK08085, gluconate 5-dehydrogenase; Provisional	NA|440aa|up_5|NZ_CP029164.1_128054_129374_+	TIGR00791, Gluconate_permease, gluconate transporter	NA|333aa|up_4|NZ_CP029164.1_129440_130439_+	cd01575, PBP1_GntR, ligand-binding domain of DNA transcription repressor GntR specific for gluconate, a member of the LacI-GalR family of bacterial transcription regulators	NA|501aa|up_3|NZ_CP029164.1_130516_132019_+	pfam05872, DUF853, Bacterial protein of unknown function (DUF853)	NA|361aa|up_2|NZ_CP029164.1_132179_133262_-	PRK15071, PRK15071, lipopolysaccharide ABC transporter permease; Provisional	NA|367aa|up_1|NZ_CP029164.1_133261_134362_-	PRK15120, PRK15120, lipopolysaccharide ABC transporter permease LptF; Provisional	NA|504aa|up_0|NZ_CP029164.1_134628_136140_+	PRK00913, PRK00913, multifunctional aminopeptidase A; Provisional	NA|148aa|down_0|NZ_CP029164.1_136397_136841_+	PRK05728, PRK05728, DNA polymerase III subunit chi; Validated	NA|952aa|down_1|NZ_CP029164.1_136840_139696_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|396aa|down_2|NZ_CP029164.1_139742_140930_-	COG4269, COG4269, Predicted membrane protein [Function unknown]	NA|168aa|down_3|NZ_CP029164.1_141122_141626_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|139aa|down_4|NZ_CP029164.1_141802_142219_-	PRK11191, PRK11191, ribonuclease E inhibitor RraB	NA|335aa|down_5|NZ_CP029164.1_142380_143385_+	PRK03515, PRK03515, ornithine carbamoyltransferase subunit I; Provisional	NA|151aa|down_6|NZ_CP029164.1_143430_143883_-	COG2731, EbgC, Beta-galactosidase, beta subunit [Carbohydrate transport and metabolism]	NA|407aa|down_7|NZ_CP029164.1_144560_145781_+	PRK01388, PRK01388, arginine deiminase; Provisional	NA|315aa|down_8|NZ_CP029164.1_145791_146736_+	PRK12354, PRK12354, carbamate kinase; Reviewed	NA|335aa|down_9|NZ_CP029164.1_146746_147751_+	PRK02102, PRK02102, ornithine carbamoyltransferase; Validated
GCF_003095635.1_ASM309563v1	NZ_CP029164	Escherichia coli strain 104 chromosome, complete genome	2	917706-917844	2	CRISPRCasFinder	no		DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	Orphan	CTCATACTGACAGTCAGGTCACAGCAGTACGTGATGAACT	40	1	1	917746-917804	NZ_CP029164.1_1712076-1712134	NA	1	1	Orphan	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	NA|176aa|up_9|NZ_CP029164.1_909021_909549_+,NA|64aa|up_7|NZ_CP029164.1_909883_910075_-,NA	NA|176aa|up_9|NZ_CP029164.1_909021_909549_+	NA	NA|83aa|up_8|NZ_CP029164.1_909566_909815_-	pfam04352, ProQ, ProQ/FINO family	NA|64aa|up_7|NZ_CP029164.1_909883_910075_-	NA	NA|340aa|up_6|NZ_CP029164.1_910670_911690_-	cd01575, PBP1_GntR, ligand-binding domain of DNA transcription repressor GntR specific for gluconate, a member of the LacI-GalR family of bacterial transcription regulators	NA|148aa|up_5|NZ_CP029164.1_911947_912391_+	cd00211, PTS_IIA_fru, PTS_IIA, PTS system, fructose/mannitol specific IIA subunit	NA|91aa|up_4|NZ_CP029164.1_912469_912742_+	cd05563, PTS_IIB_ascorbate, PTS_IIB_ascorbate: subunit IIB of enzyme II (EII) of the L-ascorbate-specific phosphoenolpyruvate:carbohydrate phosphotransferase system (PTS)	NA|463aa|up_3|NZ_CP029164.1_912764_914153_+	PRK12996, ulaA, PTS ascorbate transporter subunit IIC	NA|277aa|up_2|NZ_CP029164.1_914149_914980_+	COG3959, COG3959, Transketolase, N-terminal subunit [Carbohydrate transport and metabolism]	NA|318aa|up_1|NZ_CP029164.1_914972_915926_+	COG3958, COG3958, Transketolase, C-terminal subunit [Carbohydrate transport and metabolism]	NA|38aa|up_0|NZ_CP029164.1_916188_916302_+	pfam01527, HTH_Tnp_1, Transposase	NA|152aa|down_0|NZ_CP029164.1_918473_918929_+	pfam08281, Sigma70_r4_2, Sigma-70, region 4	NA|113aa|down_1|NZ_CP029164.1_919285_919624_-	PRK13791, PRK13791, c-type lysozyme inhibitor	NA|230aa|down_2|NZ_CP029164.1_920128_920818_-	PRK01130, PRK01130, putative N-acetylmannosamine-6-phosphate 2-epimerase	NA|519aa|down_3|NZ_CP029164.1_920817_922374_-	TIGR02002, PTS_system_glucose-specific_IIABC_component, PTS system, glucose-specific IIBC component	NA|275aa|down_4|NZ_CP029164.1_922539_923364_+	COG1737, RpiR, Transcriptional regulators [Transcription]	NA|448aa|down_5|NZ_CP029164.1_923520_924864_-	COG4222, COG4222, Uncharacterized protein conserved in bacteria [Function unknown]	NA|425aa|down_6|NZ_CP029164.1_924983_926257_-	PRK09409, PRK09409, IS2 transposase TnpB; Reviewed	NA|439aa|down_7|NZ_CP029164.1_927694_929011_-	PRK10974, PRK10974, sn-glycerol-3-phosphate ABC transporter substrate-binding protein UgpB	NA|62aa|down_8|NZ_CP029164.1_929181_929367_+	COG2337, MazF, Growth inhibitor [Signal transduction mechanisms]	NA|36aa|down_9|NZ_CP029164.1_929375_929483_+	COG2337, MazF, Growth inhibitor [Signal transduction mechanisms]
GCF_003095635.1_ASM309563v1	NZ_CP029164	Escherichia coli strain 104 chromosome, complete genome	3	2002885-2003401	1,3,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	Unclear	GAGTTCCCCACGTCAGCGGGGATAAACCG,GAGTTCCCCACGTCAGCGGGGATAAACCG,GAGTTCCCCNCGNCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29,29	0	0	NA	NA	I-E:I-E:I-E:I-E	7,8,8,7	8	Unclear	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	NA,NA	NA|451aa|up_9|NZ_CP029164.1_1985826_1987179_+	TIGR00893, Probable_glucarate_transporter, D-galactonate transporter	NA|447aa|up_8|NZ_CP029164.1_1987180_1988521_+	TIGR03247, glucar-dehydr, glucarate dehydratase	NA|447aa|up_7|NZ_CP029164.1_1988541_1989882_+	TIGR03247, glucar-dehydr, glucarate dehydratase	NA|919aa|up_6|NZ_CP029164.1_1990112_1992869_-	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional	NA|434aa|up_5|NZ_CP029164.1_1992925_1994227_+	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|745aa|up_4|NZ_CP029164.1_1994274_1996509_+	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|264aa|up_3|NZ_CP029164.1_1996604_1997396_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_2|NZ_CP029164.1_1997623_1999261_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_1|NZ_CP029164.1_1999347_2000646_+	PRK00077, eno, enolase; Provisional	NA|224aa|up_0|NZ_CP029164.1_2001873_2002545_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|493aa|down_0|NZ_CP029164.1_2004038_2005517_-	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|426aa|down_1|NZ_CP029164.1_2005543_2006821_-	cd06174, MFS, Major Facilitator Superfamily	NA|262aa|down_2|NZ_CP029164.1_2007139_2007925_+	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|485aa|down_3|NZ_CP029164.1_2007994_2009449_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|470aa|down_4|NZ_CP029164.1_2009470_2010880_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|260aa|down_5|NZ_CP029164.1_2010857_2011637_+	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|287aa|down_6|NZ_CP029164.1_2011633_2012494_+	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|192aa|down_7|NZ_CP029164.1_2012640_2013216_-	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|87aa|down_8|NZ_CP029164.1_2013232_2013493_-	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|424aa|down_9|NZ_CP029164.1_2013483_2014755_-	PRK10015, PRK10015, oxidoreductase; Provisional
GCF_003095635.1_ASM309563v1	NZ_CP029164	Escherichia coli strain 104 chromosome, complete genome	4	2029103-2030107	3,4,2	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cse2gr11,cas7,cas5,cas6e,cas1,cas2	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	Type I-E	GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	16,16,16	16	TypeI-E	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	NA,NA	NA|571aa|up_9|NZ_CP029164.1_2017312_2019025_+	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit	NA|245aa|up_8|NZ_CP029164.1_2019098_2019833_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|51aa|up_7|NZ_CP029164.1_2020096_2020249_+	pfam01848, HOK_GEF, Hok/gef family	cas3|886aa|up_6|NZ_CP029164.1_2020486_2023144_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cse2gr11|179aa|up_5|NZ_CP029164.1_2024800_2025337_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|352aa|up_4|NZ_CP029164.1_2025351_2026407_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|249aa|up_3|NZ_CP029164.1_2026417_2027164_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|217aa|up_2|NZ_CP029164.1_2027145_2027796_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas1|308aa|up_1|NZ_CP029164.1_2027792_2028716_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|98aa|up_0|NZ_CP029164.1_2028712_2029006_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|346aa|down_0|NZ_CP029164.1_2030188_2031226_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|NZ_CP029164.1_2031477_2032386_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|476aa|down_2|NZ_CP029164.1_2032387_2033815_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|NZ_CP029164.1_2033814_2034420_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|108aa|down_4|NZ_CP029164.1_2034469_2034793_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|NZ_CP029164.1_2034986_2035298_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|NZ_CP029164.1_2035316_2036027_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|NZ_CP029164.1_2036026_2036506_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|NZ_CP029164.1_2036502_2037552_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|NZ_CP029164.1_2037532_2038294_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCF_003095635.1_ASM309563v1	NZ_CP029164	Escherichia coli strain 104 chromosome, complete genome	5	3135822-3135945	5	CRISPRCasFinder	no	DEDDh	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	NA,NA|30aa|down_7|NZ_CP029164.1_3144841_3144931_+	NA|471aa|up_9|NZ_CP029164.1_3125275_3126688_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|NZ_CP029164.1_3127244_3127454_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|NZ_CP029164.1_3127909_3128536_+	PRK09898, PRK09898, ferredoxin-like protein	NA|701aa|up_6|NZ_CP029164.1_3128556_3130659_+	PRK09849, PRK09849, putative oxidoreductase; Provisional	NA|213aa|up_5|NZ_CP029164.1_3130671_3131310_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|NZ_CP029164.1_3131373_3132042_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|NZ_CP029164.1_3132038_3132824_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|271aa|up_2|NZ_CP029164.1_3132827_3133640_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|537aa|up_1|NZ_CP029164.1_3133645_3135256_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|102aa|up_0|NZ_CP029164.1_3135381_3135687_-	PRK11118, PRK11118, putative monooxygenase; Provisional	NA|419aa|down_0|NZ_CP029164.1_3136259_3137516_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|NZ_CP029164.1_3137556_3138930_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|214aa|down_2|NZ_CP029164.1_3139144_3139786_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|NZ_CP029164.1_3139825_3140974_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|NZ_CP029164.1_3141264_3142476_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|NZ_CP029164.1_3142588_3143521_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|NZ_CP029164.1_3143517_3144543_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|30aa|down_7|NZ_CP029164.1_3144841_3144931_+	NA	NA|390aa|down_8|NZ_CP029164.1_3145096_3146266_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|194aa|down_9|NZ_CP029164.1_3146411_3146993_-	PRK10543, PRK10543, superoxide dismutase [Fe]
GCF_003095635.1_ASM309563v1	NZ_CP029164	Escherichia coli strain 104 chromosome, complete genome	6	3774242-3774333	6	CRISPRCasFinder	no		DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	Orphan	CCACCTTTTTTACCTGCTTCAGATGC	26	0	0	NA	NA	NA	1	1	Orphan	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,c2c9_V-U4,DinG	NA|70aa|up_9|NZ_CP029164.1_3763493_3763703_-,NA	NA|70aa|up_9|NZ_CP029164.1_3763493_3763703_-	NA	NA|1321aa|up_8|NZ_CP029164.1_3763757_3767720_+	PRK11809, putA, trifunctional transcriptional regulator/proline dehydrogenase/pyrroline-5-carboxylate dehydrogenase; Reviewed	NA|213aa|up_7|NZ_CP029164.1_3767759_3768398_-	PRK15008, PRK15008, HTH-type transcriptional regulator RutR; Provisional	NA|364aa|up_6|NZ_CP029164.1_3768685_3769777_+	TIGR03612, RutA, pyrimidine utilization protein A	NA|231aa|up_5|NZ_CP029164.1_3769776_3770469_+	TIGR03614, RutB, pyrimidine utilization protein B	NA|129aa|up_4|NZ_CP029164.1_3770480_3770867_+	TIGR03610, RutC, pyrimidine utilization protein C	NA|271aa|up_3|NZ_CP029164.1_3770874_3771687_+	TIGR03611, RutD, pyrimidine utilization protein D	NA|197aa|up_2|NZ_CP029164.1_3771683_3772274_+	PRK05365, PRK05365, malonic semialdehyde reductase; Provisional	NA|165aa|up_1|NZ_CP029164.1_3772284_3772779_+	TIGR03615, flavoprotein_oxidoreductase, pyrimidine utilization flavin reductase protein F	NA|443aa|up_0|NZ_CP029164.1_3772799_3774128_+	TIGR03616, Putative_pyrimidine_permease_RutG, pyrimidine utilization transport protein G	NA|199aa|down_0|NZ_CP029164.1_3774756_3775353_+	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|76aa|down_1|NZ_CP029164.1_3775373_3775601_+	PRK10174, PRK10174, hypothetical protein; Provisional	NA|414aa|down_2|NZ_CP029164.1_3775638_3776880_-	PRK10173, PRK10173, glucose-1-phosphatase/inositol phosphatase; Provisional	NA|307aa|down_3|NZ_CP029164.1_3777414_3778335_+	PRK10266, PRK10266, curved DNA-binding protein	NA|102aa|down_4|NZ_CP029164.1_3778334_3778640_+	PRK10265, PRK10265, chaperone modulator CbpM	NA|200aa|down_5|NZ_CP029164.1_3778995_3779595_-	PRK04976, torD, chaperone protein TorD; Validated	NA|849aa|down_6|NZ_CP029164.1_3779591_3782138_-	PRK15102, PRK15102, trimethylamine-N-oxide reductase TorA	NA|391aa|down_7|NZ_CP029164.1_3782137_3783310_-	PRK15032, PRK15032, pentaheme c-type cytochrome TorC	NA|231aa|down_8|NZ_CP029164.1_3783439_3784132_+	PRK10766, PRK10766, two-component system response regulator TorR	NA|343aa|down_9|NZ_CP029164.1_3784104_3785133_-	PRK10936, PRK10936, TMAO reductase system periplasmic protein TorT; Provisional
