assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_003017615.1_ASM301761v1	NZ_CP027310	Escherichia coli strain 2014C-4135 chromosome, complete genome	1	1941653-1941904	1	PILER-CR	no		DEDDh,RT,cas3,c2c9_V-U4,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	Orphan	TTTTGGAGGAGCAGAAAGATGAATGACTGTCCACGACGCTATACCCAAAAGAAA	54	0	0	NA	NA	NA	2	2	Orphan	DEDDh,RT,cas3,c2c9_V-U4,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	NA,NA|180aa|down_1|NZ_CP027310.1_1943411_1943951_-	NA|158aa|up_9|NZ_CP027310.1_1931227_1931701_-	PRK11425, PRK11425, PTS N-acetylgalactosamine transporter subunit IIB	NA|427aa|up_8|NZ_CP027310.1_1931723_1933004_-	PRK15458, PRK15458, tagatose 6-phosphate aldolase subunit KbaZ; Provisional	NA|270aa|up_7|NZ_CP027310.1_1933252_1934062_+	PRK09802, PRK09802, DeoR family transcriptional regulator	NA|155aa|up_6|NZ_CP027310.1_1934116_1934581_-	pfam11663, Toxin_YhaV, Toxin with endonuclease activity, of toxin-antitoxin system	NA|112aa|up_5|NZ_CP027310.1_1934580_1934916_-	PRK09974, PRK09974, type II toxin-antitoxin system PrlF family antitoxin	NA|524aa|up_4|NZ_CP027310.1_1935064_1936636_-	TIGR03248, galactar-dH20, galactarate dehydratase	NA|445aa|up_3|NZ_CP027310.1_1937010_1938345_+	TIGR00893, Probable_glucarate_transporter, D-galactonate transporter	NA|257aa|up_2|NZ_CP027310.1_1938360_1939131_+	PRK10558, PRK10558, alpha-dehydro-beta-deoxy-D-glucarate aldolase; Provisional	NA|297aa|up_1|NZ_CP027310.1_1939160_1940051_+	PRK11559, garR, tartronate semialdehyde reductase; Provisional	NA|382aa|up_0|NZ_CP027310.1_1940147_1941293_+	PRK10342, PRK10342, glycerate kinase I; Provisional	NA|396aa|down_0|NZ_CP027310.1_1942202_1943390_-	PRK09716, PRK09716, YhaC family protein	NA|180aa|down_1|NZ_CP027310.1_1943411_1943951_-	NA	NA|115aa|down_2|NZ_CP027310.1_1944206_1944551_-	PRK11424, PRK11424, DNA-binding transcriptional activator TdcR; Provisional	NA|313aa|down_3|NZ_CP027310.1_1944739_1945678_+	PRK10341, PRK10341, transcriptional regulator TdcA	NA|330aa|down_4|NZ_CP027310.1_1945776_1946766_+	PRK08638, PRK08638, bifunctional threonine ammonia-lyase/L-serine ammonia-lyase TdcB	NA|444aa|down_5|NZ_CP027310.1_1946787_1948119_+	PRK13629, PRK13629, threonine/serine transporter TdcC; Provisional	NA|403aa|down_6|NZ_CP027310.1_1948144_1949353_+	PRK12379, PRK12379, propionate kinase	NA|765aa|down_7|NZ_CP027310.1_1949386_1951681_+	cd01678, PFL1, Pyruvate formate lyase 1	NA|130aa|down_8|NZ_CP027310.1_1951694_1952084_+	PRK11401, PRK11401, enamine/imine deaminase	NA|455aa|down_9|NZ_CP027310.1_1952155_1953520_+	PRK15040, PRK15040, L-serine ammonia-lyase
GCF_003017615.1_ASM301761v1	NZ_CP027310	Escherichia coli strain 2014C-4135 chromosome, complete genome	2	2436460-2436732	2,1,1	PILER-CR,CRISPRCasFinder,CRT	no	cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	DEDDh,RT,cas3,c2c9_V-U4,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	Type I-E	GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	3,4,4	4	TypeI-E	DEDDh,RT,cas3,c2c9_V-U4,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	NA|121aa|up_3|NZ_CP027310.1_2433356_2433719_-,NA	NA|745aa|up_9|NZ_CP027310.1_2426292_2428527_+	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|83aa|up_8|NZ_CP027310.1_2428604_2428853_+	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|112aa|up_7|NZ_CP027310.1_2428852_2429188_+	PRK09907, PRK09907, endoribonuclease MazF	NA|264aa|up_6|NZ_CP027310.1_2429258_2430050_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_5|NZ_CP027310.1_2430277_2431915_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_4|NZ_CP027310.1_2432002_2433301_+	PRK00077, eno, enolase; Provisional	NA|121aa|up_3|NZ_CP027310.1_2433356_2433719_-	NA	NA|302aa|up_2|NZ_CP027310.1_2433754_2434660_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|201aa|up_1|NZ_CP027310.1_2434673_2435276_-	COG1704, LemA, Uncharacterized conserved protein [Function unknown]	NA|224aa|up_0|NZ_CP027310.1_2435448_2436120_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|122aa|down_0|NZ_CP027310.1_2437964_2438330_-	cd00470, PTPS, 6-pyruvoyl tetrahydropterin synthase (PTPS)	NA|600aa|down_1|NZ_CP027310.1_2438645_2440445_+	PRK10953, cysJ, NADPH-dependent assimilatory sulfite reductase flavoprotein subunit	NA|571aa|down_2|NZ_CP027310.1_2440444_2442157_+	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit	NA|245aa|down_3|NZ_CP027310.1_2442230_2442965_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|51aa|down_4|NZ_CP027310.1_2443229_2443382_+	pfam01848, HOK_GEF, Hok/gef family	cas8e|521aa|down_5|NZ_CP027310.1_2446371_2447934_+	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cse2gr11|179aa|down_6|NZ_CP027310.1_2447930_2448467_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|352aa|down_7|NZ_CP027310.1_2448481_2449537_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|249aa|down_8|NZ_CP027310.1_2449547_2450294_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|217aa|down_9|NZ_CP027310.1_2450275_2450926_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI
GCF_003017615.1_ASM301761v1	NZ_CP027310	Escherichia coli strain 2014C-4135 chromosome, complete genome	3	2452233-2452871	3,2,2	PILER-CR,CRISPRCasFinder,CRT	no	cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	DEDDh,RT,cas3,c2c9_V-U4,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	Type I-E	GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	10,10,10	10	TypeI-E	DEDDh,RT,cas3,c2c9_V-U4,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	NA,NA	NA|571aa|up_9|NZ_CP027310.1_2440444_2442157_+	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit	NA|245aa|up_8|NZ_CP027310.1_2442230_2442965_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|51aa|up_7|NZ_CP027310.1_2443229_2443382_+	pfam01848, HOK_GEF, Hok/gef family	cas8e|521aa|up_6|NZ_CP027310.1_2446371_2447934_+	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cse2gr11|179aa|up_5|NZ_CP027310.1_2447930_2448467_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|352aa|up_4|NZ_CP027310.1_2448481_2449537_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|249aa|up_3|NZ_CP027310.1_2449547_2450294_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|217aa|up_2|NZ_CP027310.1_2450275_2450926_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas1|308aa|up_1|NZ_CP027310.1_2450922_2451846_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|98aa|up_0|NZ_CP027310.1_2451842_2452136_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|346aa|down_0|NZ_CP027310.1_2452953_2453991_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|NZ_CP027310.1_2454242_2455151_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|476aa|down_2|NZ_CP027310.1_2455152_2456580_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|NZ_CP027310.1_2456579_2457185_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|108aa|down_4|NZ_CP027310.1_2457234_2457558_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|NZ_CP027310.1_2457751_2458063_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|NZ_CP027310.1_2458081_2458792_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|NZ_CP027310.1_2458791_2459271_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|NZ_CP027310.1_2459267_2460317_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|NZ_CP027310.1_2460297_2461059_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCF_003017615.1_ASM301761v1	NZ_CP027310	Escherichia coli strain 2014C-4135 chromosome, complete genome	4	3072443-3072534	3	CRISPRCasFinder	no		DEDDh,RT,cas3,c2c9_V-U4,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	Orphan	GCATCAGAAGCAGGTAAAAAAGGTGG	26	0	0	NA	NA	NA	1	1	Orphan	DEDDh,RT,cas3,c2c9_V-U4,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	NA,NA|70aa|down_9|NZ_CP027310.1_3083073_3083283_+	NA|358aa|up_9|NZ_CP027310.1_3056663_3057737_-	COG0348, NapH, Polyferredoxin [Energy production and conversion]	NA|915aa|up_8|NZ_CP027310.1_3057808_3060553_-	PRK11466, PRK11466, hybrid sensory histidine kinase TorS; Provisional	NA|231aa|up_7|NZ_CP027310.1_3061635_3062328_-	PRK10766, PRK10766, two-component system response regulator TorR	NA|391aa|up_6|NZ_CP027310.1_3062457_3063630_+	PRK15032, PRK15032, pentaheme c-type cytochrome TorC	NA|200aa|up_5|NZ_CP027310.1_3066171_3066771_+	PRK04976, torD, chaperone protein TorD; Validated	NA|102aa|up_4|NZ_CP027310.1_3066863_3067169_-	PRK10265, PRK10265, chaperone modulator CbpM	NA|307aa|up_3|NZ_CP027310.1_3067168_3068089_-	PRK10266, PRK10266, curved DNA-binding protein	NA|420aa|up_2|NZ_CP027310.1_3068348_3069608_+	PRK09784, PRK09784, YccE family protein	NA|76aa|up_1|NZ_CP027310.1_3071174_3071402_-	PRK10174, PRK10174, hypothetical protein; Provisional	NA|199aa|up_0|NZ_CP027310.1_3071422_3072019_-	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|443aa|down_0|NZ_CP027310.1_3072647_3073976_-	TIGR03616, Putative_pyrimidine_permease_RutG, pyrimidine utilization transport protein G	NA|165aa|down_1|NZ_CP027310.1_3073996_3074491_-	TIGR03615, flavoprotein_oxidoreductase, pyrimidine utilization flavin reductase protein F	NA|197aa|down_2|NZ_CP027310.1_3074501_3075092_-	PRK05365, PRK05365, malonic semialdehyde reductase; Provisional	NA|267aa|down_3|NZ_CP027310.1_3075101_3075902_-	TIGR03611, RutD, pyrimidine utilization protein D	NA|129aa|down_4|NZ_CP027310.1_3075909_3076296_-	TIGR03610, RutC, pyrimidine utilization protein C	NA|231aa|down_5|NZ_CP027310.1_3076307_3077000_-	TIGR03614, RutB, pyrimidine utilization protein B	NA|364aa|down_6|NZ_CP027310.1_3076999_3078091_-	TIGR03612, RutA, pyrimidine utilization protein A	NA|213aa|down_7|NZ_CP027310.1_3078378_3079017_+	PRK15008, PRK15008, HTH-type transcriptional regulator RutR; Provisional	NA|1321aa|down_8|NZ_CP027310.1_3079056_3083019_-	PRK11809, putA, trifunctional transcriptional regulator/proline dehydrogenase/pyrroline-5-carboxylate dehydrogenase; Reviewed	NA|70aa|down_9|NZ_CP027310.1_3083073_3083283_+	NA
GCF_003017615.1_ASM301761v1	NZ_CP027310	Escherichia coli strain 2014C-4135 chromosome, complete genome	5	4863186-4863282	4	CRISPRCasFinder	no		DEDDh,RT,cas3,c2c9_V-U4,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	Orphan	TTGTAGGCCTGATAAGATGCGTCAAGC	27	0	0	NA	NA	NA	1	1	Orphan	DEDDh,RT,cas3,c2c9_V-U4,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	NA,NA	NA|870aa|up_9|NZ_CP027310.1_4852332_4854942_-	PRK15198, PRK15198, outer membrane usher protein FimD	NA|231aa|up_8|NZ_CP027310.1_4854972_4855665_-	PRK15195, PRK15195, molecular chaperone FimC	NA|181aa|up_7|NZ_CP027310.1_4855884_4856427_-	PRK15194, PRK15194, type 1 fimbrial protein subunit FimA	NA|289aa|up_6|NZ_CP027310.1_4856907_4857774_+	PRK10792, PRK10792, bifunctional methylenetetrahydrofolate dehydrogenase/methenyltetrahydrofolate cyclohydrolase FolD	NA|71aa|up_5|NZ_CP027310.1_4857775_4857988_+	PRK11507, PRK11507, ribosome-associated protein YbcJ	NA|174aa|up_4|NZ_CP027310.1_4858095_4858617_+	COG1988, COG1988, Predicted membrane-bound metal-dependent hydrolases [General function prediction only]	NA|462aa|up_3|NZ_CP027310.1_4858652_4860038_-	PRK00260, cysS, cysteinyl-tRNA synthetase; Validated	NA|165aa|up_2|NZ_CP027310.1_4860211_4860706_+	PRK10791, PRK10791, peptidylprolyl isomerase B	NA|241aa|up_1|NZ_CP027310.1_4860708_4861431_+	PRK05340, PRK05340, UDP-2,3-diacylglucosamine hydrolase; Provisional	NA|356aa|up_0|NZ_CP027310.1_4862053_4863121_+	PRK06019, PRK06019, phosphoribosylaminoimidazole carboxylase ATPase subunit; Reviewed	NA|298aa|down_0|NZ_CP027310.1_4863315_4864209_-	PRK09411, PRK09411, carbamate kinase; Reviewed	NA|272aa|down_1|NZ_CP027310.1_4864205_4865021_-	pfam11392, DUF2877, Protein of unknown function (DUF2877)	NA|420aa|down_2|NZ_CP027310.1_4865031_4866291_-	pfam06545, DUF1116, Protein of unknown function (DUF1116)	NA|556aa|down_3|NZ_CP027310.1_4866300_4867968_-	PRK06091, PRK06091, membrane protein FdrA; Validated	NA|350aa|down_4|NZ_CP027310.1_4868284_4869334_+	PRK15025, PRK15025, ureidoglycolate dehydrogenase; Provisional	NA|412aa|down_5|NZ_CP027310.1_4869355_4870591_+	TIGR03176, AllC, allantoate amidohydrolase	NA|262aa|down_6|NZ_CP027310.1_4870601_4871387_+	TIGR03214, ura-cupin, putative allantoin catabolism protein	NA|382aa|down_7|NZ_CP027310.1_4871515_4872661_-	PRK09932, PRK09932, glycerate 3-kinase	NA|454aa|down_8|NZ_CP027310.1_4874039_4875401_-	PRK08044, PRK08044, allantoinase AllB	NA|485aa|down_9|NZ_CP027310.1_4875460_4876915_-	PRK11375, PRK11375, putative allantoin permease
