assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCA_003095635.1_ASM309563v1	CP029164	Escherichia coli strain 104 chromosome, complete genome	1	136157-136296	1	CRISPRCasFinder	no		DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	Orphan	TGTTATTGTCGGATGCGGCGTGAACGCCTTATCCGACCTACACA	44	0	0	NA	NA	NA	1	1	Orphan	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	NA,NA	NA|340aa|up_9|CP029164.1_124367_125387_+	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)	NA|188aa|up_8|CP029164.1_125390_125954_-	PRK09825, idnK, gluconokinase	NA|344aa|up_7|CP029164.1_126170_127202_+	PRK09880, PRK09880, L-idonate 5-dehydrogenase; Provisional	NA|255aa|up_6|CP029164.1_127225_127990_+	PRK08085, PRK08085, gluconate 5-dehydrogenase; Provisional	NA|440aa|up_5|CP029164.1_128054_129374_+	TIGR00791, Gluconate_permease, gluconate transporter	NA|333aa|up_4|CP029164.1_129440_130439_+	cd01575, PBP1_GntR, ligand-binding domain of DNA transcription repressor GntR specific for gluconate, a member of the LacI-GalR family of bacterial transcription regulators	NA|501aa|up_3|CP029164.1_130516_132019_+	pfam05872, DUF853, Bacterial protein of unknown function (DUF853)	NA|361aa|up_2|CP029164.1_132179_133262_-	PRK15071, PRK15071, lipopolysaccharide ABC transporter permease; Provisional	NA|367aa|up_1|CP029164.1_133261_134362_-	PRK15120, PRK15120, lipopolysaccharide ABC transporter permease LptF; Provisional	NA|504aa|up_0|CP029164.1_134628_136140_+	PRK00913, PRK00913, multifunctional aminopeptidase A; Provisional	NA|148aa|down_0|CP029164.1_136397_136841_+	PRK05728, PRK05728, DNA polymerase III subunit chi; Validated	NA|952aa|down_1|CP029164.1_136840_139696_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|396aa|down_2|CP029164.1_139742_140930_-	COG4269, COG4269, Predicted membrane protein [Function unknown]	NA|168aa|down_3|CP029164.1_141122_141626_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|139aa|down_4|CP029164.1_141802_142219_-	PRK11191, PRK11191, ribonuclease E inhibitor RraB	NA|335aa|down_5|CP029164.1_142380_143385_+	PRK03515, PRK03515, ornithine carbamoyltransferase subunit I; Provisional	NA|151aa|down_6|CP029164.1_143430_143883_-	COG2731, EbgC, Beta-galactosidase, beta subunit [Carbohydrate transport and metabolism]	NA|407aa|down_7|CP029164.1_144560_145781_+	PRK01388, PRK01388, arginine deiminase; Provisional	NA|315aa|down_8|CP029164.1_145791_146736_+	PRK12354, PRK12354, carbamate kinase; Reviewed	NA|335aa|down_9|CP029164.1_146746_147751_+	PRK02102, PRK02102, ornithine carbamoyltransferase; Validated
GCA_003095635.1_ASM309563v1	CP029164	Escherichia coli strain 104 chromosome, complete genome	3	2002885-2003401	1,3,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	Unclear	GAGTTCCCCACGTCAGCGGGGATAAACCG,GAGTTCCCCACGTCAGCGGGGATAAACCG,GAGTTCCCCNCGNCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29,29	0	0	NA	NA	I-E:I-E:I-E:I-E	7,8,8,7	8	Unclear	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	NA,NA	NA|451aa|up_9|CP029164.1_1985826_1987179_+	TIGR00893, Probable_glucarate_transporter, D-galactonate transporter	NA|447aa|up_8|CP029164.1_1987180_1988521_+	TIGR03247, glucar-dehydr, glucarate dehydratase	NA|447aa|up_7|CP029164.1_1988541_1989882_+	TIGR03247, glucar-dehydr, glucarate dehydratase	NA|919aa|up_6|CP029164.1_1990112_1992869_-	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional	NA|434aa|up_5|CP029164.1_1992925_1994227_+	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|745aa|up_4|CP029164.1_1994274_1996509_+	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|264aa|up_3|CP029164.1_1996604_1997396_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_2|CP029164.1_1997623_1999261_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_1|CP029164.1_1999347_2000646_+	PRK00077, eno, enolase; Provisional	NA|224aa|up_0|CP029164.1_2001873_2002545_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|493aa|down_0|CP029164.1_2004038_2005517_-	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|426aa|down_1|CP029164.1_2005543_2006821_-	cd06174, MFS, Major Facilitator Superfamily	NA|262aa|down_2|CP029164.1_2007139_2007925_+	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|485aa|down_3|CP029164.1_2007994_2009449_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|446aa|down_4|CP029164.1_2009542_2010880_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|260aa|down_5|CP029164.1_2010857_2011637_+	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|287aa|down_6|CP029164.1_2011633_2012494_+	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|192aa|down_7|CP029164.1_2012640_2013216_-	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|87aa|down_8|CP029164.1_2013232_2013493_-	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|424aa|down_9|CP029164.1_2013483_2014755_-	PRK10015, PRK10015, oxidoreductase; Provisional
GCA_003095635.1_ASM309563v1	CP029164	Escherichia coli strain 104 chromosome, complete genome	4	2029103-2030107	3,4,2	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cse2gr11,cas7,cas5,cas6e,cas1,cas2	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	Type I-E	GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	16,16,16	16	TypeI-E	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	NA,NA	NA|571aa|up_9|CP029164.1_2017312_2019025_+	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit	NA|245aa|up_8|CP029164.1_2019098_2019833_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|51aa|up_7|CP029164.1_2020096_2020249_+	pfam01848, HOK_GEF, Hok/gef family	cas3|886aa|up_6|CP029164.1_2020486_2023144_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cse2gr11|179aa|up_5|CP029164.1_2024800_2025337_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|352aa|up_4|CP029164.1_2025351_2026407_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|249aa|up_3|CP029164.1_2026417_2027164_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|217aa|up_2|CP029164.1_2027145_2027796_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas1|308aa|up_1|CP029164.1_2027792_2028716_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|98aa|up_0|CP029164.1_2028712_2029006_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|346aa|down_0|CP029164.1_2030188_2031226_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|CP029164.1_2031477_2032386_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|476aa|down_2|CP029164.1_2032387_2033815_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|CP029164.1_2033814_2034420_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|108aa|down_4|CP029164.1_2034469_2034793_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|CP029164.1_2034986_2035298_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|CP029164.1_2035316_2036027_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|CP029164.1_2036026_2036506_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|CP029164.1_2036502_2037552_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|CP029164.1_2037532_2038294_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCA_003095635.1_ASM309563v1	CP029164	Escherichia coli strain 104 chromosome, complete genome	5	3135822-3135945	5	CRISPRCasFinder	no	DEDDh	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	DEDDh,WYL,cas3,csa3,PD-DExK,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DinG	NA,NA|75aa|down_7|CP029164.1_3144530_3144755_-,NA|30aa|down_8|CP029164.1_3144841_3144931_+	NA|471aa|up_9|CP029164.1_3125275_3126688_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|CP029164.1_3127244_3127454_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|CP029164.1_3127909_3128536_+	PRK09898, PRK09898, ferredoxin-like protein	NA|701aa|up_6|CP029164.1_3128556_3130659_+	PRK09849, PRK09849, putative oxidoreductase; Provisional	NA|216aa|up_5|CP029164.1_3130662_3131310_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|CP029164.1_3131373_3132042_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|CP029164.1_3132038_3132824_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|271aa|up_2|CP029164.1_3132827_3133640_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|537aa|up_1|CP029164.1_3133645_3135256_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|102aa|up_0|CP029164.1_3135381_3135687_-	PRK11118, PRK11118, putative monooxygenase; Provisional	NA|419aa|down_0|CP029164.1_3136259_3137516_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|CP029164.1_3137556_3138930_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|214aa|down_2|CP029164.1_3139144_3139786_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|CP029164.1_3139825_3140974_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|CP029164.1_3141264_3142476_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|CP029164.1_3142588_3143521_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|CP029164.1_3143517_3144543_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|75aa|down_7|CP029164.1_3144530_3144755_-	NA	NA|30aa|down_8|CP029164.1_3144841_3144931_+	NA	NA|390aa|down_9|CP029164.1_3145096_3146266_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]
