assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCA_002900305.1_ASM290030v1	CP025703	Escherichia coli BH100N substr. MG2017, complete genome	1	153607-153693	1	CRISPRCasFinder	no		DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	Orphan	GTTTTGTAGGCCGGATAAGGCGTTCA	26	1	1	153633-153667	CP025703.1_155130-155164	NA	1	1	Orphan	DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	NA,NA|68aa|down_8|CP025703.1_162989_163193_+	NA|888aa|up_9|CP025703.1_137915_140579_+	PRK09405, aceE, pyruvate dehydrogenase subunit E1; Reviewed	NA|631aa|up_8|CP025703.1_140593_142486_+	PRK11854, aceF, pyruvate dehydrogenase dihydrolipoyltransacetylase; Validated	NA|475aa|up_7|CP025703.1_142693_144118_+	PRK06467, PRK06467, dihydrolipoamide dehydrogenase; Reviewed	NA|586aa|up_6|CP025703.1_144359_146117_-	pfam11737, DUF3300, Protein of unknown function (DUF3300)	NA|866aa|up_5|CP025703.1_146470_149068_+	PRK09238, PRK09238, bifunctional aconitate hydratase 2/2-methylisocitrate dehydratase; Validated	NA|121aa|up_4|CP025703.1_149242_149605_+	PRK05248, PRK05248, hypothetical protein; Provisional	NA|265aa|up_3|CP025703.1_149642_150437_-	PRK05462, PRK05462, adenosylmethionine decarboxylase	NA|289aa|up_2|CP025703.1_150452_151319_-	PRK00811, PRK00811, polyamine aminopropyltransferase	NA|116aa|up_1|CP025703.1_151424_151772_-	pfam09691, T2SS_PulS_OutS, Type II secretion system pilotin lipoprotein (PulS_OutS)	NA|517aa|up_0|CP025703.1_151937_153488_+	PRK10965, PRK10965, multicopper oxidase; Provisional	NA|797aa|down_0|CP025703.1_155180_157571_-	TIGR03074, PQQ_membr_DH, membrane-bound PQQ-dependent dehydrogenase, glucose/quinate/shikimate family	NA|179aa|down_1|CP025703.1_157776_158313_+	PRK15423, PRK15423, hypoxanthine phosphoribosyltransferase; Provisional	NA|221aa|down_2|CP025703.1_158353_159016_-	PRK10437, PRK10437, carbonic anhydrase; Provisional	NA|309aa|down_3|CP025703.1_159124_160051_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|257aa|down_4|CP025703.1_160047_160818_+	PRK15066, PRK15066, inner membrane transport permease; Provisional	NA|147aa|down_5|CP025703.1_160922_161363_+	COG2893, ManX, Phosphotransferase system, mannose/fructose-specific component IIA [Carbohydrate transport and metabolism]	NA|410aa|down_6|CP025703.1_161426_162656_+	cd10966, CE4_yadE_5s, Putative catalytic polysaccharide deacetylase domain of uncharacterized protein yadE and similar proteins	NA|127aa|down_7|CP025703.1_162659_163040_-	TIGR00223, Aspartate_1-decarboxylase, L-aspartate-alpha-decarboxylase	NA|68aa|down_8|CP025703.1_162989_163193_+	NA	NA|311aa|down_9|CP025703.1_163313_164246_+	pfam04754, Transposase_31, Putative transposase, YhgA-like
GCA_002900305.1_ASM290030v1	CP025703	Escherichia coli BH100N substr. MG2017, complete genome	2	1036755-1036902	2	CRISPRCasFinder	no		DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	Orphan	GTTCACTGCCGTACAGGCAGCTTAGAAA	28	0	0	NA	NA	I-F	2	2	Orphan	DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	NA|86aa|up_9|CP025703.1_1028528_1028786_+,NA|69aa|up_7|CP025703.1_1029628_1029835_+,NA|94aa|up_4|CP025703.1_1032492_1032774_+,NA|60aa|up_3|CP025703.1_1032778_1032958_+,NA|80aa|up_2|CP025703.1_1033058_1033298_+,NA|38aa|down_5|CP025703.1_1043178_1043292_+	NA|86aa|up_9|CP025703.1_1028528_1028786_+	NA	NA|141aa|up_8|CP025703.1_1028782_1029205_+	cd04496, SSB_OBF, SSB_OBF: A subfamily of OB folds similar to the OB fold of ssDNA-binding protein (SSB)	NA|69aa|up_7|CP025703.1_1029628_1029835_+	NA	NA|638aa|up_6|CP025703.1_1029834_1031748_+	cd07016, S14_ClpP_1, Caseinolytic protease (ClpP) is an ATP-dependent, highly conserved serine protease	NA|162aa|up_5|CP025703.1_1032004_1032490_+	pfam07278, DUF1441, Protein of unknown function (DUF1441)	NA|94aa|up_4|CP025703.1_1032492_1032774_+	NA	NA|60aa|up_3|CP025703.1_1032778_1032958_+	NA	NA|80aa|up_2|CP025703.1_1033058_1033298_+	NA	NA|107aa|up_1|CP025703.1_1033914_1034235_+	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|759aa|up_0|CP025703.1_1034265_1036542_+	PRK11034, clpA, ATP-dependent Clp protease ATP-binding subunit; Provisional	NA|73aa|down_0|CP025703.1_1037285_1037504_-	PRK00276, infA, translation initiation factor IF-1; Validated	NA|235aa|down_1|CP025703.1_1037788_1038493_-	PRK00301, aat, leucyl/phenylalanyl-tRNA--protein transferase; Reviewed	NA|574aa|down_2|CP025703.1_1038534_1040256_-	PRK11160, PRK11160, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|589aa|down_3|CP025703.1_1040256_1042023_-	PRK11174, PRK11174, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|322aa|down_4|CP025703.1_1042145_1043111_-	PRK10262, PRK10262, thioredoxin reductase; Provisional	NA|38aa|down_5|CP025703.1_1043178_1043292_+	NA	NA|165aa|down_6|CP025703.1_1043654_1044149_+	PRK11169, PRK11169, leucine-responsive transcriptional regulator Lrp	NA|1340aa|down_7|CP025703.1_1044283_1048303_+	PRK10263, PRK10263, DNA translocase FtsK; Provisional	NA|204aa|down_8|CP025703.1_1048461_1049073_+	TIGR00547, Outer-membrane_lipoprotein_carrier_protein, periplasmic chaperone LolA	NA|448aa|down_9|CP025703.1_1049083_1050427_+	PRK13342, PRK13342, recombination factor protein RarA; Reviewed
GCA_002900305.1_ASM290030v1	CP025703	Escherichia coli BH100N substr. MG2017, complete genome	3	2479008-2479121	3	CRISPRCasFinder	no		DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	Orphan	TTTGTAGGCCGGATAAGCGAAGCGCATCCGGCA	33	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	NA|71aa|up_1|CP025703.1_2476412_2476625_-,NA|42aa|down_8|CP025703.1_2488237_2488363_+	NA|259aa|up_9|CP025703.1_2459168_2459945_-	COG4676, COG4676, Uncharacterized protein conserved in bacteria [Function unknown]	NA|550aa|up_8|CP025703.1_2459949_2461599_-	COG5445, COG5445, Predicted secreted protein [Function unknown]	NA|1535aa|up_7|CP025703.1_2461599_2466204_-	COG2373, COG2373, Large extracellular alpha-helical protein [General function prediction only]	NA|208aa|up_6|CP025703.1_2466137_2466761_-	COG3234, COG3234, Uncharacterized protein conserved in bacteria [Function unknown]	NA|563aa|up_5|CP025703.1_2466757_2468446_-	COG4685, COG4685, Uncharacterized protein conserved in bacteria [Function unknown]	NA|876aa|up_4|CP025703.1_2468594_2471222_-	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|241aa|up_3|CP025703.1_2471368_2472091_+	PRK05134, PRK05134, bifunctional 2-polyprenyl-6-hydroxyphenol methylase/3-demethylubiquinol 3-O-methyltransferase UbiG	NA|1253aa|up_2|CP025703.1_2472230_2475989_-	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|71aa|up_1|CP025703.1_2476412_2476625_-	NA	NA|762aa|up_0|CP025703.1_2476670_2478956_+	PRK09103, PRK09103, ribonucleoside-diphosphate reductase subunit alpha	NA|377aa|down_0|CP025703.1_2479145_2480276_+	PRK09101, nrdB, ribonucleotide-diphosphate reductase subunit beta; Reviewed	NA|85aa|down_1|CP025703.1_2480275_2480530_+	PRK10713, PRK10713, 2Fe-2S ferredoxin-like protein	NA|217aa|down_2|CP025703.1_2480583_2481234_-	PRK09902, PRK09902, lipopolysaccharide kinase InaA	NA|359aa|down_3|CP025703.1_2481436_2482513_-	PRK11143, glpQ, glycerophosphodiester phosphodiesterase; Provisional	NA|453aa|down_4|CP025703.1_2482517_2483876_-	PRK11273, glpT, glycerol-3-phosphate transporter	NA|543aa|down_5|CP025703.1_2484148_2485777_+	PRK11101, glpA, anaerobic glycerol-3-phosphate dehydrogenase subunit A	NA|420aa|down_6|CP025703.1_2485766_2487026_+	COG3075, GlpB, Anaerobic glycerol-3-phosphate dehydrogenase [Amino acid transport and metabolism]	NA|397aa|down_7|CP025703.1_2487022_2488213_+	TIGR03379, glycerol3P_GlpC, glycerol-3-phosphate dehydrogenase, anaerobic, C subunit	NA|42aa|down_8|CP025703.1_2488237_2488363_+	NA	NA|320aa|down_9|CP025703.1_2488405_2489365_+	PRK09956, PRK09956, ISNCY family transposase
GCA_002900305.1_ASM290030v1	CP025703	Escherichia coli BH100N substr. MG2017, complete genome	4	4369517-4369718	1	PILER-CR	no		DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	Orphan	GTAGACCGGATAAGGCGTTCACGCCGCATCCGGCAA	36	0	0	NA	NA	NA	2	2	Orphan	DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	NA,NA	NA|252aa|up_9|CP025703.1_4361067_4361823_+	PRK00216, ubiE, bifunctional demethylmenaquinone methyltransferase/2-methoxy-6-polyprenyl-1,4-benzoquinol methylase UbiE	NA|202aa|up_8|CP025703.1_4361836_4362442_+	COG3165, COG3165, Uncharacterized protein conserved in bacteria [Function unknown]	NA|547aa|up_7|CP025703.1_4362438_4364079_+	PRK04750, ubiB, putative ubiquinone biosynthesis protein UbiB; Reviewed	NA|90aa|up_6|CP025703.1_4364157_4364427_+	PRK03554, tatA, Sec-independent protein translocase subunit TatA	NA|172aa|up_5|CP025703.1_4364430_4364946_+	PRK01770, PRK01770, Sec-independent protein translocase subunit TatB	NA|259aa|up_4|CP025703.1_4364948_4365725_+	PRK10921, PRK10921, Sec-independent protein translocase subunit TatC	NA|261aa|up_3|CP025703.1_4365766_4366549_+	PRK10425, PRK10425, 3'-5' ssDNA/RNA exonuclease TatD	NA|163aa|up_2|CP025703.1_4366545_4367034_-	PRK09014, rfaH, transcription/translation regulatory transformer protein RfaH	NA|498aa|up_1|CP025703.1_4367200_4368694_+	PRK10922, PRK10922, 4-hydroxy-3-polyprenylbenzoate decarboxylase	NA|234aa|up_0|CP025703.1_4368739_4369441_+	PRK08051, fre, FMN reductase; Validated	NA|388aa|down_0|CP025703.1_4369722_4370886_-	PRK08947, fadA, 3-ketoacyl-CoA thiolase; Reviewed	NA|730aa|down_1|CP025703.1_4370895_4373085_-	PRK11730, fadB, fatty acid oxidation complex subunit alpha FadB	NA|444aa|down_2|CP025703.1_4373274_4374606_+	PRK13607, PRK13607, proline dipeptidase; Provisional	NA|205aa|down_3|CP025703.1_4374605_4375220_+	PRK11568, PRK11568, IMPACT family protein	NA|484aa|down_4|CP025703.1_4375258_4376710_+	PRK10750, PRK10750, Trk system potassium transporter TrkH	NA|182aa|down_5|CP025703.1_4376721_4377267_+	PRK11104, hemG, menaquinone-dependent protoporphyrinogen IX dehydrogenase	NA|176aa|down_6|CP025703.1_4382758_4383286_-	PRK10751, PRK10751, molybdopterin-guanine dinucleotide biosynthesis protein B; Provisional	NA|195aa|down_7|CP025703.1_4383267_4383852_-	PRK00317, mobA, molybdopterin-guanine dinucleotide biosynthesis protein MobA; Reviewed	NA|90aa|down_8|CP025703.1_4383921_4384191_+	pfam06288, DUF1040, Protein of unknown function (DUF1040)	NA|329aa|down_9|CP025703.1_4384267_4385254_+	PRK11768, PRK11768, serine/threonine protein kinase
GCA_002900305.1_ASM290030v1	CP025703	Escherichia coli BH100N substr. MG2017, complete genome	5	4430053-4430179	4	CRISPRCasFinder	no		DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	Orphan	GTAGGCCGGATAAGGCACTCGTGCCGCATCCGGCA	35	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	NA|85aa|up_5|CP025703.1_4425269_4425524_+,NA|50aa|down_2|CP025703.1_4432987_4433137_+,NA|56aa|down_6|CP025703.1_4435950_4436118_+,NA|43aa|down_8|CP025703.1_4436920_4437049_-	NA|71aa|up_9|CP025703.1_4419315_4419528_+	pfam01402, RHH_1, Ribbon-helix-helix protein, copG family	NA|310aa|up_8|CP025703.1_4419742_4420672_-	PRK03564, PRK03564, formate dehydrogenase accessory protein FdhE; Provisional	NA|212aa|up_7|CP025703.1_4420668_4421304_-	PRK10639, PRK10639, formate dehydrogenase cytochrome b556 subunit	NA|301aa|up_6|CP025703.1_4421300_4422203_-	TIGR01582, Formate_dehydrogenase_iron-sulfur_subunit, formate dehydrogenase, beta subunit, Fe-S containing	NA|85aa|up_5|CP025703.1_4425269_4425524_+	NA	NA|278aa|up_4|CP025703.1_4425459_4426293_+	PRK00724, PRK00724, formate dehydrogenase accessory sulfurtransferase FdhD	NA|221aa|up_3|CP025703.1_4426342_4427005_+	pfam12889, DUF3829, Protein of unknown function (DUF3829)	NA|465aa|up_2|CP025703.1_4427425_4428820_+	pfam16966, Porin_8, Porin-like glycoporin RafY	NA|105aa|up_1|CP025703.1_4428860_4429175_-	TIGR02625, L-rhamnose_mutarotase, L-rhamnose mutarotase	NA|275aa|up_0|CP025703.1_4429184_4430009_-	PRK03634, PRK03634, rhamnulose-1-phosphate aldolase; Provisional	NA|420aa|down_0|CP025703.1_4430183_4431443_-	PRK01076, PRK01076, L-rhamnose isomerase; Provisional	NA|490aa|down_1|CP025703.1_4431439_4432909_-	PRK10640, rhaB, rhamnulokinase; Provisional	NA|50aa|down_2|CP025703.1_4432987_4433137_+	NA	NA|279aa|down_3|CP025703.1_4433196_4434033_+	PRK13503, PRK13503, HTH-type transcriptional activator RhaS	NA|313aa|down_4|CP025703.1_4434016_4434955_+	PRK13500, PRK13500, HTH-type transcriptional activator RhaR	NA|345aa|down_5|CP025703.1_4434951_4435986_-	pfam06379, RhaT, L-rhamnose-proton symport protein (RhaT)	NA|56aa|down_6|CP025703.1_4435950_4436118_+	NA	NA|207aa|down_7|CP025703.1_4436271_4436892_+	PRK10925, PRK10925, superoxide dismutase [Mn]	NA|43aa|down_8|CP025703.1_4436920_4437049_-	NA	NA|328aa|down_9|CP025703.1_4437151_4438135_+	TIGR00793, 2-keto-3-deoxygluconate_permease, 2-keto-3-deoxygluconate transporter
GCA_002900305.1_ASM290030v1	CP025703	Escherichia coli BH100N substr. MG2017, complete genome	6	4850590-4850729	5	CRISPRCasFinder	no		DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	Orphan	TGTGTAGGTCGGATAAGGCGTTCACGCCGCATCCGACAATAACA	44	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas14j,DinG,cas3,csa3,RT,PD-DExK,WYL	NA|45aa|up_7|CP025703.1_4842413_4842548_-,NA	NA|315aa|up_9|CP025703.1_4840150_4841095_-	PRK12354, PRK12354, carbamate kinase; Reviewed	NA|407aa|up_8|CP025703.1_4841105_4842326_-	PRK01388, PRK01388, arginine deiminase; Provisional	NA|45aa|up_7|CP025703.1_4842413_4842548_-	NA	NA|151aa|up_6|CP025703.1_4843003_4843456_+	COG2731, EbgC, Beta-galactosidase, beta subunit [Carbohydrate transport and metabolism]	NA|335aa|up_5|CP025703.1_4843500_4844505_-	PRK03515, PRK03515, ornithine carbamoyltransferase subunit I; Provisional	NA|139aa|up_4|CP025703.1_4844666_4845083_+	PRK11191, PRK11191, ribonuclease E inhibitor RraB	NA|168aa|up_3|CP025703.1_4845259_4845763_-	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|396aa|up_2|CP025703.1_4845955_4847143_+	COG4269, COG4269, Predicted membrane protein [Function unknown]	NA|952aa|up_1|CP025703.1_4847189_4850045_-	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|148aa|up_0|CP025703.1_4850044_4850488_-	PRK05728, PRK05728, DNA polymerase III subunit chi; Validated	NA|504aa|down_0|CP025703.1_4850745_4852257_-	PRK00913, PRK00913, multifunctional aminopeptidase A; Provisional	NA|367aa|down_1|CP025703.1_4852523_4853624_+	PRK15120, PRK15120, lipopolysaccharide ABC transporter permease LptF; Provisional	NA|361aa|down_2|CP025703.1_4853623_4854706_+	PRK15071, PRK15071, lipopolysaccharide ABC transporter permease; Provisional	NA|501aa|down_3|CP025703.1_4854866_4856369_-	pfam05872, DUF853, Bacterial protein of unknown function (DUF853)	NA|333aa|down_4|CP025703.1_4856446_4857445_-	cd01575, PBP1_GntR, ligand-binding domain of DNA transcription repressor GntR specific for gluconate, a member of the LacI-GalR family of bacterial transcription regulators	NA|440aa|down_5|CP025703.1_4857511_4858831_-	TIGR00791, Gluconate_permease, gluconate transporter	NA|255aa|down_6|CP025703.1_4858895_4859660_-	PRK08085, PRK08085, gluconate 5-dehydrogenase; Provisional	NA|344aa|down_7|CP025703.1_4859683_4860715_-	PRK09880, PRK09880, L-idonate 5-dehydrogenase; Provisional	NA|188aa|down_8|CP025703.1_4860931_4861495_+	PRK09825, idnK, gluconokinase	NA|340aa|down_9|CP025703.1_4861498_4862518_-	cd05283, CAD1, Cinnamyl alcohol dehydrogenases (CAD)
