assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_002012265.1_ASM201226v1	NZ_CP019012	Escherichia coli strain Ecol_AZ161 chromosome, complete genome	1	231549-231662	1	PILER-CR	no		cas3,DEDDh,c2c9_V-U4,csa3,DinG	Orphan	TTTTTTTACCTGATTCGGGTAAA	23	0	0	NA	NA	NA	2	2	Orphan	cas3,DEDDh,c2c9_V-U4,csa3,DinG	NA|47aa|up_8|NZ_CP019012.1_222937_223078_-,NA|34aa|up_3|NZ_CP019012.1_224338_224440_-,NA|94aa|down_9|NZ_CP019012.1_236727_237009_+	NA|230aa|up_9|NZ_CP019012.1_222251_222941_-	pfam06323, Phage_antiter_Q, Phage antitermination protein Q	NA|47aa|up_8|NZ_CP019012.1_222937_223078_-	NA	NA|121aa|up_7|NZ_CP019012.1_223074_223437_-	PRK09786, PRK09786, endodeoxyribonuclease RUS; Reviewed	NA|97aa|up_6|NZ_CP019012.1_223433_223724_-	pfam07102, DUF1364, Protein of unknown function (DUF1364)	NA|57aa|up_5|NZ_CP019012.1_223716_223887_-	PRK09689, PRK09689, prophage protein NinE; Provisional	NA|152aa|up_4|NZ_CP019012.1_223886_224342_-	PRK09741, PRK09741, hypothetical protein; Provisional	NA|34aa|up_3|NZ_CP019012.1_224338_224440_-	NA	NA|348aa|up_2|NZ_CP019012.1_224789_225833_+	COG0657, Aes, Esterase/lipase [Lipid metabolism]	NA|1422aa|up_1|NZ_CP019012.1_225869_230135_-	pfam11924, IAT_beta, Inverse autotransporter, beta-domain	NA|234aa|up_0|NZ_CP019012.1_230384_231086_-	pfam06992, Phage_lambda_P, Replication protein P	NA|180aa|down_0|NZ_CP019012.1_232098_232638_-	pfam06254, YdaT_toxin, Putative bacterial toxin ydaT	NA|77aa|down_1|NZ_CP019012.1_232707_232938_-	pfam15943, YdaS_antitoxin, Putative antitoxin of bacterial toxin-antitoxin system, YdaS/YdaT	NA|252aa|down_2|NZ_CP019012.1_232976_233732_+	COG2932, COG2932, Predicted transcriptional regulator [Transcription]	NA|69aa|down_3|NZ_CP019012.1_234327_234534_+	PRK11354, kil, FtsZ inhibitor protein; Reviewed	NA|99aa|down_4|NZ_CP019012.1_234609_234906_+	pfam06064, Gam, Host-nuclease inhibitor protein Gam	NA|262aa|down_5|NZ_CP019012.1_234911_235697_+	TIGR01913, Uncharacterized_protein_UU154, phage recombination protein Bet	NA|227aa|down_6|NZ_CP019012.1_235693_236374_+	pfam09588, YqaJ, YqaJ-like viral recombinase domain	NA|61aa|down_7|NZ_CP019012.1_236370_236553_+	pfam07026, DUF1317, Protein of unknown function (DUF1317)	NA|64aa|down_8|NZ_CP019012.1_236525_236717_+	pfam07131, DUF1382, Protein of unknown function (DUF1382)	NA|94aa|down_9|NZ_CP019012.1_236727_237009_+	NA
GCF_002012265.1_ASM201226v1	NZ_CP019012	Escherichia coli strain Ecol_AZ161 chromosome, complete genome	2	363957-364048	1	CRISPRCasFinder	no		cas3,DEDDh,c2c9_V-U4,csa3,DinG	Orphan	CCACCTTTTTTACCTGCTTCAGATGC	26	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,c2c9_V-U4,csa3,DinG	NA|70aa|up_9|NZ_CP019012.1_353207_353417_-,NA	NA|70aa|up_9|NZ_CP019012.1_353207_353417_-	NA	NA|1321aa|up_8|NZ_CP019012.1_353471_357434_+	PRK11809, putA, trifunctional transcriptional regulator/proline dehydrogenase/pyrroline-5-carboxylate dehydrogenase; Reviewed	NA|213aa|up_7|NZ_CP019012.1_357473_358112_-	PRK15008, PRK15008, HTH-type transcriptional regulator RutR; Provisional	NA|364aa|up_6|NZ_CP019012.1_358399_359491_+	TIGR03612, RutA, pyrimidine utilization protein A	NA|231aa|up_5|NZ_CP019012.1_359490_360183_+	TIGR03614, RutB, pyrimidine utilization protein B	NA|129aa|up_4|NZ_CP019012.1_360194_360581_+	TIGR03610, RutC, pyrimidine utilization protein C	NA|267aa|up_3|NZ_CP019012.1_360588_361389_+	TIGR03611, RutD, pyrimidine utilization protein D	NA|197aa|up_2|NZ_CP019012.1_361398_361989_+	PRK05365, PRK05365, malonic semialdehyde reductase; Provisional	NA|165aa|up_1|NZ_CP019012.1_361999_362494_+	TIGR03615, flavoprotein_oxidoreductase, pyrimidine utilization flavin reductase protein F	NA|443aa|up_0|NZ_CP019012.1_362514_363843_+	TIGR03616, Putative_pyrimidine_permease_RutG, pyrimidine utilization transport protein G	NA|199aa|down_0|NZ_CP019012.1_364471_365068_+	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|76aa|down_1|NZ_CP019012.1_365088_365316_+	PRK10174, PRK10174, hypothetical protein; Provisional	NA|414aa|down_2|NZ_CP019012.1_365353_366595_-	PRK10173, PRK10173, glucose-1-phosphatase/inositol phosphatase; Provisional	NA|307aa|down_3|NZ_CP019012.1_367129_368050_+	PRK10266, PRK10266, curved DNA-binding protein	NA|102aa|down_4|NZ_CP019012.1_368049_368355_+	PRK10265, PRK10265, chaperone modulator CbpM	NA|200aa|down_5|NZ_CP019012.1_368609_369209_-	PRK04976, torD, chaperone protein TorD; Validated	NA|849aa|down_6|NZ_CP019012.1_369205_371752_-	PRK15102, PRK15102, trimethylamine-N-oxide reductase TorA	NA|391aa|down_7|NZ_CP019012.1_371751_372924_-	PRK15032, PRK15032, pentaheme c-type cytochrome TorC	NA|231aa|down_8|NZ_CP019012.1_373053_373746_+	PRK10766, PRK10766, two-component system response regulator TorR	NA|343aa|down_9|NZ_CP019012.1_373718_374747_-	PRK10936, PRK10936, TMAO reductase system periplasmic protein TorT; Provisional
GCF_002012265.1_ASM201226v1	NZ_CP019012	Escherichia coli strain Ecol_AZ161 chromosome, complete genome	3	533938-534020	2	CRISPRCasFinder	no		cas3,DEDDh,c2c9_V-U4,csa3,DinG	Orphan	ATCTGCCTGTACGGCAGTGAACT	23	0	0	NA	NA	I-F	1	1	Orphan	cas3,DEDDh,c2c9_V-U4,csa3,DinG	NA,NA	NA|431aa|up_9|NZ_CP019012.1_518936_520229_-	PRK05431, PRK05431, seryl-tRNA synthetase; Provisional	NA|448aa|up_8|NZ_CP019012.1_520319_521663_-	PRK13342, PRK13342, recombination factor protein RarA; Reviewed	NA|204aa|up_7|NZ_CP019012.1_521673_522285_-	TIGR00547, Outer-membrane_lipoprotein_carrier_protein, periplasmic chaperone LolA	NA|1369aa|up_6|NZ_CP019012.1_522443_526550_-	PRK10263, PRK10263, DNA translocase FtsK; Provisional	NA|165aa|up_5|NZ_CP019012.1_526684_527179_-	PRK11169, PRK11169, leucine-responsive transcriptional regulator Lrp	NA|322aa|up_4|NZ_CP019012.1_527722_528688_+	PRK10262, PRK10262, thioredoxin reductase; Provisional	NA|589aa|up_3|NZ_CP019012.1_528810_530577_+	PRK11174, PRK11174, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|574aa|up_2|NZ_CP019012.1_530577_532299_+	PRK11160, PRK11160, cysteine/glutathione ABC transporter membrane/ATP-binding component; Reviewed	NA|235aa|up_1|NZ_CP019012.1_532340_533045_+	PRK00301, aat, leucyl/phenylalanyl-tRNA--protein transferase; Reviewed	NA|73aa|up_0|NZ_CP019012.1_533329_533548_+	PRK00276, infA, translation initiation factor IF-1; Validated	NA|759aa|down_0|NZ_CP019012.1_534231_536508_-	PRK11034, clpA, ATP-dependent Clp protease ATP-binding subunit; Provisional	NA|107aa|down_1|NZ_CP019012.1_536538_536859_-	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|75aa|down_2|NZ_CP019012.1_537181_537406_+	PRK09937, PRK09937, cold shock-like protein CspD	NA|649aa|down_3|NZ_CP019012.1_537478_539425_-	PRK10535, PRK10535, macrolide ABC transporter ATP-binding protein/permease MacB	NA|372aa|down_4|NZ_CP019012.1_539421_540537_-	PRK11578, PRK11578, macrolide transporter subunit MacA; Provisional	NA|319aa|down_5|NZ_CP019012.1_540687_541644_+	COG2990, VirK, Uncharacterized protein conserved in bacteria [Function unknown]	NA|553aa|down_6|NZ_CP019012.1_541640_543299_-	COG3593, COG3593, Predicted ATP-dependent endonuclease of the OLD family [DNA replication, recombination, and repair]	NA|232aa|down_7|NZ_CP019012.1_543723_544419_+	PRK05420, PRK05420, aquaporin Z; Provisional	NA|300aa|down_8|NZ_CP019012.1_544833_545733_+	COG2431, COG2431, Predicted membrane protein [Function unknown]	NA|551aa|down_9|NZ_CP019012.1_545876_547529_+	PRK05290, PRK05290, hybrid cluster protein; Provisional
GCF_002012265.1_ASM201226v1	NZ_CP019012	Escherichia coli strain Ecol_AZ161 chromosome, complete genome	4	4597861-4597984	3	CRISPRCasFinder	no	DEDDh	cas3,DEDDh,c2c9_V-U4,csa3,DinG	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,c2c9_V-U4,csa3,DinG	NA,NA|30aa|down_7|NZ_CP019012.1_4606880_4606970_+	NA|471aa|up_9|NZ_CP019012.1_4587313_4588726_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|NZ_CP019012.1_4589282_4589492_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|NZ_CP019012.1_4589947_4590574_+	PRK09898, PRK09898, ferredoxin-like protein	NA|701aa|up_6|NZ_CP019012.1_4590594_4592697_+	PRK09849, PRK09849, putative oxidoreductase; Provisional	NA|213aa|up_5|NZ_CP019012.1_4592709_4593348_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|NZ_CP019012.1_4593411_4594080_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|NZ_CP019012.1_4594076_4594862_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|271aa|up_2|NZ_CP019012.1_4594865_4595678_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|535aa|up_1|NZ_CP019012.1_4595689_4597294_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|102aa|up_0|NZ_CP019012.1_4597419_4597725_-	PRK11118, PRK11118, putative monooxygenase; Provisional	NA|419aa|down_0|NZ_CP019012.1_4598298_4599555_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|NZ_CP019012.1_4599595_4600969_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|214aa|down_2|NZ_CP019012.1_4601183_4601825_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|NZ_CP019012.1_4601864_4603013_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|NZ_CP019012.1_4603303_4604515_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|NZ_CP019012.1_4604627_4605560_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|NZ_CP019012.1_4605556_4606582_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|30aa|down_7|NZ_CP019012.1_4606880_4606970_+	NA	NA|390aa|down_8|NZ_CP019012.1_4607135_4608305_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|194aa|down_9|NZ_CP019012.1_4608450_4609032_-	PRK10543, PRK10543, superoxide dismutase [Fe]
