assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000784925.1_ASM78492v1	NZ_CP009859	Escherichia coli strain ECONIH1 chromosome, complete genome	1	1029641-1029788	1	CRISPRCasFinder	no		DEDDh,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,WYL,PD-DExK,c2c9_V-U4	Orphan	GTTCACTGCCGTACAGGCAGCTTAGAAA	28	0	0	NA	NA	I-F	2	2	Orphan	DEDDh,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,WYL,PD-DExK,c2c9_V-U4	NA,NA|606aa|down_1|NZ_CP009859.1_1031395_1033213_-,NA|479aa|down_7|NZ_CP009859.1_1043696_1045133_+	NA|551aa|up_9|NZ_CP009859.1_1016085_1017738_-	PRK05290, PRK05290, hybrid cluster protein; Provisional	NA|300aa|up_8|NZ_CP009859.1_1017880_1018780_-	COG2431, COG2431, Predicted membrane protein [Function unknown]	NA|232aa|up_7|NZ_CP009859.1_1019237_1019933_-	PRK05420, PRK05420, aquaporin Z; Provisional	NA|553aa|up_6|NZ_CP009859.1_1020358_1022017_+	COG3593, COG3593, Predicted ATP-dependent endonuclease of the OLD family [DNA replication, recombination, and repair]	NA|319aa|up_5|NZ_CP009859.1_1022013_1022970_-	COG2990, VirK, Uncharacterized protein conserved in bacteria [Function unknown]	NA|372aa|up_4|NZ_CP009859.1_1023120_1024236_+	PRK11578, PRK11578, macrolide transporter subunit MacA; Provisional	NA|649aa|up_3|NZ_CP009859.1_1024232_1026179_+	PRK10535, PRK10535, macrolide ABC transporter ATP-binding protein/permease MacB	NA|75aa|up_2|NZ_CP009859.1_1026251_1026476_-	PRK09937, PRK09937, cold shock-like protein CspD	NA|107aa|up_1|NZ_CP009859.1_1026798_1027119_+	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|759aa|up_0|NZ_CP009859.1_1027149_1029426_+	PRK11034, clpA, ATP-dependent Clp protease ATP-binding subunit; Provisional	NA|401aa|down_0|NZ_CP009859.1_1030006_1031209_+	cd00801, INT_P4_C, Bacteriophage P4 integrase, C-terminal catalytic domain	NA|606aa|down_1|NZ_CP009859.1_1031395_1033213_-	NA	NA|99aa|down_2|NZ_CP009859.1_1034323_1034620_+	COG3311, AlpA, Predicted transcriptional regulator [Transcription]	NA|66aa|down_3|NZ_CP009859.1_1034846_1035044_+	pfam13148, DUF3987, Protein of unknown function (DUF3987)	NA|478aa|down_4|NZ_CP009859.1_1035261_1036695_+	pfam13148, DUF3987, Protein of unknown function (DUF3987)	NA|188aa|down_5|NZ_CP009859.1_1037515_1038079_+	pfam11726, Inovirus_Gp2, Inovirus Gp2	NA|1653aa|down_6|NZ_CP009859.1_1038741_1043700_+	cd18808, SF1_C_Upf1, C-terminal helicase domain of Upf1-like family helicases	NA|479aa|down_7|NZ_CP009859.1_1043696_1045133_+	NA	NA|69aa|down_8|NZ_CP009859.1_1045237_1045444_+	PRK14994, PRK14994, SAM-dependent 16S ribosomal RNA C1402 ribose 2'-O-methyltransferase; Provisional	NA|630aa|down_9|NZ_CP009859.1_1045612_1047502_-	cd06592, GH31_NET37, glucosidase NET37
GCF_000784925.1_ASM78492v1	NZ_CP009859	Escherichia coli strain ECONIH1 chromosome, complete genome	2	3180214-3181097	1,2,1	CRT,CRISPRCasFinder,PILER-CR	no	cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,cas3	DEDDh,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,WYL,PD-DExK,c2c9_V-U4	Type I-E	CGGTTTATCCCCGCTGGCGCGGGGAACTC,CGGTTTATCCCCGCTGGCGCGGGGAACTC,CGGTTTATCCCCGCTGGCGCGGGGAACTC	29,29,29	0	0	NA	NA	I-E:I-E:I-E	14,13,12	14	TypeI-E	DEDDh,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,WYL,PD-DExK,c2c9_V-U4	NA,NA	NA|254aa|up_9|NZ_CP009859.1_3172087_3172849_-	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional	NA|350aa|up_8|NZ_CP009859.1_3172829_3173879_-	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|160aa|up_7|NZ_CP009859.1_3173875_3174355_-	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|237aa|up_6|NZ_CP009859.1_3174354_3175065_-	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|104aa|up_5|NZ_CP009859.1_3175083_3175395_-	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|108aa|up_4|NZ_CP009859.1_3175588_3175912_-	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|202aa|up_3|NZ_CP009859.1_3175961_3176567_-	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|476aa|up_2|NZ_CP009859.1_3176566_3177994_-	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|303aa|up_1|NZ_CP009859.1_3177995_3178904_-	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|346aa|up_0|NZ_CP009859.1_3179155_3180193_+	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	cas2|95aa|down_0|NZ_CP009859.1_3181202_3181487_-	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	cas1|306aa|down_1|NZ_CP009859.1_3181488_3182406_-	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas6e|200aa|down_2|NZ_CP009859.1_3182421_3183021_-	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas5|225aa|down_3|NZ_CP009859.1_3183007_3183682_-	TIGR01868, hypothetical_protein, CRISPR-associated protein Cas5/CasD, subtype I-E/ECOLI	cas7|364aa|down_4|NZ_CP009859.1_3183684_3184776_-	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cse2gr11|161aa|down_5|NZ_CP009859.1_3184788_3185271_-	cd09670, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas8e|503aa|down_6|NZ_CP009859.1_3185263_3186772_-	PRK09693, PRK09693, Cascade antiviral complex protein; Validated	cas3|889aa|down_7|NZ_CP009859.1_3187186_3189853_-	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	NA|245aa|down_8|NZ_CP009859.1_3190211_3190946_-	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|571aa|down_9|NZ_CP009859.1_3191019_3192732_-	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit
GCF_000784925.1_ASM78492v1	NZ_CP009859	Escherichia coli strain ECONIH1 chromosome, complete genome	3	3206644-3207772	3,2,2	CRISPRCasFinder,CRT,PILER-CR	no	cas3	DEDDh,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,WYL,PD-DExK,c2c9_V-U4	Unclear	CGGTTTATCCCCGCTGGCGCGGGGAACAC,CGGTTTATCCCCGCTGGCGCGGGGAACAC,GGTTTATCCCCGCTGGCGCGGGGAACAC	29,29,28	2	2	3207040-3207071|3207040-3207072	NZ_CP009859.1_3227604-3227573|NZ_CP009859.1_3227604-3227572	I-E:I-E:I-E	18,18,18	18	Unclear	DEDDh,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,WYL,PD-DExK,c2c9_V-U4	NA,NA	NA|424aa|up_9|NZ_CP009859.1_3195289_3196561_+	PRK10015, PRK10015, oxidoreductase; Provisional	NA|87aa|up_8|NZ_CP009859.1_3196551_3196812_+	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|192aa|up_7|NZ_CP009859.1_3196828_3197404_+	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|287aa|up_6|NZ_CP009859.1_3197550_3198411_-	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|260aa|up_5|NZ_CP009859.1_3198407_3199187_-	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|470aa|up_4|NZ_CP009859.1_3199164_3200574_-	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|485aa|up_3|NZ_CP009859.1_3200595_3202050_-	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|262aa|up_2|NZ_CP009859.1_3202119_3202905_-	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|426aa|up_1|NZ_CP009859.1_3203223_3204501_+	cd06174, MFS, Major Facilitator Superfamily	NA|493aa|up_0|NZ_CP009859.1_3204527_3206006_+	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|224aa|down_0|NZ_CP009859.1_3208111_3208783_-	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|291aa|down_1|NZ_CP009859.1_3209076_3209949_+	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|433aa|down_2|NZ_CP009859.1_3210008_3211307_-	PRK00077, eno, enolase; Provisional	NA|546aa|down_3|NZ_CP009859.1_3211393_3213031_-	PRK05380, pyrG, CTP synthetase; Validated	NA|264aa|down_4|NZ_CP009859.1_3213258_3214050_-	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|112aa|down_5|NZ_CP009859.1_3214121_3214457_-	PRK09907, PRK09907, endoribonuclease MazF	NA|83aa|down_6|NZ_CP009859.1_3214456_3214705_-	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|745aa|down_7|NZ_CP009859.1_3214782_3217017_-	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|434aa|down_8|NZ_CP009859.1_3217064_3218366_-	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|919aa|down_9|NZ_CP009859.1_3218422_3221179_+	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional
GCF_000784925.1_ASM78492v1	NZ_CP009859	Escherichia coli strain ECONIH1 chromosome, complete genome	4	5276183-5276347	4	CRISPRCasFinder	no		DEDDh,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,WYL,PD-DExK,c2c9_V-U4	Orphan	CTAACGTGCAGGTTTTGTAGGTCGGATAAGGCGTTCACGCCGCATCCGACACGG	54	0	0	NA	NA	NA	1	1	Orphan	DEDDh,cas3,DinG,csa3,cas2,cas1,cas6e,cas5,cas7,cse2gr11,cas8e,RT,WYL,PD-DExK,c2c9_V-U4	NA,NA	NA|764aa|up_9|NZ_CP009859.1_5266810_5269102_-	PRK03776, PRK03776, phosphatidylglycerol--membrane-oligosaccharide glycerophosphotransferase	NA|165aa|up_8|NZ_CP009859.1_5269355_5269850_-	PRK11667, PRK11667, hypothetical protein; Provisional	NA|246aa|up_7|NZ_CP009859.1_5269898_5270636_-	PRK07952, PRK07952, DNA replication protein DnaC; Validated	NA|180aa|up_6|NZ_CP009859.1_5270638_5271178_-	PRK02854, PRK02854, primosomal protein DnaT	NA|158aa|up_5|NZ_CP009859.1_5271284_5271758_-	PRK09917, PRK09917, threonine/serine exporter	NA|257aa|up_4|NZ_CP009859.1_5271748_5272519_-	COG2966, COG2966, Uncharacterized conserved protein [Function unknown]	NA|242aa|up_3|NZ_CP009859.1_5273137_5273863_+	COG2197, CitB, Response regulator containing a CheY-like receiver domain and an HTH DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|226aa|up_2|NZ_CP009859.1_5273820_5274498_+	PRK11475, PRK11475, DNA-binding transcriptional activator BglJ; Provisional	NA|263aa|up_1|NZ_CP009859.1_5274535_5275324_-	PRK10647, PRK10647, ferric iron reductase involved in ferric hydroximate transport; Provisional	NA|79aa|up_0|NZ_CP009859.1_5275464_5275701_+	pfam07256, DUF1435, Protein of unknown function (DUF1435)	NA|344aa|down_0|NZ_CP009859.1_5276440_5277472_-	PRK09489, rsmC, 16S rRNA (guanine(1207)-N(2))-methyltransferase RsmC	NA|138aa|down_1|NZ_CP009859.1_5277574_5277988_+	PRK06856, PRK06856, DNA polymerase III subunit psi; Validated	NA|149aa|down_2|NZ_CP009859.1_5277956_5278403_+	PRK09491, rimI, ribosomal-protein-alanine N-acetyltransferase; Provisional	NA|226aa|down_3|NZ_CP009859.1_5278417_5279095_+	PRK09449, PRK09449, dUMP phosphatase; Provisional	NA|530aa|down_4|NZ_CP009859.1_5279185_5280775_+	PRK00741, prfC, peptide chain release factor 3; Provisional	NA|202aa|down_5|NZ_CP009859.1_5281167_5281773_+	PRK10568, PRK10568, molecular chaperone OsmY	NA|54aa|down_6|NZ_CP009859.1_5281901_5282063_+	COG5487, COG5487, Small integral membrane protein [Function unknown]	NA|358aa|down_7|NZ_CP009859.1_5282183_5283257_+	COG4667, COG4667, Predicted esterase of the alpha-beta hydrolase superfamily [General function prediction only]	NA|261aa|down_8|NZ_CP009859.1_5283253_5284036_+	PRK11449, PRK11449, metal-dependent hydrolase	NA|288aa|down_9|NZ_CP009859.1_5284254_5285118_-	TIGR04041, glycine_radical_enzyme_activase_YjjW_family, glycine radical enzyme activase, YjjW family
