assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_013340805.1_ASM1334080v1	NZ_AP023197	Escherichia coli strain TUM18780	1	681370-681509	1	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	Orphan	ACATGTAGGGCGGATAAGGCGTTCACGCCGCATCCGCCAG	40	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	NA|101aa|up_6|NZ_AP023197.1_673847_674150_-,NA|357aa|down_1|NZ_AP023197.1_683887_684958_-	NA|496aa|up_9|NZ_AP023197.1_670272_671760_+	pfam04295, GD_AH_C, D-galactarate dehydratase / Altronate hydrolase, C-terminus	NA|184aa|up_8|NZ_AP023197.1_671842_672394_+	pfam10688, Imp-YgjV, Bacterial inner membrane protein	NA|415aa|up_7|NZ_AP023197.1_672398_673643_-	PRK13628, PRK13628, serine/threonine transporter SstT; Provisional	NA|101aa|up_6|NZ_AP023197.1_673847_674150_-	NA	NA|322aa|up_5|NZ_AP023197.1_674258_675224_-	TIGR03718, R_switched_Alx, integral membrane protein, TerC family	NA|329aa|up_4|NZ_AP023197.1_675506_676493_-	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|231aa|up_3|NZ_AP023197.1_676571_677264_-	COG2949, SanA, Uncharacterized membrane protein [Function unknown]	NA|168aa|up_2|NZ_AP023197.1_677340_677844_-	COG1451, COG1451, Predicted metal-dependent hydrolase [General function prediction only]	NA|379aa|up_1|NZ_AP023197.1_677928_679065_+	PRK15001, PRK15001, 23S rRNA (guanine(1835)-N(2))-methyltransferase RlmG	NA|673aa|up_0|NZ_AP023197.1_679175_681194_-	cd02930, DCR_FMN, 2,4-dienoyl-CoA reductase (DCR) FMN-binding domain	NA|784aa|down_0|NZ_AP023197.1_681519_683871_-	PRK10137, PRK10137, alpha-glucosidase; Provisional	NA|357aa|down_1|NZ_AP023197.1_683887_684958_-	NA	NA|478aa|down_2|NZ_AP023197.1_685091_686525_-	PRK15238, PRK15238, inner membrane transporter YjeM; Provisional	NA|150aa|down_3|NZ_AP023197.1_686587_687037_-	PRK10202, ebgC, beta-galactosidase subunit beta	NA|1031aa|down_4|NZ_AP023197.1_687033_690126_-	PRK10340, ebgA, cryptic beta-D-galactosidase subunit alpha; Reviewed	NA|328aa|down_5|NZ_AP023197.1_690309_691293_-	PRK10339, PRK10339, DNA-binding transcriptional repressor EbgR; Provisional	NA|111aa|down_6|NZ_AP023197.1_691511_691844_+	PRK10089, PRK10089, chaperone CsaA	NA|460aa|down_7|NZ_AP023197.1_691885_693265_-	PRK11522, PRK11522, putrescine--2-oxoglutarate aminotransferase; Provisional	NA|507aa|down_8|NZ_AP023197.1_693682_695203_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|208aa|down_9|NZ_AP023197.1_695250_695874_-	COG1695, COG1695, Predicted transcriptional regulators [Transcription]
GCF_013340805.1_ASM1334080v1	NZ_AP023197	Escherichia coli strain TUM18780	2	1047491-1047946	2,1	CRISPRCasFinder,CRT	no	cas3	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	Unclear	GAGTTCCCCGCGCCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG	29,29	0	0	NA	NA	I-E:I-E	7,7	7	Unclear	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	NA,NA	NA|83aa|up_9|NZ_AP023197.1_1037980_1038229_+	PRK09798, PRK09798, MazF-MazE toxin-antitoxin system antitoxin MazE	NA|112aa|up_8|NZ_AP023197.1_1038228_1038564_+	PRK09907, PRK09907, endoribonuclease MazF	NA|264aa|up_7|NZ_AP023197.1_1038634_1039426_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_6|NZ_AP023197.1_1039653_1041291_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_5|NZ_AP023197.1_1041378_1042677_+	PRK00077, eno, enolase; Provisional	NA|301aa|up_4|NZ_AP023197.1_1042736_1043639_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|383aa|up_3|NZ_AP023197.1_1043635_1044784_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|298aa|up_2|NZ_AP023197.1_1044798_1045692_-	COG1512, COG1512, Beta-propeller domains of methanol dehydrogenase type [General function prediction only]	NA|201aa|up_1|NZ_AP023197.1_1045705_1046308_-	COG1704, LemA, Uncharacterized conserved protein [Function unknown]	NA|224aa|up_0|NZ_AP023197.1_1046480_1047152_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|493aa|down_0|NZ_AP023197.1_1048584_1050063_-	cd07779, FGGY_ygcE_like, uncharacterized ygcE-like proteins	NA|426aa|down_1|NZ_AP023197.1_1050089_1051367_-	cd06174, MFS, Major Facilitator Superfamily	NA|262aa|down_2|NZ_AP023197.1_1051685_1052471_+	cd05347, Ga5DH-like_SDR_c, gluconate 5-dehydrogenase (Ga5DH)-like, classical (c) SDRs	NA|485aa|down_3|NZ_AP023197.1_1052540_1053995_+	COG0277, GlcD, FAD/FMN-containing dehydrogenases [Energy production and conversion]	NA|470aa|down_4|NZ_AP023197.1_1054016_1055426_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|260aa|down_5|NZ_AP023197.1_1055403_1056183_+	COG2086, FixA, Electron transfer flavoprotein, beta subunit [Energy production and conversion]	NA|287aa|down_6|NZ_AP023197.1_1056179_1057040_+	COG2025, FixB, Electron transfer flavoprotein, alpha subunit [Energy production and conversion]	NA|192aa|down_7|NZ_AP023197.1_1057187_1057763_-	COG1954, GlpP, Glycerol-3-phosphate responsive antiterminator (mRNA-binding) [Transcription]	NA|87aa|down_8|NZ_AP023197.1_1057779_1058040_-	COG2440, FixX, Ferredoxin-like protein [Energy production and conversion]	NA|424aa|down_9|NZ_AP023197.1_1058030_1059302_-	PRK10015, PRK10015, oxidoreductase; Provisional
GCF_013340805.1_ASM1334080v1	NZ_AP023197	Escherichia coli strain TUM18780	3	1073493-1074375	1,3,2	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas2	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	Type I-E	GAGTTCCCCGCGCCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG,GAGTTCCCCGCGCCAGCGGGGATAAACCG	29,29,29	0	0	NA	NA	I-E:I-E:I-E	9,14,13	14	TypeI-E	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	NA,NA	NA|600aa|up_9|NZ_AP023197.1_1060060_1061860_+	PRK10953, cysJ, NADPH-dependent assimilatory sulfite reductase flavoprotein subunit	NA|571aa|up_8|NZ_AP023197.1_1061859_1063572_+	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit	NA|245aa|up_7|NZ_AP023197.1_1063645_1064380_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	cas3|889aa|up_6|NZ_AP023197.1_1064737_1067404_+	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	cas8e|503aa|up_5|NZ_AP023197.1_1067818_1069327_+	PRK09693, PRK09693, Cascade antiviral complex protein; Validated	cse2gr11|161aa|up_4|NZ_AP023197.1_1069319_1069802_+	cd09670, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|364aa|up_3|NZ_AP023197.1_1069814_1070906_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|225aa|up_2|NZ_AP023197.1_1070908_1071583_+	TIGR01868, hypothetical_protein, CRISPR-associated protein Cas5/CasD, subtype I-E/ECOLI	cas6e|200aa|up_1|NZ_AP023197.1_1071569_1072169_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas2|95aa|up_0|NZ_AP023197.1_1073102_1073387_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|346aa|down_0|NZ_AP023197.1_1074395_1075433_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|NZ_AP023197.1_1075684_1076593_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|476aa|down_2|NZ_AP023197.1_1076594_1078022_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|NZ_AP023197.1_1078021_1078627_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|108aa|down_4|NZ_AP023197.1_1078676_1079000_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|NZ_AP023197.1_1079193_1079505_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|NZ_AP023197.1_1079523_1080234_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|NZ_AP023197.1_1080233_1080713_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|NZ_AP023197.1_1080709_1081759_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|NZ_AP023197.1_1081739_1082501_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCF_013340805.1_ASM1334080v1	NZ_AP023197	Escherichia coli strain TUM18780	4	1572629-1572755	4	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	Orphan	GCCTGATGCGACGCTGGCGCGTCTTATCAGGCCTACAAA	39	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	NA|357aa|up_5|NZ_AP023197.1_1566649_1567720_-,NA	NA|420aa|up_9|NZ_AP023197.1_1560836_1562096_-	COG3075, GlpB, Anaerobic glycerol-3-phosphate dehydrogenase [Amino acid transport and metabolism]	NA|543aa|up_8|NZ_AP023197.1_1562085_1563714_-	PRK11101, glpA, anaerobic glycerol-3-phosphate dehydrogenase subunit A	NA|453aa|up_7|NZ_AP023197.1_1563986_1565345_+	PRK11273, glpT, glycerol-3-phosphate transporter	NA|359aa|up_6|NZ_AP023197.1_1565349_1566426_+	PRK11143, glpQ, glycerophosphodiester phosphodiesterase; Provisional	NA|357aa|up_5|NZ_AP023197.1_1566649_1567720_-	NA	NA|293aa|up_4|NZ_AP023197.1_1568183_1569062_-	cd05466, PBP2_LTTR_substrate, The substrate binding domain of LysR-type transcriptional regulators (LTTRs), a member of the type 2 periplasmic binding fold protein superfamily	NA|397aa|up_3|NZ_AP023197.1_1569213_1570404_+	cd17489, MFS_YfcJ_like, Escherichia coli YfcJ, YhhS, and similar transporters of the Major Facilitator Superfamily	NA|217aa|up_2|NZ_AP023197.1_1570484_1571135_+	PRK09902, PRK09902, lipopolysaccharide kinase InaA	NA|85aa|up_1|NZ_AP023197.1_1571188_1571443_-	PRK10713, PRK10713, 2Fe-2S ferredoxin-like protein	NA|377aa|up_0|NZ_AP023197.1_1571442_1572573_-	PRK09101, nrdB, ribonucleotide-diphosphate reductase subunit beta; Reviewed	NA|762aa|down_0|NZ_AP023197.1_1572805_1575091_-	PRK09103, PRK09103, ribonucleoside-diphosphate reductase subunit alpha	NA|1245aa|down_1|NZ_AP023197.1_1575786_1579521_+	PRK09752, PRK09752, AIDA-I family autotransporter YfaL	NA|241aa|down_2|NZ_AP023197.1_1579661_1580384_-	PRK05134, PRK05134, bifunctional 2-polyprenyl-6-hydroxyphenol methylase/3-demethylubiquinol 3-O-methyltransferase UbiG	NA|876aa|down_3|NZ_AP023197.1_1580530_1583158_+	PRK05560, PRK05560, DNA gyrase subunit A; Validated	NA|563aa|down_4|NZ_AP023197.1_1583306_1584995_+	COG4685, COG4685, Uncharacterized protein conserved in bacteria [Function unknown]	NA|208aa|down_5|NZ_AP023197.1_1584991_1585615_+	COG3234, COG3234, Uncharacterized protein conserved in bacteria [Function unknown]	NA|1465aa|down_6|NZ_AP023197.1_1585758_1590153_+	COG2373, COG2373, Large extracellular alpha-helical protein [General function prediction only]	NA|550aa|down_7|NZ_AP023197.1_1590153_1591803_+	COG5445, COG5445, Predicted secreted protein [Function unknown]	NA|259aa|down_8|NZ_AP023197.1_1591807_1592584_+	COG4676, COG4676, Uncharacterized protein conserved in bacteria [Function unknown]	NA|950aa|down_9|NZ_AP023197.1_1592858_1595708_+	PRK10841, PRK10841, two-component system sensor histidine kinase RcsC
GCF_013340805.1_ASM1334080v1	NZ_AP023197	Escherichia coli strain TUM18780	5	1978000-1978145	5	CRISPRCasFinder	no	DEDDh	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	Unclear	AGAGATAGCGAACCGTAGGTCAGATAAGGCGCTCGCGCCGCATCCGACA	49	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	NA|22aa|up_2|NZ_AP023197.1_1976085_1976151_+,NA	NA|273aa|up_9|NZ_AP023197.1_1970052_1970871_-	PRK10302, PRK10302, hypothetical protein; Provisional	NA|189aa|up_8|NZ_AP023197.1_1970867_1971434_-	PRK11440, PRK11440, putative hydrolase; Provisional	NA|591aa|up_7|NZ_AP023197.1_1971743_1973516_+	PRK00476, aspS, aspartyl-tRNA synthetase; Validated	NA|151aa|up_6|NZ_AP023197.1_1973633_1974086_+	PRK09438, nudB, dihydroneopterin triphosphate pyrophosphatase; Provisional	NA|247aa|up_5|NZ_AP023197.1_1974114_1974855_+	PRK00110, PRK00110, YebC/PmpR family DNA-binding transcriptional regulator	NA|174aa|up_4|NZ_AP023197.1_1974889_1975411_+	TIGR00228, Crossover_junction_endodeoxyribonuclease_RuvC, crossover junction endodeoxyribonuclease RuvC	NA|201aa|up_3|NZ_AP023197.1_1975412_1976015_-	PRK11470, PRK11470, YebB family permuted papain-like enzyme	NA|22aa|up_2|NZ_AP023197.1_1976085_1976151_+	NA	NA|204aa|up_1|NZ_AP023197.1_1976289_1976901_+	PRK00116, ruvA, Holliday junction branch migration protein RuvA	NA|337aa|up_0|NZ_AP023197.1_1976909_1977920_+	PRK00080, ruvB, Holliday junction branch migration DNA helicase RuvB	NA|262aa|down_0|NZ_AP023197.1_1978163_1978949_-	PRK09543, znuB, zinc ABC transporter permease subunit ZnuB	NA|252aa|down_1|NZ_AP023197.1_1978945_1979701_-	PRK09544, znuC, high-affinity zinc transporter ATPase; Reviewed	NA|311aa|down_2|NZ_AP023197.1_1979779_1980712_+	PRK09545, znuA, zinc ABC transporter substrate-binding protein ZnuA	NA|441aa|down_3|NZ_AP023197.1_1980727_1982050_+	PRK11649, PRK11649, putative peptidase; Provisional	NA|324aa|down_4|NZ_AP023197.1_1982169_1983141_+	PRK08943, PRK08943, lipid A biosynthesis (KDO)2-(lauroyl)-lipid IVA acyltransferase; Validated	NA|481aa|down_5|NZ_AP023197.1_1983271_1984714_-	PRK05826, PRK05826, pyruvate kinase; Provisional	NA|290aa|down_6|NZ_AP023197.1_1984841_1985711_-	PRK11302, PRK11302, DNA-binding transcriptional regulator HexR; Provisional	NA|492aa|down_7|NZ_AP023197.1_1986048_1987524_+	PRK05722, PRK05722, glucose-6-phosphate 1-dehydrogenase; Validated	NA|604aa|down_8|NZ_AP023197.1_1987758_1989570_+	PRK09054, PRK09054, phosphogluconate dehydratase; Validated	NA|214aa|down_9|NZ_AP023197.1_1989606_1990248_+	PRK05718, PRK05718, keto-hydroxyglutarate-aldolase/keto-deoxy-phosphogluconate aldolase; Provisional
GCF_013340805.1_ASM1334080v1	NZ_AP023197	Escherichia coli strain TUM18780	6	2208984-2209107	6	CRISPRCasFinder	no	DEDDh	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	Unclear	CGACCCCCACCATGTCAAGGTGGTGCTCTAACCAACTGAGCTA	43	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	NA,NA|30aa|down_7|NZ_AP023197.1_2218003_2218093_+	NA|471aa|up_9|NZ_AP023197.1_2198437_2199850_-	PRK09206, PRK09206, pyruvate kinase PykF	NA|70aa|up_8|NZ_AP023197.1_2200406_2200616_+	PRK10292, PRK10292, fumarate hydratase FumD	NA|209aa|up_7|NZ_AP023197.1_2201071_2201698_+	PRK09898, PRK09898, ferredoxin-like protein	NA|701aa|up_6|NZ_AP023197.1_2201718_2203821_+	PRK09849, PRK09849, putative oxidoreductase; Provisional	NA|213aa|up_5|NZ_AP023197.1_2203833_2204472_+	PRK09947, PRK09947, YdhW family putative oxidoreductase system protein	NA|223aa|up_4|NZ_AP023197.1_2204535_2205204_+	TIGR03149, cyt_nit_nrfC, cytochrome c nitrite reductase, Fe-S protein	NA|262aa|up_3|NZ_AP023197.1_2205200_2205986_+	PRK15006, PRK15006, thiosulfate reductase cytochrome B subunit; Provisional	NA|271aa|up_2|NZ_AP023197.1_2205989_2206802_+	PRK09946, PRK09946, hypothetical protein; Provisional	NA|535aa|up_1|NZ_AP023197.1_2206813_2208418_-	PRK09897, PRK09897, FAD-NAD(P)-binding protein	NA|102aa|up_0|NZ_AP023197.1_2208543_2208849_-	PRK11118, PRK11118, putative monooxygenase; Provisional	NA|419aa|down_0|NZ_AP023197.1_2209421_2210678_+	PRK09945, PRK09945, hypothetical protein; Provisional	NA|458aa|down_1|NZ_AP023197.1_2210718_2212092_-	PRK01766, PRK01766, multidrug efflux protein; Reviewed	NA|214aa|down_2|NZ_AP023197.1_2212306_2212948_+	PRK13020, PRK13020, riboflavin synthase subunit alpha; Provisional	NA|383aa|down_3|NZ_AP023197.1_2212987_2214136_-	PRK11705, PRK11705, cyclopropane fatty acyl phospholipid synthase	NA|404aa|down_4|NZ_AP023197.1_2214426_2215638_-	PRK11043, PRK11043, Bcr/CflA family multidrug efflux MFS transporter	NA|311aa|down_5|NZ_AP023197.1_2215750_2216683_+	PRK11074, PRK11074, putative DNA-binding transcriptional regulator; Provisional	NA|342aa|down_6|NZ_AP023197.1_2216679_2217705_-	PRK10703, PRK10703, HTH-type transcriptional repressor PurR	NA|30aa|down_7|NZ_AP023197.1_2218003_2218093_+	NA	NA|390aa|down_8|NZ_AP023197.1_2218258_2219428_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|194aa|down_9|NZ_AP023197.1_2219573_2220155_-	PRK10543, PRK10543, superoxide dismutase [Fe]
GCF_013340805.1_ASM1334080v1	NZ_AP023197	Escherichia coli strain TUM18780	7	2862980-2863071	7	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	Orphan	CCACCTTTTTTACCTGCTTCAGATGC	26	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	NA|70aa|up_9|NZ_AP023197.1_2852230_2852440_-,NA	NA|70aa|up_9|NZ_AP023197.1_2852230_2852440_-	NA	NA|1321aa|up_8|NZ_AP023197.1_2852494_2856457_+	PRK11809, putA, trifunctional transcriptional regulator/proline dehydrogenase/pyrroline-5-carboxylate dehydrogenase; Reviewed	NA|213aa|up_7|NZ_AP023197.1_2856496_2857135_-	PRK15008, PRK15008, HTH-type transcriptional regulator RutR; Provisional	NA|364aa|up_6|NZ_AP023197.1_2857422_2858514_+	TIGR03612, RutA, pyrimidine utilization protein A	NA|231aa|up_5|NZ_AP023197.1_2858513_2859206_+	TIGR03614, RutB, pyrimidine utilization protein B	NA|129aa|up_4|NZ_AP023197.1_2859217_2859604_+	TIGR03610, RutC, pyrimidine utilization protein C	NA|267aa|up_3|NZ_AP023197.1_2859611_2860412_+	TIGR03611, RutD, pyrimidine utilization protein D	NA|197aa|up_2|NZ_AP023197.1_2860421_2861012_+	PRK05365, PRK05365, malonic semialdehyde reductase; Provisional	NA|165aa|up_1|NZ_AP023197.1_2861022_2861517_+	TIGR03615, flavoprotein_oxidoreductase, pyrimidine utilization flavin reductase protein F	NA|443aa|up_0|NZ_AP023197.1_2861537_2862866_+	TIGR03616, Putative_pyrimidine_permease_RutG, pyrimidine utilization transport protein G	NA|199aa|down_0|NZ_AP023197.1_2863494_2864091_+	PRK03767, PRK03767, NAD(P)H:quinone oxidoreductase; Provisional	NA|76aa|down_1|NZ_AP023197.1_2864111_2864339_+	PRK10174, PRK10174, hypothetical protein; Provisional	NA|414aa|down_2|NZ_AP023197.1_2864376_2865618_-	PRK10173, PRK10173, glucose-1-phosphatase/inositol phosphatase; Provisional	NA|419aa|down_3|NZ_AP023197.1_2865899_2867156_-	PRK09784, PRK09784, YccE family protein	NA|307aa|down_4|NZ_AP023197.1_2867416_2868337_+	PRK10266, PRK10266, curved DNA-binding protein	NA|102aa|down_5|NZ_AP023197.1_2868336_2868642_+	PRK10265, PRK10265, chaperone modulator CbpM	NA|200aa|down_6|NZ_AP023197.1_2868793_2869393_-	PRK04976, torD, chaperone protein TorD; Validated	NA|849aa|down_7|NZ_AP023197.1_2869389_2871936_-	PRK15102, PRK15102, trimethylamine-N-oxide reductase TorA	NA|391aa|down_8|NZ_AP023197.1_2871935_2873108_-	PRK15032, PRK15032, pentaheme c-type cytochrome TorC	NA|231aa|down_9|NZ_AP023197.1_2873237_2873930_+	PRK10766, PRK10766, two-component system response regulator TorR
GCF_013340805.1_ASM1334080v1	NZ_AP023197	Escherichia coli strain TUM18780	8	3070419-3070567	8,2	CRISPRCasFinder,PILER-CR	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	Orphan	TTTCTAAGCTGCCTGTACGGCAGTGAAC,TTTCTAAGCTGCCTGTACGGCAGTGAAC	28,28	0	0	NA	NA	I-F:I-F	2,2	2	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	NA|129aa|up_9|NZ_AP023197.1_3056394_3056781_+,NA|64aa|up_8|NZ_AP023197.1_3056789_3056981_+,NA|475aa|up_6|NZ_AP023197.1_3059994_3061419_+,NA|608aa|up_3|NZ_AP023197.1_3065014_3066838_-,NA|95aa|down_2|NZ_AP023197.1_3074192_3074477_-,NA|82aa|down_8|NZ_AP023197.1_3077901_3078147_-	NA|129aa|up_9|NZ_AP023197.1_3056394_3056781_+	NA	NA|64aa|up_8|NZ_AP023197.1_3056789_3056981_+	NA	NA|980aa|up_7|NZ_AP023197.1_3057058_3059998_+	cd17933, DEXSc_RecD-like, DEXS-box helicase domain of RecD and similar proteins	NA|475aa|up_6|NZ_AP023197.1_3059994_3061419_+	NA	NA|323aa|up_5|NZ_AP023197.1_3061605_3062574_+	pfam13737, DDE_Tnp_1_5, Transposase DDE domain	NA|188aa|up_4|NZ_AP023197.1_3063240_3063804_-	pfam11726, Inovirus_Gp2, Inovirus Gp2	NA|608aa|up_3|NZ_AP023197.1_3065014_3066838_-	NA	NA|83aa|up_2|NZ_AP023197.1_3066938_3067187_+	COG3311, AlpA, Predicted transcriptional regulator [Transcription]	NA|522aa|up_1|NZ_AP023197.1_3067202_3068768_+	pfam13148, DUF3987, Protein of unknown function (DUF3987)	NA|403aa|up_0|NZ_AP023197.1_3068991_3070200_-	cd00801, INT_P4_C, Bacteriophage P4 integrase, C-terminal catalytic domain	NA|759aa|down_0|NZ_AP023197.1_3070778_3073055_-	PRK11034, clpA, ATP-dependent Clp protease ATP-binding subunit; Provisional	NA|107aa|down_1|NZ_AP023197.1_3073085_3073406_-	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|95aa|down_2|NZ_AP023197.1_3074192_3074477_-	NA	NA|181aa|down_3|NZ_AP023197.1_3074734_3075277_-	COG4220, COG4220, Phage DNA packaging protein, Nu1 subunit of terminase [DNA replication, recombination, and repair]	NA|128aa|down_4|NZ_AP023197.1_3075478_3075862_-	COG3311, AlpA, Predicted transcriptional regulator [Transcription]	NA|114aa|down_5|NZ_AP023197.1_3075873_3076215_-	pfam02924, HDPD, Bacteriophage lambda head decoration protein D	NA|347aa|down_6|NZ_AP023197.1_3076224_3077265_-	pfam03864, Phage_cap_E, Phage major capsid protein E	NA|141aa|down_7|NZ_AP023197.1_3077482_3077905_-	cd04496, SSB_OBF, SSB_OBF: A subfamily of OB folds similar to the OB fold of ssDNA-binding protein (SSB)	NA|82aa|down_8|NZ_AP023197.1_3077901_3078147_-	NA	NA|606aa|down_9|NZ_AP023197.1_3078433_3080251_-	COG3378, COG3378, Phage associated DNA primase [General function prediction only]
GCF_013340805.1_ASM1334080v1	NZ_AP023197	Escherichia coli strain TUM18780	9	3839121-3839219	9	CRISPRCasFinder	no		cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	Orphan	AGCGTCGCATCAGGCATCCGCGCACAATT	29	0	0	NA	NA	NA	1	1	Orphan	cas3,csa3,PD-DExK,cas8e,cse2gr11,cas7,cas5,cas6e,cas2,DEDDh,DinG,c2c9_V-U4,RT,WYL	NA,NA	NA|549aa|up_9|NZ_AP023197.1_3829424_3831071_-	PRK07193, fliF, flagellar MS-ring protein; Reviewed	NA|114aa|up_8|NZ_AP023197.1_3831075_3831417_-	pfam02049, FliE, Flagellar hook-basal body complex protein FliE	NA|326aa|up_7|NZ_AP023197.1_3831431_3832409_-	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|284aa|up_6|NZ_AP023197.1_3832795_3833647_+	pfam01052, FliMN_C, Type III flagellar switch regulator (C-ring) FliN C-term	NA|124aa|up_5|NZ_AP023197.1_3833639_3834011_+	TIGR02480, Flagellar_motor_switch_protein_FliN, flagellar motor switch protein FliN	NA|251aa|up_4|NZ_AP023197.1_3834007_3834760_+	PRK05699, fliP, flagellar biosynthesis protein FliP; Reviewed	NA|91aa|up_3|NZ_AP023197.1_3834762_3835035_+	COG1987, FliQ, Flagellar biosynthesis pathway, component FliQ [Cell motility and secretion / Intracellular trafficking and secretion]	NA|261aa|up_2|NZ_AP023197.1_3835036_3835819_+	COG1684, FliR, Flagellar biosynthesis pathway, component FliR [Cell motility and secretion / Intracellular trafficking and secretion]	NA|380aa|up_1|NZ_AP023197.1_3835808_3836948_+	PRK05702, flhB, flagellar type III secretion system protein FlhB	NA|698aa|up_0|NZ_AP023197.1_3836931_3839025_+	COG1298, FlhA, Flagellar biosynthesis pathway, component FlhA [Cell motility and secretion / Intracellular trafficking and secretion]	NA|250aa|down_0|NZ_AP023197.1_3839890_3840640_-	COG0791, Spr, Cell wall-associated hydrolases (invasion-associated proteins) [Cell envelope biogenesis, outer membrane]	NA|87aa|down_1|NZ_AP023197.1_3840849_3841110_+	COG3077, RelB, DNA-damage-inducible protein J [DNA replication, recombination, and repair]	NA|93aa|down_2|NZ_AP023197.1_3841112_3841391_+	COG3041, COG3041, Uncharacterized protein conserved in bacteria [Function unknown]	NA|247aa|down_3|NZ_AP023197.1_3841546_3842287_+	COG3034, COG3034, Uncharacterized protein conserved in bacteria [Function unknown]	NA|256aa|down_4|NZ_AP023197.1_3842257_3843025_-	pfam13230, GATase_4, Glutamine amidotransferases class-II	NA|193aa|down_5|NZ_AP023197.1_3843230_3843809_-	PRK00414, gmhA, D-sedoheptulose 7-phosphate isomerase	NA|815aa|down_6|NZ_AP023197.1_3844048_3846493_+	PRK09463, fadE, acyl-CoA dehydrogenase; Reviewed	NA|158aa|down_7|NZ_AP023197.1_3846535_3847009_-	PRK09993, PRK09993, C-lysozyme inhibitor; Provisional	NA|257aa|down_8|NZ_AP023197.1_3847162_3847933_+	PRK10438, PRK10438, C-N hydrolase family amidase; Provisional	NA|337aa|down_9|NZ_AP023197.1_3848662_3849673_-	COG0790, COG0790, FOG: TPR repeat, SEL1 subfamily [General function prediction only]
