assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001455205.1_ASM145520v1	NZ_CP013341	Nitrosomonas ureae strain Nm10 chromosome, complete genome	1	773885-775124	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no	cas2,cas6,csx1,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7	DEDDh,csa3,cas2,cas6,csx1,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,PD-DExK,cas1,DinG,cas5,cas8c,cas7,cas4,cas3	Type III-C,Type III-B,Type III-D,Type III-A	GTTTGAACTAAAGACCTGATTAAGAAGGGATTAAGAC,GTTTGAACTAAAGACCTGATTAAGAAGGGATTAAGAC,GTTTGAACTAAAGACCTGATTAAGAAGGGATTAAGAC	37,37,37	0	0	NA	NA	NA:NA:NA	17,17,17	17	TypeIII-C,TypeIII-B,TypeIII-D,TypeIII-A	DEDDh,csa3,cas2,cas6,csx1,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,PD-DExK,cas1,DinG,cas5,cas8c,cas7,cas4,cas3	NA|60aa|up_4|NZ_CP013341.1_768491_768671_+,NA|217aa|down_5|NZ_CP013341.1_783725_784376_-	cas6|317aa|up_9|NZ_CP013341.1_762475_763426_+	pfam10040, CRISPR_Cas6, CRISPR-associated endoribonuclease Cas6	csx1|370aa|up_8|NZ_CP013341.1_763455_764565_+	cd09741, Csx1_III-U, CRISPR/Cas system-associated protein Csx1	cas10|899aa|up_7|NZ_CP013341.1_764561_767258_+	cd09680, Cas10_III, CRISPR/Cas system-associated protein Cas10	csm2gr11|149aa|up_6|NZ_CP013341.1_767316_767763_+	pfam03750, Csm2_III-A, Csm2 Type III-A	csm3gr7|236aa|up_5|NZ_CP013341.1_767773_768481_+	cd09684, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	NA|60aa|up_4|NZ_CP013341.1_768491_768671_+	NA	csm4gr5|317aa|up_3|NZ_CP013341.1_768645_769596_+	TIGR01903, Hypothetical_protein	csm5gr7|572aa|up_2|NZ_CP013341.1_769592_771308_+	COG1332, COG1332, CRISPR system related protein, RAMP superfamily [Defense mechanisms]	csx1|422aa|up_1|NZ_CP013341.1_771382_772648_+	cd09747, Csx1_III-U, CRISPR/Cas system-associated protein Csx1	csx1|427aa|up_0|NZ_CP013341.1_772530_773811_+	pfam09002, DUF1887, Domain of unknown function (DUF1887)	NA|172aa|down_0|NZ_CP013341.1_776003_776519_+	pfam09912, DUF2141, Uncharacterized protein conserved in bacteria (DUF2141)	NA|276aa|down_1|NZ_CP013341.1_776530_777358_+	COG1073, COG1073, Hydrolases of the alpha/beta superfamily [General function prediction only]	NA|177aa|down_2|NZ_CP013341.1_777393_777924_+	pfam02464, CinA, Competence-damaged protein	NA|1497aa|down_3|NZ_CP013341.1_778021_782512_-	TIGR00845, Sodium/calcium_exchanger_1, sodium/calcium exchanger 1	NA|204aa|down_4|NZ_CP013341.1_782899_783511_-	PRK05208, PRK05208, hypothetical protein; Provisional	NA|217aa|down_5|NZ_CP013341.1_783725_784376_-	NA	NA|296aa|down_6|NZ_CP013341.1_784570_785458_-	PRK05678, PRK05678, succinyl-CoA synthetase subunit alpha; Validated	NA|394aa|down_7|NZ_CP013341.1_785467_786649_-	PRK14046, PRK14046, malate--CoA ligase subunit beta; Provisional	NA|319aa|down_8|NZ_CP013341.1_786748_787705_-	COG2301, CitE, Citrate lyase beta subunit [Carbohydrate transport and metabolism]	NA|345aa|down_9|NZ_CP013341.1_788105_789140_+	PRK09604, PRK09604, tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex transferase subunit TsaD
GCF_001455205.1_ASM145520v1	NZ_CP013341	Nitrosomonas ureae strain Nm10 chromosome, complete genome	2	2722971-2723071	2	CRISPRCasFinder	no		DEDDh,csa3,cas2,cas6,csx1,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,PD-DExK,cas1,DinG,cas5,cas8c,cas7,cas4,cas3	Orphan	TTGTGCCGACATTCATGGATATG	23	0	0	NA	NA	NA	1	1	Orphan	DEDDh,csa3,cas2,cas6,csx1,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,PD-DExK,cas1,DinG,cas5,cas8c,cas7,cas4,cas3	NA|94aa|up_6|NZ_CP013341.1_2715680_2715962_+,NA|120aa|up_4|NZ_CP013341.1_2718044_2718404_+,NA|149aa|up_2|NZ_CP013341.1_2719753_2720200_+,NA|118aa|down_6|NZ_CP013341.1_2729524_2729878_-,NA|59aa|down_8|NZ_CP013341.1_2731038_2731215_-,NA|150aa|down_9|NZ_CP013341.1_2731254_2731704_+	NA|247aa|up_9|NZ_CP013341.1_2711195_2711936_+	cd05362, THN_reductase-like_SDR_c, tetrahydroxynaphthalene/trihydroxynaphthalene reductase-like, classical (c) SDRs	NA|372aa|up_8|NZ_CP013341.1_2711957_2713073_+	cd05305, L-AlaDH, Alanine dehydrogenase NAD-binding and catalytic domains	NA|792aa|up_7|NZ_CP013341.1_2713236_2715612_+	pfam06934, CTI, Fatty acid cis/trans isomerase (CTI)	NA|94aa|up_6|NZ_CP013341.1_2715680_2715962_+	NA	NA|554aa|up_5|NZ_CP013341.1_2716011_2717673_-	pfam13372, Alginate_exp, Alginate export	NA|120aa|up_4|NZ_CP013341.1_2718044_2718404_+	NA	NA|246aa|up_3|NZ_CP013341.1_2718911_2719649_+	PRK05293, glgC, glucose-1-phosphate adenylyltransferase; Provisional	NA|149aa|up_2|NZ_CP013341.1_2719753_2720200_+	NA	NA|167aa|up_1|NZ_CP013341.1_2720238_2720739_+	cd02966, TlpA_like_family, TlpA-like family; composed of  TlpA, ResA, DsbE and similar proteins	NA|79aa|up_0|NZ_CP013341.1_2720778_2721015_+	pfam14086, DUF4266, Domain of unknown function (DUF4266)	NA|289aa|down_0|NZ_CP013341.1_2723864_2724731_+	pfam02424, ApbE, ApbE family	NA|413aa|down_1|NZ_CP013341.1_2724816_2726055_+	pfam01764, Lipase_3, Lipase (class 3)	NA|268aa|down_2|NZ_CP013341.1_2726246_2727050_+	cd07361, MEMO_like, Memo (mediator of ErbB2-driven cell motility) is co-precipitated with the C terminus of ErbB2, a protein involved in cell motility	NA|197aa|down_3|NZ_CP013341.1_2727039_2727630_+	TIGR04335, AMMECR1_domain_protein, AmmeMemoRadiSam system protein A	NA|366aa|down_4|NZ_CP013341.1_2727622_2728720_+	TIGR04337, Radical_SAM, AmmeMemoRadiSam system radical SAM enzyme	NA|118aa|down_5|NZ_CP013341.1_2728884_2729238_-	pfam11154, DUF2934, Protein of unknown function (DUF2934)	NA|118aa|down_6|NZ_CP013341.1_2729524_2729878_-	NA	NA|150aa|down_7|NZ_CP013341.1_2730104_2730554_-	cd17775, CBS_pair_bact_arch, Two tandem repeats of the cystathionine beta-synthase (CBS pair) domains  present in bacteria and archaea	NA|59aa|down_8|NZ_CP013341.1_2731038_2731215_-	NA	NA|150aa|down_9|NZ_CP013341.1_2731254_2731704_+	NA
GCF_001455205.1_ASM145520v1	NZ_CP013341	Nitrosomonas ureae strain Nm10 chromosome, complete genome	3	2891513-2891939	2,3,2	PILER-CR,CRISPRCasFinder,CRT	no	cas5,cas8c,cas7,cas4,cas1,cas2	DEDDh,csa3,cas2,cas6,csx1,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,PD-DExK,cas1,DinG,cas5,cas8c,cas7,cas4,cas3	 Type I-U?,Type I-U,Type I-C	GTCGCGCCCCGCGTGGGCGCGTGGATTGAAAC,GTCGCGCCCCGCGTGGGCGCGTGGATTGAAAC,GTCGCGCCCCGCGTGGGCGCGTGGATTGAAAC	32,32,32	0	0	NA	NA	I-C:I-C:I-C	6,6,6	6	TypeI-U?,TypeI-U,TypeI-C	DEDDh,csa3,cas2,cas6,csx1,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,PD-DExK,cas1,DinG,cas5,cas8c,cas7,cas4,cas3	NA,NA	NA|1168aa|up_9|NZ_CP013341.1_2877250_2880754_+	PRK05673, dnaE, DNA polymerase III subunit alpha; Validated	NA|146aa|up_8|NZ_CP013341.1_2881612_2882050_-	pfam01797, Y1_Tnp, Transposase IS200 like	NA|101aa|up_7|NZ_CP013341.1_2882162_2882465_-	COG3668, ParE, Plasmid stabilization system protein [General function prediction only]	NA|83aa|up_6|NZ_CP013341.1_2882461_2882710_-	pfam03693, ParD_antitoxin, Bacterial antitoxin of ParD toxin-antitoxin type II system and RHH	cas5|228aa|up_5|NZ_CP013341.1_2885580_2886264_+	cd09752, Cas5_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas8c|627aa|up_4|NZ_CP013341.1_2886260_2888141_+	pfam09709, Cas_Csd1, CRISPR-associated protein (Cas_Csd1)	cas7|329aa|up_3|NZ_CP013341.1_2888152_2889139_+	pfam05107, Cas_Cas7, CRISPR-associated protein Cas7	cas4|212aa|up_2|NZ_CP013341.1_2889359_2889995_+	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	cas1|345aa|up_1|NZ_CP013341.1_2889997_2891032_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas2|97aa|up_0|NZ_CP013341.1_2891047_2891338_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|450aa|down_0|NZ_CP013341.1_2893333_2894683_+	PRK10867, PRK10867, signal recognition particle protein; Provisional	NA|150aa|down_1|NZ_CP013341.1_2895969_2896419_-	PRK00601, dut, dUTP diphosphatase	NA|409aa|down_2|NZ_CP013341.1_2896405_2897632_-	PRK05579, PRK05579, bifunctional phosphopantothenoylcysteine decarboxylase/phosphopantothenate synthase; Validated	NA|225aa|down_3|NZ_CP013341.1_2897831_2898506_+	PRK00024, PRK00024, DNA repair protein RadC	NA|79aa|down_4|NZ_CP013341.1_2898563_2898800_+	PRK00359, rpmB, 50S ribosomal protein L28; Reviewed	NA|52aa|down_5|NZ_CP013341.1_2898839_2898995_+	PRK00595, rpmG, 50S ribosomal protein L33; Validated	NA|397aa|down_6|NZ_CP013341.1_2899045_2900236_-	COG1398, OLE1, Fatty-acid desaturase [Lipid metabolism]	NA|185aa|down_7|NZ_CP013341.1_2900546_2901101_-	cd02566, PseudoU_synth_RluE, Pseudouridine synthase, Escherichia coli RluE	NA|151aa|down_8|NZ_CP013341.1_2901139_2901592_-	COG2062, SixA, Phosphohistidine phosphatase SixA [Signal transduction mechanisms]	NA|97aa|down_9|NZ_CP013341.1_2901627_2901918_-	pfam02594, DUF167, Uncharacterized ACR, YggU family COG1872
GCF_001455205.1_ASM145520v1	NZ_CP013341	Nitrosomonas ureae strain Nm10 chromosome, complete genome	4	2942511-2942613	4	CRISPRCasFinder	no		DEDDh,csa3,cas2,cas6,csx1,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,PD-DExK,cas1,DinG,cas5,cas8c,cas7,cas4,cas3	Orphan	GCAATGGTCAATGTTCATTTATGAGTCAGAGAAAATA	37	0	0	NA	NA	NA	1	1	Orphan	DEDDh,csa3,cas2,cas6,csx1,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,PD-DExK,cas1,DinG,cas5,cas8c,cas7,cas4,cas3	NA|158aa|up_9|NZ_CP013341.1_2931512_2931986_+,NA	NA|158aa|up_9|NZ_CP013341.1_2931512_2931986_+	NA	NA|170aa|up_8|NZ_CP013341.1_2932252_2932762_+	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|478aa|up_7|NZ_CP013341.1_2934670_2936104_+	pfam08548, Peptidase_M10_C, Peptidase M10 serralysin C terminal	NA|68aa|up_6|NZ_CP013341.1_2936326_2936530_+	TIGR01683, thiamine_biosynthesis_protein_ThiS, thiamine biosynthesis protein ThiS	NA|272aa|up_5|NZ_CP013341.1_2936571_2937387_+	PRK00208, thiG, thiazole synthase; Reviewed	NA|222aa|up_4|NZ_CP013341.1_2937419_2938085_+	PRK00121, trmB, tRNA (guanine-N(7)-)-methyltransferase; Reviewed	NA|300aa|up_3|NZ_CP013341.1_2938313_2939213_+	TIGR02971, devB-like_secretion_protein, ABC exporter membrane fusion protein, DevB family	NA|378aa|up_2|NZ_CP013341.1_2939245_2940379_+	TIGR01185, membrane_spanning_subunit, DevC protein	NA|226aa|up_1|NZ_CP013341.1_2940378_2941056_+	TIGR02982, heterocyst_DevA, ABC exporter ATP-binding subunit, DevA family	NA|418aa|up_0|NZ_CP013341.1_2941157_2942411_-	COG1686, DacC, D-alanyl-D-alanine carboxypeptidase [Cell envelope biogenesis, outer membrane]	NA|322aa|down_0|NZ_CP013341.1_2943025_2943991_+	COG4076, COG4076, Predicted RNA methylase [General function prediction only]	NA|381aa|down_1|NZ_CP013341.1_2944248_2945391_-	pfam06727, DUF1207, Protein of unknown function (DUF1207)	NA|158aa|down_2|NZ_CP013341.1_2945399_2945873_-	PRK10568, PRK10568, molecular chaperone OsmY	NA|583aa|down_3|NZ_CP013341.1_2946113_2947862_+	COG0405, Ggt, Gamma-glutamyltransferase [Amino acid transport and metabolism]	NA|472aa|down_4|NZ_CP013341.1_2948249_2949665_+	PRK06292, PRK06292, dihydrolipoamide dehydrogenase; Validated	NA|537aa|down_5|NZ_CP013341.1_2949899_2951510_+	COG0531, PotE, Amino acid transporters [Amino acid transport and metabolism]	NA|127aa|down_6|NZ_CP013341.1_2951585_2951966_-	PRK08762, PRK08762, molybdopterin-synthase adenylyltransferase MoeB	NA|421aa|down_7|NZ_CP013341.1_2952183_2953446_-	TIGR03079, ammonia_monooxygenase_subunit_B, methane monooxygenase/ammonia monooxygenase, subunit B	NA|275aa|down_8|NZ_CP013341.1_2953445_2954270_-	TIGR03080, ammonia_monooxygeanse_subunit_A, methane monooxygenase/ammonia monooxygenase, subunit A	NA|270aa|down_9|NZ_CP013341.1_2954444_2955254_-	TIGR03078, ammonia_monooxygenase_3_subunit_C, methane monooxygenase/ammonia monooxygenase, subunit C
