assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000175095.2_ASM17509v2	NC_015222	Nitrosomonas sp. AL212, complete sequence	1	1342573-1342655	1	CRISPRCasFinder	no	cas1	cas1,csa3,cas2,cas4,cas7,cas8c,cas5,cas3,PD-DExK,DinG,DEDDh,cas9	Unclear	ATAAGTCTCGGTTAAGGGGCCAA	23	0	0	NA	NA	NA	1	1	Unclear	cas1,csa3,cas2,cas4,cas7,cas8c,cas5,cas3,PD-DExK,DinG,DEDDh,cas9	NA|74aa|up_6|NC_015222.1_1335350_1335572_+,NA|591aa|up_5|NC_015222.1_1335963_1337736_+,NA|99aa|up_1|NC_015222.1_1340523_1340820_-,NA	NA|478aa|up_9|NC_015222.1_1330380_1331814_-	pfam08548, Peptidase_M10_C, Peptidase M10 serralysin C terminal	NA|288aa|up_8|NC_015222.1_1332758_1333622_+	pfam10137, TIR-like, Predicted nucleotide-binding protein containing TIR-like domain	NA|350aa|up_7|NC_015222.1_1334132_1335182_-	COG3177, COG3177, Fic family protein [Function unknown]	NA|74aa|up_6|NC_015222.1_1335350_1335572_+	NA	NA|591aa|up_5|NC_015222.1_1335963_1337736_+	NA	NA|97aa|up_4|NC_015222.1_1337864_1338155_+	PRK11147, PRK11147, ABC transporter ATPase component; Reviewed	NA|528aa|up_3|NC_015222.1_1338548_1340132_-	pfam03050, DDE_Tnp_IS66, Transposase IS66 family	NA|117aa|up_2|NC_015222.1_1340185_1340536_-	pfam05717, TnpB_IS66, IS66 Orf2 like protein	NA|99aa|up_1|NC_015222.1_1340523_1340820_-	NA	NA|479aa|up_0|NC_015222.1_1341116_1342553_-	TIGR01845, Outer_membrane_protein_OprM, efflux transporter, outer membrane factor (OMF) lipoprotein, NodT family	NA|362aa|down_0|NC_015222.1_1345802_1346888_-	TIGR01730, COG0845:_Membrane-fusion_protein, RND family efflux transporter, MFP subunit	NA|93aa|down_1|NC_015222.1_1347128_1347407_+	pfam12760, Zn_Tnp_IS1595, Transposase zinc-ribbon domain	NA|83aa|down_2|NC_015222.1_1347343_1347592_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	cas1|133aa|down_3|NC_015222.1_1347595_1347994_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	NA|120aa|down_4|NC_015222.1_1348485_1348845_+	pfam13875, DUF4202, Domain of unknown function (DUF4202)	NA|300aa|down_5|NC_015222.1_1348944_1349844_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|385aa|down_6|NC_015222.1_1349950_1351105_+	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|503aa|down_7|NC_015222.1_1352327_1353836_-	COG4584, COG4584, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|96aa|down_8|NC_015222.1_1353924_1354212_+	pfam13875, DUF4202, Domain of unknown function (DUF4202)	NA|563aa|down_9|NC_015222.1_1354318_1356007_-	cd13853, CuRO_1_Tth-MCO_like, The first cupredoxin domain of the bacterial laccases similar to Tth-MCO from Thermus Thermophilus
GCF_000175095.2_ASM17509v2	NC_015222	Nitrosomonas sp. AL212, complete sequence	2	1386182-1388367	1,2,1	PILER-CR,CRISPRCasFinder,CRT	no	cas2,cas1,cas4,cas7,cas8c,cas5,cas3	cas1,csa3,cas2,cas4,cas7,cas8c,cas5,cas3,PD-DExK,DinG,DEDDh,cas9	Type I-C,Type I-U, Type I-U?	GTTTCAATCCACGCGCCCACGCGGGGCGCGAC,GTTTCAATCCACGCGCCCACGCGGGGCGCGAC,GTTTCAATCCACGCGCCCACGCGGGGCGCGAC	32,32,32	0	0	NA	NA	I-C:I-C:I-C	33,33,33	33	TypeI-C,TypeI-U,TypeI-U?	cas1,csa3,cas2,cas4,cas7,cas8c,cas5,cas3,PD-DExK,DinG,DEDDh,cas9	NA,NA|59aa|down_3|NC_015222.1_1390550_1390727_-	NA|154aa|up_9|NC_015222.1_1376712_1377174_+	COG2062, SixA, Phosphohistidine phosphatase SixA [Signal transduction mechanisms]	NA|185aa|up_8|NC_015222.1_1377203_1377758_+	cd02566, PseudoU_synth_RluE, Pseudouridine synthase, Escherichia coli RluE	NA|397aa|up_7|NC_015222.1_1378072_1379263_+	COG1398, OLE1, Fatty-acid desaturase [Lipid metabolism]	NA|52aa|up_6|NC_015222.1_1379311_1379467_-	PRK00595, rpmG, 50S ribosomal protein L33; Validated	NA|79aa|up_5|NC_015222.1_1379506_1379743_-	PRK00359, rpmB, 50S ribosomal protein L28; Reviewed	NA|225aa|up_4|NC_015222.1_1379800_1380475_-	PRK00024, PRK00024, DNA repair protein RadC	NA|409aa|up_3|NC_015222.1_1380674_1381901_+	PRK05579, PRK05579, bifunctional phosphopantothenoylcysteine decarboxylase/phosphopantothenate synthase; Validated	NA|150aa|up_2|NC_015222.1_1381887_1382337_+	PRK00601, dut, dUTP diphosphatase	NA|450aa|up_1|NC_015222.1_1383444_1384794_-	PRK10867, PRK10867, signal recognition particle protein; Provisional	NA|281aa|up_0|NC_015222.1_1384930_1385773_+	COG4137, COG4137, ABC-type uncharacterized transport system, permease component [General function prediction only]	cas2|97aa|down_0|NC_015222.1_1388541_1388832_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|345aa|down_1|NC_015222.1_1388847_1389882_-	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas4|212aa|down_2|NC_015222.1_1389884_1390520_-	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	NA|59aa|down_3|NC_015222.1_1390550_1390727_-	NA	cas7|292aa|down_4|NC_015222.1_1390737_1391613_-	pfam05107, Cas_Cas7, CRISPR-associated protein Cas7	cas8c|609aa|down_5|NC_015222.1_1391624_1393451_-	pfam09709, Cas_Csd1, CRISPR-associated protein (Cas_Csd1)	cas5|228aa|down_6|NC_015222.1_1393447_1394131_-	cd09752, Cas5_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas3|755aa|down_7|NC_015222.1_1394152_1396417_-	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	NA|1168aa|down_8|NC_015222.1_1397535_1401039_-	PRK05673, dnaE, DNA polymerase III subunit alpha; Validated	NA|456aa|down_9|NC_015222.1_1401101_1402469_+	PRK15452, PRK15452, putative protease; Provisional
GCF_000175095.2_ASM17509v2	NC_015222	Nitrosomonas sp. AL212, complete sequence	3	2937667-2938940	3,2,2	CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas9	cas1,csa3,cas2,cas4,cas7,cas8c,cas5,cas3,PD-DExK,DinG,DEDDh,cas9	 Type II-B,Type II-A, or Type II-C?,Type II-C,Type II-B	GTTCCGGTCAGAGCACAAATCCCAATATGCTAAAC,GTTCCGGTCAGAGCACAAATCCCAATATGCTAAAC,GTTCCGGTCAGAGCACAAATCCCAATATGCTAAAC	35,35,35	1	1	2938811-2938840	NC_015222.1_980-1009	NA:NA:NA	19,19,9	19	TypeII-B,TypeII-A,orTypeII-C?,TypeII-C,TypeII-B	cas1,csa3,cas2,cas4,cas7,cas8c,cas5,cas3,PD-DExK,DinG,DEDDh,cas9	NA|118aa|up_3|NC_015222.1_2934405_2934759_+,NA|76aa|up_0|NC_015222.1_2937021_2937249_-,NA|99aa|down_8|NC_015222.1_2949988_2950285_+	NA|276aa|up_9|NC_015222.1_2926941_2927769_-	PRK05339, PRK05339, pyruvate, phosphate dikinase/phosphoenolpyruvate synthase regulator	NA|794aa|up_8|NC_015222.1_2927765_2930147_-	PRK06464, PRK06464, phosphoenolpyruvate synthase; Validated	NA|329aa|up_7|NC_015222.1_2930196_2931183_-	cd08419, PBP2_CbbR_RubisCO_like, The C-terminal substrate binding of LysR-type transcriptional regulator (CbbR) of RubisCO operon, which is involved in the carbon dioxide fixation, contains the type 2 periplasmic binding fold	NA|493aa|up_6|NC_015222.1_2931348_2932827_+	CHL00040, rbcL, ribulose-1,5-bisphosphate carboxylase/oxygenase large subunit	NA|145aa|up_5|NC_015222.1_2932847_2933282_+	CHL00130, rbcS, ribulose-1,5-bisphosphate carboxylase/oxygenase small subunit; Reviewed	NA|314aa|up_4|NC_015222.1_2933429_2934371_+	TIGR02880, Protein_CbxX_chromosomal, probable Rubsico expression protein CbbX	NA|118aa|up_3|NC_015222.1_2934405_2934759_+	NA	NA|411aa|up_2|NC_015222.1_2934792_2936025_+	pfam01116, F_bP_aldolase, Fructose-bisphosphate aldolase class-II	NA|228aa|up_1|NC_015222.1_2936248_2936932_+	COG2885, OmpA, Outer membrane protein and related peptidoglycan-associated (lipo)proteins [Cell envelope biogenesis, outer membrane]	NA|76aa|up_0|NC_015222.1_2937021_2937249_-	NA	cas2|109aa|down_0|NC_015222.1_2939009_2939336_-	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	cas1|232aa|down_1|NC_015222.1_2939342_2940038_-	TIGR03639, cas1_NMENI, CRISPR-associated endonuclease Cas1, subtype II/NMENI	NA|436aa|down_2|NC_015222.1_2940132_2941440_+	pfam05598, DUF772, Transposase domain (DUF772)	cas9|1045aa|down_3|NC_015222.1_2941805_2944940_-	TIGR01865, conserved_hypothetical_protein, CRISPR subtype II/NMENI RNA-guided endonuclease Cas9/Csn1	NA|469aa|down_4|NC_015222.1_2945201_2946608_-	cd07100, ALDH_SSADH1_GabD1, Mycobacterium tuberculosis succinate-semialdehyde dehydrogenase 1-like	NA|300aa|down_5|NC_015222.1_2946890_2947790_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|385aa|down_6|NC_015222.1_2947849_2949004_-	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|120aa|down_7|NC_015222.1_2949356_2949716_-	pfam14832, Tautomerase_3, Putative oxalocrotonate tautomerase enzyme	NA|99aa|down_8|NC_015222.1_2949988_2950285_+	NA	NA|304aa|down_9|NC_015222.1_2950441_2951353_-	pfam03285, Paralemmin, Paralemmin
