assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000165715.2_ASM16571v3	NC_015174	Rubinisphaera brasiliensis DSM 5305, complete sequence	1	238716-238834	1	CRISPRCasFinder	no		csf3gr5,csf2gr7,csf4gr11,csf1gr8,cas3,WYL,csa3,DinG,RT,cas2,cas1,cas4,cas7,cas8c,cas5	Orphan	GTGGCGGAATGGCAGACGCGGAGGATTCAAAATCC	35	0	0	NA	NA	NA	1	1	Orphan	csf3gr5,csf2gr7,csf4gr11,csf1gr8,cas3,WYL,csa3,DinG,RT,cas2,cas1,cas4,cas7,cas8c,cas5	NA|85aa|up_9|NC_015174.1_228089_228344_-,NA|184aa|up_8|NC_015174.1_228371_228923_-,NA|224aa|up_7|NC_015174.1_229105_229777_+,NA|201aa|up_6|NC_015174.1_229813_230416_+,NA|76aa|up_5|NC_015174.1_230494_230722_-,NA|54aa|down_1|NC_015174.1_239259_239421_+,NA|104aa|down_2|NC_015174.1_239452_239764_+,NA|53aa|down_3|NC_015174.1_239763_239922_+,NA|122aa|down_4|NC_015174.1_240098_240464_+,NA|148aa|down_6|NC_015174.1_241188_241632_+,NA|123aa|down_8|NC_015174.1_241825_242194_+,NA|97aa|down_9|NC_015174.1_242190_242481_+	NA|85aa|up_9|NC_015174.1_228089_228344_-	NA	NA|184aa|up_8|NC_015174.1_228371_228923_-	NA	NA|224aa|up_7|NC_015174.1_229105_229777_+	NA	NA|201aa|up_6|NC_015174.1_229813_230416_+	NA	NA|76aa|up_5|NC_015174.1_230494_230722_-	NA	NA|183aa|up_4|NC_015174.1_231455_232004_+	COG1943, COG1943, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|458aa|up_3|NC_015174.1_232110_233484_+	pfam04326, AlbA_2, Putative DNA-binding domain	NA|344aa|up_2|NC_015174.1_233994_235026_+	PRK09197, PRK09197, fructose-bisphosphate aldolase; Provisional	NA|395aa|up_1|NC_015174.1_235560_236745_+	pfam13485, Peptidase_MA_2, Peptidase MA superfamily	NA|289aa|up_0|NC_015174.1_237626_238493_-	PRK12276, PRK12276, putative heme peroxidase; Provisional	NA|68aa|down_0|NC_015174.1_238942_239146_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|54aa|down_1|NC_015174.1_239259_239421_+	NA	NA|104aa|down_2|NC_015174.1_239452_239764_+	NA	NA|53aa|down_3|NC_015174.1_239763_239922_+	NA	NA|122aa|down_4|NC_015174.1_240098_240464_+	NA	NA|197aa|down_5|NC_015174.1_240483_241074_+	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|148aa|down_6|NC_015174.1_241188_241632_+	NA	NA|59aa|down_7|NC_015174.1_241649_241826_+	pfam02599, CsrA, Global regulator protein family	NA|123aa|down_8|NC_015174.1_241825_242194_+	NA	NA|97aa|down_9|NC_015174.1_242190_242481_+	NA
GCF_000165715.2_ASM16571v3	NC_015174	Rubinisphaera brasiliensis DSM 5305, complete sequence	2	4766811-4772494	2,1,1	CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas4,cas7,cas8c,cas5,cas3	csf3gr5,csf2gr7,csf4gr11,csf1gr8,cas3,WYL,csa3,DinG,RT,cas2,cas1,cas4,cas7,cas8c,cas5	 Type I-U?,Type I-C,Type I-U	GTTTCAATCCGCGCCCCTGTGGAGGGGCGAT,GTTTCAATCCGCGCCCCTGTGGAGGGGCGAT,GTTTCAATCCGCGCCCCTGTGGAGGGGCGAT	31,31,31	6	6	4767037-4767072|4767429-4767462|4767558-4767591|4770872-4770906|4771002-4771034|4771130-4771164	NC_015174.1_253501-253536|NC_015174.1_283064-283031|NC_015174.1_283304-283271|NC_015174.1_275232-275198|NC_015174.1_276100-276068|NC_015174.1_259703-259737	NA:NA:NA	87,87,86	87	TypeI-U?,TypeI-C,TypeI-U	csf3gr5,csf2gr7,csf4gr11,csf1gr8,cas3,WYL,csa3,DinG,RT,cas2,cas1,cas4,cas7,cas8c,cas5	NA|102aa|up_1|NC_015174.1_4765275_4765581_-,NA	NA|79aa|up_9|NC_015174.1_4748439_4748676_+	PRK01271, PRK01271, tautomerase PptA	NA|230aa|up_8|NC_015174.1_4748782_4749472_+	cd05324, carb_red_PTCR-like_SDR_c, Porcine testicular carbonyl reductase (PTCR)-like, classical (c) SDRs	NA|334aa|up_7|NC_015174.1_4749790_4750792_-	COG2207, AraC, AraC-type DNA-binding domain-containing proteins [Transcription]	NA|486aa|up_6|NC_015174.1_4751118_4752576_+	COG5361, COG5361, Uncharacterized conserved protein [Function unknown]	NA|778aa|up_5|NC_015174.1_4752711_4755045_+	cd16025, PAS_like, Bacterial Arylsulfatase of Pseudomonas aeruginosa and related proteins	NA|789aa|up_4|NC_015174.1_4757628_4759995_+	cd16025, PAS_like, Bacterial Arylsulfatase of Pseudomonas aeruginosa and related proteins	NA|808aa|up_3|NC_015174.1_4760130_4762554_+	cd16025, PAS_like, Bacterial Arylsulfatase of Pseudomonas aeruginosa and related proteins	NA|781aa|up_2|NC_015174.1_4762644_4764987_+	cd16025, PAS_like, Bacterial Arylsulfatase of Pseudomonas aeruginosa and related proteins	NA|102aa|up_1|NC_015174.1_4765275_4765581_-	NA	NA|250aa|up_0|NC_015174.1_4765847_4766597_-	pfam13683, rve_3, Integrase core domain	cas2|97aa|down_0|NC_015174.1_4772696_4772987_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|345aa|down_1|NC_015174.1_4772990_4774025_-	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	NA|296aa|down_2|NC_015174.1_4774021_4774909_-	COG3183, COG3183, Predicted restriction endonuclease [Defense mechanisms]	cas4|230aa|down_3|NC_015174.1_4774926_4775616_-	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	cas7|296aa|down_4|NC_015174.1_4775674_4776562_-	pfam05107, Cas_Cas7, CRISPR-associated protein Cas7	cas8c|589aa|down_5|NC_015174.1_4776625_4778392_-	pfam09709, Cas_Csd1, CRISPR-associated protein (Cas_Csd1)	cas5|221aa|down_6|NC_015174.1_4778388_4779051_-	cd09752, Cas5_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas3|770aa|down_7|NC_015174.1_4779063_4781373_-	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	NA|70aa|down_8|NC_015174.1_4781820_4782030_-	pfam13358, DDE_3, DDE superfamily endonuclease	NA|445aa|down_9|NC_015174.1_4782994_4784329_-	TIGR00881, Glycerol-3-phosphate_transporter, phosphoglycerate transporter family protein
GCF_000165715.2_ASM16571v3	NC_015174	Rubinisphaera brasiliensis DSM 5305, complete sequence	3	5079465-5087824	3,2,2	CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas4,cas7,cas8c,cas5,cas3	csf3gr5,csf2gr7,csf4gr11,csf1gr8,cas3,WYL,csa3,DinG,RT,cas2,cas1,cas4,cas7,cas8c,cas5	 Type I-U?,Type I-C,Type I-U	GTTTCAATCCGCGCCCCTGTGGAGGGGCGAT,GTTTCAATCCGCGCCCCTGTGGAGGGGCGAT,GTTTCAATCCGCGCCCCTGTGGAGGGGCGAT	31,31,31	10	10	5081185-5081219|5081772-5081804|5083457-5083489|5083586-5083619|5083651-5083684|5084433-5084467|5084826-5084860|5086389-5086422|5086912-5086945|5087107-5087141	NC_015174.1_280331-280365|NC_015174.1_253504-253536|NC_015174.1_252053-252085|NC_015174.1_249157-249190|NC_015174.1_280955-280988|NC_015174.1_281027-281061|NC_015174.1_281027-281061|NC_015174.1_253598-253631|NC_015174.1_242924-242891|NC_015174.1_246449-246415	NA:NA:NA	128,128,123	128	TypeI-U?,TypeI-C,TypeI-U	csf3gr5,csf2gr7,csf4gr11,csf1gr8,cas3,WYL,csa3,DinG,RT,cas2,cas1,cas4,cas7,cas8c,cas5	NA|56aa|up_8|NC_015174.1_5074918_5075086_-,NA|95aa|up_7|NC_015174.1_5075156_5075441_+,NA|155aa|up_5|NC_015174.1_5075779_5076244_+,NA|328aa|up_2|NC_015174.1_5076998_5077982_+,NA|203aa|down_8|NC_015174.1_5098218_5098827_+	NA|685aa|up_9|NC_015174.1_5072848_5074903_+	cd00338, Ser_Recombinase, Serine Recombinase family, catalytic domain; a DNA binding domain may be present either N- or C-terminal to the catalytic domain	NA|56aa|up_8|NC_015174.1_5074918_5075086_-	NA	NA|95aa|up_7|NC_015174.1_5075156_5075441_+	NA	NA|74aa|up_6|NC_015174.1_5075446_5075668_-	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|155aa|up_5|NC_015174.1_5075779_5076244_+	NA	NA|59aa|up_4|NC_015174.1_5076353_5076530_+	TIGR03184, putative_phosphoribosylaminoimidazole, DNA sulfur modification protein DndE	NA|78aa|up_3|NC_015174.1_5076689_5076923_+	cd00754, Ubl_MoaD, ubiquitin-like (Ubl) domain found in molybdenum cofactor biosynthesis protein D (MoaD) and similar proteins	NA|328aa|up_2|NC_015174.1_5076998_5077982_+	NA	NA|222aa|up_1|NC_015174.1_5077920_5078586_+	cd07767, MPN, Mpr1p, Pad1p N-terminal (MPN) domains	NA|219aa|up_0|NC_015174.1_5078578_5079235_+	pfam00899, ThiF, ThiF family	cas2|97aa|down_0|NC_015174.1_5088026_5088317_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|345aa|down_1|NC_015174.1_5088320_5089355_-	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	NA|296aa|down_2|NC_015174.1_5089351_5090239_-	COG3183, COG3183, Predicted restriction endonuclease [Defense mechanisms]	cas4|230aa|down_3|NC_015174.1_5090256_5090946_-	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	cas7|296aa|down_4|NC_015174.1_5091004_5091892_-	pfam05107, Cas_Cas7, CRISPR-associated protein Cas7	cas8c|589aa|down_5|NC_015174.1_5091955_5093722_-	pfam09709, Cas_Csd1, CRISPR-associated protein (Cas_Csd1)	cas5|221aa|down_6|NC_015174.1_5093718_5094381_-	cd09752, Cas5_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas3|770aa|down_7|NC_015174.1_5094393_5096703_-	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	NA|203aa|down_8|NC_015174.1_5098218_5098827_+	NA	NA|324aa|down_9|NC_015174.1_5099300_5100272_-	pfam07596, SBP_bac_10, Protein of unknown function (DUF1559)
GCF_000165715.2_ASM16571v3	NC_015174	Rubinisphaera brasiliensis DSM 5305, complete sequence	4	5779301-5779410	4	CRISPRCasFinder	no		csf3gr5,csf2gr7,csf4gr11,csf1gr8,cas3,WYL,csa3,DinG,RT,cas2,cas1,cas4,cas7,cas8c,cas5	Orphan	TCGTCAAACGTGTTCCTCGCGAAGTG	26	0	0	NA	NA	NA	1	1	Orphan	csf3gr5,csf2gr7,csf4gr11,csf1gr8,cas3,WYL,csa3,DinG,RT,cas2,cas1,cas4,cas7,cas8c,cas5	NA|387aa|up_7|NC_015174.1_5768610_5769771_+,NA|134aa|up_5|NC_015174.1_5771003_5771405_-,NA|758aa|down_1|NC_015174.1_5782995_5785269_+,NA|150aa|down_4|NC_015174.1_5787132_5787582_-,NA|110aa|down_5|NC_015174.1_5788065_5788395_+	NA|333aa|up_9|NC_015174.1_5765672_5766671_+	cd05241, 3b-HSD-like_SDR_e, 3beta-hydroxysteroid dehydrogenases (3b-HSD)-like, extended (e) SDRs	NA|475aa|up_8|NC_015174.1_5766985_5768410_-	cd16026, GALNS_like, galactosamine-6-sulfatase; also known as N-acetylgalactosamine-6-sulfatase (GALNS)	NA|387aa|up_7|NC_015174.1_5768610_5769771_+	NA	NA|336aa|up_6|NC_015174.1_5769927_5770935_+	cd12183, LDH_like_2, D-Lactate and related Dehydrogenases, NAD-binding and catalytic domains	NA|134aa|up_5|NC_015174.1_5771003_5771405_-	NA	NA|496aa|up_4|NC_015174.1_5771584_5773072_+	PRK10867, PRK10867, signal recognition particle protein; Provisional	NA|477aa|up_3|NC_015174.1_5773891_5775322_+	cd03302, Adenylsuccinate_lyase_2, Adenylsuccinate lyase (ASL)_subgroup 2	NA|199aa|up_2|NC_015174.1_5775494_5776091_+	pfam07617, DUF1579, Protein of unknown function (DUF1579)	NA|334aa|up_1|NC_015174.1_5776123_5777125_-	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|316aa|up_0|NC_015174.1_5777549_5778497_-	sd00006, TPR, Tetratricopeptide repeat	NA|641aa|down_0|NC_015174.1_5780916_5782839_+	PRK05899, PRK05899, transketolase; Reviewed	NA|758aa|down_1|NC_015174.1_5782995_5785269_+	NA	NA|309aa|down_2|NC_015174.1_5785326_5786253_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|264aa|down_3|NC_015174.1_5786272_5787064_+	COG0300, DltE, Short-chain dehydrogenases of various substrate specificities [General function prediction only]	NA|150aa|down_4|NC_015174.1_5787132_5787582_-	NA	NA|110aa|down_5|NC_015174.1_5788065_5788395_+	NA	NA|337aa|down_6|NC_015174.1_5788804_5789815_+	COG1821, COG1821, Predicted ATP-utilizing enzyme (ATP-grasp superfamily) [General function prediction only]	NA|345aa|down_7|NC_015174.1_5789823_5790858_+	TIGR03123, one_C_unchar_1, probable H4MPT-linked C1 transfer pathway protein	NA|230aa|down_8|NC_015174.1_5791242_5791932_+	cd08168, Cytochrom_C3, Heme-binding domain of the class III cytochrome C family and related proteins	NA|1082aa|down_9|NC_015174.1_5791998_5795244_+	cd02764, MopB_PHLH, The MopB_PHLH CD includes a group of related uncharacterized putative hydrogenase-like homologs (PHLH) of molybdopterin binding (MopB) proteins
