assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000010105.1_ASM1010v1	NC_012490	Rhodococcus erythropolis PR4, complete genome	1	128133-128249	1	CRISPRCasFinder	no		cas3,WYL,csa3,cas4,DEDDh,DinG,Cas9_archaeal,RT	Orphan	GAAGCTGAACGGGTTGTCGACGAGGGCGTTGGTGCC	36	0	0	NA	NA	NA	1	1	Orphan	cas3,WYL,csa3,cas4,DEDDh,DinG,Cas9_archaeal,RT,csf1gr8,csf4gr11,csf2gr7,csf3gr5,PD-DExK	NA,NA|151aa|down_6|NC_012490.1_133566_134019_-,NA|416aa|down_8|NC_012490.1_135737_136985_-	NA|401aa|up_9|NC_012490.1_117915_119118_-	COG4585, COG4585, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|349aa|up_8|NC_012490.1_119232_120279_+	COG0577, SalY, ABC-type antimicrobial peptide transport system, permease component [Defense mechanisms]	NA|247aa|up_7|NC_012490.1_120275_121016_+	cd03255, ABC_MJ0796_LolCDE_FtsE, ATP-binding cassette domain of the transporters involved in export of lipoprotein and macrolide, and cell division protein	NA|147aa|up_6|NC_012490.1_121127_121568_+	pfam13426, PAS_9, PAS domain	NA|209aa|up_5|NC_012490.1_121574_122201_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|324aa|up_4|NC_012490.1_122252_123224_+	COG1748, LYS9, Saccharopine dehydrogenase and related proteins [Amino acid transport and metabolism]	NA|431aa|up_3|NC_012490.1_123170_124463_-	TIGR03604, hypothetical_protein, thiazole/oxazole-forming peptide maturase, SagD family component	NA|447aa|up_2|NC_012490.1_124459_125800_-	TIGR03604, hypothetical_protein, thiazole/oxazole-forming peptide maturase, SagD family component	NA|476aa|up_1|NC_012490.1_125792_127220_-	COG2936, COG2936, Predicted acyl esterases [General function prediction only]	NA|271aa|up_0|NC_012490.1_127216_128029_-	TIGR03882, hypothetical_protein, bacteriocin biosynthesis cyclodehydratase domain	NA|420aa|down_0|NC_012490.1_128404_129664_+	cd06173, MFS_MefA_like, Macrolide efflux protein A and similar proteins of the Major Facilitator Superfamily of transporters	NA|356aa|down_1|NC_012490.1_129748_130816_+	pfam01032, FecCD, FecCD transport family	NA|265aa|down_2|NC_012490.1_130812_131607_+	COG1120, FepC, ABC-type cobalamin/Fe3+-siderophores transport systems, ATPase components [Inorganic ion transport and metabolism / Coenzyme metabolism]	NA|327aa|down_3|NC_012490.1_131603_132584_+	cd01148, TroA_a, Metal binding protein TroA_a	NA|229aa|down_4|NC_012490.1_132588_133275_+	TIGR03605, antibiot_sagB, SagB-type dehydrogenase domain	NA|98aa|down_5|NC_012490.1_133276_133570_-	pfam09851, SHOCT, Short C-terminal domain	NA|151aa|down_6|NC_012490.1_133566_134019_-	NA	NA|549aa|down_7|NC_012490.1_134022_135669_-	cd17321, MFS_MMR_MDR_like, Methylenomycin A resistance protein (also called MMR peptide) and similar multidrug resistance (MDR) transporters of the Major Facilitator Superfamily	NA|416aa|down_8|NC_012490.1_135737_136985_-	NA	NA|196aa|down_9|NC_012490.1_137003_137591_+	pfam04978, DUF664, Protein of unknown function (DUF664)
GCF_000010105.1_ASM1010v1	NC_012490	Rhodococcus erythropolis PR4, complete genome	2	2313611-2313696	2	CRISPRCasFinder	no		cas3,WYL,csa3,cas4,DEDDh,DinG,Cas9_archaeal,RT	Orphan	CACCGGATGCTGCGCCGCCGCCG	23	0	0	NA	NA	NA	1	1	Orphan	cas3,WYL,csa3,cas4,DEDDh,DinG,Cas9_archaeal,RT,csf1gr8,csf4gr11,csf2gr7,csf3gr5,PD-DExK	NA|117aa|up_1|NC_012490.1_2312549_2312900_-,NA	NA|904aa|up_9|NC_012490.1_2304554_2307266_-	PRK09800, PRK09800, putative hypoxanthine oxidase; Provisional	NA|270aa|up_8|NC_012490.1_2307262_2308072_-	pfam00941, FAD_binding_5, FAD binding domain in molybdopterin dehydrogenase	NA|457aa|up_7|NC_012490.1_2308079_2309450_-	PRK08203, PRK08203, hydroxydechloroatrazine ethylaminohydrolase; Reviewed	NA|306aa|up_6|NC_012490.1_2309446_2310364_-	TIGR03383, Structure_Of_Uricase, urate oxidase	NA|110aa|up_5|NC_012490.1_2310428_2310758_-	pfam00576, Transthyretin, HIUase/Transthyretin family	NA|173aa|up_4|NC_012490.1_2310754_2311273_-	PRK13798, PRK13798, putative OHCU decarboxylase; Provisional	NA|267aa|up_3|NC_012490.1_2311389_2312190_+	pfam13350, Y_phosphatase3, Tyrosine phosphatase family	NA|121aa|up_2|NC_012490.1_2312190_2312553_-	COG5652, COG5652, Predicted integral membrane protein [Function unknown]	NA|117aa|up_1|NC_012490.1_2312549_2312900_-	NA	NA|142aa|up_0|NC_012490.1_2312899_2313325_-	pfam08044, DUF1707, Domain of unknown function (DUF1707)	NA|467aa|down_0|NC_012490.1_2315336_2316737_-	pfam00668, Condensation, Condensation domain	NA|139aa|down_1|NC_012490.1_2316741_2317158_-	pfam02657, SufE, Fe-S metabolism associated domain	NA|302aa|down_2|NC_012490.1_2317154_2318060_-	COG2897, SseA, Rhodanese-related sulfurtransferase [Inorganic ion transport and metabolism]	NA|488aa|down_3|NC_012490.1_2318178_2319642_-	pfam00668, Condensation, Condensation domain	NA|498aa|down_4|NC_012490.1_2319641_2321135_-	pfam00668, Condensation, Condensation domain	NA|566aa|down_5|NC_012490.1_2321285_2322983_+	TIGR00711, Uncharacterized_MFS-type_transporter_YhcA, drug resistance transporter, EmrB/QacA subfamily	NA|435aa|down_6|NC_012490.1_2323047_2324352_+	pfam02720, DUF222, Domain of unknown function (DUF222)	NA|214aa|down_7|NC_012490.1_2324475_2325117_-	PRK00148, PRK00148, Maf-like protein; Reviewed	NA|114aa|down_8|NC_012490.1_2325132_2325474_-	pfam13822, ACC_epsilon, Acyl-CoA carboxylase epsilon subunit	NA|547aa|down_9|NC_012490.1_2325470_2327111_-	COG4799, COG4799, Acetyl-CoA carboxylase, carboxyltransferase component (subunits alpha and beta) [Lipid metabolism]
GCF_000010105.1_ASM1010v1	NC_012490	Rhodococcus erythropolis PR4, complete genome	3	3337843-3338328	1	CRT	no	csa3	cas3,WYL,csa3,cas4,DEDDh,DinG,Cas9_archaeal,RT	Type I-A	GGANGAGCGGTTGCCCTGGTANCC	24	0	0	NA	NA	NA	7	7	Orphan	cas3,WYL,csa3,cas4,DEDDh,DinG,Cas9_archaeal,RT,csf1gr8,csf4gr11,csf2gr7,csf3gr5,PD-DExK	NA|293aa|up_6|NC_012490.1_3328490_3329369_-,NA|294aa|up_2|NC_012490.1_3333587_3334469_-,NA|261aa|down_6|NC_012490.1_3347709_3348492_+	NA|345aa|up_9|NC_012490.1_3325623_3326658_-	cd02653, nuc_hydro_3, NH_3: A subgroup of nucleoside hydrolases	NA|159aa|up_8|NC_012490.1_3326650_3327127_-	COG1764, osmC, Organic hydroperoxide reductase [Secondary metabolites biosynthesis, transport and catabolism]	NA|438aa|up_7|NC_012490.1_3327158_3328472_-	pfam02515, CoA_transf_3, CoA-transferase family III	NA|293aa|up_6|NC_012490.1_3328490_3329369_-	NA	NA|363aa|up_5|NC_012490.1_3329372_3330461_-	COG1253, TlyC, Hemolysins and related proteins containing CBS domains [General function prediction only]	NA|461aa|up_4|NC_012490.1_3330453_3331836_-	COG1253, TlyC, Hemolysins and related proteins containing CBS domains [General function prediction only]	NA|479aa|up_3|NC_012490.1_3332147_3333584_-	PRK07807, PRK07807, GuaB1 family IMP dehydrogenase-related protein	NA|294aa|up_2|NC_012490.1_3333587_3334469_-	NA	NA|501aa|up_1|NC_012490.1_3334473_3335976_-	COG0513, SrmB, Superfamily II DNA and RNA helicases [DNA replication, recombination, and repair / Transcription / Translation, ribosomal structure and biogenesis]	NA|486aa|up_0|NC_012490.1_3336038_3337496_-	PRK09287, PRK09287, NADP-dependent phosphogluconate dehydrogenase	NA|318aa|down_0|NC_012490.1_3339942_3340896_-	cd07326, M56_BlaR1_MecR1_like, Peptidase M56-like including those in BlaR1 and MecR1, integral membrane metallopeptidase	NA|138aa|down_1|NC_012490.1_3340921_3341335_-	COG3682, COG3682, Predicted transcriptional regulator [Transcription]	NA|858aa|down_2|NC_012490.1_3341526_3344100_+	pfam09924, DUF2156, Uncharacterized conserved protein (DUF2156)	NA|284aa|down_3|NC_012490.1_3344110_3344962_-	COG1120, FepC, ABC-type cobalamin/Fe3+-siderophores transport systems, ATPase components [Inorganic ion transport and metabolism / Coenzyme metabolism]	NA|364aa|down_4|NC_012490.1_3344958_3346050_-	COG4779, FepG, ABC-type enterobactin transport system, permease component [Inorganic ion transport and metabolism]	NA|487aa|down_5|NC_012490.1_3346046_3347507_-	PRK10441, PRK10441, Fe(3+)-siderophore ABC transporter permease	NA|261aa|down_6|NC_012490.1_3347709_3348492_+	NA	NA|143aa|down_7|NC_012490.1_3348728_3349157_+	cd03443, PaaI_thioesterase, PaaI_thioesterase is a tetrameric acyl-CoA thioesterase with a hot dog fold and one of several proteins responsible for phenylacetic acid (PA) degradation in bacteria	NA|472aa|down_8|NC_012490.1_3349244_3350660_-	COG1252, Ndh, NADH dehydrogenase, FAD-containing subunit [Energy production and conversion]	csa3|255aa|down_9|NC_012490.1_3351103_3351868_+	cd08893, SRPBCC_CalC_Aha1-like_GntR-HTH, Putative hydrophobic ligand-binding SRPBCC domain of an uncharacterized subgroup of CalC- and Aha1-like proteins; some contain an N-terminal GntR family winged HTH DNA-binding domain
GCF_000010105.1_ASM1010v1	NC_012490	Rhodococcus erythropolis PR4, complete genome	4	3429180-3429259	3	CRISPRCasFinder	no	WYL,cas4	cas3,WYL,csa3,cas4,DEDDh,DinG,Cas9_archaeal,RT	Unclear	CCCCACGGCTGTTGCTGGCCGGG	23	0	0	NA	NA	NA	1	1	Unclear	cas3,WYL,csa3,cas4,DEDDh,DinG,Cas9_archaeal,RT,csf1gr8,csf4gr11,csf2gr7,csf3gr5,PD-DExK	NA,NA	NA|120aa|up_9|NC_012490.1_3420159_3420519_-	cd07238, VOC_like, uncharacterized subfamily of vicinal oxygen chelate (VOC) family	NA|214aa|up_8|NC_012490.1_3420529_3421171_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|322aa|up_7|NC_012490.1_3421330_3422296_-	cd06225, HAMP, Histidine kinase, Adenylyl cyclase, Methyl-accepting protein, and Phosphatase (HAMP) domain	NA|249aa|up_6|NC_012490.1_3422396_3423143_-	PRK08057, PRK08057, cobalt-precorrin-6x reductase; Reviewed	NA|250aa|up_5|NC_012490.1_3423166_3423916_-	COG2875, CobM, Precorrin-4 methylase [Coenzyme metabolism]	NA|428aa|up_4|NC_012490.1_3423912_3425196_-	COG2242, CobL, Precorrin-6B methylase 2 [Coenzyme metabolism]	NA|254aa|up_3|NC_012490.1_3425192_3425954_-	PRK05599, PRK05599, SDR family oxidoreductase	NA|142aa|up_2|NC_012490.1_3425984_3426410_+	TIGR03618, Rv1155_F420, PPOX class probable F420-dependent enzyme	NA|379aa|up_1|NC_012490.1_3426410_3427547_-	COG0006, PepP, Xaa-Pro aminopeptidase [Amino acid transport and metabolism]	NA|322aa|up_0|NC_012490.1_3427584_3428550_+	smart00475, 53EXOc, 5'-3' exonuclease	NA|904aa|down_0|NC_012490.1_3429440_3432152_-	COG4581, COG4581, Superfamily II RNA helicase [DNA replication, recombination, and repair]	NA|343aa|down_1|NC_012490.1_3432200_3433229_-	pfam00902, TatC, Sec-independent protein translocase protein (TatC)	NA|92aa|down_2|NC_012490.1_3433302_3433578_-	PRK00575, tatA, Sec-independent protein translocase subunit TatA	WYL|326aa|down_3|NC_012490.1_3433712_3434690_-	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	WYL|338aa|down_4|NC_012490.1_3434689_3435703_-	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	NA|448aa|down_5|NC_012490.1_3435813_3437157_-	TIGR03686, pupylate_PafA, Pup--protein ligase	NA|473aa|down_6|NC_012490.1_3437316_3438735_+	smart00046, DAGKc, Diacylglycerol kinase catalytic domain (presumed)	NA|255aa|down_7|NC_012490.1_3438772_3439537_-	TIGR03691, 20S_bact_alpha, proteasome, alpha subunit, bacterial type	NA|293aa|down_8|NC_012490.1_3439533_3440412_-	TIGR03690, 20S_bact_beta, proteasome, beta subunit, bacterial type	NA|65aa|down_9|NC_012490.1_3440408_3440603_-	pfam05639, Pup, Pup-like protein
GCF_000010105.1_ASM1010v1	NC_012490	Rhodococcus erythropolis PR4, complete genome	5	4466297-4466430	4	CRISPRCasFinder	no		cas3,WYL,csa3,cas4,DEDDh,DinG,Cas9_archaeal,RT	Orphan	CGTTCGGTCGATCTGAGGCGACGAATGTACCGTTCGCTCGAA	42	0	0	NA	NA	NA	1	1	Orphan	cas3,WYL,csa3,cas4,DEDDh,DinG,Cas9_archaeal,RT,csf1gr8,csf4gr11,csf2gr7,csf3gr5,PD-DExK	NA,NA|94aa|down_4|NC_012490.1_4481714_4481996_-,NA|142aa|down_6|NC_012490.1_4486125_4486551_-,NA|257aa|down_8|NC_012490.1_4487684_4488455_-,NA|410aa|down_9|NC_012490.1_4488591_4489821_-	NA|498aa|up_9|NC_012490.1_4451869_4453363_+	pfam11380, Stealth_CR2, Stealth protein CR2, conserved region 2	NA|456aa|up_8|NC_012490.1_4453414_4454782_-	TIGR03860, FMN_nitrolo, FMN-dependent oxidoreductase, nitrilotriacetate monooxygenase family	NA|449aa|up_7|NC_012490.1_4454802_4456149_-	TIGR03860, FMN_nitrolo, FMN-dependent oxidoreductase, nitrilotriacetate monooxygenase family	NA|302aa|up_6|NC_012490.1_4456323_4457229_-	cd07402, MPP_GpdQ, Enterobacter aerogenes GpdQ and related proteins, metallophosphatase domain	NA|458aa|up_5|NC_012490.1_4457568_4458942_+	pfam00375, SDF, Sodium:dicarboxylate symporter family	NA|120aa|up_4|NC_012490.1_4459114_4459474_+	pfam05901, Excalibur, Excalibur calcium-binding domain	NA|373aa|up_3|NC_012490.1_4459526_4460645_-	COG0627, COG0627, Predicted esterase [General function prediction only]	NA|1061aa|up_2|NC_012490.1_4460756_4463939_+	cd18012, DEXQc_arch_SWI2_SNF2, DEAQ-box helicase domain of archaeal and bacterial SNF2-related proteins	NA|192aa|up_1|NC_012490.1_4464052_4464628_+	pfam02342, TerD, TerD domain	NA|463aa|up_0|NC_012490.1_4464710_4466099_-	pfam07929, PRiA4_ORF3, Plasmid pRiA4b ORF-3-like protein	NA|137aa|down_0|NC_012490.1_4472423_4472834_+	COG3607, COG3607, Predicted lactoylglutathione lyase [General function prediction only]	NA|325aa|down_1|NC_012490.1_4472906_4473881_-	PRK08241, PRK08241, RNA polymerase subunit sigma-70	NA|244aa|down_2|NC_012490.1_4473934_4474666_-	pfam08445, FR47, FR47-like protein	NA|1828aa|down_3|NC_012490.1_4476161_4481645_+	COG4770, COG4770, Acetyl/propionyl-CoA carboxylase, alpha subunit [Lipid metabolism]	NA|94aa|down_4|NC_012490.1_4481714_4481996_-	NA	NA|1373aa|down_5|NC_012490.1_4482007_4486126_-	cd07539, P-type_ATPase, uncharacterized subfamily of P-type ATPase transporters	NA|142aa|down_6|NC_012490.1_4486125_4486551_-	NA	NA|316aa|down_7|NC_012490.1_4486734_4487682_+	cd19081, AKR_AKR9C1, AKR9C family of aldo-keto reductase (AKR)	NA|257aa|down_8|NC_012490.1_4487684_4488455_-	NA	NA|410aa|down_9|NC_012490.1_4488591_4489821_-	NA
