assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCA_004011905.1_ASM401190v1	CP027114	Gordonia alkanivorans strain YC-RL2 chromosome, complete genome	1	319947-320106	1	CRISPRCasFinder	no		csa3,WYL,DEDDh,cas4,DinG,cas3	Orphan	TCGACAGTCTCGGCGAGCCTCGACTGGG	28	0	0	NA	NA	NA	2	2	Orphan	csa3,WYL,DEDDh,cas4,DinG,cas3	NA|210aa|up_9|CP027114.1_310973_311603_+,NA|394aa|up_8|CP027114.1_311641_312823_-,NA|248aa|up_6|CP027114.1_313719_314463_-,NA|318aa|down_5|CP027114.1_324928_325882_+,NA|248aa|down_9|CP027114.1_329903_330647_-	NA|210aa|up_9|CP027114.1_310973_311603_+	NA	NA|394aa|up_8|CP027114.1_311641_312823_-	NA	NA|292aa|up_7|CP027114.1_312819_313695_-	cd07581, nitrilase_3, Uncharacterized subgroup of the nitrilase superfamily (putative class 13 nitrilases)	NA|248aa|up_6|CP027114.1_313719_314463_-	NA	NA|170aa|up_5|CP027114.1_314519_315029_-	pfam10698, DUF2505, Protein of unknown function (DUF2505)	NA|169aa|up_4|CP027114.1_315039_315546_-	pfam10698, DUF2505, Protein of unknown function (DUF2505)	NA|374aa|up_3|CP027114.1_315584_316706_+	PRK13903, murB, UDP-N-acetylmuramate dehydrogenase	NA|365aa|up_2|CP027114.1_316727_317822_-	COG0596, MhpC, Predicted hydrolases or acyltransferases (alpha/beta hydrolase superfamily) [General function prediction only]	NA|276aa|up_1|CP027114.1_317882_318710_-	cd04778, HTH_MerR-like_sg2, Helix-Turn-Helix DNA binding domain of putative transcription regulators from the MerR superfamily	NA|108aa|up_0|CP027114.1_318716_319040_-	pfam10724, DUF2516, Protein of unknown function (DUF2516)	NA|178aa|down_0|CP027114.1_320244_320778_-	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|447aa|down_1|CP027114.1_320893_322234_-	COG2733, COG2733, Predicted membrane protein [Function unknown]	NA|268aa|down_2|CP027114.1_322272_323076_+	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|276aa|down_3|CP027114.1_323072_323900_+	cd09763, DHRS1-like_SDR_c, human dehydrogenase/reductase (SDR family) member 1 (DHRS1) -like, classical (c) SDRs	NA|284aa|down_4|CP027114.1_323896_324748_+	TIGR03709, PPK2_rel_1, polyphosphate:nucleotide phosphotransferase, PPK2 family	NA|318aa|down_5|CP027114.1_324928_325882_+	NA	NA|261aa|down_6|CP027114.1_326050_326833_-	PRK14900, valS, valyl-tRNA synthetase; Provisional	NA|296aa|down_7|CP027114.1_327085_327973_-	PRK07819, PRK07819, 3-hydroxybutyryl-CoA dehydrogenase; Validated	NA|432aa|down_8|CP027114.1_328136_329432_-	PRK15063, PRK15063, isocitrate lyase; Provisional	NA|248aa|down_9|CP027114.1_329903_330647_-	NA
GCA_004011905.1_ASM401190v1	CP027114	Gordonia alkanivorans strain YC-RL2 chromosome, complete genome	2	1748359-1748547	2	CRISPRCasFinder	no		csa3,WYL,DEDDh,cas4,DinG,cas3	Orphan	GACGCACCCAGCTCCGATGCCTGAGGTGCGAGGAGCGCAAGCG	43	1	1	1748402-1748435	CP027114.1_1748548-1748581	NA	2	2	Orphan	csa3,WYL,DEDDh,cas4,DinG,cas3	NA|390aa|up_6|CP027114.1_1741115_1742285_+,NA|262aa|up_5|CP027114.1_1742418_1743204_+,NA|152aa|down_4|CP027114.1_1752015_1752471_+	NA|124aa|up_9|CP027114.1_1739547_1739919_+	pfam02152, FolB, Dihydroneopterin aldolase	NA|176aa|up_8|CP027114.1_1739915_1740443_+	COG0801, FolK, 7,8-dihydro-6-hydroxymethylpterin-pyrophosphokinase [Coenzyme metabolism]	NA|172aa|up_7|CP027114.1_1740439_1740955_+	pfam11377, DUF3180, Protein of unknown function (DUF3180)	NA|390aa|up_6|CP027114.1_1741115_1742285_+	NA	NA|262aa|up_5|CP027114.1_1742418_1743204_+	NA	NA|479aa|up_4|CP027114.1_1743223_1744660_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|351aa|up_3|CP027114.1_1744961_1746014_+	COG5495, COG5495, Uncharacterized conserved protein [Function unknown]	NA|315aa|up_2|CP027114.1_1746067_1747012_+	PRK00380, panC, pantoate--beta-alanine ligase; Reviewed	NA|147aa|up_1|CP027114.1_1747014_1747455_+	pfam02261, Asp_decarbox, Aspartate decarboxylase	NA|268aa|up_0|CP027114.1_1747482_1748286_+	PRK13318, PRK13318, type III pantothenate kinase	NA|196aa|down_0|CP027114.1_1748588_1749176_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|284aa|down_1|CP027114.1_1749356_1750208_+	COG2267, PldB, Lysophospholipase [Lipid metabolism]	NA|168aa|down_2|CP027114.1_1750187_1750691_-	pfam17940, TetR_C_31, Tetracyclin repressor-like, C-terminal domain	NA|374aa|down_3|CP027114.1_1750740_1751862_+	PRK06753, PRK06753, hypothetical protein; Provisional	NA|152aa|down_4|CP027114.1_1752015_1752471_+	NA	NA|528aa|down_5|CP027114.1_1752528_1754112_+	PRK00484, lysS, lysyl-tRNA synthetase; Reviewed	NA|256aa|down_6|CP027114.1_1754136_1754904_-	pfam18741, MTES_1575, REase_MTES_1575	NA|527aa|down_7|CP027114.1_1755054_1756635_-	PRK07656, PRK07656, long-chain-fatty-acid--CoA ligase; Validated	NA|420aa|down_8|CP027114.1_1756677_1757937_+	cd01152, ACAD_fadE6_17_26, Putative acyl-CoA dehydrogenases similar to fadE6, fadE17, and fadE26	NA|275aa|down_9|CP027114.1_1757937_1758762_+	PRK07831, PRK07831, SDR family oxidoreductase
GCA_004011905.1_ASM401190v1	CP027114	Gordonia alkanivorans strain YC-RL2 chromosome, complete genome	3	3367084-3367144	3	CRISPRCasFinder	no		csa3,WYL,DEDDh,cas4,DinG,cas3	Orphan	CGCTCCCTGAGGTGCGAGGAGCG	23	0	0	NA	NA	NA	1	1	Orphan	csa3,WYL,DEDDh,cas4,DinG,cas3	NA,NA	NA|465aa|up_9|CP027114.1_3357276_3358671_+	COG2124, CypX, Cytochrome P450 [Secondary metabolites biosynthesis, transport, and catabolism]	NA|200aa|up_8|CP027114.1_3358895_3359495_-	COG0545, FkpA, FKBP-type peptidyl-prolyl cis-trans isomerases 1 [Posttranslational modification, protein turnover, chaperones]	NA|156aa|up_7|CP027114.1_3359530_3359998_-	cd08865, SRPBCC_10, Ligand-binding SRPBCC domain of an uncharacterized subfamily of proteins	NA|345aa|up_6|CP027114.1_3359997_3361032_-	TIGR03559, F420_Rv3520c, probable F420-dependent oxidoreductase, Rv3520c family	NA|138aa|up_5|CP027114.1_3361028_3361442_-	pfam12680, SnoaL_2, SnoaL-like domain	NA|337aa|up_4|CP027114.1_3361407_3362418_-	TIGR00950, Uncharacterized_inner_membrane_transporter_YicL, Carboxylate/Amino Acid/Amine Transporter	NA|376aa|up_3|CP027114.1_3362414_3363542_-	TIGR04047, MSMEG_0565_glyc, glycosyltransferase, MSMEG_0565 family	NA|288aa|up_2|CP027114.1_3363538_3364402_-	cd07197, nitrilase, Nitrilase superfamily, including nitrile- or amide-hydrolyzing enzymes and amide-condensing enzymes	NA|484aa|up_1|CP027114.1_3364454_3365906_-	TIGR04050, MSMEG_0567_Cter, AIR synthase-related protein, MSMEG_0567 C-terminal family	NA|352aa|up_0|CP027114.1_3365906_3366962_-	TIGR04043, hypothetical_protein_WH5701_02349, radical SAM protein, MSMEG_0568 family	NA|424aa|down_0|CP027114.1_3367194_3368466_-	TIGR04046, predicted_flavoprotein_involved_in_K+_transport, flavin-dependent oxidoreductase, MSMEG_0569 family	NA|106aa|down_1|CP027114.1_3368462_3368780_-	TIGR04042, conserved_hypothetical_protein, MSMEG_0570 family protein	NA|300aa|down_2|CP027114.1_3368772_3369672_-	cd07197, nitrilase, Nitrilase superfamily, including nitrile- or amide-hydrolyzing enzymes and amide-condensing enzymes	NA|175aa|down_3|CP027114.1_3369711_3370236_-	TIGR04044, MSMEG_0572_fam, MSMEG_0572 family protein	NA|229aa|down_4|CP027114.1_3370744_3371431_+	COG0428, COG0428, Predicted divalent heavy-metal cations transporter [Inorganic ion transport and metabolism]	NA|372aa|down_5|CP027114.1_3371441_3372557_-	pfam07859, Abhydrolase_3, alpha/beta hydrolase fold	NA|507aa|down_6|CP027114.1_3372682_3374203_+	pfam11855, DUF3375, Protein of unknown function (DUF3375)	NA|303aa|down_7|CP027114.1_3374400_3375309_+	pfam13835, DUF4194, Domain of unknown function (DUF4194)	NA|1114aa|down_8|CP027114.1_3375302_3378644_+	COG4913, COG4913, Uncharacterized protein conserved in bacteria [Function unknown]	NA|973aa|down_9|CP027114.1_3378915_3381834_-	cd17932, DEXQc_UvrD, DEXQD-box helicase domain of UvrD
GCA_004011905.1_ASM401190v1	CP027114	Gordonia alkanivorans strain YC-RL2 chromosome, complete genome	4	3920623-3920742	4	CRISPRCasFinder	no		csa3,WYL,DEDDh,cas4,DinG,cas3	Orphan	GTGGTCTGCTCAACGCCTCCGGCGTCAGTGGTCTGCTC	38	0	0	NA	NA	NA	1	1	Orphan	csa3,WYL,DEDDh,cas4,DinG,cas3	NA|155aa|up_1|CP027114.1_3919229_3919694_-,NA	NA|250aa|up_9|CP027114.1_3910278_3911028_-	TIGR03206, benzo_BadH, 2-hydroxycyclohexanecarboxyl-CoA dehydrogenase	NA|264aa|up_8|CP027114.1_3911061_3911853_-	PRK07396, PRK07396, dihydroxynaphthoic acid synthetase; Validated	NA|470aa|up_7|CP027114.1_3912085_3913495_+	PRK15067, PRK15067, ethanolamine ammonia-lyase subunit EutB	NA|267aa|up_6|CP027114.1_3913491_3914292_+	PRK05465, PRK05465, ethanolamine ammonia-lyase subunit EutC	NA|112aa|up_5|CP027114.1_3914313_3914649_-	pfam09851, SHOCT, Short C-terminal domain	NA|146aa|up_4|CP027114.1_3914662_3915100_-	pfam06897, DUF1269, Protein of unknown function (DUF1269)	NA|613aa|up_3|CP027114.1_3915096_3916935_-	COG1022, FAA1, Long-chain acyl-CoA synthetases (AMP-forming) [Lipid metabolism]	NA|661aa|up_2|CP027114.1_3917045_3919028_-	COG4178, COG4178, ABC-type uncharacterized transport system, permease and ATPase components [General function prediction only]	NA|155aa|up_1|CP027114.1_3919229_3919694_-	NA	NA|293aa|up_0|CP027114.1_3919704_3920583_-	COG1946, TesB, Acyl-CoA thioesterase [Lipid metabolism]	NA|502aa|down_0|CP027114.1_3922337_3923843_-	PRK12810, gltD, glutamate synthase subunit beta; Reviewed	NA|1524aa|down_1|CP027114.1_3923835_3928407_-	PRK11750, gltB, glutamate synthase subunit alpha; Provisional	NA|549aa|down_2|CP027114.1_3928744_3930391_-	PRK13108, PRK13108, prolipoprotein diacylglyceryl transferase; Reviewed	NA|270aa|down_3|CP027114.1_3930515_3931325_-	PRK13111, trpA, tryptophan synthase subunit alpha; Provisional	NA|444aa|down_4|CP027114.1_3931321_3932653_-	PRK04346, PRK04346, tryptophan synthase subunit beta; Validated	NA|273aa|down_5|CP027114.1_3932714_3933533_-	PRK00278, trpC, indole-3-glycerol phosphate synthase TrpC	NA|262aa|down_6|CP027114.1_3933714_3934500_-	pfam09534, Trp_oprn_chp, Tryptophan-associated transmembrane protein (Trp_oprn_chp)	NA|531aa|down_7|CP027114.1_3934496_3936089_-	PRK13571, PRK13571, anthranilate synthase component I; Provisional	NA|60aa|down_8|CP027114.1_3936085_3936265_-	COG1942, COG1942, Uncharacterized protein, 4-oxalocrotonate tautomerase homolog [General function prediction only]	NA|124aa|down_9|CP027114.1_3936304_3936676_-	PRK00051, hisI, phosphoribosyl-AMP cyclohydrolase; Reviewed
GCA_004011905.1_ASM401190v1	CP027114	Gordonia alkanivorans strain YC-RL2 chromosome, complete genome	5	4309397-4309489	5	CRISPRCasFinder	no		csa3,WYL,DEDDh,cas4,DinG,cas3	Orphan	CTCGCTACGCTCCCGGCGCGGAC	23	0	0	NA	NA	NA	1	1	Orphan	csa3,WYL,DEDDh,cas4,DinG,cas3	NA|60aa|up_5|CP027114.1_4303664_4303844_+,NA|69aa|up_1|CP027114.1_4307698_4307905_+,NA|407aa|down_4|CP027114.1_4315677_4316898_-	NA|332aa|up_9|CP027114.1_4298583_4299579_+	PRK09479, glpX, fructose 1,6-bisphosphatase II; Reviewed	NA|566aa|up_8|CP027114.1_4299697_4301395_+	PRK15389, PRK15389, fumarate hydratase; Provisional	NA|471aa|up_7|CP027114.1_4301402_4302815_+	PRK00485, fumC, fumarate hydratase; Reviewed	NA|228aa|up_6|CP027114.1_4302828_4303512_+	COG2120, COG2120, Uncharacterized proteins, LmbE homologs [Function unknown]	NA|60aa|up_5|CP027114.1_4303664_4303844_+	NA	NA|576aa|up_4|CP027114.1_4303872_4305600_-	COG4585, COG4585, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|216aa|up_3|CP027114.1_4305846_4306494_+	COG2197, CitB, Response regulator containing a CheY-like receiver domain and an HTH DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|292aa|up_2|CP027114.1_4306677_4307553_+	pfam00582, Usp, Universal stress protein family	NA|69aa|up_1|CP027114.1_4307698_4307905_+	NA	NA|316aa|up_0|CP027114.1_4307891_4308839_-	COG3786, COG3786, Uncharacterized protein conserved in bacteria [Function unknown]	NA|340aa|down_0|CP027114.1_4311245_4312265_+	pfam00665, rve, Integrase core domain	NA|291aa|down_1|CP027114.1_4312261_4313134_-	cd01050, Acyl_ACP_Desat, Acyl ACP desaturase, ferritin-like diiron-binding domain	NA|426aa|down_2|CP027114.1_4313202_4314480_-	PRK00011, glyA, serine hydroxymethyltransferase; Reviewed	NA|340aa|down_3|CP027114.1_4314638_4315658_+	pfam00665, rve, Integrase core domain	NA|407aa|down_4|CP027114.1_4315677_4316898_-	NA	NA|314aa|down_5|CP027114.1_4317024_4317966_+	PRK05439, PRK05439, pantothenate kinase; Provisional	NA|191aa|down_6|CP027114.1_4317986_4318559_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|388aa|down_7|CP027114.1_4318630_4319794_+	cd01159, NcnH, Naphthocyclinone hydroxylase	NA|153aa|down_8|CP027114.1_4319884_4320343_-	COG2128, COG2128, Uncharacterized conserved protein [Function unknown]	NA|265aa|down_9|CP027114.1_4320369_4321164_-	cd05271, NDUFA9_like_SDR_a, NADH dehydrogenase (ubiquinone) 1 alpha subcomplex, subunit 9, 39 kDa, (NDUFA9) -like, atypical (a) SDRs
