assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	1	396249-396507	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no	csb1gr7,csb2gr5,cas3,csb3,cas1	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Unclear	GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC,GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC,GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC	36,36,36	0	0	NA	NA	NA:NA:NA	3,3,3	3	Unclear	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA,NA|201aa|down_6|LR026975.1_408049_408652_+	NA|161aa|up_9|LR026975.1_382423_382906_+	TIGR01575, rimI, ribosomal-protein-alanine acetyltransferase	NA|342aa|up_8|LR026975.1_382902_383928_+	PRK09604, PRK09604, tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex transferase subunit TsaD	NA|184aa|up_7|LR026975.1_383924_384476_+	pfam13577, SnoaL_4, SnoaL-like domain	NA|101aa|up_6|LR026975.1_384640_384943_+	PRK00364, groES, co-chaperonin GroES; Reviewed	NA|540aa|up_5|LR026975.1_385019_386639_+	PRK12849, groEL, chaperonin GroEL; Reviewed	csb1gr7|351aa|up_4|LR026975.1_387834_388887_+	pfam09617, Cas_GSU0053, CRISPR-associated protein GSU0053 (Cas_GSU0053)	csb2gr5|520aa|up_3|LR026975.1_388886_390446_+	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	cas3|884aa|up_2|LR026975.1_390442_393094_+	TIGR02621, CRISPR-associated_helicase_Cas3, CRISPR-associated helicase Cas3, subtype Dpsyc	csb3|353aa|up_1|LR026975.1_393090_394149_+	cd09764, Csb3_I-U, CRISPR/Cas system-associated RAMP superfamily protein Csb3	cas1|534aa|up_0|LR026975.1_394165_395767_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	NA|440aa|down_0|LR026975.1_396557_397877_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|down_1|LR026975.1_398703_400020_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|down_2|LR026975.1_400529_401846_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|440aa|down_3|LR026975.1_402426_403746_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|349aa|down_4|LR026975.1_405532_406579_+	COG4584, COG4584, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|440aa|down_5|LR026975.1_406668_407988_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|201aa|down_6|LR026975.1_408049_408652_+	NA	NA|266aa|down_7|LR026975.1_408653_409451_+	COG1484, DnaC, DNA replication protein [DNA replication, recombination, and repair]	NA|352aa|down_8|LR026975.1_410032_411088_+	PRK09261, PRK09261, phospho-2-dehydro-3-deoxyheptonate aldolase; Validated	NA|79aa|down_9|LR026975.1_411150_411387_-	pfam02467, Whib, Transcription factor WhiB
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	2	398042-398593	2,2,2	PILER-CR,CRISPRCasFinder,CRT	no	csb1gr7,csb2gr5,cas3,csb3,cas1	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Unclear	GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC,GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC,GGTGCGGTTCCTTCNNNNNGGGAGCCGCTCTTCATTGAGGC	36,36,41	0	0	NA	NA	NA:NA:NA	6,6,7	7	Unclear	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA,NA|201aa|down_5|LR026975.1_408049_408652_+,NA|264aa|down_9|LR026975.1_411825_412617_+	NA|342aa|up_9|LR026975.1_382902_383928_+	PRK09604, PRK09604, tRNA (adenosine(37)-N6)-threonylcarbamoyltransferase complex transferase subunit TsaD	NA|184aa|up_8|LR026975.1_383924_384476_+	pfam13577, SnoaL_4, SnoaL-like domain	NA|101aa|up_7|LR026975.1_384640_384943_+	PRK00364, groES, co-chaperonin GroES; Reviewed	NA|540aa|up_6|LR026975.1_385019_386639_+	PRK12849, groEL, chaperonin GroEL; Reviewed	csb1gr7|351aa|up_5|LR026975.1_387834_388887_+	pfam09617, Cas_GSU0053, CRISPR-associated protein GSU0053 (Cas_GSU0053)	csb2gr5|520aa|up_4|LR026975.1_388886_390446_+	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	cas3|884aa|up_3|LR026975.1_390442_393094_+	TIGR02621, CRISPR-associated_helicase_Cas3, CRISPR-associated helicase Cas3, subtype Dpsyc	csb3|353aa|up_2|LR026975.1_393090_394149_+	cd09764, Csb3_I-U, CRISPR/Cas system-associated RAMP superfamily protein Csb3	cas1|534aa|up_1|LR026975.1_394165_395767_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	NA|440aa|up_0|LR026975.1_396557_397877_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|down_0|LR026975.1_398703_400020_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|down_1|LR026975.1_400529_401846_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|440aa|down_2|LR026975.1_402426_403746_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|349aa|down_3|LR026975.1_405532_406579_+	COG4584, COG4584, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|440aa|down_4|LR026975.1_406668_407988_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|201aa|down_5|LR026975.1_408049_408652_+	NA	NA|266aa|down_6|LR026975.1_408653_409451_+	COG1484, DnaC, DNA replication protein [DNA replication, recombination, and repair]	NA|352aa|down_7|LR026975.1_410032_411088_+	PRK09261, PRK09261, phospho-2-dehydro-3-deoxyheptonate aldolase; Validated	NA|79aa|down_8|LR026975.1_411150_411387_-	pfam02467, Whib, Transcription factor WhiB	NA|264aa|down_9|LR026975.1_411825_412617_+	NA
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	3	400051-400448	3,3,3	CRISPRCasFinder,CRT,PILER-CR	no	csb1gr7,csb2gr5,cas3,csb3,cas1	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Unclear	GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC,GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC,GCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC	36,36,33	0	0	NA	NA	NA:NA:NA	5,5,5	5	Unclear	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA,NA|201aa|down_4|LR026975.1_408049_408652_+,NA|264aa|down_8|LR026975.1_411825_412617_+	NA|184aa|up_9|LR026975.1_383924_384476_+	pfam13577, SnoaL_4, SnoaL-like domain	NA|101aa|up_8|LR026975.1_384640_384943_+	PRK00364, groES, co-chaperonin GroES; Reviewed	NA|540aa|up_7|LR026975.1_385019_386639_+	PRK12849, groEL, chaperonin GroEL; Reviewed	csb1gr7|351aa|up_6|LR026975.1_387834_388887_+	pfam09617, Cas_GSU0053, CRISPR-associated protein GSU0053 (Cas_GSU0053)	csb2gr5|520aa|up_5|LR026975.1_388886_390446_+	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	cas3|884aa|up_4|LR026975.1_390442_393094_+	TIGR02621, CRISPR-associated_helicase_Cas3, CRISPR-associated helicase Cas3, subtype Dpsyc	csb3|353aa|up_3|LR026975.1_393090_394149_+	cd09764, Csb3_I-U, CRISPR/Cas system-associated RAMP superfamily protein Csb3	cas1|534aa|up_2|LR026975.1_394165_395767_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	NA|440aa|up_1|LR026975.1_396557_397877_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|up_0|LR026975.1_398703_400020_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|down_0|LR026975.1_400529_401846_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|440aa|down_1|LR026975.1_402426_403746_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|349aa|down_2|LR026975.1_405532_406579_+	COG4584, COG4584, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|440aa|down_3|LR026975.1_406668_407988_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|201aa|down_4|LR026975.1_408049_408652_+	NA	NA|266aa|down_5|LR026975.1_408653_409451_+	COG1484, DnaC, DNA replication protein [DNA replication, recombination, and repair]	NA|352aa|down_6|LR026975.1_410032_411088_+	PRK09261, PRK09261, phospho-2-dehydro-3-deoxyheptonate aldolase; Validated	NA|79aa|down_7|LR026975.1_411150_411387_-	pfam02467, Whib, Transcription factor WhiB	NA|264aa|down_8|LR026975.1_411825_412617_+	NA	NA|193aa|down_9|LR026975.1_412707_413286_+	PRK09648, PRK09648, RNA polymerase sigma factor ShbA
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	4	401981-402376	4,4,4	CRISPRCasFinder,CRT,PILER-CR	no	csb1gr7,csb2gr5,cas3,csb3,cas1	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Unclear	GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC,GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC,GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC	36,36,36	0	0	NA	NA	NA:NA:NA	5,5,5	5	Unclear	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA,NA|201aa|down_3|LR026975.1_408049_408652_+,NA|264aa|down_7|LR026975.1_411825_412617_+	NA|101aa|up_9|LR026975.1_384640_384943_+	PRK00364, groES, co-chaperonin GroES; Reviewed	NA|540aa|up_8|LR026975.1_385019_386639_+	PRK12849, groEL, chaperonin GroEL; Reviewed	csb1gr7|351aa|up_7|LR026975.1_387834_388887_+	pfam09617, Cas_GSU0053, CRISPR-associated protein GSU0053 (Cas_GSU0053)	csb2gr5|520aa|up_6|LR026975.1_388886_390446_+	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	cas3|884aa|up_5|LR026975.1_390442_393094_+	TIGR02621, CRISPR-associated_helicase_Cas3, CRISPR-associated helicase Cas3, subtype Dpsyc	csb3|353aa|up_4|LR026975.1_393090_394149_+	cd09764, Csb3_I-U, CRISPR/Cas system-associated RAMP superfamily protein Csb3	cas1|534aa|up_3|LR026975.1_394165_395767_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	NA|440aa|up_2|LR026975.1_396557_397877_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|up_1|LR026975.1_398703_400020_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|up_0|LR026975.1_400529_401846_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|440aa|down_0|LR026975.1_402426_403746_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|349aa|down_1|LR026975.1_405532_406579_+	COG4584, COG4584, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|440aa|down_2|LR026975.1_406668_407988_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|201aa|down_3|LR026975.1_408049_408652_+	NA	NA|266aa|down_4|LR026975.1_408653_409451_+	COG1484, DnaC, DNA replication protein [DNA replication, recombination, and repair]	NA|352aa|down_5|LR026975.1_410032_411088_+	PRK09261, PRK09261, phospho-2-dehydro-3-deoxyheptonate aldolase; Validated	NA|79aa|down_6|LR026975.1_411150_411387_-	pfam02467, Whib, Transcription factor WhiB	NA|264aa|down_7|LR026975.1_411825_412617_+	NA	NA|193aa|down_8|LR026975.1_412707_413286_+	PRK09648, PRK09648, RNA polymerase sigma factor ShbA	NA|409aa|down_9|LR026975.1_413278_414505_+	pfam16751, RsdA_SigD_bd, Anti-sigma-D factor RsdA to sigma factor binding region
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	5	403908-405326	5,5,5	PILER-CR,CRISPRCasFinder,CRT	no	csb1gr7,csb2gr5,cas3,csb3,cas1	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Unclear	GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC,GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC,GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGC	36,36,36	1	1	404967-405005	LR026975.1_2981066-2981028	NA:NA:NA	19,19,19	19	Unclear	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA,NA|201aa|down_2|LR026975.1_408049_408652_+,NA|264aa|down_6|LR026975.1_411825_412617_+	NA|540aa|up_9|LR026975.1_385019_386639_+	PRK12849, groEL, chaperonin GroEL; Reviewed	csb1gr7|351aa|up_8|LR026975.1_387834_388887_+	pfam09617, Cas_GSU0053, CRISPR-associated protein GSU0053 (Cas_GSU0053)	csb2gr5|520aa|up_7|LR026975.1_388886_390446_+	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	cas3|884aa|up_6|LR026975.1_390442_393094_+	TIGR02621, CRISPR-associated_helicase_Cas3, CRISPR-associated helicase Cas3, subtype Dpsyc	csb3|353aa|up_5|LR026975.1_393090_394149_+	cd09764, Csb3_I-U, CRISPR/Cas system-associated RAMP superfamily protein Csb3	cas1|534aa|up_4|LR026975.1_394165_395767_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	NA|440aa|up_3|LR026975.1_396557_397877_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|up_2|LR026975.1_398703_400020_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|up_1|LR026975.1_400529_401846_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|440aa|up_0|LR026975.1_402426_403746_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|349aa|down_0|LR026975.1_405532_406579_+	COG4584, COG4584, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|440aa|down_1|LR026975.1_406668_407988_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|201aa|down_2|LR026975.1_408049_408652_+	NA	NA|266aa|down_3|LR026975.1_408653_409451_+	COG1484, DnaC, DNA replication protein [DNA replication, recombination, and repair]	NA|352aa|down_4|LR026975.1_410032_411088_+	PRK09261, PRK09261, phospho-2-dehydro-3-deoxyheptonate aldolase; Validated	NA|79aa|down_5|LR026975.1_411150_411387_-	pfam02467, Whib, Transcription factor WhiB	NA|264aa|down_6|LR026975.1_411825_412617_+	NA	NA|193aa|down_7|LR026975.1_412707_413286_+	PRK09648, PRK09648, RNA polymerase sigma factor ShbA	NA|409aa|down_8|LR026975.1_413278_414505_+	pfam16751, RsdA_SigD_bd, Anti-sigma-D factor RsdA to sigma factor binding region	NA|135aa|down_9|LR026975.1_414511_414916_-	pfam17252, DUF5319, Family of unknown function (DUF5319)
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	6	409511-409770	6,6	CRT,PILER-CR	no	cas3,csb3,cas1	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Unclear	TGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGCCCG,GGTGCGGTTCCTTCGGGAGCCGCTCTTCATTGAGGCCCGACGATGATCG	37,49	0	0	NA	NA	NA:NA	3,2	3	Unclear	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA|201aa|up_1|LR026975.1_408049_408652_+,NA|264aa|down_2|LR026975.1_411825_412617_+	csb3|353aa|up_9|LR026975.1_393090_394149_+	cd09764, Csb3_I-U, CRISPR/Cas system-associated RAMP superfamily protein Csb3	cas1|534aa|up_8|LR026975.1_394165_395767_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	NA|440aa|up_7|LR026975.1_396557_397877_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|up_6|LR026975.1_398703_400020_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|439aa|up_5|LR026975.1_400529_401846_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|440aa|up_4|LR026975.1_402426_403746_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|349aa|up_3|LR026975.1_405532_406579_+	COG4584, COG4584, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|440aa|up_2|LR026975.1_406668_407988_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|201aa|up_1|LR026975.1_408049_408652_+	NA	NA|266aa|up_0|LR026975.1_408653_409451_+	COG1484, DnaC, DNA replication protein [DNA replication, recombination, and repair]	NA|352aa|down_0|LR026975.1_410032_411088_+	PRK09261, PRK09261, phospho-2-dehydro-3-deoxyheptonate aldolase; Validated	NA|79aa|down_1|LR026975.1_411150_411387_-	pfam02467, Whib, Transcription factor WhiB	NA|264aa|down_2|LR026975.1_411825_412617_+	NA	NA|193aa|down_3|LR026975.1_412707_413286_+	PRK09648, PRK09648, RNA polymerase sigma factor ShbA	NA|409aa|down_4|LR026975.1_413278_414505_+	pfam16751, RsdA_SigD_bd, Anti-sigma-D factor RsdA to sigma factor binding region	NA|135aa|down_5|LR026975.1_414511_414916_-	pfam17252, DUF5319, Family of unknown function (DUF5319)	NA|514aa|down_6|LR026975.1_415216_416758_+	PRK05567, PRK05567, inosine 5'-monophosphate dehydrogenase; Reviewed	NA|380aa|down_7|LR026975.1_416775_417915_+	PRK08649, PRK08649, GuaB3 family IMP dehydrogenase-related protein	NA|520aa|down_8|LR026975.1_417926_419486_-	cd01456, vWA_ywmD_type, VWA ywmD type:Von Willebrand factor type A (vWA) domain was originally found in the blood coagulation protein von Willebrand factor (vWF)	NA|124aa|down_9|LR026975.1_419944_420316_+	pfam05154, TM2, TM2 domain
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	7	879291-879440	7,6	PILER-CR,CRISPRCasFinder	no		DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Orphan	GTGCTCCCCGCGCAGGCGGGGGTGATCC,GTGCTCCCCGCGCAGGCGGGGGTGATCC	28,28	0	0	NA	NA	I-E:I-E	2,2	2	Orphan	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA,NA	NA|280aa|up_9|LR026975.1_870333_871173_+	COG2159, COG2159, Predicted metal-dependent hydrolase of the TIM-barrel fold [General function prediction only]	NA|350aa|up_8|LR026975.1_871175_872225_+	cd00567, ACAD, Acyl-CoA dehydrogenase	NA|398aa|up_7|LR026975.1_872241_873435_+	cd01152, ACAD_fadE6_17_26, Putative acyl-CoA dehydrogenases similar to fadE6, fadE17, and fadE26	NA|353aa|up_6|LR026975.1_873438_874497_+	cd05228, AR_FR_like_1_SDR_e, uncharacterized subgroup of aldehyde reductase and flavonoid reductase related proteins, extended (e) SDRs	NA|169aa|up_5|LR026975.1_874493_875000_+	pfam13577, SnoaL_4, SnoaL-like domain	NA|275aa|up_4|LR026975.1_875004_875829_-	COG0596, MhpC, Predicted hydrolases or acyltransferases (alpha/beta hydrolase superfamily) [General function prediction only]	NA|382aa|up_3|LR026975.1_875964_877110_-	cd00829, SCP-x_thiolase, Thiolase domain associated with sterol carrier protein (SCP)-x isoform and related proteins; SCP-2  has multiple roles in intracellular lipid circulation and metabolism	NA|99aa|up_2|LR026975.1_877789_878086_+	pfam18019, HD_6, HD domain	NA|287aa|up_1|LR026975.1_878054_878915_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|103aa|up_0|LR026975.1_878911_879220_-	pfam01527, HTH_Tnp_1, Transposase	NA|408aa|down_0|LR026975.1_879610_880834_+	COG2124, CypX, Cytochrome P450 [Secondary metabolites biosynthesis, transport, and catabolism]	NA|724aa|down_1|LR026975.1_880830_883002_+	cd02762, MopB_1, The MopB_1 CD includes a group of related uncharacterized bacterial molybdopterin-binding oxidoreductase-like domains with a putative N-terminal iron-sulfur [4Fe-4S] cluster binding site and molybdopterin cofactor binding site	NA|409aa|down_2|LR026975.1_883003_884230_-	pfam02515, CoA_transf_3, CoA-transferase family III	NA|400aa|down_3|LR026975.1_884519_885719_-	COG2124, CypX, Cytochrome P450 [Secondary metabolites biosynthesis, transport, and catabolism]	NA|263aa|down_4|LR026975.1_885777_886566_-	cd05328, 3alpha_HSD_SDR_c, alpha hydroxysteroid dehydrogenase (3alpha_HSD), classical (c) SDRs	NA|503aa|down_5|LR026975.1_886700_888209_+	cd07133, ALDH_CALDH_CalB, Coniferyl aldehyde dehydrogenase-like	NA|552aa|down_6|LR026975.1_888281_889937_-	PRK07798, PRK07798, acyl-CoA synthetase; Validated	NA|206aa|down_7|LR026975.1_889945_890563_-	cd03443, PaaI_thioesterase, PaaI_thioesterase is a tetrameric acyl-CoA thioesterase with a hot dog fold and one of several proteins responsible for phenylacetic acid (PA) degradation in bacteria	NA|339aa|down_8|LR026975.1_890579_891596_-	cd03469, Rieske_RO_Alpha_N, Rieske non-heme iron oxygenase (RO) family, N-terminal Rieske domain of the oxygenase alpha subunit; The RO family comprise a large class of aromatic ring-hydroxylating dioxygenases found predominantly in microorganisms	NA|542aa|down_9|LR026975.1_891753_893379_+	COG2072, TrkA, Predicted flavoprotein involved in K+ transport [Inorganic ion transport and metabolism]
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	10	3026693-3026803	9	CRISPRCasFinder	no		DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Orphan	GGTGAGGCCGGTGTCGGTTCGGACGATCTGCTGAGT	36	1	1	3026729-3026767	LR026975.1_2259486-2259524	NA	1	1	Orphan	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA|138aa|up_7|LR026975.1_3019764_3020178_-,NA|83aa|down_1|LR026975.1_3027421_3027670_-	NA|128aa|up_9|LR026975.1_3017805_3018189_-	PRK03100, PRK03100, Sec-independent protein translocase subunit TatB	NA|498aa|up_8|LR026975.1_3018191_3019685_-	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|138aa|up_7|LR026975.1_3019764_3020178_-	NA	NA|256aa|up_6|LR026975.1_3020268_3021036_-	PRK09647, PRK09647, RNA polymerase sigma factor SigE; Reviewed	NA|243aa|up_5|LR026975.1_3021167_3021896_+	COG4122, COG4122, Predicted O-methyltransferase [General function prediction only]	NA|231aa|up_4|LR026975.1_3022151_3022844_+	pfam17933, TetR_C_25, Tetracyclin repressor-like, C-terminal domain	NA|308aa|up_3|LR026975.1_3022818_3023742_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|67aa|up_2|LR026975.1_3023738_3023939_+	COG3559, TnrB3, Putative exporter of polyketide antibiotics [Cell envelope biogenesis, outer membrane]	NA|467aa|up_1|LR026975.1_3023938_3025339_+	COG3559, TnrB3, Putative exporter of polyketide antibiotics [Cell envelope biogenesis, outer membrane]	NA|225aa|up_0|LR026975.1_3025348_3026023_+	COG2020, STE14, Putative protein-S-isoprenylcysteine methyltransferase [Posttranslational modification, protein turnover, chaperones]	NA|202aa|down_0|LR026975.1_3026840_3027446_+	pfam13548, DUF4126, Domain of unknown function (DUF4126)	NA|83aa|down_1|LR026975.1_3027421_3027670_-	NA	NA|405aa|down_2|LR026975.1_3027928_3029143_-	PRK00844, glgC, glucose-1-phosphate adenylyltransferase; Provisional	NA|382aa|down_3|LR026975.1_3029229_3030375_+	TIGR02149, glgA_Coryne, glycogen synthase, Corynebacterium family	NA|56aa|down_4|LR026975.1_3030397_3030565_-	pfam11314, DUF3117, Protein of unknown function (DUF3117)	NA|199aa|down_5|LR026975.1_3030708_3031305_-	pfam03352, Adenine_glyco, Methyladenine glycosylase	NA|124aa|down_6|LR026975.1_3031301_3031673_-	TIGR03544, cell_division_initiation_protein_DivIVA, DivIVA domain	NA|315aa|down_7|LR026975.1_3031736_3032681_-	PRK13915, PRK13915, putative glucosyl-3-phosphoglycerate synthase; Provisional	NA|292aa|down_8|LR026975.1_3032677_3033553_-	TIGR01496, Dihydropteroate_synthase, dihydropteroate synthase	NA|595aa|down_9|LR026975.1_3033618_3035403_-	PRK08279, PRK08279, long-chain-acyl-CoA synthetase; Validated
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	13	4277014-4277105	12	CRISPRCasFinder	no		DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Orphan	TCCGCCGTCCCCGCGCGTCTGGCACCCTGGT	31	0	0	NA	NA	NA	1	1	Orphan	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA|175aa|up_3|LR026975.1_4274329_4274854_+,NA|230aa|up_0|LR026975.1_4275690_4276380_-,NA	NA|391aa|up_9|LR026975.1_4267121_4268294_-	pfam01594, AI-2E_transport, AI-2E family transporter	NA|356aa|up_8|LR026975.1_4268369_4269437_+	COG0392, COG0392, Predicted integral membrane protein [Function unknown]	NA|129aa|up_7|LR026975.1_4269433_4269820_+	pfam11255, DUF3054, Protein of unknown function (DUF3054)	NA|126aa|up_6|LR026975.1_4269938_4270316_-	pfam16525, MHB, Haemophore, haem-binding	NA|195aa|up_5|LR026975.1_4270488_4271073_-	TIGR04530, hemophoreRv0203, hemophore, mycobacterial-type	NA|972aa|up_4|LR026975.1_4271417_4274333_+	COG2409, COG2409, Predicted drug exporters of the RND superfamily [General function prediction only]	NA|175aa|up_3|LR026975.1_4274329_4274854_+	NA	NA|121aa|up_2|LR026975.1_4274873_4275236_+	COG2044, COG2044, Predicted peroxiredoxins [General function prediction only]	NA|137aa|up_1|LR026975.1_4275255_4275666_+	COG1832, COG1832, Predicted CoA-binding protein [General function prediction only]	NA|230aa|up_0|LR026975.1_4275690_4276380_-	NA	NA|662aa|down_0|LR026975.1_4277108_4279094_+	COG3590, PepO, Predicted metalloendopeptidase [Posttranslational modification, protein turnover, chaperones]	NA|145aa|down_1|LR026975.1_4279177_4279612_-	TIGR02096, putative_cyclase, conserved hypothetical protein, steroid delta-isomerase-related	NA|350aa|down_2|LR026975.1_4279679_4280729_-	PRK08195, PRK08195, 4-hyroxy-2-oxovalerate/4-hydroxy-2-oxopentanoic acid aldolase,; Validated	NA|314aa|down_3|LR026975.1_4280725_4281667_-	PRK08300, PRK08300, acetaldehyde dehydrogenase; Validated	NA|266aa|down_4|LR026975.1_4281663_4282461_-	PRK11342, mhpD, 2-keto-4-pentenoate hydratase; Provisional	NA|255aa|down_5|LR026975.1_4282492_4283257_-	PRK05653, fabG, 3-oxoacyl-ACP reductase FabG	NA|171aa|down_6|LR026975.1_4283253_4283766_-	cd00667, ring_hydroxylating_dioxygenases_beta, Ring hydroxylating dioxygenase beta subunit	NA|436aa|down_7|LR026975.1_4283762_4285070_-	TIGR03229, benzo_1_2_benA, benzoate 1,2-dioxygenase, large subunit	NA|280aa|down_8|LR026975.1_4285086_4285926_-	TIGR03343, 2-hydroxy-6-oxo-6-phenylhexa-24-dienoate_hydrolase, 2-hydroxy-6-oxo-6-phenylhexa-2,4-dienoate hydrolase	NA|359aa|down_9|LR026975.1_4285922_4286999_-	cd07359, PCA_45_Doxase_B_like, Subunit B of the Class III Extradiol dioxygenase, Protocatechuate 4,5-dioxygenase, and simlar enzymes
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	14	4886803-4886913	13	CRISPRCasFinder	no		DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Orphan	GGTGCCGGGTTGCCGGGTGTGGTCGCTCGGTGTGATG	37	1	1	4886840-4886876	LR026975.1_4445575-4445611	NA	1	1	Orphan	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA|88aa|up_3|LR026975.1_4882835_4883099_-,NA|105aa|down_9|LR026975.1_4896569_4896884_-	NA|231aa|up_9|LR026975.1_4878371_4879064_-	pfam02592, Vut_1, Putative vitamin uptake transporter	NA|303aa|up_8|LR026975.1_4879097_4880006_-	cd01146, FhuD, Fe3+-siderophore binding domain FhuD	NA|389aa|up_7|LR026975.1_4880019_4881186_-	pfam03601, Cons_hypoth698, Conserved hypothetical protein 698	NA|30aa|up_6|LR026975.1_4881182_4881272_-	pfam05140, ResB, ResB-like family	NA|271aa|up_5|LR026975.1_4881341_4882154_-	PRK08267, PRK08267, SDR family oxidoreductase	NA|188aa|up_4|LR026975.1_4882200_4882764_-	pfam00440, TetR_N, Bacterial regulatory proteins, tetR family	NA|88aa|up_3|LR026975.1_4882835_4883099_-	NA	NA|213aa|up_2|LR026975.1_4883223_4883862_-	COG1279, COG1279, Lysine efflux permease [General function prediction only]	NA|253aa|up_1|LR026975.1_4884496_4885255_+	pfam10824, T7SS_ESX_EspC, Excreted virulence factor EspC, type VII ESX diderm	NA|338aa|up_0|LR026975.1_4885270_4886284_-	COG0523, COG0523, Putative GTPases (G3E family) [General function prediction only]	NA|311aa|down_0|LR026975.1_4887359_4888292_+	COG1946, TesB, Acyl-CoA thioesterase [Lipid metabolism]	NA|194aa|down_1|LR026975.1_4888587_4889169_+	PRK06991, PRK06991, electron transport complex subunit RsxB	NA|223aa|down_2|LR026975.1_4889184_4889853_+	PRK12678, PRK12678, transcription termination factor Rho; Provisional	NA|311aa|down_3|LR026975.1_4889866_4890799_-	pfam05661, DUF808, Protein of unknown function (DUF808)	NA|485aa|down_4|LR026975.1_4890848_4892303_-	COG2252, COG2252, Xanthine/uracil/vitamin C permease [Nucleotide transport and    metabolism]	NA|118aa|down_5|LR026975.1_4892375_4892729_-	cd10912, PIN_YacP-like, PIN_domain of Bacillus subtilis YacP/Rae1 and related proteins	NA|137aa|down_6|LR026975.1_4892864_4893275_-	pfam01740, STAS, STAS domain	NA|412aa|down_7|LR026975.1_4893384_4894620_-	COG3285, COG3285, Predicted eukaryotic-type DNA primase [DNA replication, recombination, and repair]	NA|563aa|down_8|LR026975.1_4894676_4896365_+	PRK07788, PRK07788, acyl-CoA synthetase; Validated	NA|105aa|down_9|LR026975.1_4896569_4896884_-	NA
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	15	5061904-5062012	14	CRISPRCasFinder	no		DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Orphan	GGATCCGCGCGGCGGCCGCCGCGGCCGGCAGCGCCC	36	0	0	NA	NA	NA	1	1	Orphan	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA|85aa|up_9|LR026975.1_5055360_5055615_+,NA	NA|85aa|up_9|LR026975.1_5055360_5055615_+	NA	NA|272aa|up_8|LR026975.1_5055611_5056427_-	cd09086, ExoIII-like_AP-endo, Escherichia coli exonuclease III (ExoIII) and Neisseria meningitides NExo-like subfamily of the ExoIII family purinic/apyrimidinic (AP) endonucleases	NA|302aa|up_7|LR026975.1_5056429_5057335_-	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|198aa|up_6|LR026975.1_5057334_5057928_-	PRK00150, def, peptide deformylase; Reviewed	NA|105aa|up_5|LR026975.1_5058063_5058378_+	pfam11662, DUF3263, Protein of unknown function (DUF3263)	NA|156aa|up_4|LR026975.1_5058415_5058883_+	pfam13399, LytR_C, LytR cell envelope-related transcriptional attenuator	NA|229aa|up_3|LR026975.1_5058893_5059580_+	COG2032, SodC, Cu/Zn superoxide dismutase [Inorganic ion transport and metabolism]	NA|357aa|up_2|LR026975.1_5059623_5060694_+	PRK13517, PRK13517, glutamate--cysteine ligase	NA|219aa|up_1|LR026975.1_5060696_5061353_+	COG2802, COG2802, Uncharacterized protein, similar to the N-terminal domain of Lon protease [General function prediction only]	NA|156aa|up_0|LR026975.1_5061349_5061817_-	TIGR00027, Hypothetical_protein_Rv0893c/MT0917/Mb0917c	NA|121aa|down_0|LR026975.1_5062140_5062503_-	PRK12674, PRK12674, putative monovalent cation/H+ antiporter subunit G; Reviewed	NA|91aa|down_1|LR026975.1_5062499_5062772_-	PRK07948, PRK07948, putative monovalent cation/H+ antiporter subunit F; Reviewed	NA|181aa|down_2|LR026975.1_5062768_5063311_-	PRK08965, PRK08965, putative monovalent cation/H+ antiporter subunit E; Reviewed	NA|532aa|down_3|LR026975.1_5063307_5064903_-	PRK12665, PRK12665, putative monovalent cation/H+ antiporter subunit D; Reviewed	NA|157aa|down_4|LR026975.1_5064899_5065370_-	PRK07946, PRK07946, putative monovalent cation/H+ antiporter subunit C; Reviewed	NA|961aa|down_5|LR026975.1_5065366_5068249_-	PRK12644, PRK12644, putative monovalent cation/H+ antiporter subunit A; Reviewed	NA|684aa|down_6|LR026975.1_5068394_5070446_-	COG1835, COG1835, Predicted acyltransferases [Lipid metabolism]	NA|138aa|down_7|LR026975.1_5070528_5070942_-	pfam08044, DUF1707, Domain of unknown function (DUF1707)	NA|762aa|down_8|LR026975.1_5071034_5073320_-	TIGR01243, Cell_division_cycle_protein_48_homolog_MJ1156, AAA family ATPase, CDC48 subfamily	NA|286aa|down_9|LR026975.1_5073316_5074174_-	COG1183, PssA, Phosphatidylserine synthase [Lipid metabolism]
GCA_900603025.1_MHAS	LR026975	Mycolicibacterium hassiacum DSM 44199 isolate Mhassiacum genome assembly, chromosome: 1	16	5082587-5085875	8,15,7	PILER-CR,CRISPRCasFinder,CRT	no	cas1,cas8u1,cas3,csb2gr5,csb1gr7	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	Unclear	GCTGCAATGCGGCTCCGTCTCAGGGACGGAGATCAC,GCTGCAATGCGGCTCCGTCTCAGGGACGGAGATCAC,GCTGCAATGCGGCTCCGTCTCAGGGACGGAGATCAC	36,36,36	0	0	NA	NA	NA:NA:NA	44,44,44	44	Unclear	DEDDh,WYL,csb1gr7,csb2gr5,cas3,csb3,cas1,cas4,csa3,DinG,cas8u1	NA|230aa|up_0|LR026975.1_5081589_5082279_-,cas8u1|313aa|down_1|LR026975.1_5088028_5088967_-,NA|182aa|down_5|LR026975.1_5095286_5095832_-	NA|762aa|up_9|LR026975.1_5071034_5073320_-	TIGR01243, Cell_division_cycle_protein_48_homolog_MJ1156, AAA family ATPase, CDC48 subfamily	NA|286aa|up_8|LR026975.1_5073316_5074174_-	COG1183, PssA, Phosphatidylserine synthase [Lipid metabolism]	NA|233aa|up_7|LR026975.1_5074170_5074869_-	PRK05305, PRK05305, phosphatidylserine decarboxylase family protein	NA|407aa|up_6|LR026975.1_5074907_5076128_-	cd00887, MoeA, MoeA family	NA|304aa|up_5|LR026975.1_5076127_5077039_-	PRK06197, PRK06197, short chain dehydrogenase; Provisional	NA|165aa|up_4|LR026975.1_5077106_5077601_+	COG3402, COG3402, Uncharacterized conserved protein [Function unknown]	NA|493aa|up_3|LR026975.1_5077597_5079076_+	COG3428, COG3428, Predicted membrane protein [Function unknown]	NA|272aa|up_2|LR026975.1_5079101_5079917_+	cd07509, HAD_PPase, inorganic pyrophosphatase similar to a human phospholysine phosphohistidine inorganic pyrophosphate phosphatase (LHPP)	NA|565aa|up_1|LR026975.1_5079905_5081600_-	COG1061, SSL2, DNA or RNA helicases of superfamily II [Transcription / DNA replication, recombination, and repair]	NA|230aa|up_0|LR026975.1_5081589_5082279_-	NA	cas1|563aa|down_0|LR026975.1_5086332_5088021_-	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	cas8u1|313aa|down_1|LR026975.1_5088028_5088967_-	NA	cas3|1011aa|down_2|LR026975.1_5088963_5091996_-	cd09696, Cas3_I, CRISPR/Cas system-associated protein Cas3; Distinct Cas3 family with HD domain fused to C-termus of Helicase domain	csb2gr5|566aa|down_3|LR026975.1_5091985_5093683_-	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	csb1gr7|406aa|down_4|LR026975.1_5093682_5094900_-	pfam09617, Cas_GSU0053, CRISPR-associated protein GSU0053 (Cas_GSU0053)	NA|182aa|down_5|LR026975.1_5095286_5095832_-	NA	NA|102aa|down_6|LR026975.1_5095847_5096153_-	pfam06013, WXG100, Proteins of 100 residues with WXG	NA|276aa|down_7|LR026975.1_5096453_5097281_+	COG0600, TauC, ABC-type nitrate/sulfonate/bicarbonate transport system, permease component [Inorganic ion transport and metabolism]	NA|250aa|down_8|LR026975.1_5097277_5098027_+	COG1116, TauB, ABC-type nitrate/sulfonate/bicarbonate transport system, ATPase component [Inorganic ion transport and metabolism]	NA|328aa|down_9|LR026975.1_5098038_5099022_+	cd13558, PBP2_SsuA_like_2, Putative substrate binding domain of sulfonate binding protein, the type 2 periplasmic binding protein fold
