assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	1	329432-329820	1	CRT	no	cas14j	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Unclear	CTGCCGGTCGTGGGNGACGTNGCCGG	26	0	0	NA	NA	NA	7	7	TypeV	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA,NA	NA|310aa|up_9|NC_009142.1_317601_318531_-	COG0492, TrxB, Thioredoxin reductase [Posttranslational modification, protein turnover, chaperones]	NA|164aa|up_8|NC_009142.1_318633_319125_+	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|188aa|up_7|NC_009142.1_319250_319814_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|164aa|up_6|NC_009142.1_319929_320421_-	cd01043, DPS, DPS protein, ferritin-like diiron-binding domain	NA|186aa|up_5|NC_009142.1_320496_321054_-	pfam03358, FMN_red, NADPH-dependent FMN reductase	cas14j|400aa|up_4|NC_009142.1_321212_322412_+	COG0675, COG0675, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|359aa|up_3|NC_009142.1_322561_323638_+	pfam07859, Abhydrolase_3, alpha/beta hydrolase fold	NA|160aa|up_2|NC_009142.1_323750_324230_-	cd01285, nucleoside_deaminase, Nucleoside deaminases include adenosine, guanine and cytosine deaminases	NA|823aa|up_1|NC_009142.1_324326_326795_-	cd06170, LuxR_C_like, C-terminal DNA-binding domain of LuxR-like proteins	NA|464aa|up_0|NC_009142.1_326974_328366_-	cd10170, HSP70_NBD, Nucleotide-binding domain of the HSP70 family	NA|604aa|down_0|NC_009142.1_330333_332145_+	cd09912, DLP_2, Dynamin-like protein including dynamins, mitofusins, and guanylate-binding proteins	NA|489aa|down_1|NC_009142.1_332141_333608_+	cd09912, DLP_2, Dynamin-like protein including dynamins, mitofusins, and guanylate-binding proteins	NA|405aa|down_2|NC_009142.1_333790_335005_-	PRK07588, PRK07588, FAD-binding domain	NA|176aa|down_3|NC_009142.1_335025_335553_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|82aa|down_4|NC_009142.1_335944_336190_-	pfam16827, zf-HC3, zinc-finger	NA|286aa|down_5|NC_009142.1_336340_337198_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|63aa|down_6|NC_009142.1_337187_337376_+	pfam04149, DUF397, Domain of unknown function (DUF397)	NA|485aa|down_7|NC_009142.1_337477_338932_-	pfam00199, Catalase, Catalase	NA|188aa|down_8|NC_009142.1_339415_339979_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|168aa|down_9|NC_009142.1_340017_340521_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	2	472318-472404	1	CRISPRCasFinder	no		csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Orphan	GGTCAGGCGCCGGTCAGGAACGT	23	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA,NA|79aa|down_2|NC_009142.1_476901_477138_+	NA|508aa|up_9|NC_009142.1_458153_459677_+	PRK00484, lysS, lysyl-tRNA synthetase; Reviewed	NA|117aa|up_8|NC_009142.1_459844_460195_+	pfam11774, Lsr2, Lsr2	NA|357aa|up_7|NC_009142.1_460676_461747_+	pfam01032, FecCD, FecCD transport family	NA|362aa|up_6|NC_009142.1_461743_462829_+	pfam01032, FecCD, FecCD transport family	NA|285aa|up_5|NC_009142.1_462825_463680_+	COG1120, FepC, ABC-type cobalamin/Fe3+-siderophores transport systems, ATPase components [Inorganic ion transport and metabolism / Coenzyme metabolism]	NA|854aa|up_4|NC_009142.1_463958_466520_+	CHL00095, clpC, Clp protease ATP binding subunit	NA|348aa|up_3|NC_009142.1_466584_467628_-	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|267aa|up_2|NC_009142.1_469472_470273_+	PRK06526, PRK06526, transposase; Provisional	NA|359aa|up_1|NC_009142.1_470605_471682_-	COG1252, Ndh, NADH dehydrogenase, FAD-containing subunit [Energy production and conversion]	NA|168aa|up_0|NC_009142.1_471779_472283_+	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|262aa|down_0|NC_009142.1_472468_473254_-	COG0586, DedA, Uncharacterized membrane-associated protein [Function unknown]	NA|1046aa|down_1|NC_009142.1_473404_476542_+	COG3903, COG3903, Predicted ATPase [General function prediction only]	NA|79aa|down_2|NC_009142.1_476901_477138_+	NA	NA|277aa|down_3|NC_009142.1_477437_478268_-	pfam01061, ABC2_membrane, ABC-2 type transporter	NA|323aa|down_4|NC_009142.1_478264_479233_-	TIGR01188, drrA, daunorubicin resistance ABC transporter ATP-binding subunit	NA|336aa|down_5|NC_009142.1_479362_480370_+	pfam03372, Exo_endo_phos, Endonuclease/Exonuclease/phosphatase family	NA|169aa|down_6|NC_009142.1_480441_480948_-	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|541aa|down_7|NC_009142.1_480995_482618_+	pfam13515, FUSC_2, Fusaric acid resistance protein-like	NA|103aa|down_8|NC_009142.1_482688_482997_-	COG2329, COG2329, Uncharacterized enzyme involved in biosynthesis of extracellular polysaccharides [General function prediction only]	NA|647aa|down_9|NC_009142.1_483014_484955_-	TIGR03062, hypothetical_protein_lp_1332, YhgE/Pip C-terminal domain
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	3	1314743-1314813	2	CRISPRCasFinder	no	DinG	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Type IV-A	CGCGAGCTTCGCCCGCCACCCGC	23	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|241aa|up_7|NC_009142.1_1305736_1306459_+,NA|72aa|down_4|NC_009142.1_1320554_1320770_+	NA|82aa|up_9|NC_009142.1_1304048_1304294_+	pfam04672, Methyltransf_19, S-adenosyl methyltransferase	NA|453aa|up_8|NC_009142.1_1304372_1305731_+	pfam04775, Bile_Hydr_Trans, Acyl-CoA thioester hydrolase/BAAT N-terminal region	NA|241aa|up_7|NC_009142.1_1305736_1306459_+	NA	NA|203aa|up_6|NC_009142.1_1306553_1307162_-	pfam03713, DUF305, Domain of unknown function (DUF305)	NA|585aa|up_5|NC_009142.1_1307578_1309333_+	cd01662, Ubiquinol_Oxidase_I, Ubiquinol oxidase subunit I	NA|414aa|up_4|NC_009142.1_1309472_1310714_+	cd07500, HAD_PSP, phosphoserine phosphatase (PSP), similar to Methanococcus Jannaschii PSP and Saccharomyces cerevisiae SER2p	NA|271aa|up_3|NC_009142.1_1311101_1311914_+	pfam01981, PTH2, Peptidyl-tRNA hydrolase PTH2	NA|207aa|up_2|NC_009142.1_1312306_1312927_-	COG0619, CbiQ, ABC-type cobalt transport system, permease component CbiQ and related transporters [Inorganic ion transport and metabolism]	NA|225aa|up_1|NC_009142.1_1312923_1313598_-	cd03225, ABC_cobalt_CbiO_domain1, First domain of the ATP-binding cassette component of cobalt transport system	NA|336aa|up_0|NC_009142.1_1313594_1314602_-	cd00751, thiolase, Thiolase are ubiquitous enzymes that catalyze the reversible thiolytic cleavage of 3-ketoacyl-CoA into acyl-CoA and acetyl-CoA, a 2-step reaction involving a covalent intermediate formed with a catalytic cysteine	NA|496aa|down_0|NC_009142.1_1315104_1316592_-	COG0318, CaiC, Acyl-CoA synthetases (AMP-forming)/AMP-acid ligases II [Lipid metabolism / Secondary metabolites biosynthesis, transport, and catabolism]	NA|232aa|down_1|NC_009142.1_1316593_1317289_-	COG1268, BioY, Uncharacterized conserved protein [General function prediction only]	NA|140aa|down_2|NC_009142.1_1317546_1317966_+	pfam11253, DUF3052, Protein of unknown function (DUF3052)	DinG|664aa|down_3|NC_009142.1_1318195_1320187_-	COG1199, DinG, Rad3-related DNA helicases [Transcription / DNA replication, recombination, and repair]	NA|72aa|down_4|NC_009142.1_1320554_1320770_+	NA	NA|269aa|down_5|NC_009142.1_1320846_1321653_-	pfam11716, MDMPI_N, Mycothiol maleylpyruvate isomerase N-terminal domain	NA|191aa|down_6|NC_009142.1_1321750_1322323_-	cd01011, nicotinamidase, Nicotinamidase/pyrazinamidase (PZase)	NA|435aa|down_7|NC_009142.1_1322332_1323637_-	PRK09243, PRK09243, nicotinate phosphoribosyltransferase; Validated	NA|98aa|down_8|NC_009142.1_1324093_1324387_+	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|188aa|down_9|NC_009142.1_1324391_1324955_+	pfam09438, DUF2017, Domain of unknown function (DUF2017)
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	4	1858868-1858959	3	CRISPRCasFinder	no	DEDDh	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Unclear	TCGGCATCGGATCGCGATCAGCG	23	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|137aa|up_7|NC_009142.1_1850686_1851097_-,NA|143aa|up_6|NC_009142.1_1851195_1851624_-,NA|133aa|down_4|NC_009142.1_1865759_1866158_+,NA|134aa|down_8|NC_009142.1_1868753_1869155_+	NA|95aa|up_9|NC_009142.1_1849161_1849446_+	pfam01037, AsnC_trans_reg, Lrp/AsnC ligand binding domain	NA|352aa|up_8|NC_009142.1_1849611_1850667_-	PRK00188, trpD, anthranilate phosphoribosyltransferase; Provisional	NA|137aa|up_7|NC_009142.1_1850686_1851097_-	NA	NA|143aa|up_6|NC_009142.1_1851195_1851624_-	NA	NA|204aa|up_5|NC_009142.1_1851739_1852351_+	COG1845, CyoC, Heme/copper-type cytochrome/quinol oxidase, subunit 3 [Energy production and conversion]	NA|269aa|up_4|NC_009142.1_1852415_1853222_+	COG2010, CccA, Cytochrome c, mono- and diheme variants [Energy production and conversion]	NA|377aa|up_3|NC_009142.1_1853218_1854349_+	cd03467, Rieske, Rieske domain; a [2Fe-2S] cluster binding domain commonly found in Rieske non-heme iron oxygenase (RO) systems such as naphthalene and biphenyl dioxygenases, as well as in plant/cyanobacterial chloroplast b6f and mitochondrial cytochrome bc(1) complexes	NA|553aa|up_2|NC_009142.1_1854345_1856004_+	pfam13631, Cytochrom_B_N_2, Cytochrome b(N-terminal)/b6/petB	NA|263aa|up_1|NC_009142.1_1856125_1856914_-	TIGR03083, TIGR03083, uncharacterized Actinobacterial protein TIGR03083	DEDDh|573aa|up_0|NC_009142.1_1856998_1858717_-	PRK07883, PRK07883, DEDD exonuclease domain-containing protein	NA|429aa|down_0|NC_009142.1_1859231_1860518_+	pfam05991, NYN_YacP, YacP-like NYN domain	NA|325aa|down_1|NC_009142.1_1861159_1862134_+	pfam00877, NLPC_P60, NlpC/P60 family	NA|429aa|down_2|NC_009142.1_1862292_1863579_+	pfam04450, BSP, Peptidase of plants and bacteria	NA|603aa|down_3|NC_009142.1_1863644_1865453_-	COG1022, FAA1, Long-chain acyl-CoA synthetases (AMP-forming) [Lipid metabolism]	NA|133aa|down_4|NC_009142.1_1865759_1866158_+	NA	NA|263aa|down_5|NC_009142.1_1866183_1866972_+	COG2129, COG2129, Predicted phosphoesterases, related to the Icc protein [General function prediction only]	NA|148aa|down_6|NC_009142.1_1867082_1867526_+	cd07819, SRPBCC_2, Ligand-binding SRPBCC domain of an uncharacterized subfamily of proteins	NA|401aa|down_7|NC_009142.1_1867545_1868748_+	cd02035, ArsA, Arsenical pump-driving ATPase ArsA	NA|134aa|down_8|NC_009142.1_1868753_1869155_+	NA	NA|318aa|down_9|NC_009142.1_1869148_1870102_+	TIGR00744, Glucokinase_Glucose_kinase
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	5	1893387-1893527	4	CRISPRCasFinder	no	WYL	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Unclear	CGCACCGGCTGCGGTGAGTGCGCGG	25	1	1	1893412-1893430	NC_009142.1_3790111-3790129	NA	2	2	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|346aa|up_3|NC_009142.1_1888642_1889680_-,NA|132aa|down_5|NC_009142.1_1901022_1901418_-	NA|122aa|up_9|NC_009142.1_1882885_1883251_+	pfam18367, Rv2175c_C, Rv2175c C-terminal domain of unknown function	NA|205aa|up_8|NC_009142.1_1883654_1884269_+	pfam04892, VanZ, VanZ like family	NA|489aa|up_7|NC_009142.1_1884293_1885760_-	TIGR02734, Phytoene_desaturase_lycopene-forming, phytoene desaturase	NA|359aa|up_6|NC_009142.1_1885759_1886836_-	cd00685, Trans_IPPS_HT, Trans-Isoprenyl Diphosphate Synthases, head-to-tail	NA|295aa|up_5|NC_009142.1_1887066_1887951_+	TIGR00676, 510-methylenetetrahydrofolate_reductase	NA|150aa|up_4|NC_009142.1_1888016_1888466_+	cd07502, HAD_PNKP-C, C-terminal phosphatase domain of T4 polynucleotide kinase/phosphatase (PNKP) and related phosphatases	NA|346aa|up_3|NC_009142.1_1888642_1889680_-	NA	WYL|333aa|up_2|NC_009142.1_1889802_1890801_+	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	NA|220aa|up_1|NC_009142.1_1890843_1891503_-	pfam11353, DUF3153, Protein of unknown function (DUF3153)	NA|559aa|up_0|NC_009142.1_1891618_1893295_+	pfam05960, DUF885, Bacterial protein of unknown function (DUF885)	NA|192aa|down_0|NC_009142.1_1893626_1894202_-	COG0456, RimI, Acetyltransferases [General function prediction only]	NA|151aa|down_1|NC_009142.1_1894509_1894962_+	pfam18726, HEPN_SAV_6107, SAV_6107-like HEPN	NA|401aa|down_2|NC_009142.1_1896742_1897945_-	pfam09992, NAGPA, Phosphodiester glycosidase	NA|417aa|down_3|NC_009142.1_1898401_1899652_-	cd17329, MFS_MdtH_MDR_like, Multidrug resistance protein MdtH and similar multidrug resistance (MDR) transporters of the Major Facilitator Superfamily	NA|376aa|down_4|NC_009142.1_1899651_1900779_-	COG0031, CysK, Cysteine synthase [Amino acid transport and metabolism]	NA|132aa|down_5|NC_009142.1_1901022_1901418_-	NA	NA|393aa|down_6|NC_009142.1_1901586_1902765_-	PRK07588, PRK07588, FAD-binding domain	NA|197aa|down_7|NC_009142.1_1902761_1903352_-	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|1521aa|down_8|NC_009142.1_1903527_1908090_-	PRK09751, PRK09751, putative ATP-dependent helicase Lhr; Provisional	NA|165aa|down_9|NC_009142.1_1908124_1908619_-	pfam11695, DUF3291, Domain of unknown function (DUF3291)
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	6	2049617-2049716	5	CRISPRCasFinder	no		csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Orphan	CGCCACACCGCATCCGCCCGCCACGC	26	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|61aa|up_9|NC_009142.1_2042984_2043167_-,NA|99aa|up_7|NC_009142.1_2043550_2043847_-,NA|193aa|up_5|NC_009142.1_2044501_2045080_-,NA|79aa|down_2|NC_009142.1_2052379_2052616_+	NA|61aa|up_9|NC_009142.1_2042984_2043167_-	NA	NA|86aa|up_8|NC_009142.1_2043293_2043551_-	pfam02956, TT_ORF1, TT viral orf 1	NA|99aa|up_7|NC_009142.1_2043550_2043847_-	NA	NA|172aa|up_6|NC_009142.1_2043883_2044399_-	pfam03780, Asp23, Asp23 family, cell envelope-related function	NA|193aa|up_5|NC_009142.1_2044501_2045080_-	NA	NA|188aa|up_4|NC_009142.1_2045072_2045636_-	PRK11922, PRK11922, RNA polymerase sigma factor; Provisional	NA|245aa|up_3|NC_009142.1_2045632_2046367_-	PRK14059, PRK14059, pyrimidine reductase family protein	NA|343aa|up_2|NC_009142.1_2046419_2047448_+	pfam03969, AFG1_ATPase, AFG1-like ATPase	NA|411aa|up_1|NC_009142.1_2047693_2048926_+	PRK06185, PRK06185, FAD-dependent oxidoreductase	NA|210aa|up_0|NC_009142.1_2048922_2049552_-	TIGR03384, betaine_BetI, transcriptional repressor BetI	NA|420aa|down_0|NC_009142.1_2049741_2051001_-	PRK00854, rocD, ornithine--oxo-acid transaminase; Reviewed	NA|347aa|down_1|NC_009142.1_2051162_2052203_+	pfam10282, Lactonase, Lactonase, 7-bladed beta-propeller	NA|79aa|down_2|NC_009142.1_2052379_2052616_+	NA	NA|221aa|down_3|NC_009142.1_2052660_2053323_-	smart00994, zf-C4_ClpX, ClpX C4-type zinc finger	NA|588aa|down_4|NC_009142.1_2053401_2055165_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|261aa|down_5|NC_009142.1_2055492_2056275_+	cd07247, SgaA_N_like, N-terminal domain of Streptomyces griseus SgaA and similar domains	NA|488aa|down_6|NC_009142.1_2056532_2057996_+	COG1129, MglA, ABC-type sugar transport system, ATPase component [Carbohydrate transport and metabolism]	NA|332aa|down_7|NC_009142.1_2057988_2058984_+	COG1172, AraH, Ribose/xylose/arabinose/galactoside ABC-type transport systems, permease components [Carbohydrate transport and metabolism]	NA|336aa|down_8|NC_009142.1_2059039_2060047_+	cd20008, PBP1_ABC_sugar_binding-like, monosaccharide ABC transporter substrate-binding protein such as CUT2	NA|395aa|down_9|NC_009142.1_2060134_2061319_-	TIGR01426, Glycosyl_transferase, glycosyltransferase, MGT family
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	7	2467949-2468087	6	CRISPRCasFinder	no	WYL	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Unclear	GCTGCCGCTCGGTCTGCTCGACCT	24	0	0	NA	NA	NA	2	2	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA,NA	NA|183aa|up_9|NC_009142.1_2457726_2458275_+	pfam00440, TetR_N, Bacterial regulatory proteins, tetR family	NA|306aa|up_8|NC_009142.1_2458295_2459213_+	cd07742, metallo-hydrolase-like_MBL-fold, uncharacterized subgroup of the MBL-fold_metallo-hydrolase superfamily; MBL-fold metallo hydrolase domain	NA|306aa|up_7|NC_009142.1_2459189_2460107_-	smart00475, 53EXOc, 5'-3' exonuclease	NA|548aa|up_6|NC_009142.1_2460174_2461818_-	COG1080, PtsA, Phosphoenolpyruvate-protein kinase (PTS system EI component in bacteria) [Carbohydrate transport and metabolism]	NA|253aa|up_5|NC_009142.1_2461917_2462676_+	COG1349, GlpR, Transcriptional regulators of sugar metabolism [Transcription / Carbohydrate transport and metabolism]	NA|315aa|up_4|NC_009142.1_2462672_2463617_+	TIGR03168, 1-PFK, hexose kinase, 1-phosphofructokinase family	NA|151aa|up_3|NC_009142.1_2463613_2464066_+	TIGR00848, Includes:_Phosphotransferase_enzyme_IIA_component, PTS system, fructose subfamily, IIA component	NA|491aa|up_2|NC_009142.1_2464062_2465535_+	PRK10712, PRK10712, PTS system fructose-specific transporter subunits IIBC; Provisional	NA|97aa|up_1|NC_009142.1_2466082_2466373_+	pfam00381, PTS-HPr, PTS HPr component phosphorylation site	NA|509aa|up_0|NC_009142.1_2466388_2467915_+	cd18622, GH32_Inu-like, glycoside hydrolase family 32 protein such as Aspergillus ficuum endo-inulinase (Inu2)	NA|385aa|down_0|NC_009142.1_2469142_2470297_+	COG0006, PepP, Xaa-Pro aminopeptidase [Amino acid transport and metabolism]	NA|147aa|down_1|NC_009142.1_2470326_2470767_+	smart00344, HTH_ASNC, helix_turn_helix ASNC type	NA|230aa|down_2|NC_009142.1_2470778_2471468_+	pfam08241, Methyltransf_11, Methyltransferase domain	NA|360aa|down_3|NC_009142.1_2472638_2473718_-	cd01823, SEST_like, SEST_like	NA|208aa|down_4|NC_009142.1_2473875_2474499_+	pfam04186, FxsA, FxsA cytoplasmic membrane protein	NA|542aa|down_5|NC_009142.1_2474634_2476260_+	COG1574, COG1574, Predicted metal-dependent hydrolase with the TIM-barrel fold [General function prediction only]	NA|201aa|down_6|NC_009142.1_2476553_2477156_+	pfam08044, DUF1707, Domain of unknown function (DUF1707)	NA|493aa|down_7|NC_009142.1_2477378_2478857_+	cd07571, ALP_N-acyl_transferase, Apolipoprotein N-acyl transferase (class 9 nitrilases)	NA|263aa|down_8|NC_009142.1_2478928_2479717_+	cd06442, DPM1_like, DPM1_like represents putative enzymes similar to eukaryotic DPM1	NA|115aa|down_9|NC_009142.1_2479778_2480123_-	pfam13397, RbpA, RNA polymerase-binding protein
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	8	2779878-2780124	7,1	CRISPRCasFinder,PILER-CR	no		csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Orphan	CTCGCCGTCCCCGCCGGGACGGCCCTTCATT,CCGGGACGGCCCTTCATTGAGGC	31,23	0	0	NA	NA	NA:NA	3,2	3	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA,NA	NA|113aa|up_9|NC_009142.1_2770411_2770750_+	COG2814, AraJ, Arabinose efflux permease [Carbohydrate transport and metabolism]	NA|320aa|up_8|NC_009142.1_2770898_2771858_-	COG0604, Qor, NADPH:quinone reductase and related Zn-dependent oxidoreductases [Energy production and conversion / General function prediction only]	NA|237aa|up_7|NC_009142.1_2771935_2772646_+	pfam16859, TetR_C_11, Bacterial transcriptional repressor C-terminal	NA|211aa|up_6|NC_009142.1_2773037_2773670_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|383aa|up_5|NC_009142.1_2773742_2774891_+	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|212aa|up_4|NC_009142.1_2775337_2775973_-	cd17393, MFS_MosC_like, Membrane protein MosC and similar proteins of the Major Facilitator Superfamily of transporters	NA|290aa|up_3|NC_009142.1_2776030_2776900_-	pfam13481, AAA_25, AAA domain	NA|307aa|up_2|NC_009142.1_2777567_2778488_-	TIGR03564, F420_MSMEG_4879, F420-dependent oxidoreductase, MSMEG_4879 family	NA|189aa|up_1|NC_009142.1_2778598_2779165_+	TIGR03968, transcriptional_regulator_TetR_family, mycofactocin system transcriptional regulator	NA|70aa|up_0|NC_009142.1_2779606_2779816_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|176aa|down_0|NC_009142.1_2780716_2781244_-	pfam13586, DDE_Tnp_1_2, Transposase DDE domain	NA|463aa|down_1|NC_009142.1_2781995_2783384_-	cd17359, MFS_XylE_like, D-xylose-proton symporter and similar transporters of the Major Facilitator Superfamily	NA|132aa|down_2|NC_009142.1_2784145_2784541_-	pfam07100, ASRT, Anabaena sensory rhodopsin transducer	NA|257aa|down_3|NC_009142.1_2784555_2785326_-	PRK05653, fabG, 3-oxoacyl-ACP reductase FabG	NA|380aa|down_4|NC_009142.1_2785360_2786500_-	cd03316, MR_like, Mandelate racemase (MR)-like subfamily of the enolase superfamily	NA|542aa|down_5|NC_009142.1_2786540_2788166_-	cd01297, D-aminoacylase, D-aminoacylases (N-acyl-D-Amino acid amidohydrolases) catalyze the hydrolysis of N-acyl-D-amino acids to produce the corresponding D-amino acids, which are used as intermediates in the synthesis of pesticides, bioactive peptides, and antibiotics	NA|443aa|down_6|NC_009142.1_2788165_2789494_-	cd17369, MFS_ShiA_like, Shikimate transporter and similar proteins of the Major Facilitator Superfamily	NA|213aa|down_7|NC_009142.1_2789609_2790248_+	COG1802, GntR, Transcriptional regulators [Transcription]	NA|164aa|down_8|NC_009142.1_2790937_2791429_+	COG1959, COG1959, Predicted transcriptional regulator [Transcription]	NA|250aa|down_9|NC_009142.1_2791395_2792145_+	PRK06500, PRK06500, SDR family oxidoreductase
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	9	5389161-5389263	8	CRISPRCasFinder	no		csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Orphan	TGCGGGACACCGGCACCCGGTCGGCAACC	29	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|154aa|up_8|NC_009142.1_5379481_5379943_+,NA|181aa|up_7|NC_009142.1_5379972_5380515_+,NA|417aa|up_6|NC_009142.1_5380524_5381775_+,NA|875aa|down_8|NC_009142.1_5398257_5400882_+	NA|275aa|up_9|NC_009142.1_5378091_5378916_+	pfam13340, DUF4096, Putative transposase of IS4/5 family (DUF4096)	NA|154aa|up_8|NC_009142.1_5379481_5379943_+	NA	NA|181aa|up_7|NC_009142.1_5379972_5380515_+	NA	NA|417aa|up_6|NC_009142.1_5380524_5381775_+	NA	NA|393aa|up_5|NC_009142.1_5381778_5382957_+	COG2124, CypX, Cytochrome P450 [Secondary metabolites biosynthesis, transport, and catabolism]	NA|205aa|up_4|NC_009142.1_5383025_5383640_-	pfam13977, TetR_C_6, BetI-type transcriptional repressor, C-terminal	NA|663aa|up_3|NC_009142.1_5383636_5385625_-	COG2936, COG2936, Predicted acyl esterases [General function prediction only]	NA|576aa|up_2|NC_009142.1_5385621_5387349_-	COG1123, COG1123, ATPase components of various ABC-type transport systems, contain duplicated ATPase [General function prediction only]	NA|281aa|up_1|NC_009142.1_5387345_5388188_-	COG1173, DppC, ABC-type dipeptide/oligopeptide/nickel transport systems, permease components [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|319aa|up_0|NC_009142.1_5388187_5389144_-	COG0601, DppB, ABC-type dipeptide/oligopeptide/nickel transport systems, permease components [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|519aa|down_0|NC_009142.1_5389289_5390846_-	cd08503, PBP2_NikA_DppA_OppA_like_17, The substrate-binding component of an uncharacterized ABC-type nickel/dipeptide/oligopeptide-like import system contains the type 2 periplasmic binding fold	NA|184aa|down_1|NC_009142.1_5391082_5391634_+	pfam04343, DUF488, Protein of unknown function, DUF488	NA|292aa|down_2|NC_009142.1_5391693_5392569_-	pfam14100, PmoA, Methane oxygenase PmoA	NA|396aa|down_3|NC_009142.1_5392561_5393749_-	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|352aa|down_4|NC_009142.1_5393812_5394868_+	COG1609, PurR, Transcriptional regulators [Transcription]	NA|427aa|down_5|NC_009142.1_5395149_5396430_+	cd13585, PBP2_TMBP_like, The periplasmic-binding component of ABC transport systems specific for trehalose/maltose and similar oligosaccharides; possess type 2 periplasmic binding fold	NA|312aa|down_6|NC_009142.1_5396426_5397362_+	COG1175, UgpA, ABC-type sugar transport systems, permease components [Carbohydrate transport and metabolism]	NA|266aa|down_7|NC_009142.1_5397448_5398246_+	COG0395, UgpE, ABC-type sugar transport system, permease component [Carbohydrate transport and metabolism]	NA|875aa|down_8|NC_009142.1_5398257_5400882_+	NA	NA|330aa|down_9|NC_009142.1_5400902_5401892_-	pfam16169, DUF4872, Domain of unknown function (DUF4872)
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	10	5687530-5688961	9,2,2	CRISPRCasFinder,CRT,PILER-CR	no	cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Type III-D,Type III-B,Type III-C,Type III-A	CCGTCACCGACGCGCAGCGTCGGTCCTCATTGCGGC,CCGTCACCGACGCGCAGCGTCGGTCCTCATTGCGGC,CCGTCACCGACGCGCAGCGTCGGTCCTCATTGCGGC	36,36,36	0	0	NA	NA	NA:NA:NA	19,19,15	19	TypeIII-D,TypeIII-B,TypeIII-C,TypeIII-A	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|324aa|up_9|NC_009142.1_5674044_5675016_+,NA|349aa|up_0|NC_009142.1_5686273_5687320_+,NA|246aa|down_2|NC_009142.1_5691296_5692034_+,csm3gr7|167aa|down_8|NC_009142.1_5701706_5702207_-	NA|324aa|up_9|NC_009142.1_5674044_5675016_+	NA	NA|1192aa|up_8|NC_009142.1_5675000_5678576_+	COG1204, COG1204, Superfamily II helicase [General function prediction only]	NA|107aa|up_7|NC_009142.1_5679671_5679992_+	pfam01527, HTH_Tnp_1, Transposase	NA|130aa|up_6|NC_009142.1_5679997_5680387_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|79aa|up_5|NC_009142.1_5680383_5680620_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|390aa|up_4|NC_009142.1_5680829_5681999_+	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|83aa|up_3|NC_009142.1_5682075_5682324_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|315aa|up_2|NC_009142.1_5682576_5683521_+	PRK00236, xerC, site-specific tyrosine recombinase XerC; Reviewed	NA|320aa|up_1|NC_009142.1_5683909_5684869_-	PRK00236, xerC, site-specific tyrosine recombinase XerC; Reviewed	NA|349aa|up_0|NC_009142.1_5686273_5687320_+	NA	cas1|550aa|down_0|NC_009142.1_5689321_5690971_+	cd09634, Cas1_I-II-III, CRISPR/Cas system-associated protein Cas1	cas2|96aa|down_1|NC_009142.1_5690976_5691264_+	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|246aa|down_2|NC_009142.1_5691296_5692034_+	NA	NA|567aa|down_3|NC_009142.1_5692058_5693759_+	COG1061, SSL2, DNA or RNA helicases of superfamily II [Transcription / DNA replication, recombination, and repair]	NA|267aa|down_4|NC_009142.1_5695281_5696082_-	PRK06526, PRK06526, transposase; Provisional	csb2gr5|391aa|down_5|NC_009142.1_5697949_5699122_-	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	csm3gr7|449aa|down_6|NC_009142.1_5699140_5700487_-	pfam03787, RAMPs, RAMP superfamily	csx10gr5|407aa|down_7|NC_009142.1_5700489_5701710_-	TIGR02674, cas_cyan_RAMP_2, CRISPR-associated RAMP protein, Csx10 family	csm3gr7|167aa|down_8|NC_009142.1_5701706_5702207_-	NA	cas10|458aa|down_9|NC_009142.1_5702238_5703612_-	cd09679, Cas10_III, CRISPR/Cas system-associated protein Cas10
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	11	5694051-5695231	3,10,3,4	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Type III-D,Type III-B,Type III-C,Type III-A	CCTGTCACCGGCGCCAAGCGTCGGTCCTCATTGCGGCC,CTGTCACCGGCGCCAAGCGTCGGTCCTCATTGCGGC,CTGTCACCGGCGCCAAGCGTCGGTCCTCATTGCGGC,CTGTCACCGGCGCCAAGCGTCGGTCCTCATTGCGGC	38,36,36,36	0	0	NA	NA	NA:NA:NA:NA	10,14,15,10	15	TypeIII-D,TypeIII-B,TypeIII-C,TypeIII-A	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|349aa|up_4|NC_009142.1_5686273_5687320_+,NA|246aa|up_1|NC_009142.1_5691296_5692034_+,csm3gr7|167aa|down_4|NC_009142.1_5701706_5702207_-,NA|121aa|down_9|NC_009142.1_5708466_5708829_+	NA|79aa|up_9|NC_009142.1_5680383_5680620_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|390aa|up_8|NC_009142.1_5680829_5681999_+	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|83aa|up_7|NC_009142.1_5682075_5682324_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|315aa|up_6|NC_009142.1_5682576_5683521_+	PRK00236, xerC, site-specific tyrosine recombinase XerC; Reviewed	NA|320aa|up_5|NC_009142.1_5683909_5684869_-	PRK00236, xerC, site-specific tyrosine recombinase XerC; Reviewed	NA|349aa|up_4|NC_009142.1_5686273_5687320_+	NA	cas1|550aa|up_3|NC_009142.1_5689321_5690971_+	cd09634, Cas1_I-II-III, CRISPR/Cas system-associated protein Cas1	cas2|96aa|up_2|NC_009142.1_5690976_5691264_+	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|246aa|up_1|NC_009142.1_5691296_5692034_+	NA	NA|567aa|up_0|NC_009142.1_5692058_5693759_+	COG1061, SSL2, DNA or RNA helicases of superfamily II [Transcription / DNA replication, recombination, and repair]	NA|267aa|down_0|NC_009142.1_5695281_5696082_-	PRK06526, PRK06526, transposase; Provisional	csb2gr5|391aa|down_1|NC_009142.1_5697949_5699122_-	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	csm3gr7|449aa|down_2|NC_009142.1_5699140_5700487_-	pfam03787, RAMPs, RAMP superfamily	csx10gr5|407aa|down_3|NC_009142.1_5700489_5701710_-	TIGR02674, cas_cyan_RAMP_2, CRISPR-associated RAMP protein, Csx10 family	csm3gr7|167aa|down_4|NC_009142.1_5701706_5702207_-	NA	cas10|458aa|down_5|NC_009142.1_5702238_5703612_-	cd09679, Cas10_III, CRISPR/Cas system-associated protein Cas10	csm3gr7|651aa|down_6|NC_009142.1_5703608_5705561_-	TIGR03986, CRISPR-associated_protein, CRISPR-associated protein	NA|310aa|down_7|NC_009142.1_5706888_5707818_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|104aa|down_8|NC_009142.1_5707814_5708126_-	pfam01527, HTH_Tnp_1, Transposase	NA|121aa|down_9|NC_009142.1_5708466_5708829_+	NA
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	12	5697385-5697858	11,4	CRISPRCasFinder,CRT	no	cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Type III-D,Type III-B,Type III-C,Type III-A	CTGTCACCGGCGCCAAGCGTCGGTCCTCATTGCGGC,GNNCCAAGCGNCGGTCCTCATTGCGGC	36,27	0	0	NA	NA	NA:NA	4,6	6	TypeIII-D,TypeIII-B,TypeIII-C,TypeIII-A	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|349aa|up_5|NC_009142.1_5686273_5687320_+,NA|246aa|up_2|NC_009142.1_5691296_5692034_+,csm3gr7|167aa|down_3|NC_009142.1_5701706_5702207_-,NA|121aa|down_8|NC_009142.1_5708466_5708829_+	NA|390aa|up_9|NC_009142.1_5680829_5681999_+	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|83aa|up_8|NC_009142.1_5682075_5682324_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|315aa|up_7|NC_009142.1_5682576_5683521_+	PRK00236, xerC, site-specific tyrosine recombinase XerC; Reviewed	NA|320aa|up_6|NC_009142.1_5683909_5684869_-	PRK00236, xerC, site-specific tyrosine recombinase XerC; Reviewed	NA|349aa|up_5|NC_009142.1_5686273_5687320_+	NA	cas1|550aa|up_4|NC_009142.1_5689321_5690971_+	cd09634, Cas1_I-II-III, CRISPR/Cas system-associated protein Cas1	cas2|96aa|up_3|NC_009142.1_5690976_5691264_+	pfam09827, CRISPR_Cas2, CRISPR associated protein Cas2	NA|246aa|up_2|NC_009142.1_5691296_5692034_+	NA	NA|567aa|up_1|NC_009142.1_5692058_5693759_+	COG1061, SSL2, DNA or RNA helicases of superfamily II [Transcription / DNA replication, recombination, and repair]	NA|267aa|up_0|NC_009142.1_5695281_5696082_-	PRK06526, PRK06526, transposase; Provisional	csb2gr5|391aa|down_0|NC_009142.1_5697949_5699122_-	TIGR02165, CRISPR-associated_protein_GSU0054_family, CRISPR-associated protein GSU0054/csb2, Dpsyc system	csm3gr7|449aa|down_1|NC_009142.1_5699140_5700487_-	pfam03787, RAMPs, RAMP superfamily	csx10gr5|407aa|down_2|NC_009142.1_5700489_5701710_-	TIGR02674, cas_cyan_RAMP_2, CRISPR-associated RAMP protein, Csx10 family	csm3gr7|167aa|down_3|NC_009142.1_5701706_5702207_-	NA	cas10|458aa|down_4|NC_009142.1_5702238_5703612_-	cd09679, Cas10_III, CRISPR/Cas system-associated protein Cas10	csm3gr7|651aa|down_5|NC_009142.1_5703608_5705561_-	TIGR03986, CRISPR-associated_protein, CRISPR-associated protein	NA|310aa|down_6|NC_009142.1_5706888_5707818_-	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|104aa|down_7|NC_009142.1_5707814_5708126_-	pfam01527, HTH_Tnp_1, Transposase	NA|121aa|down_8|NC_009142.1_5708466_5708829_+	NA	NA|495aa|down_9|NC_009142.1_5708966_5710451_-	pfam18145, SAVED, SMODS-associated and fused to various effectors sensor domain
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	13	5966587-5966853	12	CRISPRCasFinder	no		csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Orphan	CAGCGACCCACCCAGCCGAGCCG	23	0	0	NA	NA	NA	4	4	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|257aa|up_8|NC_009142.1_5956938_5957709_-,NA|91aa|up_5|NC_009142.1_5959936_5960209_+,NA|72aa|down_8|NC_009142.1_5976788_5977004_+	NA|334aa|up_9|NC_009142.1_5955821_5956823_+	COG1609, PurR, Transcriptional regulators [Transcription]	NA|257aa|up_8|NC_009142.1_5956938_5957709_-	NA	NA|241aa|up_7|NC_009142.1_5957748_5958471_-	PRK06194, PRK06194, hypothetical protein; Provisional	NA|359aa|up_6|NC_009142.1_5958615_5959692_-	pfam03417, AAT, Acyl-coenzyme A:6-aminopenicillanic acid acyl-transferase	NA|91aa|up_5|NC_009142.1_5959936_5960209_+	NA	NA|399aa|up_4|NC_009142.1_5960237_5961434_-	pfam00999, Na_H_Exchanger, Sodium/hydrogen exchanger family	NA|237aa|up_3|NC_009142.1_5961492_5962203_-	pfam13539, Peptidase_M15_4, D-alanyl-D-alanine carboxypeptidase	NA|375aa|up_2|NC_009142.1_5962366_5963491_-	pfam13556, HTH_30, PucR C-terminal helix-turn-helix domain	NA|413aa|up_1|NC_009142.1_5963881_5965120_+	TIGR03866, PQQ_ABC_repeats, PQQ-dependent catabolism-associated beta-propeller protein	NA|188aa|up_0|NC_009142.1_5965229_5965793_-	TIGR01642, Splicing_factor_U2AF_59_kDa_subunit, U2 snRNP auxilliary factor, large subunit, splicing factor	NA|284aa|down_0|NC_009142.1_5966868_5967720_-	pfam02567, PhzC-PhzF, Phenazine biosynthesis-like protein	NA|291aa|down_1|NC_009142.1_5967791_5968664_+	COG0583, LysR, Transcriptional regulator [Transcription]	NA|629aa|down_2|NC_009142.1_5968675_5970562_-	pfam10101, DUF2339, Predicted membrane protein (DUF2339)	NA|134aa|down_3|NC_009142.1_5970664_5971066_+	COG2226, UbiE, Methylase involved in ubiquinone/menaquinone biosynthesis [Coenzyme metabolism]	NA|120aa|down_4|NC_009142.1_5971049_5971409_-	pfam05239, PRC, PRC-barrel domain	NA|246aa|down_5|NC_009142.1_5971573_5972311_-	COG0668, MscS, Small-conductance mechanosensitive channel [Cell envelope biogenesis, outer membrane]	NA|1058aa|down_6|NC_009142.1_5972541_5975715_+	COG3903, COG3903, Predicted ATPase [General function prediction only]	NA|292aa|down_7|NC_009142.1_5975758_5976634_-	COG2084, MmsB, 3-hydroxyisobutyrate dehydrogenase and related beta-hydroxyacid dehydrogenases [Lipid metabolism]	NA|72aa|down_8|NC_009142.1_5976788_5977004_+	NA	NA|188aa|down_9|NC_009142.1_5977091_5977655_+	COG1670, RimL, Acetyltransferases, including N-acetylases of ribosomal proteins [Translation, ribosomal structure and biogenesis]
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	14	5986973-5987087	13	CRISPRCasFinder	no		csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Orphan	GCCTGAGCGGAGCACCTGACAGCCTGAGC	29	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|72aa|up_6|NC_009142.1_5976788_5977004_+,NA|88aa|up_3|NC_009142.1_5980017_5980281_-,NA|135aa|down_8|NC_009142.1_5996444_5996849_-	NA|246aa|up_9|NC_009142.1_5971573_5972311_-	COG0668, MscS, Small-conductance mechanosensitive channel [Cell envelope biogenesis, outer membrane]	NA|1058aa|up_8|NC_009142.1_5972541_5975715_+	COG3903, COG3903, Predicted ATPase [General function prediction only]	NA|292aa|up_7|NC_009142.1_5975758_5976634_-	COG2084, MmsB, 3-hydroxyisobutyrate dehydrogenase and related beta-hydroxyacid dehydrogenases [Lipid metabolism]	NA|72aa|up_6|NC_009142.1_5976788_5977004_+	NA	NA|188aa|up_5|NC_009142.1_5977091_5977655_+	COG1670, RimL, Acetyltransferases, including N-acetylases of ribosomal proteins [Translation, ribosomal structure and biogenesis]	NA|609aa|up_4|NC_009142.1_5977823_5979650_-	COG1022, FAA1, Long-chain acyl-CoA synthetases (AMP-forming) [Lipid metabolism]	NA|88aa|up_3|NC_009142.1_5980017_5980281_-	NA	NA|415aa|up_2|NC_009142.1_5980445_5981690_-	cd06412, GH25_CH-type, CH-type (Chalaropsis-type) lysozymes represent one of four functionally-defined classes of peptidoglycan hydrolases (also referred to as endo-N-acetylmuramidases) that cleave bacterial cell wall peptidoglycans	NA|797aa|up_1|NC_009142.1_5982194_5984585_+	COG2183, Tex, Transcriptional accessory protein [Transcription]	NA|203aa|up_0|NC_009142.1_5985608_5986217_+	cd03395, PAP2_like_4, PAP2_like_4 proteins	NA|313aa|down_0|NC_009142.1_5987146_5988085_-	TIGR00633, DNA-apurinic_or_apyrimidinic_site_lyase, exodeoxyribonuclease III (xth)	NA|248aa|down_1|NC_009142.1_5988313_5989057_-	cd04778, HTH_MerR-like_sg2, Helix-Turn-Helix DNA binding domain of putative transcription regulators from the MerR superfamily	NA|242aa|down_2|NC_009142.1_5989202_5989928_-	COG2186, FadR, Transcriptional regulators [Transcription]	NA|256aa|down_3|NC_009142.1_5989998_5990766_-	PRK06057, PRK06057, short chain dehydrogenase; Provisional	NA|457aa|down_4|NC_009142.1_5990866_5992237_-	pfam00171, Aldedh, Aldehyde dehydrogenase family	NA|243aa|down_5|NC_009142.1_5992233_5992962_-	COG2071, COG2071, Predicted glutamine amidotransferases [General function prediction only]	NA|454aa|down_6|NC_009142.1_5992942_5994304_-	COG0174, GlnA, Glutamine synthetase [Amino acid transport and metabolism]	NA|483aa|down_7|NC_009142.1_5994570_5996019_+	TIGR00908, putative_ethanolamine_permease, ethanolamine permease	NA|135aa|down_8|NC_009142.1_5996444_5996849_-	NA	NA|510aa|down_9|NC_009142.1_5997150_5998680_-	COG3333, COG3333, Uncharacterized protein conserved in bacteria [Function unknown]
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	15	6477248-6477328	14	CRISPRCasFinder	no	csa3	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Type I-A	CCGGCAACAGCCGGGCAACCGGC	23	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|61aa|up_5|NC_009142.1_6472723_6472906_-,NA|404aa|up_0|NC_009142.1_6476024_6477236_+,NA|53aa|down_7|NC_009142.1_6484526_6484685_-	NA|258aa|up_9|NC_009142.1_6467501_6468275_-	PRK02083, PRK02083, imidazole glycerol phosphate synthase subunit HisF; Provisional	NA|128aa|up_8|NC_009142.1_6468331_6468715_+	TIGR03666, Rv2061_F420, PPOX class probable F420-dependent enzyme, Rv2061 family	NA|494aa|up_7|NC_009142.1_6469130_6470612_-	pfam08386, Abhydrolase_4, TAP-like protein	NA|244aa|up_6|NC_009142.1_6471041_6471773_-	PRK14024, PRK14024, phosphoribosyl isomerase A; Provisional	NA|61aa|up_5|NC_009142.1_6472723_6472906_-	NA	NA|211aa|up_4|NC_009142.1_6472923_6473556_-	PRK13146, hisH, imidazole glycerol phosphate synthase subunit HisH; Provisional	NA|307aa|up_3|NC_009142.1_6473742_6474663_-	cd07033, TPP_PYR_DXS_TK_like, Pyrimidine (PYR) binding domain of 1-deoxy-D-xylulose-5-phosphate synthase (DXS), transketolase (TK), and related proteins	NA|233aa|up_2|NC_009142.1_6474671_6475370_-	cd02012, TPP_TK, Thiamine pyrophosphate (TPP) family, Transketolase (TK) subfamily, TPP-binding module; TK catalyzes the transfer of a two-carbon unit from ketose phosphates to aldose phosphates	NA|154aa|up_1|NC_009142.1_6475453_6475915_+	cd01110, HTH_SoxR, Helix-Turn-Helix DNA binding domain of the SoxR transcription regulator	NA|404aa|up_0|NC_009142.1_6476024_6477236_+	NA	NA|228aa|down_0|NC_009142.1_6477611_6478295_-	COG4565, CitB, Response regulator of citrate/malate metabolism [Transcription / Signal transduction mechanisms]	NA|538aa|down_1|NC_009142.1_6478291_6479905_-	COG3290, CitA, Signal transduction histidine kinase regulating citrate/malate metabolism [Signal transduction mechanisms]	NA|463aa|down_2|NC_009142.1_6480280_6481669_+	PRK01663, PRK01663, C4-dicarboxylate transporter DctA; Reviewed	NA|94aa|down_3|NC_009142.1_6481936_6482218_+	COG3795, COG3795, Uncharacterized protein conserved in bacteria [Function unknown]	NA|406aa|down_4|NC_009142.1_6482227_6483445_+	COG4941, COG4941, Predicted RNA polymerase sigma factor containing a TPR repeat domain [Transcription]	csa3|115aa|down_5|NC_009142.1_6483667_6484012_+	cd00090, HTH_ARSR, Arsenical Resistance Operon Repressor and similar prokaryotic, metal regulated homodimeric repressors	NA|158aa|down_6|NC_009142.1_6483995_6484469_+	cd07826, SRPBCC_CalC_Aha1-like_9, Putative hydrophobic ligand-binding SRPBCC domain of an uncharacterized subgroup of CalC- and Aha1-like proteins	NA|53aa|down_7|NC_009142.1_6484526_6484685_-	NA	NA|207aa|down_8|NC_009142.1_6487177_6487798_-	PRK00951, hisB, imidazoleglycerol-phosphate dehydratase HisB	NA|373aa|down_9|NC_009142.1_6487794_6488913_-	PRK03317, PRK03317, histidinol-phosphate aminotransferase; Provisional
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	16	6962936-6963021	15	CRISPRCasFinder	no		csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Orphan	CCCGCAAGGCCAGGGTGAGTACGTCGAAAA	30	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA,NA|68aa|down_7|NC_009142.1_6973505_6973709_+	NA|1315aa|up_9|NC_009142.1_6950949_6954894_-	PRK11131, PRK11131, ATP-dependent RNA helicase HrpA; Provisional	NA|219aa|up_8|NC_009142.1_6955023_6955680_-	cd04647, LbH_MAT_like, Maltose O-acyltransferase (MAT)-like: This family is composed of maltose O-acetyltransferase, galactoside O-acetyltransferase (GAT), xenobiotic acyltransferase (XAT) and similar proteins	NA|386aa|up_7|NC_009142.1_6956089_6957247_-	pfam18096, Thump_like, THUMP domain-like	NA|328aa|up_6|NC_009142.1_6957404_6958388_-	pfam08241, Methyltransf_11, Methyltransferase domain	NA|261aa|up_5|NC_009142.1_6958431_6959214_-	PRK05869, PRK05869, enoyl-CoA hydratase; Validated	NA|255aa|up_4|NC_009142.1_6959326_6960091_-	COG1119, ModF, ABC-type molybdenum transport system, ATPase component/photorepair protein PhrA [Inorganic ion transport and metabolism]	NA|182aa|up_3|NC_009142.1_6960599_6961145_+	cd10548, cupin_CDO, cysteine dioxygenase, cupin domain	NA|137aa|up_2|NC_009142.1_6961141_6961552_+	cd01447, Polysulfide_ST, Polysulfide-sulfurtransferase - Rhodanese Homology Domain	NA|279aa|up_1|NC_009142.1_6961757_6962594_+	pfam13560, HTH_31, Helix-turn-helix domain	NA|69aa|up_0|NC_009142.1_6962616_6962823_+	pfam04149, DUF397, Domain of unknown function (DUF397)	NA|375aa|down_0|NC_009142.1_6963380_6964505_+	TIGR00540, TPR_hemY_coli, heme biosynthesis-associated TPR protein	NA|270aa|down_1|NC_009142.1_6964497_6965307_-	pfam13977, TetR_C_6, BetI-type transcriptional repressor, C-terminal	NA|218aa|down_2|NC_009142.1_6965875_6966529_+	pfam02517, Abi, CAAX protease self-immunity	NA|852aa|down_3|NC_009142.1_6966557_6969113_-	cd04299, GT35_Glycogen_Phosphorylase-like, proteins similar to glycogen phosphorylase	NA|420aa|down_4|NC_009142.1_6969197_6970457_+	COG2321, COG2321, Predicted metalloprotease [General function prediction only]	NA|490aa|down_5|NC_009142.1_6970596_6972066_+	COG2321, COG2321, Predicted metalloprotease [General function prediction only]	NA|308aa|down_6|NC_009142.1_6972169_6973093_-	COG3118, COG3118, Thioredoxin domain-containing protein [Posttranslational modification, protein turnover, chaperones]	NA|68aa|down_7|NC_009142.1_6973505_6973709_+	NA	NA|99aa|down_8|NC_009142.1_6973777_6974074_-	pfam01910, Thiamine_BP, Thiamine-binding protein	NA|167aa|down_9|NC_009142.1_6974204_6974705_+	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	17	7106441-7106655	16	CRISPRCasFinder	no		csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Orphan	CCGCAAACCCACGCGCCCCCGCCC	24	1	1	7106465-7106495	NC_009142.1_1071542-1071572	NA	3	3	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA,NA|127aa|down_4|NC_009142.1_7115418_7115799_+	NA|147aa|up_9|NC_009142.1_7096065_7096506_+	smart00960, Robl_LC7, Roadblock/LC7 domain	NA|221aa|up_8|NC_009142.1_7096513_7097176_+	pfam05331, DUF742, Protein of unknown function (DUF742)	NA|201aa|up_7|NC_009142.1_7097255_7097858_+	COG2229, COG2229, Predicted GTPase [General function prediction only]	NA|388aa|up_6|NC_009142.1_7098061_7099225_-	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|197aa|up_5|NC_009142.1_7099439_7100030_-	COG0262, FolA, Dihydrofolate reductase [Coenzyme metabolism]	NA|552aa|up_4|NC_009142.1_7100275_7101931_+	cd01300, YtcJ_like, YtcJ_like metal dependent amidohydrolases	NA|92aa|up_3|NC_009142.1_7102000_7102276_+	pfam11755, DUF3311, Protein of unknown function (DUF3311)	NA|493aa|up_2|NC_009142.1_7102272_7103751_+	cd10322, SLC5sbd, Solute carrier 5 family, sodium/glucose transporters and related proteins; solute-binding domain	NA|315aa|up_1|NC_009142.1_7103779_7104724_-	cd07209, Pat_hypo_Ecoli_Z1214_like, Hypothetical patatin similar to Z1214 protein of Escherichia coli	NA|145aa|up_0|NC_009142.1_7104786_7105221_-	PRK09256, PRK09256, aminoacyl-tRNA hydrolase	NA|763aa|down_0|NC_009142.1_7108289_7110578_+	PRK05222, PRK05222, 5-methyltetrahydropteroyltriglutamate--homocysteine S-methyltransferase; Provisional	NA|312aa|down_1|NC_009142.1_7110665_7111601_+	pfam02517, Abi, CAAX protease self-immunity	NA|296aa|down_2|NC_009142.1_7111624_7112512_-	pfam00494, SQS_PSY, Squalene/phytoene synthase	NA|706aa|down_3|NC_009142.1_7112924_7115042_-	COG0744, MrcB, Membrane carboxypeptidase (penicillin-binding protein) [Cell envelope biogenesis, outer membrane]	NA|127aa|down_4|NC_009142.1_7115418_7115799_+	NA	NA|145aa|down_5|NC_009142.1_7115954_7116389_-	COG4578, GutM, Glucitol operon activator [Transcription]	NA|388aa|down_6|NC_009142.1_7116473_7117637_-	cd08567, GDPD_SpGDE_like, Glycerophosphodiester phosphodiesterase domain of putative Silicibacter pomeroyi glycerophosphodiester phosphodiesterase and similar proteins	NA|385aa|down_7|NC_009142.1_7117646_7118801_-	cd17489, MFS_YfcJ_like, Escherichia coli YfcJ, YhhS, and similar transporters of the Major Facilitator Superfamily	NA|420aa|down_8|NC_009142.1_7118975_7120235_+	smart00631, Zn_pept, Zn_pept domain	NA|291aa|down_9|NC_009142.1_7120468_7121341_-	PRK13875, PRK13875, conjugal transfer protein TrbL; Provisional
GCF_000062885.1_ASM6288v1	NC_009142	Saccharopolyspora erythraea NRRL 2338, complete genome	18	7943191-7943276	17	CRISPRCasFinder	no		csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	Orphan	GAGGAGCGCCGCCAGGAGCTGGA	23	0	0	NA	NA	NA	1	1	Orphan	csa3,cas14j,cas3,c2c9_V-U4,DinG,DEDDh,Cas9_archaeal,WYL,cas4,RT,casR,cas1,cas2,csb2gr5,csm3gr7,csx10gr5,cas10	NA|64aa|up_7|NC_009142.1_7932268_7932460_+,NA|141aa|down_5|NC_009142.1_7949891_7950314_+	NA|67aa|up_9|NC_009142.1_7931072_7931273_-	pfam04149, DUF397, Domain of unknown function (DUF397)	NA|283aa|up_8|NC_009142.1_7931287_7932136_-	pfam13560, HTH_31, Helix-turn-helix domain	NA|64aa|up_7|NC_009142.1_7932268_7932460_+	NA	NA|268aa|up_6|NC_009142.1_7932507_7933311_-	smart00421, HTH_LUXR, helix_turn_helix, Lux Regulon	NA|392aa|up_5|NC_009142.1_7933611_7934787_-	cd04077, Peptidases_S8_PCSK9_ProteinaseK_like, Peptidase S8 family domain in ProteinaseK-like proteins	NA|138aa|up_4|NC_009142.1_7935036_7935450_-	pfam05239, PRC, PRC-barrel domain	NA|195aa|up_3|NC_009142.1_7935647_7936232_+	pfam07179, SseB, SseB protein N-terminal domain	NA|627aa|up_2|NC_009142.1_7936990_7938871_+	COG3387, SGA1, Glucoamylase and related glycosyl hydrolases [Carbohydrate transport and metabolism]	NA|705aa|up_1|NC_009142.1_7939551_7941666_-	PRK10060, PRK10060, cyclic di-GMP phosphodiesterase	NA|280aa|up_0|NC_009142.1_7942142_7942982_+	cd06412, GH25_CH-type, CH-type (Chalaropsis-type) lysozymes represent one of four functionally-defined classes of peptidoglycan hydrolases (also referred to as endo-N-acetylmuramidases) that cleave bacterial cell wall peptidoglycans	NA|369aa|down_0|NC_009142.1_7944112_7945219_-	PLN02316, PLN02316, synthase/transferase	NA|349aa|down_1|NC_009142.1_7945297_7946344_+	pfam13576, Pentapeptide_3, Pentapeptide repeats (9 copies)	NA|764aa|down_2|NC_009142.1_7946372_7948664_-	PRK01213, PRK01213, phosphoribosylformylglycinamidine synthase subunit PurL	NA|234aa|down_3|NC_009142.1_7948660_7949362_-	PRK03619, PRK03619, phosphoribosylformylglycinamidine synthase subunit PurQ	NA|80aa|down_4|NC_009142.1_7949358_7949598_-	PRK05974, PRK05974, phosphoribosylformylglycinamidine synthase subunit PurS; Reviewed	NA|141aa|down_5|NC_009142.1_7949891_7950314_+	NA	NA|334aa|down_6|NC_009142.1_7950436_7951438_+	cd05265, SDR_a1, atypical (a) SDRs, subgroup 1	NA|212aa|down_7|NC_009142.1_7951511_7952147_+	COG2220, COG2220, Predicted Zn-dependent hydrolases of the beta-lactamase fold [General function prediction only]	NA|136aa|down_8|NC_009142.1_7952218_7952626_-	PRK12678, PRK12678, transcription termination factor Rho; Provisional	NA|257aa|down_9|NC_009142.1_7952738_7953509_-	cd11374, CE4_u10, Putative catalytic domain of uncharacterized bacterial proteins from the carbohydrate esterase 4 superfamily
