assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000195815.1_ASM19581v1	NC_002935	Corynebacterium diphtheriae NCTC 13129, complete genome	1	39014-39496	1,1,1	CRISPRCasFinder,CRT,PILER-CR	no	cas9,cas1,cas2	cas9,cas1,cas2,DEDDh,csa3,cas3,WYL,cas4,DinG,cas5,cas7,cse2gr11,cas8e,cas6e	 or Type II-C?,Type II-B,Type II-C,Type II-A, Type II-B	GAAGTCTATCAGGGTTTTTGAGAACTGAACCCCAGT,GAAGTCTATCAGGGTTTTTGAGAACTGAACCCCAGT,GAAGTCTATCAGGGTTTTTGAGAACTGAACCCCAG	36,36,35	0	0	NA	NA	NA:NA:NA	6,7,3	7	orTypeII-C?,TypeII-B,TypeII-C,TypeII-A,TypeII-B	cas9,cas1,cas2,DEDDh,csa3,cas3,WYL,cas4,DinG,cas5,cas7,cse2gr11,cas8e,cas6e	NA,NA	NA|600aa|up_9|NC_002935.2_27566_29366_+	PRK09284, PRK09284, thiamine biosynthesis protein ThiC; Provisional	NA|223aa|up_8|NC_002935.2_29349_30018_+	PRK00043, thiE, thiamine phosphate synthase	NA|363aa|up_7|NC_002935.2_30014_31103_+	TIGR02352, Glycine_oxidase, glycine oxidase ThiO	NA|67aa|up_6|NC_002935.2_31086_31287_+	TIGR01683, thiamine_biosynthesis_protein_ThiS, thiamine biosynthesis protein ThiS	NA|262aa|up_5|NC_002935.2_31288_32074_+	PRK00208, thiG, thiazole synthase; Reviewed	NA|337aa|up_4|NC_002935.2_32073_33084_+	PRK05600, PRK05600, thiamine biosynthesis protein ThiF; Validated	NA|273aa|up_3|NC_002935.2_33080_33899_+	PRK14713, PRK14713, bifunctional hydroxymethylpyrimidine kinase/phosphomethylpyrimidine kinase	cas9|1085aa|up_2|NC_002935.2_34477_37732_+	pfam18470, Cas9_a, Cas9 alpha-helical lobe domain	cas1|305aa|up_1|NC_002935.2_37735_38650_+	cd09720, Cas1_II, CRISPR/Cas system-associated protein Cas1	cas2|110aa|up_0|NC_002935.2_38633_38963_+	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	NA|78aa|down_0|NC_002935.2_42735_42969_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|90aa|down_1|NC_002935.2_43307_43577_-	PRK00159, PRK00159, putative septation inhibitor protein; Reviewed	NA|674aa|down_2|NC_002935.2_43693_45715_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|502aa|down_3|NC_002935.2_45711_47217_-	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|487aa|down_4|NC_002935.2_47229_48690_-	COG0768, FtsI, Cell division protein FtsI/penicillin-binding protein 2 [Cell envelope biogenesis, outer membrane]	NA|450aa|down_5|NC_002935.2_48686_50036_-	COG0772, FtsW, Bacterial cell division membrane protein [Cell division and chromosome partitioning]	NA|485aa|down_6|NC_002935.2_50036_51491_-	COG0631, PTC1, Serine/threonine protein phosphatase [Signal transduction mechanisms]	NA|163aa|down_7|NC_002935.2_51490_51979_-	COG1716, COG1716, FOG: FHA domain [Signal transduction mechanisms]	NA|289aa|down_8|NC_002935.2_51992_52859_-	pfam12401, DUF3662, Protein of unknown function (DUF2662)	NA|745aa|down_9|NC_002935.2_53812_56047_-	cd07552, P-type_ATPase_Cu-like, P-type heavy metal-transporting ATPase, similar to Archaeoglobus fulgidus CopB, a Cu(2+)-ATPase
GCF_000195815.1_ASM19581v1	NC_002935	Corynebacterium diphtheriae NCTC 13129, complete genome	2	979277-979376	2	CRISPRCasFinder	no		cas9,cas1,cas2,DEDDh,csa3,cas3,WYL,cas4,DinG,cas5,cas7,cse2gr11,cas8e,cas6e	Orphan	GGTGCGGCAGATGGTATCGACGATGGCATTTCCGTT	36	1	1	979313-979340	NC_002935.2_1771042-1771015	NA	1	1	Orphan	cas9,cas1,cas2,DEDDh,csa3,cas3,WYL,cas4,DinG,cas5,cas7,cse2gr11,cas8e,cas6e	NA|138aa|up_9|NC_002935.2_964907_965321_+,NA|170aa|up_4|NC_002935.2_968958_969468_+,NA|227aa|up_3|NC_002935.2_969518_970199_+,NA|277aa|up_0|NC_002935.2_977877_978708_-,NA|181aa|down_4|NC_002935.2_983605_984148_-,NA|94aa|down_7|NC_002935.2_987077_987359_+	NA|138aa|up_9|NC_002935.2_964907_965321_+	NA	NA|148aa|up_8|NC_002935.2_965351_965795_+	PRK00182, tatB, Sec-independent protein translocase subunit TatB	NA|378aa|up_7|NC_002935.2_965797_966931_-	pfam10609, ParA, NUBPL iron-transfer P-loop NTPase	NA|199aa|up_6|NC_002935.2_966943_967540_-	COG4420, COG4420, Predicted membrane protein [Function unknown]	NA|430aa|up_5|NC_002935.2_967543_968833_-	COG2239, MgtE, Mg/Co/Ni transporter MgtE (contains CBS domain) [Inorganic ion transport and metabolism]	NA|170aa|up_4|NC_002935.2_968958_969468_+	NA	NA|227aa|up_3|NC_002935.2_969518_970199_+	NA	NA|1238aa|up_2|NC_002935.2_970253_973967_-	PRK12270, kgd, multifunctional oxoglutarate decarboxylase/oxoglutarate dehydrogenase thiamine pyrophosphate-binding subunit/dihydrolipoyllysine-residue succinyltransferase subunit	NA|1247aa|up_1|NC_002935.2_974129_977870_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|277aa|up_0|NC_002935.2_977877_978708_-	NA	NA|271aa|down_0|NC_002935.2_979491_980304_-	PRK12550, PRK12550, shikimate 5-dehydrogenase; Reviewed	NA|527aa|down_1|NC_002935.2_980323_981904_+	COG2272, PnbA, Carboxylesterase type B [Lipid metabolism]	NA|270aa|down_2|NC_002935.2_981925_982735_+	pfam11575, FhuF_C, FhuF 2Fe-2S C-terminal domain	NA|271aa|down_3|NC_002935.2_982784_983597_+	PRK12298, obgE, GTPase CgtA; Reviewed	NA|181aa|down_4|NC_002935.2_983605_984148_-	NA	NA|306aa|down_5|NC_002935.2_984452_985370_+	cd09022, Aldose_epim_Ec_YihR, Aldose 1-epimerase, similar to Escherichia coli YihR	NA|553aa|down_6|NC_002935.2_985406_987065_+	cd11478, SLC5sbd_u2, Uncharacterized bacterial solute carrier 5 subfamily; putative solute-binding domain	NA|94aa|down_7|NC_002935.2_987077_987359_+	NA	NA|377aa|down_8|NC_002935.2_987358_988489_+	cd00608, GalT, Galactose-1-phosphate uridyl transferase (GalT): This enzyme plays a key role in galactose metabolism by catalysing the transfer of a uridine 5'-phosphoryl group from UDP-galactose 1-phosphate	NA|410aa|down_9|NC_002935.2_988472_989702_+	COG0153, GalK, Galactokinase [Carbohydrate transport and metabolism]
GCF_000195815.1_ASM19581v1	NC_002935	Corynebacterium diphtheriae NCTC 13129, complete genome	3	1499043-1499155	3	CRISPRCasFinder	no		cas9,cas1,cas2,DEDDh,csa3,cas3,WYL,cas4,DinG,cas5,cas7,cse2gr11,cas8e,cas6e	Orphan	GCTGGTTTAGGAGCCGCAGGCTT	23	0	0	NA	NA	NA	2	2	Orphan	cas9,cas1,cas2,DEDDh,csa3,cas3,WYL,cas4,DinG,cas5,cas7,cse2gr11,cas8e,cas6e	NA,NA	NA|756aa|up_9|NC_002935.2_1486306_1488574_-	TIGR02696, polyribonucleotide_nucleotidyltransferase, guanosine pentaphosphate synthetase I/polynucleotide phosphorylase	NA|90aa|up_8|NC_002935.2_1488765_1489035_-	PRK05626, rpsO, 30S ribosomal protein S15; Reviewed	NA|320aa|up_7|NC_002935.2_1489206_1490166_-	cd02650, nuc_hydro_CaPnhB, NH_hydro_CaPnhB: A subgroup of nucleoside hydrolases similar to Corynebacterium ammoniagenes Purine/pyrimidine nucleoside hydrolase (pnhB)	NA|324aa|up_6|NC_002935.2_1490203_1491175_-	PRK05627, PRK05627, bifunctional riboflavin kinase/FAD synthetase	NA|301aa|up_5|NC_002935.2_1491197_1492100_+	PRK03287, truB, tRNA pseudouridine synthase B; Provisional	NA|231aa|up_4|NC_002935.2_1492096_1492789_-	COG2977, EntD, Phosphopantetheinyl transferase component of siderophore synthetase [Secondary metabolites biosynthesis, transport, and catabolism]	NA|269aa|up_3|NC_002935.2_1492785_1493592_-	COG1409, Icc, Predicted phosphohydrolases [General function prediction only]	NA|440aa|up_2|NC_002935.2_1493638_1494958_-	cd13136, MATE_DinF_like, DinF and similar proteins, a subfamily of the multidrug and toxic compound extrusion (MATE)-like proteins	NA|314aa|up_1|NC_002935.2_1494954_1495896_-	COG0618, COG0618, Exopolyphosphatase-related proteins [General function prediction only]	NA|148aa|up_0|NC_002935.2_1495935_1496379_-	PRK00521, rbfA, 30S ribosome-binding factor RbfA	NA|111aa|down_0|NC_002935.2_1499490_1499823_-	pfam04296, DUF448, Protein of unknown function (DUF448)	NA|333aa|down_1|NC_002935.2_1500078_1501077_-	PRK12327, nusA, transcription elongation factor NusA; Provisional	NA|185aa|down_2|NC_002935.2_1501073_1501628_-	PRK00092, PRK00092, ribosome maturation protein RimP; Reviewed	NA|303aa|down_3|NC_002935.2_1501679_1502588_+	pfam14530, DUF4439, Domain of unknown function (DUF4439)	NA|586aa|down_4|NC_002935.2_1502666_1504424_-	PRK09194, PRK09194, prolyl-tRNA synthetase; Provisional	NA|249aa|down_5|NC_002935.2_1504455_1505202_+	PRK02101, PRK02101, peroxide stress protein YaaA	NA|275aa|down_6|NC_002935.2_1505221_1506046_-	cd11642, SUMT, Uroporphyrin-III C-methyltransferase (also known as S-Adenosyl-L-methionine:uroporphyrinogen III methyltransferase, SUMT)	NA|449aa|down_7|NC_002935.2_1506044_1507391_+	PRK00029, PRK00029, YdiU family protein	NA|375aa|down_8|NC_002935.2_1507394_1508519_-	COG0523, COG0523, Putative GTPases (G3E family) [General function prediction only]	NA|170aa|down_9|NC_002935.2_1508538_1509048_-	pfam01035, DNA_binding_1, 6-O-methylguanine DNA methyltransferase, DNA binding domain
GCF_000195815.1_ASM19581v1	NC_002935	Corynebacterium diphtheriae NCTC 13129, complete genome	4	1824800-1824907	4	CRISPRCasFinder	no		cas9,cas1,cas2,DEDDh,csa3,cas3,WYL,cas4,DinG,cas5,cas7,cse2gr11,cas8e,cas6e	Orphan	ACAGCGCGACGACGCCCACGGGAG	24	0	0	NA	NA	NA	1	1	Orphan	cas9,cas1,cas2,DEDDh,csa3,cas3,WYL,cas4,DinG,cas5,cas7,cse2gr11,cas8e,cas6e	NA|84aa|up_3|NC_002935.2_1821943_1822195_-,NA	NA|274aa|up_9|NC_002935.2_1816727_1817549_-	pfam02645, DegV, Uncharacterized protein, DegV family COG1307	NA|241aa|up_8|NC_002935.2_1817553_1818276_-	pfam00300, His_Phos_1, Histidine phosphatase superfamily (branch 1)	NA|156aa|up_7|NC_002935.2_1818282_1818750_-	pfam02410, RsfS, Ribosomal silencing factor during starvation	NA|229aa|up_6|NC_002935.2_1818772_1819459_-	PRK00071, nadD, nicotinate-nucleotide adenylyltransferase	NA|431aa|up_5|NC_002935.2_1819482_1820775_-	PRK00197, proA, gamma-glutamyl phosphate reductase; Provisional	NA|377aa|up_4|NC_002935.2_1820792_1821923_-	PRK05429, PRK05429, gamma-glutamyl kinase; Provisional	NA|84aa|up_3|NC_002935.2_1821943_1822195_-	NA	NA|509aa|up_2|NC_002935.2_1822198_1823725_-	PRK12296, obgE, GTPase CgtA; Reviewed	NA|89aa|up_1|NC_002935.2_1823885_1824152_-	PRK05435, rpmA, 50S ribosomal protein L27; Validated	NA|102aa|up_0|NC_002935.2_1824192_1824498_-	PRK05573, rplU, 50S ribosomal protein L21; Validated	NA|137aa|down_0|NC_002935.2_1827842_1828253_-	PRK00668, ndk, mulitfunctional nucleoside diphosphate kinase/apyrimidinic endonuclease/3'-; Validated	NA|138aa|down_1|NC_002935.2_1828444_1828858_-	pfam14017, DUF4233, Protein of unknown function (DUF4233)	NA|499aa|down_2|NC_002935.2_1828854_1830351_-	COG0285, FolC, Folylpolyglutamate synthase [Coenzyme metabolism]	NA|903aa|down_3|NC_002935.2_1830347_1833056_-	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|327aa|down_4|NC_002935.2_1833150_1834131_-	PRK05442, PRK05442, malate dehydrogenase; Provisional	NA|251aa|down_5|NC_002935.2_1834613_1835366_+	pfam17938, TetR_C_29, Tetracyclin repressor-like, C-terminal domain	NA|431aa|down_6|NC_002935.2_1835402_1836695_-	PRK05342, clpX, ATP-dependent Clp protease ATP-binding subunit ClpX	NA|842aa|down_7|NC_002935.2_1836841_1839367_-	COG0147, TrpE, Anthranilate/para-aminobenzoate synthases component I [Amino acid transport and metabolism / Coenzyme metabolism]	NA|210aa|down_8|NC_002935.2_1839461_1840091_-	PRK12553, PRK12553, ATP-dependent Clp protease proteolytic subunit; Reviewed	NA|200aa|down_9|NC_002935.2_1840108_1840708_-	PRK00277, clpP, ATP-dependent Clp protease proteolytic subunit; Reviewed
GCF_000195815.1_ASM19581v1	NC_002935	Corynebacterium diphtheriae NCTC 13129, complete genome	5	2306022-2307638	2,5,2	PILER-CR,CRISPRCasFinder,CRT	no	cas5,cas7,cse2gr11,cas8e,cas6e,cas3,cas1,cas2	cas9,cas1,cas2,DEDDh,csa3,cas3,WYL,cas4,DinG,cas5,cas7,cse2gr11,cas8e,cas6e	Type I-E	GTCTTCTCCGCACACGCGGAGGTATTTC,GTCTTCTCCGCACACGCGGAGGTATTTCC,GTCTTCTCCGCACACGCGGAGGTATTTCC	28,29,29	0	0	NA	NA	I-C,I-E,II-B:I-C,I-E,II-B:I-C,I-E,II-B	26,26,26	26	TypeI-E	cas9,cas1,cas2,DEDDh,csa3,cas3,WYL,cas4,DinG,cas5,cas7,cse2gr11,cas8e,cas6e	NA,NA|57aa|down_0|NC_002935.2_2307663_2307834_+,NA|226aa|down_2|NC_002935.2_2309126_2309804_+,NA|92aa|down_3|NC_002935.2_2310209_2310485_+,NA|50aa|down_4|NC_002935.2_2310640_2310790_+	NA|92aa|up_9|NC_002935.2_2294402_2294678_-	cd03214, ABC_Iron-Siderophores_B12_Hemin, ATP-binding component of iron-siderophores, vitamin B12 and hemin transporters and related proteins	NA|607aa|up_8|NC_002935.2_2295147_2296968_+	COG5479, COG5479, Uncharacterized protein potentially involved in peptidoglycan biosynthesis [Cell envelope biogenesis, outer membrane]	cas5|243aa|up_7|NC_002935.2_2297076_2297805_-	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|353aa|up_6|NC_002935.2_2297797_2298856_-	pfam09344, Cas_CT1975, CT1975-like protein	cse2gr11|195aa|up_5|NC_002935.2_2298911_2299496_-	TIGR02548, CRISPR_system_Cascade_subunit_CasB, CRISPR type I-E/ECOLI-associated protein CasB/Cse2	cas8e|519aa|up_4|NC_002935.2_2299488_2301045_-	pfam09481, CRISPR_Cse1, CRISPR-associated protein Cse1 (CRISPR_cse1)	cas6e|229aa|up_3|NC_002935.2_2301410_2302097_+	cd09727, Cas6_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas6e	cas3|877aa|up_2|NC_002935.2_2302096_2304727_+	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	cas1|320aa|up_1|NC_002935.2_2304728_2305688_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|105aa|up_0|NC_002935.2_2305688_2306003_+	pfam09707, Cas_Cas2CT1978, CRISPR-associated protein (Cas_Cas2CT1978)	NA|57aa|down_0|NC_002935.2_2307663_2307834_+	NA	NA|172aa|down_1|NC_002935.2_2307892_2308408_+	PRK07772, PRK07772, single-stranded DNA-binding protein; Provisional	NA|226aa|down_2|NC_002935.2_2309126_2309804_+	NA	NA|92aa|down_3|NC_002935.2_2310209_2310485_+	NA	NA|50aa|down_4|NC_002935.2_2310640_2310790_+	NA	NA|270aa|down_5|NC_002935.2_2310947_2311757_-	pfam17802, SpaA, Prealbumin-like fold domain	NA|349aa|down_6|NC_002935.2_2311829_2312876_-	cd05827, Sortase_C, Sortase domain found in class C sortases	NA|319aa|down_7|NC_002935.2_2312859_2313816_-	cd05827, Sortase_C, Sortase domain found in class C sortases	NA|556aa|down_8|NC_002935.2_2314005_2315673_-	TIGR04226, Fimbrial_subunit_type_2, fimbrial isopeptide formation D2 domain	NA|1376aa|down_9|NC_002935.2_2315776_2319904_-	COG4932, COG4932, Predicted outer membrane protein [Cell envelope biogenesis, outer membrane]
