assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001922285.1_ASM192228v1	NZ_CP017292	Corynebacterium pseudotuberculosis strain MEX31, complete genome	1	22351-22564	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no	cas2,cas1,cas3,cas6e,cas8e,cse2gr11,cas7,cas5	cas2,cas1,cas3,cas6e,cas8e,cse2gr11,cas7,cas5,DEDDh,WYL,cas4,csa3,DinG	Type I-E	ACGGGAACTACCTCCGCATACGCGGAGAAAAGT,GGAACTACCTCCGCATACGCGGAGAAAAG,GGAACTACCTCCGCATACGCGGAGAAAAGT	33,29,30	0	0	NA	NA	I-C,I-E,II-B:I-C,I-E,II-B:I-C,I-E,II-B	2,3,3	3	TypeI-E	cas2,cas1,cas3,cas6e,cas8e,cse2gr11,cas7,cas5,DEDDh,WYL,cas4,csa3,DinG	NA|224aa|up_5|NZ_CP017292.1_17642_18314_-,NA|112aa|up_2|NZ_CP017292.1_20315_20651_+,NA|64aa|up_1|NZ_CP017292.1_20724_20916_+,NA|100aa|up_0|NZ_CP017292.1_21717_22017_-,NA	NA|172aa|up_9|NZ_CP017292.1_13536_14052_+	smart00112, CA, Cadherin repeats	NA|334aa|up_8|NZ_CP017292.1_14682_15684_+	cd06312, PBP1_ABC_sugar_binding-like, periplasmic sugar-binding domain of uncharacterized ABC-type transport systems	NA|362aa|up_7|NZ_CP017292.1_15680_16766_+	COG1172, AraH, Ribose/xylose/arabinose/galactoside ABC-type transport systems, permease components [Carbohydrate transport and metabolism]	NA|258aa|up_6|NZ_CP017292.1_16767_17541_+	COG1129, MglA, ABC-type sugar transport system, ATPase component [Carbohydrate transport and metabolism]	NA|224aa|up_5|NZ_CP017292.1_17642_18314_-	NA	NA|179aa|up_4|NZ_CP017292.1_18391_18928_+	COG0652, PpiB, Peptidyl-prolyl cis-trans isomerase (rotamase) - cyclophilin family [Posttranslational modification, protein turnover, chaperones]	NA|257aa|up_3|NZ_CP017292.1_18989_19760_+	pfam01694, Rhomboid, Rhomboid family	NA|112aa|up_2|NZ_CP017292.1_20315_20651_+	NA	NA|64aa|up_1|NZ_CP017292.1_20724_20916_+	NA	NA|100aa|up_0|NZ_CP017292.1_21717_22017_-	NA	cas2|124aa|down_0|NZ_CP017292.1_22581_22953_-	pfam09707, Cas_Cas2CT1978, CRISPR-associated protein (Cas_Cas2CT1978)	cas1|318aa|down_1|NZ_CP017292.1_22953_23907_-	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas3|896aa|down_2|NZ_CP017292.1_23909_26597_-	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	cas6e|237aa|down_3|NZ_CP017292.1_26617_27328_-	cd09727, Cas6_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas6e	cas8e|538aa|down_4|NZ_CP017292.1_27538_29152_+	pfam09481, CRISPR_Cse1, CRISPR-associated protein Cse1 (CRISPR_cse1)	cse2gr11|198aa|down_5|NZ_CP017292.1_29148_29742_+	TIGR02548, CRISPR_system_Cascade_subunit_CasB, CRISPR type I-E/ECOLI-associated protein CasB/Cse2	cas7|356aa|down_6|NZ_CP017292.1_29741_30809_+	pfam09344, Cas_CT1975, CT1975-like protein	cas5|231aa|down_7|NZ_CP017292.1_30820_31513_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	NA|347aa|down_8|NZ_CP017292.1_31587_32628_-	COG3677, COG3677, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|308aa|down_9|NZ_CP017292.1_33035_33959_+	cd08576, GDPD_like_SMaseD_PLD, Glycerophosphodiester phosphodiesterase-like domain of spider venom sphingomyelinases D, bacterial phospholipase D, and similar proteins
GCF_001922285.1_ASM192228v1	NZ_CP017292	Corynebacterium pseudotuberculosis strain MEX31, complete genome	2	27379-27450	2	CRISPRCasFinder	no	cas2,cas1,cas3,cas6e,cas8e,cse2gr11,cas7,cas5	cas2,cas1,cas3,cas6e,cas8e,cse2gr11,cas7,cas5,DEDDh,WYL,cas4,csa3,DinG	Type I-E	TTCCTCGCGTCCTGCGGGGGTAG	23	0	0	NA	NA	NA	1	1	TypeI-E	cas2,cas1,cas3,cas6e,cas8e,cse2gr11,cas7,cas5,DEDDh,WYL,cas4,csa3,DinG	NA|112aa|up_7|NZ_CP017292.1_20315_20651_+,NA|64aa|up_6|NZ_CP017292.1_20724_20916_+,NA|100aa|up_5|NZ_CP017292.1_21717_22017_-,NA|148aa|up_4|NZ_CP017292.1_22027_22471_-,NA	NA|179aa|up_9|NZ_CP017292.1_18391_18928_+	COG0652, PpiB, Peptidyl-prolyl cis-trans isomerase (rotamase) - cyclophilin family [Posttranslational modification, protein turnover, chaperones]	NA|257aa|up_8|NZ_CP017292.1_18989_19760_+	pfam01694, Rhomboid, Rhomboid family	NA|112aa|up_7|NZ_CP017292.1_20315_20651_+	NA	NA|64aa|up_6|NZ_CP017292.1_20724_20916_+	NA	NA|100aa|up_5|NZ_CP017292.1_21717_22017_-	NA	NA|148aa|up_4|NZ_CP017292.1_22027_22471_-	NA	cas2|124aa|up_3|NZ_CP017292.1_22581_22953_-	pfam09707, Cas_Cas2CT1978, CRISPR-associated protein (Cas_Cas2CT1978)	cas1|318aa|up_2|NZ_CP017292.1_22953_23907_-	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas3|896aa|up_1|NZ_CP017292.1_23909_26597_-	PRK09694, PRK09694, CRISPR-associated helicase/endonuclease Cas3	cas6e|237aa|up_0|NZ_CP017292.1_26617_27328_-	cd09727, Cas6_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas6e	cas8e|538aa|down_0|NZ_CP017292.1_27538_29152_+	pfam09481, CRISPR_Cse1, CRISPR-associated protein Cse1 (CRISPR_cse1)	cse2gr11|198aa|down_1|NZ_CP017292.1_29148_29742_+	TIGR02548, CRISPR_system_Cascade_subunit_CasB, CRISPR type I-E/ECOLI-associated protein CasB/Cse2	cas7|356aa|down_2|NZ_CP017292.1_29741_30809_+	pfam09344, Cas_CT1975, CT1975-like protein	cas5|231aa|down_3|NZ_CP017292.1_30820_31513_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	NA|347aa|down_4|NZ_CP017292.1_31587_32628_-	COG3677, COG3677, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|308aa|down_5|NZ_CP017292.1_33035_33959_+	cd08576, GDPD_like_SMaseD_PLD, Glycerophosphodiester phosphodiesterase-like domain of spider venom sphingomyelinases D, bacterial phospholipase D, and similar proteins	NA|289aa|down_6|NZ_CP017292.1_34011_34878_-	COG1120, FepC, ABC-type cobalamin/Fe3+-siderophores transport systems, ATPase components [Inorganic ion transport and metabolism / Coenzyme metabolism]	NA|329aa|down_7|NZ_CP017292.1_34886_35873_-	PRK10440, PRK10440, iron-enterobactin ABC transporter permease	NA|356aa|down_8|NZ_CP017292.1_35872_36940_-	PRK10441, PRK10441, Fe(3+)-siderophore ABC transporter permease	NA|351aa|down_9|NZ_CP017292.1_36986_38039_+	cd01146, FhuD, Fe3+-siderophore binding domain FhuD
GCF_001922285.1_ASM192228v1	NZ_CP017292	Corynebacterium pseudotuberculosis strain MEX31, complete genome	3	642487-642580	3	CRISPRCasFinder	no		cas2,cas1,cas3,cas6e,cas8e,cse2gr11,cas7,cas5,DEDDh,WYL,cas4,csa3,DinG	Orphan	GTGTGTTGTTTGAGAACTCAATAGTGTGCCA	31	1	1	642518-642549	NZ_CP017292.1_1060052-1060083	NA	1	1	Orphan	cas2,cas1,cas3,cas6e,cas8e,cse2gr11,cas7,cas5,DEDDh,WYL,cas4,csa3,DinG	NA|126aa|up_7|NZ_CP017292.1_635922_636300_-,NA|64aa|up_6|NZ_CP017292.1_636296_636488_-,NA|67aa|up_4|NZ_CP017292.1_637763_637964_+,NA	NA|301aa|up_9|NZ_CP017292.1_632571_633474_+	COG2177, FtsX, Cell division protein [Cell division and chromosome partitioning]	NA|164aa|up_8|NZ_CP017292.1_633581_634073_+	pfam01668, SmpB, SmpB protein	NA|126aa|up_7|NZ_CP017292.1_635922_636300_-	NA	NA|64aa|up_6|NZ_CP017292.1_636296_636488_-	NA	NA|241aa|up_5|NZ_CP017292.1_636993_637716_+	cd00884, beta_CA_cladeB, Carbonic anhydrases (CA) are zinc-containing enzymes that catalyze the reversible hydration of carbon dioxide in a two-step mechanism in which the nucleophilic attack of a zinc-bound hydroxide ion on carbon dioxide is followed by the regeneration of an active site by ionization of the zinc-bound water molecule and removal of a proton from the active site	NA|67aa|up_4|NZ_CP017292.1_637763_637964_+	NA	NA|331aa|up_3|NZ_CP017292.1_638324_639317_+	COG4607, CeuA, ABC-type enterochelin transport system, periplasmic component [Inorganic ion transport and metabolism]	NA|322aa|up_2|NZ_CP017292.1_639433_640399_+	COG4606, CeuB, ABC-type enterochelin transport system, permease component [Inorganic ion transport and metabolism]	NA|353aa|up_1|NZ_CP017292.1_640391_641450_+	COG4605, CeuC, ABC-type enterochelin transport system, permease component [Inorganic ion transport and metabolism]	NA|252aa|up_0|NZ_CP017292.1_641446_642202_+	COG4604, CeuD, ABC-type enterochelin transport system, ATPase component [Inorganic ion transport and metabolism]	NA|214aa|down_0|NZ_CP017292.1_649559_650201_-	pfam11580, DUF3239, Protein of unknown function (DUF3239)	NA|550aa|down_1|NZ_CP017292.1_650267_651917_-	COG1061, SSL2, DNA or RNA helicases of superfamily II [Transcription / DNA replication, recombination, and repair]	NA|833aa|down_2|NZ_CP017292.1_652031_654530_-	pfam13625, Helicase_C_3, Helicase conserved C-terminal domain	NA|208aa|down_3|NZ_CP017292.1_654770_655394_-	pfam06737, Transglycosylas, Transglycosylase-like domain	NA|131aa|down_4|NZ_CP017292.1_656218_656611_+	cd04458, CSP_CDS, Cold-Shock Protein (CSP) contains an S1-like cold-shock domain (CSD) that is found in eukaryotes, prokaryotes, and archaea	NA|176aa|down_5|NZ_CP017292.1_656679_657207_-	pfam10969, DUF2771, Protein of unknown function (DUF2771)	NA|314aa|down_6|NZ_CP017292.1_657235_658177_-	pfam05096, Glu_cyclase_2, Glutamine cyclotransferase	NA|245aa|down_7|NZ_CP017292.1_658233_658968_+	pfam11228, DUF3027, Protein of unknown function (DUF3027)	NA|493aa|down_8|NZ_CP017292.1_659181_660660_+	COG2252, COG2252, Xanthine/uracil/vitamin C permease [Nucleotide transport and    metabolism]	NA|291aa|down_9|NZ_CP017292.1_660746_661619_+	COG0566, SpoU, rRNA methylases [Translation, ribosomal structure and biogenesis]
GCF_001922285.1_ASM192228v1	NZ_CP017292	Corynebacterium pseudotuberculosis strain MEX31, complete genome	4	1842798-1842887	4	CRISPRCasFinder	no	DinG	cas2,cas1,cas3,cas6e,cas8e,cse2gr11,cas7,cas5,DEDDh,WYL,cas4,csa3,DinG	Type IV-A	CCTTTTCTCCGCGCACGCGGAGGTAGTTC	29	0	0	NA	NA	I-C,I-E,II-B	1	1	Orphan	cas2,cas1,cas3,cas6e,cas8e,cse2gr11,cas7,cas5,DEDDh,WYL,cas4,csa3,DinG	NA,NA|90aa|down_0|NZ_CP017292.1_1842932_1843202_+,NA|64aa|down_1|NZ_CP017292.1_1843394_1843586_+,NA|82aa|down_3|NZ_CP017292.1_1843937_1844183_+,NA|280aa|down_4|NZ_CP017292.1_1844972_1845812_-,NA|76aa|down_6|NZ_CP017292.1_1847050_1847278_-,NA|99aa|down_7|NZ_CP017292.1_1848044_1848341_-	NA|245aa|up_9|NZ_CP017292.1_1832675_1833410_-	PRK00173, rph, ribonuclease PH; Reviewed	NA|256aa|up_8|NZ_CP017292.1_1833448_1834216_-	cd07716, RNaseZ_short-form-like_MBL-fold, uncharacterized bacterial subgroup of Ribonuclease Z, short form; MBL-fold metallo-hydrolase domain	NA|298aa|up_7|NZ_CP017292.1_1834288_1835182_-	PRK00865, PRK00865, glutamate racemase; Provisional	NA|273aa|up_6|NZ_CP017292.1_1835255_1836074_-	pfam01694, Rhomboid, Rhomboid family	NA|179aa|up_5|NZ_CP017292.1_1836160_1836697_-	pfam09438, DUF2017, Domain of unknown function (DUF2017)	NA|127aa|up_4|NZ_CP017292.1_1836791_1837172_-	PRK00033, clpS, ATP-dependent Clp protease adaptor protein ClpS; Reviewed	NA|453aa|up_3|NZ_CP017292.1_1837297_1838656_+	PRK09243, PRK09243, nicotinate phosphoribosyltransferase; Validated	DinG|665aa|up_2|NZ_CP017292.1_1838708_1840703_+	COG1199, DinG, Rad3-related DNA helicases [Transcription / DNA replication, recombination, and repair]	NA|166aa|up_1|NZ_CP017292.1_1840726_1841224_+	pfam13302, Acetyltransf_3, Acetyltransferase (GNAT) domain	NA|428aa|up_0|NZ_CP017292.1_1841220_1842504_-	cd07500, HAD_PSP, phosphoserine phosphatase (PSP), similar to Methanococcus Jannaschii PSP and Saccharomyces cerevisiae SER2p	NA|90aa|down_0|NZ_CP017292.1_1842932_1843202_+	NA	NA|64aa|down_1|NZ_CP017292.1_1843394_1843586_+	NA	NA|80aa|down_2|NZ_CP017292.1_1843655_1843895_+	pfam02661, Fic, Fic/DOC family	NA|82aa|down_3|NZ_CP017292.1_1843937_1844183_+	NA	NA|280aa|down_4|NZ_CP017292.1_1844972_1845812_-	NA	NA|88aa|down_5|NZ_CP017292.1_1846537_1846801_-	cd02042, ParAB_family, partition proteins ParAB family	NA|76aa|down_6|NZ_CP017292.1_1847050_1847278_-	NA	NA|99aa|down_7|NZ_CP017292.1_1848044_1848341_-	NA	NA|51aa|down_8|NZ_CP017292.1_1848696_1848849_-	pfam04796, RepA_C, Plasmid encoded RepA protein	NA|79aa|down_9|NZ_CP017292.1_1849022_1849259_-	pfam04796, RepA_C, Plasmid encoded RepA protein
