assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_002290205.1_ASM229020v1	NZ_CP023166	Salmonella enterica subsp. enterica serovar Saintpaul strain SGB23 chromosome, complete genome	1	592861-592961	1	CRISPRCasFinder	no		cas3,PD-DExK,csa3,WYL,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Orphan	GCTTCAGTGGCGAACGTCGTGAA	23	0	0	NA	NA	NA	1	1	Orphan	cas3,PD-DExK,csa3,WYL,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA|177aa|down_1|NZ_CP023166.1_594479_595010_-	NA|448aa|up_9|NZ_CP023166.1_578939_580283_-	PRK05370, PRK05370, argininosuccinate synthase; Validated	NA|151aa|up_8|NZ_CP023166.1_580910_581363_+	PRK00092, PRK00092, ribosome maturation protein RimP; Reviewed	NA|501aa|up_7|NZ_CP023166.1_581390_582893_+	PRK09202, nusA, transcription elongation factor NusA; Validated	NA|893aa|up_6|NZ_CP023166.1_582917_585596_+	PRK05306, infB, translation initiation factor IF-2; Validated	NA|134aa|up_5|NZ_CP023166.1_585816_586218_+	PRK00521, rbfA, 30S ribosome-binding factor RbfA	NA|315aa|up_4|NZ_CP023166.1_586217_587162_+	PRK05033, truB, tRNA pseudouridine synthase B; Provisional	NA|90aa|up_3|NZ_CP023166.1_587312_587582_+	PRK05626, rpsO, 30S ribosomal protein S15; Reviewed	NA|712aa|up_2|NZ_CP023166.1_587823_589959_+	PRK11824, PRK11824, polynucleotide phosphorylase/polyadenylase; Provisional	NA|295aa|up_1|NZ_CP023166.1_590068_590953_+	PRK11189, PRK11189, lipoprotein NlpI; Provisional	NA|27aa|up_0|NZ_CP023166.1_591058_591139_+	NF033440, small_YrbN, protein YrbN	NA|415aa|down_0|NZ_CP023166.1_593174_594419_+	PRK10483, PRK10483, tryptophan permease; Provisional	NA|177aa|down_1|NZ_CP023166.1_594479_595010_-	NA	NA|240aa|down_2|NZ_CP023166.1_595168_595888_+	COG3034, COG3034, Uncharacterized protein conserved in bacteria [Function unknown]	NA|336aa|down_3|NZ_CP023166.1_595865_596873_-	PRK10508, PRK10508, luciferase-like monooxygenase	NA|299aa|down_4|NZ_CP023166.1_597050_597947_-	PRK15447, PRK15447, putative protease; Provisional	NA|332aa|down_5|NZ_CP023166.1_597937_598933_-	COG0826, COG0826, Collagenase and related proteases [Posttranslational modification, protein turnover, chaperones]	NA|175aa|down_6|NZ_CP023166.1_599149_599674_+	COG3154, COG3154, Putative lipid carrier protein [Lipid metabolism]	NA|168aa|down_7|NZ_CP023166.1_599667_600171_+	COG3153, COG3153, Predicted acetyltransferase [General function prediction only]	NA|106aa|down_8|NZ_CP023166.1_600157_600475_-	PRK00329, PRK00329, GIY-YIG nuclease superfamily protein; Validated	NA|148aa|down_9|NZ_CP023166.1_600512_600956_+	PRK03467, PRK03467, hypothetical protein; Provisional
GCF_002290205.1_ASM229020v1	NZ_CP023166	Salmonella enterica subsp. enterica serovar Saintpaul strain SGB23 chromosome, complete genome	2	1036971-1038341	1,2,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	cas3,PD-DExK,csa3,WYL,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Type I-E	GTGTTCCCCGCGCCAGCGGGGATAAACCGC,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	30,29,29,29	0	0	NA	NA	I-E:I-E:I-E:I-E	19,22,22,19	22	TypeI-E	cas3,PD-DExK,csa3,WYL,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA	NA|381aa|up_9|NZ_CP023166.1_1022769_1023912_+	COG1929, COG1929, Glycerate kinase [Carbohydrate transport and metabolism]	NA|919aa|up_8|NZ_CP023166.1_1023955_1026712_-	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional	NA|432aa|up_7|NZ_CP023166.1_1026769_1028065_+	PRK13168, rumA, 23S rRNA (uracil(1939)-C(5))-methyltransferase RlmD	NA|745aa|up_6|NZ_CP023166.1_1028116_1030351_+	PRK10872, relA, (p)ppGpp synthetase I/GTP pyrophosphokinase; Provisional	NA|119aa|up_5|NZ_CP023166.1_1030434_1030791_+	COG3609, COG3609, Predicted transcriptional regulators containing the CopG/Arc/MetJ DNA-binding domain [Transcription]	NA|99aa|up_4|NZ_CP023166.1_1030756_1031053_+	COG3668, ParE, Plasmid stabilization system protein [General function prediction only]	NA|267aa|up_3|NZ_CP023166.1_1031820_1032621_+	PRK09562, mazG, nucleoside triphosphate pyrophosphohydrolase; Reviewed	NA|546aa|up_2|NZ_CP023166.1_1032848_1034486_+	PRK05380, pyrG, CTP synthetase; Validated	NA|433aa|up_1|NZ_CP023166.1_1034568_1035867_+	PRK00077, eno, enolase; Provisional	NA|224aa|up_0|NZ_CP023166.1_1036002_1036674_+	TIGR04322, organic_radical_activating_enzyme, putative 7-cyano-7-deazaguanosine (preQ0) biosynthesis protein QueE	NA|266aa|down_0|NZ_CP023166.1_1038438_1039236_+	COG1237, COG1237, Metal-dependent hydrolases of the beta-lactamase superfamily II [General function prediction only]	NA|121aa|down_1|NZ_CP023166.1_1039323_1039686_-	cd00470, PTPS, 6-pyruvoyl tetrahydropterin synthase (PTPS)	NA|600aa|down_2|NZ_CP023166.1_1040109_1041909_+	PRK10953, cysJ, NADPH-dependent assimilatory sulfite reductase flavoprotein subunit	NA|571aa|down_3|NZ_CP023166.1_1041908_1043621_+	PRK13504, PRK13504, NADPH-dependent assimilatory sulfite reductase hemoprotein subunit	NA|245aa|down_4|NZ_CP023166.1_1043696_1044431_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|318aa|down_5|NZ_CP023166.1_1044643_1045597_-	PRK15379, PRK15379, type III secretion system effector SopD	cas3|888aa|down_6|NZ_CP023166.1_1046040_1048704_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas8e|520aa|down_7|NZ_CP023166.1_1048715_1050275_+	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cse2gr11|187aa|down_8|NZ_CP023166.1_1050271_1050832_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|353aa|down_9|NZ_CP023166.1_1050845_1051904_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI
GCF_002290205.1_ASM229020v1	NZ_CP023166	Salmonella enterica subsp. enterica serovar Saintpaul strain SGB23 chromosome, complete genome	3	1054600-1055300	3,2	CRISPRCasFinder,CRT	no	cas3,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2	cas3,PD-DExK,csa3,WYL,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	Type I-E	GTGTTCCCCGCGCCAGCGGGGATAAACCG,GTGTTCCCCGCGCCAGCGGGGATAAACCG	29,29	0	0	NA	NA	I-E:I-E	11,11	11	TypeI-E	cas3,PD-DExK,csa3,WYL,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA,NA	NA|245aa|up_9|NZ_CP023166.1_1043696_1044431_+	PRK02090, PRK02090, phosphoadenylyl-sulfate reductase	NA|318aa|up_8|NZ_CP023166.1_1044643_1045597_-	PRK15379, PRK15379, type III secretion system effector SopD	cas3|888aa|up_7|NZ_CP023166.1_1046040_1048704_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas8e|520aa|up_6|NZ_CP023166.1_1048715_1050275_+	TIGR02547, CRISPR_system_Cascade_subunit_CasA, CRISPR type I-E/ECOLI-associated protein CasA/Cse1	cse2gr11|187aa|up_5|NZ_CP023166.1_1050271_1050832_+	cd09731, Cse2_I-E, CRISPR/Cas system-associated protein Cse2	cas7|353aa|up_4|NZ_CP023166.1_1050845_1051904_+	TIGR01869, CRISPR_system_Cascade_subunit_CasC, CRISPR-associated protein Cas7/Cse4/CasC, subtype I-E/ECOLI	cas5|249aa|up_3|NZ_CP023166.1_1051914_1052661_+	cd09645, Cas5_I-E, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas6e|217aa|up_2|NZ_CP023166.1_1052642_1053293_+	TIGR01907, CRISPR_system_Cascade_subunit_CasE, CRISPR-associated protein Cas6/Cse3/CasE, subtype I-E/ECOLI	cas1|307aa|up_1|NZ_CP023166.1_1053289_1054210_+	TIGR03638, cas1_ECOLI, CRISPR-associated endonuclease Cas1, subtype I-E/ECOLI	cas2|98aa|up_0|NZ_CP023166.1_1054209_1054503_+	PRK11558, PRK11558, putative ssRNA endonuclease; Provisional	NA|349aa|down_0|NZ_CP023166.1_1055314_1056361_-	PRK10199, PRK10199, alkaline phosphatase isozyme conversion aminopeptidase; Provisional	NA|303aa|down_1|NZ_CP023166.1_1056611_1057520_+	PRK05253, PRK05253, sulfate adenylyltransferase subunit CysD	NA|480aa|down_2|NZ_CP023166.1_1057529_1058969_+	PRK05124, cysN, sulfate adenylyltransferase subunit 1; Provisional	NA|202aa|down_3|NZ_CP023166.1_1058955_1059561_+	PRK03846, PRK03846, adenylylsulfate kinase; Provisional	NA|119aa|down_4|NZ_CP023166.1_1059578_1059935_+	pfam12084, DUF3561, Protein of unknown function (DUF3561)	NA|104aa|down_5|NZ_CP023166.1_1060125_1060437_+	PRK00888, ftsB, cell division protein FtsB; Reviewed	NA|237aa|down_6|NZ_CP023166.1_1060455_1061166_+	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|160aa|down_7|NZ_CP023166.1_1061165_1061645_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|350aa|down_8|NZ_CP023166.1_1061641_1062691_+	PRK00984, truD, tRNA pseudouridine synthase D; Reviewed	NA|254aa|down_9|NZ_CP023166.1_1062671_1063433_+	PRK00346, surE, 5'(3')-nucleotidase/polyphosphatase; Provisional
GCF_002290205.1_ASM229020v1	NZ_CP023167	Salmonella enterica subsp. enterica serovar Saintpaul strain SGB23 plasmid pSGB23, complete sequence	1	229036-229193	1	PILER-CR	no		WYL,csa3	Orphan	CCGTACCCGGTATAGTGGAT	20	0	0	NA	NA	NA	2	2	Orphan	cas3,PD-DExK,csa3,WYL,cas8e,cse2gr11,cas7,cas5,cas6e,cas1,cas2,DEDDh,DinG	NA|41aa|up_9|NZ_CP023167.1_220985_221108_+,NA|114aa|up_8|NZ_CP023167.1_221109_221451_+,NA|120aa|up_7|NZ_CP023167.1_221455_221815_+,NA|235aa|up_6|NZ_CP023167.1_222042_222747_+,NA|140aa|up_5|NZ_CP023167.1_222779_223199_-,NA|166aa|down_0|NZ_CP023167.1_229382_229880_-,NA|68aa|down_1|NZ_CP023167.1_229894_230098_-,NA|59aa|down_3|NZ_CP023167.1_233450_233627_-,NA|386aa|down_5|NZ_CP023167.1_235581_236739_-,NA|274aa|down_7|NZ_CP023167.1_237937_238759_-,NA|67aa|down_9|NZ_CP023167.1_239745_239946_-	NA|41aa|up_9|NZ_CP023167.1_220985_221108_+	NA	NA|114aa|up_8|NZ_CP023167.1_221109_221451_+	NA	NA|120aa|up_7|NZ_CP023167.1_221455_221815_+	NA	NA|235aa|up_6|NZ_CP023167.1_222042_222747_+	NA	NA|140aa|up_5|NZ_CP023167.1_222779_223199_-	NA	NA|795aa|up_4|NZ_CP023167.1_223286_225671_-	pfam13750, Big_3_3, Bacterial Ig-like domain (group 3)	NA|201aa|up_3|NZ_CP023167.1_225921_226524_+	pfam13752, DUF4165, Domain of unknown function (DUF4165)	NA|79aa|up_2|NZ_CP023167.1_226535_226772_+	pfam12245, Big_3_2, Bacterial Ig-like domain (group 3)	NA|199aa|up_1|NZ_CP023167.1_226927_227524_+	pfam13750, Big_3_3, Bacterial Ig-like domain (group 3)	NA|294aa|up_0|NZ_CP023167.1_227915_228797_+	pfam16441, DUF5038, Domain of unknown function (DUF5038)	NA|166aa|down_0|NZ_CP023167.1_229382_229880_-	NA	NA|68aa|down_1|NZ_CP023167.1_229894_230098_-	NA	NA|819aa|down_2|NZ_CP023167.1_230548_233005_-	pfam13750, Big_3_3, Bacterial Ig-like domain (group 3)	NA|59aa|down_3|NZ_CP023167.1_233450_233627_-	NA	NA|585aa|down_4|NZ_CP023167.1_233641_235396_-	pfam13708, DUF4942, Domain of unknown function (DUF4942)	NA|386aa|down_5|NZ_CP023167.1_235581_236739_-	NA	NA|275aa|down_6|NZ_CP023167.1_237098_237923_+	TIGR00571, DNA_adenine_methylase, DNA adenine methylase (dam)	NA|274aa|down_7|NZ_CP023167.1_237937_238759_-	NA	NA|236aa|down_8|NZ_CP023167.1_239041_239749_-	cd10719, DnaJ_zf, Zinc finger domain of DnaJ and HSP40	NA|67aa|down_9|NZ_CP023167.1_239745_239946_-	NA
