assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_002197425.1_ASM219742v1	NZ_CP021863	Streptococcus agalactiae strain SG-M163 chromosome, complete genome	1	513653-514345	1,1,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	 Type I-U?,Type I-C,Type I-U	GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT	32,32,32,32	0	0	NA	NA	I-C:I-C:I-C:I-C	8,9,10,8	10	TypeI-U?,TypeI-C,TypeI-U	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|231aa|up_9|NZ_CP021863.1_500100_500793_+,NA|260aa|up_7|NZ_CP021863.1_503683_504463_-,NA|97aa|down_6|NZ_CP021863.1_520008_520299_+	NA|231aa|up_9|NZ_CP021863.1_500100_500793_+	NA	NA|884aa|up_8|NZ_CP021863.1_500814_503466_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|260aa|up_7|NZ_CP021863.1_503683_504463_-	NA	cas3|808aa|up_6|NZ_CP021863.1_505474_507898_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|243aa|up_5|NZ_CP021863.1_508030_508759_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|632aa|up_4|NZ_CP021863.1_508758_510654_+	cd09642, Cas8c_I-C, CRISPR/Cas system-associated protein Cas8c	cas7|283aa|up_3|NZ_CP021863.1_510658_511507_+	COG3649, COG3649, CRISPR system related protein [Defense mechanisms]	cas4|224aa|up_2|NZ_CP021863.1_511508_512180_+	COG1468, COG1468, CRISPR-associated protein Cas4 (RecB family exonuclease) [Defense    mechanisms]	cas1|342aa|up_1|NZ_CP021863.1_512176_513202_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas2|98aa|up_0|NZ_CP021863.1_513212_513506_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|320aa|down_0|NZ_CP021863.1_514481_515441_+	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|301aa|down_1|NZ_CP021863.1_515601_516504_+	cd12827, EcCorA_ZntB-like_u2, uncharacterized bacterial subfamily of the Escherichia coli CorA-Salmonella typhimurium ZntB family	NA|355aa|down_2|NZ_CP021863.1_516663_517728_+	COG2315, MmcQ, Uncharacterized protein conserved in bacteria [Function unknown]	NA|331aa|down_3|NZ_CP021863.1_517840_518833_+	COG2502, AsnA, Asparagine synthetase A [Amino acid transport and metabolism]	NA|150aa|down_4|NZ_CP021863.1_518877_519327_-	TIGR01295, Pediocin_PA-1_biosynthesis_protein_PedC, bacteriocin transport accessory protein, putative	NA|235aa|down_5|NZ_CP021863.1_519292_519997_+	pfam03602, Cons_hypoth95, Conserved hypothetical protein 95	NA|97aa|down_6|NZ_CP021863.1_520008_520299_+	NA	NA|162aa|down_7|NZ_CP021863.1_520295_520781_+	cd02163, PPAT, Phosphopantetheine adenylyltransferase	NA|358aa|down_8|NZ_CP021863.1_520770_521844_+	COG3480, SdrC, Predicted secreted protein containing a PDZ domain [Signal transduction mechanisms]	NA|445aa|down_9|NZ_CP021863.1_521918_523253_+	cd00845, MPP_UshA_N_like, Escherichia coli UshA-like family, N-terminal metallophosphatase domain
GCF_002197425.1_ASM219742v1	NZ_CP021863	Streptococcus agalactiae strain SG-M163 chromosome, complete genome	2	915874-916569	3,2,2	PILER-CR,CRISPRCasFinder,CRT	no	cas9,cas1,cas2,csn2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type II-C,Type II-B,Type II-A	GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC,GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC,GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC	36,36,36	0	0	NA	NA	II-A:II-A:II-A	7,9,10	10	TypeII-C,TypeII-B,TypeII-A	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA,NA	NA|124aa|up_9|NZ_CP021863.1_905255_905627_+	pfam08349, DUF1722, Protein of unknown function (DUF1722)	NA|127aa|up_8|NZ_CP021863.1_905651_906032_+	TIGR02328, TIGR02328, conserved hypothetical protein	NA|377aa|up_7|NZ_CP021863.1_906123_907254_+	PRK08599, PRK08599, oxygen-independent coproporphyrinogen III oxidase	NA|246aa|up_6|NZ_CP021863.1_907257_907995_+	pfam01643, Acyl-ACP_TE, Acyl-ACP thioesterase	NA|257aa|up_5|NZ_CP021863.1_907995_908766_+	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|219aa|up_4|NZ_CP021863.1_908755_909412_+	COG4478, COG4478, Predicted membrane protein [Function unknown]	cas9|1371aa|up_3|NZ_CP021863.1_909799_913912_+	TIGR01865, conserved_hypothetical_protein, CRISPR subtype II/NMENI RNA-guided endonuclease Cas9/Csn1	cas1|290aa|up_2|NZ_CP021863.1_913913_914783_+	TIGR03639, cas1_NMENI, CRISPR-associated endonuclease Cas1, subtype II/NMENI	cas2|114aa|up_1|NZ_CP021863.1_914779_915121_+	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	csn2|222aa|up_0|NZ_CP021863.1_915107_915773_+	cd09758, Csn2, CRISPR/Cas system-associated protein Csn2	NA|139aa|down_0|NZ_CP021863.1_917126_917543_+	PRK00668, ndk, mulitfunctional nucleoside diphosphate kinase/apyrimidinic endonuclease/3'-; Validated	NA|611aa|down_1|NZ_CP021863.1_917678_919511_+	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	NA|878aa|down_2|NZ_CP021863.1_919757_922391_+	NF033189, internalin_A, class 1 internalin InlA	NA|220aa|down_3|NZ_CP021863.1_922490_923150_+	COG1418, COG1418, Predicted HD superfamily hydrolase [General function prediction only]	NA|155aa|down_4|NZ_CP021863.1_923158_923623_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|130aa|down_5|NZ_CP021863.1_923622_924012_+	PRK00222, PRK00222, peptide-methionine (R)-S-oxide reductase MsrB	NA|931aa|down_6|NZ_CP021863.1_924163_926956_+	COG0474, MgtA, Cation transport ATPase [Inorganic ion transport and metabolism]	NA|368aa|down_7|NZ_CP021863.1_926955_928059_+	pfam11187, DUF2974, Protein of unknown function (DUF2974)	NA|213aa|down_8|NZ_CP021863.1_928179_928818_-	cd03349, LbH_XAT, Xenobiotic acyltransferase (XAT): The XAT class of hexapeptide acyltransferases is composed of a large number of microbial enzymes that catalyze the CoA-dependent acetylation of a variety of hydroxyl-bearing acceptors such as chloramphenicol and streptogramin, among others	NA|204aa|down_9|NZ_CP021863.1_929528_930140_+	COG0398, COG0398, Uncharacterized conserved protein [Function unknown]
GCF_002197425.1_ASM219742v1	NZ_CP021863	Streptococcus agalactiae strain SG-M163 chromosome, complete genome	3	1954831-1955328	3	CRT	no		cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Orphan	TGGTTTGGCNTCTGGNTT	18	1	1	1955209-1955226	NZ_CP021863.1_1955608-1955625	NA	8	8	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|203aa|up_4|NZ_CP021863.1_1947189_1947798_+,NA	NA|615aa|up_9|NZ_CP021863.1_1934256_1936101_-	PRK08645, PRK08645, bifunctional homocysteine S-methyltransferase/5,10-methylenetetrahydrofolate reductase protein; Reviewed	NA|746aa|up_8|NZ_CP021863.1_1936145_1938383_-	PRK05222, PRK05222, 5-methyltetrahydropteroyltriglutamate--homocysteine S-methyltransferase; Provisional	NA|108aa|up_7|NZ_CP021863.1_1938752_1939076_-	COG4392, COG4392, Predicted membrane protein [Function unknown]	NA|231aa|up_6|NZ_CP021863.1_1939065_1939758_-	COG1296, AzlC, Predicted branched-chain amino acid permease (azaleucine resistance) [Amino acid transport and metabolism]	NA|463aa|up_5|NZ_CP021863.1_1945708_1947097_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|203aa|up_4|NZ_CP021863.1_1947189_1947798_+	NA	NA|834aa|up_3|NZ_CP021863.1_1947887_1950389_-	PRK00390, leuS, leucyl-tRNA synthetase; Validated	NA|416aa|up_2|NZ_CP021863.1_1950765_1952013_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|269aa|up_1|NZ_CP021863.1_1952670_1953476_-	pfam13359, DDE_Tnp_4, DDE superfamily endonuclease	NA|180aa|up_0|NZ_CP021863.1_1953899_1954439_-	PRK05609, nusG, transcription antitermination protein NusG; Validated	NA|58aa|down_0|NZ_CP021863.1_1957429_1957603_-	COG0690, SecE, Preprotein translocase subunit SecE [Intracellular trafficking and secretion]	NA|51aa|down_1|NZ_CP021863.1_1957638_1957791_-	PRK00504, rpmG, 50S ribosomal protein L33; Validated	NA|774aa|down_2|NZ_CP021863.1_1957839_1960161_-	COG0744, MrcB, Membrane carboxypeptidase (penicillin-binding protein) [Cell envelope biogenesis, outer membrane]	NA|295aa|down_3|NZ_CP021863.1_1960204_1961089_+	COG0564, RluA, Pseudouridylate synthases, 23S RNA-specific [Translation, ribosomal structure and biogenesis]	NA|547aa|down_4|NZ_CP021863.1_1961113_1962754_-	COG4640, COG4640, Predicted membrane protein [Function unknown]	NA|404aa|down_5|NZ_CP021863.1_1962923_1964135_-	PRK05362, PRK05362, phosphopentomutase; Provisional	NA|224aa|down_6|NZ_CP021863.1_1964201_1964873_-	PRK00507, PRK00507, deoxyribose-phosphate aldolase; Provisional	NA|401aa|down_7|NZ_CP021863.1_1964902_1966105_-	COG1972, NupC, Nucleoside permease [Nucleotide transport and metabolism]	NA|260aa|down_8|NZ_CP021863.1_1966125_1966905_-	cd17767, UP_EcUdp-like, uridine phosphorylases similar to Escherichia coli Udp and related phosphorylases	NA|246aa|down_9|NZ_CP021863.1_1967063_1967801_+	COG2188, PhnF, Transcriptional regulators [Transcription]
GCF_002197425.1_ASM219742v1	NZ_CP021863	Streptococcus agalactiae strain SG-M163 chromosome, complete genome	4	2004879-2004965	3	CRISPRCasFinder	no	csa3	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type I-A	AGCAGTATCGTACTTAGTTTGAGC	24	0	0	NA	NA	NA	1	1	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|154aa|up_0|NZ_CP021863.1_2003533_2003995_-,NA|319aa|down_1|NZ_CP021863.1_2007384_2008341_-,NA|98aa|down_2|NZ_CP021863.1_2008575_2008869_+,NA|147aa|down_3|NZ_CP021863.1_2008950_2009391_+,NA|177aa|down_4|NZ_CP021863.1_2009387_2009918_+,NA|424aa|down_6|NZ_CP021863.1_2010827_2012099_+,NA|88aa|down_7|NZ_CP021863.1_2012181_2012445_+	NA|146aa|up_9|NZ_CP021863.1_1994874_1995312_-	TIGR01529, Arginine_repressor	NA|564aa|up_8|NZ_CP021863.1_1995533_1997225_+	PRK12451, PRK12451, arginyl-tRNA synthetase; Reviewed	NA|103aa|up_7|NZ_CP021863.1_1997312_1997621_+	pfam08951, EntA_Immun, Enterocin A Immunity	NA|291aa|up_6|NZ_CP021863.1_1997647_1998520_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|315aa|up_5|NZ_CP021863.1_1998627_1999572_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|584aa|up_4|NZ_CP021863.1_1999561_2001313_-	PRK00476, aspS, aspartyl-tRNA synthetase; Validated	NA|427aa|up_3|NZ_CP021863.1_2001405_2002686_-	PRK00037, hisS, histidyl-tRNA synthetase; Reviewed	NA|61aa|up_2|NZ_CP021863.1_2002905_2003088_+	PRK01110, rpmF, 50S ribosomal protein L32; Validated	NA|50aa|up_1|NZ_CP021863.1_2003103_2003253_+	PRK00595, rpmG, 50S ribosomal protein L33; Validated	NA|154aa|up_0|NZ_CP021863.1_2003533_2003995_-	NA	NA|112aa|down_0|NZ_CP021863.1_2007012_2007348_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|319aa|down_1|NZ_CP021863.1_2007384_2008341_-	NA	NA|98aa|down_2|NZ_CP021863.1_2008575_2008869_+	NA	NA|147aa|down_3|NZ_CP021863.1_2008950_2009391_+	NA	NA|177aa|down_4|NZ_CP021863.1_2009387_2009918_+	NA	NA|249aa|down_5|NZ_CP021863.1_2009917_2010664_+	COG1674, FtsK, DNA segregation ATPase FtsK/SpoIIIE and related proteins [Cell division and chromosome partitioning]	NA|424aa|down_6|NZ_CP021863.1_2010827_2012099_+	NA	NA|88aa|down_7|NZ_CP021863.1_2012181_2012445_+	NA	NA|422aa|down_8|NZ_CP021863.1_2012541_2013807_+	cd01189, INT_ICEBs1_C_like, C-terminal catalytic domain of integrases from bacterial phages and conjugate transposons	NA|209aa|down_9|NZ_CP021863.1_2014213_2014840_+	pfam03596, Cad, Cadmium resistance transporter
