assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_002197285.1_ASM219728v1	NZ_CP021866	Streptococcus agalactiae strain SG-M29 chromosome, complete genome	1	513652-514344	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type I-C,Type I-U, Type I-U?	GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT	32,32,32	0	0	NA	NA	I-C:I-C:I-C	7,9,10	10	TypeI-C,TypeI-U,TypeI-U?	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|231aa|up_9|NZ_CP021866.1_500099_500792_+,NA|260aa|up_7|NZ_CP021866.1_503682_504462_-,NA|97aa|down_6|NZ_CP021866.1_520007_520298_+	NA|231aa|up_9|NZ_CP021866.1_500099_500792_+	NA	NA|884aa|up_8|NZ_CP021866.1_500813_503465_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|260aa|up_7|NZ_CP021866.1_503682_504462_-	NA	cas3|808aa|up_6|NZ_CP021866.1_505473_507897_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|243aa|up_5|NZ_CP021866.1_508029_508758_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|632aa|up_4|NZ_CP021866.1_508757_510653_+	cd09642, Cas8c_I-C, CRISPR/Cas system-associated protein Cas8c	cas7|283aa|up_3|NZ_CP021866.1_510657_511506_+	COG3649, COG3649, CRISPR system related protein [Defense mechanisms]	cas4|224aa|up_2|NZ_CP021866.1_511507_512179_+	COG1468, COG1468, CRISPR-associated protein Cas4 (RecB family exonuclease) [Defense    mechanisms]	cas1|342aa|up_1|NZ_CP021866.1_512175_513201_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas2|98aa|up_0|NZ_CP021866.1_513211_513505_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|320aa|down_0|NZ_CP021866.1_514480_515440_+	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|301aa|down_1|NZ_CP021866.1_515600_516503_+	cd12827, EcCorA_ZntB-like_u2, uncharacterized bacterial subfamily of the Escherichia coli CorA-Salmonella typhimurium ZntB family	NA|355aa|down_2|NZ_CP021866.1_516662_517727_+	COG2315, MmcQ, Uncharacterized protein conserved in bacteria [Function unknown]	NA|331aa|down_3|NZ_CP021866.1_517839_518832_+	COG2502, AsnA, Asparagine synthetase A [Amino acid transport and metabolism]	NA|150aa|down_4|NZ_CP021866.1_518876_519326_-	TIGR01295, Pediocin_PA-1_biosynthesis_protein_PedC, bacteriocin transport accessory protein, putative	NA|235aa|down_5|NZ_CP021866.1_519291_519996_+	pfam03602, Cons_hypoth95, Conserved hypothetical protein 95	NA|97aa|down_6|NZ_CP021866.1_520007_520298_+	NA	NA|162aa|down_7|NZ_CP021866.1_520294_520780_+	cd02163, PPAT, Phosphopantetheine adenylyltransferase	NA|358aa|down_8|NZ_CP021866.1_520769_521843_+	COG3480, SdrC, Predicted secreted protein containing a PDZ domain [Signal transduction mechanisms]	NA|445aa|down_9|NZ_CP021866.1_521917_523252_+	cd00845, MPP_UshA_N_like, Escherichia coli UshA-like family, N-terminal metallophosphatase domain
GCF_002197285.1_ASM219728v1	NZ_CP021866	Streptococcus agalactiae strain SG-M29 chromosome, complete genome	2	915873-916568	2,2,2	PILER-CR,CRISPRCasFinder,CRT	no	cas9,cas1,cas2,csn2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type II-B,Type II-C,Type II-A	GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC,GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC,GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC	36,36,36	0	0	NA	NA	II-A:II-A:II-A	7,9,10	10	TypeII-B,TypeII-C,TypeII-A	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA,NA	NA|124aa|up_9|NZ_CP021866.1_905254_905626_+	pfam08349, DUF1722, Protein of unknown function (DUF1722)	NA|127aa|up_8|NZ_CP021866.1_905650_906031_+	TIGR02328, TIGR02328, conserved hypothetical protein	NA|377aa|up_7|NZ_CP021866.1_906122_907253_+	PRK08599, PRK08599, oxygen-independent coproporphyrinogen III oxidase	NA|246aa|up_6|NZ_CP021866.1_907256_907994_+	pfam01643, Acyl-ACP_TE, Acyl-ACP thioesterase	NA|257aa|up_5|NZ_CP021866.1_907994_908765_+	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|219aa|up_4|NZ_CP021866.1_908754_909411_+	COG4478, COG4478, Predicted membrane protein [Function unknown]	cas9|1371aa|up_3|NZ_CP021866.1_909798_913911_+	TIGR01865, conserved_hypothetical_protein, CRISPR subtype II/NMENI RNA-guided endonuclease Cas9/Csn1	cas1|290aa|up_2|NZ_CP021866.1_913912_914782_+	TIGR03639, cas1_NMENI, CRISPR-associated endonuclease Cas1, subtype II/NMENI	cas2|114aa|up_1|NZ_CP021866.1_914778_915120_+	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	csn2|222aa|up_0|NZ_CP021866.1_915106_915772_+	cd09758, Csn2, CRISPR/Cas system-associated protein Csn2	NA|139aa|down_0|NZ_CP021866.1_917125_917542_+	PRK00668, ndk, mulitfunctional nucleoside diphosphate kinase/apyrimidinic endonuclease/3'-; Validated	NA|611aa|down_1|NZ_CP021866.1_917677_919510_+	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	NA|878aa|down_2|NZ_CP021866.1_919756_922390_+	NF033189, internalin_A, class 1 internalin InlA	NA|220aa|down_3|NZ_CP021866.1_922489_923149_+	COG1418, COG1418, Predicted HD superfamily hydrolase [General function prediction only]	NA|155aa|down_4|NZ_CP021866.1_923157_923622_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|130aa|down_5|NZ_CP021866.1_923621_924011_+	PRK00222, PRK00222, peptide-methionine (R)-S-oxide reductase MsrB	NA|931aa|down_6|NZ_CP021866.1_924162_926955_+	COG0474, MgtA, Cation transport ATPase [Inorganic ion transport and metabolism]	NA|368aa|down_7|NZ_CP021866.1_926954_928058_+	pfam11187, DUF2974, Protein of unknown function (DUF2974)	NA|213aa|down_8|NZ_CP021866.1_928178_928817_-	cd03349, LbH_XAT, Xenobiotic acyltransferase (XAT): The XAT class of hexapeptide acyltransferases is composed of a large number of microbial enzymes that catalyze the CoA-dependent acetylation of a variety of hydroxyl-bearing acceptors such as chloramphenicol and streptogramin, among others	NA|204aa|down_9|NZ_CP021866.1_929527_930139_+	COG0398, COG0398, Uncharacterized conserved protein [Function unknown]
GCF_002197285.1_ASM219728v1	NZ_CP021866	Streptococcus agalactiae strain SG-M29 chromosome, complete genome	3	1954791-1955288	3	CRT	no		cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Orphan	TCTGGTTTGGCNTCTGGN	18	0	0	NA	NA	NA	8	8	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|203aa|up_4|NZ_CP021866.1_1947151_1947760_+,NA	NA|615aa|up_9|NZ_CP021866.1_1934218_1936063_-	PRK08645, PRK08645, bifunctional homocysteine S-methyltransferase/5,10-methylenetetrahydrofolate reductase protein; Reviewed	NA|746aa|up_8|NZ_CP021866.1_1936107_1938345_-	PRK05222, PRK05222, 5-methyltetrahydropteroyltriglutamate--homocysteine S-methyltransferase; Provisional	NA|108aa|up_7|NZ_CP021866.1_1938714_1939038_-	COG4392, COG4392, Predicted membrane protein [Function unknown]	NA|231aa|up_6|NZ_CP021866.1_1939027_1939720_-	COG1296, AzlC, Predicted branched-chain amino acid permease (azaleucine resistance) [Amino acid transport and metabolism]	NA|463aa|up_5|NZ_CP021866.1_1945670_1947059_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|203aa|up_4|NZ_CP021866.1_1947151_1947760_+	NA	NA|834aa|up_3|NZ_CP021866.1_1947849_1950351_-	PRK00390, leuS, leucyl-tRNA synthetase; Validated	NA|416aa|up_2|NZ_CP021866.1_1950727_1951975_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|269aa|up_1|NZ_CP021866.1_1952632_1953438_-	pfam13359, DDE_Tnp_4, DDE superfamily endonuclease	NA|180aa|up_0|NZ_CP021866.1_1953861_1954401_-	PRK05609, nusG, transcription antitermination protein NusG; Validated	NA|58aa|down_0|NZ_CP021866.1_1957392_1957566_-	COG0690, SecE, Preprotein translocase subunit SecE [Intracellular trafficking and secretion]	NA|51aa|down_1|NZ_CP021866.1_1957601_1957754_-	PRK00504, rpmG, 50S ribosomal protein L33; Validated	NA|774aa|down_2|NZ_CP021866.1_1957802_1960124_-	COG0744, MrcB, Membrane carboxypeptidase (penicillin-binding protein) [Cell envelope biogenesis, outer membrane]	NA|295aa|down_3|NZ_CP021866.1_1960167_1961052_+	COG0564, RluA, Pseudouridylate synthases, 23S RNA-specific [Translation, ribosomal structure and biogenesis]	NA|547aa|down_4|NZ_CP021866.1_1961076_1962717_-	COG4640, COG4640, Predicted membrane protein [Function unknown]	NA|404aa|down_5|NZ_CP021866.1_1962886_1964098_-	PRK05362, PRK05362, phosphopentomutase; Provisional	NA|224aa|down_6|NZ_CP021866.1_1964164_1964836_-	PRK00507, PRK00507, deoxyribose-phosphate aldolase; Provisional	NA|401aa|down_7|NZ_CP021866.1_1964865_1966068_-	COG1972, NupC, Nucleoside permease [Nucleotide transport and metabolism]	NA|260aa|down_8|NZ_CP021866.1_1966088_1966868_-	cd17767, UP_EcUdp-like, uridine phosphorylases similar to Escherichia coli Udp and related phosphorylases	NA|246aa|down_9|NZ_CP021866.1_1967026_1967764_+	COG2188, PhnF, Transcriptional regulators [Transcription]
GCF_002197285.1_ASM219728v1	NZ_CP021866	Streptococcus agalactiae strain SG-M29 chromosome, complete genome	4	2004842-2004928	3	CRISPRCasFinder	no	csa3	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type I-A	AGCAGTATCGTACTTAGTTTGAGC	24	0	0	NA	NA	NA	1	1	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|154aa|up_0|NZ_CP021866.1_2003496_2003958_-,NA|319aa|down_1|NZ_CP021866.1_2007347_2008304_-,NA|98aa|down_2|NZ_CP021866.1_2008538_2008832_+,NA|147aa|down_3|NZ_CP021866.1_2008913_2009354_+,NA|177aa|down_4|NZ_CP021866.1_2009350_2009881_+,NA|424aa|down_6|NZ_CP021866.1_2010790_2012062_+,NA|88aa|down_7|NZ_CP021866.1_2012144_2012408_+	NA|146aa|up_9|NZ_CP021866.1_1994837_1995275_-	TIGR01529, Arginine_repressor	NA|564aa|up_8|NZ_CP021866.1_1995496_1997188_+	PRK12451, PRK12451, arginyl-tRNA synthetase; Reviewed	NA|103aa|up_7|NZ_CP021866.1_1997275_1997584_+	pfam08951, EntA_Immun, Enterocin A Immunity	NA|291aa|up_6|NZ_CP021866.1_1997610_1998483_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|315aa|up_5|NZ_CP021866.1_1998590_1999535_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|584aa|up_4|NZ_CP021866.1_1999524_2001276_-	PRK00476, aspS, aspartyl-tRNA synthetase; Validated	NA|427aa|up_3|NZ_CP021866.1_2001368_2002649_-	PRK00037, hisS, histidyl-tRNA synthetase; Reviewed	NA|61aa|up_2|NZ_CP021866.1_2002868_2003051_+	PRK01110, rpmF, 50S ribosomal protein L32; Validated	NA|50aa|up_1|NZ_CP021866.1_2003066_2003216_+	PRK00595, rpmG, 50S ribosomal protein L33; Validated	NA|154aa|up_0|NZ_CP021866.1_2003496_2003958_-	NA	NA|112aa|down_0|NZ_CP021866.1_2006975_2007311_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|319aa|down_1|NZ_CP021866.1_2007347_2008304_-	NA	NA|98aa|down_2|NZ_CP021866.1_2008538_2008832_+	NA	NA|147aa|down_3|NZ_CP021866.1_2008913_2009354_+	NA	NA|177aa|down_4|NZ_CP021866.1_2009350_2009881_+	NA	NA|249aa|down_5|NZ_CP021866.1_2009880_2010627_+	COG1674, FtsK, DNA segregation ATPase FtsK/SpoIIIE and related proteins [Cell division and chromosome partitioning]	NA|424aa|down_6|NZ_CP021866.1_2010790_2012062_+	NA	NA|88aa|down_7|NZ_CP021866.1_2012144_2012408_+	NA	NA|422aa|down_8|NZ_CP021866.1_2012504_2013770_+	cd01189, INT_ICEBs1_C_like, C-terminal catalytic domain of integrases from bacterial phages and conjugate transposons	NA|209aa|down_9|NZ_CP021866.1_2014176_2014803_+	pfam03596, Cad, Cadmium resistance transporter
