assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_002197245.1_ASM219724v1	NZ_CP021865	Streptococcus agalactiae strain SG-M50 chromosome, complete genome	1	513652-514344	1,1,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	 Type I-U?,Type I-U,Type I-C	GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT	32,32,32,32	0	0	NA	NA	I-C:I-C:I-C:I-C	8,9,10,8	10	TypeI-U,TypeI-C,TypeI-U?	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|231aa|up_9|NZ_CP021865.1_500099_500792_+,NA|260aa|up_7|NZ_CP021865.1_503682_504462_-,NA|97aa|down_6|NZ_CP021865.1_520007_520298_+	NA|231aa|up_9|NZ_CP021865.1_500099_500792_+	NA	NA|884aa|up_8|NZ_CP021865.1_500813_503465_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|260aa|up_7|NZ_CP021865.1_503682_504462_-	NA	cas3|808aa|up_6|NZ_CP021865.1_505473_507897_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|243aa|up_5|NZ_CP021865.1_508029_508758_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|632aa|up_4|NZ_CP021865.1_508757_510653_+	cd09642, Cas8c_I-C, CRISPR/Cas system-associated protein Cas8c	cas7|283aa|up_3|NZ_CP021865.1_510657_511506_+	COG3649, COG3649, CRISPR system related protein [Defense mechanisms]	cas4|224aa|up_2|NZ_CP021865.1_511507_512179_+	COG1468, COG1468, CRISPR-associated protein Cas4 (RecB family exonuclease) [Defense    mechanisms]	cas1|342aa|up_1|NZ_CP021865.1_512175_513201_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas2|98aa|up_0|NZ_CP021865.1_513211_513505_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|320aa|down_0|NZ_CP021865.1_514480_515440_+	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|301aa|down_1|NZ_CP021865.1_515600_516503_+	cd12827, EcCorA_ZntB-like_u2, uncharacterized bacterial subfamily of the Escherichia coli CorA-Salmonella typhimurium ZntB family	NA|355aa|down_2|NZ_CP021865.1_516662_517727_+	COG2315, MmcQ, Uncharacterized protein conserved in bacteria [Function unknown]	NA|331aa|down_3|NZ_CP021865.1_517839_518832_+	COG2502, AsnA, Asparagine synthetase A [Amino acid transport and metabolism]	NA|150aa|down_4|NZ_CP021865.1_518876_519326_-	TIGR01295, Pediocin_PA-1_biosynthesis_protein_PedC, bacteriocin transport accessory protein, putative	NA|235aa|down_5|NZ_CP021865.1_519291_519996_+	pfam03602, Cons_hypoth95, Conserved hypothetical protein 95	NA|97aa|down_6|NZ_CP021865.1_520007_520298_+	NA	NA|162aa|down_7|NZ_CP021865.1_520294_520780_+	cd02163, PPAT, Phosphopantetheine adenylyltransferase	NA|358aa|down_8|NZ_CP021865.1_520769_521843_+	COG3480, SdrC, Predicted secreted protein containing a PDZ domain [Signal transduction mechanisms]	NA|445aa|down_9|NZ_CP021865.1_521917_523252_+	cd00845, MPP_UshA_N_like, Escherichia coli UshA-like family, N-terminal metallophosphatase domain
GCF_002197245.1_ASM219724v1	NZ_CP021865	Streptococcus agalactiae strain SG-M50 chromosome, complete genome	2	915873-916568	3,2,2	PILER-CR,CRISPRCasFinder,CRT	no	cas9,cas1,cas2,csn2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type II-B,Type II-C,Type II-A	GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC,GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC,GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC	36,36,36	0	0	NA	NA	II-A:II-A:II-A	7,9,10	10	TypeII-B,TypeII-C,TypeII-A	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA,NA	NA|124aa|up_9|NZ_CP021865.1_905254_905626_+	pfam08349, DUF1722, Protein of unknown function (DUF1722)	NA|127aa|up_8|NZ_CP021865.1_905650_906031_+	TIGR02328, TIGR02328, conserved hypothetical protein	NA|377aa|up_7|NZ_CP021865.1_906122_907253_+	PRK08599, PRK08599, oxygen-independent coproporphyrinogen III oxidase	NA|246aa|up_6|NZ_CP021865.1_907256_907994_+	pfam01643, Acyl-ACP_TE, Acyl-ACP thioesterase	NA|257aa|up_5|NZ_CP021865.1_907994_908765_+	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|219aa|up_4|NZ_CP021865.1_908754_909411_+	COG4478, COG4478, Predicted membrane protein [Function unknown]	cas9|1371aa|up_3|NZ_CP021865.1_909798_913911_+	TIGR01865, conserved_hypothetical_protein, CRISPR subtype II/NMENI RNA-guided endonuclease Cas9/Csn1	cas1|290aa|up_2|NZ_CP021865.1_913912_914782_+	TIGR03639, cas1_NMENI, CRISPR-associated endonuclease Cas1, subtype II/NMENI	cas2|114aa|up_1|NZ_CP021865.1_914778_915120_+	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	csn2|222aa|up_0|NZ_CP021865.1_915106_915772_+	cd09758, Csn2, CRISPR/Cas system-associated protein Csn2	NA|139aa|down_0|NZ_CP021865.1_917125_917542_+	PRK00668, ndk, mulitfunctional nucleoside diphosphate kinase/apyrimidinic endonuclease/3'-; Validated	NA|611aa|down_1|NZ_CP021865.1_917677_919510_+	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	NA|878aa|down_2|NZ_CP021865.1_919756_922390_+	NF033189, internalin_A, class 1 internalin InlA	NA|220aa|down_3|NZ_CP021865.1_922489_923149_+	COG1418, COG1418, Predicted HD superfamily hydrolase [General function prediction only]	NA|155aa|down_4|NZ_CP021865.1_923157_923622_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|130aa|down_5|NZ_CP021865.1_923621_924011_+	PRK00222, PRK00222, peptide-methionine (R)-S-oxide reductase MsrB	NA|931aa|down_6|NZ_CP021865.1_924162_926955_+	COG0474, MgtA, Cation transport ATPase [Inorganic ion transport and metabolism]	NA|368aa|down_7|NZ_CP021865.1_926954_928058_+	pfam11187, DUF2974, Protein of unknown function (DUF2974)	NA|213aa|down_8|NZ_CP021865.1_928178_928817_-	cd03349, LbH_XAT, Xenobiotic acyltransferase (XAT): The XAT class of hexapeptide acyltransferases is composed of a large number of microbial enzymes that catalyze the CoA-dependent acetylation of a variety of hydroxyl-bearing acceptors such as chloramphenicol and streptogramin, among others	NA|204aa|down_9|NZ_CP021865.1_929527_930139_+	COG0398, COG0398, Uncharacterized conserved protein [Function unknown]
GCF_002197245.1_ASM219724v1	NZ_CP021865	Streptococcus agalactiae strain SG-M50 chromosome, complete genome	3	1954830-1955327	3	CRT	no		cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Orphan	TGGTTTGGCNTCTGGNTT	18	1	1	1955208-1955225	NZ_CP021865.1_1955607-1955624	NA	8	8	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|203aa|up_4|NZ_CP021865.1_1947188_1947797_+,NA	NA|615aa|up_9|NZ_CP021865.1_1934255_1936100_-	PRK08645, PRK08645, bifunctional homocysteine S-methyltransferase/5,10-methylenetetrahydrofolate reductase protein; Reviewed	NA|746aa|up_8|NZ_CP021865.1_1936144_1938382_-	PRK05222, PRK05222, 5-methyltetrahydropteroyltriglutamate--homocysteine S-methyltransferase; Provisional	NA|108aa|up_7|NZ_CP021865.1_1938751_1939075_-	COG4392, COG4392, Predicted membrane protein [Function unknown]	NA|231aa|up_6|NZ_CP021865.1_1939064_1939757_-	COG1296, AzlC, Predicted branched-chain amino acid permease (azaleucine resistance) [Amino acid transport and metabolism]	NA|463aa|up_5|NZ_CP021865.1_1945707_1947096_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|203aa|up_4|NZ_CP021865.1_1947188_1947797_+	NA	NA|834aa|up_3|NZ_CP021865.1_1947886_1950388_-	PRK00390, leuS, leucyl-tRNA synthetase; Validated	NA|416aa|up_2|NZ_CP021865.1_1950764_1952012_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|269aa|up_1|NZ_CP021865.1_1952669_1953475_-	pfam13359, DDE_Tnp_4, DDE superfamily endonuclease	NA|180aa|up_0|NZ_CP021865.1_1953898_1954438_-	PRK05609, nusG, transcription antitermination protein NusG; Validated	NA|58aa|down_0|NZ_CP021865.1_1957429_1957603_-	COG0690, SecE, Preprotein translocase subunit SecE [Intracellular trafficking and secretion]	NA|51aa|down_1|NZ_CP021865.1_1957638_1957791_-	PRK00504, rpmG, 50S ribosomal protein L33; Validated	NA|774aa|down_2|NZ_CP021865.1_1957839_1960161_-	COG0744, MrcB, Membrane carboxypeptidase (penicillin-binding protein) [Cell envelope biogenesis, outer membrane]	NA|295aa|down_3|NZ_CP021865.1_1960204_1961089_+	COG0564, RluA, Pseudouridylate synthases, 23S RNA-specific [Translation, ribosomal structure and biogenesis]	NA|547aa|down_4|NZ_CP021865.1_1961113_1962754_-	COG4640, COG4640, Predicted membrane protein [Function unknown]	NA|404aa|down_5|NZ_CP021865.1_1962923_1964135_-	PRK05362, PRK05362, phosphopentomutase; Provisional	NA|224aa|down_6|NZ_CP021865.1_1964201_1964873_-	PRK00507, PRK00507, deoxyribose-phosphate aldolase; Provisional	NA|401aa|down_7|NZ_CP021865.1_1964902_1966105_-	COG1972, NupC, Nucleoside permease [Nucleotide transport and metabolism]	NA|260aa|down_8|NZ_CP021865.1_1966125_1966905_-	cd17767, UP_EcUdp-like, uridine phosphorylases similar to Escherichia coli Udp and related phosphorylases	NA|246aa|down_9|NZ_CP021865.1_1967063_1967801_+	COG2188, PhnF, Transcriptional regulators [Transcription]
GCF_002197245.1_ASM219724v1	NZ_CP021865	Streptococcus agalactiae strain SG-M50 chromosome, complete genome	4	2004879-2004965	3	CRISPRCasFinder	no	csa3	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type I-A	AGCAGTATCGTACTTAGTTTGAGC	24	0	0	NA	NA	NA	1	1	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|154aa|up_0|NZ_CP021865.1_2003533_2003995_-,NA|319aa|down_1|NZ_CP021865.1_2007384_2008341_-,NA|98aa|down_2|NZ_CP021865.1_2008575_2008869_+,NA|147aa|down_3|NZ_CP021865.1_2008950_2009391_+,NA|177aa|down_4|NZ_CP021865.1_2009387_2009918_+,NA|424aa|down_6|NZ_CP021865.1_2010827_2012099_+,NA|88aa|down_7|NZ_CP021865.1_2012181_2012445_+	NA|146aa|up_9|NZ_CP021865.1_1994874_1995312_-	TIGR01529, Arginine_repressor	NA|564aa|up_8|NZ_CP021865.1_1995533_1997225_+	PRK12451, PRK12451, arginyl-tRNA synthetase; Reviewed	NA|103aa|up_7|NZ_CP021865.1_1997312_1997621_+	pfam08951, EntA_Immun, Enterocin A Immunity	NA|291aa|up_6|NZ_CP021865.1_1997647_1998520_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|315aa|up_5|NZ_CP021865.1_1998627_1999572_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|584aa|up_4|NZ_CP021865.1_1999561_2001313_-	PRK00476, aspS, aspartyl-tRNA synthetase; Validated	NA|427aa|up_3|NZ_CP021865.1_2001405_2002686_-	PRK00037, hisS, histidyl-tRNA synthetase; Reviewed	NA|61aa|up_2|NZ_CP021865.1_2002905_2003088_+	PRK01110, rpmF, 50S ribosomal protein L32; Validated	NA|50aa|up_1|NZ_CP021865.1_2003103_2003253_+	PRK00595, rpmG, 50S ribosomal protein L33; Validated	NA|154aa|up_0|NZ_CP021865.1_2003533_2003995_-	NA	NA|112aa|down_0|NZ_CP021865.1_2007012_2007348_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|319aa|down_1|NZ_CP021865.1_2007384_2008341_-	NA	NA|98aa|down_2|NZ_CP021865.1_2008575_2008869_+	NA	NA|147aa|down_3|NZ_CP021865.1_2008950_2009391_+	NA	NA|177aa|down_4|NZ_CP021865.1_2009387_2009918_+	NA	NA|249aa|down_5|NZ_CP021865.1_2009917_2010664_+	COG1674, FtsK, DNA segregation ATPase FtsK/SpoIIIE and related proteins [Cell division and chromosome partitioning]	NA|424aa|down_6|NZ_CP021865.1_2010827_2012099_+	NA	NA|88aa|down_7|NZ_CP021865.1_2012181_2012445_+	NA	NA|422aa|down_8|NZ_CP021865.1_2012541_2013807_+	cd01189, INT_ICEBs1_C_like, C-terminal catalytic domain of integrases from bacterial phages and conjugate transposons	NA|209aa|down_9|NZ_CP021865.1_2014213_2014840_+	pfam03596, Cad, Cadmium resistance transporter
