assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001592385.1_ASM159238v1	NZ_CP010874	Streptococcus agalactiae strain CU_GBS_08 chromosome, complete genome	1	503596-504222	1,1,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	 Type I-U?,Type I-U,Type I-C	GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT,GTCGCACCCTTTGCGGGTGCGTGGATTGAAAT	32,32,32,32	0	0	NA	NA	I-C:I-C:I-C:I-C	7,8,9,7	9	TypeI-U?,TypeI-U,TypeI-C	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|231aa|up_9|NZ_CP010874.1_490043_490736_+,NA|260aa|up_7|NZ_CP010874.1_493626_494406_-,NA|97aa|down_6|NZ_CP010874.1_509885_510176_+	NA|231aa|up_9|NZ_CP010874.1_490043_490736_+	NA	NA|884aa|up_8|NZ_CP010874.1_490757_493409_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	NA|260aa|up_7|NZ_CP010874.1_493626_494406_-	NA	cas3|808aa|up_6|NZ_CP010874.1_495417_497841_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|243aa|up_5|NZ_CP010874.1_497973_498702_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|632aa|up_4|NZ_CP010874.1_498701_500597_+	cd09642, Cas8c_I-C, CRISPR/Cas system-associated protein Cas8c	cas7|283aa|up_3|NZ_CP010874.1_500601_501450_+	COG3649, COG3649, CRISPR system related protein [Defense mechanisms]	cas4|224aa|up_2|NZ_CP010874.1_501451_502123_+	COG1468, COG1468, CRISPR-associated protein Cas4 (RecB family exonuclease) [Defense    mechanisms]	cas1|342aa|up_1|NZ_CP010874.1_502119_503145_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas2|98aa|up_0|NZ_CP010874.1_503155_503449_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|320aa|down_0|NZ_CP010874.1_504358_505318_+	COG0673, MviM, Predicted dehydrogenases and related proteins [General function prediction only]	NA|301aa|down_1|NZ_CP010874.1_505478_506381_+	cd12827, EcCorA_ZntB-like_u2, uncharacterized bacterial subfamily of the Escherichia coli CorA-Salmonella typhimurium ZntB family	NA|355aa|down_2|NZ_CP010874.1_506540_507605_+	COG2315, MmcQ, Uncharacterized protein conserved in bacteria [Function unknown]	NA|331aa|down_3|NZ_CP010874.1_507717_508710_+	COG2502, AsnA, Asparagine synthetase A [Amino acid transport and metabolism]	NA|150aa|down_4|NZ_CP010874.1_508754_509204_-	TIGR01295, Pediocin_PA-1_biosynthesis_protein_PedC, bacteriocin transport accessory protein, putative	NA|180aa|down_5|NZ_CP010874.1_509334_509874_+	pfam03602, Cons_hypoth95, Conserved hypothetical protein 95	NA|97aa|down_6|NZ_CP010874.1_509885_510176_+	NA	NA|162aa|down_7|NZ_CP010874.1_510172_510658_+	cd02163, PPAT, Phosphopantetheine adenylyltransferase	NA|445aa|down_8|NZ_CP010874.1_511794_513129_+	cd00845, MPP_UshA_N_like, Escherichia coli UshA-like family, N-terminal metallophosphatase domain	NA|193aa|down_9|NZ_CP010874.1_513198_513777_+	COG4470, COG4470, Uncharacterized protein conserved in bacteria [Function unknown]
GCF_001592385.1_ASM159238v1	NZ_CP010874	Streptococcus agalactiae strain CU_GBS_08 chromosome, complete genome	2	905749-906510	3,2,2	PILER-CR,CRISPRCasFinder,CRT	no	cas9,cas1,cas2,csn2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type II-B,Type II-C,Type II-A	GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC,GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC,GTTTTAGAGCTGTGCTGTTTCGAATGGTTCCAAAAC	36,36,36	0	0	NA	NA	II-A:II-A:II-A	7,10,11	11	TypeII-B,TypeII-C,TypeII-A	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA,NA	NA|124aa|up_9|NZ_CP010874.1_895130_895502_+	pfam08349, DUF1722, Protein of unknown function (DUF1722)	NA|127aa|up_8|NZ_CP010874.1_895526_895907_+	TIGR02328, TIGR02328, conserved hypothetical protein	NA|377aa|up_7|NZ_CP010874.1_895998_897129_+	PRK08599, PRK08599, oxygen-independent coproporphyrinogen III oxidase	NA|246aa|up_6|NZ_CP010874.1_897132_897870_+	pfam01643, Acyl-ACP_TE, Acyl-ACP thioesterase	NA|257aa|up_5|NZ_CP010874.1_897870_898641_+	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|219aa|up_4|NZ_CP010874.1_898630_899287_+	COG4478, COG4478, Predicted membrane protein [Function unknown]	cas9|1371aa|up_3|NZ_CP010874.1_899674_903787_+	TIGR01865, conserved_hypothetical_protein, CRISPR subtype II/NMENI RNA-guided endonuclease Cas9/Csn1	cas1|290aa|up_2|NZ_CP010874.1_903788_904658_+	TIGR03639, cas1_NMENI, CRISPR-associated endonuclease Cas1, subtype II/NMENI	cas2|114aa|up_1|NZ_CP010874.1_904654_904996_+	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	csn2|222aa|up_0|NZ_CP010874.1_904982_905648_+	cd09758, Csn2, CRISPR/Cas system-associated protein Csn2	NA|139aa|down_0|NZ_CP010874.1_907067_907484_+	PRK00668, ndk, mulitfunctional nucleoside diphosphate kinase/apyrimidinic endonuclease/3'-; Validated	NA|611aa|down_1|NZ_CP010874.1_907619_909452_+	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	NA|878aa|down_2|NZ_CP010874.1_909698_912332_+	NF033189, internalin_A, class 1 internalin InlA	NA|220aa|down_3|NZ_CP010874.1_912431_913091_+	COG1418, COG1418, Predicted HD superfamily hydrolase [General function prediction only]	NA|155aa|down_4|NZ_CP010874.1_913099_913564_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|130aa|down_5|NZ_CP010874.1_913563_913953_+	PRK00222, PRK00222, peptide-methionine (R)-S-oxide reductase MsrB	NA|931aa|down_6|NZ_CP010874.1_914104_916897_+	COG0474, MgtA, Cation transport ATPase [Inorganic ion transport and metabolism]	NA|368aa|down_7|NZ_CP010874.1_916896_918000_+	pfam11187, DUF2974, Protein of unknown function (DUF2974)	NA|213aa|down_8|NZ_CP010874.1_918120_918759_-	cd03349, LbH_XAT, Xenobiotic acyltransferase (XAT): The XAT class of hexapeptide acyltransferases is composed of a large number of microbial enzymes that catalyze the CoA-dependent acetylation of a variety of hydroxyl-bearing acceptors such as chloramphenicol and streptogramin, among others	NA|204aa|down_9|NZ_CP010874.1_919469_920081_+	COG0398, COG0398, Uncharacterized conserved protein [Function unknown]
GCF_001592385.1_ASM159238v1	NZ_CP010874	Streptococcus agalactiae strain CU_GBS_08 chromosome, complete genome	3	1403587-1405128	3	CRT	no		cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Orphan	GANGCGCTNGTNCTNGCT	18	2	4	1403941-1403994|1404013-1404030|1404013-1404030|1404013-1404030	NZ_CP010874.1_1405285-1405338|NZ_CP010874.1_1405321-1405338|NZ_CP010874.1_1405249-1405266|NZ_CP010874.1_1405285-1405302	NA	23	23	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA,NA|117aa|down_4|NZ_CP010874.1_1415658_1416009_+,NA|53aa|down_5|NZ_CP010874.1_1416100_1416259_-	NA|331aa|up_9|NZ_CP010874.1_1390874_1391867_-	TIGR03711, acc_sec_asp3, accessory Sec system protein Asp3	NA|520aa|up_8|NZ_CP010874.1_1391863_1393423_-	TIGR03712, acc_sec_asp2, accessory Sec system protein Asp2	NA|515aa|up_7|NZ_CP010874.1_1393429_1394974_-	pfam16993, Asp1, Accessory Sec system protein Asp1	NA|410aa|up_6|NZ_CP010874.1_1394973_1396203_-	PRK12417, secY, preprotein translocase subunit SecY; Reviewed	NA|399aa|up_5|NZ_CP010874.1_1396325_1397522_-	TIGR03728, glyco_access_1, glycosyltransferase, SP_1767 family	NA|292aa|up_4|NZ_CP010874.1_1397582_1398458_-	pfam00535, Glycos_transf_2, Glycosyl transferase family 2	NA|395aa|up_3|NZ_CP010874.1_1398450_1399635_-	cd04194, GT8_A4GalT_like, A4GalT_like proteins catalyze the addition of galactose or glucose residues to the lipooligosaccharide (LOS) or lipopolysaccharide (LPS) of the bacterial cell surface	NA|414aa|up_2|NZ_CP010874.1_1399624_1400866_-	cd04194, GT8_A4GalT_like, A4GalT_like proteins catalyze the addition of galactose or glucose residues to the lipooligosaccharide (LOS) or lipopolysaccharide (LPS) of the bacterial cell surface	NA|402aa|up_1|NZ_CP010874.1_1400862_1402068_-	cd04194, GT8_A4GalT_like, A4GalT_like proteins catalyze the addition of galactose or glucose residues to the lipooligosaccharide (LOS) or lipopolysaccharide (LPS) of the bacterial cell surface	NA|336aa|up_0|NZ_CP010874.1_1402076_1403084_-	PRK09814, PRK09814, sugar transferase	NA|664aa|down_0|NZ_CP010874.1_1409431_1411423_-	PRK05298, PRK05298, excinuclease ABC subunit UvrB	NA|307aa|down_1|NZ_CP010874.1_1411483_1412404_-	pfam02517, Abi, CAAX protease self-immunity	NA|728aa|down_2|NZ_CP010874.1_1412586_1414770_+	cd13619, PBP2_GlnP, Glutamine-binding domain of ABC transporter, a member of the type 2 periplasmic binding fold protein superfamily	NA|247aa|down_3|NZ_CP010874.1_1414769_1415510_+	COG1126, GlnQ, ABC-type polar amino acid transport system, ATPase component [Amino acid transport and metabolism]	NA|117aa|down_4|NZ_CP010874.1_1415658_1416009_+	NA	NA|53aa|down_5|NZ_CP010874.1_1416100_1416259_-	NA	NA|438aa|down_6|NZ_CP010874.1_1416284_1417598_-	PRK12297, obgE, GTPase CgtA; Reviewed	NA|43aa|down_7|NZ_CP010874.1_1417658_1417787_-	pfam13253, DUF4044, Protein of unknown function (DUF4044)	NA|414aa|down_8|NZ_CP010874.1_1417964_1419206_+	pfam02073, Peptidase_M29, Thermophilic metalloprotease (M29)	NA|193aa|down_9|NZ_CP010874.1_1419239_1419818_-	pfam05887, Trypan_PARP, Procyclic acidic repetitive protein (PARP)
GCF_001592385.1_ASM159238v1	NZ_CP010874	Streptococcus agalactiae strain CU_GBS_08 chromosome, complete genome	4	1925632-1926129	4	CRT	no		cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Orphan	CTGGTTTGGCNTCTGGNT	18	1	1	1926094-1926111	NZ_CP010874.1_2025494-2025477	NA	8	8	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|203aa|up_4|NZ_CP010874.1_1917991_1918600_+,NA	NA|615aa|up_9|NZ_CP010874.1_1905055_1906900_-	PRK08645, PRK08645, bifunctional homocysteine S-methyltransferase/5,10-methylenetetrahydrofolate reductase protein; Reviewed	NA|746aa|up_8|NZ_CP010874.1_1906944_1909182_-	PRK05222, PRK05222, 5-methyltetrahydropteroyltriglutamate--homocysteine S-methyltransferase; Provisional	NA|108aa|up_7|NZ_CP010874.1_1909551_1909875_-	COG4392, COG4392, Predicted membrane protein [Function unknown]	NA|231aa|up_6|NZ_CP010874.1_1909864_1910557_-	COG1296, AzlC, Predicted branched-chain amino acid permease (azaleucine resistance) [Amino acid transport and metabolism]	NA|463aa|up_5|NZ_CP010874.1_1916510_1917899_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|203aa|up_4|NZ_CP010874.1_1917991_1918600_+	NA	NA|834aa|up_3|NZ_CP010874.1_1918689_1921191_-	PRK00390, leuS, leucyl-tRNA synthetase; Validated	NA|416aa|up_2|NZ_CP010874.1_1921567_1922815_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|269aa|up_1|NZ_CP010874.1_1923472_1924278_-	pfam13359, DDE_Tnp_4, DDE superfamily endonuclease	NA|180aa|up_0|NZ_CP010874.1_1924701_1925241_-	PRK05609, nusG, transcription antitermination protein NusG; Validated	NA|59aa|down_0|NZ_CP010874.1_1928232_1928409_-	COG0690, SecE, Preprotein translocase subunit SecE [Intracellular trafficking and secretion]	NA|51aa|down_1|NZ_CP010874.1_1928441_1928594_-	PRK00504, rpmG, 50S ribosomal protein L33; Validated	NA|774aa|down_2|NZ_CP010874.1_1928642_1930964_-	COG0744, MrcB, Membrane carboxypeptidase (penicillin-binding protein) [Cell envelope biogenesis, outer membrane]	NA|295aa|down_3|NZ_CP010874.1_1931007_1931892_+	COG0564, RluA, Pseudouridylate synthases, 23S RNA-specific [Translation, ribosomal structure and biogenesis]	NA|547aa|down_4|NZ_CP010874.1_1931916_1933557_-	COG4640, COG4640, Predicted membrane protein [Function unknown]	NA|404aa|down_5|NZ_CP010874.1_1933726_1934938_-	PRK05362, PRK05362, phosphopentomutase; Provisional	NA|224aa|down_6|NZ_CP010874.1_1935004_1935676_-	PRK00507, PRK00507, deoxyribose-phosphate aldolase; Provisional	NA|401aa|down_7|NZ_CP010874.1_1935705_1936908_-	COG1972, NupC, Nucleoside permease [Nucleotide transport and metabolism]	NA|260aa|down_8|NZ_CP010874.1_1936928_1937708_-	cd17767, UP_EcUdp-like, uridine phosphorylases similar to Escherichia coli Udp and related phosphorylases	NA|246aa|down_9|NZ_CP010874.1_1937866_1938604_+	COG2188, PhnF, Transcriptional regulators [Transcription]
GCF_001592385.1_ASM159238v1	NZ_CP010874	Streptococcus agalactiae strain CU_GBS_08 chromosome, complete genome	5	1975682-1975768	3	CRISPRCasFinder	no	csa3	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	Type I-A	AGCAGTATCGTACTTAGTTTGAGC	24	0	0	NA	NA	NA	1	1	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,DinG,cas9,csn2,csm6,DEDDh,WYL,csa3	NA|154aa|up_0|NZ_CP010874.1_1974336_1974798_-,NA|319aa|down_1|NZ_CP010874.1_1978187_1979144_-,NA|98aa|down_2|NZ_CP010874.1_1979378_1979672_+,NA|147aa|down_3|NZ_CP010874.1_1979753_1980194_+,NA|177aa|down_4|NZ_CP010874.1_1980190_1980721_+,NA|424aa|down_6|NZ_CP010874.1_1981630_1982902_+,NA|88aa|down_7|NZ_CP010874.1_1982984_1983248_+,NA|62aa|down_9|NZ_CP010874.1_1984814_1985000_-	NA|146aa|up_9|NZ_CP010874.1_1965677_1966115_-	TIGR01529, Arginine_repressor	NA|564aa|up_8|NZ_CP010874.1_1966336_1968028_+	PRK12451, PRK12451, arginyl-tRNA synthetase; Reviewed	NA|103aa|up_7|NZ_CP010874.1_1968115_1968424_+	pfam08951, EntA_Immun, Enterocin A Immunity	NA|291aa|up_6|NZ_CP010874.1_1968450_1969323_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|315aa|up_5|NZ_CP010874.1_1969430_1970375_-	COG1284, COG1284, Uncharacterized conserved protein [Function unknown]	NA|584aa|up_4|NZ_CP010874.1_1970364_1972116_-	PRK00476, aspS, aspartyl-tRNA synthetase; Validated	NA|427aa|up_3|NZ_CP010874.1_1972208_1973489_-	PRK00037, hisS, histidyl-tRNA synthetase; Reviewed	NA|61aa|up_2|NZ_CP010874.1_1973708_1973891_+	PRK01110, rpmF, 50S ribosomal protein L32; Validated	NA|50aa|up_1|NZ_CP010874.1_1973906_1974056_+	PRK00595, rpmG, 50S ribosomal protein L33; Validated	NA|154aa|up_0|NZ_CP010874.1_1974336_1974798_-	NA	NA|112aa|down_0|NZ_CP010874.1_1977815_1978151_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|319aa|down_1|NZ_CP010874.1_1978187_1979144_-	NA	NA|98aa|down_2|NZ_CP010874.1_1979378_1979672_+	NA	NA|147aa|down_3|NZ_CP010874.1_1979753_1980194_+	NA	NA|177aa|down_4|NZ_CP010874.1_1980190_1980721_+	NA	NA|249aa|down_5|NZ_CP010874.1_1980720_1981467_+	COG1674, FtsK, DNA segregation ATPase FtsK/SpoIIIE and related proteins [Cell division and chromosome partitioning]	NA|424aa|down_6|NZ_CP010874.1_1981630_1982902_+	NA	NA|88aa|down_7|NZ_CP010874.1_1982984_1983248_+	NA	NA|422aa|down_8|NZ_CP010874.1_1983344_1984610_+	cd01189, INT_ICEBs1_C_like, C-terminal catalytic domain of integrases from bacterial phages and conjugate transposons	NA|62aa|down_9|NZ_CP010874.1_1984814_1985000_-	NA
