assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000479335.1_ASM47933v1	NC_022584	Streptococcus sp. I-G2, complete genome	1	231990-232204	1	CRT	no		cas9,cas1,cas2,csn2,csm6,DinG,csa3,DEDDh,cas3	Orphan	TCCGGGGGACCTTTTTAAC	19	0	0	NA	NA	NA	4	4	Orphan	cas9,cas1,cas2,csn2,csm6,DinG,csa3,DEDDh,cas3	NA,NA|267aa|down_2|NC_022584.1_233531_234332_+	NA|299aa|up_9|NC_022584.1_222399_223296_+	PRK05416, PRK05416, RNase adapter RapZ	NA|326aa|up_8|NC_022584.1_223292_224270_+	TIGR01826, Putative_gluconeogenesis_factor, conserved hypothetical protein, cofD-related	NA|307aa|up_7|NC_022584.1_224266_225187_+	COG1481, COG1481, Uncharacterized protein conserved in bacteria [Function unknown]	NA|323aa|up_6|NC_022584.1_225602_226571_-	COG0492, TrxB, Thioredoxin reductase [Posttranslational modification, protein turnover, chaperones]	NA|290aa|up_5|NC_022584.1_226775_227645_+	COG0580, GlpF, Glycerol uptake facilitator and related permeases (Major Intrinsic Protein Family) [Carbohydrate transport and metabolism]	NA|104aa|up_4|NC_022584.1_227724_228036_+	pfam15592, Imm41, Immunity protein 41	NA|59aa|up_3|NC_022584.1_228182_228359_+	PRK00270, rpsU, 30S ribosomal protein S21; Reviewed	NA|127aa|up_2|NC_022584.1_228460_228841_-	COG1970, MscL, Large-conductance mechanosensitive channel [Cell envelope biogenesis, outer membrane]	NA|596aa|up_1|NC_022584.1_229081_230869_+	PRK05667, dnaG, DNA primase; Validated	NA|371aa|up_0|NC_022584.1_230871_231984_+	PRK09210, PRK09210, RNA polymerase sigma factor RpoD; Validated	NA|110aa|down_0|NC_022584.1_232329_232659_+	COG2151, PaaD, Predicted metal-sulfur cluster biosynthetic enzyme [General function prediction only]	NA|236aa|down_1|NC_022584.1_232814_233522_+	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|267aa|down_2|NC_022584.1_233531_234332_+	NA	NA|1034aa|down_3|NC_022584.1_235261_238363_+	PRK07279, dnaE, DNA polymerase III DnaE; Reviewed	NA|338aa|down_4|NC_022584.1_238448_239462_+	PRK03202, PRK03202, ATP-dependent 6-phosphofructokinase	NA|502aa|down_5|NC_022584.1_239522_241028_+	PRK05826, PRK05826, pyruvate kinase; Provisional	NA|186aa|down_6|NC_022584.1_241172_241730_+	TIGR02227, Inactive_signal_peptidase_IA	NA|398aa|down_7|NC_022584.1_241822_243016_-	COG0053, MMT1, Predicted Co/Zn/Cd cation transporters [Inorganic ion transport and metabolism]	NA|762aa|down_8|NC_022584.1_243201_245487_+	TIGR01073, ATP-dependent_DNA_helicase_PcrA, ATP-dependent DNA helicase PcrA	NA|425aa|down_9|NC_022584.1_245858_247133_+	pfam09903, DUF2130, Uncharacterized protein conserved in bacteria (DUF2130)
GCF_000479335.1_ASM47933v1	NC_022584	Streptococcus sp. I-G2, complete genome	2	378085-379637	1,2,1	CRISPRCasFinder,CRT,PILER-CR	no	cas9,cas1,cas2,csn2,csm6	cas9,cas1,cas2,csn2,csm6,DinG,csa3,DEDDh,cas3	Type II-C,Type II-B,Type II-A	GTTTTTGTACTCTCAAGATTTAAGTAACTGTACAAC,GTTTTTGTACTCTCAAGATTTAAGTAACTGTACAAC,GTTTTTGTACTCTCAAGATTTAAGTAACTGTACAAC	36,36,36	0	0	NA	NA	NA:NA:NA	23,23,10	23	TypeII-C,TypeII-B,TypeII-A	cas9,cas1,cas2,csn2,csm6,DinG,csa3,DEDDh,cas3	NA,NA	NA|331aa|up_9|NC_022584.1_366878_367871_-	pfam09770, PAT1, Topoisomerase II-associated protein PAT1	NA|313aa|up_8|NC_022584.1_368053_368992_-	COG0618, COG0618, Exopolyphosphatase-related proteins [General function prediction only]	NA|148aa|up_7|NC_022584.1_369169_369613_+	PRK07308, PRK07308, flavodoxin; Validated	NA|94aa|up_6|NC_022584.1_369732_370014_+	PRK07248, PRK07248, chorismate mutase	NA|404aa|up_5|NC_022584.1_370015_371227_+	cd03682, ClC_sycA_like, ClC sycA-like chloride channel proteins	NA|116aa|up_4|NC_022584.1_371344_371692_+	PRK05338, rplS, 50S ribosomal protein L19; Provisional	cas9|1128aa|up_3|NC_022584.1_372172_375556_+	TIGR01865, conserved_hypothetical_protein, CRISPR subtype II/NMENI RNA-guided endonuclease Cas9/Csn1	cas1|303aa|up_2|NC_022584.1_375736_376645_+	TIGR03639, cas1_NMENI, CRISPR-associated endonuclease Cas1, subtype II/NMENI	cas2|108aa|up_1|NC_022584.1_376649_376973_+	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	csn2|348aa|up_0|NC_022584.1_376969_378013_+	cd12217, Stu0660_Csn2, Stu0660-like CRISPR/Cas system-associated protein Csn2	NA|271aa|down_0|NC_022584.1_380299_381112_+	COG2339, prsW, Membrane proteinase, regulator of anti-sigma factor [Posttranslational modification, protein turnover, chaperones]	NA|458aa|down_1|NC_022584.1_381155_382529_-	PRK05291, trmE, tRNA uridine-5-carboxymethylaminomethyl(34) synthesis GTPase MnmE	NA|233aa|down_2|NC_022584.1_382691_383390_+	PRK00702, PRK00702, ribose-5-phosphate isomerase RpiA	NA|404aa|down_3|NC_022584.1_383455_384667_+	PRK05362, PRK05362, phosphopentomutase; Provisional	NA|181aa|down_4|NC_022584.1_384668_385211_+	COG3797, COG3797, Uncharacterized protein conserved in bacteria [Function unknown]	NA|270aa|down_5|NC_022584.1_385224_386034_+	PRK08202, PRK08202, purine nucleoside phosphorylase; Provisional	NA|237aa|down_6|NC_022584.1_387660_388371_+	PRK05819, deoD, DeoD-type purine-nucleoside phosphorylase	csm6|253aa|down_7|NC_022584.1_388370_389129_+	pfam09659, Cas_Csm6, CRISPR-associated protein (Cas_Csm6)	NA|244aa|down_8|NC_022584.1_389139_389871_+	PRK00481, PRK00481, NAD-dependent deacetylase; Provisional	NA|303aa|down_9|NC_022584.1_389943_390852_-	COG0583, LysR, Transcriptional regulator [Transcription]
GCF_000479335.1_ASM47933v1	NC_022584	Streptococcus sp. I-G2, complete genome	3	667679-667761	2	CRISPRCasFinder	no		cas9,cas1,cas2,csn2,csm6,DinG,csa3,DEDDh,cas3	Orphan	TTCTGGTGTCTGCCACCGCTTGGCCCTTA	29	0	0	NA	NA	NA	1	1	Orphan	cas9,cas1,cas2,csn2,csm6,DinG,csa3,DEDDh,cas3	NA|128aa|up_9|NC_022584.1_656785_657169_-,NA|78aa|up_8|NC_022584.1_657165_657399_-,NA|214aa|up_6|NC_022584.1_658544_659186_-,NA|66aa|up_5|NC_022584.1_659345_659543_+,NA|99aa|up_4|NC_022584.1_659556_659853_-,NA|95aa|up_3|NC_022584.1_659866_660151_-,NA|137aa|up_1|NC_022584.1_666491_666902_-,NA|285aa|down_3|NC_022584.1_673402_674257_-,NA|81aa|down_4|NC_022584.1_674273_674516_-,NA|163aa|down_6|NC_022584.1_676413_676902_-,NA|100aa|down_7|NC_022584.1_676891_677191_-,NA|78aa|down_9|NC_022584.1_678114_678348_-	NA|128aa|up_9|NC_022584.1_656785_657169_-	NA	NA|78aa|up_8|NC_022584.1_657165_657399_-	NA	NA|362aa|up_7|NC_022584.1_657449_658535_-	pfam13154, DUF3991, Protein of unknown function (DUF3991)	NA|214aa|up_6|NC_022584.1_658544_659186_-	NA	NA|66aa|up_5|NC_022584.1_659345_659543_+	NA	NA|99aa|up_4|NC_022584.1_659556_659853_-	NA	NA|95aa|up_3|NC_022584.1_659866_660151_-	NA	NA|2078aa|up_2|NC_022584.1_660225_666459_-	COG4646, COG4646, DNA methylase [Transcription / DNA replication, recombination, and repair]	NA|137aa|up_1|NC_022584.1_666491_666902_-	NA	NA|189aa|up_0|NC_022584.1_667052_667619_-	pfam18813, PBECR4, phage-Barnase-EndoU-ColicinE5/D-RelE like nuclease4	NA|938aa|down_0|NC_022584.1_667856_670670_-	pfam18013, Phage_lysozyme2, Phage tail lysozyme	NA|772aa|down_1|NC_022584.1_670681_672997_-	TIGR02746, hypothetical_protein, type-IV secretion system protein TraC	NA|120aa|down_2|NC_022584.1_672989_673349_-	pfam12666, PrgI, PrgI family protein	NA|285aa|down_3|NC_022584.1_673402_674257_-	NA	NA|81aa|down_4|NC_022584.1_674273_674516_-	NA	NA|626aa|down_5|NC_022584.1_674536_676414_-	COG3505, VirD4, Type IV secretory pathway, VirD4 components [Intracellular trafficking and secretion]	NA|163aa|down_6|NC_022584.1_676413_676902_-	NA	NA|100aa|down_7|NC_022584.1_676891_677191_-	NA	NA|196aa|down_8|NC_022584.1_677524_678112_-	pfam02517, Abi, CAAX protease self-immunity	NA|78aa|down_9|NC_022584.1_678114_678348_-	NA
GCF_000479335.1_ASM47933v1	NC_022584	Streptococcus sp. I-G2, complete genome	4	1624728-1624819	3	CRISPRCasFinder	no		cas9,cas1,cas2,csn2,csm6,DinG,csa3,DEDDh,cas3	Orphan	GTTGAAGTTGTAGTCGGTTCTTC	23	0	0	NA	NA	NA	1	1	Orphan	cas9,cas1,cas2,csn2,csm6,DinG,csa3,DEDDh,cas3	NA|63aa|up_3|NC_022584.1_1621606_1621795_+,NA|77aa|up_0|NC_022584.1_1623988_1624219_+,NA|47aa|down_4|NC_022584.1_1633526_1633667_+	NA|114aa|up_9|NC_022584.1_1617307_1617649_+	COG2151, PaaD, Predicted metal-sulfur cluster biosynthetic enzyme [General function prediction only]	NA|568aa|up_8|NC_022584.1_1617697_1619401_-	PRK00911, PRK00911, dihydroxy-acid dehydratase; Provisional	NA|341aa|up_7|NC_022584.1_1619589_1620612_+	cd03402, SPFH_like_u2, Uncharacterized family; SPFH (stomatin, prohibitin, flotillin, and HflK/C) superfamily	NA|67aa|up_6|NC_022584.1_1620614_1620815_+	COG4877, COG4877, Uncharacterized protein conserved in bacteria [Function unknown]	NA|61aa|up_5|NC_022584.1_1620965_1621148_+	PRK01110, rpmF, 50S ribosomal protein L32; Validated	NA|50aa|up_4|NC_022584.1_1621163_1621313_+	PRK00595, rpmG, 50S ribosomal protein L33; Validated	NA|63aa|up_3|NC_022584.1_1621606_1621795_+	NA	NA|204aa|up_2|NC_022584.1_1621787_1622399_+	COG2184, Fic, Protein involved in cell division [Cell division and chromosome partitioning]	NA|283aa|up_1|NC_022584.1_1622604_1623453_-	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|77aa|up_0|NC_022584.1_1623988_1624219_+	NA	NA|331aa|down_0|NC_022584.1_1626595_1627588_+	COG2502, AsnA, Asparagine synthetase A [Amino acid transport and metabolism]	NA|425aa|down_1|NC_022584.1_1627778_1629053_+	PRK00037, hisS, histidyl-tRNA synthetase; Reviewed	NA|594aa|down_2|NC_022584.1_1629396_1631178_+	COG5617, COG5617, Predicted integral membrane protein [Function unknown]	NA|737aa|down_3|NC_022584.1_1631303_1633514_+	PRK09263, PRK09263, anaerobic ribonucleoside triphosphate reductase; Provisional	NA|47aa|down_4|NC_022584.1_1633526_1633667_+	NA	NA|167aa|down_5|NC_022584.1_1633710_1634211_+	COG3981, COG3981, Predicted acetyltransferase [General function prediction only]	NA|199aa|down_6|NC_022584.1_1634215_1634812_+	pfam13353, Fer4_12, 4Fe-4S single cluster domain	NA|495aa|down_7|NC_022584.1_1635006_1636491_+	PRK09225, PRK09225, threonine synthase; Validated	NA|428aa|down_8|NC_022584.1_1636551_1637835_+	cd13137, MATE_NorM_like, Subfamily of the multidrug and toxic compound extrusion (MATE)-like proteins similar to Thermotoga marina NorM	NA|208aa|down_9|NC_022584.1_1637840_1638464_+	cd07523, HAD_YsbA-like, uncharacterized family of the haloacid dehalogenase-like superfamily, similar to the uncharacterized Lactococcus lactis YsbA
