assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001021955.1_ASM102195v1	NZ_CP008776	Streptococcus pyogenes strain 5448 chromosome, complete genome	1	598749-599043	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	Type I-U, Type I-U?,Type I-C	GTCTCACCCTTCATGGGTGAGTGGATTGAAA,GTCTCACCCTTCATGGGTGAGTGGATTGAAAT,GTCTCACCCTTCATGGGTGAGTGGATTGAAAT	31,32,32	0	0	NA	NA	I-C:I-C:I-C	4,4,4	4	TypeI-U,TypeI-U?,TypeI-C	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	NA,NA	NA|132aa|up_9|NZ_CP008776.1_586217_586613_+	PRK07758, PRK07758, hypothetical protein; Provisional	NA|188aa|up_8|NZ_CP008776.1_587213_587777_+	pfam13238, AAA_18, AAA domain	NA|883aa|up_7|NZ_CP008776.1_587778_590427_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	cas3|803aa|up_6|NZ_CP008776.1_590580_592989_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|243aa|up_5|NZ_CP008776.1_593121_593850_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|632aa|up_4|NZ_CP008776.1_593849_595745_+	cd09642, Cas8c_I-C, CRISPR/Cas system-associated protein Cas8c	cas7|283aa|up_3|NZ_CP008776.1_595749_596598_+	COG3649, COG3649, CRISPR system related protein [Defense mechanisms]	cas4|225aa|up_2|NZ_CP008776.1_596599_597274_+	COG1468, COG1468, CRISPR-associated protein Cas4 (RecB family exonuclease) [Defense    mechanisms]	cas1|342aa|up_1|NZ_CP008776.1_597270_598296_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas2|98aa|up_0|NZ_CP008776.1_598306_598600_+	COG1343, COG1343, CRISPR-associated protein Cas2 [Defense mechanisms]	NA|237aa|down_0|NZ_CP008776.1_599202_599913_+	COG0785, CcdA, Cytochrome c biogenesis protein [Posttranslational modification, protein turnover, chaperones]	NA|208aa|down_1|NZ_CP008776.1_599925_600549_+	cd02966, TlpA_like_family, TlpA-like family; composed of  TlpA, ResA, DsbE and similar proteins	NA|369aa|down_2|NZ_CP008776.1_600591_601698_+	PRK14018, PRK14018, bifunctional peptide-methionine (S)-S-oxide reductase MsrA/peptide-methionine (R)-S-oxide reductase MsrB	NA|247aa|down_3|NZ_CP008776.1_601785_602526_+	COG4753, COG4753, Response regulator containing CheY-like receiver domain and AraC-type DNA-binding domain [Signal transduction mechanisms]	NA|578aa|down_4|NZ_CP008776.1_602522_604256_+	COG2972, COG2972, Predicted signal transduction protein with a C-terminal ATPase domain [Signal transduction mechanisms]	NA|360aa|down_5|NZ_CP008776.1_604328_605408_+	COG2315, MmcQ, Uncharacterized protein conserved in bacteria [Function unknown]	NA|239aa|down_6|NZ_CP008776.1_605421_606138_+	COG3382, COG3382, Solo B3/4 domain (OB-fold DNA/RNA-binding) of Phe-aaRS-beta [General function prediction only]	NA|158aa|down_7|NZ_CP008776.1_606303_606777_-	COG1438, ArgR, Arginine repressor [Transcription]	NA|227aa|down_8|NZ_CP008776.1_606918_607599_+	COG0664, Crp, cAMP-binding proteins - catabolite gene activator and regulatory subunit of cAMP-dependent protein kinases [Signal transduction mechanisms]	NA|412aa|down_9|NZ_CP008776.1_607872_609108_+	PRK01388, PRK01388, arginine deiminase; Provisional
GCF_001021955.1_ASM102195v1	NZ_CP008776	Streptococcus pyogenes strain 5448 chromosome, complete genome	2	759163-759298	2	CRISPRCasFinder	no		cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	Orphan	GCCTTAGAAGCATTAGCGGATCAAACAGACGCTTTACAATCAGAAGAAGCTG	52	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	NA,NA	NA|209aa|up_9|NZ_CP008776.1_747420_748047_+	PRK05480, PRK05480, uridine/cytidine kinase; Provisional	NA|88aa|up_8|NZ_CP008776.1_748126_748390_+	COG3326, COG3326, Predicted membrane protein [Function unknown]	NA|270aa|up_7|NZ_CP008776.1_748442_749252_-	COG2339, prsW, Membrane proteinase, regulator of anti-sigma factor [Posttranslational modification, protein turnover, chaperones]	NA|166aa|up_6|NZ_CP008776.1_749396_749894_+	COG1956, COG1956, GAF domain-containing protein [Signal transduction mechanisms]	NA|557aa|up_5|NZ_CP008776.1_749893_751564_+	PRK05563, PRK05563, DNA polymerase III subunits gamma and tau; Validated	NA|68aa|up_4|NZ_CP008776.1_751658_751862_+	pfam11676, DUF3272, Protein of unknown function (DUF3272)	NA|314aa|up_3|NZ_CP008776.1_751836_752778_-	PRK11886, PRK11886, bifunctional biotin--[acetyl-CoA-carboxylase] ligase/biotin operon repressor BirA	NA|793aa|up_2|NZ_CP008776.1_752981_755360_+	COG4886, COG4886, Leucine-rich repeat (LRR) protein [Function unknown]	NA|399aa|up_1|NZ_CP008776.1_755896_757093_+	PRK05250, PRK05250, S-adenosylmethionine synthetase; Validated	NA|420aa|up_0|NZ_CP008776.1_757266_758526_+	PRK12830, PRK12830, UDP-N-acetylglucosamine 1-carboxyvinyltransferase; Reviewed	NA|181aa|down_0|NZ_CP008776.1_759774_760317_+	COG1670, RimL, Acetyltransferases, including N-acetylases of ribosomal proteins [Translation, ribosomal structure and biogenesis]	NA|428aa|down_1|NZ_CP008776.1_760325_761609_+	COG4109, COG4109, Predicted transcriptional regulator containing CBS domains [Transcription]	NA|287aa|down_2|NZ_CP008776.1_761624_762485_+	PRK07281, PRK07281, methionyl aminopeptidase	NA|322aa|down_3|NZ_CP008776.1_762486_763452_+	COG1295, Rbn, Ribonuclease BN family enzyme [Replication, recombination, and repair]	NA|428aa|down_4|NZ_CP008776.1_763562_764846_+	PRK02427, PRK02427, 3-phosphoshikimate 1-carboxyvinyltransferase; Provisional	NA|164aa|down_5|NZ_CP008776.1_764838_765330_+	PRK00131, aroK, shikimate kinase; Reviewed	NA|484aa|down_6|NZ_CP008776.1_765537_766989_+	COG1316, LytR, Transcriptional regulator [Transcription]	NA|463aa|down_7|NZ_CP008776.1_767037_768426_+	COG2265, TrmA, SAM-dependent methyltransferases related to tRNA (uracil-5-)-methyltransferase [Translation, ribosomal structure and biogenesis]	NA|134aa|down_8|NZ_CP008776.1_769327_769729_+	COG2050, PaaI, HGG motif-containing thioesterase, possibly involved in aromatic compounds catabolism [Secondary metabolites biosynthesis,    transport, and catabolism]	NA|495aa|down_9|NZ_CP008776.1_769835_771320_-	PRK13663, PRK13663, hypothetical protein; Provisional
GCF_001021955.1_ASM102195v1	NZ_CP008776	Streptococcus pyogenes strain 5448 chromosome, complete genome	3	864797-864897	3	CRISPRCasFinder	no		cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	Orphan	TATAATTAGACTATACCAATTTT	23	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	NA|63aa|up_8|NZ_CP008776.1_854660_854849_+,NA|262aa|up_6|NZ_CP008776.1_856180_856966_-,NA	NA|252aa|up_9|NZ_CP008776.1_853685_854441_-	pfam02876, Stap_Strp_tox_C, Staphylococcal/Streptococcal toxin, beta-grasp domain	NA|63aa|up_8|NZ_CP008776.1_854660_854849_+	NA	NA|205aa|up_7|NZ_CP008776.1_855439_856054_+	COG0398, COG0398, Uncharacterized conserved protein [Function unknown]	NA|262aa|up_6|NZ_CP008776.1_856180_856966_-	NA	NA|233aa|up_5|NZ_CP008776.1_856975_857674_-	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|124aa|up_4|NZ_CP008776.1_857673_858045_-	COG1725, COG1725, Predicted transcriptional regulators [Transcription]	NA|1037aa|up_3|NZ_CP008776.1_858229_861340_+	PRK07279, dnaE, DNA polymerase III DnaE; Reviewed	NA|338aa|up_2|NZ_CP008776.1_861419_862433_+	PRK03202, PRK03202, ATP-dependent 6-phosphofructokinase	NA|501aa|up_1|NZ_CP008776.1_862495_863998_+	PRK05826, PRK05826, pyruvate kinase; Provisional	NA|186aa|up_0|NZ_CP008776.1_864215_864773_+	TIGR02227, Inactive_signal_peptidase_IA	NA|605aa|down_0|NZ_CP008776.1_864948_866763_+	PRK00331, PRK00331, isomerizing glutamine--fructose-6-phosphate transaminase	NA|112aa|down_1|NZ_CP008776.1_866958_867294_+	COG2824, PhnA, Uncharacterized Zn-ribbon-containing protein involved in phosphonate metabolism [Inorganic ion transport and metabolism]	NA|214aa|down_2|NZ_CP008776.1_867399_868041_+	COG0765, HisM, ABC-type amino acid transport system, permease component [Amino acid transport and metabolism]	NA|210aa|down_3|NZ_CP008776.1_868050_868680_+	COG1126, GlnQ, ABC-type polar amino acid transport system, ATPase component [Amino acid transport and metabolism]	NA|279aa|down_4|NZ_CP008776.1_868695_869532_+	cd00996, PBP2_AatB_like, Polar amino acids-binding domain of ATP-binding cassette transporter-like systems that belong to the type 2 periplasmic binding fold protein superfamily	NA|258aa|down_5|NZ_CP008776.1_869901_870675_+	pfam07373, CAMP_factor, CAMP factor (Cfa)	NA|412aa|down_6|NZ_CP008776.1_871043_872279_-	COG0053, MMT1, Predicted Co/Zn/Cd cation transporters [Inorganic ion transport and metabolism]	NA|441aa|down_7|NZ_CP008776.1_872398_873721_-	COG1115, AlsT, Na+/alanine symporter [Amino acid transport and metabolism]	NA|773aa|down_8|NZ_CP008776.1_874249_876568_+	TIGR01073, ATP-dependent_DNA_helicase_PcrA, ATP-dependent DNA helicase PcrA	NA|83aa|down_9|NZ_CP008776.1_876931_877180_+	COG2261, COG2261, Predicted membrane protein [Function unknown]
GCF_001021955.1_ASM102195v1	NZ_CP008776	Streptococcus pyogenes strain 5448 chromosome, complete genome	4	1059134-1059367	4,2,2	CRISPRCasFinder,CRT,PILER-CR	no	csn2,cas2,cas1,cas9	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	Type II-A,Type II-B,Type II-C	GTTTTGGGACCATTCAAAACAGCATAGCTCTAAAAC,GTTTTGGGACCATTCAAAACAGCATAGCTCTAAAAC,GTTTTGGGACCATTCAAAACAGCATAGCTCTAAAAC	36,36,36	0	0	NA	NA	II-A:II-A:II-A	3,3,2	3	TypeII-A,TypeII-B,TypeII-C	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	NA,NA|214aa|down_8|NZ_CP008776.1_1069265_1069907_-	NA|263aa|up_9|NZ_CP008776.1_1048392_1049181_-	COG4753, COG4753, Response regulator containing CheY-like receiver domain and AraC-type DNA-binding domain [Signal transduction mechanisms]	NA|550aa|up_8|NZ_CP008776.1_1049184_1050834_-	COG2972, COG2972, Predicted signal transduction protein with a C-terminal ATPase domain [Signal transduction mechanisms]	NA|276aa|up_7|NZ_CP008776.1_1050969_1051797_-	COG3716, ManZ, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IID [Carbohydrate transport and metabolism]	NA|270aa|up_6|NZ_CP008776.1_1051793_1052603_-	COG3715, ManY, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IIC [Carbohydrate transport and metabolism]	NA|164aa|up_5|NZ_CP008776.1_1052619_1053111_-	COG3444, COG3444, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IIB [Carbohydrate transport and metabolism]	NA|142aa|up_4|NZ_CP008776.1_1053129_1053555_-	COG2893, ManX, Phosphotransferase system, mannose/fructose-specific component IIA [Carbohydrate transport and metabolism]	NA|340aa|up_3|NZ_CP008776.1_1053761_1054781_-	COG2855, COG2855, Predicted membrane protein [Function unknown]	NA|146aa|up_2|NZ_CP008776.1_1054895_1055333_-	PRK00222, PRK00222, peptide-methionine (R)-S-oxide reductase MsrB	NA|294aa|up_1|NZ_CP008776.1_1055518_1056400_-	pfam00746, Gram_pos_anchor, LPXTG cell wall anchor motif	NA|611aa|up_0|NZ_CP008776.1_1056657_1058490_-	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	csn2|221aa|down_0|NZ_CP008776.1_1059469_1060132_-	cd09758, Csn2, CRISPR/Cas system-associated protein Csn2	cas2|114aa|down_1|NZ_CP008776.1_1060121_1060463_-	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	cas1|290aa|down_2|NZ_CP008776.1_1060459_1061329_-	cd09720, Cas1_II, CRISPR/Cas system-associated protein Cas1	cas9|1369aa|down_3|NZ_CP008776.1_1061328_1065435_-	COG3513, COG3513, Predicted CRISPR-associated nuclease, contains McrA/HNH-nuclease and RuvC-like nuclease domain [Defense mechanisms]	NA|211aa|down_4|NZ_CP008776.1_1065914_1066547_-	COG4478, COG4478, Predicted membrane protein [Function unknown]	NA|255aa|down_5|NZ_CP008776.1_1066546_1067311_-	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|251aa|down_6|NZ_CP008776.1_1067310_1068063_-	COG3884, FatA, Acyl-ACP thioesterase [Lipid metabolism]	NA|377aa|down_7|NZ_CP008776.1_1068072_1069203_-	PRK08599, PRK08599, oxygen-independent coproporphyrinogen III oxidase	NA|214aa|down_8|NZ_CP008776.1_1069265_1069907_-	NA	NA|452aa|down_9|NZ_CP008776.1_1070040_1071396_-	PRK14316, glmM, phosphoglucosamine mutase; Provisional
GCF_001021955.1_ASM102195v1	NZ_CP008776	Streptococcus pyogenes strain 5448 chromosome, complete genome	5	1675307-1675440	5	CRISPRCasFinder	no		cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	Orphan	TGGTCTATCGCTAATTCAAGAGCTTTCTTTTTCTCTTCTAACTCTTTTTC	50	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,csa3	NA,NA|84aa|down_1|NZ_CP008776.1_1678288_1678540_-,NA|95aa|down_8|NZ_CP008776.1_1686035_1686320_-	NA|326aa|up_9|NZ_CP008776.1_1657726_1658704_+	COG0601, DppB, ABC-type dipeptide/oligopeptide/nickel transport systems, permease components [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|274aa|up_8|NZ_CP008776.1_1658700_1659522_+	COG1173, DppC, ABC-type dipeptide/oligopeptide/nickel transport systems, permease components [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|268aa|up_7|NZ_CP008776.1_1659533_1660337_+	COG0444, DppD, ABC-type dipeptide/oligopeptide/nickel transport system, ATPase component [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|209aa|up_6|NZ_CP008776.1_1660320_1660947_+	COG1124, DppF, ABC-type dipeptide/oligopeptide/nickel transport system, ATPase component [Amino acid transport and metabolism / Inorganic ion transport and metabolism]	NA|67aa|up_5|NZ_CP008776.1_1661027_1661228_-	COG3237, COG3237, Uncharacterized protein conserved in bacteria [Function unknown]	NA|826aa|up_4|NZ_CP008776.1_1661396_1663874_-	TIGR01363, pneumococcal_histidine_triad_A_protein, streptococcal histidine triad protein	NA|307aa|up_3|NZ_CP008776.1_1663886_1664807_-	cd01017, AdcA, Metal binding protein AdcA	NA|350aa|up_2|NZ_CP008776.1_1666357_1667407_-	TIGR01168, M_protein_serotype, Gram-positive signal peptide, YSIRK family	NA|1165aa|up_1|NZ_CP008776.1_1667503_1670998_-	cd07475, Peptidases_S8_C5a_Peptidase, Peptidase S8 family domain in Streptococcal C5a peptidases	NA|327aa|up_0|NZ_CP008776.1_1673215_1674196_-	pfam03482, SIC, sic protein repeat	NA|530aa|down_0|NZ_CP008776.1_1676023_1677613_-	pfam08270, PRD_Mga, M protein trans-acting positive regulator (MGA) PRD domain	NA|84aa|down_1|NZ_CP008776.1_1678288_1678540_-	NA	NA|534aa|down_2|NZ_CP008776.1_1678618_1680220_-	COG3942, COG3942, Surface antigen [General function prediction only]	NA|463aa|down_3|NZ_CP008776.1_1680321_1681710_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|218aa|down_4|NZ_CP008776.1_1681706_1682360_-	COG0745, OmpR, Response regulators consisting of a CheY-like receiver domain and a winged-helix DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|406aa|down_5|NZ_CP008776.1_1682453_1683671_-	PRK10535, PRK10535, macrolide ABC transporter ATP-binding protein/permease MacB	NA|225aa|down_6|NZ_CP008776.1_1683683_1684358_-	COG1136, SalX, ABC-type antimicrobial peptide transport system, ATPase component [Defense mechanisms]	NA|423aa|down_7|NZ_CP008776.1_1684344_1685613_-	COG0845, AcrA, Membrane-fusion protein [Cell envelope biogenesis, outer membrane]	NA|95aa|down_8|NZ_CP008776.1_1686035_1686320_-	NA	NA|99aa|down_9|NZ_CP008776.1_1686466_1686763_-	pfam14131, DUF4298, Domain of unknown function (DUF4298)
