assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_900474865.1_41906_D02	NZ_LS483329	Streptococcus pyogenes strain NCTC12058 chromosome 1	1	131524-131620	1	CRISPRCasFinder	no		cas3,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,DEDDh,csa3	Orphan	GCTAGATGGTGAAGAAGTCCCAGAA	25	0	0	NA	NA	NA	1	1	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,DEDDh,csa3	NA,NA|222aa|down_8|NZ_LS483329.1_144563_145229_-	NA|257aa|up_9|NZ_LS483329.1_121835_122606_-	PRK11880, PRK11880, pyrroline-5-carboxylate reductase; Reviewed	NA|356aa|up_8|NZ_LS483329.1_122653_123721_-	TIGR03107, Glutamyl_aminopeptidase, glutamyl aminopeptidase	NA|98aa|up_7|NZ_LS483329.1_124176_124470_+	pfam15513, DUF4651, Domain of unknown function (DUF4651)	NA|106aa|up_6|NZ_LS483329.1_124466_124784_+	cd02947, TRX_family, TRX family; composed of two groups: Group I, which includes proteins that exclusively encode a TRX domain; and Group II, which are composed of fusion proteins of TRX and additional domains	NA|209aa|up_5|NZ_LS483329.1_124801_125428_+	cd02796, tRNA_bind_bactPheRS, tRNA-binding-domain-containing prokaryotic phenylalanly tRNA synthetase (PheRS) beta chain	NA|132aa|up_4|NZ_LS483329.1_125579_125975_+	PRK07274, PRK07274, single-stranded DNA-binding protein; Provisional	NA|214aa|up_3|NZ_LS483329.1_126235_126877_-	COG1428, COG1428, Deoxynucleoside kinases [Nucleotide transport and metabolism]	NA|326aa|up_2|NZ_LS483329.1_126896_127874_-	TIGR00737, Probable_tRNA-dihydrouridine_synthase, putative TIM-barrel protein, nifR3 family	NA|291aa|up_1|NZ_LS483329.1_127860_128733_-	PRK00114, hslO, Hsp33 family molecular chaperone HslO	NA|498aa|up_0|NZ_LS483329.1_128879_130373_-	pfam08270, PRD_Mga, M protein trans-acting positive regulator (MGA) PRD domain	NA|283aa|down_0|NZ_LS483329.1_132747_133596_+	cd05827, Sortase_C, Sortase domain found in class C sortases	NA|748aa|down_1|NZ_LS483329.1_133881_136125_+	NF033396, pilus_ancill_1, pilus ancillary protein 1	NA|174aa|down_2|NZ_LS483329.1_136117_136639_+	TIGR02227, Inactive_signal_peptidase_IA	NA|352aa|down_3|NZ_LS483329.1_136660_137716_+	TIGR03065, srtB_sig_QVPTGV, sortase B signal domain, QVPTGV class	NA|242aa|down_4|NZ_LS483329.1_137731_138457_+	TIGR03064, sortase_srtB, sortase, SrtB family	NA|196aa|down_5|NZ_LS483329.1_138473_139061_+	TIGR03786, strep_pil_rpt, streptococcal pilin isopeptide linkage domain	NA|402aa|down_6|NZ_LS483329.1_139219_140425_-	TIGR04094, AraC_family_transcriptional_regulator, YSIRK-targeted surface antigen transcriptional regulator	NA|1163aa|down_7|NZ_LS483329.1_140809_144298_+	NF033395, fibronec_SfbI, fibronectin-binding protein SfbI	NA|222aa|down_8|NZ_LS483329.1_144563_145229_-	NA	NA|469aa|down_9|NZ_LS483329.1_145581_146988_+	COG2031, AtoE, Short chain fatty acids transporter [Lipid metabolism]
GCF_900474865.1_41906_D02	NZ_LS483329	Streptococcus pyogenes strain NCTC12058 chromosome 1	2	413761-413923	1	PILER-CR	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,DEDDh,csa3	 Type I-U?,Type I-C,Type I-U	GTCTCACCCTTCATGGGTGAGTGGATTGAAA	31	0	0	NA	NA	I-C	2	2	TypeI-U?,TypeI-C,TypeI-U	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,DEDDh,csa3	NA,NA	NA|132aa|up_9|NZ_LS483329.1_401229_401625_+	PRK07758, PRK07758, hypothetical protein; Provisional	NA|188aa|up_8|NZ_LS483329.1_402225_402789_+	pfam13238, AAA_18, AAA domain	NA|883aa|up_7|NZ_LS483329.1_402790_405439_+	PRK05729, valS, valyl-tRNA synthetase; Reviewed	cas3|803aa|up_6|NZ_LS483329.1_405592_408001_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|243aa|up_5|NZ_LS483329.1_408133_408862_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|632aa|up_4|NZ_LS483329.1_408861_410757_+	TIGR01863, CRISPR-associated_protein_CT1133_family, CRISPR-associated protein Cas8c/Csd1, subtype I-C/DVULG	cas7|283aa|up_3|NZ_LS483329.1_410761_411610_+	COG3649, COG3649, CRISPR system related protein [Defense mechanisms]	cas4|225aa|up_2|NZ_LS483329.1_411611_412286_+	COG1468, COG1468, CRISPR-associated protein Cas4 (RecB family exonuclease) [Defense    mechanisms]	cas1|342aa|up_1|NZ_LS483329.1_412282_413308_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas2|98aa|up_0|NZ_LS483329.1_413318_413612_+	COG1343, COG1343, CRISPR-associated protein Cas2 [Defense mechanisms]	NA|237aa|down_0|NZ_LS483329.1_414084_414795_+	COG0785, CcdA, Cytochrome c biogenesis protein [Posttranslational modification, protein turnover, chaperones]	NA|208aa|down_1|NZ_LS483329.1_414807_415431_+	cd02966, TlpA_like_family, TlpA-like family; composed of  TlpA, ResA, DsbE and similar proteins	NA|369aa|down_2|NZ_LS483329.1_415473_416580_+	PRK14018, PRK14018, bifunctional peptide-methionine (S)-S-oxide reductase MsrA/peptide-methionine (R)-S-oxide reductase MsrB	NA|245aa|down_3|NZ_LS483329.1_416667_417402_+	COG4753, COG4753, Response regulator containing CheY-like receiver domain and AraC-type DNA-binding domain [Signal transduction mechanisms]	NA|578aa|down_4|NZ_LS483329.1_417404_419138_+	COG2972, COG2972, Predicted signal transduction protein with a C-terminal ATPase domain [Signal transduction mechanisms]	NA|360aa|down_5|NZ_LS483329.1_419210_420290_+	COG2315, MmcQ, Uncharacterized protein conserved in bacteria [Function unknown]	NA|239aa|down_6|NZ_LS483329.1_420303_421020_+	COG3382, COG3382, Solo B3/4 domain (OB-fold DNA/RNA-binding) of Phe-aaRS-beta [General function prediction only]	NA|158aa|down_7|NZ_LS483329.1_421185_421659_-	COG1438, ArgR, Arginine repressor [Transcription]	NA|227aa|down_8|NZ_LS483329.1_421800_422481_+	COG0664, Crp, cAMP-binding proteins - catabolite gene activator and regulatory subunit of cAMP-dependent protein kinases [Signal transduction mechanisms]	NA|412aa|down_9|NZ_LS483329.1_422754_423990_+	PRK01388, PRK01388, arginine deiminase; Provisional
GCF_900474865.1_41906_D02	NZ_LS483329	Streptococcus pyogenes strain NCTC12058 chromosome 1	3	640958-641058	2	CRISPRCasFinder	no		cas3,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,DEDDh,csa3	Orphan	TATAATTAGACTATACCAATTTT	23	0	0	NA	NA	NA	1	1	Orphan	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,DEDDh,csa3	NA|262aa|up_6|NZ_LS483329.1_632341_633127_-,NA	NA|755aa|up_9|NZ_LS483329.1_627714_629979_+	cd04300, GT35_Glycogen_Phosphorylase, glycogen phosphorylase and similar proteins	NA|207aa|up_8|NZ_LS483329.1_630235_630856_-	pfam12978, DUF3862, Domain of Unknown Function with PDB structure (DUF3862)	NA|205aa|up_7|NZ_LS483329.1_631596_632211_+	COG0398, COG0398, Uncharacterized conserved protein [Function unknown]	NA|262aa|up_6|NZ_LS483329.1_632341_633127_-	NA	NA|233aa|up_5|NZ_LS483329.1_633136_633835_-	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|124aa|up_4|NZ_LS483329.1_633834_634206_-	COG1725, COG1725, Predicted transcriptional regulators [Transcription]	NA|1037aa|up_3|NZ_LS483329.1_634390_637501_+	PRK07279, dnaE, DNA polymerase III DnaE; Reviewed	NA|338aa|up_2|NZ_LS483329.1_637580_638594_+	PRK03202, PRK03202, ATP-dependent 6-phosphofructokinase	NA|501aa|up_1|NZ_LS483329.1_638656_640159_+	PRK05826, PRK05826, pyruvate kinase; Provisional	NA|186aa|up_0|NZ_LS483329.1_640376_640934_+	TIGR02227, Inactive_signal_peptidase_IA	NA|605aa|down_0|NZ_LS483329.1_641109_642924_+	PRK00331, PRK00331, isomerizing glutamine--fructose-6-phosphate transaminase	NA|112aa|down_1|NZ_LS483329.1_643119_643455_+	COG2824, PhnA, Uncharacterized Zn-ribbon-containing protein involved in phosphonate metabolism [Inorganic ion transport and metabolism]	NA|214aa|down_2|NZ_LS483329.1_643561_644203_+	COG0765, HisM, ABC-type amino acid transport system, permease component [Amino acid transport and metabolism]	NA|210aa|down_3|NZ_LS483329.1_644212_644842_+	COG1126, GlnQ, ABC-type polar amino acid transport system, ATPase component [Amino acid transport and metabolism]	NA|279aa|down_4|NZ_LS483329.1_644857_645694_+	cd00996, PBP2_AatB_like, Polar amino acids-binding domain of ATP-binding cassette transporter-like systems that belong to the type 2 periplasmic binding fold protein superfamily	NA|258aa|down_5|NZ_LS483329.1_646062_646836_+	pfam07373, CAMP_factor, CAMP factor (Cfa)	NA|418aa|down_6|NZ_LS483329.1_647185_648439_-	COG0053, MMT1, Predicted Co/Zn/Cd cation transporters [Inorganic ion transport and metabolism]	NA|441aa|down_7|NZ_LS483329.1_648558_649881_-	COG1115, AlsT, Na+/alanine symporter [Amino acid transport and metabolism]	NA|773aa|down_8|NZ_LS483329.1_650410_652729_+	TIGR01073, ATP-dependent_DNA_helicase_PcrA, ATP-dependent DNA helicase PcrA	NA|83aa|down_9|NZ_LS483329.1_653091_653340_+	COG2261, COG2261, Predicted membrane protein [Function unknown]
GCF_900474865.1_41906_D02	NZ_LS483329	Streptococcus pyogenes strain NCTC12058 chromosome 1	4	821266-821829	3,1,2	CRISPRCasFinder,CRT,PILER-CR	no	csn2,cas2,cas1,cas9	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,DEDDh,csa3	Type II-C,Type II-A,Type II-B	GTTTTGGGACCATTCAAAACAGCATAGCTCTAAAAC,GTTTTGGGACCATTCAAAACAGCATAGCTCTAAAAC,GTTTTGGGACCATTCAAAACAGCATAGCTCTAAAAC	36,36,36	0	0	NA	NA	II-A:II-A:II-A	8,8,7	8	TypeII-C,TypeII-A,TypeII-B	cas3,cas5,cas8c,cas7,cas4,cas1,cas2,csn2,cas9,csm6,DinG,DEDDh,csa3	NA,NA|214aa|down_8|NZ_LS483329.1_831725_832367_-	NA|263aa|up_9|NZ_LS483329.1_810185_810974_-	COG4753, COG4753, Response regulator containing CheY-like receiver domain and AraC-type DNA-binding domain [Signal transduction mechanisms]	NA|550aa|up_8|NZ_LS483329.1_810977_812627_-	COG2972, COG2972, Predicted signal transduction protein with a C-terminal ATPase domain [Signal transduction mechanisms]	NA|276aa|up_7|NZ_LS483329.1_812762_813590_-	COG3716, ManZ, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IID [Carbohydrate transport and metabolism]	NA|270aa|up_6|NZ_LS483329.1_813586_814396_-	COG3715, ManY, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IIC [Carbohydrate transport and metabolism]	NA|164aa|up_5|NZ_LS483329.1_814412_814904_-	COG3444, COG3444, Phosphotransferase system, mannose/fructose/N-acetylgalactosamine-specific component IIB [Carbohydrate transport and metabolism]	NA|142aa|up_4|NZ_LS483329.1_814922_815348_-	COG2893, ManX, Phosphotransferase system, mannose/fructose-specific component IIA [Carbohydrate transport and metabolism]	NA|340aa|up_3|NZ_LS483329.1_815554_816574_-	COG2855, COG2855, Predicted membrane protein [Function unknown]	NA|146aa|up_2|NZ_LS483329.1_816703_817141_-	PRK00222, PRK00222, peptide-methionine (R)-S-oxide reductase MsrB	NA|427aa|up_1|NZ_LS483329.1_817326_818607_-	PRK12678, PRK12678, transcription termination factor Rho; Provisional	NA|611aa|up_0|NZ_LS483329.1_818791_820624_-	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	csn2|221aa|down_0|NZ_LS483329.1_821931_822594_-	cd09758, Csn2, CRISPR/Cas system-associated protein Csn2	cas2|114aa|down_1|NZ_LS483329.1_822583_822925_-	COG3512, COG3512, CRISPR-associated protein, Cas2 homolog [Defense mechanisms]	cas1|290aa|down_2|NZ_LS483329.1_822921_823791_-	cd09720, Cas1_II, CRISPR/Cas system-associated protein Cas1	cas9|1369aa|down_3|NZ_LS483329.1_823790_827897_-	COG3513, COG3513, Predicted CRISPR-associated nuclease, contains McrA/HNH-nuclease and RuvC-like nuclease domain [Defense mechanisms]	NA|211aa|down_4|NZ_LS483329.1_828374_829007_-	COG4478, COG4478, Predicted membrane protein [Function unknown]	NA|255aa|down_5|NZ_LS483329.1_829006_829771_-	cd07530, HAD_Pase_UmpH-like, UmpH/NagD family phosphatase, similar to Escherichia coli UmpH UMP phosphatase/NagD nucleotide phosphatase and Mycobacterium tuberculosis Rv1692 glycerol 3-phosphate phosphatase	NA|251aa|down_6|NZ_LS483329.1_829770_830523_-	COG3884, FatA, Acyl-ACP thioesterase [Lipid metabolism]	NA|377aa|down_7|NZ_LS483329.1_830532_831663_-	PRK08599, PRK08599, oxygen-independent coproporphyrinogen III oxidase	NA|214aa|down_8|NZ_LS483329.1_831725_832367_-	NA	NA|452aa|down_9|NZ_LS483329.1_832490_833846_-	PRK14316, glmM, phosphoglucosamine mutase; Provisional
