assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_001712815.1_ASM171281v1	NZ_CP012047	Tetragenococcus halophilus strain MJ4, complete genome	1	421504-422835	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no	cas6,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csm6,cas1,cas2	RT,cas6,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csm6,cas1,cas2,cas3,cas5,cas8c,cas7,cas4,csa3,DEDDh,DinG,cas14j	Type III-B,Type III-A,Type III-C,Type III-D	AATAGATACCTAACCCCATTATTAGGGGACGAGAAC,AATAGATACCTAACCCCATTATTAGGGGACGAGAAC,AATAGATACCTAACCCCATNATTAGGGGACGAGAAC	36,36,36	0	0	NA	NA	NA:NA:NA	17,18,18	18	TypeIII-B,TypeIII-A,TypeIII-C,TypeIII-D	RT,cas6,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csm6,cas1,cas2,cas3,cas5,cas8c,cas7,cas4,csa3,DEDDh,DinG,cas14j	NA|106aa|up_7|NZ_CP012047.1_413420_413738_+,NA|78aa|down_9|NZ_CP012047.1_431999_432233_+	NA|550aa|up_9|NZ_CP012047.1_409515_411165_+	COG0433, COG0433,  HerA helicase [Replication, recombination, and repair]	NA|316aa|up_8|NZ_CP012047.1_411427_412375_+	smart00901, FRG, This domain contains a conserved N-terminal (F/Y)RG motif	NA|106aa|up_7|NZ_CP012047.1_413420_413738_+	NA	cas6|249aa|up_6|NZ_CP012047.1_414034_414781_+	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	cas10|763aa|up_5|NZ_CP012047.1_414773_417062_+	cd09680, Cas10_III, CRISPR/Cas system-associated protein Cas10	csm2gr11|143aa|up_4|NZ_CP012047.1_417070_417499_+	pfam03750, Csm2_III-A, Csm2 Type III-A	csm3gr7|225aa|up_3|NZ_CP012047.1_417510_418185_+	cd09684, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	csm4gr5|299aa|up_2|NZ_CP012047.1_418181_419078_+	pfam17953, Csm4_C, CRISPR Csm4 C-terminal domain	csm5gr7|338aa|up_1|NZ_CP012047.1_419095_420109_+	COG1332, COG1332, CRISPR system related protein, RAMP superfamily [Defense mechanisms]	csm6|418aa|up_0|NZ_CP012047.1_420104_421358_+	cd09699, Csm6_III-A, CRISPR/Cas system-associated protein Csm6	cas1|303aa|down_0|NZ_CP012047.1_422876_423785_+	cd09720, Cas1_II, CRISPR/Cas system-associated protein Cas1	cas2|102aa|down_1|NZ_CP012047.1_423785_424091_+	TIGR01573, cas2, CRISPR-associated endonuclease Cas2	NA|109aa|down_2|NZ_CP012047.1_424512_424839_-	smart00530, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|159aa|down_3|NZ_CP012047.1_425309_425786_+	cd00211, PTS_IIA_fru, PTS_IIA, PTS system, fructose/mannitol specific IIA subunit	NA|483aa|down_4|NZ_CP012047.1_426012_427461_-	pfam13610, DDE_Tnp_IS240, DDE domain	NA|554aa|down_5|NZ_CP012047.1_427798_429460_+	cd00211, PTS_IIA_fru, PTS_IIA, PTS system, fructose/mannitol specific IIA subunit	NA|128aa|down_6|NZ_CP012047.1_429566_429950_+	PRK12858, PRK12858, tagatose 1,6-diphosphate aldolase; Reviewed	NA|191aa|down_7|NZ_CP012047.1_430088_430661_+	cd05014, SIS_Kpsf, KpsF-like protein	NA|317aa|down_8|NZ_CP012047.1_430864_431815_+	COG2421, COG2421, Predicted acetamidase/formamidase [Energy production and conversion]	NA|78aa|down_9|NZ_CP012047.1_431999_432233_+	NA
GCF_001712815.1_ASM171281v1	NZ_CP012047	Tetragenococcus halophilus strain MJ4, complete genome	2	494575-495806	2,2,2	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	RT,cas6,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csm6,cas1,cas2,cas3,cas5,cas8c,cas7,cas4,csa3,DEDDh,DinG,cas14j	Type I-C,Type I-U, Type I-U?	GTCGCTCTCTTCATGAGAGCGTGGATTGAAAT,GTCGCTCTCTTCATGAGAGCGTGGATTGAAAT,GTCGCTCTCTTCATGAGAGCGTGGATTGAAAT	32,32,32	0	0	NA	NA	I-C:I-C:I-C	17,18,18	18	TypeI-C,TypeI-U,TypeI-U?	RT,cas6,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csm6,cas1,cas2,cas3,cas5,cas8c,cas7,cas4,csa3,DEDDh,DinG,cas14j	NA|83aa|up_7|NZ_CP012047.1_484124_484373_-,NA	NA|388aa|up_9|NZ_CP012047.1_480967_482131_+	COG2856, COG2856, Predicted Zn peptidase [Amino acid transport and metabolism]	NA|409aa|up_8|NZ_CP012047.1_482583_483810_+	cd17371, MFS_MucK, Cis,cis-muconate transport protein and similar proteins of the Major Facilitator Superfamily	NA|83aa|up_7|NZ_CP012047.1_484124_484373_-	NA	NA|184aa|up_6|NZ_CP012047.1_484842_485394_+	pfam13508, Acetyltransf_7, Acetyltransferase (GNAT) domain	NA|297aa|up_5|NZ_CP012047.1_485526_486417_-	pfam06800, Sugar_transport, Sugar transport protein	NA|132aa|up_4|NZ_CP012047.1_486447_486843_-	PRK11797, PRK11797, D-ribose pyranase; Provisional	NA|302aa|up_3|NZ_CP012047.1_486866_487772_-	TIGR02152, Putative_ribokinase, ribokinase	NA|348aa|up_2|NZ_CP012047.1_488123_489167_+	cd09019, galactose_mutarotase_like, galactose mutarotase_like	NA|471aa|up_1|NZ_CP012047.1_489635_491048_+	TIGR00711, Uncharacterized_MFS-type_transporter_YhcA, drug resistance transporter, EmrB/QacA subfamily	NA|201aa|up_0|NZ_CP012047.1_493234_493837_+	pfam04892, VanZ, VanZ like family	cas3|815aa|down_0|NZ_CP012047.1_496653_499098_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|241aa|down_1|NZ_CP012047.1_499428_500151_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|638aa|down_2|NZ_CP012047.1_500155_502069_+	TIGR01863, CRISPR-associated_protein_CT1133_family, CRISPR-associated protein Cas8c/Csd1, subtype I-C/DVULG	cas7|282aa|down_3|NZ_CP012047.1_502055_502901_+	cd09689, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	cas4|222aa|down_4|NZ_CP012047.1_502903_503569_+	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	cas1|343aa|down_5|NZ_CP012047.1_503578_504607_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	NA|417aa|down_6|NZ_CP012047.1_504745_505996_-	pfam02371, Transposase_20, Transposase IS116/IS110/IS902 family	cas2|98aa|down_7|NZ_CP012047.1_506469_506763_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|453aa|down_8|NZ_CP012047.1_508535_509894_+	pfam13546, DDE_5, DDE superfamily endonuclease	NA|238aa|down_9|NZ_CP012047.1_510541_511255_-	COG4279, COG4279, Uncharacterized conserved protein [Function unknown]
GCF_001712815.1_ASM171281v1	NZ_CP012047	Tetragenococcus halophilus strain MJ4, complete genome	3	506911-508281	3,3,3	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	RT,cas6,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csm6,cas1,cas2,cas3,cas5,cas8c,cas7,cas4,csa3,DEDDh,DinG,cas14j	Type I-C,Type I-U, Type I-U?	GTCGCTCTCTTCATGAGAGCGTGGATTGAAAT,GTCGCTCTCTTCATGAGAGCGTGGATTGAAAT,GTCGCTCTCTTCATGAGAGCGTGGATTGAAAT	32,32,32	0	0	NA	NA	I-C:I-C:I-C	19,20,20	20	TypeI-C,TypeI-U,TypeI-U?	RT,cas6,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csm6,cas1,cas2,cas3,cas5,cas8c,cas7,cas4,csa3,DEDDh,DinG,cas14j	NA,NA	NA|471aa|up_9|NZ_CP012047.1_489635_491048_+	TIGR00711, Uncharacterized_MFS-type_transporter_YhcA, drug resistance transporter, EmrB/QacA subfamily	NA|201aa|up_8|NZ_CP012047.1_493234_493837_+	pfam04892, VanZ, VanZ like family	cas3|815aa|up_7|NZ_CP012047.1_496653_499098_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|241aa|up_6|NZ_CP012047.1_499428_500151_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|638aa|up_5|NZ_CP012047.1_500155_502069_+	TIGR01863, CRISPR-associated_protein_CT1133_family, CRISPR-associated protein Cas8c/Csd1, subtype I-C/DVULG	cas7|282aa|up_4|NZ_CP012047.1_502055_502901_+	cd09689, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	cas4|222aa|up_3|NZ_CP012047.1_502903_503569_+	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	cas1|343aa|up_2|NZ_CP012047.1_503578_504607_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	NA|417aa|up_1|NZ_CP012047.1_504745_505996_-	pfam02371, Transposase_20, Transposase IS116/IS110/IS902 family	cas2|98aa|up_0|NZ_CP012047.1_506469_506763_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|453aa|down_0|NZ_CP012047.1_508535_509894_+	pfam13546, DDE_5, DDE superfamily endonuclease	NA|238aa|down_1|NZ_CP012047.1_510541_511255_-	COG4279, COG4279, Uncharacterized conserved protein [Function unknown]	NA|844aa|down_2|NZ_CP012047.1_511257_513789_-	COG0553, HepA, Superfamily II DNA/RNA helicases, SNF2 family [Transcription / DNA replication, recombination, and repair]	NA|325aa|down_3|NZ_CP012047.1_513979_514954_+	COG0042, COG0042, tRNA-dihydrouridine synthase [Translation, ribosomal structure and biogenesis]	NA|524aa|down_4|NZ_CP012047.1_515374_516946_+	pfam07905, PucR, Purine catabolism regulatory protein-like family	NA|423aa|down_5|NZ_CP012047.1_517080_518349_+	cd11484, SLC-NCS1sbd_CobB-like, nucleobase-cation-symport-1 (NCS1) transporter CobB-like; solute-binding domain	NA|365aa|down_6|NZ_CP012047.1_518383_519478_+	COG3535, COG3535, Uncharacterized conserved protein [Function unknown]	NA|522aa|down_7|NZ_CP012047.1_519477_521043_+	COG0145, HyuA, N-methylhydantoinase A/acetone carboxylase, beta subunit [Amino acid transport and metabolism / Secondary metabolites biosynthesis, transport, and catabolism]	NA|411aa|down_8|NZ_CP012047.1_521265_522498_-	pfam05552, TM_helix, Conserved TM helix	NA|567aa|down_9|NZ_CP012047.1_522576_524277_+	COG0021, TktA, Transketolase [Carbohydrate transport and metabolism]
GCF_001712815.1_ASM171281v1	NZ_CP012047	Tetragenococcus halophilus strain MJ4, complete genome	4	1969768-1969892	4	CRISPRCasFinder	no	cas14j	RT,cas6,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csm6,cas1,cas2,cas3,cas5,cas8c,cas7,cas4,csa3,DEDDh,DinG,cas14j	Unclear	TCTCTTAGCTCCCTTTGGTCGCTAAATCGCAGTGATTC	38	0	0	NA	NA	NA	1	1	TypeV	RT,cas6,cas10,csm2gr11,csm3gr7,csm4gr5,csm5gr7,csm6,cas1,cas2,cas3,cas5,cas8c,cas7,cas4,csa3,DEDDh,DinG,cas14j	NA|137aa|up_1|NZ_CP012047.1_1966822_1967233_-,NA|141aa|down_6|NZ_CP012047.1_1975742_1976165_-	NA|621aa|up_9|NZ_CP012047.1_1957707_1959570_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|580aa|up_8|NZ_CP012047.1_1959559_1961299_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|235aa|up_7|NZ_CP012047.1_1961527_1962232_-	cd01411, SIR2H, SIR2H: Uncharacterized prokaryotic Sir2 homologs from several gram positive bacterial species and Fusobacteria; and are members of the SIR2 family of proteins, silent information regulator 2 (Sir2) enzymes which catalyze NAD+-dependent protein/histone deacetylation	NA|158aa|up_6|NZ_CP012047.1_1962338_1962812_-	TIGR01994, Iron-sulfur_cluster_assembly_scaffold_protein_IscU, SUF system FeS assembly protein, NifU family	NA|412aa|up_5|NZ_CP012047.1_1962798_1964034_-	TIGR01979, Probable_cysteine_desulfurase, cysteine desulfurases, SufSfamily	NA|431aa|up_4|NZ_CP012047.1_1964030_1965323_-	COG0719, SufB, Cysteine desulfurase activator SufB [Posttranslational modification, protein turnover, chaperones]	NA|258aa|up_3|NZ_CP012047.1_1965337_1966111_-	COG0396, sufC, Cysteine desulfurase activator ATPase [Posttranslational modification, protein turnover, chaperones]	NA|153aa|up_2|NZ_CP012047.1_1966285_1966744_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|137aa|up_1|NZ_CP012047.1_1966822_1967233_-	NA	NA|716aa|up_0|NZ_CP012047.1_1967321_1969469_-	PRK11824, PRK11824, polynucleotide phosphorylase/polyadenylase; Provisional	NA|90aa|down_0|NZ_CP012047.1_1969942_1970212_-	PRK05626, rpsO, 30S ribosomal protein S15; Reviewed	NA|97aa|down_1|NZ_CP012047.1_1970471_1970762_+	cd00158, RHOD, Rhodanese Homology Domain (RHOD); an alpha beta fold domain found duplicated in the rhodanese protein	NA|392aa|down_2|NZ_CP012047.1_1970806_1971982_-	COG0628, yhhT, Predicted permease, member of the PurR regulon [General function prediction only]	NA|117aa|down_3|NZ_CP012047.1_1971997_1972348_-	pfam03829, PTSIIA_gutA, PTS system glucitol/sorbitol-specific IIA component	NA|340aa|down_4|NZ_CP012047.1_1972518_1973538_+	pfam10282, Lactonase, Lactonase, 7-bladed beta-propeller	NA|497aa|down_5|NZ_CP012047.1_1973862_1975353_-	COG0488, Uup, ATPase components of ABC transporters with duplicated ATPase domains [General function prediction only]	NA|141aa|down_6|NZ_CP012047.1_1975742_1976165_-	NA	NA|882aa|down_7|NZ_CP012047.1_1976584_1979230_+	cd02089, P-type_ATPase_Ca_prok, prokaryotic P-type Ca(2+)-ATPase similar to Synechococcus elongatus sp	NA|671aa|down_8|NZ_CP012047.1_1979435_1981448_-	PRK12267, PRK12267, methionyl-tRNA synthetase; Reviewed	NA|274aa|down_9|NZ_CP012047.1_1981979_1982801_+	COG1051, COG1051, ADP-ribose pyrophosphatase [Nucleotide transport and metabolism]
