assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCA_003814325.1_ASM381432v1	CP031018	Lactobacillus helveticus isolate NWC_2_4 chromosome, complete genome	1	608918-610494	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas14k	cas14j,cas3,csa3,cas2,cas14k,cas5,cas8c,cas7,cas4,cas1,DEDDh,DinG,Cas14u_CAS-V,c2c9_V-U4	Type I-C, Type I-U?,Type I-U	GTCGCACTCCTTGTGAGTGCGTGGATTGAAAT,GTCGCACTCCTTGTGAGTGCGTGGATTGAAAT,GTCGCACTCCTTGTGAGTGCGTGGATTGAAAT	32,32,32	0	0	NA	NA	I-C:I-C:I-C	22,22,23	23	TypeI-C,TypeI-U?,TypeV,TypeI-U	cas14j,cas3,csa3,cas2,cas14k,cas5,cas8c,cas7,cas4,cas1,DEDDh,DinG,Cas14u_CAS-V,c2c9_V-U4	NA,NA|177aa|down_8|CP031018.1_622356_622887_+	NA|422aa|up_9|CP031018.1_592511_593777_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|393aa|up_8|CP031018.1_596418_597597_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|567aa|up_7|CP031018.1_597898_599599_+	COG3666, COG3666, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|286aa|up_6|CP031018.1_599630_600488_-	pfam13612, DDE_Tnp_1_3, Transposase DDE domain	cas3|845aa|up_5|CP031018.1_600649_603184_+	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	cas5|248aa|up_4|CP031018.1_603198_603942_+	TIGR01876, cas_Cas5d, CRISPR-associated protein Cas5, subtype I-C/DVULG	cas8c|658aa|up_3|CP031018.1_603941_605915_+	pfam09709, Cas_Csd1, CRISPR-associated protein (Cas_Csd1)	cas7|284aa|up_2|CP031018.1_605917_606769_+	cd09689, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	cas4|219aa|up_1|CP031018.1_606771_607428_+	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	cas1|344aa|up_0|CP031018.1_607424_608456_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	NA|888aa|down_0|CP031018.1_611092_613756_+	PRK05755, PRK05755, DNA polymerase I; Provisional	NA|277aa|down_1|CP031018.1_613764_614595_+	PRK01103, PRK01103, bifunctional DNA-formamidopyrimidine glycosylase/DNA-(apurinic or apyrimidinic site) lyase	NA|201aa|down_2|CP031018.1_614591_615194_+	PRK00081, coaE, dephospho-CoA kinase; Reviewed	NA|156aa|down_3|CP031018.1_615196_615664_+	PRK00464, nrdR, transcriptional repressor NrdR	NA|444aa|down_4|CP031018.1_615666_616998_+	COG3611, DnaB, Replication initiation/membrane attachment protein [DNA replication, recombination, and repair]	NA|303aa|down_5|CP031018.1_617029_617938_+	PRK08939, PRK08939, primosomal protein DnaI; Reviewed	NA|645aa|down_6|CP031018.1_618228_620163_+	PRK00413, thrS, threonyl-tRNA synthetase; Reviewed	NA|393aa|down_7|CP031018.1_620438_621617_+	pfam00872, Transposase_mut, Transposase, Mutator family	NA|177aa|down_8|CP031018.1_622356_622887_+	NA	NA|203aa|down_9|CP031018.1_623077_623686_+	cd03769, SR_IS607_transposase_like, Serine Recombinase (SR) family, IS607-like transposase subfamily, catalytic domain; members contain a DNA binding domain with homology to MerR/SoxR located N-terminal to the catalytic domain
GCA_003814325.1_ASM381432v1	CP031018	Lactobacillus helveticus isolate NWC_2_4 chromosome, complete genome	2	738782-738872	2	CRISPRCasFinder	no		cas14j,cas3,csa3,cas2,cas14k,cas5,cas8c,cas7,cas4,cas1,DEDDh,DinG,Cas14u_CAS-V,c2c9_V-U4	Orphan	GTATTCTCCACGTATGTGGAGGTGATCCTA	30	0	0	NA	NA	I-B,III-A,III-B	1	1	Orphan	cas14j,cas3,csa3,cas2,cas14k,cas5,cas8c,cas7,cas4,cas1,DEDDh,DinG,Cas14u_CAS-V,c2c9_V-U4	NA|205aa|up_5|CP031018.1_729979_730594_+,NA|79aa|up_1|CP031018.1_736136_736373_-,NA|99aa|down_5|CP031018.1_745264_745561_+	NA|420aa|up_9|CP031018.1_722253_723513_-	COG3464, COG3464, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|1071aa|up_8|CP031018.1_723775_726988_+	PRK11448, hsdR, type I restriction enzyme EcoKI subunit R; Provisional	NA|485aa|up_7|CP031018.1_727008_728463_+	pfam02384, N6_Mtase, N-6 DNA Methylase	NA|481aa|up_6|CP031018.1_728449_729892_+	cd17246, RMtype1_S_SonII-TRD2-CR2_like, Type I restriction-modification system specificity (S) subunit Target Recognition Domain-ConseRved domain (TRD-CR), similar to Shewanella oneidensis MR-1 S subunit (S	NA|205aa|up_5|CP031018.1_729979_730594_+	NA	NA|415aa|up_4|CP031018.1_730676_731921_+	pfam13020, DUF3883, Domain of unknown function (DUF3883)	NA|395aa|up_3|CP031018.1_732160_733345_+	pfam03217, SLAP, SLAP domain	NA|422aa|up_2|CP031018.1_733616_734882_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|79aa|up_1|CP031018.1_736136_736373_-	NA	NA|324aa|up_0|CP031018.1_736483_737455_-	COG4990, COG4990, Uncharacterized protein conserved in bacteria [Function unknown]	NA|393aa|down_0|CP031018.1_739308_740487_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|109aa|down_1|CP031018.1_741238_741565_-	COG2151, PaaD, Predicted metal-sulfur cluster biosynthetic enzyme [General function prediction only]	NA|295aa|down_2|CP031018.1_741566_742451_-	TIGR00718, Probable_L-serine_dehydratase_alpha_chain, L-serine dehydratase, iron-sulfur-dependent, alpha subunit	NA|221aa|down_3|CP031018.1_742465_743128_-	TIGR00719, Probable_L-serine_dehydratase_beta_chain, L-serine dehydratase, iron-sulfur-dependent, beta subunit	NA|469aa|down_4|CP031018.1_743481_744888_-	pfam06782, UPF0236, Uncharacterized protein family (UPF0236)	NA|99aa|down_5|CP031018.1_745264_745561_+	NA	NA|412aa|down_6|CP031018.1_745695_746931_+	cd17355, MFS_YcxA_like, MFS-type transporter YcxA and similar proteins of the Major Facilitator Superfamily of transporters	NA|875aa|down_7|CP031018.1_746987_749612_-	cd02089, P-type_ATPase_Ca_prok, prokaryotic P-type Ca(2+)-ATPase similar to Synechococcus elongatus sp	NA|128aa|down_8|CP031018.1_750774_751158_-	COG4603, COG4603, ABC-type uncharacterized transport system, permease component [General function prediction only]	NA|93aa|down_9|CP031018.1_751541_751820_+	TIGR02384, Putative_antitoxin_RelB, addiction module antitoxin, RelB/DinJ family
GCA_003814325.1_ASM381432v1	CP031018	Lactobacillus helveticus isolate NWC_2_4 chromosome, complete genome	3	789148-789252	3	CRISPRCasFinder	no		cas14j,cas3,csa3,cas2,cas14k,cas5,cas8c,cas7,cas4,cas1,DEDDh,DinG,Cas14u_CAS-V,c2c9_V-U4	Orphan	GTTGTTGTTGATGTTGGTATGAATCATGTTGATGG	35	0	0	NA	NA	NA	1	1	Orphan	cas14j,cas3,csa3,cas2,cas14k,cas5,cas8c,cas7,cas4,cas1,DEDDh,DinG,Cas14u_CAS-V,c2c9_V-U4	NA,NA	NA|342aa|up_9|CP031018.1_780227_781253_-	PRK13357, PRK13357, branched-chain amino acid aminotransferase; Provisional	NA|456aa|up_8|CP031018.1_781391_782759_+	pfam10087, DUF2325, Uncharacterized protein conserved in bacteria (DUF2325)	NA|104aa|up_7|CP031018.1_782925_783237_+	PRK05573, rplU, 50S ribosomal protein L21; Validated	NA|97aa|up_6|CP031018.1_783255_783546_+	PRK05435, rpmA, 50S ribosomal protein L27; Validated	NA|370aa|up_5|CP031018.1_783655_784765_+	cd01092, APP-like, Similar to Prolidase and Aminopeptidase P	NA|190aa|up_4|CP031018.1_784848_785418_+	PRK00529, PRK00529, elongation factor P; Validated	NA|142aa|up_3|CP031018.1_785435_785861_+	pfam03780, Asp23, Asp23 family, cell envelope-related function	NA|131aa|up_2|CP031018.1_785868_786261_+	TIGR01951, nusB, transcription antitermination factor NusB	NA|283aa|up_1|CP031018.1_786319_787168_+	PRK14190, PRK14190, bifunctional 5,10-methylene-tetrahydrofolate dehydrogenase/ 5,10-methylene-tetrahydrofolate cyclohydrolase; Provisional	NA|350aa|up_0|CP031018.1_787305_788355_+	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|448aa|down_0|CP031018.1_789386_790730_+	PRK00286, xseA, exodeoxyribonuclease VII large subunit; Reviewed	NA|81aa|down_1|CP031018.1_790732_790975_+	PRK00977, PRK00977, exodeoxyribonuclease VII small subunit; Provisional	NA|290aa|down_2|CP031018.1_790977_791847_+	COG0142, IspA, Geranylgeranyl pyrophosphate synthase [Coenzyme metabolism]	NA|271aa|down_3|CP031018.1_791847_792660_+	COG1189, COG1189, Predicted rRNA methylase [Translation, ribosomal structure and biogenesis]	NA|561aa|down_4|CP031018.1_792670_794353_+	COG0497, RecN, ATPase involved in DNA repair [DNA replication, recombination, and repair]	NA|469aa|down_5|CP031018.1_798266_799673_+	pfam06782, UPF0236, Uncharacterized protein family (UPF0236)	NA|205aa|down_6|CP031018.1_799805_800420_+	PRK00300, gmk, guanylate kinase; Provisional	NA|75aa|down_7|CP031018.1_800422_800647_+	PRK00392, rpoZ, DNA-directed RNA polymerase subunit omega; Reviewed	NA|800aa|down_8|CP031018.1_800697_803097_+	PRK05580, PRK05580, primosome assembly protein PriA; Validated	NA|315aa|down_9|CP031018.1_803110_804055_+	PRK00005, fmt, methionyl-tRNA formyltransferase; Reviewed
GCA_003814325.1_ASM381432v1	CP031018	Lactobacillus helveticus isolate NWC_2_4 chromosome, complete genome	4	1656865-1657004	4	CRISPRCasFinder	no	cas14j	cas14j,cas3,csa3,cas2,cas14k,cas5,cas8c,cas7,cas4,cas1,DEDDh,DinG,Cas14u_CAS-V,c2c9_V-U4	Unclear	AAATTAATTTAAGGAATCATTCATCCTTACACAAACTATTTTACGGTCTCA	51	1	2	1656916-1656953|1656916-1656953	CP031018.1_1876506-1876469|CP031018.1_1880855-1880892	NA	1	1	TypeV	cas14j,cas3,csa3,cas2,cas14k,cas5,cas8c,cas7,cas4,cas1,DEDDh,DinG,Cas14u_CAS-V,c2c9_V-U4	NA,NA|224aa|down_5|CP031018.1_1663300_1663972_-	NA|448aa|up_9|CP031018.1_1644446_1645790_+	PRK05313, PRK05313, hypothetical protein; Provisional	NA|434aa|up_8|CP031018.1_1645938_1647240_+	cd14748, PBP2_UgpB, The periplasmic-binding component of ABC transport system specific for sn-glycerol-3-phosphate; possesses type 2 periplasmic binding fold	NA|399aa|up_7|CP031018.1_1647523_1648720_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|437aa|up_6|CP031018.1_1648803_1650114_+	COG3464, COG3464, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	cas14j|418aa|up_5|CP031018.1_1650810_1652064_-	COG0675, COG0675, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|218aa|up_4|CP031018.1_1652576_1653230_-	COG0765, HisM, ABC-type amino acid transport system, permease component [Amino acid transport and metabolism]	NA|214aa|up_3|CP031018.1_1653244_1653886_-	COG0765, HisM, ABC-type amino acid transport system, permease component [Amino acid transport and metabolism]	NA|273aa|up_2|CP031018.1_1653885_1654704_-	cd01000, PBP2_Cys_DEBP_like, Substrate-binding domain of cysteine- and aspartate/glutamate-binding proteins; the type 2 periplasmic-binding protein fold	NA|247aa|up_1|CP031018.1_1654714_1655455_-	COG1126, GlnQ, ABC-type polar amino acid transport system, ATPase component [Amino acid transport and metabolism]	NA|393aa|up_0|CP031018.1_1655605_1656784_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|590aa|down_0|CP031018.1_1657674_1659444_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|577aa|down_1|CP031018.1_1659443_1661174_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|154aa|down_2|CP031018.1_1661152_1661614_-	pfam12802, MarR_2, MarR family	NA|273aa|down_3|CP031018.1_1661758_1662577_+	cd13689, PBP2_BsGlnH, Substrate binding domain of ABC glutamine transporter from Bacillus subtilis; the type 2 periplasmic-bindig protein fold	NA|223aa|down_4|CP031018.1_1662619_1663288_-	cd01741, GATase1_1, Subgroup of proteins having the Type 1 glutamine amidotransferase (GATase1) domain	NA|224aa|down_5|CP031018.1_1663300_1663972_-	NA	NA|541aa|down_6|CP031018.1_1664248_1665871_-	PRK15064, PRK15064, ABC transporter ATP-binding protein; Provisional	NA|361aa|down_7|CP031018.1_1665975_1667058_-	cd05656, M42_Frv, M42 Peptidase, endoglucanases	NA|469aa|down_8|CP031018.1_1667195_1668602_-	pfam06782, UPF0236, Uncharacterized protein family (UPF0236)	NA|402aa|down_9|CP031018.1_1668791_1669997_+	cd17391, MFS_MdtG_MDR_like, Multidrug resistance protein MdtG and similar multidrug resistance (MDR) transporters of the Major Facilitator Superfamily
GCA_003814325.1_ASM381432v1	CP031018	Lactobacillus helveticus isolate NWC_2_4 chromosome, complete genome	5	1678476-1678655	2	PILER-CR	no	cas14j	cas14j,cas3,csa3,cas2,cas14k,cas5,cas8c,cas7,cas4,cas1,DEDDh,DinG,Cas14u_CAS-V,c2c9_V-U4	Unclear	ATGTGGGATTTGAACCCACGC	21	0	0	NA	NA	NA	2	2	TypeV	cas14j,cas3,csa3,cas2,cas14k,cas5,cas8c,cas7,cas4,cas1,DEDDh,DinG,Cas14u_CAS-V,c2c9_V-U4	NA|60aa|up_3|CP031018.1_1673152_1673332_-,NA|143aa|down_3|CP031018.1_1684510_1684939_-	NA|541aa|up_9|CP031018.1_1664248_1665871_-	PRK15064, PRK15064, ABC transporter ATP-binding protein; Provisional	NA|361aa|up_8|CP031018.1_1665975_1667058_-	cd05656, M42_Frv, M42 Peptidase, endoglucanases	NA|469aa|up_7|CP031018.1_1667195_1668602_-	pfam06782, UPF0236, Uncharacterized protein family (UPF0236)	NA|402aa|up_6|CP031018.1_1668791_1669997_+	cd17391, MFS_MdtG_MDR_like, Multidrug resistance protein MdtG and similar multidrug resistance (MDR) transporters of the Major Facilitator Superfamily	NA|490aa|up_5|CP031018.1_1670020_1671490_-	cd17502, MFS_Azr1_MDR_like, Saccharomyces cerevisiae Azole resistance protein 1 (Azr1p), and similar multidrug resistance (MDR) transporters of the Major Facilitator Superfamily	NA|469aa|up_4|CP031018.1_1671723_1673130_+	pfam06782, UPF0236, Uncharacterized protein family (UPF0236)	NA|60aa|up_3|CP031018.1_1673152_1673332_-	NA	NA|177aa|up_2|CP031018.1_1673387_1673918_+	PRK05205, PRK05205, bifunctional pyr operon transcriptional regulator/uracil phosphoribosyltransferase PyrR	NA|443aa|up_1|CP031018.1_1673930_1675259_+	PRK10720, PRK10720, uracil transporter; Provisional	cas14j|410aa|up_0|CP031018.1_1676181_1677411_-	COG0675, COG0675, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|203aa|down_0|CP031018.1_1680410_1681019_-	cd03769, SR_IS607_transposase_like, Serine Recombinase (SR) family, IS607-like transposase subfamily, catalytic domain; members contain a DNA binding domain with homology to MerR/SoxR located N-terminal to the catalytic domain	NA|167aa|down_1|CP031018.1_1681121_1681622_-	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|469aa|down_2|CP031018.1_1681832_1683239_-	pfam06782, UPF0236, Uncharacterized protein family (UPF0236)	NA|143aa|down_3|CP031018.1_1684510_1684939_-	NA	NA|67aa|down_4|CP031018.1_1685147_1685348_+	COG1278, CspC, Cold shock proteins [Transcription]	NA|319aa|down_5|CP031018.1_1686702_1687659_+	COG2826, Tra8, Transposase and inactivated derivatives, IS30 family [DNA replication, recombination, and repair]	NA|186aa|down_6|CP031018.1_1687776_1688334_-	pfam07563, DUF1541, Protein of unknown function (DUF1541)	NA|75aa|down_7|CP031018.1_1688515_1688740_-	pfam04024, PspC, PspC domain	NA|393aa|down_8|CP031018.1_1688762_1689941_-	pfam00872, Transposase_mut, Transposase, Mutator family	NA|116aa|down_9|CP031018.1_1690190_1690538_-	COG1695, COG1695, Predicted transcriptional regulators [Transcription]
