assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000710375.2_ASM71037v3	NZ_CP036539	Bacteroides fragilis strain DCMOUH0017B chromosome, complete genome	1	3765743-3765909	1	CRISPRCasFinder	no		cas3,PrimPol,PD-DExK,RT,DEDDh,cas2,cas1,cas4,cas7,WYL	Orphan	TTTTTCTTTGTCGGGGTAGCGGGATTCGAACCCACGACCCCCAGCTCCCAAAGC	54	0	0	NA	NA	NA	1	1	Orphan	cas3,PrimPol,PD-DExK,RT,DEDDh,cas2,cas1,cas4,cas7,WYL,c2c9_V-U4,Cas14u_CAS-V	NA|225aa|up_9|NZ_CP036539.1_3751843_3752518_+,NA|701aa|up_7|NZ_CP036539.1_3756671_3758774_+,NA|74aa|up_6|NZ_CP036539.1_3758818_3759040_+,NA|398aa|up_5|NZ_CP036539.1_3759036_3760230_+,NA|145aa|up_2|NZ_CP036539.1_3761784_3762219_+,NA|113aa|up_1|NZ_CP036539.1_3762832_3763171_+,NA|73aa|down_0|NZ_CP036539.1_3766150_3766369_-,NA|61aa|down_1|NZ_CP036539.1_3766459_3766642_-,NA|58aa|down_4|NZ_CP036539.1_3767922_3768096_+	NA|225aa|up_9|NZ_CP036539.1_3751843_3752518_+	NA	NA|1374aa|up_8|NZ_CP036539.1_3752539_3756661_+	COG1196, Smc, Chromosome segregation ATPases [Cell division and chromosome partitioning]	NA|701aa|up_7|NZ_CP036539.1_3756671_3758774_+	NA	NA|74aa|up_6|NZ_CP036539.1_3758818_3759040_+	NA	NA|398aa|up_5|NZ_CP036539.1_3759036_3760230_+	NA	NA|209aa|up_4|NZ_CP036539.1_3760327_3760954_+	cd14948, BACON, Bacteroidetes-Associated Carbohydrate-binding (putative) Often N-terminal (BACON) domain	NA|208aa|up_3|NZ_CP036539.1_3761006_3761630_-	cd14948, BACON, Bacteroidetes-Associated Carbohydrate-binding (putative) Often N-terminal (BACON) domain	NA|145aa|up_2|NZ_CP036539.1_3761784_3762219_+	NA	NA|113aa|up_1|NZ_CP036539.1_3762832_3763171_+	NA	NA|415aa|up_0|NZ_CP036539.1_3764342_3765587_-	cd01185, INTN1_C_like, Integrase IntN1 of Bacteroides mobilizable transposon NBU1 and similar proteins, C-terminal catalytic domain	NA|73aa|down_0|NZ_CP036539.1_3766150_3766369_-	NA	NA|61aa|down_1|NZ_CP036539.1_3766459_3766642_-	NA	NA|317aa|down_2|NZ_CP036539.1_3766553_3767504_+	pfam13149, Mfa_like_1, Fimbrillin-like	NA|114aa|down_3|NZ_CP036539.1_3767512_3767854_+	pfam07784, DUF1622, Protein of unknown function (DUF1622)	NA|58aa|down_4|NZ_CP036539.1_3767922_3768096_+	NA	NA|426aa|down_5|NZ_CP036539.1_3768102_3769380_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|455aa|down_6|NZ_CP036539.1_3769376_3770741_-	COG2204, AtoC, Response regulator containing CheY-like receiver, AAA-type ATPase, and DNA-binding domains [Signal transduction mechanisms]	NA|491aa|down_7|NZ_CP036539.1_3771058_3772531_+	COG1538, TolC, Outer membrane protein [Cell envelope biogenesis, outer membrane / Intracellular trafficking and secretion]	NA|417aa|down_8|NZ_CP036539.1_3772571_3773822_+	TIGR01730, COG0845:_Membrane-fusion_protein, RND family efflux transporter, MFP subunit	NA|811aa|down_9|NZ_CP036539.1_3773947_3776380_+	pfam12704, MacB_PCD, MacB-like periplasmic core domain
GCF_000710375.2_ASM71037v3	NZ_CP036539	Bacteroides fragilis strain DCMOUH0017B chromosome, complete genome	2	3960527-3960604	2	CRISPRCasFinder	no		cas3,PrimPol,PD-DExK,RT,DEDDh,cas2,cas1,cas4,cas7,WYL	Orphan	GGACACAGAGATTAATTGGCTGC	23	0	0	NA	NA	NA	1	1	Orphan	cas3,PrimPol,PD-DExK,RT,DEDDh,cas2,cas1,cas4,cas7,WYL,c2c9_V-U4,Cas14u_CAS-V	NA|125aa|up_4|NZ_CP036539.1_3953528_3953903_-,NA|125aa|up_2|NZ_CP036539.1_3955447_3955822_+,NA|207aa|down_1|NZ_CP036539.1_3961490_3962111_+	NA|518aa|up_9|NZ_CP036539.1_3947123_3948677_-	pfam15495, Fimbrillin_C, Major fimbrial subunit protein type IV, Fimbrillin, C-terminal	NA|351aa|up_8|NZ_CP036539.1_3948663_3949716_-	pfam08842, Mfa2, Fimbrillin-A associated anchor proteins Mfa1 and Mfa2	NA|552aa|up_7|NZ_CP036539.1_3949846_3951502_-	pfam15495, Fimbrillin_C, Major fimbrial subunit protein type IV, Fimbrillin, C-terminal	NA|467aa|up_6|NZ_CP036539.1_3951526_3952927_-	cd07185, OmpA_C-like, Peptidoglycan binding domains similar to the C-terminal domain of outer-membrane protein OmpA	NA|186aa|up_5|NZ_CP036539.1_3952935_3953493_-	pfam12099, DUF3575, Protein of unknown function (DUF3575)	NA|125aa|up_4|NZ_CP036539.1_3953528_3953903_-	NA	NA|335aa|up_3|NZ_CP036539.1_3954293_3955298_-	cd01185, INTN1_C_like, Integrase IntN1 of Bacteroides mobilizable transposon NBU1 and similar proteins, C-terminal catalytic domain	NA|125aa|up_2|NZ_CP036539.1_3955447_3955822_+	NA	NA|526aa|up_1|NZ_CP036539.1_3955897_3957475_-	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|403aa|up_0|NZ_CP036539.1_3959232_3960441_-	COG5026, COG5026, Hexokinase [Carbohydrate transport and metabolism]	NA|104aa|down_0|NZ_CP036539.1_3960824_3961136_+	pfam14053, DUF4248, Domain of unknown function (DUF4248)	NA|207aa|down_1|NZ_CP036539.1_3961490_3962111_+	NA	NA|455aa|down_2|NZ_CP036539.1_3962240_3963605_+	TIGR00665, DnaB, replicative DNA helicase	NA|160aa|down_3|NZ_CP036539.1_3963734_3964214_+	pfam18291, HU-HIG, HU domain fused to wHTH, Ig, or Glycine-rich motif	NA|148aa|down_4|NZ_CP036539.1_3964432_3964876_+	PHA00447, PHA00447, lysozyme	NA|380aa|down_5|NZ_CP036539.1_3965844_3966984_-	cd06829, PLPDE_III_CANSDC, Type III Pyridoxal 5-phosphate (PLP)-Dependent Enzyme Carboxynorspermidine Decarboxylase	NA|787aa|down_6|NZ_CP036539.1_3967102_3969463_-	TIGR01073, ATP-dependent_DNA_helicase_PcrA, ATP-dependent DNA helicase PcrA	NA|206aa|down_7|NZ_CP036539.1_3969584_3970202_+	COG0605, SodA, Superoxide dismutase [Inorganic ion transport and metabolism]	NA|66aa|down_8|NZ_CP036539.1_3970542_3970740_+	cd00565, Ubl_ThiS, ubiquitin-like (Ubl) domain found in sulfur carrier protein ThiS	NA|205aa|down_9|NZ_CP036539.1_3970743_3971358_+	PRK00043, thiE, thiamine phosphate synthase
GCF_000710375.2_ASM71037v3	NZ_CP036539	Bacteroides fragilis strain DCMOUH0017B chromosome, complete genome	3	3985078-3989392	3,1,1	CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas4,cas7	cas3,PrimPol,PD-DExK,RT,DEDDh,cas2,cas1,cas4,cas7,WYL	Unclear	GTTTCAATTCCATAAGGTACAATTAACAC,GTTTCAATTCCATAAGGTACAATTAACAC,GTTTCAATTCCATAAGGTACAATTAACAC	29,29,29	1	1	3985107-3985142	NZ_CP036539.1_2342107-2342072	NA:NA:NA	67,67,66	67	Unclear	cas3,PrimPol,PD-DExK,RT,DEDDh,cas2,cas1,cas4,cas7,WYL,c2c9_V-U4,Cas14u_CAS-V	NA|135aa|up_1|NZ_CP036539.1_3984034_3984439_-,NA|145aa|up_0|NZ_CP036539.1_3984460_3984895_-,NA|80aa|down_7|NZ_CP036539.1_3996597_3996837_-,NA|64aa|down_8|NZ_CP036539.1_3997077_3997269_+,NA|79aa|down_9|NZ_CP036539.1_3997461_3997698_-	NA|375aa|up_9|NZ_CP036539.1_3974557_3975682_+	PRK09240, thiH, 2-iminoacetate synthase ThiH	NA|234aa|up_8|NZ_CP036539.1_3975697_3976399_+	cd00757, ThiF_MoeB_HesA_family, ThiF_MoeB_HesA	NA|203aa|up_7|NZ_CP036539.1_3976460_3977069_+	cd00564, TMP_TenI, Thiamine monophosphate synthase (TMP synthase)/TenI	NA|172aa|up_6|NZ_CP036539.1_3977146_3977662_-	pfam13505, OMP_b-brl, Outer membrane protein beta-barrel domain	NA|190aa|up_5|NZ_CP036539.1_3977861_3978431_-	pfam13568, OMP_b-brl_2, Outer membrane protein beta-barrel domain	NA|907aa|up_4|NZ_CP036539.1_3978632_3981353_-	PRK09279, PRK09279, pyruvate phosphate dikinase; Provisional	NA|473aa|up_3|NZ_CP036539.1_3981619_3983038_+	COG2265, TrmA, SAM-dependent methyltransferases related to tRNA (uracil-5-)-methyltransferase [Translation, ribosomal structure and biogenesis]	NA|306aa|up_2|NZ_CP036539.1_3983048_3983966_+	COG0564, RluA, Pseudouridylate synthases, 23S RNA-specific [Translation, ribosomal structure and biogenesis]	NA|135aa|up_1|NZ_CP036539.1_3984034_3984439_-	NA	NA|145aa|up_0|NZ_CP036539.1_3984460_3984895_-	NA	cas2|88aa|down_0|NZ_CP036539.1_3989603_3989867_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|338aa|down_1|NZ_CP036539.1_3989869_3990883_-	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas4|171aa|down_2|NZ_CP036539.1_3990879_3991392_-	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas7|353aa|down_3|NZ_CP036539.1_3991456_3992515_-	cd09687, Cas7_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas7	NA|264aa|down_4|NZ_CP036539.1_3993200_3993992_-	PRK09183, PRK09183, transposase/IS protein; Provisional	NA|521aa|down_5|NZ_CP036539.1_3993960_3995523_-	COG4584, COG4584, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|105aa|down_6|NZ_CP036539.1_3996115_3996430_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|80aa|down_7|NZ_CP036539.1_3996597_3996837_-	NA	NA|64aa|down_8|NZ_CP036539.1_3997077_3997269_+	NA	NA|79aa|down_9|NZ_CP036539.1_3997461_3997698_-	NA
GCF_000710375.2_ASM71037v3	NZ_CP036539	Bacteroides fragilis strain DCMOUH0017B chromosome, complete genome	4	5065922-5065999	4	CRISPRCasFinder	no		cas3,PrimPol,PD-DExK,RT,DEDDh,cas2,cas1,cas4,cas7,WYL	Orphan	CAAGACTTAGACACTCAGCAGGCT	24	0	0	NA	NA	NA	1	1	Orphan	cas3,PrimPol,PD-DExK,RT,DEDDh,cas2,cas1,cas4,cas7,WYL,c2c9_V-U4,Cas14u_CAS-V	NA|352aa|up_8|NZ_CP036539.1_5052577_5053633_+,NA|211aa|up_5|NZ_CP036539.1_5055036_5055669_+,NA	NA|457aa|up_9|NZ_CP036539.1_5051130_5052501_+	pfam13148, DUF3987, Protein of unknown function (DUF3987)	NA|352aa|up_8|NZ_CP036539.1_5052577_5053633_+	NA	NA|116aa|up_7|NZ_CP036539.1_5053732_5054080_+	pfam05713, MobC, Bacterial mobilisation protein (MobC)	NA|313aa|up_6|NZ_CP036539.1_5054076_5055015_+	pfam03432, Relaxase, Relaxase/Mobilisation nuclease domain	NA|211aa|up_5|NZ_CP036539.1_5055036_5055669_+	NA	NA|68aa|up_4|NZ_CP036539.1_5055871_5056075_+	smart00530, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|212aa|up_3|NZ_CP036539.1_5056067_5056703_+	pfam08849, DUF1819, Putative inner membrane protein (DUF1819)	NA|200aa|up_2|NZ_CP036539.1_5056708_5057308_+	pfam08747, DUF1788, Domain of unknown function (DUF1788)	NA|1212aa|up_1|NZ_CP036539.1_5057320_5060956_+	NF033441, BREX_BrxC, BREX system P-loop protein BrxC	NA|1213aa|up_0|NZ_CP036539.1_5060967_5064606_+	NF033452, BREX_1_MTaseX, BREX-1 system adenine-specific DNA-methyltransferase PglX	NA|852aa|down_0|NZ_CP036539.1_5066237_5068793_+	TIGR02687, conserved_hypothetical_protein, TIGR02687 family protein	NA|678aa|down_1|NZ_CP036539.1_5068806_5070840_+	pfam13337, Lon_2, Putative ATP-dependent Lon protease	NA|276aa|down_2|NZ_CP036539.1_5071792_5072620_+	cd10447, GIY-YIG_unchar_2, GIY-YIG domain of uncharacterized hypothetical protein found in bacteria and archaea	NA|344aa|down_3|NZ_CP036539.1_5072630_5073662_+	COG3177, COG3177, Fic family protein [Function unknown]	NA|263aa|down_4|NZ_CP036539.1_5073652_5074441_+	TIGR01575, rimI, ribosomal-protein-alanine acetyltransferase	NA|254aa|down_5|NZ_CP036539.1_5074424_5075186_+	pfam13649, Methyltransf_25, Methyltransferase domain	NA|149aa|down_6|NZ_CP036539.1_5075323_5075770_+	PRK10514, PRK10514, putative acetyltransferase; Provisional	NA|73aa|down_7|NZ_CP036539.1_5076179_5076398_+	TIGR03070, couple_hipB, transcriptional regulator, y4mF family	NA|111aa|down_8|NZ_CP036539.1_5076394_5076727_+	TIGR03071, couple_hipA, HipA N-terminal domain	NA|314aa|down_9|NZ_CP036539.1_5076723_5077665_+	pfam07804, HipA_C, HipA-like C-terminal domain
