assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_002173755.1_ASM217375v1	NZ_CP017577	Bacillus thuringiensis strain SCG04-02, complete genome	1	1346303-1346413	1	CRISPRCasFinder	no		DinG,cas14k,csa3,cas3,RT,Cas14u_CAS-V,WYL,c2c9_V-U4,DEDDh	Orphan	AAAATGAAACCGATTTTTGATGCACAA	27	0	0	NA	NA	NA	1	1	Orphan	DinG,cas14k,csa3,cas3,RT,Cas14u_CAS-V,WYL,c2c9_V-U4,DEDDh,cas9,cas14j	NA|84aa|up_8|NZ_CP017577.1_1337324_1337576_+,NA|65aa|up_6|NZ_CP017577.1_1338461_1338656_-,NA|390aa|up_5|NZ_CP017577.1_1339669_1340839_+,NA|210aa|up_3|NZ_CP017577.1_1342595_1343225_+,NA|241aa|down_0|NZ_CP017577.1_1346431_1347154_+,NA|70aa|down_1|NZ_CP017577.1_1347514_1347724_+,NA|85aa|down_2|NZ_CP017577.1_1347862_1348117_+	NA|56aa|up_9|NZ_CP017577.1_1337131_1337299_+	pfam13128, DUF3954, Protein of unknown function (DUF3954)	NA|84aa|up_8|NZ_CP017577.1_1337324_1337576_+	NA	NA|161aa|up_7|NZ_CP017577.1_1337596_1338079_+	cd11541, NTP-PPase_u4, Nucleoside Triphosphate Pyrophosphohydrolase (EC 3	NA|65aa|up_6|NZ_CP017577.1_1338461_1338656_-	NA	NA|390aa|up_5|NZ_CP017577.1_1339669_1340839_+	NA	NA|229aa|up_4|NZ_CP017577.1_1341288_1341975_-	pfam02517, Abi, CAAX protease self-immunity	NA|210aa|up_3|NZ_CP017577.1_1342595_1343225_+	NA	NA|161aa|up_2|NZ_CP017577.1_1343581_1344064_+	TIGR01637, Putative_autolysin_regulatory_protein_ArpU, phage transcriptional regulator, ArpU family	NA|181aa|up_1|NZ_CP017577.1_1344063_1344606_+	cd01192, INT_C_like_3, Uncharacterized site-specific tyrosine recombinase, C-terminal catalytic domain	NA|317aa|up_0|NZ_CP017577.1_1344819_1345770_+	cd00455, nuc_hydro, nuc_hydro: Nucleoside hydrolases	NA|241aa|down_0|NZ_CP017577.1_1346431_1347154_+	NA	NA|70aa|down_1|NZ_CP017577.1_1347514_1347724_+	NA	NA|85aa|down_2|NZ_CP017577.1_1347862_1348117_+	NA	NA|126aa|down_3|NZ_CP017577.1_1348106_1348484_+	COG1403, McrA, Restriction endonuclease [Defense mechanisms]	NA|168aa|down_4|NZ_CP017577.1_1348611_1349115_+	pfam05119, Terminase_4, Phage terminase, small subunit	NA|565aa|down_5|NZ_CP017577.1_1349116_1350811_+	COG4626, COG4626, Phage terminase-like protein, large subunit [General function prediction only]	NA|418aa|down_6|NZ_CP017577.1_1350999_1352253_+	pfam04860, Phage_portal, Phage portal protein	NA|237aa|down_7|NZ_CP017577.1_1352239_1352950_+	cd07016, S14_ClpP_1, Caseinolytic protease (ClpP) is an ATP-dependent, highly conserved serine protease	NA|391aa|down_8|NZ_CP017577.1_1352987_1354160_+	TIGR01554, prophage_Lp3_protein_18, phage major capsid protein, HK97 family	NA|96aa|down_9|NZ_CP017577.1_1354180_1354468_+	cd08054, gp6, Head-Tail Connector Protein gp6 of Bacteriophage HK97 and similar proteins
GCF_002173755.1_ASM217375v1	NZ_CP017577	Bacillus thuringiensis strain SCG04-02, complete genome	2	3979600-3979733	2	CRISPRCasFinder	no		DinG,cas14k,csa3,cas3,RT,Cas14u_CAS-V,WYL,c2c9_V-U4,DEDDh	Orphan	GTTGATTTCTCTTCTTTTTGAGA	23	0	0	NA	NA	NA	2	2	Orphan	DinG,cas14k,csa3,cas3,RT,Cas14u_CAS-V,WYL,c2c9_V-U4,DEDDh,cas9,cas14j	NA|45aa|up_0|NZ_CP017577.1_3979277_3979412_-,NA	NA|607aa|up_9|NZ_CP017577.1_3970064_3971885_-	COG1086, COG1086, Predicted nucleoside-diphosphate sugar epimerases [Cell envelope biogenesis, outer membrane / Carbohydrate transport and metabolism]	NA|294aa|up_8|NZ_CP017577.1_3971945_3972827_-	COG1210, GalU, UDP-glucose pyrophosphorylase [Cell envelope biogenesis, outer membrane]	NA|256aa|up_7|NZ_CP017577.1_3973072_3973840_-	COG4464, CapC, Capsular polysaccharide biosynthesis protein [Carbohydrate transport and metabolism / Cell envelope biogenesis, outer membrane]	NA|234aa|up_6|NZ_CP017577.1_3973951_3974653_-	cd05387, BY-kinase, bacterial tyrosine-kinase	NA|248aa|up_5|NZ_CP017577.1_3974642_3975386_-	COG3944, COG3944, Capsular polysaccharide biosynthesis protein [Cell envelope biogenesis, outer membrane]	NA|226aa|up_4|NZ_CP017577.1_3975645_3976323_-	cd05387, BY-kinase, bacterial tyrosine-kinase	NA|145aa|up_3|NZ_CP017577.1_3976669_3977104_-	PRK00006, fabZ, 3-hydroxyacyl-ACP dehydratase FabZ	NA|334aa|up_2|NZ_CP017577.1_3977533_3978535_-	PRK13928, PRK13928, rod shape-determining protein Mbl; Provisional	NA|91aa|up_1|NZ_CP017577.1_3978695_3978968_-	pfam12116, SpoIIID, Stage III sporulation protein D	NA|45aa|up_0|NZ_CP017577.1_3979277_3979412_-	NA	NA|235aa|down_0|NZ_CP017577.1_3980621_3981326_-	pfam12698, ABC2_membrane_3, ABC-2 family transporter protein	NA|281aa|down_1|NZ_CP017577.1_3981325_3982168_-	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|336aa|down_2|NZ_CP017577.1_3982348_3983356_-	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]	NA|340aa|down_3|NZ_CP017577.1_3983455_3984475_-	TIGR02870, Stage_II_sporulation_protein_D, stage II sporulation protein D	NA|435aa|down_4|NZ_CP017577.1_3984681_3985986_-	PRK09369, PRK09369, UDP-N-acetylglucosamine 1-carboxyvinyltransferase; Validated	NA|237aa|down_5|NZ_CP017577.1_3986025_3986736_-	pfam08680, DUF1779, TATA-box binding	NA|79aa|down_6|NZ_CP017577.1_3986781_3987018_-	COG4836, COG4836, Predicted membrane protein [Function unknown]	NA|507aa|down_7|NZ_CP017577.1_3987220_3988741_-	PRK05777, PRK05777, NADH-quinone oxidoreductase subunit NuoN	NA|501aa|down_8|NZ_CP017577.1_3988742_3990245_-	PRK05846, PRK05846, NADH:ubiquinone oxidoreductase subunit M; Reviewed	NA|621aa|down_9|NZ_CP017577.1_3990241_3992104_-	PRK06590, PRK06590, NADH:ubiquinone oxidoreductase subunit L; Reviewed
GCF_002173755.1_ASM217375v1	NZ_CP017577	Bacillus thuringiensis strain SCG04-02, complete genome	3	5292905-5293033	3	CRISPRCasFinder	no		DinG,cas14k,csa3,cas3,RT,Cas14u_CAS-V,WYL,c2c9_V-U4,DEDDh	Orphan	AGGAGCAAACCAAATGGCAGGTGGCGTAAATCAATTAGCAGATGG	45	0	0	NA	NA	NA	1	1	Orphan	DinG,cas14k,csa3,cas3,RT,Cas14u_CAS-V,WYL,c2c9_V-U4,DEDDh,cas9,cas14j	NA|100aa|up_4|NZ_CP017577.1_5286130_5286430_+,NA|282aa|up_3|NZ_CP017577.1_5286484_5287330_-,NA|71aa|down_0|NZ_CP017577.1_5294059_5294272_+,NA|143aa|down_8|NZ_CP017577.1_5299034_5299463_+	NA|349aa|up_9|NZ_CP017577.1_5278543_5279590_+	PRK00115, hemE, uroporphyrinogen decarboxylase; Validated	NA|312aa|up_8|NZ_CP017577.1_5279604_5280540_+	PRK12435, PRK12435, ferrochelatase; Provisional	NA|474aa|up_7|NZ_CP017577.1_5280559_5281981_+	PRK11883, PRK11883, protoporphyrinogen oxidase; Reviewed	NA|451aa|up_6|NZ_CP017577.1_5282037_5283390_-	pfam13218, DUF4026, Protein of unknown function (DUF4026)	NA|789aa|up_5|NZ_CP017577.1_5283631_5285998_+	COG2374, COG2374, Predicted extracellular nuclease [General function prediction only]	NA|100aa|up_4|NZ_CP017577.1_5286130_5286430_+	NA	NA|282aa|up_3|NZ_CP017577.1_5286484_5287330_-	NA	NA|134aa|up_2|NZ_CP017577.1_5287559_5287961_+	pfam03965, Penicillinase_R, Penicillinase repressor	NA|638aa|up_1|NZ_CP017577.1_5287963_5289877_+	pfam05569, Peptidase_M56, BlaR1 peptidase M56	NA|191aa|up_0|NZ_CP017577.1_5290090_5290663_+	COG1309, AcrR, Transcriptional regulator [Transcription]	NA|71aa|down_0|NZ_CP017577.1_5294059_5294272_+	NA	NA|102aa|down_1|NZ_CP017577.1_5294276_5294582_+	COG3860, COG3860, Uncharacterized protein conserved in bacteria [Function unknown]	NA|118aa|down_2|NZ_CP017577.1_5294608_5294962_-	pfam14470, bPH_3, Bacterial PH domain	NA|170aa|down_3|NZ_CP017577.1_5295095_5295605_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|338aa|down_4|NZ_CP017577.1_5295799_5296813_+	COG1609, PurR, Transcriptional regulators [Transcription]	NA|43aa|down_5|NZ_CP017577.1_5296852_5296981_-	pfam14149, YhfH, YhfH-like protein	NA|245aa|down_6|NZ_CP017577.1_5297161_5297896_+	cd07716, RNaseZ_short-form-like_MBL-fold, uncharacterized bacterial subgroup of Ribonuclease Z, short form; MBL-fold metallo-hydrolase domain	NA|330aa|down_7|NZ_CP017577.1_5297905_5298895_+	TIGR00545, Probable_lipoate-protein_ligase_A, lipoyltransferase and lipoate-protein ligase	NA|143aa|down_8|NZ_CP017577.1_5299034_5299463_+	NA	NA|511aa|down_9|NZ_CP017577.1_5299624_5301157_+	PRK07656, PRK07656, long-chain-fatty-acid--CoA ligase; Validated
GCF_002173755.1_ASM217375v1	NZ_CP017574	Bacillus thuringiensis strain SCG04-02 plasmid PSCG364, complete sequence	1	233155-233340	1	CRT	no	RT	csa3,DEDDh,cas9,cas14j,RT	Unclear	GAAACCAGAACAGAAGCCAGAGCAGAAACC	30	0	0	NA	NA	NA	3	3	Orphan	DinG,cas14k,csa3,cas3,RT,Cas14u_CAS-V,WYL,c2c9_V-U4,DEDDh,cas9,cas14j	NA|280aa|up_9|NZ_CP017574.1_216830_217670_-,NA|517aa|up_7|NZ_CP017574.1_218172_219723_+,NA|77aa|up_4|NZ_CP017574.1_224377_224608_+,NA|579aa|up_2|NZ_CP017574.1_225782_227519_+,NA|150aa|down_0|NZ_CP017574.1_233678_234128_+,NA|174aa|down_2|NZ_CP017574.1_235550_236072_+,NA|63aa|down_3|NZ_CP017574.1_236095_236284_+,NA|104aa|down_4|NZ_CP017574.1_236356_236668_+,NA|175aa|down_5|NZ_CP017574.1_236690_237215_+,NA|200aa|down_6|NZ_CP017574.1_237227_237827_+,NA|332aa|down_8|NZ_CP017574.1_238558_239554_+	NA|280aa|up_9|NZ_CP017574.1_216830_217670_-	NA	NA|81aa|up_8|NZ_CP017574.1_217928_218171_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|517aa|up_7|NZ_CP017574.1_218172_219723_+	NA	RT|614aa|up_6|NZ_CP017574.1_220764_222606_+	TIGR04416, hypothetical_protein, group II intron reverse transcriptase/maturase	NA|414aa|up_5|NZ_CP017574.1_222640_223882_+	pfam12965, DUF3854, Domain of unknown function (DUF3854)	NA|77aa|up_4|NZ_CP017574.1_224377_224608_+	NA	NA|324aa|up_3|NZ_CP017574.1_224630_225602_+	COG0568, RpoD, DNA-directed RNA polymerase, sigma subunit (sigma70/sigma32) [Transcription]	NA|579aa|up_2|NZ_CP017574.1_225782_227519_+	NA	NA|332aa|up_1|NZ_CP017574.1_227544_228540_+	PRK05574, holA, DNA polymerase III subunit delta; Reviewed	NA|588aa|up_0|NZ_CP017574.1_229025_230789_+	PRK09510, tolA, cell envelope integrity inner membrane protein TolA; Provisional	NA|150aa|down_0|NZ_CP017574.1_233678_234128_+	NA	NA|185aa|down_1|NZ_CP017574.1_234726_235281_-	TIGR02227, Inactive_signal_peptidase_IA	NA|174aa|down_2|NZ_CP017574.1_235550_236072_+	NA	NA|63aa|down_3|NZ_CP017574.1_236095_236284_+	NA	NA|104aa|down_4|NZ_CP017574.1_236356_236668_+	NA	NA|175aa|down_5|NZ_CP017574.1_236690_237215_+	NA	NA|200aa|down_6|NZ_CP017574.1_237227_237827_+	NA	NA|228aa|down_7|NZ_CP017574.1_237858_238542_+	pfam14460, Prok-E2_D, Prokaryotic E2 family D	NA|332aa|down_8|NZ_CP017574.1_238558_239554_+	NA	NA|285aa|down_9|NZ_CP017574.1_239550_240405_+	TIGR03736, PRTRC_ThiF, PRTRC system ThiF family protein
