assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCA_004101825.1_ASM410182v1	CP034358	Clostridium septicum strain VAT12 chromosome, complete genome	1	258845-258945	1	CRISPRCasFinder	no	DinG	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	Type IV-A	AAGCGACTCGTTTATCTTATCACTC	25	0	0	NA	NA	NA	1	1	Orphan	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	NA|102aa|up_4|CP034358.1_248841_249147_-,NA|70aa|down_2|CP034358.1_260737_260947_-,NA|143aa|down_3|CP034358.1_261080_261509_+,NA|79aa|down_6|CP034358.1_263325_263562_-	NA|197aa|up_9|CP034358.1_244046_244637_-	pfam08876, DUF1836, Domain of unknown function (DUF1836)	NA|80aa|up_8|CP034358.1_245167_245407_+	TIGR02851, stage_V_sporulation_protein_T, stage V sporulation protein T	NA|282aa|up_7|CP034358.1_245488_246334_-	COG0313, COG0313, Predicted methyltransferases [General function prediction only]	NA|250aa|up_6|CP034358.1_246336_247086_-	COG4123, COG4123, Predicted O-methyltransferase [General function prediction only]	NA|419aa|up_5|CP034358.1_247208_248465_-	COG0791, Spr, Cell wall-associated hydrolases (invasion-associated proteins) [Cell envelope biogenesis, outer membrane]	NA|102aa|up_4|CP034358.1_248841_249147_-	NA	NA|450aa|up_3|CP034358.1_249811_251161_+	TIGR04105, hypothetical_protein, [FeFe] hydrogenase, group B1/B3	NA|214aa|up_2|CP034358.1_251292_251934_+	COG0637, COG0637, Predicted phosphatase/phosphohexomutase [General function prediction only]	NA|249aa|up_1|CP034358.1_252019_252766_-	PRK00059, prsA, peptidylprolyl isomerase; Provisional	NA|153aa|up_0|CP034358.1_252933_253392_+	COG1225, Bcp, Peroxiredoxin [Posttranslational modification, protein turnover, chaperones]	NA|226aa|down_0|CP034358.1_259263_259941_+	PRK05254, PRK05254, uracil-DNA glycosylase; Provisional	NA|70aa|down_1|CP034358.1_260036_260246_-	PHA03231, PHA03231, glycoprotein BALF4; Provisional	NA|70aa|down_2|CP034358.1_260737_260947_-	NA	NA|143aa|down_3|CP034358.1_261080_261509_+	NA	NA|312aa|down_4|CP034358.1_261588_262524_-	pfam02517, Abi, CAAX protease self-immunity	NA|163aa|down_5|CP034358.1_262713_263202_-	PRK00549, PRK00549, competence damage-inducible protein A; Provisional	NA|79aa|down_6|CP034358.1_263325_263562_-	NA	NA|692aa|down_7|CP034358.1_263654_265730_-	PRK12740, PRK12740, elongation factor G-like protein EF-G2	NA|312aa|down_8|CP034358.1_267419_268355_-	cd04187, DPM1_like_bac, Bacterial DPM1_like enzymes are related to eukaryotic DPM1	NA|122aa|down_9|CP034358.1_268675_269041_-	pfam04138, GtrA, GtrA-like protein
GCA_004101825.1_ASM410182v1	CP034358	Clostridium septicum strain VAT12 chromosome, complete genome	2	564931-565092	2	CRISPRCasFinder	no	csx1	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	Orphan	AAAACTATGCACTACTATGCACA	23	0	0	NA	NA	NA	2	2	Orphan	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	NA,NA|63aa|down_2|CP034358.1_569088_569277_+,NA|95aa|down_6|CP034358.1_574904_575189_-	NA|173aa|up_9|CP034358.1_545559_546078_+	COG1670, RimL, Acetyltransferases, including N-acetylases of ribosomal proteins [Translation, ribosomal structure and biogenesis]	NA|1148aa|up_8|CP034358.1_546120_549564_+	TIGR02773, ATP-dependent_helicase/deoxyribonuclease_subunit_B, helicase-exonuclease AddAB, AddB subunit	NA|1245aa|up_7|CP034358.1_549566_553301_+	TIGR02785, ATP-dependent_helicase/nuclease_subunit_A, helicase-exonuclease AddAB, AddA subunit, Firmicutes type	NA|108aa|up_6|CP034358.1_553327_553651_+	TIGR04091, hypothetical_protein, D-alanyl-lipoteichoic acid biosynthesis protein DltB	NA|565aa|up_5|CP034358.1_553868_555563_-	cd08023, GH16_laminarinase_like, Laminarinase, member of the glycosyl hydrolase family 16	NA|249aa|up_4|CP034358.1_556007_556754_-	COG1737, RpiR, Transcriptional regulators [Transcription]	NA|453aa|up_3|CP034358.1_556989_558348_-	COG0617, PcnB, tRNA nucleotidyltransferase/poly(A) polymerase [Translation, ribosomal structure and biogenesis]	NA|409aa|up_2|CP034358.1_558541_559768_-	cd16913, YkuD_like, L,D-transpeptidases/carboxypeptidases similar to Bacillus YkuD	NA|260aa|up_1|CP034358.1_559911_560691_+	pfam06691, DUF1189, Protein of unknown function (DUF1189)	NA|295aa|up_0|CP034358.1_562498_563383_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|77aa|down_0|CP034358.1_565299_565530_-	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|49aa|down_1|CP034358.1_565783_565930_+	pfam12728, HTH_17, Helix-turn-helix domain	NA|63aa|down_2|CP034358.1_569088_569277_+	NA	NA|62aa|down_3|CP034358.1_569579_569765_+	TIGR01554, prophage_Lp3_protein_18, phage major capsid protein, HK97 family	NA|188aa|down_4|CP034358.1_569858_570422_+	pfam05065, Phage_capsid, Phage capsid family	NA|85aa|down_5|CP034358.1_570483_570738_+	pfam03592, Terminase_2, Terminase small subunit	NA|95aa|down_6|CP034358.1_574904_575189_-	NA	NA|48aa|down_7|CP034358.1_575275_575419_-	TIGR03433, padR_acidobact, transcriptional regulator, Acidobacterial, PadR-family	NA|314aa|down_8|CP034358.1_575964_576906_-	cd01146, FhuD, Fe3+-siderophore binding domain FhuD	NA|337aa|down_9|CP034358.1_577039_578050_+	pfam01032, FecCD, FecCD transport family
GCA_004101825.1_ASM410182v1	CP034358	Clostridium septicum strain VAT12 chromosome, complete genome	4	1708740-1708964	1,4,1	PILER-CR,CRISPRCasFinder,CRT	no	c2c10_CAS-V-U3	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	Type V-U3	GTTTAATATCAACAGAAGTTGTATTTAAAG,GTTTAATATCAACAGAAGTTGTATTTAAAG,TATCAACAGAAGTTGTATTTAAAG	30,30,24	0	0	NA	NA	NA:NA:NA	3,3,3	3	TypeV-U3	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	NA|91aa|up_3|CP034358.1_1703664_1703937_+,c2c10_CAS-V-U3|101aa|up_1|CP034358.1_1707983_1708286_+,NA|217aa|down_4|CP034358.1_1712262_1712913_+,NA|181aa|down_9|CP034358.1_1716911_1717454_+	NA|94aa|up_9|CP034358.1_1701127_1701409_+	pfam16079, Phage_holin_5_2, Phage holin family Hol44, in holin superfamily V	NA|349aa|up_8|CP034358.1_1701478_1702525_+	pfam01510, Amidase_2, N-acetylmuramoyl-L-alanine amidase	NA|58aa|up_7|CP034358.1_1702857_1703031_+	pfam14319, Zn_Tnp_IS91, Transposase zinc-binding domain	NA|87aa|up_6|CP034358.1_1703040_1703301_+	pfam04986, Y2_Tnp, Putative transposase	NA|59aa|up_5|CP034358.1_1703399_1703576_+	pfam04986, Y2_Tnp, Putative transposase	NA|32aa|up_4|CP034358.1_1703572_1703668_+	pfam04986, Y2_Tnp, Putative transposase	NA|91aa|up_3|CP034358.1_1703664_1703937_+	NA	NA|64aa|up_2|CP034358.1_1703951_1704143_+	pfam02146, SIR2, Sir2 family	c2c10_CAS-V-U3|101aa|up_1|CP034358.1_1707983_1708286_+	NA	c2c10_CAS-V-U3|64aa|up_0|CP034358.1_1708343_1708535_+	pfam07282, OrfB_Zn_ribbon, Putative transposase DNA-binding domain	NA|56aa|down_0|CP034358.1_1709194_1709362_-	pfam12651, RHH_3, Ribbon-helix-helix domain	NA|218aa|down_1|CP034358.1_1709513_1710167_+	pfam13730, HTH_36, Helix-turn-helix domain	NA|252aa|down_2|CP034358.1_1710235_1710991_+	COG0338, Dam, Site-specific DNA methylase [DNA replication, recombination, and repair]	NA|206aa|down_3|CP034358.1_1711533_1712151_+	pfam04343, DUF488, Protein of unknown function, DUF488	NA|217aa|down_4|CP034358.1_1712262_1712913_+	NA	NA|219aa|down_5|CP034358.1_1713107_1713764_+	PRK00121, trmB, tRNA (guanine-N(7)-)-methyltransferase; Reviewed	NA|259aa|down_6|CP034358.1_1713817_1714594_-	PRK04201, PRK04201, zinc transporter ZupT; Provisional	NA|274aa|down_7|CP034358.1_1714823_1715645_+	COG0657, Aes, Esterase/lipase [Lipid metabolism]	NA|343aa|down_8|CP034358.1_1715637_1716666_+	COG3594, NolL, Fucose 4-O-acetylase and related acetyltransferases [Carbohydrate transport and metabolism]	NA|181aa|down_9|CP034358.1_1716911_1717454_+	NA
GCA_004101825.1_ASM410182v1	CP034358	Clostridium septicum strain VAT12 chromosome, complete genome	5	2545844-2551817	2,5,2,3	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas2,cas1,cas5,cas7,cas8b2,cas6,WYL	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	Unclear	ATTTACATTCCACTAGTTAAGATAAAAC,ATTTACATTCCACTAGTTAAGATAAAAC,ATTTACATTCCACTAGTTAAGATAAAAC,ATTTACATTCCACTAGTTAAGATAAAAC	28,28,28,28	0	0	NA	NA	NA:NA:NA:NA	90,92,92,90	92	Unclear	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	NA|137aa|up_4|CP034358.1_2541931_2542342_-,NA|20aa|up_2|CP034358.1_2544311_2544371_+,NA|95aa|up_0|CP034358.1_2545212_2545497_-,NA	NA|559aa|up_9|CP034358.1_2534626_2536303_+	pfam09972, DUF2207, Predicted membrane protein (DUF2207)	NA|312aa|up_8|CP034358.1_2536347_2537283_-	PRK03822, lplA, lipoate-protein ligase A; Provisional	NA|564aa|up_7|CP034358.1_2537276_2538968_-	TIGR01350, Dihydrolipoyl_dehydrogenase, dihydrolipoamide dehydrogenase	NA|118aa|up_6|CP034358.1_2539050_2539404_-	COG0599, COG0599, Uncharacterized homolog of gamma-carboxymuconolactone decarboxylase subunit [Function unknown]	NA|148aa|up_5|CP034358.1_2539475_2539919_-	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|137aa|up_4|CP034358.1_2541931_2542342_-	NA	NA|377aa|up_3|CP034358.1_2542656_2543787_+	COG5316, COG5316, Uncharacterized conserved protein [Function unknown]	NA|20aa|up_2|CP034358.1_2544311_2544371_+	NA	NA|131aa|up_1|CP034358.1_2544570_2544963_+	PHA02517, PHA02517, putative transposase OrfB; Reviewed	NA|95aa|up_0|CP034358.1_2545212_2545497_-	NA	cas2|88aa|down_0|CP034358.1_2551998_2552262_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|328aa|down_1|CP034358.1_2552263_2553247_-	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas5|245aa|down_2|CP034358.1_2556077_2556812_-	cd09658, Cas5_I-B, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas7|292aa|down_3|CP034358.1_2556821_2557697_-	TIGR02585, conserved_protein, CRISPR-associated protein Cas7/Cst2/DevR, subtype I-B/TNEAP	cas8b2|564aa|down_4|CP034358.1_2557696_2559388_-	cd09665, Cas8a1_I-A, CRISPR/Cas system-associated protein Cas8a1	cas6|245aa|down_5|CP034358.1_2559399_2560134_-	cd09652, Cas6-I-III, CRISPR/Cas system-associated RAMP superfamily protein Cas6	WYL|313aa|down_6|CP034358.1_2560258_2561197_-	pfam13280, WYL, WYL domain	NA|862aa|down_7|CP034358.1_2561608_2564194_-	pfam13320, DUF4091, Domain of unknown function (DUF4091)	NA|407aa|down_8|CP034358.1_2564555_2565776_-	PRK05469, PRK05469, tripeptide aminopeptidase PepT	NA|355aa|down_9|CP034358.1_2565870_2566935_-	cd10944, CE4_SmPgdA_like, Catalytic NodB homology domain of Streptococcus mutans polysaccharide deacetylase PgdA, Bacillus subtilis YheN, and similar proteins
GCA_004101825.1_ASM410182v1	CP034358	Clostridium septicum strain VAT12 chromosome, complete genome	6	2699942-2700032	6	CRISPRCasFinder	no		DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	Orphan	CTATTTATGAAATAACTAACCAAATACC	28	0	0	NA	NA	NA	1	1	Orphan	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	NA,NA|188aa|down_9|CP034358.1_2711673_2712237_-	NA|683aa|up_9|CP034358.1_2691295_2693344_-	COG1480, COG1480, Predicted membrane-associated HD superfamily hydrolase [General function prediction only]	NA|379aa|up_8|CP034358.1_2693375_2694512_-	pfam06898, YqfD, Putative stage IV sporulation protein YqfD	NA|93aa|up_7|CP034358.1_2694517_2694796_-	TIGR02856, Uncharacterized_protein_YqfC, sporulation protein YqfC	NA|150aa|up_6|CP034358.1_2694904_2695354_-	pfam09424, YqeY, Yqey-like protein	NA|59aa|up_5|CP034358.1_2695386_2695563_-	PRK00270, rpsU, 30S ribosomal protein S21; Reviewed	NA|114aa|up_4|CP034358.1_2695683_2696025_-	cd01276, PKCI_related, Protein Kinase C Interacting protein related (PKCI): PKCI and related proteins belong to the ubiquitous HIT family of hydrolases that act on alpha-phosphates of ribonucleotides	NA|435aa|up_3|CP034358.1_2696112_2697417_-	COG0621, MiaB, 2-methylthioadenine synthetase [Translation, ribosomal structure and biogenesis]	NA|255aa|up_2|CP034358.1_2697416_2698181_-	PRK11713, PRK11713, 16S ribosomal RNA methyltransferase RsmE; Provisional	NA|314aa|up_1|CP034358.1_2698204_2699146_-	pfam06325, PrmA, Ribosomal protein L11 methyltransferase (PrmA)	NA|166aa|up_0|CP034358.1_2699298_2699796_-	PRK00522, tpx, thiol peroxidase	NA|518aa|down_0|CP034358.1_2700419_2701973_-	COG0155, CysI, Sulfite reductase, beta subunit (hemoprotein) [Inorganic ion transport and metabolism]	NA|377aa|down_1|CP034358.1_2702124_2703255_-	PRK14297, PRK14297, molecular chaperone DnaJ	NA|618aa|down_2|CP034358.1_2703347_2705201_-	PRK00290, dnaK, molecular chaperone DnaK; Provisional	NA|205aa|down_3|CP034358.1_2705248_2705863_-	PRK14160, PRK14160, heat shock protein GrpE; Provisional	NA|344aa|down_4|CP034358.1_2705883_2706915_-	PRK00082, hrcA, heat-inducible transcription repressor; Provisional	NA|378aa|down_5|CP034358.1_2707083_2708217_-	PRK05799, PRK05799, oxygen-independent coproporphyrinogen III oxidase	NA|90aa|down_6|CP034358.1_2708345_2708615_-	cd00495, Ribosomal_L25_TL5_CTC, Ribosomal L25/TL5/CTC N-terminal 5S rRNA binding domain	NA|303aa|down_7|CP034358.1_2708780_2709689_+	cd07213, Pat17_PNPLA8_PNPLA9_like1, Patatin-like phospholipase	NA|602aa|down_8|CP034358.1_2709753_2711559_-	PRK05433, PRK05433, GTP-binding protein LepA; Provisional	NA|188aa|down_9|CP034358.1_2711673_2712237_-	NA
GCA_004101825.1_ASM410182v1	CP034358	Clostridium septicum strain VAT12 chromosome, complete genome	7	3198448-3198540	7	CRISPRCasFinder	no	WYL	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	Unclear	CTTTTAACTTAACATAAATGTGCTTTCC	28	0	0	NA	NA	NA	1	1	Orphan	DinG,DEDDh,csx1,cas3,csa3,WYL,c2c10_CAS-V-U3,cas2,cas1,cas5,cas7,cas8b2,cas6	NA|216aa|up_7|CP034358.1_3191047_3191695_-,NA|84aa|up_2|CP034358.1_3196193_3196445_-,NA|104aa|up_1|CP034358.1_3196502_3196814_-,NA|153aa|down_0|CP034358.1_3198587_3199046_-,NA|393aa|down_2|CP034358.1_3200424_3201603_-,NA|123aa|down_3|CP034358.1_3201612_3201981_-,NA|276aa|down_4|CP034358.1_3202060_3202888_-,NA|267aa|down_6|CP034358.1_3203753_3204554_-,NA|255aa|down_8|CP034358.1_3205364_3206129_-	NA|87aa|up_9|CP034358.1_3190064_3190325_-	TIGR04090, hypothetical_protein, alternate signal-mediated exported protein, CPF_0494 family	NA|211aa|up_8|CP034358.1_3190371_3191004_-	TIGR04090, hypothetical_protein, alternate signal-mediated exported protein, CPF_0494 family	NA|216aa|up_7|CP034358.1_3191047_3191695_-	NA	NA|222aa|up_6|CP034358.1_3191705_3192371_-	TIGR04090, hypothetical_protein, alternate signal-mediated exported protein, CPF_0494 family	NA|169aa|up_5|CP034358.1_3192400_3192907_-	TIGR02228, Signal_peptidase_I_W, signal peptidase I, archaeal type	WYL|221aa|up_4|CP034358.1_3193141_3193804_-	COG2378, COG2378, Predicted transcriptional regulator [Transcription]	NA|673aa|up_3|CP034358.1_3194072_3196091_+	cd01949, GGDEF, Diguanylate-cyclase (DGC) or GGDEF domain	NA|84aa|up_2|CP034358.1_3196193_3196445_-	NA	NA|104aa|up_1|CP034358.1_3196502_3196814_-	NA	NA|321aa|up_0|CP034358.1_3197328_3198291_-	NF033189, internalin_A, class 1 internalin InlA	NA|153aa|down_0|CP034358.1_3198587_3199046_-	NA	NA|213aa|down_1|CP034358.1_3199739_3200378_+	pfam04892, VanZ, VanZ like family	NA|393aa|down_2|CP034358.1_3200424_3201603_-	NA	NA|123aa|down_3|CP034358.1_3201612_3201981_-	NA	NA|276aa|down_4|CP034358.1_3202060_3202888_-	NA	NA|288aa|down_5|CP034358.1_3202888_3203752_-	cd03264, ABC_drug_resistance_like, ABC-type multidrug transport system, ATPase component	NA|267aa|down_6|CP034358.1_3203753_3204554_-	NA	NA|187aa|down_7|CP034358.1_3204543_3205104_-	TIGR02937, RNA_polymerase_sigma_factor, RNA polymerase sigma factor, sigma-70 family	NA|255aa|down_8|CP034358.1_3205364_3206129_-	NA	NA|411aa|down_9|CP034358.1_3206175_3207408_-	PRK13628, PRK13628, serine/threonine transporter SstT; Provisional
