assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000145615.1_ASM14561v1	NC_014410	Thermoanaerobacterium thermosaccharolyticum DSM 571, complete genome	1	309414-312133	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no		RT,cas3,cas14j,cas4,csa3,WYL,DinG,csx1,cmr1gr7,cas10,cmr3gr5,csm6,cmr4gr7,cmr5gr11,cmr6gr7,DEDDh,cas2,cas1,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,csx20,cas8a4	Orphan	GTTTTTAGCCTACCTATAAGGGATTGAAAC,GTTTTTAGCCTACCTATAAGGGATTGAAAC,GTTTTTAGCCTACCTATAAGGGATTGAAAC	30,30,30	0	0	NA	NA	NA:NA:NA	40,40,40	40	Orphan	RT,cas3,cas14j,cas4,csa3,WYL,DinG,csx1,cmr1gr7,cas10,cmr3gr5,csm6,cmr4gr7,cmr5gr11,cmr6gr7,DEDDh,cas2,cas1,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,csx20,cas8a4	NA|72aa|up_9|NC_014410.1_296431_296647_+,NA|191aa|up_1|NC_014410.1_306555_307128_-,NA|123aa|down_0|NC_014410.1_312327_312696_+,NA|61aa|down_3|NC_014410.1_315256_315439_+,NA|66aa|down_5|NC_014410.1_319103_319301_+,NA|118aa|down_6|NC_014410.1_319248_319602_+	NA|72aa|up_9|NC_014410.1_296431_296647_+	NA	NA|76aa|up_8|NC_014410.1_297110_297338_+	pfam17295, DUF5348, Domain of unknown function (DUF5348)	NA|83aa|up_7|NC_014410.1_297439_297688_+	pfam13711, DUF4160, Domain of unknown function (DUF4160)	NA|83aa|up_6|NC_014410.1_297694_297943_+	pfam10387, DUF2442, Protein of unknown function (DUF2442)	NA|191aa|up_5|NC_014410.1_297986_298559_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|332aa|up_4|NC_014410.1_298582_299578_+	pfam07833, Cu_amine_oxidN1, Copper amine oxidase N-terminal domain	NA|268aa|up_3|NC_014410.1_304259_305063_-	TIGR03015, pepcterm_ATPase, putative secretion ATPase, PEP-CTERM locus subfamily	NA|370aa|up_2|NC_014410.1_305084_306194_-	pfam00665, rve, Integrase core domain	NA|191aa|up_1|NC_014410.1_306555_307128_-	NA	NA|290aa|up_0|NC_014410.1_308182_309052_-	pfam07833, Cu_amine_oxidN1, Copper amine oxidase N-terminal domain	NA|123aa|down_0|NC_014410.1_312327_312696_+	NA	NA|278aa|down_1|NC_014410.1_313144_313978_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|192aa|down_2|NC_014410.1_314603_315179_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|61aa|down_3|NC_014410.1_315256_315439_+	NA	NA|428aa|down_4|NC_014410.1_316634_317918_-	pfam01548, DEDD_Tnp_IS110, Transposase	NA|66aa|down_5|NC_014410.1_319103_319301_+	NA	NA|118aa|down_6|NC_014410.1_319248_319602_+	NA	NA|431aa|down_7|NC_014410.1_319715_321008_-	pfam02810, SEC-C, SEC-C motif	NA|367aa|down_8|NC_014410.1_321423_322524_+	pfam02317, Octopine_DH, NAD/NADP octopine/nopaline dehydrogenase, alpha-helical domain	NA|551aa|down_9|NC_014410.1_322520_324173_+	pfam02310, B12-binding, B12 binding domain
GCF_000145615.1_ASM14561v1	NC_014410	Thermoanaerobacterium thermosaccharolyticum DSM 571, complete genome	2	315799-316092	2,2,2	PILER-CR,CRISPRCasFinder,CRT	no		RT,cas3,cas14j,cas4,csa3,WYL,DinG,csx1,cmr1gr7,cas10,cmr3gr5,csm6,cmr4gr7,cmr5gr11,cmr6gr7,DEDDh,cas2,cas1,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,csx20,cas8a4	Orphan	GTTTTTAGCCTACCTATGAGGAATTGAAAC,GTTTTTAGCCTACCTATGAGGAATTGAAAC,GTTTTTAGCCTACCTATGAGGAATTGAAAC	30,30,30	0	0	NA	NA	NA:NA:NA	4,4,4	4	Orphan	RT,cas3,cas14j,cas4,csa3,WYL,DinG,csx1,cmr1gr7,cas10,cmr3gr5,csm6,cmr4gr7,cmr5gr11,cmr6gr7,DEDDh,cas2,cas1,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,csx20,cas8a4	NA|191aa|up_5|NC_014410.1_306555_307128_-,NA|123aa|up_3|NC_014410.1_312327_312696_+,NA|61aa|up_0|NC_014410.1_315256_315439_+,NA|66aa|down_1|NC_014410.1_319103_319301_+,NA|118aa|down_2|NC_014410.1_319248_319602_+,NA|186aa|down_9|NC_014410.1_326953_327511_+	NA|191aa|up_9|NC_014410.1_297986_298559_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|332aa|up_8|NC_014410.1_298582_299578_+	pfam07833, Cu_amine_oxidN1, Copper amine oxidase N-terminal domain	NA|268aa|up_7|NC_014410.1_304259_305063_-	TIGR03015, pepcterm_ATPase, putative secretion ATPase, PEP-CTERM locus subfamily	NA|370aa|up_6|NC_014410.1_305084_306194_-	pfam00665, rve, Integrase core domain	NA|191aa|up_5|NC_014410.1_306555_307128_-	NA	NA|290aa|up_4|NC_014410.1_308182_309052_-	pfam07833, Cu_amine_oxidN1, Copper amine oxidase N-terminal domain	NA|123aa|up_3|NC_014410.1_312327_312696_+	NA	NA|278aa|up_2|NC_014410.1_313144_313978_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|192aa|up_1|NC_014410.1_314603_315179_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|61aa|up_0|NC_014410.1_315256_315439_+	NA	NA|428aa|down_0|NC_014410.1_316634_317918_-	pfam01548, DEDD_Tnp_IS110, Transposase	NA|66aa|down_1|NC_014410.1_319103_319301_+	NA	NA|118aa|down_2|NC_014410.1_319248_319602_+	NA	NA|431aa|down_3|NC_014410.1_319715_321008_-	pfam02810, SEC-C, SEC-C motif	NA|367aa|down_4|NC_014410.1_321423_322524_+	pfam02317, Octopine_DH, NAD/NADP octopine/nopaline dehydrogenase, alpha-helical domain	NA|551aa|down_5|NC_014410.1_322520_324173_+	pfam02310, B12-binding, B12 binding domain	NA|218aa|down_6|NC_014410.1_324313_324967_+	cd02696, MurNAc-LAA, N-acetylmuramoyl-L-alanine amidase or MurNAc-LAA (also known as peptidoglycan aminohydrolase, NAMLA amidase, NAMLAA, Amidase 3, and peptidoglycan amidase; EC 3	NA|112aa|down_7|NC_014410.1_324971_325307_+	TIGR01673, putative_holin, phage holin, LL-H family	NA|426aa|down_8|NC_014410.1_325369_326647_-	PRK10720, PRK10720, uracil transporter; Provisional	NA|186aa|down_9|NC_014410.1_326953_327511_+	NA
GCF_000145615.1_ASM14561v1	NC_014410	Thermoanaerobacterium thermosaccharolyticum DSM 571, complete genome	3	318047-319079	3,3,3	PILER-CR,CRISPRCasFinder,CRT	no		RT,cas3,cas14j,cas4,csa3,WYL,DinG,csx1,cmr1gr7,cas10,cmr3gr5,csm6,cmr4gr7,cmr5gr11,cmr6gr7,DEDDh,cas2,cas1,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,csx20,cas8a4	Orphan	GTTTTTAGCCTACCTATGAGGAATTGAAAC,GTTTTTAGCCTACCTATGAGGAATTGAAAC,GTTTTTAGCCTACCTATGAGGAATTGAAAC	30,30,30	0	0	NA	NA	NA:NA:NA	14,15,15	15	Orphan	RT,cas3,cas14j,cas4,csa3,WYL,DinG,csx1,cmr1gr7,cas10,cmr3gr5,csm6,cmr4gr7,cmr5gr11,cmr6gr7,DEDDh,cas2,cas1,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,csx20,cas8a4	NA|191aa|up_6|NC_014410.1_306555_307128_-,NA|123aa|up_4|NC_014410.1_312327_312696_+,NA|61aa|up_1|NC_014410.1_315256_315439_+,NA|66aa|down_0|NC_014410.1_319103_319301_+,NA|118aa|down_1|NC_014410.1_319248_319602_+,NA|186aa|down_8|NC_014410.1_326953_327511_+	NA|332aa|up_9|NC_014410.1_298582_299578_+	pfam07833, Cu_amine_oxidN1, Copper amine oxidase N-terminal domain	NA|268aa|up_8|NC_014410.1_304259_305063_-	TIGR03015, pepcterm_ATPase, putative secretion ATPase, PEP-CTERM locus subfamily	NA|370aa|up_7|NC_014410.1_305084_306194_-	pfam00665, rve, Integrase core domain	NA|191aa|up_6|NC_014410.1_306555_307128_-	NA	NA|290aa|up_5|NC_014410.1_308182_309052_-	pfam07833, Cu_amine_oxidN1, Copper amine oxidase N-terminal domain	NA|123aa|up_4|NC_014410.1_312327_312696_+	NA	NA|278aa|up_3|NC_014410.1_313144_313978_+	smart00283, MA, Methyl-accepting chemotaxis-like domains (chemotaxis sensory transducer)	NA|192aa|up_2|NC_014410.1_314603_315179_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|61aa|up_1|NC_014410.1_315256_315439_+	NA	NA|428aa|up_0|NC_014410.1_316634_317918_-	pfam01548, DEDD_Tnp_IS110, Transposase	NA|66aa|down_0|NC_014410.1_319103_319301_+	NA	NA|118aa|down_1|NC_014410.1_319248_319602_+	NA	NA|431aa|down_2|NC_014410.1_319715_321008_-	pfam02810, SEC-C, SEC-C motif	NA|367aa|down_3|NC_014410.1_321423_322524_+	pfam02317, Octopine_DH, NAD/NADP octopine/nopaline dehydrogenase, alpha-helical domain	NA|551aa|down_4|NC_014410.1_322520_324173_+	pfam02310, B12-binding, B12 binding domain	NA|218aa|down_5|NC_014410.1_324313_324967_+	cd02696, MurNAc-LAA, N-acetylmuramoyl-L-alanine amidase or MurNAc-LAA (also known as peptidoglycan aminohydrolase, NAMLA amidase, NAMLAA, Amidase 3, and peptidoglycan amidase; EC 3	NA|112aa|down_6|NC_014410.1_324971_325307_+	TIGR01673, putative_holin, phage holin, LL-H family	NA|426aa|down_7|NC_014410.1_325369_326647_-	PRK10720, PRK10720, uracil transporter; Provisional	NA|186aa|down_8|NC_014410.1_326953_327511_+	NA	NA|248aa|down_9|NC_014410.1_328666_329410_-	COG1131, CcmA, ABC-type multidrug transport system, ATPase component [Defense mechanisms]
GCF_000145615.1_ASM14561v1	NC_014410	Thermoanaerobacterium thermosaccharolyticum DSM 571, complete genome	4	2643518-2647416	4,4,4	CRISPRCasFinder,CRT,PILER-CR	no	csx1,cas2,cas1,cas4,cas3,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,cas10,csx20	RT,cas3,cas14j,cas4,csa3,WYL,DinG,csx1,cmr1gr7,cas10,cmr3gr5,csm6,cmr4gr7,cmr5gr11,cmr6gr7,DEDDh,cas2,cas1,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,csx20,cas8a4	Type III-C,Type III-D,Type III-A,Type III-B,Type I-B	GTTTCAATTCCTGATAGGTAGGCTAAAAAC,GTTTCAATTCCTGATAGGTAGGCTAAAAAC,GTTTTTAGCCTACCTATCAGGAATTGAAAC	30,30,30	0	0	NA	NA	NA:NA:NA	58,58,30	58	TypeIII-C,TypeIII-D,TypeIII-A,TypeIII-B,TypeI-B	RT,cas3,cas14j,cas4,csa3,WYL,DinG,csx1,cmr1gr7,cas10,cmr3gr5,csm6,cmr4gr7,cmr5gr11,cmr6gr7,DEDDh,cas2,cas1,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,csx20,cas8a4	NA,csm2gr11|122aa|down_5|NC_014410.1_2654359_2654725_-,csm2gr11|150aa|down_9|NC_014410.1_2657128_2657578_-	NA|283aa|up_9|NC_014410.1_2629503_2630352_+	PRK11867, PRK11867, 2-oxoglutarate ferredoxin oxidoreductase subunit beta; Reviewed	NA|624aa|up_8|NC_014410.1_2630391_2632263_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|742aa|up_7|NC_014410.1_2632262_2634488_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|148aa|up_6|NC_014410.1_2634520_2634964_-	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|522aa|up_5|NC_014410.1_2635097_2636663_-	cd01031, EriC, ClC chloride channel EriC	csx1|401aa|up_4|NC_014410.1_2636802_2638005_-	cd09732, Csx1_III-U, CRISPR/Cas system-associated protein Csx1	cas2|88aa|up_3|NC_014410.1_2638027_2638291_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|331aa|up_2|NC_014410.1_2638303_2639296_-	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas4|166aa|up_1|NC_014410.1_2639292_2639790_-	pfam01930, Cas_Cas4, Domain of unknown function DUF83	NA|480aa|up_0|NC_014410.1_2640420_2641860_-	COG5184, ATS1, Alpha-tubulin suppressor and related RCC1 domain-containing proteins [Cell division and chromosome partitioning / Cytoskeleton]	cas3|788aa|down_0|NC_014410.1_2647584_2649948_-	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	cas5|238aa|down_1|NC_014410.1_2649925_2650639_-	TIGR02592, hypothetical_protein_CTC_01466, CRISPR-associated protein Cas5, subtype I-B/HMARI	cas7|304aa|down_2|NC_014410.1_2650714_2651626_-	TIGR02590, hypothetical_protein_MM_0563, CRISPR-associated protein Cas7/Csh2, subtype I-B/HMARI	cas8b1|587aa|down_3|NC_014410.1_2651622_2653383_-	pfam09484, Cas_TM1802, CRISPR-associated protein TM1802 (cas_TM1802)	cas6|247aa|down_4|NC_014410.1_2653398_2654139_-	TIGR01877, CRISPR-associated_endoribonuclease_Cas6_1, CRISPR-associated endoribonuclease Cas6	csm2gr11|122aa|down_5|NC_014410.1_2654359_2654725_-	NA	csm3gr7|285aa|down_6|NC_014410.1_2654738_2655593_-	TIGR03986, CRISPR-associated_protein, CRISPR-associated protein	csm3gr7|260aa|down_7|NC_014410.1_2655579_2656359_-	cd09683, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	csm3gr7|250aa|down_8|NC_014410.1_2656351_2657101_-	cd09683, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	csm2gr11|150aa|down_9|NC_014410.1_2657128_2657578_-	NA
GCF_000145615.1_ASM14561v1	NC_014410	Thermoanaerobacterium thermosaccharolyticum DSM 571, complete genome	5	2723692-2726373	5,5,5	PILER-CR,CRISPRCasFinder,CRT	no	cas6,cas2,cas1,cas4,cas5,cas7,cas8a4,cas3	RT,cas3,cas14j,cas4,csa3,WYL,DinG,csx1,cmr1gr7,cas10,cmr3gr5,csm6,cmr4gr7,cmr5gr11,cmr6gr7,DEDDh,cas2,cas1,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,csx20,cas8a4	Unclear	GTTTCAATTCCACTATGGTTAGATTAAATC,GTTTCAATTCCACTATGGTTAGATTAAATC,GTTTCAATTCCACTATGGTTAGATTAAATC	30,30,30	0	0	NA	NA	I-A,II-B,III-A:I-A,II-B,III-A:I-A,II-B,III-A	40,40,40	40	Unclear	RT,cas3,cas14j,cas4,csa3,WYL,DinG,csx1,cmr1gr7,cas10,cmr3gr5,csm6,cmr4gr7,cmr5gr11,cmr6gr7,DEDDh,cas2,cas1,cas5,cas7,cas8b1,cas6,csm2gr11,csm3gr7,csx10gr5,csx20,cas8a4	NA,cas5|239aa|down_4|NC_014410.1_2729215_2729932_-,cas8a4|602aa|down_6|NC_014410.1_2730938_2732744_-,NA|224aa|down_9|NC_014410.1_2736648_2737320_-	NA|233aa|up_9|NC_014410.1_2711920_2712619_-	COG0745, OmpR, Response regulators consisting of a CheY-like receiver domain and a winged-helix DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|272aa|up_8|NC_014410.1_2712625_2713441_-	pfam13485, Peptidase_MA_2, Peptidase MA superfamily	NA|422aa|up_7|NC_014410.1_2713600_2714866_-	pfam01551, Peptidase_M23, Peptidase family M23	NA|324aa|up_6|NC_014410.1_2715052_2716024_+	pfam07261, DnaB_2, Replication initiation and membrane attachment	NA|327aa|up_5|NC_014410.1_2716016_2716997_+	PRK06835, PRK06835, DNA replication protein DnaC; Validated	NA|481aa|up_4|NC_014410.1_2716993_2718436_-	cd09604, M1_APN_like, Peptidase M1 family similar to aminopeptidase N catalytic domain	NA|204aa|up_3|NC_014410.1_2718576_2719188_+	TIGR02840, conserved_hypothetical_protein, putative sporulation protein YtaF	NA|253aa|up_2|NC_014410.1_2719486_2720245_-	pfam07833, Cu_amine_oxidN1, Copper amine oxidase N-terminal domain	NA|413aa|up_1|NC_014410.1_2720600_2721839_-	pfam01548, DEDD_Tnp_IS110, Transposase	NA|458aa|up_0|NC_014410.1_2722141_2723515_-	pfam13546, DDE_5, DDE superfamily endonuclease	cas6|252aa|down_0|NC_014410.1_2726614_2727370_-	cd09759, Cas6_I-A, CRISPR/Cas system-associated RAMP superfamily protein Cas6	cas2|88aa|down_1|NC_014410.1_2727380_2727644_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|331aa|down_2|NC_014410.1_2727645_2728638_-	TIGR03641, cas1_HMARI, CRISPR-associated endonuclease Cas1, subtype I-B/HMARI/TNEAP	cas4|164aa|down_3|NC_014410.1_2728649_2729141_-	pfam01930, Cas_Cas4, Domain of unknown function DUF83	cas5|239aa|down_4|NC_014410.1_2729215_2729932_-	NA	cas7|322aa|down_5|NC_014410.1_2729953_2730919_-	pfam01905, DevR, CRISPR-associated negative auto-regulator DevR/Csa2	cas8a4|602aa|down_6|NC_014410.1_2730938_2732744_-	NA	cas3|804aa|down_7|NC_014410.1_2732733_2735145_-	COG1203, COG1203, CRISPR-associated helicase Cas3 [Defense mechanisms]	NA|351aa|down_8|NC_014410.1_2735494_2736547_+	pfam07854, DUF1646, Protein of unknown function (DUF1646)	NA|224aa|down_9|NC_014410.1_2736648_2737320_-	NA
