assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000827125.1_ASM82712v1	NZ_CP010311	Geoalkalibacter subterraneus strain Red1 chromosome, complete genome	1	1369072-1372389	1,1,1,2	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no	cas3,cas5,cas8c,cas7,cas4,cas1,cas2	csa3,WYL,cas3,cas5,cas8c,cas7,cas4,cas1,cas2,cas6,Cas9_archaeal,DinG,RT	Type I-U, Type I-U?,Type I-C	GTCGCCCCCCGTGCGGGGGCGTGGATTGAAAC,GTCGCCCCCCGTGCGGGGGCGTGGATTGAAAC,GTCGCCCCCCGTGCGGGGGCGTGGATTGAAAC,GTCGCCCCCCGTGCGGGGGCGTGGATTGAAAC	32,32,32,32	1	1	1372261-1372292	NZ_CP010311.1_3417950-3417981	I-C:I-C:I-C:I-C	48,50,50,48	50	TypeI-U,TypeI-U?,TypeI-C	csa3,WYL,cas3,cas5,cas8c,cas7,cas4,cas1,cas2,cas6,Cas9_archaeal,DinG,RT,c2c9_V-U4,cas14k,Cas14u_CAS-V,cas14i,cas14j,csf5gr6,csf1gr8,csf2gr7,csf3gr5	NA,NA|121aa|down_2|NZ_CP010311.1_1373678_1374041_+	NA|297aa|up_9|NZ_CP010311.1_1357127_1358018_+	COG0142, IspA, Geranylgeranyl pyrophosphate synthase [Coenzyme metabolism]	NA|624aa|up_8|NZ_CP010311.1_1358053_1359925_+	PRK05444, PRK05444, 1-deoxy-D-xylulose-5-phosphate synthase; Provisional	cas3|731aa|up_7|NZ_CP010311.1_1360372_1362565_+	cd17930, DEXHc_cas3, DEXH/Q-box helicase domain of Cas3	cas5|222aa|up_6|NZ_CP010311.1_1362595_1363261_+	cd09752, Cas5_I-C, CRISPR/Cas system-associated RAMP superfamily protein Cas5	cas8c|584aa|up_5|NZ_CP010311.1_1363257_1365009_+	cd09757, Cas8c_I-C, CRISPR/Cas system-associated protein Cas8c	cas7|287aa|up_4|NZ_CP010311.1_1365012_1365873_+	pfam05107, Cas_Cas7, CRISPR-associated protein Cas7	NA|289aa|up_3|NZ_CP010311.1_1366038_1366905_+	pfam13646, HEAT_2, HEAT repeats	cas4|225aa|up_2|NZ_CP010311.1_1366963_1367638_+	TIGR00372, conserved_hypothetical_protein, CRISPR-associated protein Cas4	cas1|344aa|up_1|NZ_CP010311.1_1367582_1368614_+	TIGR03640, cas1_DVULG, CRISPR-associated endonuclease Cas1, subtype I-C/DVULG	cas2|97aa|up_0|NZ_CP010311.1_1368616_1368907_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|114aa|down_0|NZ_CP010311.1_1373067_1373409_+	TIGR02683, Uncharacterized_protein_HI_1419, putative addiction module killer protein	NA|104aa|down_1|NZ_CP010311.1_1373401_1373713_+	COG3636, COG3636, Predicted transcriptional regulator [Transcription]	NA|121aa|down_2|NZ_CP010311.1_1373678_1374041_+	NA	NA|368aa|down_3|NZ_CP010311.1_1374512_1375616_-	pfam04986, Y2_Tnp, Putative transposase	NA|294aa|down_4|NZ_CP010311.1_1375608_1376490_-	cd01193, INT_IntI_C, Integron integrase and similar protiens, C-terminal catalytic domain	NA|221aa|down_5|NZ_CP010311.1_1376740_1377403_-	pfam07589, VPEP, PEP-CTERM motif	NA|57aa|down_6|NZ_CP010311.1_1378371_1378542_+	COG5487, COG5487, Small integral membrane protein [Function unknown]	NA|416aa|down_7|NZ_CP010311.1_1378773_1380021_-	TIGR00275, TIGR00275, flavoprotein, HI0933 family	NA|138aa|down_8|NZ_CP010311.1_1380073_1380487_-	PRK09256, PRK09256, aminoacyl-tRNA hydrolase	NA|484aa|down_9|NZ_CP010311.1_1380895_1382347_-	TIGR00785, Uncharacterized_transporter_HI_0020, anion transporter
GCF_000827125.1_ASM82712v1	NZ_CP010311	Geoalkalibacter subterraneus strain Red1 chromosome, complete genome	2	3133024-3133154	2	CRISPRCasFinder	no		csa3,WYL,cas3,cas5,cas8c,cas7,cas4,cas1,cas2,cas6,Cas9_archaeal,DinG,RT	Orphan	GGCATAAGGGGACGCTGGTAACTTATG	27	1	1	3133051-3133075	NZ_CP010311.1_3230665-3230689	NA	2	2	Orphan	csa3,WYL,cas3,cas5,cas8c,cas7,cas4,cas1,cas2,cas6,Cas9_archaeal,DinG,RT,c2c9_V-U4,cas14k,Cas14u_CAS-V,cas14i,cas14j,csf5gr6,csf1gr8,csf2gr7,csf3gr5	NA|193aa|up_5|NZ_CP010311.1_3126140_3126719_+,NA|132aa|up_3|NZ_CP010311.1_3128765_3129161_-,NA	NA|246aa|up_9|NZ_CP010311.1_3122363_3123101_-	COG0580, GlpF, Glycerol uptake facilitator and related permeases (Major Intrinsic Protein Family) [Carbohydrate transport and metabolism]	NA|68aa|up_8|NZ_CP010311.1_3123253_3123457_-	COG4855, COG4855, Uncharacterized protein conserved in archaea [Function unknown]	NA|538aa|up_7|NZ_CP010311.1_3123467_3125081_-	PLN02464, PLN02464, glycerol-3-phosphate dehydrogenase	NA|261aa|up_6|NZ_CP010311.1_3125305_3126088_+	PRK10906, PRK10906, DeoR/GlpR family transcriptional regulator	NA|193aa|up_5|NZ_CP010311.1_3126140_3126719_+	NA	NA|638aa|up_4|NZ_CP010311.1_3126751_3128665_-	COG2905, COG2905, Predicted signal-transduction protein containing cAMP-binding and CBS domains [Signal transduction mechanisms]	NA|132aa|up_3|NZ_CP010311.1_3128765_3129161_-	NA	NA|605aa|up_2|NZ_CP010311.1_3129334_3131149_-	TIGR03648, Na_symport_lg, probable sodium:solute symporter, VC_2705 subfamily	NA|85aa|up_1|NZ_CP010311.1_3131162_3131417_-	TIGR03647, Na_symport_sm, putative solute:sodium symporter small subunit	NA|260aa|up_0|NZ_CP010311.1_3131908_3132688_-	COG1414, IclR, Transcriptional regulator [Transcription]	NA|224aa|down_0|NZ_CP010311.1_3134437_3135109_-	PRK10710, PRK10710, DNA-binding transcriptional regulator BaeR; Provisional	NA|472aa|down_1|NZ_CP010311.1_3135105_3136521_-	PRK10549, PRK10549, two-component system sensor histidine kinase BaeS	NA|172aa|down_2|NZ_CP010311.1_3136908_3137424_+	cd09916, CpxP_like, CpxP component of the bacterial Cpx-two-component system and related proteins	NA|79aa|down_3|NZ_CP010311.1_3137534_3137771_-	pfam01934, DUF86, Protein of unknown function DUF86	NA|93aa|down_4|NZ_CP010311.1_3137758_3138037_-	pfam18765, Polbeta, Polymerase beta, Nucleotidyltransferase	NA|698aa|down_5|NZ_CP010311.1_3138299_3140393_+	pfam02810, SEC-C, SEC-C motif	NA|509aa|down_6|NZ_CP010311.1_3140531_3142058_+	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|514aa|down_7|NZ_CP010311.1_3142154_3143696_-	pfam09820, AAA-ATPase_like, Predicted AAA-ATPase	NA|137aa|down_8|NZ_CP010311.1_3143929_3144340_-	pfam01934, DUF86, Protein of unknown function DUF86	NA|132aa|down_9|NZ_CP010311.1_3144329_3144725_-	pfam18765, Polbeta, Polymerase beta, Nucleotidyltransferase
GCF_000827125.1_ASM82712v1	NZ_CP010311	Geoalkalibacter subterraneus strain Red1 chromosome, complete genome	3	3260585-3260653	3	CRISPRCasFinder	no		csa3,WYL,cas3,cas5,cas8c,cas7,cas4,cas1,cas2,cas6,Cas9_archaeal,DinG,RT	Orphan	AATCTTTAAGTGGGTGTCCTATAGA	25	0	0	NA	NA	NA	1	1	Orphan	csa3,WYL,cas3,cas5,cas8c,cas7,cas4,cas1,cas2,cas6,Cas9_archaeal,DinG,RT,c2c9_V-U4,cas14k,Cas14u_CAS-V,cas14i,cas14j,csf5gr6,csf1gr8,csf2gr7,csf3gr5	NA|369aa|up_9|NZ_CP010311.1_3249754_3250861_-,NA|227aa|up_5|NZ_CP010311.1_3253021_3253702_-,NA|227aa|up_3|NZ_CP010311.1_3254955_3255636_-,NA|369aa|up_0|NZ_CP010311.1_3259452_3260559_-,NA|375aa|down_7|NZ_CP010311.1_3267944_3269069_-	NA|369aa|up_9|NZ_CP010311.1_3249754_3250861_-	NA	NA|76aa|up_8|NZ_CP010311.1_3250964_3251192_-	pfam07878, RHH_5, CopG-like RHH_1 or ribbon-helix-helix domain, RHH_5	NA|98aa|up_7|NZ_CP010311.1_3251654_3251948_-	pfam05016, ParE_toxin, ParE toxin of type II toxin-antitoxin system, parDE	NA|91aa|up_6|NZ_CP010311.1_3251935_3252208_-	COG3905, COG3905, Predicted transcriptional regulator [Transcription]	NA|227aa|up_5|NZ_CP010311.1_3253021_3253702_-	NA	NA|356aa|up_4|NZ_CP010311.1_3253743_3254811_-	pfam14236, DUF4338, Domain of unknown function (DUF4338)	NA|227aa|up_3|NZ_CP010311.1_3254955_3255636_-	NA	NA|356aa|up_2|NZ_CP010311.1_3255677_3256745_-	pfam14236, DUF4338, Domain of unknown function (DUF4338)	NA|565aa|up_1|NZ_CP010311.1_3257144_3258839_-	pfam01609, DDE_Tnp_1, Transposase DDE domain	NA|369aa|up_0|NZ_CP010311.1_3259452_3260559_-	NA	NA|99aa|down_0|NZ_CP010311.1_3261160_3261457_-	COG2026, RelE, Cytotoxic translational repressor of toxin-antitoxin stability system [Translation, ribosomal structure and biogenesis / Cell division and chromosome partitioning]	NA|76aa|down_1|NZ_CP010311.1_3261437_3261665_-	pfam07878, RHH_5, CopG-like RHH_1 or ribbon-helix-helix domain, RHH_5	NA|409aa|down_2|NZ_CP010311.1_3262444_3263671_-	cd03794, GT4_WbuB-like, Escherichia coli WbuB and similar proteins	NA|355aa|down_3|NZ_CP010311.1_3263731_3264796_-	cd03786, GTB_UDP-GlcNAc_2-Epimerase, UDP-N-acetylglucosamine 2-epimerase and similar proteins	NA|370aa|down_4|NZ_CP010311.1_3264801_3265911_-	cd03794, GT4_WbuB-like, Escherichia coli WbuB and similar proteins	NA|310aa|down_5|NZ_CP010311.1_3265907_3266837_-	pfam06662, C5-epim_C, D-glucuronyl C5-epimerase C-terminus	NA|378aa|down_6|NZ_CP010311.1_3266814_3267948_-	cd03794, GT4_WbuB-like, Escherichia coli WbuB and similar proteins	NA|375aa|down_7|NZ_CP010311.1_3267944_3269069_-	NA	NA|481aa|down_8|NZ_CP010311.1_3269472_3270915_-	cd13127, MATE_tuaB_like, Uncharacterized subfamily of the multidrug and toxic compound extrusion (MATE) proteins	NA|384aa|down_9|NZ_CP010311.1_3270904_3272056_-	cd00616, AHBA_syn, 3-amino-5-hydroxybenzoic acid synthase family (AHBA_syn)
GCF_000827125.1_ASM82712v1	NZ_CP010312	Geoalkalibacter subterraneus strain Red1 plasmid pGSUB1, complete sequence	1	115445-115561	1	CRISPRCasFinder	no	Cas9_archaeal	c2c9_V-U4,cas14k,Cas14u_CAS-V,cas14i,RT,Cas9_archaeal,cas14j,csf5gr6,csf1gr8,csf2gr7,csf3gr5,DinG	 Type II-B,Type II-A, or Type II-C?	GAGGGCCCAAATGGGCCCGCTAGAGGGCCCAAATGGGCCCTCG	43	0	0	NA	NA	NA	1	1	TypeII-A,TypeII-B,orTypeII-C?	csa3,WYL,cas3,cas5,cas8c,cas7,cas4,cas1,cas2,cas6,Cas9_archaeal,DinG,RT,c2c9_V-U4,cas14k,Cas14u_CAS-V,cas14i,cas14j,csf5gr6,csf1gr8,csf2gr7,csf3gr5	NA|118aa|up_9|NZ_CP010312.1_108488_108842_+,NA|95aa|up_7|NZ_CP010312.1_109520_109805_+,NA|54aa|up_6|NZ_CP010312.1_109862_110024_+,NA|174aa|up_3|NZ_CP010312.1_111628_112150_+,NA|159aa|down_0|NZ_CP010312.1_116158_116635_+,NA|64aa|down_4|NZ_CP010312.1_120721_120913_+,NA|83aa|down_5|NZ_CP010312.1_120899_121148_+,NA|145aa|down_8|NZ_CP010312.1_124373_124808_+	NA|118aa|up_9|NZ_CP010312.1_108488_108842_+	NA	NA|175aa|up_8|NZ_CP010312.1_108819_109344_+	pfam05280, FlhC, Flagellar transcriptional activator (FlhC)	NA|95aa|up_7|NZ_CP010312.1_109520_109805_+	NA	NA|54aa|up_6|NZ_CP010312.1_109862_110024_+	NA	NA|154aa|up_5|NZ_CP010312.1_109995_110457_+	pfam07291, MauE, Methylamine utilisation protein MauE	NA|258aa|up_4|NZ_CP010312.1_110837_111611_+	COG1192, Soj, ATPases involved in chromosome partitioning [Cell division and chromosome partitioning]	NA|174aa|up_3|NZ_CP010312.1_111628_112150_+	NA	NA|109aa|up_2|NZ_CP010312.1_112905_113232_+	PRK09330, PRK09330, cell division protein FtsZ; Validated	NA|166aa|up_1|NZ_CP010312.1_113634_114132_-	smart00318, SNc, Staphylococcal nuclease homologues	NA|325aa|up_0|NZ_CP010312.1_114437_115412_-	cd10227, ParM_like, Plasmid segregation protein ParM and similar proteins	NA|159aa|down_0|NZ_CP010312.1_116158_116635_+	NA	NA|429aa|down_1|NZ_CP010312.1_116637_117924_+	pfam08346, AntA, AntA/AntB antirepressor	NA|699aa|down_2|NZ_CP010312.1_118066_120163_+	PRK10917, PRK10917, ATP-dependent DNA helicase RecG; Provisional	NA|110aa|down_3|NZ_CP010312.1_120257_120587_+	PRK07395, PRK07395, L-aspartate oxidase; Provisional	NA|64aa|down_4|NZ_CP010312.1_120721_120913_+	NA	NA|83aa|down_5|NZ_CP010312.1_120899_121148_+	NA	NA|612aa|down_6|NZ_CP010312.1_121210_123046_+	COG0286, HsdM, Type I restriction-modification system methyltransferase subunit [Defense mechanisms]	NA|445aa|down_7|NZ_CP010312.1_123042_124377_+	cd17283, RMtype1_S_Hpy180ORF7835P_TRD2-CR2_like, Type I restriction-modification system specificity (S) subunit Target Recognition Domain-ConseRved domain (TRD-CR), similar to Helicobacter pylori SJM180 S subunit (S	NA|145aa|down_8|NZ_CP010312.1_124373_124808_+	NA	NA|1046aa|down_9|NZ_CP010312.1_124819_127957_+	COG0610, COG0610, Type I site-specific restriction-modification system, R (restriction) subunit and related helicases [Defense mechanisms]
GCF_000827125.1_ASM82712v1	NZ_CP010312	Geoalkalibacter subterraneus strain Red1 plasmid pGSUB1, complete sequence	2	160059-161201	1,2,1	PILER-CR,CRISPRCasFinder,CRT	no	cas14j,csf5gr6,csf1gr8,csf2gr7,csf3gr5,DinG	c2c9_V-U4,cas14k,Cas14u_CAS-V,cas14i,RT,Cas9_archaeal,cas14j,csf5gr6,csf1gr8,csf2gr7,csf3gr5,DinG	Type IV-A	GTTGTAATAAGCTGTAAAGTGTTGCGGCTTTGGAAA,GTTGTAATAAGCTGTAAAGTGTTGCGGCTTTGGAAAC,GTTGTAATAAGCTGTAANAGTNTTGCGGCTTTGGAAAN	36,37,38	3	3	160095-160131|160096-160131|160691-160727	NZ_CP010311.1_3429041-3429005|NZ_CP010311.1_3429040-3429005|NZ_CP010311.1_2124882-2124846	NA:NA:NA	11,12,15	15	TypeV,TypeIV-A	csa3,WYL,cas3,cas5,cas8c,cas7,cas4,cas1,cas2,cas6,Cas9_archaeal,DinG,RT,c2c9_V-U4,cas14k,Cas14u_CAS-V,cas14i,cas14j,csf5gr6,csf1gr8,csf2gr7,csf3gr5	NA|104aa|up_7|NZ_CP010312.1_152885_153197_+,NA|213aa|up_5|NZ_CP010312.1_154883_155522_+,csf5gr6|237aa|up_3|NZ_CP010312.1_156528_157239_+,NA|205aa|down_1|NZ_CP010312.1_163251_163866_+,NA|219aa|down_2|NZ_CP010312.1_163875_164532_+,NA|200aa|down_6|NZ_CP010312.1_167939_168539_+,NA|125aa|down_7|NZ_CP010312.1_168554_168929_+,NA|112aa|down_8|NZ_CP010312.1_169034_169370_+,NA|234aa|down_9|NZ_CP010312.1_169389_170091_+	NA|219aa|up_9|NZ_CP010312.1_150101_150758_+	smart00318, SNc, Staphylococcal nuclease homologues	NA|135aa|up_8|NZ_CP010312.1_152154_152559_+	cd06554, ASCH_ASC-1_like, ASC-1 homology domain, ASC-1-like subfamily	NA|104aa|up_7|NZ_CP010312.1_152885_153197_+	NA	NA|460aa|up_6|NZ_CP010312.1_153489_154869_+	cd01713, PAPS_reductase, This domain is found in phosphoadenosine phosphosulphate (PAPS) reductase enzymes or PAPS sulphotransferase	NA|213aa|up_5|NZ_CP010312.1_154883_155522_+	NA	NA|317aa|up_4|NZ_CP010312.1_155547_156498_+	COG0286, HsdM, Type I restriction-modification system methyltransferase subunit [Defense mechanisms]	csf5gr6|237aa|up_3|NZ_CP010312.1_156528_157239_+	NA	csf1gr8|259aa|up_2|NZ_CP010312.1_157228_158005_+	cd09705, Csf1_U, CRISPR/Cas system-associated protein Csf1	csf2gr7|375aa|up_1|NZ_CP010312.1_158035_159160_+	cd09706, Csf2_U, CRISPR/Cas system-associated RAMP superfamily protein Csf2	csf3gr5|238aa|up_0|NZ_CP010312.1_159159_159873_+	cd09707, Csf3_U, CRISPR/Cas system-associated RAMP superfamily protein Csf3	DinG|632aa|down_0|NZ_CP010312.1_161224_163120_+	TIGR03117, cas_csf4, CRISPR type AFERR-associated DEAD/DEAH-box helicase Csf4	NA|205aa|down_1|NZ_CP010312.1_163251_163866_+	NA	NA|219aa|down_2|NZ_CP010312.1_163875_164532_+	NA	cas14j|385aa|down_3|NZ_CP010312.1_165269_166424_-	COG0675, COG0675, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|136aa|down_4|NZ_CP010312.1_166447_166855_+	pfam01797, Y1_Tnp, Transposase IS200 like	NA|292aa|down_5|NZ_CP010312.1_166896_167772_-	pfam07042, TrfA, TrfA protein	NA|200aa|down_6|NZ_CP010312.1_167939_168539_+	NA	NA|125aa|down_7|NZ_CP010312.1_168554_168929_+	NA	NA|112aa|down_8|NZ_CP010312.1_169034_169370_+	NA	NA|234aa|down_9|NZ_CP010312.1_169389_170091_+	NA
