assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCA_900638105.1_56433_A01	LR134490	Haemophilus influenzae strain NCTC11873 genome assembly, chromosome: 1	1	408472-408570	1	CRISPRCasFinder	no		cas3,DinG,DEDDh,csx1,csx16,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,WYL,csa3	Orphan	ACGATTGTTTGATGGTGGGCTGAAGCCCACCCTACAA	37	0	0	NA	NA	NA	1	1	Orphan	cas3,DinG,DEDDh,csx1,csx16,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,WYL,csa3	NA|56aa|up_9|LR134490.1_400276_400444_-,NA	NA|56aa|up_9|LR134490.1_400276_400444_-	NA	NA|145aa|up_8|LR134490.1_400708_401143_-	PRK05273, PRK05273, D-tyrosyl-tRNA(Tyr) deacylase; Provisional	NA|147aa|up_7|LR134490.1_401139_401580_-	PRK09004, PRK09004, FMN-binding protein MioC; Provisional	NA|73aa|up_6|LR134490.1_401676_401895_-	COG3074, COG3074, Uncharacterized protein conserved in bacteria [Function unknown]	NA|334aa|up_5|LR134490.1_402056_403058_+	TIGR00330, Fructose-16-bisphosphatase_class_2, fructose-1,6-bisphosphatase, class II	NA|103aa|up_4|LR134490.1_403257_403566_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|107aa|up_3|LR134490.1_403553_403874_+	COG3550, HipA, Toxin module HipA, protein kinase of phosphatidylinositol 3/4-kinase superfamily [General function prediction only]	NA|344aa|up_2|LR134490.1_403870_404902_+	COG3550, HipA, Toxin module HipA, protein kinase of phosphatidylinositol 3/4-kinase superfamily [General function prediction only]	NA|553aa|up_1|LR134490.1_404985_406644_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|582aa|up_0|LR134490.1_406636_408382_-	COG4988, CydD, ABC-type transport system involved in cytochrome bd biosynthesis, ATPase and permease components [Energy production and conversion / Posttranslational modification, protein turnover, chaperones]	NA|1002aa|down_0|LR134490.1_408751_411757_+	TIGR01786, hemoglobin-haptoglobin-binding_protein, TonB-dependent hemoglobin/transferrin/lactoferrin receptor family protein	NA|99aa|down_1|LR134490.1_412077_412374_+	pfam01381, HTH_3, Helix-turn-helix	NA|639aa|down_2|LR134490.1_412557_414474_+	PRK10636, PRK10636, putative ABC transporter ATP-binding protein; Provisional	NA|183aa|down_3|LR134490.1_414483_415032_+	COG0551, TopA, Zn-finger domain associated with topoisomerase type I [DNA replication, recombination, and repair]	NA|184aa|down_4|LR134490.1_415047_415599_+	PRK10634, PRK10634, L-threonylcarbamoyladenylate synthase type 1 TsaC	NA|273aa|down_5|LR134490.1_415602_416421_+	TIGR00507, Shikimate_dehydrogenase, shikimate dehydrogenase	NA|188aa|down_6|LR134490.1_416417_416981_+	pfam03352, Adenine_glyco, Methyladenine glycosylase	NA|255aa|down_7|LR134490.1_416977_417742_-	cd02511, Beta4Glucosyltransferase, UDP-glucose LOS-beta-1,4 glucosyltransferase is required for biosynthesis of lipooligosaccharide	NA|428aa|down_8|LR134490.1_417804_419088_+	PRK05749, PRK05749, 3-deoxy-D-manno-octulosonic-acid transferase; Reviewed	NA|157aa|down_9|LR134490.1_419084_419555_+	PRK00168, coaD, phosphopantetheine adenylyltransferase; Provisional
GCA_900638105.1_56433_A01	LR134490	Haemophilus influenzae strain NCTC11873 genome assembly, chromosome: 1	2	1049510-1049614	2	CRISPRCasFinder	no	csx1,csx16,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1	cas3,DinG,DEDDh,csx1,csx16,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,WYL,csa3	Type III-A,Type III-C,Type III-D,Type III-B	AATCCCTTTGGAACAGGGCAATGTCTTTCGACA	33	0	0	NA	NA	NA	1	1	TypeIII-A,TypeIII-C,TypeIII-D,TypeIII-B	cas3,DinG,DEDDh,csx1,csx16,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,WYL,csa3	NA|85aa|up_5|LR134490.1_1044795_1045050_-,NA|34aa|down_9|LR134490.1_1061421_1061523_+	NA|426aa|up_9|LR134490.1_1040059_1041337_+	PRK09225, PRK09225, threonine synthase; Validated	NA|370aa|up_8|LR134490.1_1042185_1043295_+	PRK08247, PRK08247, methionine biosynthesis PLP-dependent protein	NA|332aa|up_7|LR134490.1_1043307_1044303_+	cd12183, LDH_like_2, D-Lactate and related Dehydrogenases, NAD-binding and catalytic domains	NA|108aa|up_6|LR134490.1_1044422_1044746_+	TIGR01068, Thioredoxin-like_protein_slr0233, thioredoxin	NA|85aa|up_5|LR134490.1_1044795_1045050_-	NA	NA|89aa|up_4|LR134490.1_1045025_1045292_-	COG1960, CaiA, Acyl-CoA dehydrogenases [Lipid metabolism]	NA|263aa|up_3|LR134490.1_1045549_1046338_-	COG0084, TatD, Mg-dependent DNase [DNA replication, recombination, and repair]	NA|170aa|up_2|LR134490.1_1046392_1046902_-	PRK10791, PRK10791, peptidylprolyl isomerase B	NA|460aa|up_1|LR134490.1_1047004_1048384_+	PRK00260, cysS, cysteinyl-tRNA synthetase; Validated	NA|287aa|up_0|LR134490.1_1048544_1049405_-	COG1946, TesB, Acyl-CoA thioesterase [Lipid metabolism]	csx1|387aa|down_0|LR134490.1_1050750_1051911_-	cd09741, Csx1_III-U, CRISPR/Cas system-associated protein Csx1	csx1|391aa|down_1|LR134490.1_1051918_1053091_-	pfam09002, DUF1887, Domain of unknown function (DUF1887)	csx16|97aa|down_2|LR134490.1_1053100_1053391_-	pfam09652, Cas_VVA1548, Putative CRISPR-associated protein (Cas_VVA1548)	cas6|307aa|down_3|LR134490.1_1053449_1054370_-	pfam10040, CRISPR_Cas6, CRISPR-associated endoribonuclease Cas6	csm5gr7|518aa|down_4|LR134490.1_1054369_1055923_-	pfam03787, RAMPs, RAMP superfamily	csm4gr5|313aa|down_5|LR134490.1_1055919_1056858_-	cd09663, Csm4_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm4	csm3gr7|231aa|down_6|LR134490.1_1056867_1057560_-	cd09684, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	csm2gr11|130aa|down_7|LR134490.1_1057576_1057966_-	pfam03750, Csm2_III-A, Csm2 Type III-A	cas10|724aa|down_8|LR134490.1_1057975_1060147_-	cd09680, Cas10_III, CRISPR/Cas system-associated protein Cas10	NA|34aa|down_9|LR134490.1_1061421_1061523_+	NA
GCA_900638105.1_56433_A01	LR134490	Haemophilus influenzae strain NCTC11873 genome assembly, chromosome: 1	3	1063578-1064179	1,3,1	PILER-CR,CRISPRCasFinder,CRT	no	csx1,csx16,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1	cas3,DinG,DEDDh,csx1,csx16,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,WYL,csa3	Type III-A,Type III-C,Type III-D,Type III-B	GTCGAAAGACATTGCCCTGTTCCAAAGGGATTGAGAC,GTCGAAAGACATTGCCCTGTTCCAAAGGGATTGAGAC,GTCGAAAGACATTGCCCTGTTCCAAAGGGATTGAGAC	37,37,37	0	0	NA	NA	NA:NA:NA	6,7,8	8	TypeIII-A,TypeIII-C,TypeIII-D,TypeIII-B	cas3,DinG,DEDDh,csx1,csx16,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,WYL,csa3	NA|34aa|up_3|LR134490.1_1061421_1061523_+,NA|121aa|down_2|LR134490.1_1066497_1066860_+,NA|86aa|down_3|LR134490.1_1066933_1067191_+,NA|210aa|down_4|LR134490.1_1067165_1067795_+	cas6|307aa|up_9|LR134490.1_1053449_1054370_-	pfam10040, CRISPR_Cas6, CRISPR-associated endoribonuclease Cas6	csm5gr7|518aa|up_8|LR134490.1_1054369_1055923_-	pfam03787, RAMPs, RAMP superfamily	csm4gr5|313aa|up_7|LR134490.1_1055919_1056858_-	cd09663, Csm4_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm4	csm3gr7|231aa|up_6|LR134490.1_1056867_1057560_-	cd09684, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	csm2gr11|130aa|up_5|LR134490.1_1057576_1057966_-	pfam03750, Csm2_III-A, Csm2 Type III-A	cas10|724aa|up_4|LR134490.1_1057975_1060147_-	cd09680, Cas10_III, CRISPR/Cas system-associated protein Cas10	NA|34aa|up_3|LR134490.1_1061421_1061523_+	NA	cas2|95aa|up_2|LR134490.1_1061723_1062008_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|357aa|up_1|LR134490.1_1062016_1063087_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	cas2|97aa|up_0|LR134490.1_1063097_1063388_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|155aa|down_0|LR134490.1_1064433_1064898_+	PRK06863, PRK06863, single-stranded DNA-binding protein; Provisional	NA|495aa|down_1|LR134490.1_1064912_1066397_+	cd17933, DEXSc_RecD-like, DEXS-box helicase domain of RecD and similar proteins	NA|121aa|down_2|LR134490.1_1066497_1066860_+	NA	NA|86aa|down_3|LR134490.1_1066933_1067191_+	NA	NA|210aa|down_4|LR134490.1_1067165_1067795_+	NA	NA|708aa|down_5|LR134490.1_1068367_1070491_-	PRK09263, PRK09263, anaerobic ribonucleoside triphosphate reductase; Provisional	NA|144aa|down_6|LR134490.1_1070771_1071203_+	TIGR01987, Uncharacterized_protein_HI_0074, nucleotidyltransferase substrate binding protein, HI0074 family	NA|115aa|down_7|LR134490.1_1071204_1071549_+	pfam01909, NTP_transf_2, Nucleotidyltransferase domain	NA|204aa|down_8|LR134490.1_1071561_1072173_-	PRK14150, PRK14150, heat shock protein GrpE; Provisional	NA|297aa|down_9|LR134490.1_1072272_1073163_+	PRK02231, ppnK, NAD(+) kinase
GCA_900638105.1_56433_A01	LR134490	Haemophilus influenzae strain NCTC11873 genome assembly, chromosome: 1	4	1190652-1190800	4	CRISPRCasFinder	no	DEDDh	cas3,DinG,DEDDh,csx1,csx16,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,WYL,csa3	Unclear	TTGGAGCGGGAAACGAGGCTCGAACTCGCGACCCCGACCTTGGCAAGGT	49	0	0	NA	NA	NA	1	1	Orphan	cas3,DinG,DEDDh,csx1,csx16,cas6,csm5gr7,csm4gr5,csm3gr7,csm2gr11,cas10,cas2,cas1,WYL,csa3	NA,NA	NA|246aa|up_9|LR134490.1_1178119_1178857_+	cd10800, LamB_YcsF_YbgL_like, Escherichia coli putative lactam utilization protein YbgL and similar proteins	NA|398aa|up_8|LR134490.1_1178900_1180094_+	COG1914, MntH, Mn2+ and Fe2+ transporters of the NRAMP family [Inorganic ion transport and metabolism]	NA|445aa|up_7|LR134490.1_1180164_1181499_-	PRK05370, PRK05370, argininosuccinate synthase; Validated	NA|291aa|up_6|LR134490.1_1181654_1182527_-	PRK13961, PRK13961, phosphoribosylaminoimidazole-succinocarboxamide synthase; Provisional	NA|782aa|up_5|LR134490.1_1182699_1185045_-	TIGR02071, Includes:_Penicillin-insensitive_transglycosylase, penicillin-binding protein 1B	NA|133aa|up_4|LR134490.1_1185051_1185450_-	COG3112, COG3112, Uncharacterized protein conserved in bacteria [Function unknown]	NA|115aa|up_3|LR134490.1_1185406_1185751_-	PRK13623, PRK13623, iron-sulfur cluster insertion protein ErpA; Provisional	NA|269aa|up_2|LR134490.1_1185886_1186693_+	PRK05716, PRK05716, methionine aminopeptidase; Validated	NA|864aa|up_1|LR134490.1_1186786_1189378_+	PRK01759, glnD, bifunctional uridylyltransferase/uridylyl-removing protein GlnD	NA|356aa|up_0|LR134490.1_1189452_1190520_+	TIGR02380, ECA_wecA, undecaprenyl-phosphate alpha-N-acetylglucosaminyl 1-phosphatetransferase	DEDDh|183aa|down_0|LR134490.1_1190921_1191470_-	PRK05359, PRK05359, oligoribonuclease; Provisional	NA|347aa|down_1|LR134490.1_1191540_1192581_+	PRK12288, PRK12288, small ribosomal subunit biogenesis GTPase RsgA	NA|86aa|down_2|LR134490.1_1192739_1192997_+	PRK10850, PRK10850, phosphocarrier protein Hpr	NA|576aa|down_3|LR134490.1_1193076_1194804_+	PRK11177, PRK11177, phosphoenolpyruvate-protein phosphotransferase PtsI	NA|167aa|down_4|LR134490.1_1194863_1195364_+	PRK09439, PRK09439, PTS system glucose-specific transporter subunit; Provisional	NA|71aa|down_5|LR134490.1_1195546_1195759_+	COG1482, ManA, Phosphomannose isomerase [Carbohydrate transport and metabolism]	NA|122aa|down_6|LR134490.1_1195873_1196239_+	TIGR00156, Uncharacterized_protein_HI_1709, TIGR00156 family protein	NA|222aa|down_7|LR134490.1_1196302_1196968_+	PRK10336, PRK10336, two-component system response regulator QseB	NA|85aa|down_8|LR134490.1_1196964_1197219_+	PRK10337, PRK10337, sensor protein QseC; Provisional	NA|340aa|down_9|LR134490.1_1197299_1198319_+	PRK10337, PRK10337, sensor protein QseC; Provisional
