assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000165525.1_ASM16552v1	NC_017451	Haemophilus influenzae R2866, complete genome	1	602240-602411	1	CRISPRCasFinder	no		cas3,DinG,cas14j,DEDDh,WYL	Orphan	ACAGTGGTTAATTTTTGTTCACTGTGCA	28	0	0	NA	NA	NA	2	2	Orphan	cas3,DinG,cas14j,DEDDh,WYL	NA|136aa|up_8|NC_017451.1_594309_594717_-,NA|408aa|down_0|NC_017451.1_602446_603670_-,NA|86aa|down_9|NC_017451.1_611743_612001_-	NA|157aa|up_9|NC_017451.1_593738_594209_-	PRK00024, PRK00024, DNA repair protein RadC	NA|136aa|up_8|NC_017451.1_594309_594717_-	NA	NA|214aa|up_7|NC_017451.1_594751_595393_-	pfam12083, DUF3560, Domain of unknown function (DUF3560)	NA|143aa|up_6|NC_017451.1_595507_595936_-	pfam12101, DUF3577, Protein of unknown function (DUF3577)	NA|682aa|up_5|NC_017451.1_596820_598866_-	PRK07726, PRK07726, DNA topoisomerase 3	NA|186aa|up_4|NC_017451.1_598956_599514_+	cd16389, FIN, fertility inhibition factors, including OSA and FiwA, related to the ParB/Srx superfamily	NA|173aa|up_3|NC_017451.1_599729_600248_-	pfam08139, LPAM_1, Prokaryotic membrane lipoprotein lipid attachment site	NA|141aa|up_2|NC_017451.1_600274_600697_-	PRK06863, PRK06863, single-stranded DNA-binding protein; Provisional	NA|158aa|up_1|NC_017451.1_600942_601416_-	pfam11358, DUF3158, Protein of unknown function (DUF3158)	NA|252aa|up_0|NC_017451.1_601430_602186_-	TIGR03761, ICE_PFL4669, integrating conjugative element protein, PFL_4669 family	NA|408aa|down_0|NC_017451.1_602446_603670_-	NA	NA|184aa|down_1|NC_017451.1_603819_604371_-	pfam11198, DUF2857, Protein of unknown function (DUF2857)	NA|567aa|down_2|NC_017451.1_604370_606071_-	TIGR03764, ICE_PFGI_1_parB, integrating conjugative element, PFGI_1 class, ParB family protein	NA|452aa|down_3|NC_017451.1_606063_607419_-	TIGR00665, DnaB, replicative DNA helicase	NA|279aa|down_4|NC_017451.1_607420_608257_-	COG1192, Soj, ATPases involved in chromosome partitioning [Cell division and chromosome partitioning]	NA|382aa|down_5|NC_017451.1_608812_609958_+	PRK08247, PRK08247, methionine biosynthesis PLP-dependent protein	NA|332aa|down_6|NC_017451.1_609970_610966_+	cd12183, LDH_like_2, D-Lactate and related Dehydrogenases, NAD-binding and catalytic domains	NA|108aa|down_7|NC_017451.1_611085_611409_+	TIGR01068, Thioredoxin-like_protein_slr0233, thioredoxin	NA|123aa|down_8|NC_017451.1_611364_611733_-	cd03311, CIMS_C_terminal_like, CIMS - Cobalamine-independent methonine synthase, or MetE, C-terminal domain_like	NA|86aa|down_9|NC_017451.1_611743_612001_-	NA
GCF_000165525.1_ASM16552v1	NC_017451	Haemophilus influenzae R2866, complete genome	2	741215-741363	2	CRISPRCasFinder	no	DEDDh	cas3,DinG,cas14j,DEDDh,WYL	Unclear	TTGGAGCGGGAAACGAGGCTCGAACTCGCGACCCCGACCTTGGCAAGGT	49	0	0	NA	NA	NA	1	1	Orphan	cas3,DinG,cas14j,DEDDh,WYL	NA,NA	NA|246aa|up_9|NC_017451.1_728682_729420_+	cd10800, LamB_YcsF_YbgL_like, Escherichia coli putative lactam utilization protein YbgL and similar proteins	NA|398aa|up_8|NC_017451.1_729463_730657_+	COG1914, MntH, Mn2+ and Fe2+ transporters of the NRAMP family [Inorganic ion transport and metabolism]	NA|445aa|up_7|NC_017451.1_730727_732062_-	PRK05370, PRK05370, argininosuccinate synthase; Validated	NA|291aa|up_6|NC_017451.1_732217_733090_-	PRK13961, PRK13961, phosphoribosylaminoimidazole-succinocarboxamide synthase; Provisional	NA|782aa|up_5|NC_017451.1_733262_735608_-	TIGR02071, Includes:_Penicillin-insensitive_transglycosylase, penicillin-binding protein 1B	NA|118aa|up_4|NC_017451.1_735614_735968_-	COG3112, COG3112, Uncharacterized protein conserved in bacteria [Function unknown]	NA|115aa|up_3|NC_017451.1_735969_736314_-	PRK13623, PRK13623, iron-sulfur cluster insertion protein ErpA; Provisional	NA|269aa|up_2|NC_017451.1_736449_737256_+	PRK05716, PRK05716, methionine aminopeptidase; Validated	NA|864aa|up_1|NC_017451.1_737349_739941_+	PRK01759, glnD, bifunctional uridylyltransferase/uridylyl-removing protein GlnD	NA|356aa|up_0|NC_017451.1_740015_741083_+	TIGR02380, ECA_wecA, undecaprenyl-phosphate alpha-N-acetylglucosaminyl 1-phosphatetransferase	DEDDh|183aa|down_0|NC_017451.1_741484_742033_-	PRK05359, PRK05359, oligoribonuclease; Provisional	NA|347aa|down_1|NC_017451.1_742103_743144_+	PRK12288, PRK12288, small ribosomal subunit biogenesis GTPase RsgA	NA|86aa|down_2|NC_017451.1_743302_743560_+	PRK10850, PRK10850, phosphocarrier protein Hpr	NA|576aa|down_3|NC_017451.1_743639_745367_+	PRK11177, PRK11177, phosphoenolpyruvate-protein phosphotransferase PtsI	NA|167aa|down_4|NC_017451.1_745426_745927_+	PRK09439, PRK09439, PTS system glucose-specific transporter subunit; Provisional	NA|71aa|down_5|NC_017451.1_746109_746322_+	COG1482, ManA, Phosphomannose isomerase [Carbohydrate transport and metabolism]	NA|122aa|down_6|NC_017451.1_746436_746802_+	TIGR00156, Uncharacterized_protein_HI_1709, TIGR00156 family protein	NA|222aa|down_7|NC_017451.1_746865_747531_+	PRK10336, PRK10336, two-component system response regulator QseB	NA|452aa|down_8|NC_017451.1_747527_748883_+	PRK10337, PRK10337, sensor protein QseC; Provisional	NA|676aa|down_9|NC_017451.1_749159_751187_+	COG1292, BetT, Choline-glycine betaine transporter [Cell envelope biogenesis, outer membrane]
GCF_000165525.1_ASM16552v1	NC_017451	Haemophilus influenzae R2866, complete genome	3	1433758-1433910	3	CRISPRCasFinder	no		cas3,DinG,cas14j,DEDDh,WYL	Orphan	ACTTCTACTGACAAAACAACAGTAGCTGATAATTCAAAA	39	0	0	NA	NA	NA	1	1	Orphan	cas3,DinG,cas14j,DEDDh,WYL	NA,NA|194aa|down_6|NC_017451.1_1442389_1442971_+	NA|542aa|up_9|NC_017451.1_1416481_1418107_-	PRK01318, PRK01318, membrane protein insertase; Provisional	NA|87aa|up_8|NC_017451.1_1418106_1418367_-	PRK00041, PRK00041, hypothetical protein; Validated	NA|120aa|up_7|NC_017451.1_1418330_1418690_-	PRK01732, rnpA, ribonuclease P; Reviewed	NA|45aa|up_6|NC_017451.1_1418702_1418837_-	PRK00399, rpmH, 50S ribosomal protein L34; Reviewed	NA|483aa|up_5|NC_017451.1_1419013_1420462_-	pfam04575, DUF560, Protein of unknown function (DUF560)	NA|651aa|up_4|NC_017451.1_1420558_1422511_+	pfam01298, TbpB_B_D, C-lobe and N-lobe beta barrels of Tf-binding protein B	NA|916aa|up_3|NC_017451.1_1422524_1425272_+	TIGR01776, Lactoferrin-binding_protein_A, TonB-dependent lactoferrin and transferrin receptors	NA|455aa|up_2|NC_017451.1_1425463_1426828_+	TIGR00362, DnaA, chromosomal replication initiator protein DnaA	NA|367aa|up_1|NC_017451.1_1427086_1428187_+	PRK05643, PRK05643, DNA polymerase III subunit beta; Validated	NA|360aa|up_0|NC_017451.1_1428188_1429268_+	TIGR00611, DNA_replication_and_repair_protein_RecF, recF protein	NA|201aa|down_0|NC_017451.1_1434968_1435571_-	PRK01641, leuD, 3-isopropylmalate dehydratase small subunit	NA|470aa|down_1|NC_017451.1_1435595_1437005_-	PRK05478, PRK05478, 3-isopropylmalate dehydratase large subunit	NA|359aa|down_2|NC_017451.1_1437180_1438257_-	PRK00772, PRK00772, 3-isopropylmalate dehydrogenase; Provisional	NA|516aa|down_3|NC_017451.1_1438342_1439890_-	PRK00915, PRK00915, 2-isopropylmalate synthase; Validated	NA|374aa|down_4|NC_017451.1_1440446_1441568_+	COG0758, Smf, Predicted Rossmann fold nucleotide-binding protein involved in DNA uptake [DNA replication, recombination, and repair / Intracellular trafficking and secretion]	NA|259aa|down_5|NC_017451.1_1441620_1442397_+	PRK02101, PRK02101, peroxide stress protein YaaA	NA|194aa|down_6|NC_017451.1_1442389_1442971_+	NA	NA|322aa|down_7|NC_017451.1_1443066_1444032_+	PRK03202, PRK03202, ATP-dependent 6-phosphofructokinase	NA|162aa|down_8|NC_017451.1_1444270_1444756_+	PRK05422, smpB, SsrA-binding protein SmpB	NA|100aa|down_9|NC_017451.1_1444847_1445147_-	PRK00430, fis, DNA-binding transcriptional regulator Fis
GCF_000165525.1_ASM16552v1	NC_017451	Haemophilus influenzae R2866, complete genome	4	1852404-1852495	4	CRISPRCasFinder	no		cas3,DinG,cas14j,DEDDh,WYL	Orphan	TGGTGGGCTGAAGCCCACCCTACAACTACT	30	0	0	NA	NA	NA	1	1	Orphan	cas3,DinG,cas14j,DEDDh,WYL	NA,NA	NA|159aa|up_9|NC_017451.1_1843840_1844317_+	PRK00084, ispF, 2-C-methyl-D-erythritol 2,4-cyclodiphosphate synthase; Reviewed	NA|145aa|up_8|NC_017451.1_1844629_1845064_-	PRK05273, PRK05273, D-tyrosyl-tRNA(Tyr) deacylase; Provisional	NA|147aa|up_7|NC_017451.1_1845060_1845501_-	PRK09004, PRK09004, FMN-binding protein MioC; Provisional	NA|73aa|up_6|NC_017451.1_1845597_1845816_-	COG3074, COG3074, Uncharacterized protein conserved in bacteria [Function unknown]	NA|334aa|up_5|NC_017451.1_1845977_1846979_+	TIGR00330, Fructose-16-bisphosphatase_class_2, fructose-1,6-bisphosphatase, class II	NA|103aa|up_4|NC_017451.1_1847178_1847487_+	cd00093, HTH_XRE, Helix-turn-helix XRE-family like proteins	NA|107aa|up_3|NC_017451.1_1847474_1847795_+	COG3550, HipA, Toxin module HipA, protein kinase of phosphatidylinositol 3/4-kinase superfamily [General function prediction only]	NA|344aa|up_2|NC_017451.1_1847791_1848823_+	COG3550, HipA, Toxin module HipA, protein kinase of phosphatidylinositol 3/4-kinase superfamily [General function prediction only]	NA|553aa|up_1|NC_017451.1_1848905_1850564_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|582aa|up_0|NC_017451.1_1850556_1852302_-	COG4988, CydD, ABC-type transport system involved in cytochrome bd biosynthesis, ATPase and permease components [Energy production and conversion / Posttranslational modification, protein turnover, chaperones]	NA|1014aa|down_0|NC_017451.1_1852670_1855712_+	TIGR01786, hemoglobin-haptoglobin-binding_protein, TonB-dependent hemoglobin/transferrin/lactoferrin receptor family protein	NA|61aa|down_1|NC_017451.1_1855981_1856164_+	COG4679, COG4679, Phage-related protein [Function unknown]	NA|99aa|down_2|NC_017451.1_1856156_1856453_+	pfam01381, HTH_3, Helix-turn-helix	NA|639aa|down_3|NC_017451.1_1856636_1858553_+	PRK10636, PRK10636, putative ABC transporter ATP-binding protein; Provisional	NA|179aa|down_4|NC_017451.1_1858562_1859099_+	COG0551, TopA, Zn-finger domain associated with topoisomerase type I [DNA replication, recombination, and repair]	NA|184aa|down_5|NC_017451.1_1859114_1859666_+	PRK10634, PRK10634, L-threonylcarbamoyladenylate synthase type 1 TsaC	NA|269aa|down_6|NC_017451.1_1859669_1860476_+	TIGR00507, Shikimate_dehydrogenase, shikimate dehydrogenase	NA|251aa|down_7|NC_017451.1_1860487_1861240_+	pfam12686, DUF3800, Protein of unknown function (DUF3800)	NA|188aa|down_8|NC_017451.1_1861354_1861918_+	pfam03352, Adenine_glyco, Methyladenine glycosylase	NA|257aa|down_9|NC_017451.1_1861914_1862685_-	cd02511, Beta4Glucosyltransferase, UDP-glucose LOS-beta-1,4 glucosyltransferase is required for biosynthesis of lipooligosaccharide
