assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000006885.1_ASM688v1	NC_003028	Streptococcus pneumoniae TIGR4, complete sequence	1	102124-102219	1	CRISPRCasFinder	no		cas3,DEDDh,DinG	Orphan	AATGTGTAAGATTTTTATATATAA	24	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,DinG	NA|47aa|up_7|NC_003028.3_94938_95079_-,NA|101aa|down_3|NC_003028.3_106603_106906_-,NA|107aa|down_8|NC_003028.3_110042_110363_-	NA|310aa|up_9|NC_003028.3_92998_93928_+	COG4209, LplB, ABC-type polysaccharide transport system, permease component [Carbohydrate transport and metabolism]	NA|308aa|up_8|NC_003028.3_93941_94865_+	COG0395, UgpE, ABC-type sugar transport system, permease component [Carbohydrate transport and metabolism]	NA|47aa|up_7|NC_003028.3_94938_95079_-	NA	NA|492aa|up_6|NC_003028.3_95122_96598_+	pfam12010, DUF3502, Domain of unknown function (DUF3502)	NA|329aa|up_5|NC_003028.3_96869_97856_+	PRK00142, PRK00142, rhodanese-related sulfurtransferase	NA|287aa|up_4|NC_003028.3_98130_98991_+	pfam14132, DUF4299, Domain of unknown function (DUF4299)	NA|355aa|up_3|NC_003028.3_99168_100233_-	pfam10310, DUF5427, Family of unknown function (DUF5427)	NA|304aa|up_2|NC_003028.3_100295_101207_-	pfam13349, DUF4097, Putative adhesin	NA|198aa|up_1|NC_003028.3_101199_101793_-	COG4709, COG4709, Predicted membrane protein [Function unknown]	NA|109aa|up_0|NC_003028.3_101779_102106_-	COG1695, COG1695, Predicted transcriptional regulators [Transcription]	NA|389aa|down_0|NC_003028.3_102244_103411_-	COG2807, CynX, Cyanate permease [Inorganic ion transport and metabolism]	NA|386aa|down_1|NC_003028.3_103468_104626_+	cd02525, Succinoglycan_BP_ExoA, ExoA is involved in the biosynthesis of succinoglycan	NA|617aa|down_2|NC_003028.3_104667_106518_+	COG1086, COG1086, Predicted nucleoside-diphosphate sugar epimerases [Cell envelope biogenesis, outer membrane / Carbohydrate transport and metabolism]	NA|101aa|down_3|NC_003028.3_106603_106906_-	NA	NA|211aa|down_4|NC_003028.3_106955_107588_-	cd04302, HAD_5NT, haloacid dehalogenase (HAD)-like 5'-nucleotidases similar to the Pseudomonas aeruginosa PA0065	NA|291aa|down_5|NC_003028.3_107609_108482_-	TIGR00718, Probable_L-serine_dehydratase_alpha_chain, L-serine dehydratase, iron-sulfur-dependent, alpha subunit	NA|224aa|down_6|NC_003028.3_108490_109162_-	COG1760, SdaA, L-serine deaminase [Amino acid transport and metabolism]	NA|196aa|down_7|NC_003028.3_109403_109991_+	cd00118, LysM, Lysin Motif is a small domain involved in binding peptidoglycan	NA|107aa|down_8|NC_003028.3_110042_110363_-	NA	NA|96aa|down_9|NC_003028.3_110793_111081_+	TIGR01653, hypothetical_protein, bacteriocin, lactococcin 972 family
GCF_000006885.1_ASM688v1	NC_003028	Streptococcus pneumoniae TIGR4, complete sequence	2	523301-523431	2	CRISPRCasFinder	no		cas3,DEDDh,DinG	Orphan	GCAAAACCTGCAGCCCCAAAAGTAAGTGCAGAAAAGAAAGCCGAAAA	47	0	0	NA	NA	NA	1	1	Orphan	cas3,DEDDh,DinG	NA|128aa|up_9|NC_003028.3_516966_517350_+,NA|78aa|up_7|NC_003028.3_518132_518366_+,NA|260aa|down_1|NC_003028.3_526879_527659_+,NA|61aa|down_2|NC_003028.3_527660_527843_+	NA|128aa|up_9|NC_003028.3_516966_517350_+	NA	NA|230aa|up_8|NC_003028.3_517401_518091_+	pfam02517, Abi, CAAX protease self-immunity	NA|78aa|up_7|NC_003028.3_518132_518366_+	NA	NA|204aa|up_6|NC_003028.3_518516_519128_+	pfam02517, Abi, CAAX protease self-immunity	NA|265aa|up_5|NC_003028.3_519288_520083_+	COG0510, ycfN, Thiamine kinase and related kinases [Coenzyme transport and metabolism]	NA|212aa|up_4|NC_003028.3_520079_520715_+	PRK00121, trmB, tRNA (guanine-N(7)-)-methyltransferase; Reviewed	NA|160aa|up_3|NC_003028.3_520840_521320_+	PRK00092, PRK00092, ribosome maturation protein RimP; Reviewed	NA|379aa|up_2|NC_003028.3_521363_522500_+	PRK12327, nusA, transcription elongation factor NusA; Provisional	NA|98aa|up_1|NC_003028.3_522521_522815_+	COG2740, COG2740, Predicted nucleic-acid-binding protein implicated in transcription termination [Transcription]	NA|100aa|up_0|NC_003028.3_522807_523107_+	PRK07283, PRK07283, YlxQ-related RNA-binding protein	NA|117aa|down_0|NC_003028.3_526250_526601_+	PRK00521, rbfA, 30S ribosome-binding factor RbfA	NA|260aa|down_1|NC_003028.3_526879_527659_+	NA	NA|61aa|down_2|NC_003028.3_527660_527843_+	NA	NA|78aa|down_3|NC_003028.3_528302_528536_+	pfam08984, DUF1858, Domain of unknown function (DUF1858)	NA|445aa|down_4|NC_003028.3_528535_529870_+	COG2461, COG2461, Uncharacterized conserved protein [Function unknown]	NA|85aa|down_5|NC_003028.3_529879_530134_+	pfam08930, DUF1912, Domain of unknown function (DUF1912)	NA|132aa|down_6|NC_003028.3_530229_530625_+	PRK07758, PRK07758, hypothetical protein; Provisional	NA|150aa|down_7|NC_003028.3_531037_531487_+	COG1853, COG1853, Conserved protein/domain typically associated with flavoprotein oxygenases, DIM6/NTAB family [General function prediction only]	NA|187aa|down_8|NC_003028.3_531473_532034_+	COG1670, RimL, Acetyltransferases, including N-acetylases of ribosomal proteins [Translation, ribosomal structure and biogenesis]	NA|193aa|down_9|NC_003028.3_532033_532612_+	pfam13238, AAA_18, AAA domain
GCF_000006885.1_ASM688v1	NC_003028	Streptococcus pneumoniae TIGR4, complete sequence	3	1678507-1691354	1	CRT	no		cas3,DEDDh,DinG	Orphan	GANGCNGANGCACTNGTTGATGCTGA	26	4	4	1683687-1683714|1685175-1685202|1686579-1686606|1691139-1691166	NC_003028.3_1678455-1678482|NC_003028.3_1678503-1678530|NC_003028.3_1691337-1691364|NC_003028.3_1678449-1678476	NA	146	146	Orphan	cas3,DEDDh,DinG	NA|197aa|up_3|NC_003028.3_1673679_1674270_-,NA|34aa|down_1|NC_003028.3_1693385_1693487_-,NA|49aa|down_7|NC_003028.3_1697589_1697736_-	NA|406aa|up_9|NC_003028.3_1665551_1666769_-	PRK12417, secY, preprotein translocase subunit SecY; Reviewed	NA|302aa|up_8|NC_003028.3_1666825_1667731_-	pfam00535, Glycos_transf_2, Glycosyl transferase family 2	NA|399aa|up_7|NC_003028.3_1667730_1668927_-	COG1442, RfaJ, Lipopolysaccharide biosynthesis proteins, LPS:glycosyltransferases [Cell envelope biogenesis, outer membrane]	NA|407aa|up_6|NC_003028.3_1668935_1670156_-	COG1442, RfaJ, Lipopolysaccharide biosynthesis proteins, LPS:glycosyltransferases [Cell envelope biogenesis, outer membrane]	NA|815aa|up_5|NC_003028.3_1670186_1672631_-	TIGR03728, glyco_access_1, glycosyltransferase, SP_1767 family	NA|337aa|up_4|NC_003028.3_1672640_1673651_-	PRK09814, PRK09814, sugar transferase	NA|197aa|up_3|NC_003028.3_1673679_1674270_-	NA	NA|93aa|up_2|NC_003028.3_1674277_1674556_-	pfam00535, Glycos_transf_2, Glycosyl transferase family 2	NA|405aa|up_1|NC_003028.3_1674560_1675775_-	COG1442, RfaJ, Lipopolysaccharide biosynthesis proteins, LPS:glycosyltransferases [Cell envelope biogenesis, outer membrane]	NA|695aa|up_0|NC_003028.3_1676081_1678166_-	COG1442, RfaJ, Lipopolysaccharide biosynthesis proteins, LPS:glycosyltransferases [Cell envelope biogenesis, outer membrane]	NA|154aa|down_0|NC_003028.3_1692957_1693419_-	pfam01710, HTH_Tnp_IS630, Transposase	NA|34aa|down_1|NC_003028.3_1693385_1693487_-	NA	NA|127aa|down_2|NC_003028.3_1693795_1694176_+	smart00347, HTH_MARR, helix_turn_helix multiple antibiotic resistance protein	NA|74aa|down_3|NC_003028.3_1694274_1694496_+	pfam15507, DUF4649, Domain of unknown function (DUF4649)	NA|105aa|down_4|NC_003028.3_1694512_1694827_+	TIGR01068, Thioredoxin-like_protein_slr0233, thioredoxin	NA|223aa|down_5|NC_003028.3_1696188_1696857_-	cd00333, MIP, Major intrinsic protein (MIP) superfamily	NA|185aa|down_6|NC_003028.3_1696967_1697522_-	pfam10978, DUF2785, Protein of unknown function (DUF2785)	NA|49aa|down_7|NC_003028.3_1697589_1697736_-	NA	NA|599aa|down_8|NC_003028.3_1697767_1699564_-	cd09609, M3B_PepF, Peptidase family M3B, oligopeptidase F (PepF)	NA|248aa|down_9|NC_003028.3_1699574_1700318_-	COG1385, COG1385, Uncharacterized protein conserved in bacteria [Function unknown]
