assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	1	996949-999314	1,1,1	PILER-CR,CRISPRCasFinder,CRT	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	GTTTC----AATCCCTAATAGGGATTAAGTGAAATTGCAAT,GTTTCAATCCCTAATAGGGATTAAGTGAAATTGCAAT,GTTTCAATCCCTAATAGGGATTAAGTGAAATTGCAAT	41,37,37	0	0	NA	NA	I-D,II-B:I-D,II-B:I-D,II-B	32,32,32	32	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|73aa|up_2|NC_019684.1_993247_993466_-,NA	NA|409aa|up_9|NC_019684.1_981991_983218_-	cd06442, DPM1_like, DPM1_like represents putative enzymes similar to eukaryotic DPM1	NA|543aa|up_8|NC_019684.1_983532_985161_+	COG5305, COG5305, Predicted membrane protein [Function unknown]	NA|565aa|up_7|NC_019684.1_985457_987152_-	COG5305, COG5305, Predicted membrane protein [Function unknown]	NA|391aa|up_6|NC_019684.1_987807_988980_+	PRK07360, PRK07360, FO synthase subunit 2; Reviewed	NA|836aa|up_5|NC_019684.1_989086_991594_+	COG4449, COG4449, Predicted protease of the Abi (CAAX) family [General function prediction only]	NA|115aa|up_4|NC_019684.1_992352_992697_+	pfam06967, Mo-nitro_C, Mo-dependent nitrogenase C-terminus	NA|91aa|up_3|NC_019684.1_992719_992992_+	cd02227, cupin_TM1112-like, Thermotoga maritima TM1112 and related proteins, cupin domain	NA|73aa|up_2|NC_019684.1_993247_993466_-	NA	NA|316aa|up_1|NC_019684.1_994112_995060_+	COG4294, Uve, UV damage repair endonuclease [DNA replication, recombination, and repair]	NA|533aa|up_0|NC_019684.1_995118_996717_+	COG0443, DnaK, Molecular chaperone [Posttranslational modification, protein turnover, chaperones]	NA|268aa|down_0|NC_019684.1_999565_1000369_-	pfam08242, Methyltransf_12, Methyltransferase domain	NA|524aa|down_1|NC_019684.1_1000380_1001952_-	cd07378, MPP_ACP5, Homo sapiens acid phosphatase 5 and related proteins, metallophosphatase domain	NA|607aa|down_2|NC_019684.1_1002114_1003935_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|344aa|down_3|NC_019684.1_1004053_1005085_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|71aa|down_4|NC_019684.1_1005077_1005290_+	cd14840, D-Ala-D-Ala_dipeptidase_Aad, D-Ala-D-Ala dipeptidase (includes Lactobacillus plantarum Aad peptidase)	NA|280aa|down_5|NC_019684.1_1005381_1006221_+	COG0596, MhpC, Predicted hydrolases or acyltransferases (alpha/beta hydrolase superfamily) [General function prediction only]	NA|564aa|down_6|NC_019684.1_1006311_1008003_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|290aa|down_7|NC_019684.1_1008035_1008905_+	COG5464, COG5464, Uncharacterized conserved protein [Function unknown]	NA|263aa|down_8|NC_019684.1_1008914_1009703_-	COG4587, COG4587, ABC-type uncharacterized transport system, permease component [General function prediction only]	NA|327aa|down_9|NC_019684.1_1009718_1010699_-	COG4586, COG4586, ABC-type uncharacterized transport system, ATPase component [General function prediction only]
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	2	1073074-1076785	2,2,2	PILER-CR,CRISPRCasFinder,CRT	no	cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,cas3,WYL	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Type I-D	GTTTC----AATCCCTAATAGGGATTAGTTGAAATTGCAAT,GTTTCAATCCCTAATAGGGATTAGTTGAAATTGCAAT,GTTTCAATCCCTAATAGGGATTAGTTGAAATTGCAAT	41,37,37	0	0	NA	NA	I-D,II-B:I-D,II-B:I-D,II-B	50,50,50	50	TypeI-D	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|181aa|up_9|NC_019684.1_1061599_1062142_+,NA|109aa|up_7|NC_019684.1_1063510_1063837_+,NA|116aa|up_2|NC_019684.1_1069632_1069980_+,NA|137aa|down_6|NC_019684.1_1081143_1081554_+	NA|181aa|up_9|NC_019684.1_1061599_1062142_+	NA	NA|321aa|up_8|NC_019684.1_1062340_1063303_+	cd12796, LbR_Ice_bind, Ice-binding protein, left-handed beta-roll	NA|109aa|up_7|NC_019684.1_1063510_1063837_+	NA	NA|109aa|up_6|NC_019684.1_1063889_1064216_-	pfam09876, DUF2103, Predicted metal-binding protein (DUF2103)	NA|109aa|up_5|NC_019684.1_1064221_1064548_-	PRK13019, clpS, ATP-dependent Clp protease adapter ClpS	NA|679aa|up_4|NC_019684.1_1064749_1066786_-	pfam12831, FAD_oxidored, FAD dependent oxidoreductase	NA|740aa|up_3|NC_019684.1_1067019_1069239_+	sd00006, TPR, Tetratricopeptide repeat	NA|116aa|up_2|NC_019684.1_1069632_1069980_+	NA	NA|451aa|up_1|NC_019684.1_1070254_1071607_+	pfam00300, His_Phos_1, Histidine phosphatase superfamily (branch 1)	NA|428aa|up_0|NC_019684.1_1071677_1072961_+	PRK07369, PRK07369, dihydroorotase; Provisional	cas2|102aa|down_0|NC_019684.1_1076996_1077302_-	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas1|335aa|down_1|NC_019684.1_1077356_1078361_-	TIGR04093, hypothetical_protein_L8106_25395, CRISPR-associated endonuclease Cas1, subtype CYANO	cas4|226aa|down_2|NC_019684.1_1078536_1079214_-	cd09637, Cas4_I-A_I-B_I-C_I-D_II-B, CRISPR/Cas system-associated protein Cas4	NA|122aa|down_3|NC_019684.1_1079213_1079579_-	cd16377, 23S_rRNA_IVP_like, 23S rRNA-intervening sequence protein and similar proteins	cas6|281aa|down_4|NC_019684.1_1079575_1080418_-	COG5551, COG5551, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	2OG_CAS|211aa|down_5|NC_019684.1_1080395_1081028_-	pfam13640, 2OG-FeII_Oxy_3, 2OG-Fe(II) oxygenase superfamily	NA|137aa|down_6|NC_019684.1_1081143_1081554_+	NA	csc1gr5|236aa|down_7|NC_019684.1_1081554_1082262_-	cd09711, Csc1_I-D, CRISPR/Cas system-associated protein Csc1	csc2gr7|345aa|down_8|NC_019684.1_1082261_1083296_-	pfam18320, Csc2, Csc2 Crispr	cas10d|1103aa|down_9|NC_019684.1_1083409_1086718_-	TIGR03174, cas_Csc3, CRISPR type I-D/CYANO-associated protein Csc3/Cas10d
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	3	1348332-1348454	3	CRISPRCasFinder	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	CCGGAGGCATCGCCTGAAAAATACCAATAAGTGCGATCGC	40	0	0	NA	NA	NA	1	1	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|78aa|up_9|NC_019684.1_1339341_1339575_-,NA|327aa|up_8|NC_019684.1_1339602_1340583_-,NA|75aa|up_6|NC_019684.1_1342535_1342760_-,NA|89aa|up_5|NC_019684.1_1342959_1343226_-,NA|180aa|up_2|NC_019684.1_1346565_1347105_-,NA|70aa|down_3|NC_019684.1_1349584_1349794_-,NA|141aa|down_4|NC_019684.1_1350270_1350693_+,NA|165aa|down_5|NC_019684.1_1351323_1351818_+,NA|125aa|down_7|NC_019684.1_1352383_1352758_-	NA|78aa|up_9|NC_019684.1_1339341_1339575_-	NA	NA|327aa|up_8|NC_019684.1_1339602_1340583_-	NA	NA|439aa|up_7|NC_019684.1_1340969_1342286_+	COG1252, Ndh, NADH dehydrogenase, FAD-containing subunit [Energy production and conversion]	NA|75aa|up_6|NC_019684.1_1342535_1342760_-	NA	NA|89aa|up_5|NC_019684.1_1342959_1343226_-	NA	NA|321aa|up_4|NC_019684.1_1343721_1344684_+	COG1740, HyaA, Ni,Fe-hydrogenase I small subunit [Energy production and conversion]	NA|532aa|up_3|NC_019684.1_1344781_1346377_+	COG0374, HyaB, Ni,Fe-hydrogenase I large subunit [Energy production and conversion]	NA|180aa|up_2|NC_019684.1_1346565_1347105_-	NA	NA|122aa|up_1|NC_019684.1_1347528_1347894_-	pfam18480, DUF5615, Domain of unknown function (DUF5615)	NA|96aa|up_0|NC_019684.1_1347890_1348178_-	COG2442, COG2442, Uncharacterized conserved protein [Function unknown]	NA|76aa|down_0|NC_019684.1_1348459_1348687_-	pfam09720, Unstab_antitox, Putative addiction module component	NA|73aa|down_1|NC_019684.1_1348753_1348972_-	TIGR02574, hypothetical_protein, putative addiction module component, TIGR02574 family	NA|141aa|down_2|NC_019684.1_1349160_1349583_-	cd09881, PIN_VapC4-5_FitB-like, VapC-like PIN domain of Mycobacterium tuberculosis VapC4 and VapC5, and Neisseria gonorrhoeae FitB and related proteins	NA|70aa|down_3|NC_019684.1_1349584_1349794_-	NA	NA|141aa|down_4|NC_019684.1_1350270_1350693_+	NA	NA|165aa|down_5|NC_019684.1_1351323_1351818_+	NA	NA|163aa|down_6|NC_019684.1_1351832_1352321_+	cd06063, H2MP_Cyano-H2up, This group of endopeptidases include HupW enzymes that are specific to the cyanobacterial hydrogenase and are involved in the C-terminal cleavage of the hydrogenase large subunit precursor protein	NA|125aa|down_7|NC_019684.1_1352383_1352758_-	NA	NA|429aa|down_8|NC_019684.1_1352777_1354064_-	cd02142, McbC_SagB-like_oxidoreductase, oxidase similar to the microcin B17 processing protein McbC	NA|155aa|down_9|NC_019684.1_1354050_1354515_-	sd00045, ANK, ankyrin repeats
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	4	1708448-1708524	4	CRISPRCasFinder	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	GTACCTGTGGTGTTGAGTGTCCC	23	0	0	NA	NA	NA	1	1	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA,NA|122aa|down_0|NC_019684.1_1710313_1710679_+,NA|73aa|down_2|NC_019684.1_1712342_1712561_+	NA|1998aa|up_9|NC_019684.1_1662183_1668177_+	PRK12467, PRK12467, peptide synthase; Provisional	NA|556aa|up_8|NC_019684.1_1668195_1669863_+	cd04742, NPD_FabD, 2-Nitropropane dioxygenase (NPD)-like domain, associated with the (acyl-carrier-protein) S-malonyltransferase  FabD	NA|427aa|up_7|NC_019684.1_1669881_1671162_+	cd06173, MFS_MefA_like, Macrolide efflux protein A and similar proteins of the Major Facilitator Superfamily of transporters	NA|260aa|up_6|NC_019684.1_1671195_1671975_+	COG3176, COG3176, Putative hemolysin [General function prediction only]	NA|780aa|up_5|NC_019684.1_1672040_1674380_-	COG4252, COG4252, Predicted transmembrane sensor domain [Signal transduction mechanisms]	NA|382aa|up_4|NC_019684.1_1674554_1675700_-	pfam08852, DUF1822, Protein of unknown function (DUF1822)	NA|406aa|up_3|NC_019684.1_1675702_1676920_-	TIGR02937, RNA_polymerase_sigma_factor, RNA polymerase sigma factor, sigma-70 family	NA|284aa|up_2|NC_019684.1_1677265_1678117_+	pfam06051, DUF928, Domain of Unknown Function (DUF928)	NA|1016aa|up_1|NC_019684.1_1678094_1681142_+	COG3210, FhaB, Large exoproteins involved in heme utilization or adhesion [Intracellular trafficking and secretion]	NA|852aa|up_0|NC_019684.1_1681180_1683736_+	COG4995, COG4995, Uncharacterized protein conserved in bacteria [Function unknown]	NA|122aa|down_0|NC_019684.1_1710313_1710679_+	NA	NA|129aa|down_1|NC_019684.1_1710962_1711349_+	pfam01242, PTPS, 6-pyruvoyl tetrahydropterin synthase	NA|73aa|down_2|NC_019684.1_1712342_1712561_+	NA	NA|402aa|down_3|NC_019684.1_1712627_1713833_-	TIGR00326, eubact_ribD, riboflavin biosynthesis protein RibD	NA|203aa|down_4|NC_019684.1_1713998_1714607_-	COG2891, MreD, Cell shape-determining protein [Cell envelope biogenesis, outer membrane]	NA|274aa|down_5|NC_019684.1_1714621_1715443_-	PRK13922, PRK13922, rod shape-determining protein MreC; Provisional	NA|336aa|down_6|NC_019684.1_1715535_1716543_-	PRK13927, PRK13927, rod shape-determining protein MreB; Provisional	NA|120aa|down_7|NC_019684.1_1716913_1717273_+	PRK07459, PRK07459, single-stranded DNA-binding protein; Provisional	NA|249aa|down_8|NC_019684.1_1717327_1718074_-	COG2968, COG2968, Uncharacterized conserved protein [Function unknown]	NA|460aa|down_9|NC_019684.1_1718582_1719962_+	COG0475, KefB, Kef-type K+ transport systems, membrane components [Inorganic ion transport and metabolism]
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	5	2597398-2600981	3,5,3	PILER-CR,CRISPRCasFinder,CRT	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	ATTGCAATTTCAACTAATCCCTATTAGGG----------ATTGAAAC,ATTGCAATTTCAACTAATCCCTATTAGGGATTGAAAC,ATTGCAATTTCAACTAATCCCTATTAGGGATTGAAAC	47,37,37	0	0	NA	NA	I-D,II-B:I-D,II-B:I-D,II-B	48,48,48	48	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|138aa|up_7|NC_019684.1_2585397_2585811_-,NA|55aa|up_2|NC_019684.1_2592376_2592541_+,NA|61aa|down_3|NC_019684.1_2603075_2603258_+	NA|785aa|up_9|NC_019684.1_2580894_2583249_-	COG3211, PhoX, Predicted phosphatase [General function prediction only]	NA|470aa|up_8|NC_019684.1_2583660_2585070_-	COG1316, LytR, Transcriptional regulator [Transcription]	NA|138aa|up_7|NC_019684.1_2585397_2585811_-	NA	NA|394aa|up_6|NC_019684.1_2585921_2587103_+	COG0628, yhhT, Predicted permease, member of the PurR regulon [General function prediction only]	NA|443aa|up_5|NC_019684.1_2587407_2588736_-	cd19588, serpin_miropin-like, serpin miropin and similar proteins	NA|631aa|up_4|NC_019684.1_2589286_2591179_+	PRK13557, PRK13557, histidine kinase; Provisional	NA|304aa|up_3|NC_019684.1_2591303_2592215_+	cd16350, VOC_like, uncharacterized subfamily of the vicinal oxygen chelate (VOC) family	NA|55aa|up_2|NC_019684.1_2592376_2592541_+	NA	NA|455aa|up_1|NC_019684.1_2592713_2594078_+	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|835aa|up_0|NC_019684.1_2594515_2597020_+	PRK06464, PRK06464, phosphoenolpyruvate synthase; Validated	NA|205aa|down_0|NC_019684.1_2601176_2601791_+	pfam05685, Uma2, Putative restriction endonuclease	NA|103aa|down_1|NC_019684.1_2602069_2602378_+	cd12399, RRM_HP0827_like, RNA recognition motif in Helicobacter pylori HP0827 protein and similar proteins	NA|63aa|down_2|NC_019684.1_2602493_2602682_+	PRK00270, rpsU, 30S ribosomal protein S21; Reviewed	NA|61aa|down_3|NC_019684.1_2603075_2603258_+	NA	NA|132aa|down_4|NC_019684.1_2603350_2603746_+	COG3695, COG3695, Predicted methylated DNA-protein cysteine methyltransferase [DNA replication, recombination, and repair]	NA|620aa|down_5|NC_019684.1_2603980_2605840_+	PRK07390, PRK07390, NAD(P)H-quinone oxidoreductase subunit F; Validated	NA|500aa|down_6|NC_019684.1_2605982_2607482_+	PRK07363, PRK07363, NADH-quinone oxidoreductase subunit M	NA|441aa|down_7|NC_019684.1_2607608_2608931_+	TIGR01964, chpXY, CO2 hydration protein	NA|753aa|down_8|NC_019684.1_2609171_2611430_+	PRK11788, PRK11788, tetratricopeptide repeat protein; Provisional	NA|331aa|down_9|NC_019684.1_2611475_2612468_-	cd06433, GT_2_WfgS_like, WfgS and WfeV are involved in O-antigen biosynthesis
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	6	2801793-2801893	6	CRISPRCasFinder	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	ACTGCTGATATTGAGGCTGTTGA	23	0	0	NA	NA	NA	1	1	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|126aa|up_9|NC_019684.1_2790477_2790855_-,NA|67aa|up_1|NC_019684.1_2800676_2800877_-,NA|75aa|down_5|NC_019684.1_2806965_2807190_-,NA|195aa|down_6|NC_019684.1_2807950_2808535_+,NA|141aa|down_9|NC_019684.1_2811051_2811474_+	NA|126aa|up_9|NC_019684.1_2790477_2790855_-	NA	NA|679aa|up_8|NC_019684.1_2791261_2793298_+	PRK07956, ligA, NAD-dependent DNA ligase LigA; Validated	NA|414aa|up_7|NC_019684.1_2793740_2794982_-	PRK05388, argJ, bifunctional glutamate N-acetyltransferase/amino-acid acetyltransferase ArgJ	NA|265aa|up_6|NC_019684.1_2795774_2796569_-	PRK09039, PRK09039, peptidoglycan -binding protein	NA|111aa|up_5|NC_019684.1_2797091_2797424_+	PRK13697, PRK13697, cytochrome c6; Provisional	NA|340aa|up_4|NC_019684.1_2797448_2798468_+	cd19101, AKR_unchar, uncharacterized aldo-keto reductase (AKR) superfamily protein	NA|307aa|up_3|NC_019684.1_2798531_2799452_+	pfam13649, Methyltransf_25, Methyltransferase domain	NA|321aa|up_2|NC_019684.1_2799444_2800407_+	COG2339, prsW, Membrane proteinase, regulator of anti-sigma factor [Posttranslational modification, protein turnover, chaperones]	NA|67aa|up_1|NC_019684.1_2800676_2800877_-	NA	NA|163aa|up_0|NC_019684.1_2801185_2801674_+	pfam07154, DUF1392, Protein of unknown function (DUF1392)	NA|120aa|down_0|NC_019684.1_2802443_2802803_+	cd06587, VOC, vicinal oxygen chelate (VOC) family	NA|135aa|down_1|NC_019684.1_2802892_2803297_+	smart00930, NIL, This domain is found at the C-terminus of ABC transporter proteins involved in D-methionine transport as well as a number of ferredoxin-like proteins	NA|356aa|down_2|NC_019684.1_2803293_2804361_-	pfam12275, DUF3616, Protein of unknown function (DUF3616)	NA|323aa|down_3|NC_019684.1_2804788_2805757_+	COG5607, COG5607, Uncharacterized conserved protein [Function unknown]	NA|201aa|down_4|NC_019684.1_2805815_2806418_-	COG3415, COG3415, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|75aa|down_5|NC_019684.1_2806965_2807190_-	NA	NA|195aa|down_6|NC_019684.1_2807950_2808535_+	NA	NA|314aa|down_7|NC_019684.1_2808674_2809616_-	cd02696, MurNAc-LAA, N-acetylmuramoyl-L-alanine amidase or MurNAc-LAA (also known as peptidoglycan aminohydrolase, NAMLA amidase, NAMLAA, Amidase 3, and peptidoglycan amidase; EC 3	NA|280aa|down_8|NC_019684.1_2810075_2810915_-	PRK07417, PRK07417, prephenate/arogenate dehydrogenase	NA|141aa|down_9|NC_019684.1_2811051_2811474_+	NA
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	7	2915314-2918932	4,7,4	PILER-CR,CRISPRCasFinder,CRT	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	ATTGCAATTAACACTAATCCCTATTAGGG----------ATTGAAAC,ATTGCAATTAACACTAATCCCTATTAGGGATTGAAAC,ATTGCAATTAACACTAATCCCTATTAGGGATTGAAAC	47,37,37	0	0	NA	NA	I-D,II-B:I-D,II-B:I-D,II-B	49,49,49	49	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|79aa|up_8|NC_019684.1_2901845_2902082_-,NA|80aa|up_3|NC_019684.1_2907596_2907836_+,NA|179aa|up_1|NC_019684.1_2912029_2912566_-,NA|64aa|down_2|NC_019684.1_2922063_2922255_+,NA|134aa|down_3|NC_019684.1_2922582_2922984_-,NA|53aa|down_5|NC_019684.1_2923996_2924155_-,NA|90aa|down_6|NC_019684.1_2924228_2924498_+,NA|81aa|down_9|NC_019684.1_2927517_2927760_-	NA|301aa|up_9|NC_019684.1_2900627_2901530_-	COG1295, Rbn, Ribonuclease BN family enzyme [Replication, recombination, and repair]	NA|79aa|up_8|NC_019684.1_2901845_2902082_-	NA	NA|334aa|up_7|NC_019684.1_2902955_2903957_+	PRK14016, PRK14016, cyanophycin synthetase; Provisional	NA|350aa|up_6|NC_019684.1_2904126_2905176_+	PRK05437, PRK05437, isopentenyl pyrophosphate isomerase; Provisional	NA|612aa|up_5|NC_019684.1_2905288_2907124_+	TIGR00705, Protease_4, signal peptide peptidase SppA, 67K type	NA|71aa|up_4|NC_019684.1_2907335_2907548_+	PLN00014, PLN00014, light-harvesting-like protein 3; Provisional	NA|80aa|up_3|NC_019684.1_2907596_2907836_+	NA	NA|1054aa|up_2|NC_019684.1_2907990_2911152_-	cd13653, PBP2_phosphate_like_1, Substrate binding domain of putative ABC-type phosphate transporter, a member of the type 2 periplasmic binding fold superfamily	NA|179aa|up_1|NC_019684.1_2912029_2912566_-	NA	NA|663aa|up_0|NC_019684.1_2913035_2915024_+	cd07498, Peptidases_S8_15, Peptidase S8 family domain, uncharacterized subfamily 15	NA|499aa|down_0|NC_019684.1_2919057_2920554_-	cd07131, ALDH_AldH-CAJ73105, Uncharacterized Candidatus kuenenia aldehyde dehydrogenase AldH (CAJ73105)-like	NA|238aa|down_1|NC_019684.1_2920665_2921379_-	COG1878, COG1878, Kynurenine formamidase [Amino acid transport and metabolism]	NA|64aa|down_2|NC_019684.1_2922063_2922255_+	NA	NA|134aa|down_3|NC_019684.1_2922582_2922984_-	NA	NA|90aa|down_4|NC_019684.1_2923258_2923528_-	PRK12864, PRK12864, YciI-like protein; Reviewed	NA|53aa|down_5|NC_019684.1_2923996_2924155_-	NA	NA|90aa|down_6|NC_019684.1_2924228_2924498_+	NA	NA|815aa|down_7|NC_019684.1_2924522_2926967_-	PRK00629, pheT, phenylalanyl-tRNA synthetase subunit beta; Reviewed	NA|130aa|down_8|NC_019684.1_2927131_2927521_-	cd09872, PIN_Sll0205-like, VapC-like PIN domain of Sll0205 protein and homologs	NA|81aa|down_9|NC_019684.1_2927517_2927760_-	NA
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	8	2980347-2980468	8	CRISPRCasFinder	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	GCTAAATGAGTTAACAAACTGCTGTTTGCTTGCTGAAAA	39	0	0	NA	NA	NA	1	1	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA,NA|51aa|down_7|NC_019684.1_2987744_2987897_+,NA|93aa|down_9|NC_019684.1_2988563_2988842_+	NA|871aa|up_9|NC_019684.1_2964942_2967555_+	PRK05580, PRK05580, primosome assembly protein PriA; Validated	NA|561aa|up_8|NC_019684.1_2967896_2969579_+	pfam03814, KdpA, Potassium-transporting ATPase A subunit	NA|702aa|up_7|NC_019684.1_2969674_2971780_+	PRK01122, PRK01122, potassium-transporting ATPase subunit KdpB	NA|200aa|up_6|NC_019684.1_2972051_2972651_+	PRK14003, PRK14003, K(+)-transporting ATPase subunit C	NA|238aa|up_5|NC_019684.1_2972760_2973474_-	COG1940, NagC, Transcriptional regulator/sugar kinase [Transcription / Carbohydrate transport and metabolism]	NA|266aa|up_4|NC_019684.1_2973687_2974485_+	COG1402, COG1402, Uncharacterized protein, putative amidase [General function prediction only]	NA|101aa|up_3|NC_019684.1_2974545_2974848_-	pfam14261, DUF4351, Domain of unknown function (DUF4351)	NA|993aa|up_2|NC_019684.1_2974971_2977950_-	NF033203, entero_EhxA, enterohemolysin EhxA	NA|276aa|up_1|NC_019684.1_2978525_2979353_-	pfam13469, Sulfotransfer_3, Sulfotransferase family	NA|194aa|up_0|NC_019684.1_2979685_2980267_+	PRK00889, PRK00889, adenylylsulfate kinase; Provisional	NA|168aa|down_0|NC_019684.1_2980865_2981369_+	pfam13239, 2TM, 2TM domain	NA|395aa|down_1|NC_019684.1_2981560_2982745_-	cd17370, MFS_MJ1317_like, MJ1317 and similar transporters of the Major Facilitator Superfamily	NA|605aa|down_2|NC_019684.1_2982927_2984742_-	COG1118, CysA, ABC-type sulfate/molybdate transport systems, ATPase component [Inorganic ion transport and metabolism]	NA|100aa|down_3|NC_019684.1_2985253_2985553_+	cd12399, RRM_HP0827_like, RNA recognition motif in Helicobacter pylori HP0827 protein and similar proteins	NA|126aa|down_4|NC_019684.1_2985773_2986151_-	pfam05542, DUF760, Protein of unknown function (DUF760)	NA|150aa|down_5|NC_019684.1_2986342_2986792_-	COG3585, MopI, Molybdopterin-binding protein [Coenzyme metabolism]	NA|266aa|down_6|NC_019684.1_2986890_2987688_+	cd13537, PBP2_YvgL_like, Substrate binding domain of putative molybdate-binding protein YvgL and similar proteins;the type 2 periplasmic binding protein fold	NA|51aa|down_7|NC_019684.1_2987744_2987897_+	NA	NA|154aa|down_8|NC_019684.1_2988094_2988556_+	cd06587, VOC, vicinal oxygen chelate (VOC) family	NA|93aa|down_9|NC_019684.1_2988563_2988842_+	NA
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	9	3075340-3075450	9	CRISPRCasFinder	no	cas3	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Unclear	AGAAAAATGCCAAATAGAACAAGAAAA	27	0	0	NA	NA	NA	1	1	Unclear	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|96aa|up_8|NC_019684.1_3065205_3065493_-,NA	NA|318aa|up_9|NC_019684.1_3064196_3065150_+	cd08242, MDR_like, Medium chain dehydrogenases/reductase (MDR)/zinc-dependent alcohol dehydrogenase-like family	NA|96aa|up_8|NC_019684.1_3065205_3065493_-	NA	NA|337aa|up_7|NC_019684.1_3065767_3066778_-	TIGR02056, chlorophyll_synthase_33_kD_subunit, chlorophyll synthase, ChlG	NA|367aa|up_6|NC_019684.1_3066935_3068036_-	COG0003, ArsA, Predicted ATPase involved in chromosome partitioning [Cell division and chromosome partitioning]	NA|64aa|up_5|NC_019684.1_3068122_3068314_-	pfam11061, DUF2862, Protein of unknown function (DUF2862)	NA|266aa|up_4|NC_019684.1_3068563_3069361_+	COG4636, Uma2, Endonuclease, Uma2 family (restriction endonuclease fold) [General function prediction only]	NA|232aa|up_3|NC_019684.1_3069373_3070069_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|269aa|up_2|NC_019684.1_3070295_3071102_+	COG1682, TagG, ABC-type polysaccharide/polyol phosphate export systems, permease component [Carbohydrate transport and metabolism / Cell envelope biogenesis, outer membrane]	NA|244aa|up_1|NC_019684.1_3071102_3071834_+	COG1134, TagH, ABC-type polysaccharide/polyol phosphate transport system, ATPase component [Carbohydrate transport and metabolism / Cell envelope biogenesis, outer membrane]	NA|396aa|up_0|NC_019684.1_3071926_3073114_+	cd06433, GT_2_WfgS_like, WfgS and WfeV are involved in O-antigen biosynthesis	NA|757aa|down_0|NC_019684.1_3075587_3077858_+	cd03801, GT4_PimA-like, phosphatidyl-myo-inositol mannosyltransferase	NA|315aa|down_1|NC_019684.1_3077865_3078810_+	COG1216, COG1216, Predicted glycosyltransferases [General function prediction only]	NA|357aa|down_2|NC_019684.1_3078820_3079891_+	cd03809, GT4_MtfB-like, glycosyltransferases MtfB, WbpX, and similar proteins	NA|182aa|down_3|NC_019684.1_3079988_3080534_+	pfam00908, dTDP_sugar_isom, dTDP-4-dehydrorhamnose 3,5-epimerase	NA|298aa|down_4|NC_019684.1_3080526_3081420_+	COG1091, RfbD, dTDP-4-dehydrorhamnose reductase [Cell envelope biogenesis, outer membrane]	NA|359aa|down_5|NC_019684.1_3081416_3082493_+	TIGR01208, rmlA_long, glucose-1-phosphate thymidylylransferase, long form	NA|590aa|down_6|NC_019684.1_3082871_3084641_-	PRK06354, PRK06354, pyruvate kinase; Provisional	NA|297aa|down_7|NC_019684.1_3085007_3085898_+	cd03514, CrtR_beta-carotene-hydroxylase, Beta-carotene hydroxylase (CrtR), the carotenoid zeaxanthin biosynthetic enzyme catalyzes the addition of hydroxyl groups to the beta-ionone rings of beta-carotene to form zeaxanthin and is found in bacteria and red algae	NA|197aa|down_8|NC_019684.1_3086085_3086676_+	COG0664, Crp, cAMP-binding proteins - catabolite gene activator and regulatory subunit of cAMP-dependent protein kinases [Signal transduction mechanisms]	NA|658aa|down_9|NC_019684.1_3086685_3088659_+	COG3967, DltE, Short-chain dehydrogenase involved in D-alanine esterification of lipoteichoic acid and wall teichoic acid (D-alanine transfer protein) [Cell envelope biogenesis, outer membrane]
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	10	3658050-3658128	10	CRISPRCasFinder	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	AGAGGTCATTTCCTGTTCCTCCTAA	25	0	0	NA	NA	NA	1	1	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA,NA|146aa|down_0|NC_019684.1_3660364_3660802_-,NA|144aa|down_1|NC_019684.1_3660924_3661356_-,NA|144aa|down_2|NC_019684.1_3661436_3661868_-	NA|462aa|up_9|NC_019684.1_3637789_3639175_-	pfam13379, NMT1_2, NMT1-like family	NA|486aa|up_8|NC_019684.1_3639815_3641273_+	pfam02696, UPF0061, Uncharacterized ACR, YdiU/UPF0061 family	NA|1713aa|up_7|NC_019684.1_3642797_3647936_+	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional	NA|328aa|up_6|NC_019684.1_3647938_3648922_+	COG3706, PleD, Response regulator containing a CheY-like receiver domain and a GGDEF domain [Signal transduction mechanisms]	NA|302aa|up_5|NC_019684.1_3649002_3649908_-	COG0539, RpsA, Ribosomal protein S1 [Translation, ribosomal structure and biogenesis]	NA|250aa|up_4|NC_019684.1_3649984_3650734_-	COG0412, COG0412, Dienelactone hydrolase and related enzymes [Secondary metabolites biosynthesis, transport, and catabolism]	NA|328aa|up_3|NC_019684.1_3650885_3651869_+	COG1725, COG1725, Predicted transcriptional regulators [Transcription]	NA|315aa|up_2|NC_019684.1_3651957_3652902_-	pfam14261, DUF4351, Domain of unknown function (DUF4351)	NA|315aa|up_1|NC_019684.1_3653026_3653971_-	pfam14261, DUF4351, Domain of unknown function (DUF4351)	NA|303aa|up_0|NC_019684.1_3654098_3655007_-	pfam14261, DUF4351, Domain of unknown function (DUF4351)	NA|146aa|down_0|NC_019684.1_3660364_3660802_-	NA	NA|144aa|down_1|NC_019684.1_3660924_3661356_-	NA	NA|144aa|down_2|NC_019684.1_3661436_3661868_-	NA	NA|150aa|down_3|NC_019684.1_3662028_3662478_-	pfam08881, CVNH, CVNH domain	NA|354aa|down_4|NC_019684.1_3662827_3663889_+	sd00006, TPR, Tetratricopeptide repeat	NA|455aa|down_5|NC_019684.1_3664621_3665986_+	pfam14516, AAA_35, AAA-like domain	NA|708aa|down_6|NC_019684.1_3666029_3668153_+	pfam14516, AAA_35, AAA-like domain	NA|178aa|down_7|NC_019684.1_3668173_3668707_+	pfam00583, Acetyltransf_1, Acetyltransferase (GNAT) family	NA|225aa|down_8|NC_019684.1_3668775_3669450_+	cd03370, nitroreductase, uncharacterized nitroreductase family proteins	NA|307aa|down_9|NC_019684.1_3669514_3670435_-	COG0596, MhpC, Predicted hydrolases or acyltransferases (alpha/beta hydrolase superfamily) [General function prediction only]
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	11	3735339-3735435	11	CRISPRCasFinder	no	csa3	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Type I-A	ACGCAGATCATTATCCCAAATCAT	24	0	0	NA	NA	NA	1	1	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA,NA|460aa|down_1|NC_019684.1_3736585_3737965_-,NA|84aa|down_2|NC_019684.1_3738275_3738527_-,NA|220aa|down_3|NC_019684.1_3738519_3739179_-,NA|78aa|down_4|NC_019684.1_3739175_3739409_-,NA|78aa|down_6|NC_019684.1_3740143_3740377_-,NA|61aa|down_7|NC_019684.1_3740373_3740556_-,NA|53aa|down_8|NC_019684.1_3740828_3740987_-,NA|134aa|down_9|NC_019684.1_3741058_3741460_+	NA|233aa|up_9|NC_019684.1_3722699_3723398_+	PRK13972, PRK13972, GSH-dependent disulfide bond oxidoreductase; Provisional	NA|164aa|up_8|NC_019684.1_3723688_3724180_+	pfam09150, Carot_N, Orange carotenoid protein, N-terminal	NA|176aa|up_7|NC_019684.1_3724612_3725140_+	pfam09150, Carot_N, Orange carotenoid protein, N-terminal	NA|639aa|up_6|NC_019684.1_3725290_3727207_-	TIGR01507, squalene-hopene_cyclase, squalene-hopene cyclase	NA|410aa|up_5|NC_019684.1_3727388_3728618_+	TIGR03469, HpnB, hopene-associated glycosyltransferase HpnB	NA|276aa|up_4|NC_019684.1_3728647_3729475_+	COG5464, COG5464, Uncharacterized conserved protein [Function unknown]	NA|276aa|up_3|NC_019684.1_3729510_3730338_+	COG5464, COG5464, Uncharacterized conserved protein [Function unknown]	NA|282aa|up_2|NC_019684.1_3730372_3731218_+	COG5464, COG5464, Uncharacterized conserved protein [Function unknown]	NA|873aa|up_1|NC_019684.1_3731235_3733854_-	cd01031, EriC, ClC chloride channel EriC	NA|436aa|up_0|NC_019684.1_3733986_3735294_-	COG0312, TldD, Predicted Zn-dependent proteases and their inactivated homologs [General function prediction only]	NA|288aa|down_0|NC_019684.1_3735650_3736514_-	pfam06485, DUF1092, Protein of unknown function (DUF1092)	NA|460aa|down_1|NC_019684.1_3736585_3737965_-	NA	NA|84aa|down_2|NC_019684.1_3738275_3738527_-	NA	NA|220aa|down_3|NC_019684.1_3738519_3739179_-	NA	NA|78aa|down_4|NC_019684.1_3739175_3739409_-	NA	NA|63aa|down_5|NC_019684.1_3739527_3739716_-	pfam13166, AAA_13, AAA domain	NA|78aa|down_6|NC_019684.1_3740143_3740377_-	NA	NA|61aa|down_7|NC_019684.1_3740373_3740556_-	NA	NA|53aa|down_8|NC_019684.1_3740828_3740987_-	NA	NA|134aa|down_9|NC_019684.1_3741058_3741460_+	NA
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	12	4664128-4664198	12	CRISPRCasFinder	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	ATTTATCCATGTATATACATAAT	23	0	0	NA	NA	NA	1	1	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|66aa|up_9|NC_019684.1_4655461_4655659_+,NA|67aa|up_0|NC_019684.1_4663903_4664104_+,NA|120aa|down_4|NC_019684.1_4671667_4672027_+	NA|66aa|up_9|NC_019684.1_4655461_4655659_+	NA	NA|342aa|up_8|NC_019684.1_4655760_4656786_+	cd01011, nicotinamidase, Nicotinamidase/pyrazinamidase (PZase)	NA|296aa|up_7|NC_019684.1_4657134_4658022_-	COG0739, NlpD, Membrane proteins related to metalloendopeptidases [Cell envelope biogenesis, outer membrane]	NA|402aa|up_6|NC_019684.1_4658345_4659551_+	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|116aa|up_5|NC_019684.1_4660021_4660369_-	pfam05542, DUF760, Protein of unknown function (DUF760)	NA|180aa|up_4|NC_019684.1_4660616_4661156_-	COG1386, scpB, Chromosome segregation and condensation protein B [DNA replication, recombination and repair]	NA|233aa|up_3|NC_019684.1_4661280_4661979_-	PRK00155, ispD, D-ribitol-5-phosphate cytidylyltransferase	NA|320aa|up_2|NC_019684.1_4662143_4663103_+	COG0859, RfaF, ADP-heptose:LPS heptosyltransferase [Cell envelope biogenesis, outer membrane]	NA|158aa|up_1|NC_019684.1_4663181_4663655_-	pfam08847, Crr6, Chlororespiratory reduction 6	NA|67aa|up_0|NC_019684.1_4663903_4664104_+	NA	NA|433aa|down_0|NC_019684.1_4665301_4666600_+	TIGR02971, devB-like_secretion_protein, ABC exporter membrane fusion protein, DevB family	NA|393aa|down_1|NC_019684.1_4666596_4667775_+	TIGR01185, membrane_spanning_subunit, DevC protein	NA|240aa|down_2|NC_019684.1_4667835_4668555_+	TIGR02982, heterocyst_DevA, ABC exporter ATP-binding subunit, DevA family	NA|888aa|down_3|NC_019684.1_4668563_4671227_-	pfam12770, CHAT, CHAT domain	NA|120aa|down_4|NC_019684.1_4671667_4672027_+	NA	NA|1004aa|down_5|NC_019684.1_4672065_4675077_-	PRK02509, PRK02509, hypothetical protein; Provisional	NA|148aa|down_6|NC_019684.1_4675396_4675840_+	cd00038, CAP_ED, effector domain of the CAP family of transcription factors; members include CAP (or cAMP receptor protein (CRP)), which binds cAMP, FNR (fumarate and nitrate reduction), which uses an iron-sulfur cluster to sense oxygen) and CooA, a heme containing CO sensor	NA|173aa|down_7|NC_019684.1_4675861_4676380_+	COG1670, RimL, Acetyltransferases, including N-acetylases of ribosomal proteins [Translation, ribosomal structure and biogenesis]	NA|408aa|down_8|NC_019684.1_4676466_4677690_-	cd08021, M20_Acy1_YhaA-like, M20 Peptidase aminoacylase 1 subfamily, includes Bacillus subtilis YhaA and Staphylococcus aureus amidohydrolase, SACOL0085	NA|225aa|down_9|NC_019684.1_4677838_4678513_-	PRK00090, bioD, ATP-dependent dethiobiotin synthetase BioD
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	13	4785089-4785180	13	CRISPRCasFinder	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	GATACATTGCCAATGTCAGGCGATACATT	29	0	0	NA	NA	NA	1	1	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|125aa|up_0|NC_019684.1_4784601_4784976_-,NA|48aa|down_0|NC_019684.1_4785199_4785343_+	NA|418aa|up_9|NC_019684.1_4775532_4776786_-	PLN00049, PLN00049, carboxyl-terminal processing protease; Provisional	NA|216aa|up_8|NC_019684.1_4777152_4777800_+	CHL00070, petB, cytochrome b6	NA|161aa|up_7|NC_019684.1_4778010_4778493_+	CHL00058, petD, cytochrome b6/f complex subunit IV	NA|143aa|up_6|NC_019684.1_4778787_4779216_+	COG2172, RsbW, Anti-sigma regulatory factor (Ser/Thr protein kinase) [Signal transduction mechanisms]	NA|335aa|up_5|NC_019684.1_4779462_4780467_+	COG1089, Gmd, GDP-D-mannose dehydratase [Cell envelope biogenesis, outer membrane]	NA|389aa|up_4|NC_019684.1_4780649_4781816_+	cd03801, GT4_PimA-like, phosphatidyl-myo-inositol mannosyltransferase	NA|124aa|up_3|NC_019684.1_4782009_4782381_+	pfam08274, PhnA_Zn_Ribbon, PhnA Zinc-Ribbon	NA|249aa|up_2|NC_019684.1_4782503_4783250_-	COG1651, DsbG, Protein-disulfide isomerase [Posttranslational modification, protein turnover, chaperones]	NA|285aa|up_1|NC_019684.1_4783318_4784173_-	COG2897, SseA, Rhodanese-related sulfurtransferase [Inorganic ion transport and metabolism]	NA|125aa|up_0|NC_019684.1_4784601_4784976_-	NA	NA|48aa|down_0|NC_019684.1_4785199_4785343_+	NA	NA|186aa|down_1|NC_019684.1_4785407_4785965_-	cd03017, PRX_BCP, Peroxiredoxin (PRX) family, Bacterioferritin comigratory protein (BCP) subfamily; composed of  thioredoxin-dependent thiol peroxidases, widely expressed in pathogenic bacteria, that protect cells against toxicity from reactive oxygen species by reducing and detoxifying hydroperoxides	NA|88aa|down_2|NC_019684.1_4786104_4786368_-	pfam11347, DUF3148, Protein of unknown function (DUF3148)	NA|175aa|down_3|NC_019684.1_4786523_4787048_-	pfam05019, Coq4, Coenzyme Q (ubiquinone) biosynthesis protein Coq4	NA|166aa|down_4|NC_019684.1_4787048_4787546_-	COG3678, CpxP, P pilus assembly/Cpx signaling pathway, periplasmic inhibitor/zinc-resistance associated protein [Intracellular trafficking and secretion / Cell motility and secretio / Signal transduction mechanisms / Inorganic ion transport and metabolism]	NA|403aa|down_5|NC_019684.1_4787740_4788949_+	COG4585, COG4585, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|220aa|down_6|NC_019684.1_4788945_4789605_+	COG2197, CitB, Response regulator containing a CheY-like receiver domain and an HTH DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|142aa|down_7|NC_019684.1_4789664_4790090_-	COG0590, CumB, Cytosine/adenosine deaminases [Nucleotide transport and metabolism / Translation, ribosomal structure and biogenesis]	NA|265aa|down_8|NC_019684.1_4790154_4790949_+	pfam00520, Ion_trans, Ion transport protein	NA|80aa|down_9|NC_019684.1_4791033_4791273_+	pfam11332, DUF3134, Protein of unknown function (DUF3134)
GCF_000316645.1_ASM31664v1	NC_019684	Nostoc sp. PCC 7524, complete sequence	14	5429564-5429655	14	CRISPRCasFinder	no		cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG	Orphan	CTCTGGCTGTGGTTCGGGAGTAATTACTGGTG	32	0	0	NA	NA	NA	1	1	Orphan	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|53aa|up_0|NC_019684.1_5428878_5429037_-,NA|170aa|down_3|NC_019684.1_5436563_5437073_+	NA|454aa|up_9|NC_019684.1_5414364_5415726_+	PRK14951, PRK14951, DNA polymerase III subunits gamma and tau; Provisional	NA|401aa|up_8|NC_019684.1_5416650_5417853_-	PRK00073, pgk, phosphoglycerate kinase; Provisional	NA|136aa|up_7|NC_019684.1_5417943_5418351_+	cd00293, USP_Like, Usp: Universal stress protein family	NA|470aa|up_6|NC_019684.1_5423664_5425074_-	PRK09201, PRK09201, AtzE family amidohydrolase	NA|63aa|up_5|NC_019684.1_5425070_5425259_-	pfam13318, DUF4089, Protein of unknown function (DUF4089)	NA|116aa|up_4|NC_019684.1_5425284_5425632_-	COG3502, COG3502, Uncharacterized protein conserved in bacteria [Function unknown]	NA|141aa|up_3|NC_019684.1_5425727_5426150_-	pfam08872, KGK, KGK domain	NA|506aa|up_2|NC_019684.1_5426321_5427839_-	PLN02919, PLN02919, haloacid dehalogenase-like hydrolase family protein	NA|305aa|up_1|NC_019684.1_5427866_5428781_+	PRK00971, PRK00971, glutaminase; Provisional	NA|53aa|up_0|NC_019684.1_5428878_5429037_-	NA	NA|753aa|down_0|NC_019684.1_5431459_5433718_+	CHL00056, psaA, photosystem I P700 chlorophyll a apoprotein A1	NA|742aa|down_1|NC_019684.1_5433844_5436070_+	PRK13199, psaB, photosystem I P700 chlorophyll a apoprotein A2; Provisional	NA|135aa|down_2|NC_019684.1_5436159_5436564_+	pfam14437, MafB19-deam, MafB19-like deaminase	NA|170aa|down_3|NC_019684.1_5436563_5437073_+	NA	NA|47aa|down_4|NC_019684.1_5437235_5437376_+	COG2442, COG2442, Uncharacterized conserved protein [Function unknown]	NA|589aa|down_5|NC_019684.1_5437489_5439256_+	PLN02286, PLN02286, arginine-tRNA ligase	NA|397aa|down_6|NC_019684.1_5439509_5440700_-	cd06164, S2P-M50_SpoIVFB_CBS, SpoIVFB Site-2 protease (S2P), a zinc metalloprotease (MEROPS family M50B), regulates intramembrane proteolysis (RIP), and is involved in the pro-sigmaK pathway of bacterial spore formation	NA|235aa|down_7|NC_019684.1_5440981_5441686_-	TIGR02191, Ribonuclease_3, ribonuclease III, bacterial	NA|509aa|down_8|NC_019684.1_5441791_5443318_-	CHL00076, chlB, photochlorophyllide reductase subunit B	NA|79aa|down_9|NC_019684.1_5443684_5443921_+	PRK07883, PRK07883, DEDD exonuclease domain-containing protein
GCF_000316645.1_ASM31664v1	NC_019677	Nostoc sp. PCC 7524 plasmid pNOS7524.01, complete sequence	1	10998-13699	1,1,1	CRISPRCasFinder,CRT,PILER-CR	no	Cas9_archaeal,WYL,csx18,cas1,cas2	Cas9_archaeal,WYL,csx18,cas1,cas2,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	Unclear	GTTTCAATCCCTAATAGGGATTAAGGTTAATTGCAAT,GTTTCAATCCCTAATAGGGATTAAGGTTAATTGCAAT,GTTTC----AATCCCTAATAGGGATTAAGGTTAATTGCAAT	37,37,41	0	0	NA	NA	I-D,II-B:I-D,II-B:I-D,II-B	37,37,36	37	Unclear	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|57aa|up_8|NC_019677.1_4340_4511_-,NA|124aa|up_6|NC_019677.1_6835_7207_-,NA|97aa|up_5|NC_019677.1_7719_8010_-,NA|157aa|up_4|NC_019677.1_8218_8689_+,NA|130aa|up_3|NC_019677.1_8685_9075_+,NA|95aa|up_2|NC_019677.1_9783_10068_+,NA|63aa|up_1|NC_019677.1_10506_10695_+,NA|51aa|up_0|NC_019677.1_10714_10867_-,NA|116aa|down_1|NC_019677.1_14607_14955_-,NA|60aa|down_2|NC_019677.1_14971_15151_-,NA|68aa|down_3|NC_019677.1_15256_15460_+,NA|104aa|down_4|NC_019677.1_15518_15830_+,NA|80aa|down_5|NC_019677.1_16057_16297_-,NA|173aa|down_8|NC_019677.1_18226_18745_-	Cas9_archaeal|179aa|up_9|NC_019677.1_3216_3753_-	COG1403, McrA, Restriction endonuclease [Defense mechanisms]	NA|57aa|up_8|NC_019677.1_4340_4511_-	NA	NA|525aa|up_7|NC_019677.1_5044_6619_+	COG2303, BetA, Choline dehydrogenase and related flavoproteins [Amino acid transport and metabolism]	NA|124aa|up_6|NC_019677.1_6835_7207_-	NA	NA|97aa|up_5|NC_019677.1_7719_8010_-	NA	NA|157aa|up_4|NC_019677.1_8218_8689_+	NA	NA|130aa|up_3|NC_019677.1_8685_9075_+	NA	NA|95aa|up_2|NC_019677.1_9783_10068_+	NA	NA|63aa|up_1|NC_019677.1_10506_10695_+	NA	NA|51aa|up_0|NC_019677.1_10714_10867_-	NA	NA|138aa|down_0|NC_019677.1_14116_14530_-	PRK09256, PRK09256, aminoacyl-tRNA hydrolase	NA|116aa|down_1|NC_019677.1_14607_14955_-	NA	NA|60aa|down_2|NC_019677.1_14971_15151_-	NA	NA|68aa|down_3|NC_019677.1_15256_15460_+	NA	NA|104aa|down_4|NC_019677.1_15518_15830_+	NA	NA|80aa|down_5|NC_019677.1_16057_16297_-	NA	NA|362aa|down_6|NC_019677.1_16386_17472_-	cd00397, DNA_BRE_C, DNA breaking-rejoining enzymes, C-terminal catalytic domain	NA|174aa|down_7|NC_019677.1_17677_18199_-	pfam11320, DUF3122, Protein of unknown function (DUF3122)	NA|173aa|down_8|NC_019677.1_18226_18745_-	NA	NA|134aa|down_9|NC_019677.1_19220_19622_+	pfam07924, NuiA, Nuclease A inhibitor-like protein
GCF_000316645.1_ASM31664v1	NC_019677	Nostoc sp. PCC 7524 plasmid pNOS7524.01, complete sequence	2	27800-32404	2,2,2	PILER-CR,CRISPRCasFinder,CRT	no	WYL,csx18,cas1,cas2,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	Cas9_archaeal,WYL,csx18,cas1,cas2,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	Type III-B,Type III-D,Type III-A,Type III-C	ATTCCCACTCGCTGGGGATATTAATTGAATGGAAAC,ATTCCCACTCGCTGGGGATATTAATTGAATGGAAAC,ATTCCCACTCGCTGGGGATATTAATTGAATGGAAAC	36,36,36	0	0	NA	NA	NA:NA:NA	60,62,62	62	TypeIII-B,TypeIII-A,TypeIII-D,TypeIII-C	cas14j,cas14k,cas3,cas2,cas1,cas4,cas6,2OG_CAS,csc1gr5,csc2gr7,cas10d,PD-DExK,WYL,csa3,Cas14c_CAS-V-F,c2c9_V-U4,Cas9_archaeal,DinG,csx18,cas10,cmr3gr5,cmr4gr7,cmr5gr11,csm3gr7	NA|117aa|up_8|NC_019677.1_21626_21977_-,NA|137aa|up_5|NC_019677.1_23480_23891_-,csx18|92aa|up_2|NC_019677.1_25920_26196_+,cmr5gr11|132aa|down_3|NC_019677.1_37587_37983_+,NA|510aa|down_5|NC_019677.1_39901_41431_+,NA|71aa|down_8|NC_019677.1_44073_44286_+	NA|160aa|up_9|NC_019677.1_21128_21608_+	cd07824, SRPBCC_6, Ligand-binding SRPBCC domain of an uncharacterized subfamily of proteins	NA|117aa|up_8|NC_019677.1_21626_21977_-	NA	NA|109aa|up_7|NC_019677.1_22264_22591_+	COG1359, COG1359, Uncharacterized conserved protein [Function unknown]	NA|161aa|up_6|NC_019677.1_22793_23276_-	pfam13778, DUF4174, Domain of unknown function (DUF4174)	NA|137aa|up_5|NC_019677.1_23480_23891_-	NA	NA|146aa|up_4|NC_019677.1_23953_24391_-	COG0394, Wzb, Protein-tyrosine-phosphatase [Signal transduction mechanisms]	WYL|403aa|up_3|NC_019677.1_24493_25702_-	pfam13280, WYL, WYL domain	csx18|92aa|up_2|NC_019677.1_25920_26196_+	NA	cas1|330aa|up_1|NC_019677.1_26335_27325_+	pfam01867, Cas_Cas1, CRISPR associated protein Cas1	cas2|94aa|up_0|NC_019677.1_27333_27615_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	cas10|987aa|down_0|NC_019677.1_32711_35672_+	pfam12469, DUF3692, CRISPR-associated protein	cmr3gr5|369aa|down_1|NC_019677.1_35671_36778_+	cd09748, Cmr3_III-B, CRISPR/Cas system-associated RAMP superfamily protein Cmr3	cmr4gr7|259aa|down_2|NC_019677.1_36790_37567_+	TIGR02580, putative_CRISPR-associated_protein, CRISPR type III-B/RAMP module RAMP protein Cmr4	cmr5gr11|132aa|down_3|NC_019677.1_37587_37983_+	NA	csm3gr7|639aa|down_4|NC_019677.1_37988_39905_+	cd09661, Cmr6_III-B, CRISPR/Cas system-associated RAMP superfamily protein Cmr6	NA|510aa|down_5|NC_019677.1_39901_41431_+	NA	NA|623aa|down_6|NC_019677.1_41660_43529_+	COG0210, UvrD, Superfamily I DNA and RNA helicases [DNA replication, recombination, and repair]	NA|103aa|down_7|NC_019677.1_43556_43865_-	COG2350, COG2350, Uncharacterized protein conserved in bacteria [Function unknown]	NA|71aa|down_8|NC_019677.1_44073_44286_+	NA	NA|68aa|down_9|NC_019677.1_44325_44529_-	pfam01155, HypA, Hydrogenase/urease nickel incorporation, metallochaperone, hypA
