assembly_id	genome_id	genome_def	crispr_array_locus_merge	crispr_array_location_merge	crispr_locus_id	crispr_pred_method	array_in_prot	prot_within_array_20000	prot_in_genome	crispr_type_by_cas_prot	consensus_repeat	repeat_length	self-targeting_spacer_number	self-targeting_target_number	spacer_location	protospacer_location	repeat_type	spacer_locus_num	spacer_num	correct_crispr_type	genome_cas_prots	unknown_protein_around_crispr	L10	L10_domain	L9	L9_domain	L8	L8_domain	L7	L7_domain	L6	L6_domain	L5	L5_domain	L4	L4_domain	L3	L3_domain	L2	L2_domain	L1	L1_domain	R1	R1_domain	R2	R2_domain	R3	R3_domain	R4	R4_domain	R5	R5_domain	R6	R6_domain	R7	R7_domain	R8	R8_domain	R9	R9_domain	R10	R10_domain
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	1	19208-19303	1	CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	TGGGAAAGAATTTTTCCTATACCCAGTC	28	0	0	NA	NA	NA	1	1	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|97aa|up_4|NC_003272.1_11559_11850_+,NA|174aa|up_1|NC_003272.1_13599_14121_-,NA|74aa|down_5|NC_003272.1_22722_22944_-,NA|82aa|down_6|NC_003272.1_23017_23263_-,NA|132aa|down_7|NC_003272.1_23448_23844_-	NA|164aa|up_9|NC_003272.1_7358_7850_-	PRK07353, PRK07353, F0F1 ATP synthase subunit B'; Validated	NA|82aa|up_8|NC_003272.1_7995_8241_-	CHL00061, atpH, ATP synthase CF0 C subunit	NA|252aa|up_7|NC_003272.1_8323_9079_-	CHL00046, atpI, ATP synthase CF0 A subunit	NA|154aa|up_6|NC_003272.1_9131_9593_-	pfam03899, ATP-synt_I, ATP synthase I chain	NA|400aa|up_5|NC_003272.1_10129_11329_-	pfam13649, Methyltransf_25, Methyltransferase domain	NA|97aa|up_4|NC_003272.1_11559_11850_+	NA	NA|143aa|up_3|NC_003272.1_11846_12275_+	pfam15565, Imm30, Immunity protein 30	NA|265aa|up_2|NC_003272.1_12727_13521_-	pfam13340, DUF4096, Putative transposase of IS4/5 family (DUF4096)	NA|174aa|up_1|NC_003272.1_13599_14121_-	NA	NA|1133aa|up_0|NC_003272.1_15777_19176_+	CHL00091, apcE, phycobillisome linker protein	NA|162aa|down_0|NC_003272.1_19614_20100_+	CHL00086, apcA, allophycocyanin alpha subunit	NA|163aa|down_1|NC_003272.1_20165_20654_+	CHL00088, apcB, allophycocyanin beta subunit	NA|69aa|down_2|NC_003272.1_20869_21076_+	pfam01383, CpcD, CpcD/allophycocyanin linker domain	NA|273aa|down_3|NC_003272.1_21220_22039_+	COG2912, COG2912, Uncharacterized conserved protein [Function unknown]	NA|147aa|down_4|NC_003272.1_22143_22584_-	pfam10604, Polyketide_cyc2, Polyketide cyclase / dehydrase and lipid transport	NA|74aa|down_5|NC_003272.1_22722_22944_-	NA	NA|82aa|down_6|NC_003272.1_23017_23263_-	NA	NA|132aa|down_7|NC_003272.1_23448_23844_-	NA	NA|1222aa|down_8|NC_003272.1_24367_28033_+	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|591aa|down_9|NC_003272.1_28284_30057_+	COG1032, COG1032, Fe-S oxidoreductase [Energy production and conversion]
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	2	445573-447863	2,1,1,2,3	CRISPRCasFinder,CRT,PILER-CR,PILER-CR,PILER-CR	no	csx18,cas1,cas2	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Unclear	GTTACTTACCATCACTTCCCCGCAAGGGGATGGAAAC,GTTACTTACCATCACTTCCCCGCAAGGGGATGGAAACNNNNNNNNNN,GTTACTTACCATCACTT--CCCCGCAAGGGGATGGAAAC,GTTACTTACCATCACTT--CCCCGCAAGGGGATGGAAAC,GTTACTTACCATCACTT--CCCCGCAAGGGGATGGAAAC	37,47,39,39,39	0	0	NA	NA	NA:NA:NA:NA:NA	28,29,21,21,21	29	Unclear	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|136aa|up_5|NC_003272.1_440673_441081_+,csx18|103aa|up_2|NC_003272.1_443339_443648_-,NA	NA|335aa|up_9|NC_003272.1_436552_437557_-	cd07423, MPP_Prp_like, Bacillus subtilis PrpE and related proteins, metallophosphatase domain	NA|387aa|up_8|NC_003272.1_437730_438891_-	PRK05958, PRK05958, 8-amino-7-oxononanoate synthase; Reviewed	NA|214aa|up_7|NC_003272.1_438968_439610_-	COG0632, RuvA, Holliday junction resolvasome, DNA-binding subunit [DNA replication, recombination, and repair]	NA|250aa|up_6|NC_003272.1_439606_440356_-	TIGR01485, putative_sucrose-phosphate_phosphatase, sucrose-6F-phosphate phosphohydrolase	NA|136aa|up_5|NC_003272.1_440673_441081_+	NA	NA|403aa|up_4|NC_003272.1_441158_442367_-	COG1972, NupC, Nucleoside permease [Nucleotide transport and metabolism]	NA|253aa|up_3|NC_003272.1_442486_443245_+	PRK00235, cobS, cobalamin synthase; Reviewed	csx18|103aa|up_2|NC_003272.1_443339_443648_-	NA	cas1|337aa|up_1|NC_003272.1_443836_444847_+	TIGR00287, CRISPR-associated_endonuclease_Cas1, CRISPR-associated endonuclease Cas1	cas2|95aa|up_0|NC_003272.1_444954_445239_+	TIGR01573, cas2, CRISPR-associated endonuclease Cas2	NA|310aa|down_0|NC_003272.1_448246_449176_-	COG1054, COG1054, Predicted sulfurtransferase [General function prediction only]	NA|211aa|down_1|NC_003272.1_449573_450206_-	pfam06080, DUF938, Protein of unknown function (DUF938)	NA|471aa|down_2|NC_003272.1_450620_452033_+	smart00563, PlsC, Phosphate acyltransferases	NA|647aa|down_3|NC_003272.1_452144_454085_-	PRK10577, PRK10577, Fe(3+)-hydroxamate ABC transporter permease FhuB	NA|301aa|down_4|NC_003272.1_454142_455045_-	cd01146, FhuD, Fe3+-siderophore binding domain FhuD	NA|274aa|down_5|NC_003272.1_455041_455863_-	COG1120, FepC, ABC-type cobalamin/Fe3+-siderophores transport systems, ATPase components [Inorganic ion transport and metabolism / Coenzyme metabolism]	NA|603aa|down_6|NC_003272.1_456013_457822_-	COG4264, RhbC, Siderophore synthetase component [Secondary metabolites biosynthesis, transport, and catabolism]	NA|399aa|down_7|NC_003272.1_457995_459192_-	cd17325, MFS_MdtG_SLC18_like, bacterial MdtG-like and eukaryotic solute carrier 18 (SLC18) family of the Major Facilitator Superfamily of transporters	NA|428aa|down_8|NC_003272.1_459188_460472_-	COG3486, IucD, Lysine/ornithine N-monooxygenase [Secondary metabolites biosynthesis, transport, and catabolism]	NA|194aa|down_9|NC_003272.1_460465_461047_-	pfam13523, Acetyltransf_8, Acetyltransferase (GNAT) domain
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	3	476040-476497	2	CRT	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	AANTNCCAGTTACCATTACC	20	0	0	NA	NA	NA	10	10	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|88aa|up_6|NC_003272.1_469419_469683_-,NA|281aa|up_4|NC_003272.1_470216_471059_-,NA|111aa|up_3|NC_003272.1_471951_472284_+,NA|256aa|down_0|NC_003272.1_477035_477803_-,NA|415aa|down_9|NC_003272.1_488667_489912_-	NA|539aa|up_9|NC_003272.1_463057_464674_-	COG0076, GadB, Glutamate decarboxylase and related PLP-dependent proteins [Amino acid transport and metabolism]	NA|494aa|up_8|NC_003272.1_464673_466155_-	PRK06938, PRK06938, diaminobutyrate--2-oxoglutarate aminotransferase; Provisional	NA|850aa|up_7|NC_003272.1_466678_469228_+	cd01347, ligand_gated_channel, TonB dependent/Ligand-Gated channels are created by a monomeric 22 strand (22,24) anti-parallel beta-barrel	NA|88aa|up_6|NC_003272.1_469419_469683_-	NA	NA|83aa|up_5|NC_003272.1_469799_470048_-	COG2886, COG2886, Uncharacterized small protein [Function unknown]	NA|281aa|up_4|NC_003272.1_470216_471059_-	NA	NA|111aa|up_3|NC_003272.1_471951_472284_+	NA	NA|110aa|up_2|NC_003272.1_472355_472685_-	pfam09876, DUF2103, Predicted metal-binding protein (DUF2103)	NA|109aa|up_1|NC_003272.1_472690_473017_-	PRK13019, clpS, ATP-dependent Clp protease adapter ClpS	NA|677aa|up_0|NC_003272.1_473247_475278_-	pfam12831, FAD_oxidored, FAD dependent oxidoreductase	NA|256aa|down_0|NC_003272.1_477035_477803_-	NA	NA|355aa|down_1|NC_003272.1_478300_479365_-	PRK13396, PRK13396, 3-deoxy-7-phosphoheptulonate synthase; Provisional	NA|365aa|down_2|NC_003272.1_479387_480482_-	PRK00188, trpD, anthranilate phosphoribosyltransferase; Provisional	NA|410aa|down_3|NC_003272.1_480494_481724_-	PRK04346, PRK04346, tryptophan synthase subunit beta; Validated	NA|271aa|down_4|NC_003272.1_481777_482590_-	PLN02591, PLN02591, tryptophan synthase	NA|319aa|down_5|NC_003272.1_482643_483600_-	cd08272, MDR6, Medium chain dehydrogenases/reductase (MDR)/zinc-dependent alcohol dehydrogenase-like family	NA|291aa|down_6|NC_003272.1_483798_484671_-	PRK00278, trpC, indole-3-glycerol phosphate synthase TrpC	NA|736aa|down_7|NC_003272.1_484615_486823_-	TIGR01815, Includes:_Glutamine_amidotransferase, anthranilate synthase, alpha proteobacterial clade	NA|466aa|down_8|NC_003272.1_487181_488579_-	COG1524, COG1524, Uncharacterized proteins of the AP superfamily [General function prediction only]	NA|415aa|down_9|NC_003272.1_488667_489912_-	NA
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	4	807451-807558	3	CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	CATTGCAATTAACTAAAATCCCTATCAGGGATTGAAAC	38	0	0	NA	NA	I-D,II-B	1	1	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|330aa|up_9|NC_003272.1_797711_798701_+,NA|179aa|down_5|NC_003272.1_814581_815118_-,NA|300aa|down_9|NC_003272.1_828695_829595_-	NA|330aa|up_9|NC_003272.1_797711_798701_+	NA	NA|159aa|up_8|NC_003272.1_798760_799237_+	COG0694, COG0694, Thioredoxin-like proteins and domains [Posttranslational modification, protein turnover, chaperones]	NA|391aa|up_7|NC_003272.1_799263_800436_+	cd05819, NHL, NHL repeat unit of beta-propeller proteins	NA|786aa|up_6|NC_003272.1_800535_802893_+	COG0068, HypF, Hydrogenase maturation factor [Posttranslational modification, protein turnover, chaperones]	NA|83aa|up_5|NC_003272.1_803005_803254_+	COG0298, HypC, Hydrogenase maturation factor [Posttranslational modification, protein turnover, chaperones]	NA|384aa|up_4|NC_003272.1_803284_804436_+	PRK15062, PRK15062, hydrogenase isoenzymes formation protein HypD; Provisional	NA|72aa|up_3|NC_003272.1_804489_804705_+	COG1942, COG1942, Uncharacterized protein, 4-oxalocrotonate tautomerase homolog [General function prediction only]	NA|368aa|up_2|NC_003272.1_804889_805993_+	TIGR02124, Hydrogenase_expression/formation_protein_HypE, hydrogenase expression/formation protein HypE	NA|114aa|up_1|NC_003272.1_806011_806353_+	pfam01155, HypA, Hydrogenase/urease nickel incorporation, metallochaperone, hypA	NA|282aa|up_0|NC_003272.1_806343_807189_+	PRK10463, PRK10463, hydrogenase nickel incorporation protein HypB; Provisional	NA|415aa|down_0|NC_003272.1_807765_809010_+	TIGR02037, Probable_periplasmic_serine_protease_do/HhoA-like, periplasmic serine protease, Do/DeqQ family	NA|124aa|down_1|NC_003272.1_809101_809473_-	pfam01925, TauE, Sulfite exporter TauE/SafE	NA|681aa|down_2|NC_003272.1_809813_811856_+	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|329aa|down_3|NC_003272.1_811998_812985_-	COG2421, COG2421, Predicted acetamidase/formamidase [Energy production and conversion]	NA|452aa|down_4|NC_003272.1_813019_814375_-	PRK11360, PRK11360, two-component system sensor histidine kinase AtoS	NA|179aa|down_5|NC_003272.1_814581_815118_-	NA	NA|1797aa|down_6|NC_003272.1_815624_821015_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|1800aa|down_7|NC_003272.1_821087_826487_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|641aa|down_8|NC_003272.1_826760_828683_-	COG0443, DnaK, Molecular chaperone [Posttranslational modification, protein turnover, chaperones]	NA|300aa|down_9|NC_003272.1_828695_829595_-	NA
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	5	875039-875149	4	CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	ACCAAAAAGCGATCGCGCTTTCCCAACATTACACA	35	0	0	NA	NA	NA	1	1	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA,NA|89aa|down_1|NC_003272.1_875552_875819_-,NA|70aa|down_4|NC_003272.1_876672_876882_+,NA|156aa|down_8|NC_003272.1_883178_883646_+	NA|547aa|up_9|NC_003272.1_864310_865951_-	cd07302, CHD, cyclase homology domain	NA|495aa|up_8|NC_003272.1_866399_867884_+	pfam04892, VanZ, VanZ like family	NA|294aa|up_7|NC_003272.1_868011_868893_-	PRK09563, rbgA, GTPase YlqF; Reviewed	NA|128aa|up_6|NC_003272.1_868980_869364_-	cd07264, VOC_like, uncharacterized subfamily of vicinal oxygen chelate (VOC) family	NA|353aa|up_5|NC_003272.1_869617_870676_-	PRK13396, PRK13396, 3-deoxy-7-phosphoheptulonate synthase; Provisional	NA|157aa|up_4|NC_003272.1_870939_871410_-	pfam11947, DUF3464, Protein of unknown function (DUF3464)	NA|90aa|up_3|NC_003272.1_871422_871692_-	PRK05626, rpsO, 30S ribosomal protein S15; Reviewed	NA|181aa|up_2|NC_003272.1_871941_872484_+	pfam00582, Usp, Universal stress protein family	NA|165aa|up_1|NC_003272.1_872574_873069_+	PRK07571, PRK07571, bidirectional hydrogenase complex protein HoxE; Reviewed	NA|545aa|up_0|NC_003272.1_873379_875014_+	COG1894, NuoF, NADH:ubiquinone oxidoreductase, NADH-binding (51 kD) subunit [Energy production and conversion]	NA|132aa|down_0|NC_003272.1_875160_875556_-	COG3744, COG3744, PIN domain nuclease, a component of toxin-antitoxin system (PIN domain) [Signal transduction mechanisms]	NA|89aa|down_1|NC_003272.1_875552_875819_-	NA	NA|92aa|down_2|NC_003272.1_875993_876269_+	COG2929, COG2929, Uncharacterized protein conserved in bacteria [Function unknown]	NA|89aa|down_3|NC_003272.1_876252_876519_+	pfam14384, BrnA_antitoxin, BrnA antitoxin of type II toxin-antitoxin system	NA|70aa|down_4|NC_003272.1_876672_876882_+	NA	NA|114aa|down_5|NC_003272.1_876868_877210_+	pfam02452, PemK_toxin, PemK-like, MazF-like toxin of type II toxin-antitoxin system	NA|1330aa|down_6|NC_003272.1_877322_881312_-	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|444aa|down_7|NC_003272.1_881706_883038_+	pfam14516, AAA_35, AAA-like domain	NA|156aa|down_8|NC_003272.1_883178_883646_+	NA	NA|239aa|down_9|NC_003272.1_883816_884533_+	PRK07569, PRK07569, bidirectional hydrogenase complex protein HoxU; Validated
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	6	1342079-1342206	5	CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	TTAATTCGTGCTGACCTCAGTCG	23	0	0	NA	NA	NA	2	2	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|161aa|up_8|NC_003272.1_1333866_1334349_+,NA|147aa|up_6|NC_003272.1_1335258_1335699_+,NA|174aa|up_5|NC_003272.1_1335733_1336255_+,NA|108aa|up_4|NC_003272.1_1336736_1337060_+,NA|195aa|up_2|NC_003272.1_1338894_1339479_+,NA|365aa|down_5|NC_003272.1_1353845_1354940_+	NA|666aa|up_9|NC_003272.1_1331524_1333522_-	PRK05298, PRK05298, excinuclease ABC subunit UvrB	NA|161aa|up_8|NC_003272.1_1333866_1334349_+	NA	NA|61aa|up_7|NC_003272.1_1334632_1334815_+	COG3237, COG3237, Uncharacterized protein conserved in bacteria [Function unknown]	NA|147aa|up_6|NC_003272.1_1335258_1335699_+	NA	NA|174aa|up_5|NC_003272.1_1335733_1336255_+	NA	NA|108aa|up_4|NC_003272.1_1336736_1337060_+	NA	NA|369aa|up_3|NC_003272.1_1337490_1338597_+	COG1748, LYS9, Saccharopine dehydrogenase and related proteins [Amino acid transport and metabolism]	NA|195aa|up_2|NC_003272.1_1338894_1339479_+	NA	NA|314aa|up_1|NC_003272.1_1339556_1340498_-	cd02696, MurNAc-LAA, N-acetylmuramoyl-L-alanine amidase or MurNAc-LAA (also known as peptidoglycan aminohydrolase, NAMLA amidase, NAMLAA, Amidase 3, and peptidoglycan amidase; EC 3	NA|282aa|up_0|NC_003272.1_1340975_1341821_-	PRK07417, PRK07417, prephenate/arogenate dehydrogenase	NA|194aa|down_0|NC_003272.1_1343544_1344126_+	pfam07466, DUF1517, Protein of unknown function (DUF1517)	NA|291aa|down_1|NC_003272.1_1344345_1345218_+	pfam04484, QWRF, QWRF family	NA|642aa|down_2|NC_003272.1_1345294_1347220_-	COG4191, COG4191, Signal transduction histidine kinase regulating C4-dicarboxylate transport system [Signal transduction mechanisms]	NA|848aa|down_3|NC_003272.1_1347726_1350270_+	pfam00350, Dynamin_N, Dynamin family	NA|1129aa|down_4|NC_003272.1_1350320_1353707_+	cd10170, HSP70_NBD, Nucleotide-binding domain of the HSP70 family	NA|365aa|down_5|NC_003272.1_1353845_1354940_+	NA	NA|163aa|down_6|NC_003272.1_1355018_1355507_-	COG5500, COG5500, Predicted integral membrane protein [Function unknown]	NA|139aa|down_7|NC_003272.1_1355579_1355996_-	pfam01124, MAPEG, MAPEG family	NA|241aa|down_8|NC_003272.1_1356142_1356865_-	pfam01292, Ni_hydr_CYTB, Prokaryotic cytochrome b561	NA|294aa|down_9|NC_003272.1_1356961_1357843_+	COG0338, Dam, Site-specific DNA methylase [DNA replication, recombination, and repair]
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	7	1727817-1728071	4,6,3	PILER-CR,CRISPRCasFinder,CRT	no	cas1,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Type III-A,Type III-B,Type III-D,Type III-C	GTTTCCATCCCCGTGAGGGGTAAAGGAATTAAAAC,GTTTCCATCCCCGTGAGGGGTAAAGGAATTAAAAC,GTTTCCATCCCCGTGAGGGGTAAAGGAATTAAAAC	35,35,35	0	0	NA	NA	NA:NA:NA	3,3,3	3	TypeIII-A,TypeIII-B,TypeIII-D,TypeIII-C	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|302aa|up_0|NC_003272.1_1723259_1724165_-,NA|274aa|down_2|NC_003272.1_1733487_1734309_+,csx19|176aa|down_5|NC_003272.1_1736144_1736672_-,csm2gr11|152aa|down_8|NC_003272.1_1738619_1739075_-	NA|481aa|up_9|NC_003272.1_1711820_1713263_-	TIGR01282, Nitrogenase_molybdenum-iron_protein_alpha_chain, nitrogenase molybdenum-iron protein alpha chain	NA|296aa|up_8|NC_003272.1_1713395_1714283_-	PRK13236, PRK13236, nitrogenase reductase; Reviewed	NA|301aa|up_7|NC_003272.1_1714500_1715403_-	TIGR02000, Nitrogen_fixation_protein_NifU, Fe-S cluster assembly protein NifU	NA|401aa|up_6|NC_003272.1_1715534_1716737_-	TIGR03402, Cysteine_desulfurase_NifS, cysteine desulfurase NifS	NA|515aa|up_5|NC_003272.1_1716846_1718391_+	COG1961, PinR, Site-specific recombinases, DNA invertase Pin homologs [DNA replication, recombination, and repair]	NA|194aa|up_4|NC_003272.1_1718607_1719189_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|138aa|up_3|NC_003272.1_1719362_1719776_+	pfam08814, XisH, XisH protein	NA|112aa|up_2|NC_003272.1_1719763_1720099_+	pfam08869, XisI, XisI protein	NA|605aa|up_1|NC_003272.1_1721071_1722886_-	cd00397, DNA_BRE_C, DNA breaking-rejoining enzymes, C-terminal catalytic domain	NA|302aa|up_0|NC_003272.1_1723259_1724165_-	NA	NA|248aa|down_0|NC_003272.1_1728407_1729151_-	pfam14326, DUF4384, Domain of unknown function (DUF4384)	cas1|669aa|down_1|NC_003272.1_1729648_1731655_+	TIGR00287, CRISPR-associated_endonuclease_Cas1, CRISPR-associated endonuclease Cas1	NA|274aa|down_2|NC_003272.1_1733487_1734309_+	NA	csx21|239aa|down_3|NC_003272.1_1734361_1735078_-	PLN02226, PLN02226, 2-oxoglutarate dehydrogenase E2 component	csm3gr7|352aa|down_4|NC_003272.1_1735087_1736143_-	TIGR03986, CRISPR-associated_protein, CRISPR-associated protein	csx19|176aa|down_5|NC_003272.1_1736144_1736672_-	NA	csm3gr7|338aa|down_6|NC_003272.1_1736659_1737673_-	COG1337, COG1337, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	csm3gr7|309aa|down_7|NC_003272.1_1737677_1738604_-	cd09683, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	csm2gr11|152aa|down_8|NC_003272.1_1738619_1739075_-	NA	csx10gr5|435aa|down_9|NC_003272.1_1739071_1740376_-	TIGR02674, cas_cyan_RAMP_2, CRISPR-associated RAMP protein, Csx10 family
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	8	1732269-1733321	5,7,4	PILER-CR,CRISPRCasFinder,CRT	no	cas1,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Type III-A,Type III-B,Type III-D,Type III-C	GTTTCCATCCCCGTGAGGGGTAAAGGAATTAAAAC,GTTTTAATTCCTTTACCCCTCACGGGGATGGAAAC,GTTTTNATTCCTTTACCCCTCACGGGGATGGAAAC	35,35,35	0	0	NA	NA	NA:NA:NA	14,14,14	14	TypeIII-A,TypeIII-B,TypeIII-D,TypeIII-C	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|302aa|up_2|NC_003272.1_1723259_1724165_-,NA|274aa|down_0|NC_003272.1_1733487_1734309_+,csx19|176aa|down_3|NC_003272.1_1736144_1736672_-,csm2gr11|152aa|down_6|NC_003272.1_1738619_1739075_-	NA|301aa|up_9|NC_003272.1_1714500_1715403_-	TIGR02000, Nitrogen_fixation_protein_NifU, Fe-S cluster assembly protein NifU	NA|401aa|up_8|NC_003272.1_1715534_1716737_-	TIGR03402, Cysteine_desulfurase_NifS, cysteine desulfurase NifS	NA|515aa|up_7|NC_003272.1_1716846_1718391_+	COG1961, PinR, Site-specific recombinases, DNA invertase Pin homologs [DNA replication, recombination, and repair]	NA|194aa|up_6|NC_003272.1_1718607_1719189_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|138aa|up_5|NC_003272.1_1719362_1719776_+	pfam08814, XisH, XisH protein	NA|112aa|up_4|NC_003272.1_1719763_1720099_+	pfam08869, XisI, XisI protein	NA|605aa|up_3|NC_003272.1_1721071_1722886_-	cd00397, DNA_BRE_C, DNA breaking-rejoining enzymes, C-terminal catalytic domain	NA|302aa|up_2|NC_003272.1_1723259_1724165_-	NA	NA|248aa|up_1|NC_003272.1_1728407_1729151_-	pfam14326, DUF4384, Domain of unknown function (DUF4384)	cas1|669aa|up_0|NC_003272.1_1729648_1731655_+	TIGR00287, CRISPR-associated_endonuclease_Cas1, CRISPR-associated endonuclease Cas1	NA|274aa|down_0|NC_003272.1_1733487_1734309_+	NA	csx21|239aa|down_1|NC_003272.1_1734361_1735078_-	PLN02226, PLN02226, 2-oxoglutarate dehydrogenase E2 component	csm3gr7|352aa|down_2|NC_003272.1_1735087_1736143_-	TIGR03986, CRISPR-associated_protein, CRISPR-associated protein	csx19|176aa|down_3|NC_003272.1_1736144_1736672_-	NA	csm3gr7|338aa|down_4|NC_003272.1_1736659_1737673_-	COG1337, COG1337, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	csm3gr7|309aa|down_5|NC_003272.1_1737677_1738604_-	cd09683, Csm3_III-A, CRISPR/Cas system-associated RAMP superfamily protein Csm3	csm2gr11|152aa|down_6|NC_003272.1_1738619_1739075_-	NA	csx10gr5|435aa|down_7|NC_003272.1_1739071_1740376_-	TIGR02674, cas_cyan_RAMP_2, CRISPR-associated RAMP protein, Csx10 family	csm3gr7|253aa|down_8|NC_003272.1_1740372_1741131_-	COG1337, COG1337, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	cas10|789aa|down_9|NC_003272.1_1741127_1743494_-	TIGR02577, thermophile-specific_DNA_repair_system, CRISPR-associated protein Cas10/Cmr2, subtype III-B
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	9	1836813-1837723	6,8,5	PILER-CR,CRISPRCasFinder,CRT	no	WYL,cas10d,csc2gr7,csc1gr5,cas3,2OG_CAS,cas6,cas4,cas1,cas2	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Type I-D	GTTTCTATTAACACAAATCCCTATCAGGGA----------TTGAAAC,GTTTCTATTAACACAAATCCCTATCAGGGATTGAAAC,GTTTCTATTAACACAAATCCCTATCAGGGATTGAAAC	47,37,37	0	0	NA	NA	I-D,II-B:I-D,II-B:I-D,II-B	12,12,12	12	TypeI-D	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA,NA|159aa|down_5|NC_003272.1_1847128_1847605_+	cas10d|898aa|up_9|NC_003272.1_1824896_1827590_+	TIGR03174, cas_Csc3, CRISPR type I-D/CYANO-associated protein Csc3/Cas10d	csc2gr7|345aa|up_8|NC_003272.1_1827610_1828645_+	pfam18320, Csc2, Csc2 Crispr	csc1gr5|253aa|up_7|NC_003272.1_1828646_1829405_+	TIGR03159, cas_Csc1, CRISPR type I-D/CYANO-associated protein Csc1	cas3|762aa|up_6|NC_003272.1_1829397_1831683_+	cd09710, Cas3_I-D, CRISPR/Cas system-associated protein Cas3; Distinct diverged subfamily of Cas3 helicase domain	2OG_CAS|206aa|up_5|NC_003272.1_1831759_1832377_+	pfam13640, 2OG-FeII_Oxy_3, 2OG-Fe(II) oxygenase superfamily	cas6|291aa|up_4|NC_003272.1_1832406_1833279_+	COG5551, COG5551, CRISPR system related protein, RAMP superfamily [Defense    mechanisms]	cas4|197aa|up_3|NC_003272.1_1833469_1834060_+	cd09637, Cas4_I-A_I-B_I-C_I-D_II-B, CRISPR/Cas system-associated protein Cas4	cas1|334aa|up_2|NC_003272.1_1834183_1835185_+	TIGR04093, hypothetical_protein_L8106_25395, CRISPR-associated endonuclease Cas1, subtype CYANO	NA|298aa|up_1|NC_003272.1_1835378_1836272_+	pfam13612, DDE_Tnp_1_3, Transposase DDE domain	cas2|97aa|up_0|NC_003272.1_1836265_1836556_+	cd09725, Cas2_I_II_III, CRISPR/Cas system-associated protein Cas2	NA|195aa|down_0|NC_003272.1_1837760_1838345_-	pfam14015, DUF4231, Protein of unknown function (DUF4231)	NA|246aa|down_1|NC_003272.1_1838354_1839092_-	pfam18171, LSDAT_prok, SLOG in TRPM, prokaryote	NA|1048aa|down_2|NC_003272.1_1839676_1842820_+	COG4252, COG4252, Predicted transmembrane sensor domain [Signal transduction mechanisms]	NA|620aa|down_3|NC_003272.1_1843957_1845817_+	COG2303, BetA, Choline dehydrogenase and related flavoproteins [Amino acid transport and metabolism]	NA|367aa|down_4|NC_003272.1_1845981_1847082_+	pfam12902, Ferritin-like, Ferritin-like	NA|159aa|down_5|NC_003272.1_1847128_1847605_+	NA	NA|223aa|down_6|NC_003272.1_1847709_1848378_+	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|372aa|down_7|NC_003272.1_1848816_1849932_+	TIGR04379, myo-inositol_catabolism_protein, myo-inosose-2 dehydratase	NA|130aa|down_8|NC_003272.1_1850342_1850732_+	COG4319, COG4319, Ketosteroid isomerase homolog [Function unknown]	NA|130aa|down_9|NC_003272.1_1850769_1851159_+	pfam16247, DUF4904, Domain of unknown function (DUF4904)
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	10	1976173-1976273	9	CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	AGGGTAAAACAAGCCCAAAGTCA	23	0	0	NA	NA	NA	1	1	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|260aa|up_2|NC_003272.1_1972328_1973108_+,NA|316aa|up_1|NC_003272.1_1973155_1974103_+,NA|101aa|down_2|NC_003272.1_1982832_1983135_-,NA|79aa|down_3|NC_003272.1_1983277_1983514_+,NA|89aa|down_4|NC_003272.1_1983539_1983806_+	NA|239aa|up_9|NC_003272.1_1950937_1951654_-	TIGR02813, omega-3_polyunsaturated_fatty_acid_synthase_PfaA, polyketide-type polyunsaturated fatty acid synthase PfaA	NA|1264aa|up_8|NC_003272.1_1951709_1955501_-	TIGR02813, omega-3_polyunsaturated_fatty_acid_synthase_PfaA, polyketide-type polyunsaturated fatty acid synthase PfaA	NA|988aa|up_7|NC_003272.1_1956110_1959074_-	cd05930, A_NRPS, The adenylation domain of nonribosomal peptide synthetases (NRPS)	NA|1588aa|up_6|NC_003272.1_1959319_1964083_-	COG3321, COG3321, Polyketide synthase modules and related proteins [Secondary metabolites biosynthesis, transport, and catabolism]	NA|1571aa|up_5|NC_003272.1_1964097_1968810_-	COG3321, COG3321, Polyketide synthase modules and related proteins [Secondary metabolites biosynthesis, transport, and catabolism]	NA|86aa|up_4|NC_003272.1_1969134_1969392_-	pfam00550, PP-binding, Phosphopantetheine attachment site	NA|278aa|up_3|NC_003272.1_1969529_1970363_-	COG2207, AraC, AraC-type DNA-binding domain-containing proteins [Transcription]	NA|260aa|up_2|NC_003272.1_1972328_1973108_+	NA	NA|316aa|up_1|NC_003272.1_1973155_1974103_+	NA	NA|328aa|up_0|NC_003272.1_1974359_1975343_+	pfam07589, VPEP, PEP-CTERM motif	NA|1035aa|down_0|NC_003272.1_1977238_1980343_+	COG0841, AcrB, Cation/multidrug efflux pump [Defense mechanisms]	NA|586aa|down_1|NC_003272.1_1980941_1982699_+	COG2831, FhaC, Hemolysin activation/secretion protein [Intracellular trafficking and secretion]	NA|101aa|down_2|NC_003272.1_1982832_1983135_-	NA	NA|79aa|down_3|NC_003272.1_1983277_1983514_+	NA	NA|89aa|down_4|NC_003272.1_1983539_1983806_+	NA	NA|497aa|down_5|NC_003272.1_1983933_1985424_-	PRK00139, murE, UDP-N-acetylmuramoylalanyl-D-glutamate--2,6-diaminopimelate ligase; Provisional	NA|96aa|down_6|NC_003272.1_1985456_1985744_-	pfam05768, DUF836, Glutaredoxin-like domain (DUF836)	NA|472aa|down_7|NC_003272.1_1986106_1987522_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|488aa|down_8|NC_003272.1_1987790_1989254_+	COG2027, DacB, D-alanyl-D-alanine carboxypeptidase (penicillin-binding protein 4) [Cell envelope biogenesis, outer membrane]	NA|428aa|down_9|NC_003272.1_1990620_1991904_+	cd03794, GT4_WbuB-like, Escherichia coli WbuB and similar proteins
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	11	2178258-2178438	10	CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	GTTTCCATCCCCGTGAGGGGTAAGAGATTAAAAAC	35	0	0	NA	NA	NA	2	2	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|82aa|up_2|NC_003272.1_2175324_2175570_+,NA|343aa|up_1|NC_003272.1_2175578_2176607_+,NA|105aa|down_1|NC_003272.1_2179967_2180282_-,NA|190aa|down_2|NC_003272.1_2180443_2181013_-,NA|144aa|down_3|NC_003272.1_2181342_2181774_+	NA|281aa|up_9|NC_003272.1_2164273_2165116_+	PLN02244, PLN02244, tocopherol O-methyltransferase	NA|1288aa|up_8|NC_003272.1_2165158_2169022_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|277aa|up_7|NC_003272.1_2170421_2171252_+	COG1562, ERG9, Phytoene/squalene synthetase [Lipid metabolism]	NA|262aa|up_6|NC_003272.1_2171315_2172101_-	COG1714, COG1714, Predicted membrane protein/domain [Function unknown]	NA|285aa|up_5|NC_003272.1_2172168_2173023_-	pfam10110, GPDPase_memb, Membrane domain of glycerophosphoryl diester phosphodiesterase	NA|319aa|up_4|NC_003272.1_2173104_2174061_+	COG1300, SpoIIM, Uncharacterized membrane protein [Function unknown]	NA|156aa|up_3|NC_003272.1_2174289_2174757_+	COG0071, IbpA, Molecular chaperone (small heat shock protein) [Posttranslational modification, protein turnover, chaperones]	NA|82aa|up_2|NC_003272.1_2175324_2175570_+	NA	NA|343aa|up_1|NC_003272.1_2175578_2176607_+	NA	NA|501aa|up_0|NC_003272.1_2176666_2178169_-	cd07786, FGGY_EcGK_like, Escherichia coli glycerol kinase-like proteins; belongs to the FGGY family of carbohydrate kinases	NA|123aa|down_0|NC_003272.1_2179609_2179978_-	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|105aa|down_1|NC_003272.1_2179967_2180282_-	NA	NA|190aa|down_2|NC_003272.1_2180443_2181013_-	NA	NA|144aa|down_3|NC_003272.1_2181342_2181774_+	NA	NA|216aa|down_4|NC_003272.1_2181763_2182411_-	cd06259, YdcF-like, YdcF-like	NA|559aa|down_5|NC_003272.1_2183274_2184951_+	COG2335, COG2335, Secreted and surface protein containing fasciclin-like repeats [Cell envelope biogenesis, outer membrane]	NA|1010aa|down_6|NC_003272.1_2185026_2188056_-	COG4995, COG4995, Uncharacterized protein conserved in bacteria [Function unknown]	NA|194aa|down_7|NC_003272.1_2188124_2188706_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|145aa|down_8|NC_003272.1_2188886_2189321_+	pfam10990, DUF2809, Protein of unknown function (DUF2809)	NA|367aa|down_9|NC_003272.1_2189615_2190716_-	COG3839, MalK, ABC-type sugar transport systems, ATPase components [Carbohydrate transport and metabolism]
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	12	2178606-2179167	7,11,6	PILER-CR,CRISPRCasFinder,CRT	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	GTTTCCATCCCCGTGAGGGGTAAGAGATTAAAAAC,GTTTCCATCCCCGTGAGGGGTAAGAGATTAAAAAC,GTTTCCATCCCCGTGAGGGGTAAGAGATTAAAAAC	35,35,35	0	0	NA	NA	NA:NA:NA	7,7,7	7	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|82aa|up_2|NC_003272.1_2175324_2175570_+,NA|343aa|up_1|NC_003272.1_2175578_2176607_+,NA|105aa|down_1|NC_003272.1_2179967_2180282_-,NA|190aa|down_2|NC_003272.1_2180443_2181013_-,NA|144aa|down_3|NC_003272.1_2181342_2181774_+	NA|281aa|up_9|NC_003272.1_2164273_2165116_+	PLN02244, PLN02244, tocopherol O-methyltransferase	NA|1288aa|up_8|NC_003272.1_2165158_2169022_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|277aa|up_7|NC_003272.1_2170421_2171252_+	COG1562, ERG9, Phytoene/squalene synthetase [Lipid metabolism]	NA|262aa|up_6|NC_003272.1_2171315_2172101_-	COG1714, COG1714, Predicted membrane protein/domain [Function unknown]	NA|285aa|up_5|NC_003272.1_2172168_2173023_-	pfam10110, GPDPase_memb, Membrane domain of glycerophosphoryl diester phosphodiesterase	NA|319aa|up_4|NC_003272.1_2173104_2174061_+	COG1300, SpoIIM, Uncharacterized membrane protein [Function unknown]	NA|156aa|up_3|NC_003272.1_2174289_2174757_+	COG0071, IbpA, Molecular chaperone (small heat shock protein) [Posttranslational modification, protein turnover, chaperones]	NA|82aa|up_2|NC_003272.1_2175324_2175570_+	NA	NA|343aa|up_1|NC_003272.1_2175578_2176607_+	NA	NA|501aa|up_0|NC_003272.1_2176666_2178169_-	cd07786, FGGY_EcGK_like, Escherichia coli glycerol kinase-like proteins; belongs to the FGGY family of carbohydrate kinases	NA|123aa|down_0|NC_003272.1_2179609_2179978_-	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|105aa|down_1|NC_003272.1_2179967_2180282_-	NA	NA|190aa|down_2|NC_003272.1_2180443_2181013_-	NA	NA|144aa|down_3|NC_003272.1_2181342_2181774_+	NA	NA|216aa|down_4|NC_003272.1_2181763_2182411_-	cd06259, YdcF-like, YdcF-like	NA|559aa|down_5|NC_003272.1_2183274_2184951_+	COG2335, COG2335, Secreted and surface protein containing fasciclin-like repeats [Cell envelope biogenesis, outer membrane]	NA|1010aa|down_6|NC_003272.1_2185026_2188056_-	COG4995, COG4995, Uncharacterized protein conserved in bacteria [Function unknown]	NA|194aa|down_7|NC_003272.1_2188124_2188706_+	cd06260, DUF820, Domain of unknown function (DUF820)	NA|145aa|down_8|NC_003272.1_2188886_2189321_+	pfam10990, DUF2809, Protein of unknown function (DUF2809)	NA|367aa|down_9|NC_003272.1_2189615_2190716_-	COG3839, MalK, ABC-type sugar transport systems, ATPase components [Carbohydrate transport and metabolism]
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	13	3274979-3275083	12	CRISPRCasFinder	no	c2c5_V-U5	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Type V-U5	TCAGTTTTAAAGAATTATTGTCCAA	25	0	0	NA	NA	NA	1	1	TypeV-U5	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA,NA|79aa|down_3|NC_003272.1_3277321_3277558_-,NA|49aa|down_6|NC_003272.1_3281937_3282084_-,c2c5_V-U5|675aa|down_7|NC_003272.1_3282085_3284110_+	NA|438aa|up_9|NC_003272.1_3238655_3239969_-	cd06173, MFS_MefA_like, Macrolide efflux protein A and similar proteins of the Major Facilitator Superfamily of transporters	NA|868aa|up_8|NC_003272.1_3240066_3242670_-	TIGR01783, Ferrienterobactin_receptor, TonB-dependent siderophore receptor	NA|454aa|up_7|NC_003272.1_3242897_3244259_-	TIGR01843, Hemolysin_secretion_protein_D_plasmid, type I secretion membrane fusion protein, HlyD family	NA|977aa|up_6|NC_003272.1_3244519_3247450_-	COG2274, SunT, ABC-type bacteriocin/lantibiotic exporters, contain an N-terminal double-glycine peptidase domain [Defense mechanisms]	NA|226aa|up_5|NC_003272.1_3247586_3248264_-	COG0760, SurA, Parvulin-like peptidyl-prolyl isomerase [Posttranslational modification, protein turnover, chaperones]	NA|1207aa|up_4|NC_003272.1_3248681_3252302_+	cd05931, FAAL, Fatty acyl-AMP ligase (FAAL)	NA|2456aa|up_3|NC_003272.1_3252398_3259766_+	COG3321, COG3321, Polyketide synthase modules and related proteins [Secondary metabolites biosynthesis, transport, and catabolism]	NA|2519aa|up_2|NC_003272.1_3259880_3267437_+	COG3321, COG3321, Polyketide synthase modules and related proteins [Secondary metabolites biosynthesis, transport, and catabolism]	NA|216aa|up_1|NC_003272.1_3267480_3268128_-	cd04302, HAD_5NT, haloacid dehalogenase (HAD)-like 5'-nucleotidases similar to the Pseudomonas aeruginosa PA0065	NA|1947aa|up_0|NC_003272.1_3268693_3274534_+	COG3899, COG3899, Predicted ATPase [General function prediction only]	NA|298aa|down_0|NC_003272.1_3275412_3276306_+	pfam13612, DDE_Tnp_1_3, Transposase DDE domain	NA|180aa|down_1|NC_003272.1_3276292_3276832_-	COG0610, COG0610, Type I site-specific restriction-modification system, R (restriction) subunit and related helicases [Defense mechanisms]	NA|130aa|down_2|NC_003272.1_3276935_3277325_-	COG3744, COG3744, PIN domain nuclease, a component of toxin-antitoxin system (PIN domain) [Signal transduction mechanisms]	NA|79aa|down_3|NC_003272.1_3277321_3277558_-	NA	NA|426aa|down_4|NC_003272.1_3277623_3278901_-	cd17264, RMtype1_S_Eco3763I-TRD2-CR2_like, Type I restriction-modification system specificity (S) subunit Target Recognition Domain-ConseRved domain (TRD-CR), similar to Escherichia coli O69:H11 07-3763 S subunit (S	NA|49aa|down_5|NC_003272.1_3281509_3281656_-	pfam07878, RHH_5, CopG-like RHH_1 or ribbon-helix-helix domain, RHH_5	NA|49aa|down_6|NC_003272.1_3281937_3282084_-	NA	c2c5_V-U5|675aa|down_7|NC_003272.1_3282085_3284110_+	NA	NA|265aa|down_8|NC_003272.1_3284235_3285029_-	pfam13340, DUF4096, Putative transposase of IS4/5 family (DUF4096)	NA|298aa|down_9|NC_003272.1_3285535_3286429_+	pfam13612, DDE_Tnp_1_3, Transposase DDE domain
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	14	3516819-3517367	13,7,8	CRISPRCasFinder,CRT,PILER-CR	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	GTTTCAATCCCTGATAGGGATTTTTGTTAGTTAAAAC,GTTTCAATCCCTGATAGGGATTTTTGTTAGTTAAAAC,TTCAATCCCTGATAGGGATTTTTGTTAGTTAAAAC	37,37,35	0	0	NA	NA	I-D,II-B:I-D,II-B:I-D,II-B	7,7,6	7	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA,NA|126aa|down_5|NC_003272.1_3527413_3527791_+,NA|169aa|down_6|NC_003272.1_3527928_3528435_+,NA|499aa|down_9|NC_003272.1_3530310_3531807_+	NA|335aa|up_9|NC_003272.1_3498852_3499857_+	COG4240, COG4240, Predicted kinase [General function prediction only]	NA|331aa|up_8|NC_003272.1_3499901_3500894_-	COG3706, PleD, Response regulator containing a CheY-like receiver domain and a GGDEF domain [Signal transduction mechanisms]	NA|1818aa|up_7|NC_003272.1_3500890_3506344_-	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional	NA|486aa|up_6|NC_003272.1_3507042_3508500_-	pfam02696, UPF0061, Uncharacterized ACR, YdiU/UPF0061 family	NA|459aa|up_5|NC_003272.1_3509079_3510456_+	pfam13379, NMT1_2, NMT1-like family	NA|280aa|up_4|NC_003272.1_3510546_3511386_+	TIGR01183, Nitrate_transport_permease_protein_NrtB, nitrate ABC transporter, permease protein	NA|668aa|up_3|NC_003272.1_3511459_3513463_+	TIGR01184, Nitrate_transport_ATP-binding_protein_NrtC, nitrate transport ATP-binding subunits C and D	NA|290aa|up_2|NC_003272.1_3513585_3514455_+	TIGR01184, Nitrate_transport_ATP-binding_protein_NrtC, nitrate transport ATP-binding subunits C and D	NA|292aa|up_1|NC_003272.1_3515094_3515970_+	PRK13057, PRK13057, lipid kinase	NA|211aa|up_0|NC_003272.1_3516115_3516748_+	COG3932, COG3932, Uncharacterized ABC-type transport system, permease components [General function prediction only]	NA|1114aa|down_0|NC_003272.1_3518350_3521692_-	PRK11091, PRK11091, aerobic respiration control sensor protein ArcB; Provisional	NA|103aa|down_1|NC_003272.1_3522617_3522926_+	pfam07688, KaiA, KaiA C-terminal domain	NA|109aa|down_2|NC_003272.1_3523031_3523358_+	PRK09301, PRK09301, circadian clock protein KaiB; Provisional	NA|520aa|down_3|NC_003272.1_3523432_3524992_+	TIGR02655, Circadian_clock_protein_kinase_KaiC, circadian clock protein KaiC	NA|743aa|down_4|NC_003272.1_3525096_3527325_+	COG1538, TolC, Outer membrane protein [Cell envelope biogenesis, outer membrane / Intracellular trafficking and secretion]	NA|126aa|down_5|NC_003272.1_3527413_3527791_+	NA	NA|169aa|down_6|NC_003272.1_3527928_3528435_+	NA	NA|260aa|down_7|NC_003272.1_3528548_3529328_+	TIGR03069, RNA-binding_S4_domain-containing_protein, photosystem II S4 domain protein	NA|259aa|down_8|NC_003272.1_3529350_3530127_-	COG0300, DltE, Short-chain dehydrogenases of various substrate specificities [General function prediction only]	NA|499aa|down_9|NC_003272.1_3530310_3531807_+	NA
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	15	3517472-3518084	8,9,14	CRT,PILER-CR,CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	GTTTCAATCCCTGATAGGGATTTTTGTTAGTTAAAAC,GTTTTAACTAACAAAAATCCCTATCAGGGA----------TTGAAAC,GTTTCAATCCCTGATAGGGATTTTTGTTAGTTAAAAC	37,47,37	0	0	NA	NA	I-D,II-B:I-D,II-B:I-D,II-B	8,7,7	8	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA,NA|126aa|down_5|NC_003272.1_3527413_3527791_+,NA|169aa|down_6|NC_003272.1_3527928_3528435_+,NA|499aa|down_9|NC_003272.1_3530310_3531807_+	NA|335aa|up_9|NC_003272.1_3498852_3499857_+	COG4240, COG4240, Predicted kinase [General function prediction only]	NA|331aa|up_8|NC_003272.1_3499901_3500894_-	COG3706, PleD, Response regulator containing a CheY-like receiver domain and a GGDEF domain [Signal transduction mechanisms]	NA|1818aa|up_7|NC_003272.1_3500890_3506344_-	PRK11107, PRK11107, hybrid sensory histidine kinase BarA; Provisional	NA|486aa|up_6|NC_003272.1_3507042_3508500_-	pfam02696, UPF0061, Uncharacterized ACR, YdiU/UPF0061 family	NA|459aa|up_5|NC_003272.1_3509079_3510456_+	pfam13379, NMT1_2, NMT1-like family	NA|280aa|up_4|NC_003272.1_3510546_3511386_+	TIGR01183, Nitrate_transport_permease_protein_NrtB, nitrate ABC transporter, permease protein	NA|668aa|up_3|NC_003272.1_3511459_3513463_+	TIGR01184, Nitrate_transport_ATP-binding_protein_NrtC, nitrate transport ATP-binding subunits C and D	NA|290aa|up_2|NC_003272.1_3513585_3514455_+	TIGR01184, Nitrate_transport_ATP-binding_protein_NrtC, nitrate transport ATP-binding subunits C and D	NA|292aa|up_1|NC_003272.1_3515094_3515970_+	PRK13057, PRK13057, lipid kinase	NA|211aa|up_0|NC_003272.1_3516115_3516748_+	COG3932, COG3932, Uncharacterized ABC-type transport system, permease components [General function prediction only]	NA|1114aa|down_0|NC_003272.1_3518350_3521692_-	PRK11091, PRK11091, aerobic respiration control sensor protein ArcB; Provisional	NA|103aa|down_1|NC_003272.1_3522617_3522926_+	pfam07688, KaiA, KaiA C-terminal domain	NA|109aa|down_2|NC_003272.1_3523031_3523358_+	PRK09301, PRK09301, circadian clock protein KaiB; Provisional	NA|520aa|down_3|NC_003272.1_3523432_3524992_+	TIGR02655, Circadian_clock_protein_kinase_KaiC, circadian clock protein KaiC	NA|743aa|down_4|NC_003272.1_3525096_3527325_+	COG1538, TolC, Outer membrane protein [Cell envelope biogenesis, outer membrane / Intracellular trafficking and secretion]	NA|126aa|down_5|NC_003272.1_3527413_3527791_+	NA	NA|169aa|down_6|NC_003272.1_3527928_3528435_+	NA	NA|260aa|down_7|NC_003272.1_3528548_3529328_+	TIGR03069, RNA-binding_S4_domain-containing_protein, photosystem II S4 domain protein	NA|259aa|down_8|NC_003272.1_3529350_3530127_-	COG0300, DltE, Short-chain dehydrogenases of various substrate specificities [General function prediction only]	NA|499aa|down_9|NC_003272.1_3530310_3531807_+	NA
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	16	3772540-3772637	15	CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	TTGGAATTTGACGACGTAGATGTTCTAGGCGCAGA	35	0	0	NA	NA	NA	1	1	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|127aa|up_9|NC_003272.1_3760607_3760988_-,NA|64aa|up_8|NC_003272.1_3761115_3761307_+,NA|87aa|up_0|NC_003272.1_3771123_3771384_-,NA	NA|127aa|up_9|NC_003272.1_3760607_3760988_-	NA	NA|64aa|up_8|NC_003272.1_3761115_3761307_+	NA	NA|270aa|up_7|NC_003272.1_3761375_3762185_-	COG5464, COG5464, Uncharacterized conserved protein [Function unknown]	NA|411aa|up_6|NC_003272.1_3762326_3763559_-	PRK05579, PRK05579, bifunctional phosphopantothenoylcysteine decarboxylase/phosphopantothenate synthase; Validated	NA|71aa|up_5|NC_003272.1_3763634_3763847_-	pfam10742, DUF2555, Protein of unknown function (DUF2555)	NA|205aa|up_4|NC_003272.1_3764001_3764616_-	COG0400, COG0400, Predicted esterase [General function prediction only]	NA|577aa|up_3|NC_003272.1_3764871_3766602_-	COG1357, COG1357, Pentapeptide repeats containing protein [Function unknown]	NA|1007aa|up_2|NC_003272.1_3767070_3770091_+	pfam16313, DUF4953, Met-zincin	NA|246aa|up_1|NC_003272.1_3770157_3770895_-	pfam09353, DUF1995, Domain of unknown function (DUF1995)	NA|87aa|up_0|NC_003272.1_3771123_3771384_-	NA	NA|677aa|down_0|NC_003272.1_3773444_3775475_+	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|1275aa|down_1|NC_003272.1_3775962_3779787_+	PRK15347, PRK15347, two component system sensor kinase	NA|383aa|down_2|NC_003272.1_3779783_3780932_+	cd17538, REC_D1_PleD-like, first (D1) phosphoacceptor receiver (REC) domain of response regulator PleD and similar domains	NA|247aa|down_3|NC_003272.1_3781215_3781956_+	pfam02683, DsbD, Cytochrome C biogenesis protein transmembrane region	NA|462aa|down_4|NC_003272.1_3781959_3783345_+	CHL00177, ccs1, c-type cytochrome biogenensis protein; Validated	NA|112aa|down_5|NC_003272.1_3783425_3783761_-	pfam08869, XisI, XisI protein	NA|238aa|down_6|NC_003272.1_3784285_3784999_+	COG5398, COG5398, Heme oxygenase [Inorganic ion transport and metabolism]	NA|461aa|down_7|NC_003272.1_3785365_3786748_+	PRK09249, PRK09249, coproporphyrinogen dehydrogenase	NA|303aa|down_8|NC_003272.1_3786994_3787903_-	COG4278, COG4278, Uncharacterized conserved protein [Function unknown]	NA|71aa|down_9|NC_003272.1_3788538_3788751_-	pfam09957, VapB_antitoxin, Bacterial antitoxin of type II TA system, VapB
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	17	3840120-3840737	10,16,9,11	PILER-CR,CRISPRCasFinder,CRT,PILER-CR	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	TGTTTC----------AATCCCTAATAGGGATTATATGGTGTTGCAAC,GTTGCAACACCATATAATCCCTATTAGGGATTGAAAC,GTTGCAACACCATATAATCCCTATTAGGGATTGAAAC,GGTTTC----------AATCCCTAATAGGGATTATATGGTGTTGCAACT	48,37,37,49	0	0	NA	NA	N:A	6,8,8,6	8	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|99aa|up_6|NC_003272.1_3830410_3830707_-,NA|144aa|down_2|NC_003272.1_3842359_3842791_-,NA|265aa|down_4|NC_003272.1_3843827_3844622_+	NA|642aa|up_9|NC_003272.1_3826185_3828111_-	cd07551, P-type_ATPase_HM_ZosA_PfeT-like, P-type heavy metal-transporting ATPase, similar to Bacillus subtilis ZosA/PfeT which transports copper, and perhaps zinc under oxidative stress, and perhaps ferrous iron	NA|369aa|up_8|NC_003272.1_3828235_3829342_+	COG2082, CobH, Precorrin isomerase [Coenzyme metabolism]	NA|348aa|up_7|NC_003272.1_3829370_3830414_-	COG0628, yhhT, Predicted permease, member of the PurR regulon [General function prediction only]	NA|99aa|up_6|NC_003272.1_3830410_3830707_-	NA	NA|262aa|up_5|NC_003272.1_3831312_3832098_+	cd15240, 7tm_ASR-like, Anabaena sensory rhodopsin and similar proteins, member of the seven-transmembrane GPCR superfamily	NA|126aa|up_4|NC_003272.1_3832114_3832492_+	pfam07100, ASRT, Anabaena sensory rhodopsin transducer	NA|421aa|up_3|NC_003272.1_3832497_3833760_-	TIGR02966, Phosphate_regulon_sensor_protein_PhoR, phosphate regulon sensor kinase PhoR	NA|100aa|up_2|NC_003272.1_3834073_3834373_+	PRK02724, PRK02724, 30S ribosomal protein PSRP-3	NA|560aa|up_1|NC_003272.1_3834496_3836176_-	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|1022aa|up_0|NC_003272.1_3836735_3839801_+	PRK10060, PRK10060, cyclic di-GMP phosphodiesterase	NA|304aa|down_0|NC_003272.1_3840823_3841735_-	COG2207, AraC, AraC-type DNA-binding domain-containing proteins [Transcription]	NA|131aa|down_1|NC_003272.1_3841906_3842299_+	COG3011, COG3011, Predicted thiol-disulfide oxidoreductase [General function    prediction only]	NA|144aa|down_2|NC_003272.1_3842359_3842791_-	NA	NA|185aa|down_3|NC_003272.1_3842919_3843474_-	PRK05800, cobU, adenosylcobinamide kinase/adenosylcobinamide-phosphate guanylyltransferase; Validated	NA|265aa|down_4|NC_003272.1_3843827_3844622_+	NA	NA|314aa|down_5|NC_003272.1_3844811_3845753_+	cd00761, Glyco_tranf_GTA_type, Glycosyltransferase family A (GT-A) includes diverse families of glycosyl transferases with a common GT-A type structural fold	NA|314aa|down_6|NC_003272.1_3845773_3846715_+	cd02511, Beta4Glucosyltransferase, UDP-glucose LOS-beta-1,4 glucosyltransferase is required for biosynthesis of lipooligosaccharide	NA|188aa|down_7|NC_003272.1_3846743_3847307_+	PRK10502, PRK10502, putative acyl transferase; Provisional	NA|268aa|down_8|NC_003272.1_3847389_3848193_-	pfam06051, DUF928, Domain of Unknown Function (DUF928)	NA|781aa|down_9|NC_003272.1_3848275_3850618_-	COG4252, COG4252, Predicted transmembrane sensor domain [Signal transduction mechanisms]
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	18	4362255-4362578	17,10,12	CRISPRCasFinder,CRT,PILER-CR	no	c2c5_V-U5	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Type V-U5	CTTTCAACCCTCCCATTACTGGAAGGAGGGTTGCAACG,CTTTCAACCCTCCCATTACTGGAAGGAGGGTTGCAAC,CTTTCAACCCTCCCATTACTGGAAGGAGGGTTGCAACG	38,37,38	0	0	NA	NA	N:A	4,4,3	4	TypeV-U5	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|499aa|up_8|NC_003272.1_4350643_4352140_+,NA|175aa|up_5|NC_003272.1_4355338_4355863_-,NA|105aa|down_3|NC_003272.1_4367526_4367841_-,NA|331aa|down_5|NC_003272.1_4370938_4371931_+,NA|73aa|down_7|NC_003272.1_4373441_4373660_+	NA|402aa|up_9|NC_003272.1_4349313_4350519_-	PRK09303, PRK09303, histidine kinase	NA|499aa|up_8|NC_003272.1_4350643_4352140_+	NA	NA|659aa|up_7|NC_003272.1_4352810_4354787_+	cd17640, LC_FACS_like, Long-chain fatty acid CoA synthetase	NA|151aa|up_6|NC_003272.1_4354829_4355282_+	pfam11068, YlqD, YlqD protein	NA|175aa|up_5|NC_003272.1_4355338_4355863_-	NA	NA|431aa|up_4|NC_003272.1_4356209_4357502_+	PRK11856, PRK11856, branched-chain alpha-keto acid dehydrogenase subunit E2; Reviewed	NA|233aa|up_3|NC_003272.1_4357615_4358314_+	sd00006, TPR, Tetratricopeptide repeat	NA|553aa|up_2|NC_003272.1_4358562_4360221_+	pfam07602, DUF1565, Protein of unknown function (DUF1565)	NA|89aa|up_1|NC_003272.1_4360601_4360868_-	pfam11998, DUF3493, Protein of unknown function (DUF3493)	NA|265aa|up_0|NC_003272.1_4361123_4361917_+	pfam13340, DUF4096, Putative transposase of IS4/5 family (DUF4096)	c2c5_V-U5|640aa|down_0|NC_003272.1_4363024_4364944_-	TIGR01766, Putative_transposase_MJ0751, transposase, IS605 OrfB family, central region	NA|151aa|down_1|NC_003272.1_4365026_4365479_+	cd01105, HTH_GlnR-like, Helix-Turn-Helix DNA binding domain of GlnR-like transcription regulators	NA|617aa|down_2|NC_003272.1_4365533_4367384_-	COG3472, COG3472, Uncharacterized conserved protein [Function unknown]	NA|105aa|down_3|NC_003272.1_4367526_4367841_-	NA	NA|777aa|down_4|NC_003272.1_4368582_4370913_+	COG4096, HsdR, Type I site-specific restriction-modification system, R (restriction) subunit and related helicases [Defense mechanisms]	NA|331aa|down_5|NC_003272.1_4370938_4371931_+	NA	NA|485aa|down_6|NC_003272.1_4371938_4373393_+	COG0286, HsdM, Type I restriction-modification system methyltransferase subunit [Defense mechanisms]	NA|73aa|down_7|NC_003272.1_4373441_4373660_+	NA	NA|141aa|down_8|NC_003272.1_4373643_4374066_+	COG5573, COG5573, Predicted nucleic-acid-binding protein, contains PIN domain [General function prediction only]	NA|147aa|down_9|NC_003272.1_4374062_4374503_+	cd17266, RMtype1_S_Sau1132ORF3780P-TRD2-CR2_like, Type I restriction-modification system specificity (S) subunit Target Recognition Domain-ConseRved domain (TRD-CR), similar to Staphylococcus aureus subsp
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	19	4682741-4682812	18	CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	CCCGGCTTGTAGCGAATGGCGTG	23	0	0	NA	NA	N:A	1	1	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA,NA|73aa|down_0|NC_003272.1_4682827_4683046_-,NA|69aa|down_5|NC_003272.1_4687482_4687689_+,NA|55aa|down_7|NC_003272.1_4689348_4689513_-,NA|247aa|down_8|NC_003272.1_4690044_4690785_+	NA|503aa|up_9|NC_003272.1_4670925_4672434_+	PRK14508, PRK14508, 4-alpha-glucanotransferase; Provisional	NA|267aa|up_8|NC_003272.1_4672521_4673322_-	COG1426, COG1426, Predicted transcriptional regulator contains Xre-like HTH domain [Function unknown]	NA|263aa|up_7|NC_003272.1_4673407_4674196_-	COG1187, RsuA, 16S rRNA uridine-516 pseudouridylate synthase and related pseudouridylate synthases [Translation, ribosomal structure and biogenesis]	NA|238aa|up_6|NC_003272.1_4674471_4675185_+	pfam11209, DUF2993, Protein of unknown function (DUF2993)	NA|295aa|up_5|NC_003272.1_4675267_4676152_-	PLN02953, PLN02953, phosphatidate cytidylyltransferase	NA|201aa|up_4|NC_003272.1_4676298_4676901_-	PRK07402, PRK07402, precorrin-6Y C5,15-methyltransferase subunit CbiT	NA|464aa|up_3|NC_003272.1_4676995_4678387_+	cd14014, STKc_PknB_like, Catalytic domain of bacterial Serine/Threonine kinases, PknB and similar proteins	NA|57aa|up_2|NC_003272.1_4678708_4678879_+	COG1826, TatA, Sec-independent protein secretion pathway components [Intracellular trafficking and secretion]	NA|902aa|up_1|NC_003272.1_4678949_4681655_-	TIGR02068, Cyanophycin_synthetase, cyanophycin synthetase	NA|288aa|up_0|NC_003272.1_4681827_4682691_-	COG4242, CphB, Cyanophycinase and related exopeptidases [Secondary metabolites biosynthesis, transport, and catabolism / Inorganic ion transport and metabolism]	NA|73aa|down_0|NC_003272.1_4682827_4683046_-	NA	NA|253aa|down_1|NC_003272.1_4683303_4684062_+	PRK00026, trmD, tRNA (guanine-N(1)-)-methyltransferase; Reviewed	NA|166aa|down_2|NC_003272.1_4684072_4684570_+	pfam02542, YgbB, YgbB family	NA|596aa|down_3|NC_003272.1_4684651_4686439_+	cd08500, PBP2_NikA_DppA_OppA_like_4, The substrate-binding component of an uncharacterized ABC-type nickel/dipeptide/oligopeptide-like import system contains the type 2 periplasmic binding fold	NA|263aa|down_4|NC_003272.1_4686520_4687309_+	COG1691, COG1691, NCAIR mutase (PurE)-related proteins [General function prediction only]	NA|69aa|down_5|NC_003272.1_4687482_4687689_+	NA	NA|462aa|down_6|NC_003272.1_4687821_4689207_+	PRK00855, PRK00855, argininosuccinate lyase; Provisional	NA|55aa|down_7|NC_003272.1_4689348_4689513_-	NA	NA|247aa|down_8|NC_003272.1_4690044_4690785_+	NA	NA|571aa|down_9|NC_003272.1_4690924_4692637_-	COG0426, FpaA, Uncharacterized flavoproteins [Energy production and conversion]
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	20	5646379-5647145	19,11,13	CRISPRCasFinder,CRT,PILER-CR	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	GTTTCCATCCCCTTTCGGGGTGATGTGATCGGAAAG,GTTTCCATCCCCTTTCGGGGTGATGTGATCGGAAAG,CTTTCCGATCACATCACCCCGAAAGGGGATGGAAAC	36,36,36	0	0	NA	NA	N:A	10,10,9	10	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA,NA|529aa|down_4|NC_003272.1_5654598_5656185_+,NA|64aa|down_5|NC_003272.1_5656391_5656583_-	NA|354aa|up_9|NC_003272.1_5628087_5629149_-	COG0523, COG0523, Putative GTPases (G3E family) [General function prediction only]	NA|613aa|up_8|NC_003272.1_5629259_5631098_-	PRK12305, thrS, threonyl-tRNA synthetase; Reviewed	NA|411aa|up_7|NC_003272.1_5631209_5632442_-	pfam13434, K_oxygenase, L-lysine 6-monooxygenase (NADPH-requiring)	NA|337aa|up_6|NC_003272.1_5632501_5633512_-	PRK09283, PRK09283, porphobilinogen synthase	NA|372aa|up_5|NC_003272.1_5633624_5634740_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|239aa|up_4|NC_003272.1_5634736_5635453_-	COG0745, OmpR, Response regulators consisting of a CheY-like receiver domain and a winged-helix DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|237aa|up_3|NC_003272.1_5635711_5636422_-	cd10911, PIN_LabA, PIN domain of Synechococcus elongatus LabA (low-amplitude and bright) and related proteins	NA|592aa|up_2|NC_003272.1_5639127_5640903_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|1229aa|up_1|NC_003272.1_5641381_5645068_+	TIGR02025, Magnesium-chelatase_subunit_H, magnesium chelatase, H subunit	NA|181aa|up_0|NC_003272.1_5645250_5645793_+	COG1943, COG1943, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|185aa|down_0|NC_003272.1_5647524_5648079_-	pfam01243, Putative_PNPOx, Pyridoxamine 5'-phosphate oxidase	NA|224aa|down_1|NC_003272.1_5648263_5648935_-	pfam12900, Pyridox_ox_2, Pyridoxamine 5'-phosphate oxidase	NA|491aa|down_2|NC_003272.1_5649033_5650506_+	COG1167, ARO8, Transcriptional regulators containing a DNA-binding HTH domain and an aminotransferase domain (MocR family) and their eukaryotic orthologs [Transcription / Amino acid transport and metabolism]	NA|555aa|down_3|NC_003272.1_5652123_5653788_+	pfam04966, OprB, Carbohydrate-selective porin, OprB family	NA|529aa|down_4|NC_003272.1_5654598_5656185_+	NA	NA|64aa|down_5|NC_003272.1_5656391_5656583_-	NA	NA|614aa|down_6|NC_003272.1_5656757_5658599_-	COG4715, COG4715, Uncharacterized conserved protein [Function unknown]	NA|476aa|down_7|NC_003272.1_5658888_5660316_+	PRK06416, PRK06416, dihydrolipoamide dehydrogenase; Reviewed	NA|297aa|down_8|NC_003272.1_5660423_5661314_+	PRK00278, trpC, indole-3-glycerol phosphate synthase TrpC	NA|83aa|down_9|NC_003272.1_5661593_5661842_+	pfam17275, DUF5340, Family of unknown function (DUF5340)
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	21	5654133-5654384	14,20,12	PILER-CR,CRISPRCasFinder,CRT	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	GTTAAAACCCTCTAAAATCCCTATCAGGGA----------TTGAAAC,GTTAAAACCCTCTAAAATCCCTATCAGGGATTGAAAC,GTTAAAACCCTCTAAAATCCCTATCAGGGATTGAAAC	47,37,37	0	0	NA	NA	N:A	3,3,3	3	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA,NA|529aa|down_0|NC_003272.1_5654598_5656185_+,NA|64aa|down_1|NC_003272.1_5656391_5656583_-	NA|372aa|up_9|NC_003272.1_5633624_5634740_-	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|239aa|up_8|NC_003272.1_5634736_5635453_-	COG0745, OmpR, Response regulators consisting of a CheY-like receiver domain and a winged-helix DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|237aa|up_7|NC_003272.1_5635711_5636422_-	cd10911, PIN_LabA, PIN domain of Synechococcus elongatus LabA (low-amplitude and bright) and related proteins	NA|592aa|up_6|NC_003272.1_5639127_5640903_-	COG1132, MdlB, ABC-type multidrug transport system, ATPase and permease components [Defense mechanisms]	NA|1229aa|up_5|NC_003272.1_5641381_5645068_+	TIGR02025, Magnesium-chelatase_subunit_H, magnesium chelatase, H subunit	NA|181aa|up_4|NC_003272.1_5645250_5645793_+	COG1943, COG1943, Transposase and inactivated derivatives [DNA replication, recombination, and repair]	NA|185aa|up_3|NC_003272.1_5647524_5648079_-	pfam01243, Putative_PNPOx, Pyridoxamine 5'-phosphate oxidase	NA|224aa|up_2|NC_003272.1_5648263_5648935_-	pfam12900, Pyridox_ox_2, Pyridoxamine 5'-phosphate oxidase	NA|491aa|up_1|NC_003272.1_5649033_5650506_+	COG1167, ARO8, Transcriptional regulators containing a DNA-binding HTH domain and an aminotransferase domain (MocR family) and their eukaryotic orthologs [Transcription / Amino acid transport and metabolism]	NA|555aa|up_0|NC_003272.1_5652123_5653788_+	pfam04966, OprB, Carbohydrate-selective porin, OprB family	NA|529aa|down_0|NC_003272.1_5654598_5656185_+	NA	NA|64aa|down_1|NC_003272.1_5656391_5656583_-	NA	NA|614aa|down_2|NC_003272.1_5656757_5658599_-	COG4715, COG4715, Uncharacterized conserved protein [Function unknown]	NA|476aa|down_3|NC_003272.1_5658888_5660316_+	PRK06416, PRK06416, dihydrolipoamide dehydrogenase; Reviewed	NA|297aa|down_4|NC_003272.1_5660423_5661314_+	PRK00278, trpC, indole-3-glycerol phosphate synthase TrpC	NA|83aa|down_5|NC_003272.1_5661593_5661842_+	pfam17275, DUF5340, Family of unknown function (DUF5340)	NA|76aa|down_6|NC_003272.1_5662070_5662298_-	pfam11165, DUF2949, Protein of unknown function (DUF2949)	NA|174aa|down_7|NC_003272.1_5662802_5663324_-	COG1430, COG1430, Uncharacterized conserved protein [Function unknown]	NA|229aa|down_8|NC_003272.1_5663529_5664216_-	COG0745, OmpR, Response regulators consisting of a CheY-like receiver domain and a winged-helix DNA-binding domain [Signal transduction mechanisms / Transcription]	NA|306aa|down_9|NC_003272.1_5664298_5665216_-	PRK02649, ppnK, NAD(+) kinase
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	22	5751524-5751631	21	CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	CTCTTTGACCACTCATACTAGTTTGGTCAAAAACGAT	37	0	0	NA	NA	N:A	1	1	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA,NA	NA|638aa|up_9|NC_003272.1_5737372_5739286_-	COG3596, COG3596, Predicted GTPase [General function prediction only]	NA|353aa|up_8|NC_003272.1_5740064_5741123_+	pfam07082, DUF1350, Protein of unknown function (DUF1350)	NA|425aa|up_7|NC_003272.1_5741319_5742594_-	COG2367, PenP, Beta-lactamase class A [Defense mechanisms]	NA|236aa|up_6|NC_003272.1_5743192_5743900_+	COG2148, WcaJ, Sugar transferases involved in lipopolysaccharide synthesis [Cell envelope biogenesis, outer membrane]	NA|280aa|up_5|NC_003272.1_5743900_5744740_-	COG0395, UgpE, ABC-type sugar transport system, permease component [Carbohydrate transport and metabolism]	NA|194aa|up_4|NC_003272.1_5744776_5745358_-	COG0212, COG0212, 5-formyltetrahydrofolate cyclo-ligase [Coenzyme metabolism]	NA|315aa|up_3|NC_003272.1_5745454_5746399_-	cd05239, GDP_FS_SDR_e, GDP-fucose synthetase, extended (e) SDRs	NA|253aa|up_2|NC_003272.1_5748038_5748797_-	TIGR03022, WbaP_sugtrans, Undecaprenyl-phosphate galactose phosphotransferase, WbaP	NA|382aa|up_1|NC_003272.1_5748907_5750053_-	cd03804, GT4_WbaZ-like, mannosyltransferase WbaZ and similar proteins	NA|312aa|up_0|NC_003272.1_5750529_5751465_+	PLN00016, PLN00016, RNA-binding protein; Provisional	NA|430aa|down_0|NC_003272.1_5751638_5752928_-	COG0025, NhaP, NhaP-type Na+/H+ and K+/H+ antiporters [Inorganic ion transport and metabolism]	NA|456aa|down_1|NC_003272.1_5753082_5754450_+	COG2124, CypX, Cytochrome P450 [Secondary metabolites biosynthesis, transport, and catabolism]	NA|1552aa|down_2|NC_003272.1_5754513_5759169_-	cd00200, WD40, WD40 domain, found in a number of eukaryotic proteins that cover a wide variety of functions including adaptor/regulatory modules in signal transduction, pre-mRNA processing and cytoskeleton assembly; typically contains a GH dipeptide 11-24 residues from its N-terminus and the WD dipeptide at its C-terminus and is 40 residues long, hence the name WD40; between GH and WD lies a conserved core; serves as a stable propeller-like platform to which proteins can bind either stably or reversibly; forms a propeller-like structure with several blades where each blade is composed of a four-stranded anti-parallel b-sheet; instances with few detectable copies are hypothesized to form larger structures by dimerization; each WD40 sequence repeat forms the first three strands of one blade and the last strand in the next blade; the last C-terminal WD40 repeat completes the blade structure of the first WD40 repeat to create the closed ring propeller-structure; residues on the top and bottom surface of the propeller are proposed to coordinate interactions with other proteins and/or small ligands; 7 copies of the repeat are present in this alignment	NA|435aa|down_3|NC_003272.1_5759189_5760494_-	pfam07693, KAP_NTPase, KAP family P-loop domain	NA|159aa|down_4|NC_003272.1_5761177_5761654_+	pfam08670, MEKHLA, MEKHLA domain	NA|240aa|down_5|NC_003272.1_5761879_5762599_+	COG0705, COG0705, Membrane associated serine protease [Amino acid transport and metabolism]	NA|778aa|down_6|NC_003272.1_5762620_5764954_-	COG4252, COG4252, Predicted transmembrane sensor domain [Signal transduction mechanisms]	NA|174aa|down_7|NC_003272.1_5765756_5766278_+	cd10911, PIN_LabA, PIN domain of Synechococcus elongatus LabA (low-amplitude and bright) and related proteins	NA|532aa|down_8|NC_003272.1_5766368_5767964_+	PRK00915, PRK00915, 2-isopropylmalate synthase; Validated	NA|286aa|down_9|NC_003272.1_5768032_5768890_+	PRK13577, PRK13577, diaminopimelate epimerase; Provisional
GCF_000009705.1_ASM970v1	NC_003272	Nostoc sp. PCC 7120 = FACHB-418, complete genome	23	5826074-5826154	22	CRISPRCasFinder	no		csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG	Orphan	ACCAATGATTTGGGATAATTATCTGCGT	28	0	0	NA	NA	N:A	1	1	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA,NA	NA|408aa|up_9|NC_003272.1_5812605_5813829_+	cd19920, REC_PA4781-like, phosphoacceptor receiver (REC) domain of cyclic di-GMP phosphodiesterase PA4781 and similar domains	NA|444aa|up_8|NC_003272.1_5814306_5815638_+	cd19920, REC_PA4781-like, phosphoacceptor receiver (REC) domain of cyclic di-GMP phosphodiesterase PA4781 and similar domains	NA|383aa|up_7|NC_003272.1_5815886_5817035_+	COG3287, COG3287, Uncharacterized conserved protein [Function unknown]	NA|343aa|up_6|NC_003272.1_5817050_5818079_+	COG0642, BaeS, Signal transduction histidine kinase [Signal transduction mechanisms]	NA|521aa|up_5|NC_003272.1_5818140_5819703_-	PRK02504, PRK02504, NAD(P)H-quinone oxidoreductase subunit N	NA|511aa|up_4|NC_003272.1_5820138_5821671_-	cd02142, McbC_SagB-like_oxidoreductase, oxidase similar to the microcin B17 processing protein McbC	NA|292aa|up_3|NC_003272.1_5821874_5822750_-	pfam14257, DUF4349, Domain of unknown function (DUF4349)	NA|153aa|up_2|NC_003272.1_5822842_5823301_-	pfam12158, DUF3592, Protein of unknown function (DUF3592)	NA|489aa|up_1|NC_003272.1_5823471_5824938_-	COG1982, LdcC, Arginine/lysine/ornithine decarboxylases [Amino acid transport and metabolism]	NA|287aa|up_0|NC_003272.1_5825079_5825940_+	pfam06485, DUF1092, Protein of unknown function (DUF1092)	NA|437aa|down_0|NC_003272.1_5826198_5827509_+	COG0312, TldD, Predicted Zn-dependent proteases and their inactivated homologs [General function prediction only]	NA|872aa|down_1|NC_003272.1_5827614_5830230_+	cd01031, EriC, ClC chloride channel EriC	NA|457aa|down_2|NC_003272.1_5830252_5831623_-	COG4370, COG4370, Uncharacterized protein conserved in bacteria [Function unknown]	NA|677aa|down_3|NC_003272.1_5831762_5833793_+	COG4775, COG4775, Outer membrane protein/protective antigen OMA87 [Cell envelope biogenesis, outer membrane]	NA|134aa|down_4|NC_003272.1_5833875_5834277_-	COG2335, COG2335, Secreted and surface protein containing fasciclin-like repeats [Cell envelope biogenesis, outer membrane]	NA|473aa|down_5|NC_003272.1_5834399_5835818_-	COG3670, COG3670, Lignostilbene-alpha,beta-dioxygenase and related enzymes [Secondary metabolites biosynthesis, transport, and catabolism]	NA|584aa|down_6|NC_003272.1_5835840_5837592_-	cd01949, GGDEF, Diguanylate-cyclase (DGC) or GGDEF domain	NA|673aa|down_7|NC_003272.1_5838198_5840217_-	PRK10060, PRK10060, cyclic di-GMP phosphodiesterase	NA|340aa|down_8|NC_003272.1_5841168_5842188_+	cd02801, DUS_like_FMN, Dihydrouridine synthase-like (DUS-like) FMN-binding domain	NA|84aa|down_9|NC_003272.1_5842406_5842658_+	pfam11741, AMIN, AMIN domain
GCF_000009705.1_ASM970v1	NC_003276	Nostoc sp. PCC 7120 = FACHB-418 plasmid pCC7120alpha, complete sequence	1	52724-52840	1	CRISPRCasFinder	no		cas14j,Cas14u_CAS-V,cas14k,Cas14c_CAS-V-F,RT,Cas9_archaeal,c2c9_V-U4	Orphan	TTTAACTATTCTTCTCAAACTCCACTTCAGACAAGACTTAG	41	0	0	NA	NA	N:A	1	1	Orphan	csx18,cas1,cas2,csa3,Cas9_archaeal,Cas14c_CAS-V-F,cas3,csx21,csm3gr7,csx19,csm2gr11,csx10gr5,cas10,cas6,cas14j,WYL,cas10d,csc2gr7,csc1gr5,2OG_CAS,cas4,cas14k,c2c9_V-U4,c2c5_V-U5,RT,DinG,Cas14u_CAS-V	NA|88aa|up_8|NC_003276.1_45337_45601_-,NA|114aa|up_7|NC_003276.1_46026_46368_+,NA|139aa|up_6|NC_003276.1_46549_46966_+,NA|239aa|up_5|NC_003276.1_46958_47675_+,NA|52aa|up_4|NC_003276.1_48145_48301_+,NA|138aa|up_3|NC_003276.1_48310_48724_+,NA|235aa|up_2|NC_003276.1_48720_49425_+,NA|607aa|up_1|NC_003276.1_49436_51257_+,NA|334aa|up_0|NC_003276.1_51294_52296_-,NA|54aa|down_0|NC_003276.1_53240_53402_+,NA|125aa|down_6|NC_003276.1_64267_64642_+,NA|156aa|down_9|NC_003276.1_66196_66664_+	NA|189aa|up_9|NC_003276.1_44748_45315_-	pfam13673, Acetyltransf_10, Acetyltransferase (GNAT) domain	NA|88aa|up_8|NC_003276.1_45337_45601_-	NA	NA|114aa|up_7|NC_003276.1_46026_46368_+	NA	NA|139aa|up_6|NC_003276.1_46549_46966_+	NA	NA|239aa|up_5|NC_003276.1_46958_47675_+	NA	NA|52aa|up_4|NC_003276.1_48145_48301_+	NA	NA|138aa|up_3|NC_003276.1_48310_48724_+	NA	NA|235aa|up_2|NC_003276.1_48720_49425_+	NA	NA|607aa|up_1|NC_003276.1_49436_51257_+	NA	NA|334aa|up_0|NC_003276.1_51294_52296_-	NA	NA|54aa|down_0|NC_003276.1_53240_53402_+	NA	NA|185aa|down_1|NC_003276.1_53469_54024_+	COG1670, RimL, Acetyltransferases, including N-acetylases of ribosomal proteins [Translation, ribosomal structure and biogenesis]	NA|195aa|down_2|NC_003276.1_54375_54960_+	pfam10706, Aminoglyc_resit, Aminoglycoside-2''-adenylyltransferase	NA|749aa|down_3|NC_003276.1_55236_57483_-	TIGR01448, recD_rel, helicase, putative, RecD/TraA family	NA|1190aa|down_4|NC_003276.1_58130_61700_-	TIGR01901, Heme/hemopexin-binding_protein, filamentous hemagglutinin family N-terminal domain	NA|229aa|down_5|NC_003276.1_63088_63775_+	COG0546, Gph, Predicted phosphatases [General function prediction only]	NA|125aa|down_6|NC_003276.1_64267_64642_+	NA	NA|138aa|down_7|NC_003276.1_64654_65068_+	COG1403, McrA, Restriction endonuclease [Defense mechanisms]	NA|343aa|down_8|NC_003276.1_65164_66193_+	cd00796, INT_Rci_Hp1_C, Shufflon-specific DNA recombinase Rci and Bacteriophage Hp1_like integrase, C-terminal catalytic domain	NA|156aa|down_9|NC_003276.1_66196_66664_+	NA
