LOCUS       NC_001420               5577 bp    DNA     circular PHG 13-AUG-2018
DEFINITION  Genome of phage G4 (coliphage).
ACCESSION   NC_001420
VERSION     NC_001420.2
DBLINK      BioProject: PRJNA485481
KEYWORDS    RefSeq; circular; coat protein; genome; origin of replication.
SOURCE      Enterobacteria phage G4
  ORGANISM  Enterobacteria phage G4
            Viruses; ssDNA viruses; Microviridae; Bullavirinae; G4microvirus.
REFERENCE   1  (bases 1 to 5577)
  AUTHORS   Godson,G.N., Barrell,B.G., Staden,R. and Fiddes,J.C.
  TITLE     Nucleotide sequence of bacteriophage G4 DNA
  JOURNAL   Nature 276 (5685), 236-247 (1978)
   PUBMED   714153
REFERENCE   2
  AUTHORS   Fiddes,J.C. and Godson,G.N.
  TITLE     Nucleotide sequence of the J gene and surrounding untranslated
            regions of phage G4 DNA: comparison with phage phiX174
  JOURNAL   Cell 15 (3), 1045-1053 (1978)
   PUBMED   728985
REFERENCE   3  (bases 1 to 5577)
  CONSRTM   NCBI Genome Project
  TITLE     Direct Submission
  JOURNAL   Submitted (06-JUL-2018) National Center for Biotechnology
            Information, NIH, Bethesda, MD 20894, USA
COMMENT     PROVISIONAL REFSEQ: This record has not yet been subject to final
            NCBI review. The reference sequence is identical to V00657.
            On Apr 7, 2008 this sequence version replaced NC_001420.1.
            COMPLETENESS: full length.
FEATURES             Location/Qualifiers
     source          1..5577
                     /organism="Enterobacteria phage G4"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:10843"
     gene            59..1723
                     /locus_tag="G4p03"
                     /db_xref="GeneID:1260914"
     CDS             59..1723
                     /locus_tag="G4p03"
                     /note="reading frame (A protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497836.1"
                     /db_xref="GOA:P03632"
                     /db_xref="InterPro:IPR008683"
                     /db_xref="InterPro:IPR008684"
                     /db_xref="UniProtKB/Swiss-Prot:P03632"
                     /db_xref="GeneID:1260914"
                     /translation="MFKVHSDYFSKPNIDAIKPLVETAGMSVLTQSPNLRIWKQCNTR
                     IKLLEEILAHYTNGIRRDDNGDFWMNPNSQLATTIAYRAHHKGHNPKFKQYPETFTLD
                     DIITGKPIPQTAPDELQLSDEIVEDYRLTVLSIIEELQECYDVLGQLDINNTIDHKPL
                     GNDHWNLLYEKPVYKHWYQLVSNRPLKDIRADYNYAKAKGVKDECSKILEESTMKSRR
                     GFTVQRLMNAMRTAHSKGWYVVFDTLTLADDRLKDFYDNPNALRDYFRDIGRMVLTAE
                     GRSVHDSSSDCYQYFCVPEYGTQHGRLHFHAVHLMRTLPLGSLHPNFGKLVRINRQIN
                     SLQNTWPYGYSMPIAVRYSQDAFSRAGWLWPVDSKGEPLKATSYMAVGFYVAKYVNKK
                     SDIDMAVKGLGNKEWNNSLKTKINLIPKKVFRIRMSRNFGMKLLSMAHLSAETLMELT
                     QVGYDVTPFNNILKQNAKKELKSRLAKKSVADVLEAQPVTTNLLKFMRNLTRTIGASN
                     LQSFIASMTTKLTSTDISDETKNYVASAGIAVANLRIKSKWTAGGK"
     gene            698..1723
                     /locus_tag="G4p04"
                     /db_xref="GeneID:1260919"
     CDS             698..1723
                     /locus_tag="G4p04"
                     /note="reading frame (A* protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497837.1"
                     /db_xref="GOA:P03632"
                     /db_xref="InterPro:IPR008683"
                     /db_xref="InterPro:IPR008684"
                     /db_xref="UniProtKB/Swiss-Prot:P03632"
                     /db_xref="GeneID:1260919"
                     /translation="MKSRRGFTVQRLMNAMRTAHSKGWYVVFDTLTLADDRLKDFYDN
                     PNALRDYFRDIGRMVLTAEGRSVHDSSSDCYQYFCVPEYGTQHGRLHFHAVHLMRTLP
                     LGSLHPNFGKLVRINRQINSLQNTWPYGYSMPIAVRYSQDAFSRAGWLWPVDSKGEPL
                     KATSYMAVGFYVAKYVNKKSDIDMAVKGLGNKEWNNSLKTKINLIPKKVFRIRMSRNF
                     GMKLLSMAHLSAETLMELTQVGYDVTPFNNILKQNAKKELKSRLAKKSVADVLEAQPV
                     TTNLLKFMRNLTRTIGASNLQSFIASMTTKLTSTDISDETKNYVASAGIAVANLRIKS
                     KWTAGGK"
     gene            1276..1638
                     /locus_tag="G4p05"
                     /db_xref="GeneID:1260918"
     CDS             1276..1638
                     /locus_tag="G4p05"
                     /note="reading frame (B protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497838.1"
                     /db_xref="GOA:P03634"
                     /db_xref="InterPro:IPR003513"
                     /db_xref="UniProtKB/Swiss-Prot:P03634"
                     /db_xref="GeneID:1260918"
                     /translation="MEQFTQNQNQPHTQESVQNTNVSQFRNETVINGSPVSGNPDGTD
                     PSGLRRDPVQQHLEAERQERAQIEAGKEICRRRFGGATCDDESAKIHAQFDPNNRSVQ
                     PTEFYRFNDHEINKYGYF"
     gene            1638..1808
                     /locus_tag="G4p07"
                     /db_xref="GeneID:1260916"
     CDS             1638..1808
                     /locus_tag="G4p07"
                     /note="reading frame (K protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497839.1"
                     /db_xref="InterPro:IPR020962"
                     /db_xref="UniProtKB/Swiss-Prot:P03654"
                     /db_xref="GeneID:1260916"
                     /translation="MKPKTTLLLQELLLLTYELNRSGLLVENEEIQSQLKKLEVVLLC
                     NLSPSSQRAGKN"
     gene            1720..1974
                     /locus_tag="G4p08"
                     /db_xref="GeneID:1260917"
     CDS             1720..1974
                     /locus_tag="G4p08"
                     /note="reading frame (C protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497840.1"
                     /db_xref="InterPro:IPR016407"
                     /db_xref="UniProtKB/Swiss-Prot:P03636"
                     /db_xref="GeneID:1260917"
                     /translation="MRKFNLNLKNSRSSYFATFRHHLNVLAKTDALDEEKYLNMLGAL
                     LKDWFRYEEHFVHGKQSMLDILKERGLLSTSSTDTNHKGN"
     gene            1976..2434
                     /locus_tag="G4p09"
                     /db_xref="GeneID:1260921"
     CDS             1976..2434
                     /locus_tag="G4p09"
                     /note="reading frame (D protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497841.1"
                     /db_xref="GOA:P03638"
                     /db_xref="InterPro:IPR004196"
                     /db_xref="UniProtKB/Swiss-Prot:P03638"
                     /db_xref="GeneID:1260921"
                     /translation="MSKSNESAVAFQTAIASIKLIQASSVLDLTEDDFDFLTRDRVWI
                     ATDRSRARRAIEACVYGTLDFVGYPRFPAPVEFISAVIAYYVHPVNIQTACLIMEGAE
                     FTENIVNGVERPVKASELFAFTLLVRAGNKDLIGHAETNIREQLRAQGVM"
     gene            2154..2444
                     /locus_tag="G4p10"
                     /db_xref="GeneID:1260912"
     CDS             2154..2444
                     /locus_tag="G4p10"
                     /note="reading frame (E protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497842.1"
                     /db_xref="GOA:P03640"
                     /db_xref="InterPro:IPR007605"
                     /db_xref="UniProtKB/Swiss-Prot:P03640"
                     /db_xref="GeneID:1260912"
                     /translation="MEHWTLSGILAFLLLLSLFLPSLLITFIPLTSKPPVSSWKVLSL
                     PKTSSMVLNAPLKPLNCSPSLFLFAPETKILSVTLKQTSVNSYALKVSCKDL"
     gene            2477..2554
                     /locus_tag="G4p11"
                     /db_xref="GeneID:1260913"
     CDS             2477..2554
                     /locus_tag="G4p11"
                     /note="reading frame (J protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497843.1"
                     /db_xref="GOA:P03652"
                     /db_xref="InterPro:IPR006815"
                     /db_xref="PDB:1GFF"
                     /db_xref="UniProtKB/Swiss-Prot:P03652"
                     /db_xref="GeneID:1260913"
                     /translation="MKKSIRRSGGKSKGARLWYVGGTQY"
     CDS             2600..3883
                     /note="reading frame (F protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497844.1"
                     /db_xref="GOA:P03642"
                     /db_xref="InterPro:IPR003514"
                     /db_xref="InterPro:IPR016184"
                     /db_xref="PDB:1GFF"
                     /db_xref="UniProtKB/Swiss-Prot:P03642"
                     /translation="MSNVQTSADRVPHDLSHLVFEAGKIGRLKTISWTPGGAGDSFEC
                     DMVGAIRLSPLRRGLAVDSRVDIFPFYIPHRHIYGQQWINFMKDGVNASPLPPVTCSS
                     GWDSAAYLGTIPSSTLKVPKFLHQGYLNIYNNYFKPPWSDDLTYANPSNMPSEDYKWG
                     VRVANLKSIWTAPLPPDTRTSENMTTGTSTIDIMGLQAAYAKLHTEQERDYFMTRYRD
                     IMKEFGGHTSYDGDNRPLLLMRSEFWASGYDVDGTDQSSLGQFSGRVQQTFNHKVPRF
                     YVPEHRVIMTLAVTRFPPTHEMEMHYLVGKENLTYTDIACDPALMANLPPREVSLKEF
                     FHSSPDSAKFKIAEGQWYRTQPDRVAFPYNALDGFPFYSALPSTELKDRVLVNTNNYD
                     EIFQSMQLAHWNMQTKFNINVYRHMPTTRDSIMTS"
     misc_feature    3970..3997
                     /note="RNA primer of replication"
     rep_origin      3998
                     /note="origin of compl. strand synthesis"
     gene            4020..4553
                     /locus_tag="G4p12"
                     /db_xref="GeneID:1260923"
     CDS             4020..4553
                     /locus_tag="G4p12"
                     /note="reading frame (G protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497845.1"
                     /db_xref="GOA:P03644"
                     /db_xref="InterPro:IPR003515"
                     /db_xref="InterPro:IPR016184"
                     /db_xref="PDB:1GFF"
                     /db_xref="UniProtKB/Swiss-Prot:P03644"
                     /db_xref="GeneID:1260923"
                     /translation="MFQKFISKHNAPINSTQLAATKTPAVAAPVLSVPNLSRSTILIN
                     ATTTAVTTHSGLCHVVRIDETNPTNHHALSIAGSLSNVPADMIAFAIRFEVADGVVPT
                     AVPALYDVYPIETFNNGKAISFKDAVTIDSHPRTVGNDVYAGIMLWSNAWTASTISGV
                     LSVNQVNREATVLQPLK"
     gene            4564..5577
                     /locus_tag="G4p13"
                     /db_xref="GeneID:1260924"
     CDS             4564..5577
                     /locus_tag="G4p13"
                     /note="reading frame (H protein)"
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="YP_009497846.1"
                     /db_xref="GOA:P03647"
                     /db_xref="InterPro:IPR006777"
                     /db_xref="UniProtKB/Swiss-Prot:P03647"
                     /db_xref="GeneID:1260924"
                     /translation="MFGSIAGGIASALAGGLMGKLFGGGQSADSTGIQGNVLASDNNV
                     VGANDAGIKSAIQGSTVPNSQEAAPSAISGILADSGKHALSSLTNAGANKLMEAVGLS
                     KSASDKGKDTKDYLAAAFPELNPWERAGAGASSPGMQDAGFQNQKELTKMQLDNQKEI
                     AKMQNETQKEIAGLQSITSRENTKDTVYAQNEMLAYNQKESMSRVGAILENTSLTKQQ
                     QTSEIMRQMLTQAQTAGQYFTNDQIKELTRKVGADIDAVRANTARTHVETDRSKQEVQ
                     NSRYASSQVGKTAKDVSNAITDTAGSIVDYFRGADQKVADVYNNYFKDGKSKGIESNH
                     RSK"
ORIGIN      
        1 tgcttgacta atactcaatc accactctaa tatgcctccc atcaaacgga ggcttttcat
       61 gtttaaagta cattctgact acttcagcaa acctaacatc gacgcaatca aacctctcgt
      121 cgaaactgct ggtatgtctg ttcttactca atctccaaac ctccgtatct ggaaacagtg
      181 caatactcgc atcaaattac tggaagaaat ccttgctcac tatacaaatg gtattcgccg
      241 tgacgacaat ggtgacttct ggatgaatcc caactctcaa ctcgcaacta ctattgccta
      301 tcgtgctcat cacaaaggcc ataaccctaa gttcaaacaa tacccagaaa ccttcactct
      361 ggacgacatt attactggta aaccaatccc tcaaactgcc cctgacgaat tacaactctc
      421 cgatgaaatc gttgaagact atcgccttac agtcctctcc ataatcgaag aattgcaaga
      481 atgctatgac gtgctcggac aacttgatat taataacact atagaccaca aacccctcgg
      541 taatgaccat tggaacctcc tctatgaaaa acccgtatac aaacattggt atcagctcgt
      601 ttcaaatcga ccccttaaag atatccgcgc cgattacaac tatgcaaagg ctaagggtgt
      661 taaagatgag tgctcaaaaa tcttggagga gtcaactatg aagtctcgac gtggctttac
      721 cgttcaaaga ttaatgaatg ctatgcgtac tgcccattct aagggctggt atgtcgtatt
      781 cgatactctt actctagccg atgaccgctt aaaggatttc tatgataatc ccaatgctct
      841 tcgtgactac ttccgtgata ttggtcgtat ggtgcttact gccgaaggtc gctcggtgca
      901 tgactcatct tccgactgct atcagtattt ttgtgtgcca gagtatggta cacagcacgg
      961 tcgtctacat ttccacgcag tgcatcttat gcgcacactt cctctgggtt ctctgcaccc
     1021 taacttcggt aagctggtac gcatcaatcg gcaaataaat agcttgcaaa acacgtggcc
     1081 ttatggttac tctatgccca tcgcagtccg gtactcccaa gacgcattct ctcgcgctgg
     1141 ctggctctgg cctgtggact caaagggtga accccttaaa gctacctcgt atatggctgt
     1201 aggcttctac gttgctaaat acgttaacaa aaaatcagat attgacatgg ccgtaaaagg
     1261 cctagggaat aaagaatgga acaattcact caaaaccaaa atcaacctca tacccaagaa
     1321 agtgttcaga atacgaatgt ctcgcaattt cggaatgaaa ctgttatcaa tggctcacct
     1381 gtcagcggaa accctgatgg aactgaccca agtgggttac gacgtgaccc cgttcaacaa
     1441 catcttgaag cagaacgcca agaaagagct caaatcgagg ctggcaaaga aatctgtcgc
     1501 cgacgttttg gaggcgcaac ctgtgacgac gaatctgcta aaattcatgc gcaatttgac
     1561 ccgaacaatc ggagcgtcca acctacagag ttttatcgct tcaatgacca cgaaattaac
     1621 aagtacggat atttctgatg aaaccaaaaa ctacgttgct tctgcaggaa ttgctgttgc
     1681 taacttacga attaaatcga agtggactgc tggtggaaaa tgaggaaatt caatctcaac
     1741 ttaaaaaact cgaggtcgtc ttactttgca acctttcgcc atcatctcaa cgtgctggca
     1801 aaaactgacg cccttgacga ggagaaatac ttaaatatgt taggtgctct cctcaaggac
     1861 tggttccggt acgaagaaca tttcgtgcat ggtaaacaat caatgcttga catactgaaa
     1921 gaacgtggcc tattatccac atcgtcaact gacacaaacc acaaaggaaa ctgaaatgtc
     1981 taaatcaaac gaatctgctg tagcctttca aactgctatc gcttctatca aacttattca
     2041 agcatcttct gttcttgact tgacagagga cgattttgac ttcttaactc gcgaccgtgt
     2101 ctggattgct accgaccgtt cacgcgctcg ccgtgctatc gaggcttgcg tatatggaac
     2161 actggacttt gtcgggtatc ctcgctttcc tgctcctgtt gagtttattt ctgccgtcat
     2221 tgcttattac gttcatcccg ttaacatcca aaccgcctgt ctcatcatgg aaggtgctga
     2281 gtttaccgaa aacatcgtca atggtgttga acgccccgtt aaagcctctg aactgttcgc
     2341 cttcactctt cttgttcgcg ccggaaacaa agatcttatc ggtcacgctg aaacaaacat
     2401 ccgtgaacag ttacgcgctc aaggtgtcat gtaaagacct ttgattttat cgtcttcact
     2461 tttaaggagt tatgtaatga aaaaatcaat tcgccgctct ggtggcaaat ctaagggtgc
     2521 ccgtctctgg tatgtaggcg gaacacaata ctaatctttt atgtgggacc gcggtcccac
     2581 tctatttaag gatacaaaaa tgtctaacgt tcaaacatct gcggaccgtg tacctcatga
     2641 cttatctcac cttgtctttg aggctggtaa aattggccgc ctcaaaacta tctcttggac
     2701 gcctggtggt gctggtgact ctttcgagtg tgatatggtt ggcgctattc gtctgtcccc
     2761 tcttcgtcgt ggcctcgctg ttgactcacg cgttgatatc tttcctttct atatcccaca
     2821 ccgtcatatc tacggtcagc agtggattaa ctttatgaag gatggcgtta atgcctcccc
     2881 tcttcctcct gttacatgct cctctggttg ggactctgct gcttatctcg gtaccattcc
     2941 gtcttctacc cttaaagtgc ctaaattctt acatcagggc tatctgaata tttataataa
     3001 ctacttcaaa ccgccttggt ctgatgactt aacttacgct aacccatcca atatgccttc
     3061 tgaggattat aaatggggcg tacgtgtcgc taaccttaaa tctatctgga ctgcgccact
     3121 tccaccggat actcgtacat ctgaaaacat gactactggt acatccacta ttgacattat
     3181 gggccttcaa gccgcatacg ctaaattaca tacggaacag gaacgtgatt acttcatgac
     3241 ccgttaccgt gacattatga aagagttcgg cggtcataca tcctatgatg gtgacaatcg
     3301 tcctcttctg ctcatgcgct ctgaattttg ggcatctggc tatgacgtag acggtactga
     3361 ccaatcttct ctcggtcaat tctctggtcg cgttcagcag accttcaatc acaaagtccc
     3421 acgcttctat gttcctgagc atcgcgtaat tatgactctg gcggttactc gctttccgcc
     3481 tactcatgaa atggaaatgc actatcttgt aggtaaagaa aacttaactt ataccgatat
     3541 tgcttgtgac cctgcactga tggctaacct gccacctcgt gaagtatcct taaaagaatt
     3601 cttccactcc tcacccgatt ctgctaaatt caaaatcgct gagggccaat ggtatcgtac
     3661 acagcctgac cgtgtcgctt tcccatataa tgctctggat ggattcccgt tctactctgc
     3721 tctcccgtcc acggaactaa aagaccgtgt actggttaac actaataact acgatgaaat
     3781 cttccagtct atgcagcttg cacactggaa tatgcaaact aaatttaaca ttaacgttta
     3841 tcgtcacatg cctacgacac gtgactcaat catgacctcg taacgcaaca aaggccgccc
     3901 ctctactggt cagatacctg cccaatgtgg ggcggaccgt gcctacggag atactcgagt
     3961 ctccgataca tggacggcga aagccgccgt ccctactgca aagccaaaag gactaacata
     4021 tgttccagaa attcatttct aagcacaatg ctccaattaa ctctactcag cttgctgcta
     4081 ctaaaacccc agctgtagcg gcacctgttt tatctgtgcc taacttaagt cgctctacta
     4141 ttctaatcaa tgcaacaacc acagccgtta caactcattc aggcttgtgc catgttgttc
     4201 gcattgatga aacaaaccca acaaatcatc acgctctatc tattgcaggt tcgttatcaa
     4261 acgtccctgc tgatatgatt gcttttgcca ttcgttttga ggtcgctgat ggcgtcgttc
     4321 ctactgccgt cccggcctta tacgacgtct atccaatcga aaccttcaat aacggcaaag
     4381 caatctcatt taaagatgct gttaccatcg actcacatcc ccgcaccgtc ggtaacgacg
     4441 tttatgcggg aatcatgctc tggtctaacg cttggaccgc ctctactatc tctggcgtcc
     4501 tctctgttaa tcaggtaaac cgtgaagcaa ccgtccttca acctctgaaa taaggattat
     4561 cctatgtttg gctctatcgc tggcggtatc gcctccgcac ttgccggagg ccttatgggt
     4621 aaattatttg gcggcggtca gtccgccgac tctaccggaa tccaaggcaa cgtccttgct
     4681 tccgacaaca atgttgtagg tgctaatgat gctggtatta aatctgctat tcagggctct
     4741 actgtcccta actctcagga agctgctccc tctgctatct ctggcatcct tgccgactct
     4801 ggcaagcatg cgctctcgtc tcttaccaat gctggtgcaa ataaactcat ggaggctgtc
     4861 ggcctttcta agtctgcctc tgacaagggc aaggacacaa aagactatct cgccgccgca
     4921 ttccccgagc tcaacccatg ggaacgtgct ggtgctggcg cttctagtcc aggcatgcaa
     4981 gacgctggct tccaaaatca gaaggagcta accaagatgc agcttgacaa ccaaaaggaa
     5041 atcgctaaga tgcaaaacga aactcagaag gaaattgctg ggcttcaatc tattacatca
     5101 cgcgaaaata ctaaggatac tgtctatgct caaaatgaaa tgctcgcgta taaccaaaaa
     5161 gagtctatgt cacgcgttgg cgctattctc gaaaacacaa gcctcaccaa acagcaacaa
     5221 acttctgaaa ttatgcggca aatgcttact caggctcaaa ccgcaggtca atattttaca
     5281 aatgaccaaa tcaaggagct tacgagaaaa gttggtgctg atattgatgc tgttcgcgct
     5341 aacactgcac gcacccatgt agaaaccgac cgctcaaaac aggaagtaca aaactcccgt
     5401 tatgcctctt ctcaggtagg taaaaccgct aaggacgtgt ccaatgcaat tactgataca
     5461 gctggttcta ttgttgatta ttttcgtggt gctgatcaaa aagtggcaga cgtttacaac
     5521 aactatttca aagatggcaa atcgaaagga atagaatcca atcaccgctc caaataa
//

