LOCUS       AJC72901.1              1650 aa    PRT              BCT 19-SEP-2017
DEFINITION  Pseudothermotoga hypogea DSM 11164 = NBRC 106472 DNA-directed
            RNA polymerase subunit beta' protein.
ACCESSION   CP007141-74
PROTEIN_ID  AJC72901.1
SOURCE      Pseudothermotoga hypogea DSM 11164 = NBRC 106472
  ORGANISM  Pseudothermotoga hypogea DSM 11164 = NBRC 106472
            Bacteria; Thermotogae; Thermotogales; Thermotogaceae;
            Pseudothermotoga.
REFERENCE   1  (bases 1 to 2165416)
  AUTHORS   Zhang,X., Alvare,G., Fristensky,B., Chen,L., Suen,T., Chen,Q. and
            Ma,K.
  TITLE     Genome sequencing of Thermotog hypogea
  JOURNAL   Unpublished
REFERENCE   2  (bases 1 to 2165416)
  AUTHORS   Zhang,X., Alvare,G., Fristensky,B., Chen,L., Suen,T., Chen,Q. and
            Ma,K.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-JAN-2014) Department of Biology, University of
            Waterloo, 200 University Avenue West, Waterloo, Ontario N2L 3G1,
            Canada
COMMENT     Annotation was added by the NCBI Prokaryotic Genome Annotation
            Pipeline (released 2013). Information about the Pipeline can be
            found here: http://www.ncbi.nlm.nih.gov/genome/annotation_prok/
            
            ##Genome-Assembly-Data-START##
            Assembly Method       :: Newbler v. 2.6
            Genome Coverage       :: 56X
            Sequencing Technology :: 454 GS FLX Titanium
            ##Genome-Assembly-Data-END##
            
            ##Genome-Annotation-Data-START##
            Annotation Provider          :: NCBI
            Annotation Date              :: 01/17/2014 14:13:17
            Annotation Pipeline          :: NCBI Prokaryotic Genome Annotation
                                            Pipeline
            Annotation Method            :: Best-placed reference protein set;
                                            GeneMarkS+
            Annotation Software revision :: 2.3 (rev. 423251)
            Features Annotated           :: Gene; CDS; rRNA; tRNA; ncRNA;
                                            repeat_region
            Genes                        :: 2,168
            CDS                          :: 2,097
            Pseudo Genes                 :: 21
            CRISPR Arrays                :: 4
            rRNAs                        :: 3 (5S, 16S, 23S)
            tRNAs                        :: 46
            ncRNA                        :: 1
            Frameshifted Genes           :: 9
            ##Genome-Annotation-Data-END##
FEATURES             Qualifiers
     source          /organism="Pseudothermotoga hypogea DSM 11164 = NBRC
                     106472"
                     /mol_type="genomic DNA"
                     /strain="DSM 11164 = NBRC 106472"
                     /isolation_source="an African oil producing well"
                     /culture_collection="DSM:11164"
                     /type_material="type strain of Pseudothermotoga hypogea"
                     /db_xref="taxon:1123384"
                     /country="Cameroon"
                     /collection_date="1979"
     protein         /locus_tag="AJ81_00390"
                     /inference="EXISTENCE: similar to AA
                     sequence:RefSeq:YP_001470109.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /transl_table=11
BEGIN
        1 MAISTFKRKI AAVKIGVASP DTIRSWSSGE VKKPETINYR TFKPERDGLF CEKIFGPTKD
       61 YECACGKYKG KKYEGTVCER CGVRVESKEA RRKRMGHIEL AAPVVHIWYL KSTPSILSTL
      121 LNIPARDLEN IVYYGSRHII EKAYIVTNPK KTSFAEGDVI YETEYNIYKK VLDFEAEQSV
      181 IVKNPKTPVI SEIDGEVSLK NERSNTGRTI TWIIVRNVVR SHVQLFPGMI LLVKNGQEVS
      241 EGDILVAEKE VPALYAPFDG TVEIDELTSS LTLKPLATSK DQPLTVSIPY CCRLTVKNGA
      301 KVKAGDQIWT AGMIQALTSP ASGKVVFGKE LNVRPLEDGS YEVLSSGSIY VEQTAIEKKY
      361 PIFEGALAYV NDGDRVKAGD YLADRFLFED EHLSLSEYAI FQQYYPDQFT VETEVENDRP
      421 ILAITKIDEE LARETSLTVG SIITENEYEA YRELYPGKIE AHYGAAAVKK LLEMIDLEKL
      481 KAQIEAELAE LPKSSGRALK LLRRLKIVKS LINSGARPEW MVLEALPVIP PELRPMIQID
      541 GGRFATTDLN DLYRRVINRN NRLKRFLELN APEVMIRNEM RMLQEAVDSL IYNGRVGRPV
      601 ADRNGRPLKS LTDLVKGKKG RFRRNLLGKR VDYSGRAVIV VGPELKIHQC GLPKKMALEL
      661 FKPFVLAKLL EEGGESSKTA RKLKKTIIER EMPEAWDVLE EVIKGQTVLL NRAPTLHRMS
      721 IQAFEPKLIE GNAIQLHPLV CPPFNADFDG DQMAVHVPLS AAAQAEARYL MLSRYNIISP
      781 AHGKPISMPG KDIIVGIYYL TAVSKDYDFV STDRIEFKFS SPEEAILAHS LGFVGLHTPV
      841 LARVKQNGEE KTLKTTVGRI IFNEIVPEDL RDYSKTFGKK EIKDLIYETF KRHGMEATAD
      901 LLDDMKDLGF HYATVSGLTI SLKDLVVSPK KNAIIKDALE KVEKVEQEYA EGFLTYEERY
      961 KEIIRIWTKA TEEVQKVTYE ALGENPFNPV FMMVNSGARG NIDQVKQLAG MRGLMADPSG
     1021 KTIEIPIISN FREGLNSIEF FISTHGARKG AADTALRTSS AGYLTRRLVD VAQSVFITTT
     1081 DCGTENGVKA LELMSGTLTV QKLKDFLFGR ILARDVIDPL SGEVVKNPDN NREYVRNSML
     1141 SDEDAEFLAK YVVSVPVCVE QVLDLQSLQL PASYAVTDEE IRLEDGTVYE VGTEVSWDLV
     1201 RNARNAGKKQ IKIKVYPVVG TISQEIVWDK KGEKQLLVYQ EEIDEVTAML LEQNGVSAVK
     1261 VRPNIYVRSP LTCEAEHGVC AMCYGMDLSN HKVVNVGEAV GIIAAQSIGE PGTQLTMRTF
     1321 HTGGIATTAD ITQGLPRAEE LFEARKKLKE PEGIFSMVSG FVKDIKEVDG KKKIYIEDLA
     1381 GEIHEYEVPE KVKEIVTRGQ KVLPGQMLTT GAVKLRRMMD ALGVEATAMY LLRETQKVYV
     1441 EQGVDIHNKH FEIIIRQMLG RVEIVDPGDT DFLPGQLLTL SEAMRINNEI LKANAQVQSN
     1501 RNMVVGKILA KKIVAKLKDE VEEIAPEGTE VSEDIVEKAV AAGVKEIVVL EDGKPVTYQI
     1561 APKEPMKYRR RLLRITKASL EQEGWLSAAS FQQTPQVLTE AAIEGRIDYL RGLKENVIVG
     1621 QLIPSGTGLE IFANIQIEET PRAAEEEKMA
//