LOCUS       ASS93002.1               667 aa    PRT              BCT 08-AUG-2017
DEFINITION  Peribacillus simplex NBRC 15720 = DSM 1321 transketolase protein.
ACCESSION   CP017704-577
PROTEIN_ID  ASS93002.1
SOURCE      Peribacillus simplex NBRC 15720 = DSM 1321
  ORGANISM  Peribacillus simplex NBRC 15720 = DSM 1321
            Bacteria; Firmicutes; Bacilli; Bacillales; Bacillaceae;
            Peribacillus.
REFERENCE   1  (bases 1 to 5645783)
  AUTHORS   Park,M.-K., Lee,Y.-J., Yi,H., Bahn,Y.-S., Kim,J.F. and Lee,D.-W.
  TITLE     The whole genome sequencing and assembly of Bacillus simplex DSM
            1321 strain
  JOURNAL   Unpublished
REFERENCE   2  (bases 1 to 5645783)
  AUTHORS   Park,M.-K., Lee,Y.-J., Yi,H., Bahn,Y.-S., Kim,J.F. and Lee,D.-W.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-OCT-2016) Kyungpook National University, School of
            Applied Biosciences, 80 Daehak-Ro, Bukgu, Daegu 41566, South Korea
COMMENT     Annotation was added by the NCBI Prokaryotic Genome Annotation
            Pipeline (released 2013). Information about the Pipeline can be
            found here: https://www.ncbi.nlm.nih.gov/genome/annotation_prok/
            This genome has a base modification file available.
            
            ##Genome-Assembly-Data-START##
            Assembly Method       :: SMRT analysis 2.3 v. HGAP protocol 2
            Genome Coverage       :: missing
            Sequencing Technology :: PacBio
            ##Genome-Assembly-Data-END##
            
            ##Genome-Annotation-Data-START##
            Annotation Provider               :: NCBI
            Annotation Date                   :: 10/17/2016 13:55:10
            Annotation Pipeline               :: NCBI Prokaryotic Genome
                                                 Annotation Pipeline
            Annotation Method                 :: Best-placed reference protein
                                                 set; GeneMarkS+
            Annotation Software revision      :: 3.3
            Features Annotated                :: Gene; CDS; rRNA; tRNA; ncRNA;
                                                 repeat_region
            Genes (total)                     :: 5,348
            CDS (total)                       :: 5,228
            Genes (coding)                    :: 5,118
            CDS (coding)                      :: 5,118
            Genes (RNA)                       :: 120
            rRNAs                             :: 13, 12, 12 (5S, 16S, 23S)
            complete rRNAs                    :: 13, 12, 12 (5S, 16S, 23S)
            tRNAs                             :: 77
            ncRNAs                            :: 6
            Pseudo Genes (total)              :: 110
            Pseudo Genes (ambiguous residues) :: 0 of 110
            Pseudo Genes (frameshifted)       :: 73 of 110
            Pseudo Genes (incomplete)         :: 32 of 110
            Pseudo Genes (internal stop)      :: 34 of 110
            Pseudo Genes (multiple problems)  :: 28 of 110
            ##Genome-Annotation-Data-END##
FEATURES             Qualifiers
     source          /organism="Peribacillus simplex NBRC 15720 = DSM 1321"
                     /mol_type="genomic DNA"
                     /strain="DSM 1321"
                     /isolation_source="soil"
                     /type_material="type strain of Bacillus simplex"
                     /db_xref="taxon:1349754"
                     /collection_date="1989"
     protein         /locus_tag="BS1321_02900"
                     /inference="EXISTENCE: similar to AA
                     sequence:RefSeq:WP_009330561.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /transl_table=11
BEGIN
        1 MLDKLDALSI NTIRTLSIDA IEKANSGHPG MPMGAAPMAY KLWTEYMNHN PKNPDWFNRD
       61 RFVLSAGHGS MLLYSLLHLS GYGLSIDDLK GFRQWGSKTP GHPEYGHTAG VDATTGPLGQ
      121 GIAMAVGMAM AERHLAESYN RDSYNVVDHY TYSICGDGDL MEGVSAEAAS LAGHLQLGRL
      181 VVLYDSNDIS LDGDLSQSFS ESVADRFKSY GWQYIRVEDG NDLQEIAKAI EEAKTDDARP
      241 TLIEVKTVIG YGSPNRSGKS AVHGAPLGAD ELKLTKEAYK WTFEEDFHVP EEVYSHFNEA
      301 VVDAGAQKEE AWNELFKNYK EAHPELAQQL ELAIKGEMPA EWDQEIPVYE EGKTLASRAS
      361 SGEVLNAIAK KVPSFIGGSA DLAGSNNTAI KGETDLLPGN YSGRNIWFGV REFAMGAALN
      421 GMALHGGLKV YGGTFFVFSD YLRPAIRMAA LMGLPVNYVF THDSIAVGED GPTHEPIEQL
      481 AALRAMPNLG VIRPADGNET AAAWKVAMES TNKPTALVLT RQGLPTIKDT SETAYEGVSK
      541 GAYIISASKK EVADALLLAT GSEVNLAVEA QKALANEGID VSVISMPSWD RFETQSKEYK
      601 QSVINPAVKK RLAIELASPF GWDRYAGDEG EILAINHFGA SAPGGKIMEE FGFTVENVVA
      661 RVKEMLK
//