LOCUS       QJU56452.1              1089 aa    PRT              BCT 18-MAY-2020
DEFINITION  Sphingomonas sp. AP4-R1 peptidase S41 protein.
ACCESSION   CP053346-84
PROTEIN_ID  QJU56452.1
SOURCE      Sphingomonas sp. AP4-R1
  ORGANISM  Sphingomonas sp. AP4-R1
            Bacteria; Proteobacteria; Alphaproteobacteria; Sphingomonadales;
            Sphingomonadaceae; Sphingomonas.
REFERENCE   1  (bases 1 to 5252057)
  AUTHORS   Heo,J., Kim,S.-J., Kim,J.-S., Hong,S.-B. and Kwon,S.-W.
  TITLE     Genome sequencing of strain KACC 21605
  JOURNAL   Unpublished
REFERENCE   2  (bases 1 to 5252057)
  AUTHORS   Heo,J., Kim,S.-J., Kim,J.-S., Hong,S.-B. and Kwon,S.-W.
  TITLE     Direct Submission
  JOURNAL   Submitted (08-MAY-2020) Agricultural Microbiology Division,
            National Institute of Agricultural Sciences, 166
            Nongsaengmyeong-ro, Iseo-myeon, Wanju-gun, Jeollabuk-do 55365,
            South Korea
COMMENT     The annotation was added by the NCBI Prokaryotic Genome Annotation
            Pipeline (PGAP). Information about PGAP can be found here:
            https://www.ncbi.nlm.nih.gov/genome/annotation_prok/
            This genome has a base modification file available.
            
            ##Genome-Assembly-Data-START##
            Assembly Date          :: APR-2020
            Assembly Method        :: RS HGAP Assembly v. 3.0
            Genome Representation  :: Full
            Expected Final Version :: Yes
            Genome Coverage        :: 99.0x
            Sequencing Technology  :: PacBio RSII
            ##Genome-Assembly-Data-END##
            
            ##Genome-Annotation-Data-START##
            Annotation Provider               :: NCBI
            Annotation Date                   :: 05/11/2020 21:04:38
            Annotation Pipeline               :: NCBI Prokaryotic Genome
                                                 Annotation Pipeline (PGAP)
            Annotation Method                 :: Best-placed reference protein
                                                 set; GeneMarkS-2+
            Annotation Software revision      :: 4.11
            Features Annotated                :: Gene; CDS; rRNA; tRNA; ncRNA;
                                                 repeat_region
            Genes (total)                     :: 4,788
            CDSs (total)                      :: 4,729
            Genes (coding)                    :: 4,613
            CDSs (with protein)               :: 4,613
            Genes (RNA)                       :: 59
            rRNAs                             :: 2, 2, 2 (5S, 16S, 23S)
            complete rRNAs                    :: 2, 2, 2 (5S, 16S, 23S)
            tRNAs                             :: 50
            ncRNAs                            :: 3
            Pseudo Genes (total)              :: 116
            CDSs (without protein)            :: 116
            Pseudo Genes (ambiguous residues) :: 0 of 116
            Pseudo Genes (frameshifted)       :: 56 of 116
            Pseudo Genes (incomplete)         :: 58 of 116
            Pseudo Genes (internal stop)      :: 26 of 116
            Pseudo Genes (multiple problems)  :: 22 of 116
            ##Genome-Annotation-Data-END##
FEATURES             Qualifiers
     source          /organism="Sphingomonas sp. AP4-R1"
                     /mol_type="genomic DNA"
                     /strain="AP4-R1"
                     /host="Malus prunifolia (crab apple)"
                     /culture_collection="KACC:21605"
                     /db_xref="taxon:2735134"
                     /country="South Korea: Naju-si"
                     /collection_date="23-Oct-2019"
                     /collected_by="Jun Heo, Soon-Wo Kwon"
                     /identified_by="Jun Heo, Soon-Wo Kwon"
     protein         /locus_tag="HL653_00425"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_012930170.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /transl_table=11
BEGIN
        1 MRTAGRLTSS LIALLGSAAL FAQTPSASPP PASPGKPALT QPAASPDGRT IAFASGGDIW
       61 EVPSTGGIAH LLVTDAATEA RPLYSPDGKS LAFTSTRGGS TNIFLLDLAS GAVTRLTWSE
      121 ASEELDSWSA DGKWLYFASS ANDPGGTPDV FRVSAAGGTP IEVSREDYLS EFQAAPSPDG
      181 SIVALAARGI SFNQWWRNGH SHIDETEIWL KPLSGTGAYR KLLPGGAKQA WPMWKPGGAS
      241 IVYMSDASGA ENLWEVPAAG GTPTQLTRFT SGRLLFPTMA ADGKAILFER DMAVWRYDPA
      301 TGQTAEVPIT LRGAPATEGQ RHLNLATFTR LAVSPDGQKV AVIAHGEVFA APAKDGGTAQ
      361 RITNSVGAER ELTWSPDSRR ILTVGERGLD RRVAEYDVAA DRETMLTGAG IATVPVYAPD
      421 GKSIAYVKDA RELHLLTLAA PGKPATDRIL YTGTLATDEG DGPRPTFSPD GRWIAFPLVD
      481 RRSFVNVNVV ATAGGPARPV SFLANGQMGG IAWSPDGKYL LIDSAQRTED SRLIRIDLLP
      541 HVPRYREDAF RDLFKPKSPG DPAPDKGPST TPQPKPLPAA AKKKGAAAPA KPAVPPVEIV
      601 WEGLRDRATI LPIGLSAELP HVSSDGKTLV FLAREKGQEN LYSYNLDELA TETPVAQQIS
      661 ASDRPKADAG LTADGKTLFY LDGGRIIATP LEKPAPKVVA VTAQMDVDFA TEKQIMFDEA
      721 WSVLDRNFFD PAFNGHDWKA LRAQYQPYVD GARTPDELRR VIGLMIGDLN ASHSGINRPR
      781 RGPGALPQGR VGMLGLRFDR AAYEAGRGLV VSEVVPLSPA AIEGKIVPGE RLVSVDGHAI
      841 GAHDNLDALL ENSVGQRVAI GVSGPNGTRT VNLKPVTLTT IDGLAYRGWV DRRRAYVDRI
      901 SGGKLGYVHM ADMSADSLDQ LYLDLDADNQ AKQGVVIDVR NNNGGFVNGY ALDAISRRNY
      961 LTMEPRGLYP FPARQALGQR ALGLPTILVT NQSSLSDAED FTEGYRALGL GKVVGQPTAG
     1021 WIIYTWSETL IDGSTVRVPR ARIRTLSGQD MEMHPRPVDI AVERPLGETG AGTDAQLDVA
     1081 VKTLLGAEK
//