LOCUS       VTR91845.1               538 aa    PRT              BCT 03-FEB-2020
DEFINITION  Gemmata massiliana Trypsin-like serine protease with C-
            terminal PDZ domain OS=Singulisphaera acidiphila (strain
            ATCC BAA-1392 / DSM 18658 / VKM B-2454 / MOB10) GN=Sinac_4277
            PE=4 SV=1 protein.
ACCESSION   LR593886-1146
PROTEIN_ID  VTR91845.1
SOURCE      Gemmata massiliana
  ORGANISM  Gemmata massiliana
            Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae;
            Gemmata.
REFERENCE   1
  AUTHORS   
  CONSRTM   Science for Life Laboratories
  JOURNAL   Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND
            MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution,
            Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden
FEATURES             Qualifiers
     source          /organism="Gemmata massiliana"
                     /chromosome="1"
                     /isolate="Soil9"
                     /mol_type="genomic DNA"
                     /isolation_source="soil"
                     /db_xref="taxon:1210884"
     protein         /locus_tag="SOIL9_58690"
                     /note="BLAST_uniprot:hit_1 ;
                     ACCESSION=tr|L0DIK5|L0DIK5_SINAD ;
                     ALN/Q_length_ratio=0.496 ; DESCRIPTION=Trypsin-like serine
                     protease with C-terminal PDZ domain OS=Singulisphaera
                     acidiphila (strain ATCC BAA-1392 / DSM 18658 / VKM B-2454
                     / MOB10) GN=Sinac_4277 PE=4 SV=1 ; EVALUE=3e-10 ;
                     Q/S_length_ratio=0.976"
BEGIN
        1 MRFALSIAAV LILAPIVSAQ EPKGSPFPRR VLFVQIGGYL YLNPLTHAAP GGPDRVRAVA
       61 ERFAAGFRTP TAKGNEQLFV LSDTLVTDAR LPTKDALAKT IAGFCSTTRP HDRVVIYLGV
      121 HAVEKDGRAF VVPVDGDPDA PETLLPVADV YAKLKDLHAA QKIVVWDVCR HNPERVRGRR
      181 DPGPMTPVLF KALTTPPEGV QALVACSPGE HSLEYSAPRG PAGIFAGSAY LDALRHAAAD
      241 TAAKATPGDA IPIEELHKSA CQSVAALGKQ TPVLVGTAPK QPAAYDPKVA PAKRFELPAA
      301 PKGTADTKAI LDELALPPLF EGDAGAIELL PFSEALLKGY ASDVSADDAL KNGDKYPLRV
      361 ATLRALQAVR DTWPLTAKEP KGVTPLTAPI VDRTKRAISD AQLPLAQAIT RLESELEGLL
      421 AVAKHRAKET KRWQAHYDYT LAELRLRLVV LNEYNVLLAR VRTETLPDLP AGATGWRLCP
      481 AEKLTSRREV RAMFDAAQEG FNKLAADPIT RTRRGACSRS GRVRSCRGYA GSRSFRRK
//