LOCUS       VTR92393.1               414 aa    PRT              BCT 03-FEB-2020
DEFINITION  Gemmata massiliana Uncharacterized protein OS=Sorangium
            cellulosum (strain So ce56) GN=sce5405 PE=4 SV=1 protein.
ACCESSION   LR593886-1694
PROTEIN_ID  VTR92393.1
SOURCE      Gemmata massiliana
  ORGANISM  Gemmata massiliana
            Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae;
            Gemmata.
REFERENCE   1
  AUTHORS   
  CONSRTM   Science for Life Laboratories
  JOURNAL   Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND
            MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution,
            Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden
FEATURES             Qualifiers
     source          /organism="Gemmata massiliana"
                     /chromosome="1"
                     /isolate="Soil9"
                     /mol_type="genomic DNA"
                     /isolation_source="soil"
                     /db_xref="taxon:1210884"
     protein         /locus_tag="SOIL9_53210"
                     /note="BLAST_uniprot:hit_1 ;
                     ACCESSION=tr|A9FY04|A9FY04_SORC5 ;
                     ALN/Q_length_ratio=0.227 ; DESCRIPTION=Uncharacterized
                     protein OS=Sorangium cellulosum (strain So ce56)
                     GN=sce5405 PE=4 SV=1 ; EVALUE=4e-13 ;
                     Q/S_length_ratio=1.443"
                     /note="BLAST_uniprot:hit_2 ;
                     ACCESSION=tr|E8QYU5|E8QYU5_ISOPI ;
                     ALN/Q_length_ratio=0.213 ; DESCRIPTION=Uncharacterized
                     protein OS=Isosphaera pallida (strain ATCC 43644 / DSM
                     9630 / IS1B) GN=Isop_1497 PE=4 SV=1 ; EVALUE=8e-12 ;
                     Q/S_length_ratio=1.243"
BEGIN
        1 MPKPNLGTRL AQELIACRTE GGDHYPIRLD HLAARLDPAL EPAAVLKAVD STAFKKQAVV
       61 TADKRIDARV ALREDASLFA ADPLTLEMAF RTKGETGTPP WSPSELAKTV PTSWRPAFSE
      121 ILARQIASDE LPAFAVQVKA GKGVKLHHKE QPPPPPPEVQ DAERLVDMLR RRQPGVPLAE
      181 LETAAELKPA AFKKAVKRPE FTAAVVQVKM TSKDVFVVPN GDAFGRFVTG TLLTHLLGKC
      241 KRPNAHAFPV NELVAHVSKA DQSQITGLLN RPDLAAELPA GVGCVLLGGG KSGSQNAFFL
      301 LEHLRTAQPV ARSVAALNQA PPPPPADFVA TFDAAFARID RERGSNNFVS LVDLRAALPA
      361 VPRETFDTCL RQLRRDRRYV LSSDERYDGI TPEQQAAAIR EEGEFLLHVS RGRP
//