LOCUS       VTR96499.1               553 aa    PRT              BCT 03-FEB-2020
DEFINITION  Gemmata massiliana Uncharacterized protein OS=Nitrospina
            gracilis (strain 3/211) GN=NITGR_780007 PE=4 SV=1 protein.
ACCESSION   LR593886-5800
PROTEIN_ID  VTR96499.1
SOURCE      Gemmata massiliana
  ORGANISM  Gemmata massiliana
            Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae;
            Gemmata.
REFERENCE   1
  AUTHORS   
  CONSRTM   Science for Life Laboratories
  JOURNAL   Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND
            MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution,
            Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden
FEATURES             Qualifiers
     source          /organism="Gemmata massiliana"
                     /chromosome="1"
                     /isolate="Soil9"
                     /mol_type="genomic DNA"
                     /isolation_source="soil"
                     /db_xref="taxon:1210884"
     protein         /locus_tag="SOIL9_12150"
                     /note="BLAST_uniprot:hit_1 ;
                     ACCESSION=tr|M1Z2K7|M1Z2K7_NITG3 ;
                     ALN/Q_length_ratio=0.266 ; DESCRIPTION=Uncharacterized
                     protein OS=Nitrospina gracilis (strain 3/211)
                     GN=NITGR_780007 PE=4 SV=1 ; EVALUE=2e-07 ;
                     Q/S_length_ratio=2.221"
                     /note="BLAST_uniprot:hit_2 ;
                     ACCESSION=tr|L0DGZ0|L0DGZ0_SINAD ;
                     ALN/Q_length_ratio=0.177 ; DESCRIPTION=Repeat-companion
                     domain TIGR02996 OS=Singulisphaera acidiphila (strain ATCC
                     BAA-1392 / DSM 18658 / VKM B-2454 / MOB10) GN=Sinac_4455
                     PE=4 SV=1 ; EVALUE=1e-06 ; Q/S_length_ratio=1.057"
BEGIN
        1 MSDETAFLNT IREYPDEDTP RLAFADWLDE QGDPAKAGRV TFIRAQVELA RLPVDDPRCA
       61 DFEVTERRLL AKYATEWSAP WPAFRNREDA DDGPNQAIFR RGFLEAVNGS GVVGNANTNG
      121 LAELCAAHPI RDGGVLPTNN LASVVSWPEW GRIESLALWS RPTSRDVAAH YREQLPQIDS
      181 FLRHADFARL RKLSVTLSGI SDRDVLHWFR MPIVQRLVAL NVVMYAGMAW DVQLNGDSVL
      241 ELVRGDFPNL RELGLAGGVR PDYSRAVTQF VDSDVWKQIT HFTLFGGSDF PWFRALATAR
      301 LQQLTLHTGS SSEPARVFAN AIQAASGPVT LEELRINGPA VHGENLSRVL AAHVTSNLQR
      361 LHLVRARLTD DGLRRIAESP VLANLNSLSL WLDHTTGAGL DALFASPNLG QLTDLRIHGG
      421 RVPPDALRAL ARNSSCRQLR TLALGSLFVP SALTALTDGD EFPDLHTIAF ECVRPAPDPT
      481 TLEAFVNSPK FPRLCVVRFD TDDDCVDALI SVFRNCKRLA WAVGVMIDGG DGARVAFAPE
      541 GVYLPNHLDG LDE
//