LOCUS       VTR94236.1              2368 aa    PRT              BCT 03-FEB-2020
DEFINITION  Gemmata massiliana rhs repeat-associated core domain-containing
            protein : RHS repeat-associated core domain protein OS=
            Singulisphaera acidiphila (strain ATCC BAA-1392 / DSM
            18658 / VKM B-2454 / MOB10) GN=Sinac_0717 PE=4 SV=1: RHS_repeat
            protein.
ACCESSION   LR593886-3537
PROTEIN_ID  VTR94236.1
SOURCE      Gemmata massiliana
  ORGANISM  Gemmata massiliana
            Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae;
            Gemmata.
REFERENCE   1
  AUTHORS   
  CONSRTM   Science for Life Laboratories
  JOURNAL   Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND
            MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution,
            Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden
FEATURES             Qualifiers
     source          /organism="Gemmata massiliana"
                     /chromosome="1"
                     /isolate="Soil9"
                     /mol_type="genomic DNA"
                     /isolation_source="soil"
                     /db_xref="taxon:1210884"
     protein         /locus_tag="SOIL9_34780"
                     /note="BLAST_uniprot:hit_2 ;
                     ACCESSION=tr|E8QWU3|E8QWU3_ISOPI ;
                     ALN/Q_length_ratio=0.448 ; DESCRIPTION=YD repeat protein
                     OS=Isosphaera pallida (strain ATCC 43644 / DSM 9630 /
                     IS1B) GN=Isop_2419 PE=4 SV=1 ; EVALUE=0.0 ;
                     Q/S_length_ratio=0.951"
                     /note="BLAST_uniprot:hit_3 ;
                     ACCESSION=tr|L0D5P0|L0D5P0_SINAD ;
                     ALN/Q_length_ratio=0.436 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Singulisphaera
                     acidiphila (strain ATCC BAA-1392 / DSM 18658 / VKM B-2454
                     / MOB10) GN=Sinac_0291 PE=4 SV=1 ; EVALUE=0.0 ;
                     Q/S_length_ratio=1.093"
                     /note="BLAST_uniprot:hit_1 ;
                     ACCESSION=tr|L0D7A8|L0D7A8_SINAD ;
                     ALN/Q_length_ratio=0.641 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Singulisphaera
                     acidiphila (strain ATCC BAA-1392 / DSM 18658 / VKM B-2454
                     / MOB10) GN=Sinac_0717 PE=4 SV=1 ; EVALUE=0.0 ;
                     Q/S_length_ratio=1.400"
                     /note="BLAST_uniprot:hit_4 ;
                     ACCESSION=tr|L0DA66|L0DA66_SINAD ;
                     ALN/Q_length_ratio=0.307 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Singulisphaera
                     acidiphila (strain ATCC BAA-1392 / DSM 18658 / VKM B-2454
                     / MOB10) GN=Sinac_1341 PE=4 SV=1 ; EVALUE=1e-166 ;
                     Q/S_length_ratio=1.061"
                     /note="BLAST_uniprot:hit_5 ;
                     ACCESSION=tr|L0D9R6|L0D9R6_SINAD ;
                     ALN/Q_length_ratio=0.413 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Singulisphaera
                     acidiphila (strain ATCC BAA-1392 / DSM 18658 / VKM B-2454
                     / MOB10) GN=Sinac_1226 PE=4 SV=1 ; EVALUE=1e-123 ;
                     Q/S_length_ratio=1.038"
                     /note="BLAST_uniprot:hit_6 ;
                     ACCESSION=tr|D5STB0|D5STB0_PLAL2 ;
                     ALN/Q_length_ratio=0.418 ; DESCRIPTION=AmoP
                     OS=Planctomyces limnophilus (strain ATCC 43296 / DSM 3776
                     / IFAM 1008 / 290) GN=Plim_1036 PE=4 SV=1 ; EVALUE=1e-118
                     ; Q/S_length_ratio=1.258"
                     /note="BLAST_uniprot:hit_7 ;
                     ACCESSION=tr|D5SST5|D5SST5_PLAL2 ;
                     ALN/Q_length_ratio=0.511 ; DESCRIPTION=YD repeat protein
                     OS=Planctomyces limnophilus (strain ATCC 43296 / DSM 3776
                     / IFAM 1008 / 290) GN=Plim_3067 PE=4 SV=1 ; EVALUE=1e-110
                     ; Q/S_length_ratio=1.182"
                     /note="BLAST_uniprot:hit_8 ;
                     ACCESSION=tr|D2QZZ5|D2QZZ5_PIRSD ;
                     ALN/Q_length_ratio=0.319 ; DESCRIPTION=YD repeat protein
                     OS=Pirellula staleyi (strain ATCC 27377 / DSM 6068 / ICPB
                     4128) GN=Psta_3703 PE=4 SV=1 ; EVALUE=5e-91 ;
                     Q/S_length_ratio=1.159"
                     /note="BLAST_uniprot:hit_9 ;
                     ACCESSION=tr|D5SQM4|D5SQM4_PLAL2 ;
                     ALN/Q_length_ratio=0.219 ; DESCRIPTION=Uncharacterized
                     protein OS=Planctomyces limnophilus (strain ATCC 43296 /
                     DSM 3776 / IFAM 1008 / 290) GN=Plim_2663 PE=4 SV=1 ;
                     EVALUE=4e-81 ; Q/S_length_ratio=3.373"
                     /note="BLAST_uniprot:hit_10 ;
                     ACCESSION=tr|D5SWT5|D5SWT5_PLAL2 ;
                     ALN/Q_length_ratio=0.210 ; DESCRIPTION=Uncharacterized
                     protein OS=Planctomyces limnophilus (strain ATCC 43296 /
                     DSM 3776 / IFAM 1008 / 290) GN=Plim_1602 PE=4 SV=1 ;
                     EVALUE=2e-71 ; Q/S_length_ratio=3.145"
                     /note="BLAST_uniprot:hit_11 ;
                     ACCESSION=tr|D5SWT3|D5SWT3_PLAL2 ;
                     ALN/Q_length_ratio=0.157 ; DESCRIPTION=Uncharacterized
                     protein OS=Planctomyces limnophilus (strain ATCC 43296 /
                     DSM 3776 / IFAM 1008 / 290) GN=Plim_1600 PE=4 SV=1 ;
                     EVALUE=8e-45 ; Q/S_length_ratio=3.901"
                     /note="BLAST_uniprot:hit_12 ;
                     ACCESSION=tr|Q1Q7C5|Q1Q7C5_9BACT ;
                     ALN/Q_length_ratio=0.417 ; DESCRIPTION=Similar to
                     wall-associated protein OS=Candidatus Kuenenia
                     stuttgartiensis GN=WapA PE=4 SV=1 ; EVALUE=2e-41 ;
                     Q/S_length_ratio=1.127"
                     /note="BLAST_uniprot:hit_13 ;
                     ACCESSION=tr|F4KRN7|F4KRN7_HALH1 ;
                     ALN/Q_length_ratio=0.349 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Haliscomenobacter
                     hydrossis (strain ATCC 27775 / DSM 1100 / LMG 10767 / O)
                     GN=Halhy_1128 PE=4 SV=1 ; EVALUE=3e-37 ;
                     Q/S_length_ratio=1.748"
                     /note="BLAST_uniprot:hit_14 ;
                     ACCESSION=tr|D0THP1|D0THP1_9BACE ;
                     ALN/Q_length_ratio=0.372 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Bacteroides sp.
                     2_1_33B GN=HMPREF0103_2864 PE=4 SV=1 ; EVALUE=4e-37 ;
                     Q/S_length_ratio=1.693"
                     /note="BLAST_uniprot:hit_15 ;
                     ACCESSION=tr|A0A090KF71|A0A090KF71_9BACT ;
                     ALN/Q_length_ratio=0.055 ; DESCRIPTION=Uncultured
                     bacterium genome assembly Metasoil_fosmids_resub
                     OS=uncultured bacterium PE=4 SV=1 ; EVALUE=8e-37 ;
                     Q/S_length_ratio=10.120"
                     /note="Pfam_scan:hit_1 (1932..1971);
                     Pfam:PF05593.9:RHS_repeat;
                     Pfam_type:Repeat;HMM_aln_Length:36; HMM_Length:38;
                     EVALUE:1.9e-05; BITSCORE: 24.6"
                     /note="GO_domain:GO:0008150"
BEGIN
        1 MDLNGDHKAE VILGGSSGGW VKTYNPTTGA PIAGPLGCFQ AFGTGYTGSV FVNSDSLAND
       61 VDGDGTPDLV VGTDVGVAAE VKVFSGATGG VLYDFQPFGS GFTGGARVAL AYADDDDRAD
      121 IVVGSGTGAA DVRVFSGATG AQLASPLGQY APFGASTGGV FVAASNDPIA PTVMWTTAPS
      181 SAKVGQVVRG VITITGQSPN VPTGTATLKA TVIPGGTVLT LDTVSLVPVG SGYQATATFD
      241 FGSLPLGNYL LSATYNGDSN YSSNTAGGGS FGVTAPVAGV PAPVYRGGYN PDLSTGVAPG
      301 SGSITVSSCP DLSSIGMGDL FGIDHSWTSA PGYDDGLTGT GGSAGQFSHA VQVNGDTSIA
      361 LALGGSDAQF FDFYGGAYHG RFGDPTTLVH DTTNGLFVAT DGTGRTLTYY DFSASTPSGR
      421 AGQLAKVTAP DGQLTQVTSW DGSGRPTEVQ RTTGSGGSAL TESFVYAYVA SGTNAGLLQT
      481 VTQRTQVGAG AWGTVRSAEY TYHDGTTSAG LAKEMRTAVV KDASGNVIDQ SYYRYYGSSS
      541 GSGSGSGSGS GSGSGSGSGS SGKMKFAFGA DAYARLVSAL GTSVDALTDA QIDDYADKYI
      601 EYSASGQASK VVDAAAGCSV CAGGQGAFNY TYSTNSAANL LDTNVWKNKA VETLPDGSTN
      661 TFYTNGFGQT MLRVFTDTAS NVWRWYTKYD AAGRTILEAG PSVVTGFSES YADLVNFVSG
      721 NAQYLSDSAG LVTAYTYGAT TTATTSTVGD ALGYLKEVDL KQGETGTAVP QQVLAYIKNT
      781 VGSIDFFILA SSTVYRNDNG TGAQATSYAY TYLSGTNQIA STVTTLPTVT TAQNGSNSAT
      841 TVTTVNDTFG HPVWTKDQAG IISYTQYDTL TGAVVKTITD VDTAQTGTFA NLPSGWSTPS
      901 GAGLHLTTTY EVDALGRATK VTYPNGRVDY TVYNDANHEV RTYTGWDATN NVATGPTTVN
      961 RMDRAGSYTE TLTMSAAPSV SGGRPTGTEG IAKIQSLSRT YTNAAGQAIY SDAYFNLTGL
     1021 AYSTSTTLGT EGVNFYRTRY QYDDQGRLNK TTSAQGTISR TVYDSLGRAV SEWVGTDDTP
     1081 TSGFWSPTNL TGTNTVKVRE YEYDGGGVGD GNLTKVTEIP GGGAANRVTQ TWFDWRNRAV
     1141 AVKSGVEGSE STSVNRPLVY TDYDNLGEIT TTRVYDADGV TPTVTGGVPQ PLSSSLLRGQ
     1201 ATTSYDELGR AYRTDTYSVD SSTGSVGTNT LYSQTWYDAR GQVIKTSSPG GIVQKTTFDG
     1261 AGRTVATYTS DGGGDTGYGD ADDVTGDTVL NQTEYVYDGN GSVLQVTTRD RFHDASGTGA
     1321 LGTPTTGVGA RVSYTGYYYD LAGRTVATVD VGTNGGSSWS RPGTVPSRSA TVLVNSTKYA
     1381 TDAVQVIALT GSPTGGTFTL TLGGNTTSAL AYNASAATVQ SALAGLASIG SGNVQVSAAA
     1441 GGGWEIRFIG TKGGAYQSAI TGNGSGLTGG TSPAVSTSTV NAGGDVGLAA EVTDPVGHVS
     1501 RIYADALGRT TRSVTNFVDG VVSDTDDKAT GYTYNGTGVT SLIAYLTGGG VQTTGYVYGV
     1561 TVATGSTIES NDIVRLTQWA DPTTGAASSS QQEAIAVNAL GQTLTSTDRN GSVHTLTYDV
     1621 LGRVVSDAVT TLGSGVDGSV RRIECAYDSQ GNAYLITSYN AASGGSVVNQ TQRAFNGLGQ
     1681 MTTEWQSHSG AVNTSTSPKV QYAYSEMTGG ANHSRLTSIT YPSGYVLTYN YSSGLNDSIS
     1741 RLSSLSDSTG ALESYDYLGW GIVVRRAHSQ PNVDLSYIKH SGESNGDAGD QYTGLDRFGR
     1801 VVDQRWLNPT TGTATDRFQY GYDQDGNRTY RDNLVNTAFG EVYSYDALDQ LTGYDRGTLN
     1861 GTKTGITGTV ARSQDWDYDA LGNFDSVTTN GTAQTRTANK QNEITGISGA TTPTYDANGN
     1921 MTGDETSKQF VYDAWNRLVA VKNSGGSTLK TYAYDGANRR VSETVSGTTT DLFYSKDWQV
     1981 LEEKVGSATK NRYVWSPVYV DAMVLRDRDA DGSTGNGLEE RLWVQQDANW NVTALVNGSG
     2041 AVVERYVYDP YGAATIYDAS YVMRASSLYD AKYFSQGRPL DAASGNYYFR ERDYRPTLGR
     2101 FINLDPVTYA SGDINLYRFV ANSPVNLSDP SGLAPFSDIP SIGGSIGGGV LDVISYPDPA
     2161 KITWDYFKIY ITPPEGQRPG ERARTIGQFV PVLIDPSIRI IKLPCSPGYV AVMKVNKIDL
     2221 KYRFRFDNSW FYDDPLNKIT KEKKEILLKH EQFHYKLSLD FVAQATERWN SHSKLGKKGI
     2281 VGIGFGFTPG QATEAAQKRV LAALQVHINE LSKSLNSLQL AYDRVSQIPL PGGGGDITDD
     2341 SQSLGERAAK KAMFDSITRA IERMLGLR
//