LOCUS       VTR98885.1              2394 aa    PRT              BCT 03-FEB-2020
DEFINITION  Gemmata massiliana rhs repeat-associated core domain-containing
            protein : YD repeat protein OS=Isosphaera pallida (strain
            ATCC 43644 / DSM 9630 / IS1B) GN=Isop_2419 PE=4 SV=1:
            RHS_repeat: PT-HINT protein.
ACCESSION   LR593886-6890
PROTEIN_ID  VTR98885.1
SOURCE      Gemmata massiliana
  ORGANISM  Gemmata massiliana
            Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae;
            Gemmata.
REFERENCE   1
  AUTHORS   
  CONSRTM   Science for Life Laboratories
  JOURNAL   Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND
            MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution,
            Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden
FEATURES             Qualifiers
     source          /organism="Gemmata massiliana"
                     /chromosome="1"
                     /isolate="Soil9"
                     /mol_type="genomic DNA"
                     /isolation_source="soil"
                     /db_xref="taxon:1210884"
     protein         /locus_tag="SOIL9_01250"
                     /note="BLAST_uniprot:hit_4 ;
                     ACCESSION=tr|L0DA66|L0DA66_SINAD ;
                     ALN/Q_length_ratio=0.279 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Singulisphaera
                     acidiphila (strain ATCC BAA-1392 / DSM 18658 / VKM B-2454
                     / MOB10) GN=Sinac_1341 PE=4 SV=1 ; EVALUE=0.0 ;
                     Q/S_length_ratio=1.073"
                     /note="BLAST_uniprot:hit_2 ;
                     ACCESSION=tr|L0D5P0|L0D5P0_SINAD ;
                     ALN/Q_length_ratio=0.449 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Singulisphaera
                     acidiphila (strain ATCC BAA-1392 / DSM 18658 / VKM B-2454
                     / MOB10) GN=Sinac_0291 PE=4 SV=1 ; EVALUE=0.0 ;
                     Q/S_length_ratio=1.105"
                     /note="BLAST_uniprot:hit_3 ;
                     ACCESSION=tr|L0D7A8|L0D7A8_SINAD ;
                     ALN/Q_length_ratio=0.356 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Singulisphaera
                     acidiphila (strain ATCC BAA-1392 / DSM 18658 / VKM B-2454
                     / MOB10) GN=Sinac_0717 PE=4 SV=1 ; EVALUE=0.0 ;
                     Q/S_length_ratio=1.415"
                     /note="BLAST_uniprot:hit_1 ;
                     ACCESSION=tr|E8QWU3|E8QWU3_ISOPI ;
                     ALN/Q_length_ratio=0.454 ; DESCRIPTION=YD repeat protein
                     OS=Isosphaera pallida (strain ATCC 43644 / DSM 9630 /
                     IS1B) GN=Isop_2419 PE=4 SV=1 ; EVALUE=0.0 ;
                     Q/S_length_ratio=0.961"
                     /note="BLAST_uniprot:hit_5 ;
                     ACCESSION=tr|L0D9R6|L0D9R6_SINAD ;
                     ALN/Q_length_ratio=0.429 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Singulisphaera
                     acidiphila (strain ATCC BAA-1392 / DSM 18658 / VKM B-2454
                     / MOB10) GN=Sinac_1226 PE=4 SV=1 ; EVALUE=1e-142 ;
                     Q/S_length_ratio=1.050"
                     /note="BLAST_uniprot:hit_6 ;
                     ACCESSION=tr|D5STB0|D5STB0_PLAL2 ;
                     ALN/Q_length_ratio=0.422 ; DESCRIPTION=AmoP
                     OS=Planctomyces limnophilus (strain ATCC 43296 / DSM 3776
                     / IFAM 1008 / 290) GN=Plim_1036 PE=4 SV=1 ; EVALUE=1e-126
                     ; Q/S_length_ratio=1.272"
                     /note="BLAST_uniprot:hit_7 ;
                     ACCESSION=tr|D5SST5|D5SST5_PLAL2 ;
                     ALN/Q_length_ratio=0.454 ; DESCRIPTION=YD repeat protein
                     OS=Planctomyces limnophilus (strain ATCC 43296 / DSM 3776
                     / IFAM 1008 / 290) GN=Plim_3067 PE=4 SV=1 ; EVALUE=1e-108
                     ; Q/S_length_ratio=1.195"
                     /note="BLAST_uniprot:hit_8 ;
                     ACCESSION=tr|D2QZZ5|D2QZZ5_PIRSD ;
                     ALN/Q_length_ratio=0.465 ; DESCRIPTION=YD repeat protein
                     OS=Pirellula staleyi (strain ATCC 27377 / DSM 6068 / ICPB
                     4128) GN=Psta_3703 PE=4 SV=1 ; EVALUE=1e-101 ;
                     Q/S_length_ratio=1.172"
                     /note="BLAST_uniprot:hit_9 ;
                     ACCESSION=tr|D5SQM4|D5SQM4_PLAL2 ;
                     ALN/Q_length_ratio=0.212 ; DESCRIPTION=Uncharacterized
                     protein OS=Planctomyces limnophilus (strain ATCC 43296 /
                     DSM 3776 / IFAM 1008 / 290) GN=Plim_2663 PE=4 SV=1 ;
                     EVALUE=2e-72 ; Q/S_length_ratio=3.410"
                     /note="BLAST_uniprot:hit_10 ;
                     ACCESSION=tr|D5SWT5|D5SWT5_PLAL2 ;
                     ALN/Q_length_ratio=0.206 ; DESCRIPTION=Uncharacterized
                     protein OS=Planctomyces limnophilus (strain ATCC 43296 /
                     DSM 3776 / IFAM 1008 / 290) GN=Plim_1602 PE=4 SV=1 ;
                     EVALUE=2e-67 ; Q/S_length_ratio=3.179"
                     /note="BLAST_uniprot:hit_11 ;
                     ACCESSION=tr|D5SWT3|D5SWT3_PLAL2 ;
                     ALN/Q_length_ratio=0.149 ; DESCRIPTION=Uncharacterized
                     protein OS=Planctomyces limnophilus (strain ATCC 43296 /
                     DSM 3776 / IFAM 1008 / 290) GN=Plim_1600 PE=4 SV=1 ;
                     EVALUE=9e-39 ; Q/S_length_ratio=3.944"
                     /note="BLAST_uniprot:hit_12 ;
                     ACCESSION=tr|Q1Q7C5|Q1Q7C5_9BACT ;
                     ALN/Q_length_ratio=0.231 ; DESCRIPTION=Similar to
                     wall-associated protein OS=Candidatus Kuenenia
                     stuttgartiensis GN=WapA PE=4 SV=1 ; EVALUE=1e-38 ;
                     Q/S_length_ratio=1.139"
                     /note="BLAST_uniprot:hit_13 ;
                     ACCESSION=tr|B8FIJ1|B8FIJ1_DESAA ;
                     ALN/Q_length_ratio=0.219 ; DESCRIPTION=YD repeat protein
                     OS=Desulfatibacillum alkenivorans (strain AK-01)
                     GN=Dalk_2288 PE=4 SV=1 ; EVALUE=9e-38 ;
                     Q/S_length_ratio=1.469"
                     /note="BLAST_uniprot:hit_14 ;
                     ACCESSION=tr|D0THP1|D0THP1_9BACE ;
                     ALN/Q_length_ratio=0.226 ; DESCRIPTION=RHS
                     repeat-associated core domain protein OS=Bacteroides sp.
                     2_1_33B GN=HMPREF0103_2864 PE=4 SV=1 ; EVALUE=5e-37 ;
                     Q/S_length_ratio=1.711"
                     /note="BLAST_uniprot:hit_15 ;
                     ACCESSION=tr|A3ZZ08|A3ZZ08_9PLAN ;
                     ALN/Q_length_ratio=0.226 ; DESCRIPTION=Uncharacterized
                     protein (Fragment) OS=Blastopirellula marina DSM 3645
                     GN=DSM3645_15255 PE=4 SV=1 ; EVALUE=3e-34 ;
                     Q/S_length_ratio=1.312"
                     /note="Pfam_scan:hit_1 (1812..1851);
                     Pfam:PF05593.9:RHS_repeat;
                     Pfam_type:Repeat;HMM_aln_Length:35; HMM_Length:38;
                     EVALUE:5.6e-05; BITSCORE: 23.1"
                     /note="Pfam_scan:hit_2 (2221..2289);
                     Pfam:PF07591.6:PT-HINT;
                     Pfam_type:Family;HMM_aln_Length:65; HMM_Length:130;
                     EVALUE:5.1e-09; BITSCORE: 36.0"
                     /note="GO_domain:GO:0051604"
BEGIN
        1 MSHIDDAGGT RSLNLTQTVT YDAPGFEGLF LWKYVVENAS TTLHPSETIN GEGYVNVEYF
       61 EDVELPVNFG TSTDWYKGYS DGIAYWTHDT HPFTKTYIAP GSTESFWFTT SPNWLADSSL
      121 ELFQEDIKED ASYLYEANVK VPGGALPAFV PKSLATLGPL CVQSQVNPTA PPPLPNPQSS
      181 TGNPIRYVDG VNLVVAPGLS STGFGGGWGT TQSWSNDPSY SAGTNAGNGW VAGDQPRLYR
      241 TGSSLYLVTD AITAHFFDGQ GTPDGDGNYA TYAPRFFYNT TVTYDGANDQ FVITADDGTV
      301 YRYLDFGSAR PVVSRGAFQS RTDPGGLITQ VTSRDTDGRP LEVQAAQTVG GVTTTESYLY
      361 AYLGSGDTNA GKLASVTLRR KVGAGAWATV QQVAYAYYVS GDANGNWGDL KRLTVSDAAG
      421 SVLDQRYYRY YTGDTFNGAT QIGYRGGLKY ELGPDAYARL KAAQGGTDAA VETTADATVA
      481 TYADKYFEYD ALHRASKETV SGAGCTSCSA GQGAYTYSYT TSSNTIGHNS WATKTVETRP
      541 DGSTNTVYTN AFGGVMLTAF ADVTTGLVSI TYYQYDSKGR VVLVANPSAV TGYSNAYPDL
      601 VRFVSGNAQY LSDSSGLVTN YTYGASTTAT TLVPGDAVWY LKTIAIRQGE TSTAVPKESL
      661 TYIMNTVGGL NFFHLASDTV YRNDNGTGGQ TTNYAYTFLA GTNQPATVTA TLPTVTTAQN
      721 GSNSATAATV VSDAFGRPVW IRDEAGFITY TAYDTSSGAV VKIITDVDTA QTGTFTNLPS
      781 GWVTPPGGGL HLVTSYEVDS LGRATKTTYP NGRIDYTVYN DTAHEVRYYA GWDATTNRPT
      841 GPTAVVRVDR ANGYSETLTM SAPPTVSGGR PTGTESVSQV QSLSRSYTNE AGQLTHTDAY
      901 FNPSGLAYST SSALGAEGVN FYRTRYEYDN TGQLKRVQTP QGTITRYVRN GFGEVVSEWV
      961 GTDDTPTTGY WSPTNTTGTN LVKVREYQYD NGAVGDGNLT KVSEYPGGGA AARVTQTWYD
     1021 WRNRAVAVKS GVETTESTSV NRQLVFYTYD NLDRVTMAQV YDADGVAPTV TGGVPQPLSA
     1081 SLLRAQGATE FDELGRAFRT RVFSVNPATG AVSTNSLATD TWYDARGLTI KTSAPNGLVQ
     1141 KWAYDGAGRV TTAYTGDWGG DAGYADADDV VGDTVLTQVE YVYDPSGNVR QVTTRDRFHD
     1201 ASGTGALGTP TTGIAARVSY MGYYYDLADR TIAAVDVGTN GGSSWSRPGA VPSRSATVLV
     1261 TSTKYATDAV QVIKLTGSPT GGTFTLTFGV NTTGAIAYNA SAATVQTALA GLASIGAGNV
     1321 QVSAAAGGGW EIRFIGTKAG AYQSAIAANG AGLTGGTAPA ASVSTINAGG DVGLAAEVTD
     1381 AAGRVTRTYA DALGRTTRTV ANFVDGVVSD VDDKATGYMY NGAGITSVIA YLSGGGVQTT
     1441 GYVYGVSSAT GSAVESNEIV RLTQWADPTS GAASATEQES VTVNALGQTV TTTDRNGNVH
     1501 VLTYDVLGRV VSDSVTASGT NVGMIETGYD TLGNASLVTS RDATNAIVNQ VAREYNGLGQ
     1561 LTAEWQSHSG AVTGSTPKVQ YAYNFNGGGT TNQSRLTSIT YPSGYVLTFN YSSGINSAVS
     1621 RVSSLSDPNG AVESYDYLGL DTVVRRAHSG PSLDLSYIKR AGESNGDAGD QYTGLDRFGR
     1681 IVDQRWLNPT TGTATDRFQY GYDQAGNRTY RDNLVSATLG EVYTYDALDQ LTAYSRGTLN
     1741 GTKTGVTGTA SRTQNWDYDA LGNFDSVTTN GTAQARTANK QNEITSISGV TTPTYDANGN
     1801 MTKDETGKLY VYDAWNRLVT VKNSGGTVLK TYTYDGLNRR ITETASGTTT DLFYSRDWQV
     1861 LEEKVGSTTK TRYVWSPVYV NAMVLRDRDA DGSTGNGLEE RLWVQQDANF NVTALANSSG
     1921 AVVERYLYDP YGNVTVTNAS GTTLGSSAYA WAHTFQGMRL DTTSGFLEAN QRWYSPILGR
     1981 WVTLDPIRYA AGDMNLYRFV GNNSTNVTDP SGLDPLISVA PTGPDSPGGK FAHGVIDTIA
     2041 EPFRIGGDLI RVGQWTVNTQ LLGREMYEPD WHSNLAKKAP QANASPEEWD EYAKKSFKKH
     2101 AKNSAIAVIT FGAGKAAGPI IRKLRKPACV NCFPADTVVG TEHGLKPIQD VRAADRVWAF
     2161 DLVVGEWKLR QVIETYRHEH DGDMVTATVA GEMIESTGHH PWWVARGEGL RGRPQPEHVP
     2221 DNPDGYDRGG RWVDAIDLRV GDVLLLRSGE EAAITELVAR HAKLPVYNFH VEELHCYAVG
     2281 RAQILVHNNS VDVKSLNIAG STDAVFHPEI VQGMRLQIRA NSKKFWADAL AKDGPIEIWE
     2341 IGGKRYLFNG NHRYRAALAE DVAIPEANLK IIDKTGSKIP TFGLNEMVPA PGLK
//