LOCUS       VTR96973.1              2513 aa    PRT              BCT 03-FEB-2020
DEFINITION  Gemmata massiliana Serine-aspartate repeat-containing
            protein F OS=Candidatus Accumulibacter sp. BA-93 GN=sdrF
            PE=4 SV=1: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B:
            Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B:
            Cna_B protein.
ACCESSION   LR593886-6062
PROTEIN_ID  VTR96973.1
SOURCE      Gemmata massiliana
  ORGANISM  Gemmata massiliana
            Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae;
            Gemmata.
REFERENCE   1
  AUTHORS   
  CONSRTM   Science for Life Laboratories
  JOURNAL   Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND
            MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution,
            Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden
FEATURES             Qualifiers
     source          /organism="Gemmata massiliana"
                     /chromosome="1"
                     /isolate="Soil9"
                     /mol_type="genomic DNA"
                     /isolation_source="soil"
                     /db_xref="taxon:1210884"
     protein         /locus_tag="SOIL9_09530"
                     /note="BLAST_uniprot:hit_1 ;
                     ACCESSION=tr|A0A011PQN1|A0A011PQN1_9PROT ;
                     ALN/Q_length_ratio=0.199 ; DESCRIPTION=Serine-aspartate
                     repeat-containing protein F OS=Candidatus Accumulibacter
                     sp. BA-93 GN=sdrF PE=4 SV=1 ; EVALUE=1e-133 ;
                     Q/S_length_ratio=1.160"
                     /note="BLAST_uniprot:hit_2 ;
                     ACCESSION=tr|A0A084Y1E0|A0A084Y1E0_9PROT ;
                     ALN/Q_length_ratio=0.189 ; DESCRIPTION=Serine-aspartate
                     repeat-containing protein F OS=Candidatus Accumulibacter
                     sp. SK-01 GN=sdrF PE=4 SV=1 ; EVALUE=1e-123 ;
                     Q/S_length_ratio=1.762"
                     /note="BLAST_uniprot:hit_3 ;
                     ACCESSION=tr|A0A080MK61|A0A080MK61_9PROT ;
                     ALN/Q_length_ratio=0.149 ; DESCRIPTION=Serine-aspartate
                     repeat-containing protein D OS=Candidatus Accumulibacter
                     sp. SK-02 GN=sdrD PE=4 SV=1 ; EVALUE=1e-112 ;
                     Q/S_length_ratio=3.351"
                     /note="BLAST_uniprot:hit_4 ;
                     ACCESSION=tr|N6ZZR9|N6ZZR9_9RHOO ;
                     ALN/Q_length_ratio=0.173 ; DESCRIPTION=Collagen-binding
                     protein OS=Thauera phenylacetica B4P GN=C667_07861 PE=4
                     SV=1 ; EVALUE=2e-93 ; Q/S_length_ratio=1.088"
                     /note="BLAST_uniprot:hit_5 ;
                     ACCESSION=tr|I3YB57|I3YB57_THIV6 ;
                     ALN/Q_length_ratio=0.444 ; DESCRIPTION=Putative
                     collagen-binding protein OS=Thiocystis violascens (strain
                     ATCC 17096 / DSM 198 / 6111) GN=Thivi_2278 PE=4 SV=1 ;
                     EVALUE=1e-85 ; Q/S_length_ratio=1.386"
                     /note="BLAST_uniprot:hit_6 ;
                     ACCESSION=tr|A3IZB2|A3IZB2_9CHRO ;
                     ALN/Q_length_ratio=0.323 ; DESCRIPTION=Uncharacterized
                     protein OS=Cyanothece sp. CCY0110 GN=CY0110_30026 PE=4
                     SV=1 ; EVALUE=1e-85 ; Q/S_length_ratio=1.733"
                     /note="BLAST_uniprot:hit_7 ;
                     ACCESSION=tr|C6WJY6|C6WJY6_ACTMD ;
                     ALN/Q_length_ratio=0.589 ; DESCRIPTION=Conserved repeat
                     domain protein OS=Actinosynnema mirum (strain ATCC 29888 /
                     DSM 43827 / NBRC 14064 / IMRU 3971) GN=Amir_2421 PE=4 SV=1
                     ; EVALUE=3e-85 ; Q/S_length_ratio=0.745"
                     /note="BLAST_uniprot:hit_8 ;
                     ACCESSION=tr|Q8YWB9|Q8YWB9_NOSS1 ;
                     ALN/Q_length_ratio=0.430 ; DESCRIPTION=All1696 protein
                     OS=Nostoc sp. (strain PCC 7120 / UTEX 2576) GN=all1696
                     PE=4 SV=1 ; EVALUE=1e-81 ; Q/S_length_ratio=1.257"
                     /note="BLAST_uniprot:hit_9 ;
                     ACCESSION=tr|M5SPI7|M5SPI7_9PLAN ;
                     ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain
                     protein OS=Rhodopirellula europaea SH398 GN=RESH_01285
                     PE=4 SV=1 ; EVALUE=3e-77 ; Q/S_length_ratio=1.455"
                     /note="BLAST_uniprot:hit_10 ;
                     ACCESSION=tr|L7CFZ1|L7CFZ1_RHOBT ;
                     ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain
                     protein OS=Rhodopirellula baltica SWK14 GN=RBSWK_03634
                     PE=4 SV=1 ; EVALUE=6e-77 ; Q/S_length_ratio=1.438"
                     /note="BLAST_uniprot:hit_11 ;
                     ACCESSION=tr|K5D2K5|K5D2K5_RHOBT ;
                     ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain
                     protein OS=Rhodopirellula baltica SH28 GN=RBSH_03818 PE=4
                     SV=1 ; EVALUE=6e-77 ; Q/S_length_ratio=1.455"
                     /note="BLAST_uniprot:hit_12 ;
                     ACCESSION=tr|Q7ULR8|Q7ULR8_RHOBA ;
                     ALN/Q_length_ratio=0.417 ; DESCRIPTION=Probable
                     fibrinogen-binding protein homolog-putative involved in
                     cell-cell interaction OS=Rhodopirellula baltica (strain
                     SH1) GN=RB9330 PE=4 SV=1 ; EVALUE=3e-76 ;
                     Q/S_length_ratio=1.431"
                     /note="BLAST_uniprot:hit_13 ;
                     ACCESSION=tr|M5UPV6|M5UPV6_9PLAN ;
                     ALN/Q_length_ratio=0.392 ; DESCRIPTION=Collagen-binding
                     surface protein Cna-like, B region domain protein
                     OS=Rhodopirellula sallentina SM41 GN=RSSM_00552 PE=4 SV=1
                     ; EVALUE=3e-76 ; Q/S_length_ratio=1.335"
                     /note="BLAST_uniprot:hit_14 ;
                     ACCESSION=tr|F2AZ90|F2AZ90_RHOBT ;
                     ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain
                     protein OS=Rhodopirellula baltica WH47 GN=RBWH47_05824
                     PE=4 SV=1 ; EVALUE=4e-76 ; Q/S_length_ratio=1.455"
                     /note="BLAST_uniprot:hit_15 ;
                     ACCESSION=tr|E8R1G1|E8R1G1_ISOPI ;
                     ALN/Q_length_ratio=0.563 ; DESCRIPTION=Cna B domain
                     protein OS=Isosphaera pallida (strain ATCC 43644 / DSM
                     9630 / IS1B) GN=Isop_1796 PE=4 SV=1 ; EVALUE=2e-74 ;
                     Q/S_length_ratio=1.653"
                     /note="Pfam_scan:hit_1 (243..309); Pfam:PF05738.8:Cna_B;
                     Pfam_type:Family;HMM_aln_Length:56; HMM_Length:70;
                     EVALUE:7.3e-09; BITSCORE: 35.2"
                     /note="Pfam_scan:hit_2 (340..405); Pfam:PF05738.8:Cna_B;
                     Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70;
                     EVALUE:2.7e-08; BITSCORE: 33.4"
                     /note="Pfam_scan:hit_3 (437..502); Pfam:PF05738.8:Cna_B;
                     Pfam_type:Family;HMM_aln_Length:48; HMM_Length:70;
                     EVALUE:7.8e-09; BITSCORE: 35.1"
                     /note="Pfam_scan:hit_4 (543..607); Pfam:PF05738.8:Cna_B;
                     Pfam_type:Family;HMM_aln_Length:57; HMM_Length:70;
                     EVALUE:4.2e-09; BITSCORE: 36.0"
                     /note="Pfam_scan:hit_5 (639..705); Pfam:PF05738.8:Cna_B;
                     Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70;
                     EVALUE:4.7e-07; BITSCORE: 29.4"
                     /note="Pfam_scan:hit_6 (744..798); Pfam:PF05738.8:Cna_B;
                     Pfam_type:Family;HMM_aln_Length:51; HMM_Length:70;
                     EVALUE:2.5e-06; BITSCORE: 27.1"
                     /note="Pfam_scan:hit_7 (850..917); Pfam:PF05738.8:Cna_B;
                     Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70;
                     EVALUE:6.9e-08; BITSCORE: 32.1"
                     /note="Pfam_scan:hit_8 (955..1020); Pfam:PF05738.8:Cna_B;
                     Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70;
                     EVALUE:2.7e-08; BITSCORE: 33.4"
                     /note="Pfam_scan:hit_9 (1052..1117); Pfam:PF05738.8:Cna_B;
                     Pfam_type:Family;HMM_aln_Length:48; HMM_Length:70;
                     EVALUE:1.9e-08; BITSCORE: 33.9"
                     /note="Pfam_scan:hit_10 (1158..1222);
                     Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:57;
                     HMM_Length:70; EVALUE:4.2e-09; BITSCORE: 36.0"
                     /note="Pfam_scan:hit_11 (1254..1318);
                     Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:53;
                     HMM_Length:70; EVALUE:7.6e-11; BITSCORE: 41.6"
                     /note="Pfam_scan:hit_12 (1360..1427);
                     Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:49;
                     HMM_Length:70; EVALUE:4.2e-10; BITSCORE: 39.2"
                     /note="Pfam_scan:hit_13 (1459..1526);
                     Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:55;
                     HMM_Length:70; EVALUE:6e-09; BITSCORE: 35.5"
                     /note="Pfam_scan:hit_14 (1565..1628);
                     Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:52;
                     HMM_Length:70; EVALUE:8.5e-08; BITSCORE: 31.8"
                     /note="Pfam_scan:hit_15 (1992..2071);
                     Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:32;
                     HMM_Length:70; EVALUE:1.3e-06; BITSCORE: 28.0"
                     /note="Pfam_scan:hit_16 (2258..2329);
                     Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:64;
                     HMM_Length:70; EVALUE:3.4e-09; BITSCORE: 36.3"
BEGIN
        1 MTPTWKTFLS RLHSTISGTG RRPIRTRRPR ALAIEQLEDR LVPAFALQFS TNGGATFSAP
       61 VTDQGVGDTD ALVGTIGVNI GAVTIAASSL GSTGTASTTL NLSVTGVAAA SAHDIIVRAS
      121 LSDLTTTPAP QTLVYSFTGS TPSGGTVTSQ TWVDDNNALF GMTGDTTGAK TIPASGSLVV
      181 SDTVPYSATT QIHLVFKNTF PINLSLNNLN TITASPEQKA EIHGTKFEDV NGNGVRESSE
      241 AGLQGWTIQL LDTNDNVLAT TLTAVDGSYS FTNLTPGIYR VREVNQAGWT QITANPGDIG
      301 TVSGSNITGV DFGNFKNITI AGTKYTDITG NSFSSDDTPL AGITVNLFKN GALVATTTTA
      361 TDGTYSFANQ GPGNYFVQEL VPTGYQQTGG NAGYTIVATS GLVSNNNNFD NFQLAKITGK
      421 KVNDLTGDGL SSDDTGLGGV TVNLYKDNAS GVLVASTTTA ADGTYSFDNL APGTYFVQEL
      481 VPAGSVQTAG NAGYTVTVGG TGVQSGGTAT GNDFANFKQV TITGTKFTDI TGNSFSSDDT
      541 PRAGVTINLY QNGNFVTSTV TGADGTYKFE NLGPGTYFVQ ELVPAGATQT GGNAGYTIAA
      601 TSGLVSNNNN FDNFYHGQIT GKKVTDLTGN GLTSDDTGLG GVTVNLYKAT STLTLIASTV
      661 TAADGTYSFG DLDLGTYFVQ ELVPSGYVQT GGNTGYTITV GPGGVVSGGT SSGNDFANFQ
      721 KGSITGTKYT DITGNGLSGD DTELGGVTIN LYSGNSTAGT LVASTVTAAN GTYSFGDLAP
      781 GTYFVQELVP AGATQTAGSA GYVVVIGQGG VGSGGTSSGN NFANFYRGQI TGTKYTDVTG
      841 NGITGDDTGL GGVTINLYKD NASGALIATT TTASDGTYSF GNLDLGTYFV QEIVPAGSTQ
      901 TAGIAGYTIT VGSGGVASGG TATGNNFANF KNITIAGTKY TDITGNSFSS DDTPLAGITV
      961 NLFKNGALVA TTTTATDGTY SFANQGPGNY FVQELVPTGY QQTGGNAGYT IVATSGLVSN
     1021 NNNFDNFQLA KITGKKVNDL TGDGLSSDDT GLGGVTVNLY KDNASGVLVA STTTAADGTY
     1081 SFDNLAPGTY CVQELVPAGS VQTAGNAGYT VTVGGTGVQS GGTATGNDFA NFKQVTITGT
     1141 KFTDITGNSF SSDDTPRAGV TINLYQNGNF VTSTVTGADG TYKFENLGPG TYFVQELVPA
     1201 GATQTGGNAG YTIAATSGLV SNNNNFDNFY HGQITGKKVT DLTGNGLTSD DTGLGGVTIN
     1261 LYSGGSAAGA IVATTTTAAN GTYSFSNLAP GTYFVQELVP AGYQQTAGNA GYVVVIGQGG
     1321 VTSGGTSSGN DFANFQKITI SGTKYNDITG NSFSADDTPL AGVTINLFKD GGTTPVATTV
     1381 TGADGTYSFT DLAPGTYFVQ ELVPAGSVQT GGNAGYTIAA TSGLNSTGNN FDNFKKVSIT
     1441 GTKVTDKTGN GFTSDDAGLG GITINLYSGT STAGALVAST TTASNGTFSF SNLAPGTYFV
     1501 QEVVPSGYVQ TTGTSGYAVT VGGTGIQSGG TSANNNFANF QKVKITGTKF QDMDGCGFGS
     1561 DDVVLGGVTI KLYSGTSTAG ALVASTVTAA NGTFSFEGLA PGTYFVQEVV PTGWTQTGGN
     1621 AGYVVTVGGT GVQSGGTASG KNFDNYKKPN PGIDIEKTTN GPTNSNPVAP DYDNEDAVDG
     1681 AGVPILTPGS SVTWTYKVTN TGDVAFTTSQ IAIVDDNGTP GVTSDDLSIA NGKITFLSVL
     1741 TGDSDNLLEP GEVWLYKATG IVQDFSVPVS GSTVSFDFSG NSAVSGTAGN VRTFTSSGVS
     1801 VNASAFSRDK TTGAWSTAYL GSYGGGLGVT DTSESGSSNS HTVDNSGRDN YVLFEFSENV
     1861 VIDSAFLGYV VGDSDLTVWI GTKTGAFNSH LTLSDSVLAS LGFTEVNLGG SSTRTANLNA
     1921 ALLAGNVLVI AAKTGDSDDN FKIETLCLQK VKPGVYENKA TVTVPGASDS DLSHYKNPPA
     1981 VVGGSISGTK YLDVSGNGLN KTAGTNSPAD TPLAGVTIYL DLDNDGRLDV GEPETVTDAN
     2041 GNYLFTGLAS KTYYVREVVP AGFVRTGPAL SDNYAVAVSA GKSYTGYDFA NAETCEDDTV
     2101 TCVSFTIRHT DGTCETVTDL RGRTREGDLI TVTFNVNVPA GQTHQITFVS YTAPGADFDA
     2161 NTASQQKIYD LDTDEFGPGY HTLTVRVPNC YYQVDFVCGF AIDKLGPANS NIFYTPQKRL
     2221 VSADNGGAEC CDNDGMISGY KFNDADADGV WDNGEKGLSG WVVYLDSNNN GYKDSWETAT
     2281 VTDANGYYKF NNLAAGNYRV REVQQSGWVQ SAAPALVALT TGQNKTGVNF GNVAGSLVSG
     2341 CDTASIDFWN CSSGQSLIKS LNGGSTKTAL GTWLASNFSK LYGSSSSYNL SGKTNAQVAS
     2401 YFQTLAGKSD KLEAQILATA LAVYVTDSDL AGGTYARNYG FKVTTTGIAD EFYNIGTNGS
     2461 LFGVANGGVR TVWQILVAAN NSATSGLAWN GNSTARSAAR TLFAGLNDVG GIG
//