LOCUS VTR96973.1 2513 aa PRT BCT 03-FEB-2020 DEFINITION Gemmata massiliana Serine-aspartate repeat-containing protein F OS=Candidatus Accumulibacter sp. BA-93 GN=sdrF PE=4 SV=1: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B protein. ACCESSION LR593886-6062 PROTEIN_ID VTR96973.1 SOURCE Gemmata massiliana ORGANISM Gemmata massiliana Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae; Gemmata. REFERENCE 1 AUTHORS CONSRTM Science for Life Laboratories JOURNAL Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution, Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden FEATURES Qualifiers source /organism="Gemmata massiliana" /chromosome="1" /isolate="Soil9" /mol_type="genomic DNA" /isolation_source="soil" /db_xref="taxon:1210884" protein /locus_tag="SOIL9_09530" /note="BLAST_uniprot:hit_1 ; ACCESSION=tr|A0A011PQN1|A0A011PQN1_9PROT ; ALN/Q_length_ratio=0.199 ; DESCRIPTION=Serine-aspartate repeat-containing protein F OS=Candidatus Accumulibacter sp. BA-93 GN=sdrF PE=4 SV=1 ; EVALUE=1e-133 ; Q/S_length_ratio=1.160" /note="BLAST_uniprot:hit_2 ; ACCESSION=tr|A0A084Y1E0|A0A084Y1E0_9PROT ; ALN/Q_length_ratio=0.189 ; DESCRIPTION=Serine-aspartate repeat-containing protein F OS=Candidatus Accumulibacter sp. SK-01 GN=sdrF PE=4 SV=1 ; EVALUE=1e-123 ; Q/S_length_ratio=1.762" /note="BLAST_uniprot:hit_3 ; ACCESSION=tr|A0A080MK61|A0A080MK61_9PROT ; ALN/Q_length_ratio=0.149 ; DESCRIPTION=Serine-aspartate repeat-containing protein D OS=Candidatus Accumulibacter sp. SK-02 GN=sdrD PE=4 SV=1 ; EVALUE=1e-112 ; Q/S_length_ratio=3.351" /note="BLAST_uniprot:hit_4 ; ACCESSION=tr|N6ZZR9|N6ZZR9_9RHOO ; ALN/Q_length_ratio=0.173 ; DESCRIPTION=Collagen-binding protein OS=Thauera phenylacetica B4P GN=C667_07861 PE=4 SV=1 ; EVALUE=2e-93 ; Q/S_length_ratio=1.088" /note="BLAST_uniprot:hit_5 ; ACCESSION=tr|I3YB57|I3YB57_THIV6 ; ALN/Q_length_ratio=0.444 ; DESCRIPTION=Putative collagen-binding protein OS=Thiocystis violascens (strain ATCC 17096 / DSM 198 / 6111) GN=Thivi_2278 PE=4 SV=1 ; EVALUE=1e-85 ; Q/S_length_ratio=1.386" /note="BLAST_uniprot:hit_6 ; ACCESSION=tr|A3IZB2|A3IZB2_9CHRO ; ALN/Q_length_ratio=0.323 ; DESCRIPTION=Uncharacterized protein OS=Cyanothece sp. CCY0110 GN=CY0110_30026 PE=4 SV=1 ; EVALUE=1e-85 ; Q/S_length_ratio=1.733" /note="BLAST_uniprot:hit_7 ; ACCESSION=tr|C6WJY6|C6WJY6_ACTMD ; ALN/Q_length_ratio=0.589 ; DESCRIPTION=Conserved repeat domain protein OS=Actinosynnema mirum (strain ATCC 29888 / DSM 43827 / NBRC 14064 / IMRU 3971) GN=Amir_2421 PE=4 SV=1 ; EVALUE=3e-85 ; Q/S_length_ratio=0.745" /note="BLAST_uniprot:hit_8 ; ACCESSION=tr|Q8YWB9|Q8YWB9_NOSS1 ; ALN/Q_length_ratio=0.430 ; DESCRIPTION=All1696 protein OS=Nostoc sp. (strain PCC 7120 / UTEX 2576) GN=all1696 PE=4 SV=1 ; EVALUE=1e-81 ; Q/S_length_ratio=1.257" /note="BLAST_uniprot:hit_9 ; ACCESSION=tr|M5SPI7|M5SPI7_9PLAN ; ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain protein OS=Rhodopirellula europaea SH398 GN=RESH_01285 PE=4 SV=1 ; EVALUE=3e-77 ; Q/S_length_ratio=1.455" /note="BLAST_uniprot:hit_10 ; ACCESSION=tr|L7CFZ1|L7CFZ1_RHOBT ; ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain protein OS=Rhodopirellula baltica SWK14 GN=RBSWK_03634 PE=4 SV=1 ; EVALUE=6e-77 ; Q/S_length_ratio=1.438" /note="BLAST_uniprot:hit_11 ; ACCESSION=tr|K5D2K5|K5D2K5_RHOBT ; ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain protein OS=Rhodopirellula baltica SH28 GN=RBSH_03818 PE=4 SV=1 ; EVALUE=6e-77 ; Q/S_length_ratio=1.455" /note="BLAST_uniprot:hit_12 ; ACCESSION=tr|Q7ULR8|Q7ULR8_RHOBA ; ALN/Q_length_ratio=0.417 ; DESCRIPTION=Probable fibrinogen-binding protein homolog-putative involved in cell-cell interaction OS=Rhodopirellula baltica (strain SH1) GN=RB9330 PE=4 SV=1 ; EVALUE=3e-76 ; Q/S_length_ratio=1.431" /note="BLAST_uniprot:hit_13 ; ACCESSION=tr|M5UPV6|M5UPV6_9PLAN ; ALN/Q_length_ratio=0.392 ; DESCRIPTION=Collagen-binding surface protein Cna-like, B region domain protein OS=Rhodopirellula sallentina SM41 GN=RSSM_00552 PE=4 SV=1 ; EVALUE=3e-76 ; Q/S_length_ratio=1.335" /note="BLAST_uniprot:hit_14 ; ACCESSION=tr|F2AZ90|F2AZ90_RHOBT ; ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain protein OS=Rhodopirellula baltica WH47 GN=RBWH47_05824 PE=4 SV=1 ; EVALUE=4e-76 ; Q/S_length_ratio=1.455" /note="BLAST_uniprot:hit_15 ; ACCESSION=tr|E8R1G1|E8R1G1_ISOPI ; ALN/Q_length_ratio=0.563 ; DESCRIPTION=Cna B domain protein OS=Isosphaera pallida (strain ATCC 43644 / DSM 9630 / IS1B) GN=Isop_1796 PE=4 SV=1 ; EVALUE=2e-74 ; Q/S_length_ratio=1.653" /note="Pfam_scan:hit_1 (243..309); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:56; HMM_Length:70; EVALUE:7.3e-09; BITSCORE: 35.2" /note="Pfam_scan:hit_2 (340..405); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70; EVALUE:2.7e-08; BITSCORE: 33.4" /note="Pfam_scan:hit_3 (437..502); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:48; HMM_Length:70; EVALUE:7.8e-09; BITSCORE: 35.1" /note="Pfam_scan:hit_4 (543..607); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:57; HMM_Length:70; EVALUE:4.2e-09; BITSCORE: 36.0" /note="Pfam_scan:hit_5 (639..705); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70; EVALUE:4.7e-07; BITSCORE: 29.4" /note="Pfam_scan:hit_6 (744..798); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:51; HMM_Length:70; EVALUE:2.5e-06; BITSCORE: 27.1" /note="Pfam_scan:hit_7 (850..917); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70; EVALUE:6.9e-08; BITSCORE: 32.1" /note="Pfam_scan:hit_8 (955..1020); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70; EVALUE:2.7e-08; BITSCORE: 33.4" /note="Pfam_scan:hit_9 (1052..1117); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:48; HMM_Length:70; EVALUE:1.9e-08; BITSCORE: 33.9" /note="Pfam_scan:hit_10 (1158..1222); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:57; HMM_Length:70; EVALUE:4.2e-09; BITSCORE: 36.0" /note="Pfam_scan:hit_11 (1254..1318); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:53; HMM_Length:70; EVALUE:7.6e-11; BITSCORE: 41.6" /note="Pfam_scan:hit_12 (1360..1427); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:49; HMM_Length:70; EVALUE:4.2e-10; BITSCORE: 39.2" /note="Pfam_scan:hit_13 (1459..1526); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:55; HMM_Length:70; EVALUE:6e-09; BITSCORE: 35.5" /note="Pfam_scan:hit_14 (1565..1628); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:52; HMM_Length:70; EVALUE:8.5e-08; BITSCORE: 31.8" /note="Pfam_scan:hit_15 (1992..2071); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:32; HMM_Length:70; EVALUE:1.3e-06; BITSCORE: 28.0" /note="Pfam_scan:hit_16 (2258..2329); Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:64; HMM_Length:70; EVALUE:3.4e-09; BITSCORE: 36.3" BEGIN 1 MTPTWKTFLS RLHSTISGTG RRPIRTRRPR ALAIEQLEDR LVPAFALQFS TNGGATFSAP 61 VTDQGVGDTD ALVGTIGVNI GAVTIAASSL GSTGTASTTL NLSVTGVAAA SAHDIIVRAS 121 LSDLTTTPAP QTLVYSFTGS TPSGGTVTSQ TWVDDNNALF GMTGDTTGAK TIPASGSLVV 181 SDTVPYSATT QIHLVFKNTF PINLSLNNLN TITASPEQKA EIHGTKFEDV NGNGVRESSE 241 AGLQGWTIQL LDTNDNVLAT TLTAVDGSYS FTNLTPGIYR VREVNQAGWT QITANPGDIG 301 TVSGSNITGV DFGNFKNITI AGTKYTDITG NSFSSDDTPL AGITVNLFKN GALVATTTTA 361 TDGTYSFANQ GPGNYFVQEL VPTGYQQTGG NAGYTIVATS GLVSNNNNFD NFQLAKITGK 421 KVNDLTGDGL SSDDTGLGGV TVNLYKDNAS GVLVASTTTA ADGTYSFDNL APGTYFVQEL 481 VPAGSVQTAG NAGYTVTVGG TGVQSGGTAT GNDFANFKQV TITGTKFTDI TGNSFSSDDT 541 PRAGVTINLY QNGNFVTSTV TGADGTYKFE NLGPGTYFVQ ELVPAGATQT GGNAGYTIAA 601 TSGLVSNNNN FDNFYHGQIT GKKVTDLTGN GLTSDDTGLG GVTVNLYKAT STLTLIASTV 661 TAADGTYSFG DLDLGTYFVQ ELVPSGYVQT GGNTGYTITV GPGGVVSGGT SSGNDFANFQ 721 KGSITGTKYT DITGNGLSGD DTELGGVTIN LYSGNSTAGT LVASTVTAAN GTYSFGDLAP 781 GTYFVQELVP AGATQTAGSA GYVVVIGQGG VGSGGTSSGN NFANFYRGQI TGTKYTDVTG 841 NGITGDDTGL GGVTINLYKD NASGALIATT TTASDGTYSF GNLDLGTYFV QEIVPAGSTQ 901 TAGIAGYTIT VGSGGVASGG TATGNNFANF KNITIAGTKY TDITGNSFSS DDTPLAGITV 961 NLFKNGALVA TTTTATDGTY SFANQGPGNY FVQELVPTGY QQTGGNAGYT IVATSGLVSN 1021 NNNFDNFQLA KITGKKVNDL TGDGLSSDDT GLGGVTVNLY KDNASGVLVA STTTAADGTY 1081 SFDNLAPGTY CVQELVPAGS VQTAGNAGYT VTVGGTGVQS GGTATGNDFA NFKQVTITGT 1141 KFTDITGNSF SSDDTPRAGV TINLYQNGNF VTSTVTGADG TYKFENLGPG TYFVQELVPA 1201 GATQTGGNAG YTIAATSGLV SNNNNFDNFY HGQITGKKVT DLTGNGLTSD DTGLGGVTIN 1261 LYSGGSAAGA IVATTTTAAN GTYSFSNLAP GTYFVQELVP AGYQQTAGNA GYVVVIGQGG 1321 VTSGGTSSGN DFANFQKITI SGTKYNDITG NSFSADDTPL AGVTINLFKD GGTTPVATTV 1381 TGADGTYSFT DLAPGTYFVQ ELVPAGSVQT GGNAGYTIAA TSGLNSTGNN FDNFKKVSIT 1441 GTKVTDKTGN GFTSDDAGLG GITINLYSGT STAGALVAST TTASNGTFSF SNLAPGTYFV 1501 QEVVPSGYVQ TTGTSGYAVT VGGTGIQSGG TSANNNFANF QKVKITGTKF QDMDGCGFGS 1561 DDVVLGGVTI KLYSGTSTAG ALVASTVTAA NGTFSFEGLA PGTYFVQEVV PTGWTQTGGN 1621 AGYVVTVGGT GVQSGGTASG KNFDNYKKPN PGIDIEKTTN GPTNSNPVAP DYDNEDAVDG 1681 AGVPILTPGS SVTWTYKVTN TGDVAFTTSQ IAIVDDNGTP GVTSDDLSIA NGKITFLSVL 1741 TGDSDNLLEP GEVWLYKATG IVQDFSVPVS GSTVSFDFSG NSAVSGTAGN VRTFTSSGVS 1801 VNASAFSRDK TTGAWSTAYL GSYGGGLGVT DTSESGSSNS HTVDNSGRDN YVLFEFSENV 1861 VIDSAFLGYV VGDSDLTVWI GTKTGAFNSH LTLSDSVLAS LGFTEVNLGG SSTRTANLNA 1921 ALLAGNVLVI AAKTGDSDDN FKIETLCLQK VKPGVYENKA TVTVPGASDS DLSHYKNPPA 1981 VVGGSISGTK YLDVSGNGLN KTAGTNSPAD TPLAGVTIYL DLDNDGRLDV GEPETVTDAN 2041 GNYLFTGLAS KTYYVREVVP AGFVRTGPAL SDNYAVAVSA GKSYTGYDFA NAETCEDDTV 2101 TCVSFTIRHT DGTCETVTDL RGRTREGDLI TVTFNVNVPA GQTHQITFVS YTAPGADFDA 2161 NTASQQKIYD LDTDEFGPGY HTLTVRVPNC YYQVDFVCGF AIDKLGPANS NIFYTPQKRL 2221 VSADNGGAEC CDNDGMISGY KFNDADADGV WDNGEKGLSG WVVYLDSNNN GYKDSWETAT 2281 VTDANGYYKF NNLAAGNYRV REVQQSGWVQ SAAPALVALT TGQNKTGVNF GNVAGSLVSG 2341 CDTASIDFWN CSSGQSLIKS LNGGSTKTAL GTWLASNFSK LYGSSSSYNL SGKTNAQVAS 2401 YFQTLAGKSD KLEAQILATA LAVYVTDSDL AGGTYARNYG FKVTTTGIAD EFYNIGTNGS 2461 LFGVANGGVR TVWQILVAAN NSATSGLAWN GNSTARSAAR TLFAGLNDVG GIG //