LOCUS VTR96973.1 2513 aa PRT BCT 03-FEB-2020
DEFINITION Gemmata massiliana Serine-aspartate repeat-containing
protein F OS=Candidatus Accumulibacter sp. BA-93 GN=sdrF
PE=4 SV=1: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B:
Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B: Cna_B:
Cna_B protein.
ACCESSION LR593886-6062
PROTEIN_ID VTR96973.1
SOURCE Gemmata massiliana
ORGANISM Gemmata massiliana
Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae;
Gemmata.
REFERENCE 1
AUTHORS
CONSRTM Science for Life Laboratories
JOURNAL Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND
MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution,
Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden
FEATURES Qualifiers
source /organism="Gemmata massiliana"
/chromosome="1"
/isolate="Soil9"
/mol_type="genomic DNA"
/isolation_source="soil"
/db_xref="taxon:1210884"
protein /locus_tag="SOIL9_09530"
/note="BLAST_uniprot:hit_1 ;
ACCESSION=tr|A0A011PQN1|A0A011PQN1_9PROT ;
ALN/Q_length_ratio=0.199 ; DESCRIPTION=Serine-aspartate
repeat-containing protein F OS=Candidatus Accumulibacter
sp. BA-93 GN=sdrF PE=4 SV=1 ; EVALUE=1e-133 ;
Q/S_length_ratio=1.160"
/note="BLAST_uniprot:hit_2 ;
ACCESSION=tr|A0A084Y1E0|A0A084Y1E0_9PROT ;
ALN/Q_length_ratio=0.189 ; DESCRIPTION=Serine-aspartate
repeat-containing protein F OS=Candidatus Accumulibacter
sp. SK-01 GN=sdrF PE=4 SV=1 ; EVALUE=1e-123 ;
Q/S_length_ratio=1.762"
/note="BLAST_uniprot:hit_3 ;
ACCESSION=tr|A0A080MK61|A0A080MK61_9PROT ;
ALN/Q_length_ratio=0.149 ; DESCRIPTION=Serine-aspartate
repeat-containing protein D OS=Candidatus Accumulibacter
sp. SK-02 GN=sdrD PE=4 SV=1 ; EVALUE=1e-112 ;
Q/S_length_ratio=3.351"
/note="BLAST_uniprot:hit_4 ;
ACCESSION=tr|N6ZZR9|N6ZZR9_9RHOO ;
ALN/Q_length_ratio=0.173 ; DESCRIPTION=Collagen-binding
protein OS=Thauera phenylacetica B4P GN=C667_07861 PE=4
SV=1 ; EVALUE=2e-93 ; Q/S_length_ratio=1.088"
/note="BLAST_uniprot:hit_5 ;
ACCESSION=tr|I3YB57|I3YB57_THIV6 ;
ALN/Q_length_ratio=0.444 ; DESCRIPTION=Putative
collagen-binding protein OS=Thiocystis violascens (strain
ATCC 17096 / DSM 198 / 6111) GN=Thivi_2278 PE=4 SV=1 ;
EVALUE=1e-85 ; Q/S_length_ratio=1.386"
/note="BLAST_uniprot:hit_6 ;
ACCESSION=tr|A3IZB2|A3IZB2_9CHRO ;
ALN/Q_length_ratio=0.323 ; DESCRIPTION=Uncharacterized
protein OS=Cyanothece sp. CCY0110 GN=CY0110_30026 PE=4
SV=1 ; EVALUE=1e-85 ; Q/S_length_ratio=1.733"
/note="BLAST_uniprot:hit_7 ;
ACCESSION=tr|C6WJY6|C6WJY6_ACTMD ;
ALN/Q_length_ratio=0.589 ; DESCRIPTION=Conserved repeat
domain protein OS=Actinosynnema mirum (strain ATCC 29888 /
DSM 43827 / NBRC 14064 / IMRU 3971) GN=Amir_2421 PE=4 SV=1
; EVALUE=3e-85 ; Q/S_length_ratio=0.745"
/note="BLAST_uniprot:hit_8 ;
ACCESSION=tr|Q8YWB9|Q8YWB9_NOSS1 ;
ALN/Q_length_ratio=0.430 ; DESCRIPTION=All1696 protein
OS=Nostoc sp. (strain PCC 7120 / UTEX 2576) GN=all1696
PE=4 SV=1 ; EVALUE=1e-81 ; Q/S_length_ratio=1.257"
/note="BLAST_uniprot:hit_9 ;
ACCESSION=tr|M5SPI7|M5SPI7_9PLAN ;
ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain
protein OS=Rhodopirellula europaea SH398 GN=RESH_01285
PE=4 SV=1 ; EVALUE=3e-77 ; Q/S_length_ratio=1.455"
/note="BLAST_uniprot:hit_10 ;
ACCESSION=tr|L7CFZ1|L7CFZ1_RHOBT ;
ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain
protein OS=Rhodopirellula baltica SWK14 GN=RBSWK_03634
PE=4 SV=1 ; EVALUE=6e-77 ; Q/S_length_ratio=1.438"
/note="BLAST_uniprot:hit_11 ;
ACCESSION=tr|K5D2K5|K5D2K5_RHOBT ;
ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain
protein OS=Rhodopirellula baltica SH28 GN=RBSH_03818 PE=4
SV=1 ; EVALUE=6e-77 ; Q/S_length_ratio=1.455"
/note="BLAST_uniprot:hit_12 ;
ACCESSION=tr|Q7ULR8|Q7ULR8_RHOBA ;
ALN/Q_length_ratio=0.417 ; DESCRIPTION=Probable
fibrinogen-binding protein homolog-putative involved in
cell-cell interaction OS=Rhodopirellula baltica (strain
SH1) GN=RB9330 PE=4 SV=1 ; EVALUE=3e-76 ;
Q/S_length_ratio=1.431"
/note="BLAST_uniprot:hit_13 ;
ACCESSION=tr|M5UPV6|M5UPV6_9PLAN ;
ALN/Q_length_ratio=0.392 ; DESCRIPTION=Collagen-binding
surface protein Cna-like, B region domain protein
OS=Rhodopirellula sallentina SM41 GN=RSSM_00552 PE=4 SV=1
; EVALUE=3e-76 ; Q/S_length_ratio=1.335"
/note="BLAST_uniprot:hit_14 ;
ACCESSION=tr|F2AZ90|F2AZ90_RHOBT ;
ALN/Q_length_ratio=0.417 ; DESCRIPTION=Repeat domain
protein OS=Rhodopirellula baltica WH47 GN=RBWH47_05824
PE=4 SV=1 ; EVALUE=4e-76 ; Q/S_length_ratio=1.455"
/note="BLAST_uniprot:hit_15 ;
ACCESSION=tr|E8R1G1|E8R1G1_ISOPI ;
ALN/Q_length_ratio=0.563 ; DESCRIPTION=Cna B domain
protein OS=Isosphaera pallida (strain ATCC 43644 / DSM
9630 / IS1B) GN=Isop_1796 PE=4 SV=1 ; EVALUE=2e-74 ;
Q/S_length_ratio=1.653"
/note="Pfam_scan:hit_1 (243..309); Pfam:PF05738.8:Cna_B;
Pfam_type:Family;HMM_aln_Length:56; HMM_Length:70;
EVALUE:7.3e-09; BITSCORE: 35.2"
/note="Pfam_scan:hit_2 (340..405); Pfam:PF05738.8:Cna_B;
Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70;
EVALUE:2.7e-08; BITSCORE: 33.4"
/note="Pfam_scan:hit_3 (437..502); Pfam:PF05738.8:Cna_B;
Pfam_type:Family;HMM_aln_Length:48; HMM_Length:70;
EVALUE:7.8e-09; BITSCORE: 35.1"
/note="Pfam_scan:hit_4 (543..607); Pfam:PF05738.8:Cna_B;
Pfam_type:Family;HMM_aln_Length:57; HMM_Length:70;
EVALUE:4.2e-09; BITSCORE: 36.0"
/note="Pfam_scan:hit_5 (639..705); Pfam:PF05738.8:Cna_B;
Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70;
EVALUE:4.7e-07; BITSCORE: 29.4"
/note="Pfam_scan:hit_6 (744..798); Pfam:PF05738.8:Cna_B;
Pfam_type:Family;HMM_aln_Length:51; HMM_Length:70;
EVALUE:2.5e-06; BITSCORE: 27.1"
/note="Pfam_scan:hit_7 (850..917); Pfam:PF05738.8:Cna_B;
Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70;
EVALUE:6.9e-08; BITSCORE: 32.1"
/note="Pfam_scan:hit_8 (955..1020); Pfam:PF05738.8:Cna_B;
Pfam_type:Family;HMM_aln_Length:61; HMM_Length:70;
EVALUE:2.7e-08; BITSCORE: 33.4"
/note="Pfam_scan:hit_9 (1052..1117); Pfam:PF05738.8:Cna_B;
Pfam_type:Family;HMM_aln_Length:48; HMM_Length:70;
EVALUE:1.9e-08; BITSCORE: 33.9"
/note="Pfam_scan:hit_10 (1158..1222);
Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:57;
HMM_Length:70; EVALUE:4.2e-09; BITSCORE: 36.0"
/note="Pfam_scan:hit_11 (1254..1318);
Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:53;
HMM_Length:70; EVALUE:7.6e-11; BITSCORE: 41.6"
/note="Pfam_scan:hit_12 (1360..1427);
Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:49;
HMM_Length:70; EVALUE:4.2e-10; BITSCORE: 39.2"
/note="Pfam_scan:hit_13 (1459..1526);
Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:55;
HMM_Length:70; EVALUE:6e-09; BITSCORE: 35.5"
/note="Pfam_scan:hit_14 (1565..1628);
Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:52;
HMM_Length:70; EVALUE:8.5e-08; BITSCORE: 31.8"
/note="Pfam_scan:hit_15 (1992..2071);
Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:32;
HMM_Length:70; EVALUE:1.3e-06; BITSCORE: 28.0"
/note="Pfam_scan:hit_16 (2258..2329);
Pfam:PF05738.8:Cna_B; Pfam_type:Family;HMM_aln_Length:64;
HMM_Length:70; EVALUE:3.4e-09; BITSCORE: 36.3"
BEGIN
1 MTPTWKTFLS RLHSTISGTG RRPIRTRRPR ALAIEQLEDR LVPAFALQFS TNGGATFSAP
61 VTDQGVGDTD ALVGTIGVNI GAVTIAASSL GSTGTASTTL NLSVTGVAAA SAHDIIVRAS
121 LSDLTTTPAP QTLVYSFTGS TPSGGTVTSQ TWVDDNNALF GMTGDTTGAK TIPASGSLVV
181 SDTVPYSATT QIHLVFKNTF PINLSLNNLN TITASPEQKA EIHGTKFEDV NGNGVRESSE
241 AGLQGWTIQL LDTNDNVLAT TLTAVDGSYS FTNLTPGIYR VREVNQAGWT QITANPGDIG
301 TVSGSNITGV DFGNFKNITI AGTKYTDITG NSFSSDDTPL AGITVNLFKN GALVATTTTA
361 TDGTYSFANQ GPGNYFVQEL VPTGYQQTGG NAGYTIVATS GLVSNNNNFD NFQLAKITGK
421 KVNDLTGDGL SSDDTGLGGV TVNLYKDNAS GVLVASTTTA ADGTYSFDNL APGTYFVQEL
481 VPAGSVQTAG NAGYTVTVGG TGVQSGGTAT GNDFANFKQV TITGTKFTDI TGNSFSSDDT
541 PRAGVTINLY QNGNFVTSTV TGADGTYKFE NLGPGTYFVQ ELVPAGATQT GGNAGYTIAA
601 TSGLVSNNNN FDNFYHGQIT GKKVTDLTGN GLTSDDTGLG GVTVNLYKAT STLTLIASTV
661 TAADGTYSFG DLDLGTYFVQ ELVPSGYVQT GGNTGYTITV GPGGVVSGGT SSGNDFANFQ
721 KGSITGTKYT DITGNGLSGD DTELGGVTIN LYSGNSTAGT LVASTVTAAN GTYSFGDLAP
781 GTYFVQELVP AGATQTAGSA GYVVVIGQGG VGSGGTSSGN NFANFYRGQI TGTKYTDVTG
841 NGITGDDTGL GGVTINLYKD NASGALIATT TTASDGTYSF GNLDLGTYFV QEIVPAGSTQ
901 TAGIAGYTIT VGSGGVASGG TATGNNFANF KNITIAGTKY TDITGNSFSS DDTPLAGITV
961 NLFKNGALVA TTTTATDGTY SFANQGPGNY FVQELVPTGY QQTGGNAGYT IVATSGLVSN
1021 NNNFDNFQLA KITGKKVNDL TGDGLSSDDT GLGGVTVNLY KDNASGVLVA STTTAADGTY
1081 SFDNLAPGTY CVQELVPAGS VQTAGNAGYT VTVGGTGVQS GGTATGNDFA NFKQVTITGT
1141 KFTDITGNSF SSDDTPRAGV TINLYQNGNF VTSTVTGADG TYKFENLGPG TYFVQELVPA
1201 GATQTGGNAG YTIAATSGLV SNNNNFDNFY HGQITGKKVT DLTGNGLTSD DTGLGGVTIN
1261 LYSGGSAAGA IVATTTTAAN GTYSFSNLAP GTYFVQELVP AGYQQTAGNA GYVVVIGQGG
1321 VTSGGTSSGN DFANFQKITI SGTKYNDITG NSFSADDTPL AGVTINLFKD GGTTPVATTV
1381 TGADGTYSFT DLAPGTYFVQ ELVPAGSVQT GGNAGYTIAA TSGLNSTGNN FDNFKKVSIT
1441 GTKVTDKTGN GFTSDDAGLG GITINLYSGT STAGALVAST TTASNGTFSF SNLAPGTYFV
1501 QEVVPSGYVQ TTGTSGYAVT VGGTGIQSGG TSANNNFANF QKVKITGTKF QDMDGCGFGS
1561 DDVVLGGVTI KLYSGTSTAG ALVASTVTAA NGTFSFEGLA PGTYFVQEVV PTGWTQTGGN
1621 AGYVVTVGGT GVQSGGTASG KNFDNYKKPN PGIDIEKTTN GPTNSNPVAP DYDNEDAVDG
1681 AGVPILTPGS SVTWTYKVTN TGDVAFTTSQ IAIVDDNGTP GVTSDDLSIA NGKITFLSVL
1741 TGDSDNLLEP GEVWLYKATG IVQDFSVPVS GSTVSFDFSG NSAVSGTAGN VRTFTSSGVS
1801 VNASAFSRDK TTGAWSTAYL GSYGGGLGVT DTSESGSSNS HTVDNSGRDN YVLFEFSENV
1861 VIDSAFLGYV VGDSDLTVWI GTKTGAFNSH LTLSDSVLAS LGFTEVNLGG SSTRTANLNA
1921 ALLAGNVLVI AAKTGDSDDN FKIETLCLQK VKPGVYENKA TVTVPGASDS DLSHYKNPPA
1981 VVGGSISGTK YLDVSGNGLN KTAGTNSPAD TPLAGVTIYL DLDNDGRLDV GEPETVTDAN
2041 GNYLFTGLAS KTYYVREVVP AGFVRTGPAL SDNYAVAVSA GKSYTGYDFA NAETCEDDTV
2101 TCVSFTIRHT DGTCETVTDL RGRTREGDLI TVTFNVNVPA GQTHQITFVS YTAPGADFDA
2161 NTASQQKIYD LDTDEFGPGY HTLTVRVPNC YYQVDFVCGF AIDKLGPANS NIFYTPQKRL
2221 VSADNGGAEC CDNDGMISGY KFNDADADGV WDNGEKGLSG WVVYLDSNNN GYKDSWETAT
2281 VTDANGYYKF NNLAAGNYRV REVQQSGWVQ SAAPALVALT TGQNKTGVNF GNVAGSLVSG
2341 CDTASIDFWN CSSGQSLIKS LNGGSTKTAL GTWLASNFSK LYGSSSSYNL SGKTNAQVAS
2401 YFQTLAGKSD KLEAQILATA LAVYVTDSDL AGGTYARNYG FKVTTTGIAD EFYNIGTNGS
2461 LFGVANGGVR TVWQILVAAN NSATSGLAWN GNSTARSAAR TLFAGLNDVG GIG
//