LOCUS VTR94201.1 2220 aa PRT BCT 03-FEB-2020 DEFINITION Gemmata massiliana cadherin-related protein : Uncharacterized protein OS=Cylindrospermopsis raciborskii CS-505 GN=CRC_01020 PE=3 SV=1: MAM: Lectin_C: Lectin_C: PKD protein. ACCESSION LR593886-3502 PROTEIN_ID VTR94201.1 SOURCE Gemmata massiliana ORGANISM Gemmata massiliana Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae; Gemmata. REFERENCE 1 AUTHORS CONSRTM Science for Life Laboratories JOURNAL Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution, Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden FEATURES Qualifiers source /organism="Gemmata massiliana" /chromosome="1" /isolate="Soil9" /mol_type="genomic DNA" /isolation_source="soil" /db_xref="taxon:1210884" protein /locus_tag="SOIL9_35130" /note="BLAST_uniprot:hit_1 ; ACCESSION=tr|D4TF66|D4TF66_9NOST ; ALN/Q_length_ratio=0.076 ; DESCRIPTION=Uncharacterized protein OS=Cylindrospermopsis raciborskii CS-505 GN=CRC_01020 PE=3 SV=1 ; EVALUE=2e-59 ; Q/S_length_ratio=0.675" /note="BLAST_uniprot:hit_2 ; ACCESSION=tr|I4G2A9|I4G2A9_MICAE ; ALN/Q_length_ratio=0.075 ; DESCRIPTION=Putative peptidase OS=Microcystis aeruginosa PCC 9443 GN=MICAC_2910001 PE=3 SV=1 ; EVALUE=7e-59 ; Q/S_length_ratio=1.651" /note="BLAST_uniprot:hit_3 ; ACCESSION=tr|B0JT18|B0JT18_MICAN ; ALN/Q_length_ratio=0.076 ; DESCRIPTION=Putative peptidase OS=Microcystis aeruginosa (strain NIES-843) GN=MAE_12400 PE=3 SV=1 ; EVALUE=1e-55 ; Q/S_length_ratio=0.876" /note="BLAST_uniprot:hit_4 ; ACCESSION=tr|M5TC19|M5TC19_9PLAN ; ALN/Q_length_ratio=0.158 ; DESCRIPTION=Cadherin-related protein OS=Rhodopirellula sp. SWK7 GN=RRSWK_00797 PE=4 SV=1 ; EVALUE=3e-50 ; Q/S_length_ratio=1.939" /note="BLAST_uniprot:hit_5 ; ACCESSION=tr|A0A017SYD8|A0A017SYD8_9DELT ; ALN/Q_length_ratio=0.078 ; DESCRIPTION=Uncharacterized protein OS=Chondromyces apiculatus DSM 436 GN=CAP_7929 PE=4 SV=1 ; EVALUE=3e-50 ; Q/S_length_ratio=4.073" /note="BLAST_uniprot:hit_6 ; ACCESSION=tr|A1S2J6|A1S2J6_SHEAM ; ALN/Q_length_ratio=0.077 ; DESCRIPTION=Uncharacterized protein OS=Shewanella amazonensis (strain ATCC BAA-1098 / SB2B) GN=Sama_0391 PE=4 SV=1 ; EVALUE=6e-49 ; Q/S_length_ratio=6.748" /note="BLAST_uniprot:hit_7 ; ACCESSION=tr|A0A085XWK6|A0A085XWK6_9DELT ; ALN/Q_length_ratio=0.081 ; DESCRIPTION=Uncharacterized protein OS=Sandaracinus amylolyticus GN=DB32_3395 PE=4 SV=1 ; EVALUE=1e-48 ; Q/S_length_ratio=4.521" /note="BLAST_uniprot:hit_8 ; ACCESSION=tr|A9EPJ6|A9EPJ6_SORC5 ; ALN/Q_length_ratio=0.078 ; DESCRIPTION=Uncharacterized protein OS=Sorangium cellulosum (strain So ce56) GN=sce0833 PE=4 SV=1 ; EVALUE=2e-47 ; Q/S_length_ratio=4.286" /note="BLAST_uniprot:hit_9 ; ACCESSION=tr|A0A017TJ43|A0A017TJ43_9DELT ; ALN/Q_length_ratio=0.078 ; DESCRIPTION=Uncharacterized protein OS=Chondromyces apiculatus DSM 436 GN=CAP_2773 PE=4 SV=1 ; EVALUE=1e-46 ; Q/S_length_ratio=3.213" /note="BLAST_uniprot:hit_10 ; ACCESSION=tr|A0A085Y8U9|A0A085Y8U9_9DELT ; ALN/Q_length_ratio=0.074 ; DESCRIPTION=Uncharacterized protein OS=Sandaracinus amylolyticus GN=DB32_4508 PE=4 SV=1 ; EVALUE=3e-46 ; Q/S_length_ratio=5.092" /note="BLAST_uniprot:hit_12 ; ACCESSION=tr|A0A017SY98|A0A017SY98_9DELT ; ALN/Q_length_ratio=0.082 ; DESCRIPTION=Uncharacterized protein OS=Chondromyces apiculatus DSM 436 GN=CAP_8435 PE=4 SV=1 ; EVALUE=7e-46 ; Q/S_length_ratio=4.396" /note="BLAST_uniprot:hit_11 ; ACCESSION=tr|A6G8Z6|A6G8Z6_9DELT ; ALN/Q_length_ratio=0.077 ; DESCRIPTION=Putative lipoprotein OS=Plesiocystis pacifica SIR-1 GN=PPSIR1_14055 PE=4 SV=1 ; EVALUE=7e-46 ; Q/S_length_ratio=4.302" /note="BLAST_uniprot:hit_13 ; ACCESSION=tr|I3YTD9|I3YTD9_AEQSU ; ALN/Q_length_ratio=0.124 ; DESCRIPTION=HYR domain-containing protein OS=Aequorivita sublithincola (strain DSM 14238 / LMG 21431 / ACAM 643 / 9-3) GN=Aeqsu_0750 PE=4 SV=1 ; EVALUE=1e-41 ; Q/S_length_ratio=1.461" /note="BLAST_uniprot:hit_14 ; ACCESSION=tr|A9F8T9|A9F8T9_SORC5 ; ALN/Q_length_ratio=0.077 ; DESCRIPTION=Uncharacterized protein OS=Sorangium cellulosum (strain So ce56) GN=sce4527 PE=4 SV=1 ; EVALUE=1e-36 ; Q/S_length_ratio=9.447" /note="BLAST_uniprot:hit_15 ; ACCESSION=tr|S4Y150|S4Y150_SORCE ; ALN/Q_length_ratio=0.077 ; DESCRIPTION=Uncharacterized protein OS=Sorangium cellulosum So0157-2 GN=SCE1572_27585 PE=4 SV=1 ; EVALUE=1e-30 ; Q/S_length_ratio=9.447" /note="Pfam_scan:hit_1 (44..216); Pfam:PF00629.18:MAM; Pfam_type:Domain;HMM_aln_Length:153; HMM_Length:160; EVALUE:1.1e-05; BITSCORE: 25.2" /note="Pfam_scan:hit_2 (1398..1490); Pfam:PF00059.16:Lectin_C; Pfam_type:Domain;HMM_aln_Length:71; HMM_Length:105; EVALUE:2.9e-08; BITSCORE: 34.2" /note="Pfam_scan:hit_3 (1646..1741); Pfam:PF00059.16:Lectin_C; Pfam_type:Domain;HMM_aln_Length:69; HMM_Length:105; EVALUE:1.4e-06; BITSCORE: 28.8" /note="Pfam_scan:hit_4 (1820..1909); Pfam:PF00801.15:PKD; Pfam_type:Domain;HMM_aln_Length:57; HMM_Length:69; EVALUE:1.1e-06; BITSCORE: 28.3" /note="GO_domain:GO:0005575" BEGIN 1 MFSLKSWLRR WKPVTRKPSS RRSPRRAPLG VARLEDRLVP SVLFSEDFSD NSAGWTLGTE 61 WQIGSATLSA GQSTGNPDPA LDHTPTGDNG VAGVKIGGNA ATTVHDYYYL TSPTINTASA 121 TAPVTLEFYR WLNSDYAPFM ANRVEVFDGA SWQAVWQTAG SPGIQDSSWQ RQQFDVSAYK 181 NANMQVRFGF SVGSSGAFTM SSWNIDDVTI TASDPPPTEN GLSAQIVGAP ANSSEGSAIT 241 VSAAVTDTVG TGPYAYVWSV TKNGASYAAG TSTDPTFTFT PDDNGTYLIG LTVTAPGGRT 301 SGATTGTGPT DVLIIYDALN AQTQSLKNSL EAAGFNVALS STDETLFNGT NPSLAPFEAV 361 IHLNGTTWSS PMPVAGQNAL VGYVQSGGAY LGSEWSSYET QYGSMGPMRD LALFDYQSER 421 FLTTLTLTEI AAQSAHPILA NIPASVSFSA SALIGPVHTF ATNPATVLMT DQFGNAALAV 481 REFGTGRVVG FHNAGNYSGG TALSDTELQQ LYIDGVKWAS RRGAGGPGAS ATILVTNVAP 541 TATLSSAAPV PEAVPVTVTF TGAADASTAD QAAGFRYSFA TSAAGLATSY AGASPLASGQ 601 VTFPDNGTYT VFARIFDKDG GFRDYTTNVT VTNSAPTATI STGGSVGEGS AATVSLINPV 661 DSATDLSAGL RYSFSTSAAN LATSYATAGA ASAQQFSFPE NGTYTVFARV FDKDGGSSDY 721 QTTVTVTNVA PIVTITGAPA NSPEGTAITL GSTVSDPGSG DTFTYAWSVT KNGVPYATGT 781 PTNGSTFTFT PNDNGTYVVS LIVTDDDGGV GIAGTGSFGG PTAGTTDVLI IYDAATAPGT 841 IALRNALQAA GMNVSLSTTD ETLFNGSNPF LTPYEAVIHL NGITWPTDMP LGGQTALVNY 901 VQNGGGYIGN EWNAYEFSVG RMQQMRDLIL LNSVSNSSGN LTLTDVPGQS GHPILANVPS 961 PAFFSASYNV GQVRSYATQP AVALMRDQFG NDAVAVREFG IGHVVAFHHA GNYFSGTLND 1021 ADVLQLYVDG VKWAARASGG QGATITVTNA APTATDVSVT PVVNEGGTAT VTGRITDPGA 1081 ADTHTVTVSW GDGTSSTAVV NADRTFTATH VYTDDNPTGT PADVYQVGVS VRDDDGGVSG 1141 GGTQELVTNG GFESGFTGWT TNVQSGTWSL NSGSTDPDGP GLPTAPISGQ FDALAAQSGP 1201 SRLILSAPIV VPTGITSAVL SWSDRIRNHY SQYSDPNQEW RVRVLDAAGN ELTTVFSTNP 1261 GDPLEQFGPN HRSVDLTALL QGRAGQTIRL SFELDDNLFY FNVNLDDVSL LTTTGPGIPV 1321 TVTNVAPTAP VLQVSPAVGE DGTVTLTGTF TDAGLNDTHT VTVDWGDGSQ TVLGGGATVP 1381 VSQAVEYNGH RYYVIRQAGL SWFEAQNQAQ RLGGNLVTIN DAAENTFVSE LLRSNFGYYA 1441 LAWIGLNDEA NEGQFGWVSG DPITYTNWFV QDGEPNDYPP QVTEDFAITN YAYGYGPGWW 1501 NDLAGTRDSA IYWGAYAVVE VNPTRTFTLS HRYADDTAGA YTIGVTVTDD DTGASSATTT 1561 ATVTNAAPTD LTVSADAVTI NEDGSVTLTG SFTDRGTLDA HTVTIDWKDG TTSQVAVPGF 1621 PGAPSPGVNL ATSAEFGGHT YHFISTPLAW ADAEAEARRM GGHLVTINSD AENLFLFHYV 1681 RRAALQGDVQ TWIGLSDGGT DGPLQWASGE SLGYTNWATG QPSDLVGPTG YAFNYNNVEI 1741 GARWGAFSAE TPLFAVIEVD GKRTFTATHR YLDDAPSGTA SDTYAIGVTV TDDDAGTTST 1801 TVPVTVNNIA PVIGSLTGPV AGTQTTATPG GAPVAFSGVR GQPLAFSVGF SDTGTIDTHE 1861 VQWNFGDGTV SGWLPASGST ASAPAHAFAA TGTYTVTVTV RDDDGGTVSF AQQVVIKTIE 1921 LQADPTDPSK TALVVGGTTG TDQIQLSGSS SVTVNLNGSY LGSFARTGRL AAYGQGGNDQ 1981 VQISGNFEDV LVDAGAGTDQ IQLSGTFRDL FTDGGAGNDQ TQVSGNFRDA VLSAGSGNDT 2041 VQVSGNFNTT TVSAGDGDDN VQISGTFARV LVAGGAGNDV LRVYGTGPSI LVGGDGNDEL 2101 VGSTGRSLLI GGRGADRITG SSAEDVLIAG FTAYDDDFGA LTALHGVWVD PTKNYAQRVA 2161 ALQLAGTIGG IRLAPDTVFD DDSADRLTGA AGRDWFLFAP TRDDVTDDAA NESLGFTNTP //