LOCUS       VTR94201.1              2220 aa    PRT              BCT 03-FEB-2020
DEFINITION  Gemmata massiliana cadherin-related protein : Uncharacterized
            protein OS=Cylindrospermopsis raciborskii CS-505 GN=CRC_01020
            PE=3 SV=1: MAM: Lectin_C: Lectin_C: PKD protein.
ACCESSION   LR593886-3502
PROTEIN_ID  VTR94201.1
SOURCE      Gemmata massiliana
  ORGANISM  Gemmata massiliana
            Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae;
            Gemmata.
REFERENCE   1
  AUTHORS   
  CONSRTM   Science for Life Laboratories
  JOURNAL   Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND
            MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution,
            Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden
FEATURES             Qualifiers
     source          /organism="Gemmata massiliana"
                     /chromosome="1"
                     /isolate="Soil9"
                     /mol_type="genomic DNA"
                     /isolation_source="soil"
                     /db_xref="taxon:1210884"
     protein         /locus_tag="SOIL9_35130"
                     /note="BLAST_uniprot:hit_1 ;
                     ACCESSION=tr|D4TF66|D4TF66_9NOST ;
                     ALN/Q_length_ratio=0.076 ; DESCRIPTION=Uncharacterized
                     protein OS=Cylindrospermopsis raciborskii CS-505
                     GN=CRC_01020 PE=3 SV=1 ; EVALUE=2e-59 ;
                     Q/S_length_ratio=0.675"
                     /note="BLAST_uniprot:hit_2 ;
                     ACCESSION=tr|I4G2A9|I4G2A9_MICAE ;
                     ALN/Q_length_ratio=0.075 ; DESCRIPTION=Putative peptidase
                     OS=Microcystis aeruginosa PCC 9443 GN=MICAC_2910001 PE=3
                     SV=1 ; EVALUE=7e-59 ; Q/S_length_ratio=1.651"
                     /note="BLAST_uniprot:hit_3 ;
                     ACCESSION=tr|B0JT18|B0JT18_MICAN ;
                     ALN/Q_length_ratio=0.076 ; DESCRIPTION=Putative peptidase
                     OS=Microcystis aeruginosa (strain NIES-843) GN=MAE_12400
                     PE=3 SV=1 ; EVALUE=1e-55 ; Q/S_length_ratio=0.876"
                     /note="BLAST_uniprot:hit_4 ;
                     ACCESSION=tr|M5TC19|M5TC19_9PLAN ;
                     ALN/Q_length_ratio=0.158 ; DESCRIPTION=Cadherin-related
                     protein OS=Rhodopirellula sp. SWK7 GN=RRSWK_00797 PE=4
                     SV=1 ; EVALUE=3e-50 ; Q/S_length_ratio=1.939"
                     /note="BLAST_uniprot:hit_5 ;
                     ACCESSION=tr|A0A017SYD8|A0A017SYD8_9DELT ;
                     ALN/Q_length_ratio=0.078 ; DESCRIPTION=Uncharacterized
                     protein OS=Chondromyces apiculatus DSM 436 GN=CAP_7929
                     PE=4 SV=1 ; EVALUE=3e-50 ; Q/S_length_ratio=4.073"
                     /note="BLAST_uniprot:hit_6 ;
                     ACCESSION=tr|A1S2J6|A1S2J6_SHEAM ;
                     ALN/Q_length_ratio=0.077 ; DESCRIPTION=Uncharacterized
                     protein OS=Shewanella amazonensis (strain ATCC BAA-1098 /
                     SB2B) GN=Sama_0391 PE=4 SV=1 ; EVALUE=6e-49 ;
                     Q/S_length_ratio=6.748"
                     /note="BLAST_uniprot:hit_7 ;
                     ACCESSION=tr|A0A085XWK6|A0A085XWK6_9DELT ;
                     ALN/Q_length_ratio=0.081 ; DESCRIPTION=Uncharacterized
                     protein OS=Sandaracinus amylolyticus GN=DB32_3395 PE=4
                     SV=1 ; EVALUE=1e-48 ; Q/S_length_ratio=4.521"
                     /note="BLAST_uniprot:hit_8 ;
                     ACCESSION=tr|A9EPJ6|A9EPJ6_SORC5 ;
                     ALN/Q_length_ratio=0.078 ; DESCRIPTION=Uncharacterized
                     protein OS=Sorangium cellulosum (strain So ce56)
                     GN=sce0833 PE=4 SV=1 ; EVALUE=2e-47 ;
                     Q/S_length_ratio=4.286"
                     /note="BLAST_uniprot:hit_9 ;
                     ACCESSION=tr|A0A017TJ43|A0A017TJ43_9DELT ;
                     ALN/Q_length_ratio=0.078 ; DESCRIPTION=Uncharacterized
                     protein OS=Chondromyces apiculatus DSM 436 GN=CAP_2773
                     PE=4 SV=1 ; EVALUE=1e-46 ; Q/S_length_ratio=3.213"
                     /note="BLAST_uniprot:hit_10 ;
                     ACCESSION=tr|A0A085Y8U9|A0A085Y8U9_9DELT ;
                     ALN/Q_length_ratio=0.074 ; DESCRIPTION=Uncharacterized
                     protein OS=Sandaracinus amylolyticus GN=DB32_4508 PE=4
                     SV=1 ; EVALUE=3e-46 ; Q/S_length_ratio=5.092"
                     /note="BLAST_uniprot:hit_12 ;
                     ACCESSION=tr|A0A017SY98|A0A017SY98_9DELT ;
                     ALN/Q_length_ratio=0.082 ; DESCRIPTION=Uncharacterized
                     protein OS=Chondromyces apiculatus DSM 436 GN=CAP_8435
                     PE=4 SV=1 ; EVALUE=7e-46 ; Q/S_length_ratio=4.396"
                     /note="BLAST_uniprot:hit_11 ;
                     ACCESSION=tr|A6G8Z6|A6G8Z6_9DELT ;
                     ALN/Q_length_ratio=0.077 ; DESCRIPTION=Putative
                     lipoprotein OS=Plesiocystis pacifica SIR-1 GN=PPSIR1_14055
                     PE=4 SV=1 ; EVALUE=7e-46 ; Q/S_length_ratio=4.302"
                     /note="BLAST_uniprot:hit_13 ;
                     ACCESSION=tr|I3YTD9|I3YTD9_AEQSU ;
                     ALN/Q_length_ratio=0.124 ; DESCRIPTION=HYR
                     domain-containing protein OS=Aequorivita sublithincola
                     (strain DSM 14238 / LMG 21431 / ACAM 643 / 9-3)
                     GN=Aeqsu_0750 PE=4 SV=1 ; EVALUE=1e-41 ;
                     Q/S_length_ratio=1.461"
                     /note="BLAST_uniprot:hit_14 ;
                     ACCESSION=tr|A9F8T9|A9F8T9_SORC5 ;
                     ALN/Q_length_ratio=0.077 ; DESCRIPTION=Uncharacterized
                     protein OS=Sorangium cellulosum (strain So ce56)
                     GN=sce4527 PE=4 SV=1 ; EVALUE=1e-36 ;
                     Q/S_length_ratio=9.447"
                     /note="BLAST_uniprot:hit_15 ;
                     ACCESSION=tr|S4Y150|S4Y150_SORCE ;
                     ALN/Q_length_ratio=0.077 ; DESCRIPTION=Uncharacterized
                     protein OS=Sorangium cellulosum So0157-2 GN=SCE1572_27585
                     PE=4 SV=1 ; EVALUE=1e-30 ; Q/S_length_ratio=9.447"
                     /note="Pfam_scan:hit_1 (44..216); Pfam:PF00629.18:MAM;
                     Pfam_type:Domain;HMM_aln_Length:153; HMM_Length:160;
                     EVALUE:1.1e-05; BITSCORE: 25.2"
                     /note="Pfam_scan:hit_2 (1398..1490);
                     Pfam:PF00059.16:Lectin_C;
                     Pfam_type:Domain;HMM_aln_Length:71; HMM_Length:105;
                     EVALUE:2.9e-08; BITSCORE: 34.2"
                     /note="Pfam_scan:hit_3 (1646..1741);
                     Pfam:PF00059.16:Lectin_C;
                     Pfam_type:Domain;HMM_aln_Length:69; HMM_Length:105;
                     EVALUE:1.4e-06; BITSCORE: 28.8"
                     /note="Pfam_scan:hit_4 (1820..1909); Pfam:PF00801.15:PKD;
                     Pfam_type:Domain;HMM_aln_Length:57; HMM_Length:69;
                     EVALUE:1.1e-06; BITSCORE: 28.3"
                     /note="GO_domain:GO:0005575"
BEGIN
        1 MFSLKSWLRR WKPVTRKPSS RRSPRRAPLG VARLEDRLVP SVLFSEDFSD NSAGWTLGTE
       61 WQIGSATLSA GQSTGNPDPA LDHTPTGDNG VAGVKIGGNA ATTVHDYYYL TSPTINTASA
      121 TAPVTLEFYR WLNSDYAPFM ANRVEVFDGA SWQAVWQTAG SPGIQDSSWQ RQQFDVSAYK
      181 NANMQVRFGF SVGSSGAFTM SSWNIDDVTI TASDPPPTEN GLSAQIVGAP ANSSEGSAIT
      241 VSAAVTDTVG TGPYAYVWSV TKNGASYAAG TSTDPTFTFT PDDNGTYLIG LTVTAPGGRT
      301 SGATTGTGPT DVLIIYDALN AQTQSLKNSL EAAGFNVALS STDETLFNGT NPSLAPFEAV
      361 IHLNGTTWSS PMPVAGQNAL VGYVQSGGAY LGSEWSSYET QYGSMGPMRD LALFDYQSER
      421 FLTTLTLTEI AAQSAHPILA NIPASVSFSA SALIGPVHTF ATNPATVLMT DQFGNAALAV
      481 REFGTGRVVG FHNAGNYSGG TALSDTELQQ LYIDGVKWAS RRGAGGPGAS ATILVTNVAP
      541 TATLSSAAPV PEAVPVTVTF TGAADASTAD QAAGFRYSFA TSAAGLATSY AGASPLASGQ
      601 VTFPDNGTYT VFARIFDKDG GFRDYTTNVT VTNSAPTATI STGGSVGEGS AATVSLINPV
      661 DSATDLSAGL RYSFSTSAAN LATSYATAGA ASAQQFSFPE NGTYTVFARV FDKDGGSSDY
      721 QTTVTVTNVA PIVTITGAPA NSPEGTAITL GSTVSDPGSG DTFTYAWSVT KNGVPYATGT
      781 PTNGSTFTFT PNDNGTYVVS LIVTDDDGGV GIAGTGSFGG PTAGTTDVLI IYDAATAPGT
      841 IALRNALQAA GMNVSLSTTD ETLFNGSNPF LTPYEAVIHL NGITWPTDMP LGGQTALVNY
      901 VQNGGGYIGN EWNAYEFSVG RMQQMRDLIL LNSVSNSSGN LTLTDVPGQS GHPILANVPS
      961 PAFFSASYNV GQVRSYATQP AVALMRDQFG NDAVAVREFG IGHVVAFHHA GNYFSGTLND
     1021 ADVLQLYVDG VKWAARASGG QGATITVTNA APTATDVSVT PVVNEGGTAT VTGRITDPGA
     1081 ADTHTVTVSW GDGTSSTAVV NADRTFTATH VYTDDNPTGT PADVYQVGVS VRDDDGGVSG
     1141 GGTQELVTNG GFESGFTGWT TNVQSGTWSL NSGSTDPDGP GLPTAPISGQ FDALAAQSGP
     1201 SRLILSAPIV VPTGITSAVL SWSDRIRNHY SQYSDPNQEW RVRVLDAAGN ELTTVFSTNP
     1261 GDPLEQFGPN HRSVDLTALL QGRAGQTIRL SFELDDNLFY FNVNLDDVSL LTTTGPGIPV
     1321 TVTNVAPTAP VLQVSPAVGE DGTVTLTGTF TDAGLNDTHT VTVDWGDGSQ TVLGGGATVP
     1381 VSQAVEYNGH RYYVIRQAGL SWFEAQNQAQ RLGGNLVTIN DAAENTFVSE LLRSNFGYYA
     1441 LAWIGLNDEA NEGQFGWVSG DPITYTNWFV QDGEPNDYPP QVTEDFAITN YAYGYGPGWW
     1501 NDLAGTRDSA IYWGAYAVVE VNPTRTFTLS HRYADDTAGA YTIGVTVTDD DTGASSATTT
     1561 ATVTNAAPTD LTVSADAVTI NEDGSVTLTG SFTDRGTLDA HTVTIDWKDG TTSQVAVPGF
     1621 PGAPSPGVNL ATSAEFGGHT YHFISTPLAW ADAEAEARRM GGHLVTINSD AENLFLFHYV
     1681 RRAALQGDVQ TWIGLSDGGT DGPLQWASGE SLGYTNWATG QPSDLVGPTG YAFNYNNVEI
     1741 GARWGAFSAE TPLFAVIEVD GKRTFTATHR YLDDAPSGTA SDTYAIGVTV TDDDAGTTST
     1801 TVPVTVNNIA PVIGSLTGPV AGTQTTATPG GAPVAFSGVR GQPLAFSVGF SDTGTIDTHE
     1861 VQWNFGDGTV SGWLPASGST ASAPAHAFAA TGTYTVTVTV RDDDGGTVSF AQQVVIKTIE
     1921 LQADPTDPSK TALVVGGTTG TDQIQLSGSS SVTVNLNGSY LGSFARTGRL AAYGQGGNDQ
     1981 VQISGNFEDV LVDAGAGTDQ IQLSGTFRDL FTDGGAGNDQ TQVSGNFRDA VLSAGSGNDT
     2041 VQVSGNFNTT TVSAGDGDDN VQISGTFARV LVAGGAGNDV LRVYGTGPSI LVGGDGNDEL
     2101 VGSTGRSLLI GGRGADRITG SSAEDVLIAG FTAYDDDFGA LTALHGVWVD PTKNYAQRVA
     2161 ALQLAGTIGG IRLAPDTVFD DDSADRLTGA AGRDWFLFAP TRDDVTDDAA NESLGFTNTP
//