LOCUS VTR95457.1 1052 aa PRT BCT 03-FEB-2020 DEFINITION Gemmata massiliana wd-40 repeat protein : Uncultured bacterium genome assembly Metasoil_fosmids_resub OS=uncultured bacterium PE=4 SV=1: Sigma70_r2: Sigma70_r4_2: WD40: WD40: WD40 protein. ACCESSION LR593886-4758 PROTEIN_ID VTR95457.1 SOURCE Gemmata massiliana ORGANISM Gemmata massiliana Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae; Gemmata. REFERENCE 1 AUTHORS CONSRTM Science for Life Laboratories JOURNAL Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution, Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden FEATURES Qualifiers source /organism="Gemmata massiliana" /chromosome="1" /isolate="Soil9" /mol_type="genomic DNA" /isolation_source="soil" /db_xref="taxon:1210884" protein /locus_tag="SOIL9_22570" /note="BLAST_uniprot:hit_1 ; ACCESSION=tr|A0A090KPX2|A0A090KPX2_9BACT ; ALN/Q_length_ratio=1.067 ; DESCRIPTION=Uncultured bacterium genome assembly Metasoil_fosmids_resub OS=uncultured bacterium PE=4 SV=1 ; EVALUE=4e-88 ; Q/S_length_ratio=0.908" /note="BLAST_uniprot:hit_2 ; ACCESSION=tr|X0KUP7|X0KUP7_FUSOX ; ALN/Q_length_ratio=0.564 ; DESCRIPTION=Uncharacterized protein OS=Fusarium oxysporum f. sp. vasinfectum 25433 GN=FOTG_18972 PE=4 SV=1 ; EVALUE=5e-60 ; Q/S_length_ratio=1.179" /note="BLAST_uniprot:hit_3 ; ACCESSION=tr|K9V395|K9V395_9CYAN ; ALN/Q_length_ratio=0.569 ; DESCRIPTION=(Myosin heavy-chain) kinase OS=Calothrix sp. PCC 6303 GN=Cal6303_2739 PE=4 SV=1 ; EVALUE=9e-56 ; Q/S_length_ratio=0.660" /note="BLAST_uniprot:hit_4 ; ACCESSION=tr|K9UX17|K9UX17_9CYAN ; ALN/Q_length_ratio=0.536 ; DESCRIPTION=(Myosin heavy-chain) kinase OS=Calothrix sp. PCC 6303 GN=Cal6303_1366 PE=4 SV=1 ; EVALUE=4e-55 ; Q/S_length_ratio=1.670" /note="BLAST_uniprot:hit_5 ; ACCESSION=tr|A0YMI4|A0YMI4_LYNSP ; ALN/Q_length_ratio=0.513 ; DESCRIPTION=WD-40 repeat protein OS=Lyngbya sp. (strain PCC 8106) GN=L8106_17667 PE=4 SV=1 ; EVALUE=9e-55 ; Q/S_length_ratio=0.769" /note="BLAST_uniprot:hit_6 ; ACCESSION=tr|E0UJ20|E0UJ20_CYAP2 ; ALN/Q_length_ratio=0.553 ; DESCRIPTION=WD40 repeat, subgroup OS=Cyanothece sp. (strain PCC 7822) GN=Cyan7822_2631 PE=4 SV=1 ; EVALUE=5e-54 ; Q/S_length_ratio=0.828" /note="BLAST_uniprot:hit_7 ; ACCESSION=tr|A0A061AE54|A0A061AE54_9ACTO ; ALN/Q_length_ratio=0.550 ; DESCRIPTION=Transcriptional regulator, XRE family OS=Streptomyces iranensis GN=SIRAN60 PE=4 SV=1 ; EVALUE=2e-53 ; Q/S_length_ratio=0.852" /note="BLAST_uniprot:hit_8 ; ACCESSION=tr|D7BXH8|D7BXH8_STRBB ; ALN/Q_length_ratio=0.573 ; DESCRIPTION=Putative WD-40 repeat protein OS=Streptomyces bingchenggensis (strain BCW-1) GN=SBI_04631 PE=4 SV=1 ; EVALUE=6e-53 ; Q/S_length_ratio=0.813" /note="BLAST_uniprot:hit_9 ; ACCESSION=tr|B5VVI6|B5VVI6_ARTMA ; ALN/Q_length_ratio=0.474 ; DESCRIPTION=WD-40 repeat protein OS=Arthrospira maxima CS-328 GN=AmaxDRAFT_0527 PE=4 SV=1 ; EVALUE=3e-52 ; Q/S_length_ratio=1.269" /note="BLAST_uniprot:hit_10 ; ACCESSION=tr|B8LXS9|B8LXS9_TALSN ; ALN/Q_length_ratio=0.507 ; DESCRIPTION=G-protein beta WD-40 repeats containing protein, putative OS=Talaromyces stipitatus (strain ATCC 10500 / CBS 375.48 / QM 6759 / NRRL 1006) GN=TSTA_062310 PE=4 SV=1 ; EVALUE=4e-52 ; Q/S_length_ratio=0.653" /note="BLAST_uniprot:hit_11 ; ACCESSION=tr|A0EB01|A0EB01_PARTE ; ALN/Q_length_ratio=0.551 ; DESCRIPTION=Chromosome undetermined scaffold_87, whole genome shotgun sequence OS=Paramecium tetraurelia GN=GSPATT00025202001 PE=4 SV=1 ; EVALUE=2e-51 ; Q/S_length_ratio=1.431" /note="BLAST_uniprot:hit_12 ; ACCESSION=tr|B2IXC4|B2IXC4_NOSP7 ; ALN/Q_length_ratio=0.541 ; DESCRIPTION=WD-40 repeat protein OS=Nostoc punctiforme (strain ATCC 29133 / PCC 73102) GN=Npun_F1222 PE=4 SV=1 ; EVALUE=3e-51 ; Q/S_length_ratio=0.868" /note="BLAST_uniprot:hit_13 ; ACCESSION=tr|F4XK01|F4XK01_9CYAN ; ALN/Q_length_ratio=0.551 ; DESCRIPTION=WD-40 repeat-containing protein OS=Moorea producens 3L GN=LYNGBM3L_10820 PE=4 SV=1 ; EVALUE=5e-51 ; Q/S_length_ratio=0.722" /note="BLAST_uniprot:hit_14 ; ACCESSION=tr|A0A0A1VVL1|A0A0A1VVL1_MICAE ; ALN/Q_length_ratio=0.551 ; DESCRIPTION=High-affnity carbon uptake protein Hat/HatR OS=Microcystis aeruginosa NIES-44 GN=N44_02003 PE=4 SV=1 ; EVALUE=1e-50 ; Q/S_length_ratio=1.145" /note="BLAST_uniprot:hit_15 ; ACCESSION=tr|A0DHV3|A0DHV3_PARTE ; ALN/Q_length_ratio=0.574 ; DESCRIPTION=Chromosome undetermined scaffold_502, whole genome shotgun sequence (Fragment) OS=Paramecium tetraurelia GN=GSPATT00039495001 PE=4 SV=1 ; EVALUE=9e-50 ; Q/S_length_ratio=1.128" /note="Pfam_scan:hit_1 (45..114); Pfam:PF04542.9:Sigma70_r2; Pfam_type:Domain;HMM_aln_Length:69; HMM_Length:71; EVALUE:4.6e-09; BITSCORE: 35.7" /note="Pfam_scan:hit_2 (136..189); Pfam:PF08281.7:Sigma70_r4_2; Pfam_type:Domain;HMM_aln_Length:50; HMM_Length:54; EVALUE:5.9e-10; BITSCORE: 38.4" /note="Pfam_scan:hit_3 (495..529); Pfam:PF00400.27:WD40; Pfam_type:Repeat;HMM_aln_Length:27; HMM_Length:39; EVALUE:2.8e-06; BITSCORE: 26.9" /note="Pfam_scan:hit_4 (861..883); Pfam:PF00400.27:WD40; Pfam_type:Repeat;HMM_aln_Length:21; HMM_Length:39; EVALUE:0.0031; BITSCORE: 17.3" /note="Pfam_scan:hit_5 (887..925); Pfam:PF00400.27:WD40; Pfam_type:Repeat;HMM_aln_Length:33; HMM_Length:39; EVALUE:1.2e-09; BITSCORE: 37.7" /note="GO_domain:GO:0003677" /note="GO_domain:GO:0001071" /note="GO_domain:GO:0000988" /note="GO_domain:GO:0034641" /note="GO_domain:GO:0009058" /note="GO_domain:GO:0043234" /note="GO_domain:GO:0005622" BEGIN 1 MGRDVPRGLA HYIRDMAGLW RTDARTDREL LSAFVSGDGS AFAALVVRHG QTVWSACRRV 61 LGNDADAEDA FQATFIALAR NAAHVRSDSI SGWLQKVSHT VAVNARKAAH RRNTVERQLL 121 DRANRSDEQL PDEELRAVVD DEVARLPERL RVPLILYYLE GKTQAEIGRI LGVTDRAAAH 181 RLKQSLKLLR ERLGRRGVAV ATTALVAILG QVPIVTAVPI ALVTQATEIA LAVAAGSPID 241 TAATQLALGA TRTHGWARLK LYSLVLVSVA CALIGGALLA QRAEPYAESG PHGAPNAPLS 301 GVMNRTDWFG DQLPAGAIAR LGTVRFRTGG GTGLSSVAFG PAGKMLISSH GEDAVHFWDL 361 ETGREVRKLH APRACWAVTT ALNGNRLVAA GIDEIWAWDL ADGAPRFLWS ARSKSVGFAN 421 VEFSPDGTLI AHGGDAAEQI NLLDAATGAV VRTLAGHGER FAFSADSKLL ASWKWWEFTE 481 VGVWDVATGA KRHTFVASSG KKGVSSAAFA PSGKWLATAG QDGELRVWDL DRGIEQYHLA 541 SDADPNAFVG FGPHGSTLLE IGGGRVRSWD AVTGRMTRAI ACSIDNRWAN VHRLSADGSQ 601 SAVAWHSGVG AWDVATGREL GSAVEMPHES VHPVVFSRDG ATLATSTLDV NGAAVQLWDS 661 DGRPRQRFAI PPGQLVWGCD FAADGSLSAL IGTATQLPLD PPDRISRWDA RTGARFAESR 721 LPAGVRSVAF APDGHHMAVA LAEGVSLCNR ATGRVVRKLP GACTADALTF SADESTLAAL 781 DAATGEITIW SLAGGRERKW PVSADPKVRA SLRRSLALSP DGRLLAIGTE DFKIGIRVMN 841 VATGTEVWEL AGQLHGWRQE FAFAPDGRTI AACGFDGAVR VWELASGRER YRLAGHRSGV 901 GAVTFSPDGR RLASASFDCT VLIWDVSTPQ QPVPTDRPTV AQLWDALIAP DAAAGHRALV 961 SFAATPETSV PLLRDRLCPG SDTRSTDLGD ERDPKSPAHR ATARGIEALE RMGYDPAAKQ 1021 LLEDLAKHPI ESVSGREARR ALDRLAGSLK RD //