LOCUS VTR94733.1 818 aa PRT BCT 03-FEB-2020 DEFINITION Gemmata massiliana (myosin heavy-chain) kinase : Uncultured bacterium genome assembly Metasoil_fosmids_resub OS=uncultured bacterium PE=4 SV=1: WD40: PD40: WD40 protein. ACCESSION LR593886-4034 PROTEIN_ID VTR94733.1 SOURCE Gemmata massiliana ORGANISM Gemmata massiliana Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae; Gemmata. REFERENCE 1 AUTHORS CONSRTM Science for Life Laboratories JOURNAL Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution, Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden FEATURES Qualifiers source /organism="Gemmata massiliana" /chromosome="1" /isolate="Soil9" /mol_type="genomic DNA" /isolation_source="soil" /db_xref="taxon:1210884" protein /locus_tag="SOIL9_29810" /note="BLAST_uniprot:hit_1 ; ACCESSION=tr|A0A090KPX2|A0A090KPX2_9BACT ; ALN/Q_length_ratio=1.016 ; DESCRIPTION=Uncultured bacterium genome assembly Metasoil_fosmids_resub OS=uncultured bacterium PE=4 SV=1 ; EVALUE=9e-45 ; Q/S_length_ratio=0.706" /note="BLAST_uniprot:hit_2 ; ACCESSION=tr|K9V395|K9V395_9CYAN ; ALN/Q_length_ratio=0.676 ; DESCRIPTION=(Myosin heavy-chain) kinase OS=Calothrix sp. PCC 6303 GN=Cal6303_2739 PE=4 SV=1 ; EVALUE=8e-36 ; Q/S_length_ratio=0.513" /note="BLAST_uniprot:hit_3 ; ACCESSION=tr|B2IXC4|B2IXC4_NOSP7 ; ALN/Q_length_ratio=0.709 ; DESCRIPTION=WD-40 repeat protein OS=Nostoc punctiforme (strain ATCC 29133 / PCC 73102) GN=Npun_F1222 PE=4 SV=1 ; EVALUE=3e-35 ; Q/S_length_ratio=0.675" /note="BLAST_uniprot:hit_4 ; ACCESSION=tr|Q10XW6|Q10XW6_TRIEI ; ALN/Q_length_ratio=0.725 ; DESCRIPTION=WD-40 repeat OS=Trichodesmium erythraeum (strain IMS101) GN=Tery_3869 PE=4 SV=1 ; EVALUE=1e-33 ; Q/S_length_ratio=0.527" /note="BLAST_uniprot:hit_5 ; ACCESSION=tr|B7KD29|B7KD29_CYAP7 ; ALN/Q_length_ratio=0.677 ; DESCRIPTION=WD-40 repeat protein OS=Cyanothece sp. (strain PCC 7424) GN=PCC7424_4792 PE=4 SV=1 ; EVALUE=1e-33 ; Q/S_length_ratio=0.600" /note="BLAST_uniprot:hit_6 ; ACCESSION=tr|S9QCY4|S9QCY4_9DELT ; ALN/Q_length_ratio=0.666 ; DESCRIPTION=High-affnity carbon uptake protein Hat/HatR OS=Cystobacter fuscus DSM 2262 GN=D187_003093 PE=4 SV=1 ; EVALUE=2e-33 ; Q/S_length_ratio=0.703" /note="BLAST_uniprot:hit_7 ; ACCESSION=tr|Q111Z3|Q111Z3_TRIEI ; ALN/Q_length_ratio=0.682 ; DESCRIPTION=Peptidase C14, caspase catalytic subunit p20 OS=Trichodesmium erythraeum (strain IMS101) GN=Tery_2471 PE=4 SV=1 ; EVALUE=2e-32 ; Q/S_length_ratio=0.552" /note="BLAST_uniprot:hit_8 ; ACCESSION=tr|Q10VX7|Q10VX7_TRIEI ; ALN/Q_length_ratio=0.730 ; DESCRIPTION=WD-40 repeat OS=Trichodesmium erythraeum (strain IMS101) GN=Tery_4625 PE=4 SV=1 ; EVALUE=4e-32 ; Q/S_length_ratio=0.542" /note="BLAST_uniprot:hit_9 ; ACCESSION=tr|S9QRF9|S9QRF9_9DELT ; ALN/Q_length_ratio=0.667 ; DESCRIPTION=High-affnity carbon uptake protein Hat/HatR OS=Cystobacter fuscus DSM 2262 GN=D187_003092 PE=4 SV=1 ; EVALUE=1e-31 ; Q/S_length_ratio=0.702" /note="BLAST_uniprot:hit_10 ; ACCESSION=tr|A8YGJ6|A8YGJ6_MICAE ; ALN/Q_length_ratio=0.762 ; DESCRIPTION=Genome sequencing data, contig C309 OS=Microcystis aeruginosa PCC 7806 GN=IPF_734 PE=4 SV=1 ; EVALUE=2e-31 ; Q/S_length_ratio=0.681" /note="BLAST_uniprot:hit_11 ; ACCESSION=tr|L8NXS5|L8NXS5_MICAE ; ALN/Q_length_ratio=0.762 ; DESCRIPTION=WD domain, G-beta repeat family protein OS=Microcystis aeruginosa DIANCHI905 GN=C789_1479 PE=4 SV=1 ; EVALUE=2e-31 ; Q/S_length_ratio=0.681" /note="BLAST_uniprot:hit_12 ; ACCESSION=tr|F4KU47|F4KU47_HALH1 ; ALN/Q_length_ratio=0.654 ; DESCRIPTION=(Myosin heavy-chain) kinase., Histone acetyltransferase OS=Haliscomenobacter hydrossis (strain ATCC 27775 / DSM 1100 / LMG 10767 / O) GN=Halhy_2265 PE=4 SV=1 ; EVALUE=4e-31 ; Q/S_length_ratio=0.725" /note="BLAST_uniprot:hit_13 ; ACCESSION=tr|K9PFT4|K9PFT4_9CYAN ; ALN/Q_length_ratio=0.762 ; DESCRIPTION=WD40 repeat-containing protein OS=Calothrix sp. PCC 7507 GN=Cal7507_1331 PE=4 SV=1 ; EVALUE=2e-30 ; Q/S_length_ratio=0.714" /note="BLAST_uniprot:hit_14 ; ACCESSION=tr|B4W111|B4W111_9CYAN ; ALN/Q_length_ratio=0.655 ; DESCRIPTION=Putative uncharacterized protein OS=Coleofasciculus chthonoplastes PCC 7420 GN=MC7420_7550 PE=4 SV=1 ; EVALUE=3e-30 ; Q/S_length_ratio=1.159" /note="BLAST_uniprot:hit_15 ; ACCESSION=tr|A0EB01|A0EB01_PARTE ; ALN/Q_length_ratio=0.704 ; DESCRIPTION=Chromosome undetermined scaffold_87, whole genome shotgun sequence OS=Paramecium tetraurelia GN=GSPATT00025202001 PE=4 SV=1 ; EVALUE=4e-30 ; Q/S_length_ratio=1.113" /note="Pfam_scan:hit_1 (64..96); Pfam:PF00400.27:WD40; Pfam_type:Repeat;HMM_aln_Length:24; HMM_Length:39; EVALUE:5.2e-07; BITSCORE: 29.2" /note="Pfam_scan:hit_2 (220..261); Pfam:PF07676.7:PD40; Pfam_type:Repeat;HMM_aln_Length:21; HMM_Length:39; EVALUE:0.11; BITSCORE: 12.1" /note="Pfam_scan:hit_3 (473..506); Pfam:PF00400.27:WD40; Pfam_type:Repeat;HMM_aln_Length:28; HMM_Length:39; EVALUE:0.016; BITSCORE: 15.0" /note="GO_domain:GO:0003674" BEGIN 1 MAARPGSWIL AGVLLCGAAG LAFGQKDPPA PAPQPKPAPK QPAQPAKGPN GLAEGVIARL 61 GKTRLRHAER PTCVAFAPDG KTFVTGGEDG TVRAWSVATG DQVGIVQRPA MSVETLRYVH 121 GGTKLAVHHS SETVIRLLDA KTLREVDSVP FPNPHRFGFS TDGSMVITSE PTGNAVVTEV 181 EGNLPKLELT PADYFDFRPD GKAIAVASAK GTLTVHLVTG GKPVFSLKDL GNIYGVAYSP 241 DGKRIAIGSR TPAGVDTVRI FAENNPKPLN EIAGANLPRA WISGDVLAVG NGSDAGVYNL 301 KTNEWAGRIS GAFGEFAVSP DGTKLVATGK GGLRVRLWDL TTGKQLHAED DSFPDPALML 361 GCADGKSLFL LTTETAYLWS VGADKAKVVG TLPARAVSAA ANGGTLAIAT PDTVVAFTDF 421 DPLKGLPSKP AVTFEGSAGA KVVAVSPDSK RVAWAVDGGK VVIASATGNT RVELPPTTTS 481 IMALAFDPSG KKLAQIGRDG FVRLWSLTES DKKPKELWIV RIGRGQRAAL AFSPDGKLIA 541 AASQAQVPVF NTADGSEVFK ADRYSEDGYA HHVAFSPDSK LLMFGSSGTA GRVEVWELAT 601 QGLVRSYTSG YGGISRLAVF PDGTRVASAG AEEAVTVWDL TFRGTKPAPT ADELRTAWTN 661 LESPDAAVGY PATKLLAAAG EAGTETIARS AKDLLATQQK IQSWVEDLAS ETLAVREVAS 721 KQLFDLGTRA MPTLAAASKS KNTELRDRAQ ALLSKMEEKG LSTPAHGFVG DSIRLYRAVQ 781 ALEAIGTPKA QTVLSEIATT GGRPGDEAKA ALARLKKK //