LOCUS VTR91965.1 1111 aa PRT BCT 03-FEB-2020 DEFINITION Gemmata massiliana (myosin heavy-chain) kinase : Uncultured bacterium genome assembly Metasoil_fosmids_resub OS=uncultured bacterium PE=4 SV=1: Sigma70_r2: Sigma70_r4_2: WD40 protein. ACCESSION LR593886-1266 PROTEIN_ID VTR91965.1 SOURCE Gemmata massiliana ORGANISM Gemmata massiliana Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae; Gemmata. REFERENCE 1 AUTHORS CONSRTM Science for Life Laboratories JOURNAL Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution, Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden FEATURES Qualifiers source /organism="Gemmata massiliana" /chromosome="1" /isolate="Soil9" /mol_type="genomic DNA" /isolation_source="soil" /db_xref="taxon:1210884" protein /locus_tag="SOIL9_57490" /note="BLAST_uniprot:hit_1 ; ACCESSION=tr|A0A090KPX2|A0A090KPX2_9BACT ; ALN/Q_length_ratio=1.000 ; DESCRIPTION=Uncultured bacterium genome assembly Metasoil_fosmids_resub OS=uncultured bacterium PE=4 SV=1 ; EVALUE=8e-88 ; Q/S_length_ratio=0.959" /note="BLAST_uniprot:hit_2 ; ACCESSION=tr|F4KU47|F4KU47_HALH1 ; ALN/Q_length_ratio=0.519 ; DESCRIPTION=(Myosin heavy-chain) kinase., Histone acetyltransferase OS=Haliscomenobacter hydrossis (strain ATCC 27775 / DSM 1100 / LMG 10767 / O) GN=Halhy_2265 PE=4 SV=1 ; EVALUE=5e-34 ; Q/S_length_ratio=0.984" /note="BLAST_uniprot:hit_3 ; ACCESSION=tr|K9V395|K9V395_9CYAN ; ALN/Q_length_ratio=0.514 ; DESCRIPTION=(Myosin heavy-chain) kinase OS=Calothrix sp. PCC 6303 GN=Cal6303_2739 PE=4 SV=1 ; EVALUE=4e-33 ; Q/S_length_ratio=0.697" /note="BLAST_uniprot:hit_4 ; ACCESSION=tr|B2IZJ6|B2IZJ6_NOSP7 ; ALN/Q_length_ratio=0.519 ; DESCRIPTION=WD-40 repeat protein OS=Nostoc punctiforme (strain ATCC 29133 / PCC 73102) GN=Npun_F1419 PE=4 SV=1 ; EVALUE=2e-32 ; Q/S_length_ratio=0.606" /note="BLAST_uniprot:hit_5 ; ACCESSION=tr|A0YMI4|A0YMI4_LYNSP ; ALN/Q_length_ratio=0.524 ; DESCRIPTION=WD-40 repeat protein OS=Lyngbya sp. (strain PCC 8106) GN=L8106_17667 PE=4 SV=1 ; EVALUE=2e-32 ; Q/S_length_ratio=0.812" /note="BLAST_uniprot:hit_6 ; ACCESSION=tr|X6PA04|X6PA04_RETFI ; ALN/Q_length_ratio=0.518 ; DESCRIPTION=G-protein beta WD-40 repeats containing protein (Fragment) OS=Reticulomyxa filosa GN=RFI_02058 PE=4 SV=1 ; EVALUE=3e-32 ; Q/S_length_ratio=1.501" /note="BLAST_uniprot:hit_7 ; ACCESSION=tr|Q10VX7|Q10VX7_TRIEI ; ALN/Q_length_ratio=0.502 ; DESCRIPTION=WD-40 repeat OS=Trichodesmium erythraeum (strain IMS101) GN=Tery_4625 PE=4 SV=1 ; EVALUE=1e-31 ; Q/S_length_ratio=0.736" /note="BLAST_uniprot:hit_8 ; ACCESSION=tr|C7RS72|C7RS72_ACCPU ; ALN/Q_length_ratio=0.524 ; DESCRIPTION=WD-40 repeat protein OS=Accumulibacter phosphatis (strain UW-1) GN=CAP2UW1_2609 PE=4 SV=1 ; EVALUE=2e-31 ; Q/S_length_ratio=0.640" /note="BLAST_uniprot:hit_9 ; ACCESSION=tr|X6MEE5|X6MEE5_RETFI ; ALN/Q_length_ratio=0.519 ; DESCRIPTION=G-protein beta WD-40 repeats containing protein OS=Reticulomyxa filosa GN=RFI_25013 PE=4 SV=1 ; EVALUE=4e-31 ; Q/S_length_ratio=1.319" /note="BLAST_uniprot:hit_10 ; ACCESSION=tr|K9QMP1|K9QMP1_NOSS7 ; ALN/Q_length_ratio=0.482 ; DESCRIPTION=WD40 repeat-containing protein OS=Nostoc sp. (strain ATCC 29411 / PCC 7524) GN=Nos7524_0419 PE=4 SV=1 ; EVALUE=5e-31 ; Q/S_length_ratio=0.610" /note="BLAST_uniprot:hit_11 ; ACCESSION=tr|B2IXC4|B2IXC4_NOSP7 ; ALN/Q_length_ratio=0.518 ; DESCRIPTION=WD-40 repeat protein OS=Nostoc punctiforme (strain ATCC 29133 / PCC 73102) GN=Npun_F1222 PE=4 SV=1 ; EVALUE=6e-30 ; Q/S_length_ratio=0.917" /note="BLAST_uniprot:hit_12 ; ACCESSION=tr|Q10XW6|Q10XW6_TRIEI ; ALN/Q_length_ratio=0.500 ; DESCRIPTION=WD-40 repeat OS=Trichodesmium erythraeum (strain IMS101) GN=Tery_3869 PE=4 SV=1 ; EVALUE=1e-29 ; Q/S_length_ratio=0.715" /note="BLAST_uniprot:hit_13 ; ACCESSION=tr|B7K750|B7K750_CYAP7 ; ALN/Q_length_ratio=0.517 ; DESCRIPTION=WD-40 repeat protein OS=Cyanothece sp. (strain PCC 7424) GN=PCC7424_1167 PE=4 SV=1 ; EVALUE=1e-29 ; Q/S_length_ratio=0.955" /note="BLAST_uniprot:hit_14 ; ACCESSION=tr|A5URP9|A5URP9_ROSS1 ; ALN/Q_length_ratio=0.479 ; DESCRIPTION=Ribosome assembly protein 4 (RSA4) OS=Roseiflexus sp. (strain RS-1) GN=RoseRS_0892 PE=4 SV=1 ; EVALUE=2e-29 ; Q/S_length_ratio=1.596" /note="BLAST_uniprot:hit_15 ; ACCESSION=tr|Q111Z3|Q111Z3_TRIEI ; ALN/Q_length_ratio=0.500 ; DESCRIPTION=Peptidase C14, caspase catalytic subunit p20 OS=Trichodesmium erythraeum (strain IMS101) GN=Tery_2471 PE=4 SV=1 ; EVALUE=3e-29 ; Q/S_length_ratio=0.750" /note="Pfam_scan:hit_1 (42..102); Pfam:PF04542.9:Sigma70_r2; Pfam_type:Domain;HMM_aln_Length:57; HMM_Length:71; EVALUE:1.1e-06; BITSCORE: 28.1" /note="Pfam_scan:hit_2 (130..183); Pfam:PF08281.7:Sigma70_r4_2; Pfam_type:Domain;HMM_aln_Length:50; HMM_Length:54; EVALUE:2.5e-09; BITSCORE: 36.4" /note="Pfam_scan:hit_3 (304..338); Pfam:PF00400.27:WD40; Pfam_type:Repeat;HMM_aln_Length:29; HMM_Length:39; EVALUE:8.7e-05; BITSCORE: 22.2" /note="GO_domain:GO:0003677" /note="GO_domain:GO:0001071" /note="GO_domain:GO:0000988" /note="GO_domain:GO:0034641" /note="GO_domain:GO:0009058" /note="GO_domain:GO:0043234" /note="GO_domain:GO:0005622" BEGIN 1 MRLTAALQLV RTVERAPVCD TSDAELLRRF CRDRDEGAFR EILRRYEALV RDASRRLTRD 61 RHAVDDAAQA TFLTLARKAH TIRHAEALPS WLYRVARSVT ARPVAVVPTV TEPVDPTSSP 121 LDQLSAREVL AIFDEELARL PAAHRSAVLL CTIEGNTVED TARRLGTTPG AVRGWLQRGR 181 ETLRHRLGRR GVELSVAVSL LLIDSTTGTA GATLDAIVRG AMATHSPVNV VTRFLTGSSV 241 TSAVVSVLVA GAVASVVLLS SGASAPPPVP EPKAEAKVDT QADALVTRDG LPEGAVARIG 301 SPRLRHAGEV AAMAFSRDGR RLATASPANR DKSVRVWDLT NGKEMYRVPV AVNSHENTER 361 HRTVAVAFTA DDKRLLVLDA AEFRTFDATT GRQELVTVLF KETNPNQFFP PDRIIGAGFS 421 PDANVFVVVR QNGEMVLGDT TAGTVKRIFT KAMTVPENTH YAHVDVLFTP DGTEVCVPIP 481 GEPVPLFDVA TGKSKRALAK ELVSQHQMLH NAAFADGGRK FVTITSTAQE GKPSTHAITI 541 GDIATGKVLR TIPLTALPRV LSASPNGKLL AVSTDSVSSS EIRVLDLESG KELQSMPLEL 601 TPALVTFSPD SRLLAGTCHY EGRVTVWNLE KNARHPQSAD EHARAAHFDA RGNVVLRQSS 661 RTITVNWQNG KVLGDKKELK PESTFSHLGT ESGDGKVRAT LDVPEGKSGR PLAILVKETD 721 TGKTVARLEG LSDFPWRMVF ADRNRLVVTV TQDNVLTVWD VVAGKVLWSE AYPARSLGYS 781 GMGAPHFDAA NSRMAIGSLT QKGTVIDVWE LRRHNRVSRV EAPGPVLTGG IAFSPDGAFI 841 AGGSETVTCW RVSDGRVMHT LKGHATKESP NDRPAISCEF SADGRKLLTV DGTGTIRVWE 901 FATGQVIRTF SGHKGPTTAH FAPDARAIVG ASYEAPVFVW DVYGLGAPTS FNADRVWTDL 961 ADASSTTAFR AVRELCASPK EAIALLKQKL EPESIDPKAI AGWVKDLSSE QFADRERATA 1021 ELEKRGETIA SLLREALGAA TDAETRQRLT AILGRIDRPS PTALRLHRAM DALEHLGTPE 1081 AKSHLETLSR GALKGSRTIQ AKEALSRISE R //