LOCUS VTR91965.1 1111 aa PRT BCT 03-FEB-2020
DEFINITION Gemmata massiliana (myosin heavy-chain) kinase : Uncultured
bacterium genome assembly Metasoil_fosmids_resub OS=uncultured
bacterium PE=4 SV=1: Sigma70_r2: Sigma70_r4_2: WD40 protein.
ACCESSION LR593886-1266
PROTEIN_ID VTR91965.1
SOURCE Gemmata massiliana
ORGANISM Gemmata massiliana
Bacteria; Planctomycetes; Planctomycetia; Gemmatales; Gemmataceae;
Gemmata.
REFERENCE 1
AUTHORS
CONSRTM Science for Life Laboratories
JOURNAL Submitted (14-MAY-2019) to the INSDC. DEPARTMENT OF CELL AND
MOLECULAR BIOLOGY, Uppsala University, Molecular Evolution,
Biomedicinskt centrum (BMC), Husargatan 3, 752 37 Uppsala, Sweden
FEATURES Qualifiers
source /organism="Gemmata massiliana"
/chromosome="1"
/isolate="Soil9"
/mol_type="genomic DNA"
/isolation_source="soil"
/db_xref="taxon:1210884"
protein /locus_tag="SOIL9_57490"
/note="BLAST_uniprot:hit_1 ;
ACCESSION=tr|A0A090KPX2|A0A090KPX2_9BACT ;
ALN/Q_length_ratio=1.000 ; DESCRIPTION=Uncultured
bacterium genome assembly Metasoil_fosmids_resub
OS=uncultured bacterium PE=4 SV=1 ; EVALUE=8e-88 ;
Q/S_length_ratio=0.959"
/note="BLAST_uniprot:hit_2 ;
ACCESSION=tr|F4KU47|F4KU47_HALH1 ;
ALN/Q_length_ratio=0.519 ; DESCRIPTION=(Myosin
heavy-chain) kinase., Histone acetyltransferase
OS=Haliscomenobacter hydrossis (strain ATCC 27775 / DSM
1100 / LMG 10767 / O) GN=Halhy_2265 PE=4 SV=1 ;
EVALUE=5e-34 ; Q/S_length_ratio=0.984"
/note="BLAST_uniprot:hit_3 ;
ACCESSION=tr|K9V395|K9V395_9CYAN ;
ALN/Q_length_ratio=0.514 ; DESCRIPTION=(Myosin
heavy-chain) kinase OS=Calothrix sp. PCC 6303
GN=Cal6303_2739 PE=4 SV=1 ; EVALUE=4e-33 ;
Q/S_length_ratio=0.697"
/note="BLAST_uniprot:hit_4 ;
ACCESSION=tr|B2IZJ6|B2IZJ6_NOSP7 ;
ALN/Q_length_ratio=0.519 ; DESCRIPTION=WD-40 repeat
protein OS=Nostoc punctiforme (strain ATCC 29133 / PCC
73102) GN=Npun_F1419 PE=4 SV=1 ; EVALUE=2e-32 ;
Q/S_length_ratio=0.606"
/note="BLAST_uniprot:hit_5 ;
ACCESSION=tr|A0YMI4|A0YMI4_LYNSP ;
ALN/Q_length_ratio=0.524 ; DESCRIPTION=WD-40 repeat
protein OS=Lyngbya sp. (strain PCC 8106) GN=L8106_17667
PE=4 SV=1 ; EVALUE=2e-32 ; Q/S_length_ratio=0.812"
/note="BLAST_uniprot:hit_6 ;
ACCESSION=tr|X6PA04|X6PA04_RETFI ;
ALN/Q_length_ratio=0.518 ; DESCRIPTION=G-protein beta
WD-40 repeats containing protein (Fragment)
OS=Reticulomyxa filosa GN=RFI_02058 PE=4 SV=1 ;
EVALUE=3e-32 ; Q/S_length_ratio=1.501"
/note="BLAST_uniprot:hit_7 ;
ACCESSION=tr|Q10VX7|Q10VX7_TRIEI ;
ALN/Q_length_ratio=0.502 ; DESCRIPTION=WD-40 repeat
OS=Trichodesmium erythraeum (strain IMS101) GN=Tery_4625
PE=4 SV=1 ; EVALUE=1e-31 ; Q/S_length_ratio=0.736"
/note="BLAST_uniprot:hit_8 ;
ACCESSION=tr|C7RS72|C7RS72_ACCPU ;
ALN/Q_length_ratio=0.524 ; DESCRIPTION=WD-40 repeat
protein OS=Accumulibacter phosphatis (strain UW-1)
GN=CAP2UW1_2609 PE=4 SV=1 ; EVALUE=2e-31 ;
Q/S_length_ratio=0.640"
/note="BLAST_uniprot:hit_9 ;
ACCESSION=tr|X6MEE5|X6MEE5_RETFI ;
ALN/Q_length_ratio=0.519 ; DESCRIPTION=G-protein beta
WD-40 repeats containing protein OS=Reticulomyxa filosa
GN=RFI_25013 PE=4 SV=1 ; EVALUE=4e-31 ;
Q/S_length_ratio=1.319"
/note="BLAST_uniprot:hit_10 ;
ACCESSION=tr|K9QMP1|K9QMP1_NOSS7 ;
ALN/Q_length_ratio=0.482 ; DESCRIPTION=WD40
repeat-containing protein OS=Nostoc sp. (strain ATCC 29411
/ PCC 7524) GN=Nos7524_0419 PE=4 SV=1 ; EVALUE=5e-31 ;
Q/S_length_ratio=0.610"
/note="BLAST_uniprot:hit_11 ;
ACCESSION=tr|B2IXC4|B2IXC4_NOSP7 ;
ALN/Q_length_ratio=0.518 ; DESCRIPTION=WD-40 repeat
protein OS=Nostoc punctiforme (strain ATCC 29133 / PCC
73102) GN=Npun_F1222 PE=4 SV=1 ; EVALUE=6e-30 ;
Q/S_length_ratio=0.917"
/note="BLAST_uniprot:hit_12 ;
ACCESSION=tr|Q10XW6|Q10XW6_TRIEI ;
ALN/Q_length_ratio=0.500 ; DESCRIPTION=WD-40 repeat
OS=Trichodesmium erythraeum (strain IMS101) GN=Tery_3869
PE=4 SV=1 ; EVALUE=1e-29 ; Q/S_length_ratio=0.715"
/note="BLAST_uniprot:hit_13 ;
ACCESSION=tr|B7K750|B7K750_CYAP7 ;
ALN/Q_length_ratio=0.517 ; DESCRIPTION=WD-40 repeat
protein OS=Cyanothece sp. (strain PCC 7424)
GN=PCC7424_1167 PE=4 SV=1 ; EVALUE=1e-29 ;
Q/S_length_ratio=0.955"
/note="BLAST_uniprot:hit_14 ;
ACCESSION=tr|A5URP9|A5URP9_ROSS1 ;
ALN/Q_length_ratio=0.479 ; DESCRIPTION=Ribosome assembly
protein 4 (RSA4) OS=Roseiflexus sp. (strain RS-1)
GN=RoseRS_0892 PE=4 SV=1 ; EVALUE=2e-29 ;
Q/S_length_ratio=1.596"
/note="BLAST_uniprot:hit_15 ;
ACCESSION=tr|Q111Z3|Q111Z3_TRIEI ;
ALN/Q_length_ratio=0.500 ; DESCRIPTION=Peptidase C14,
caspase catalytic subunit p20 OS=Trichodesmium erythraeum
(strain IMS101) GN=Tery_2471 PE=4 SV=1 ; EVALUE=3e-29 ;
Q/S_length_ratio=0.750"
/note="Pfam_scan:hit_1 (42..102);
Pfam:PF04542.9:Sigma70_r2;
Pfam_type:Domain;HMM_aln_Length:57; HMM_Length:71;
EVALUE:1.1e-06; BITSCORE: 28.1"
/note="Pfam_scan:hit_2 (130..183);
Pfam:PF08281.7:Sigma70_r4_2;
Pfam_type:Domain;HMM_aln_Length:50; HMM_Length:54;
EVALUE:2.5e-09; BITSCORE: 36.4"
/note="Pfam_scan:hit_3 (304..338); Pfam:PF00400.27:WD40;
Pfam_type:Repeat;HMM_aln_Length:29; HMM_Length:39;
EVALUE:8.7e-05; BITSCORE: 22.2"
/note="GO_domain:GO:0003677"
/note="GO_domain:GO:0001071"
/note="GO_domain:GO:0000988"
/note="GO_domain:GO:0034641"
/note="GO_domain:GO:0009058"
/note="GO_domain:GO:0043234"
/note="GO_domain:GO:0005622"
BEGIN
1 MRLTAALQLV RTVERAPVCD TSDAELLRRF CRDRDEGAFR EILRRYEALV RDASRRLTRD
61 RHAVDDAAQA TFLTLARKAH TIRHAEALPS WLYRVARSVT ARPVAVVPTV TEPVDPTSSP
121 LDQLSAREVL AIFDEELARL PAAHRSAVLL CTIEGNTVED TARRLGTTPG AVRGWLQRGR
181 ETLRHRLGRR GVELSVAVSL LLIDSTTGTA GATLDAIVRG AMATHSPVNV VTRFLTGSSV
241 TSAVVSVLVA GAVASVVLLS SGASAPPPVP EPKAEAKVDT QADALVTRDG LPEGAVARIG
301 SPRLRHAGEV AAMAFSRDGR RLATASPANR DKSVRVWDLT NGKEMYRVPV AVNSHENTER
361 HRTVAVAFTA DDKRLLVLDA AEFRTFDATT GRQELVTVLF KETNPNQFFP PDRIIGAGFS
421 PDANVFVVVR QNGEMVLGDT TAGTVKRIFT KAMTVPENTH YAHVDVLFTP DGTEVCVPIP
481 GEPVPLFDVA TGKSKRALAK ELVSQHQMLH NAAFADGGRK FVTITSTAQE GKPSTHAITI
541 GDIATGKVLR TIPLTALPRV LSASPNGKLL AVSTDSVSSS EIRVLDLESG KELQSMPLEL
601 TPALVTFSPD SRLLAGTCHY EGRVTVWNLE KNARHPQSAD EHARAAHFDA RGNVVLRQSS
661 RTITVNWQNG KVLGDKKELK PESTFSHLGT ESGDGKVRAT LDVPEGKSGR PLAILVKETD
721 TGKTVARLEG LSDFPWRMVF ADRNRLVVTV TQDNVLTVWD VVAGKVLWSE AYPARSLGYS
781 GMGAPHFDAA NSRMAIGSLT QKGTVIDVWE LRRHNRVSRV EAPGPVLTGG IAFSPDGAFI
841 AGGSETVTCW RVSDGRVMHT LKGHATKESP NDRPAISCEF SADGRKLLTV DGTGTIRVWE
901 FATGQVIRTF SGHKGPTTAH FAPDARAIVG ASYEAPVFVW DVYGLGAPTS FNADRVWTDL
961 ADASSTTAFR AVRELCASPK EAIALLKQKL EPESIDPKAI AGWVKDLSSE QFADRERATA
1021 ELEKRGETIA SLLREALGAA TDAETRQRLT AILGRIDRPS PTALRLHRAM DALEHLGTPE
1081 AKSHLETLSR GALKGSRTIQ AKEALSRISE R
//