LOCUS       AEC07729.1               745 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana SPOC domain / Transcription elongation
            factor S-II protein.
ACCESSION   CP002685-3209
PROTEIN_ID  AEC07729.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /locus_tag="AT2G25640"
                     /gene_synonym="F3N11.9"
                     /gene_synonym="F3N11_9"
                     /inference="Similar to RNA sequence,
                     EST:INSD:BP867189.1,INSD:ES047054.1,INSD:AV528864.1,
                     INSD:ES106182.1,INSD:EH974742.1"
                     /inference="similar to RNA sequence, mRNA:INSD:AK175365.1"
                     /note="SPOC domain / Transcription elongation factor S-II
                     protein; FUNCTIONS IN: zinc ion binding; INVOLVED IN:
                     transcription; LOCATED IN: nucleus; EXPRESSED IN: 10 plant
                     structures; EXPRESSED DURING: 6 growth stages; CONTAINS
                     InterPro DOMAIN/s: Spen paralogue and orthologue SPOC,
                     C-terminal (InterPro:IPR012921), Transcription elongation
                     factor S-IIM (InterPro:IPR017890), Transcription
                     elongation factor S-II, central domain
                     (InterPro:IPR003618); BEST Arabidopsis thaliana protein
                     match is: SPOC domain / Transcription elongation factor
                     S-II protein (TAIR:AT5G11430.1); Has 1179 Blast hits to
                     1045 proteins in 235 species: Archae - 0; Bacteria - 202;
                     Metazoa - 503; Fungi - 239; Plants - 160; Viruses - 0;
                     Other Eukaryotes - 75 (source: NCBI BLink)."
                     /db_xref="Araport:AT2G25640"
                     /db_xref="TAIR:AT2G25640"
     intron_pos      619:2 (1/3)
     intron_pos      660:0 (2/3)
     intron_pos      680:0 (3/3)
BEGIN
        1 MSNNLLPQPC MQMGQFINVP TPTPELISNP EMRLSQPICS HISGGRQDFH VMLPSVVGLG
       61 SVNMDKTLLP GKRKSPLHPS VQNKRMALPM EGRPWASAPM PVQLSSVSPR TQYLPASFVS
      121 KNSFVSFSKP GKQAAARKPT LQKPMLLKPQ SESSGSVRSK MRESLAGALA MVQCQMDVPN
      181 ESKMLDSETV ANPLEGHVSG PVSAASGVDV MVSNGSTEML TLSDPSPVAG ISVQTVLPEI
      241 LSIAKTSDAQ VPEAVKPFVQ DNVSYSDNVF SKDDLLQGND LSWALESDIE FTVNCQNEMI
      301 GAMANDGSLE KLLLDPQVLA FEIETELFKL FGGVNKKYKE KGRSLLFNLK DKSNPKLREK
      361 VMYGEIAAER LCSMSAEELA SKELAEWRQA KAEEMAQMVV LQDTEVDIRS LVRKTHKGEF
      421 QVEVEPMDSG SVEVSVGMSS INWSRTKNFK KKTPSITKTL GVKNELNSSN ESTGPINGVT
      481 IDDEMQAATG SLPPIVSLDE FMSSIDSESP SGFLSSDTEK KPSVSDNNDV EEVLVSSPKE
      541 SANIDLCTSP VKAEALSPLT AKASSPVNAE DADIVSSKPS SDLKSKTTSV FIPDGERLWE
      601 GVLQLSPSTV SSVIGILRSG EKTTTKEWPI LLEIKGRVRL DAFEKFVREL PNSRSRAVMV
      661 MCFVCKEECS KTEQENISEV VDSYAKDGRV GYAEPASGVE LYLCPTRGRT VEILNKIVPR
      721 NQLDFLKSIN DDGLIGVVVW RRHTI
//