LOCUS       AEE76407.1               370 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana mRNA capping enzyme family protein.
ACCESSION   CP002686-3889
PROTEIN_ID  AEE76407.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 23459830)
  AUTHORS   Salanoubat,M., Lemcke,K., Rieger,M., Ansorge,W., Unseld,M.,
            Fartmann,B., Valle,G., Blocker,H., Perez-Alonso,M., Obermaier,B.,
            Delseny,M., Boutry,M., Grivell,L.A., Mache,R., Puigdomenech,P., De
            Simone,V., Choisne,N., Artiguenave,F., Robert,C., Brottier,P.,
            Wincker,P., Cattolico,L., Weissenbach,J., Saurin,W., Quetier,F.,
            Schafer,M., Muller-Auer,S., Gabel,C., Fuchs,M., Benes,V.,
            Wurmbach,E., Drzonek,H., Erfle,H., Jordan,N., Bangert,S.,
            Wiedelmann,R., Kranz,H., Voss,H., Holland,R., Brandt,P.,
            Nyakatura,G., Vezzi,A., D'Angelo,M., Pallavicini,A., Toppo,S.,
            Simionati,B., Conrad,A., Hornischer,K., Kauer,G., Lohnert,T.H.,
            Nordsiek,G., Reichelt,J., Scharfe,M., Schon,O., Bargues,M.,
            Terol,J., Climent,J., Navarro,P., Collado,C., Perez-Perez,A.,
            Ottenwalder,B., Duchemin,D., Cooke,R., Laudie,M., Berger-Llauro,C.,
            Purnelle,B., Masuy,D., de Haan,M., Maarse,A.C., Alcaraz,J.P.,
            Cottet,A., Casacuberta,E., Monfort,A., Argiriou,A., Flores,M.,
            Liguori,R., Vitale,D., Mannhaupt,G., Haase,D., Schoof,H., Rudd,S.,
            Zaccaria,P., Mewes,H.W., Mayer,K.F., Kaul,S., Town,C.D., Koo,H.L.,
            Tallon,L.J., Jenkins,J., Rooney,T., Rizzo,M., Walts,A.,
            Utterback,T., Fujii,C.Y., Shea,T.P., Creasy,T.H., Haas,B.,
            Maiti,R., Wu,D., Peterson,J., Van Aken,S., Pai,G., Militscher,J.,
            Sellers,P., Gill,J.E., Feldblyum,T.V., Preuss,D., Lin,X.,
            Nierman,W.C., Salzberg,S.L., White,O., Venter,J.C., Fraser,C.M.,
            Kaneko,T., Nakamura,Y., Sato,S., Kato,T., Asamizu,E., Sasamoto,S.,
            Kimura,T., Idesawa,K., Kawashima,K., Kishida,Y., Kiyokawa,C.,
            Kohara,M., Matsumoto,M., Matsuno,A., Muraki,A., Nakayama,S.,
            Nakazaki,N., Shinpo,S., Takeuchi,C., Wada,T., Watanabe,A.,
            Yamada,M., Yasuda,M. and Tabata,S.
  CONSRTM   European Union Chromosome 3 Arabidopsis Sequencing Consortium;
            Institute for Genomic Research; Kazusa DNA Research Institute
  TITLE     Sequence and analysis of chromosome 3 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 408 (6814), 820-822 (2000)
   PUBMED   11130713
REFERENCE   2  (bases 1 to 23459830)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 23459830)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="3"
                     /ecotype="Columbia"
     protein         /locus_tag="AT3G20650"
                     /inference="Similar to RNA sequence,
                     EST:INSD:Z46702.1,INSD:EL089705.1,INSD:BP809366.1,
                     INSD:AA585727.1,INSD:DR292211.1,INSD:AU236297.1,
                     INSD:DR292210.1,INSD:EL050615.1,INSD:ES087840.1,
                     INSD:EL268685.1,INSD:DR292212.1,INSD:ES173778.1,
                     INSD:EG499884.1,INSD:ES180381.1,INSD:AU227176.1,
                     INSD:DR292209.1,INSD:DR282792.1,INSD:DR380406.1,
                     INSD:BP634667.1,INSD:EL303103.1,INSD:ES023103.1,
                     INSD:BP777850.1,INSD:AV542995.1,INSD:Z46701.1"
                     /inference="Similar to RNA sequence,
                     mRNA:INSD:BT005804.1,INSD:BX822732.1,INSD:AK228381.1,
                     INSD:BX825779.1,INSD:BT006067.1"
                     /note="mRNA capping enzyme family protein; FUNCTIONS IN:
                     catalytic activity; INVOLVED IN: mRNA capping; LOCATED IN:
                     chloroplast; EXPRESSED IN: 23 plant structures; EXPRESSED
                     DURING: 14 growth stages; CONTAINS InterPro DOMAIN/s: mRNA
                     (guanine-N(7))-methyltransferase (InterPro:IPR016899),
                     mRNA capping enzyme, large subunit (InterPro:IPR004971);
                     BEST Arabidopsis thaliana protein match is:
                     S-adenosyl-L-methionine-dependent methyltransferases
                     superfamily protein (TAIR:AT3G52210.1); Has 916 Blast hits
                     to 903 proteins in 291 species: Archaea - 0; Bacteria - 22;
                     Metazoa - 149; Fungi - 179; Plants - 106; Viruses - 144;
                     Other Eukaryotes - 316 (source: NCBI BLink)."
                     /db_xref="TAIR:AT3G20650"
                     /db_xref="Araport:AT3G20650"
     intron_pos      26:1 (1/12)
     intron_pos      73:0 (2/12)
     intron_pos      96:0 (3/12)
     intron_pos      120:0 (4/12)
     intron_pos      154:0 (5/12)
     intron_pos      173:0 (6/12)
     intron_pos      219:1 (7/12)
     intron_pos      241:0 (8/12)
     intron_pos      258:0 (9/12)
     intron_pos      279:0 (10/12)
     intron_pos      320:1 (11/12)
     intron_pos      341:0 (12/12)
BEGIN
        1 MKRGFSDSPS SSAPPPSSRF KSNPEGDSQF LEDETTKNFA RKVADHYSRR TNQTLEEREA
       61 SPIIHLKKLN NWIKSVLIQL YARPDDAVLD LACGKGGDLI KWDKARIGYY VGIDIAEGSI
      121 EDCRTRYNGD ADHHQRRKKF SFPSRLLCGD CFEVELDKIL EEDAPFDICS CQFAMHYSWT
      181 TEARARRALA NVSALLRPGG VFIGTMPDAN VIIKKLREAE GLEIGNSVYW IRFGEEYSQK
      241 KFKSSSPFGI EYVFHLEDAV DCPEWIVPFN VFKSLAEEYD LELVFVKNSH EFVHEYMKKP
      301 EFVELMRRLG ALGDGSNDQS TLSADEWEAA YLYLSFVLRK RGESDGARRS GRRKNGKMNL
      361 SKDDVLYIDS
//