LOCUS       AEE79198.1               235 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana Late embryogenesis abundant (LEA)
            hydroxyproline-rich glycoprotein family protein.
ACCESSION   CP002686-7679
PROTEIN_ID  AEE79198.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 23459830)
  AUTHORS   Salanoubat,M., Lemcke,K., Rieger,M., Ansorge,W., Unseld,M.,
            Fartmann,B., Valle,G., Blocker,H., Perez-Alonso,M., Obermaier,B.,
            Delseny,M., Boutry,M., Grivell,L.A., Mache,R., Puigdomenech,P., De
            Simone,V., Choisne,N., Artiguenave,F., Robert,C., Brottier,P.,
            Wincker,P., Cattolico,L., Weissenbach,J., Saurin,W., Quetier,F.,
            Schafer,M., Muller-Auer,S., Gabel,C., Fuchs,M., Benes,V.,
            Wurmbach,E., Drzonek,H., Erfle,H., Jordan,N., Bangert,S.,
            Wiedelmann,R., Kranz,H., Voss,H., Holland,R., Brandt,P.,
            Nyakatura,G., Vezzi,A., D'Angelo,M., Pallavicini,A., Toppo,S.,
            Simionati,B., Conrad,A., Hornischer,K., Kauer,G., Lohnert,T.H.,
            Nordsiek,G., Reichelt,J., Scharfe,M., Schon,O., Bargues,M.,
            Terol,J., Climent,J., Navarro,P., Collado,C., Perez-Perez,A.,
            Ottenwalder,B., Duchemin,D., Cooke,R., Laudie,M., Berger-Llauro,C.,
            Purnelle,B., Masuy,D., de Haan,M., Maarse,A.C., Alcaraz,J.P.,
            Cottet,A., Casacuberta,E., Monfort,A., Argiriou,A., flores,M.,
            Liguori,R., Vitale,D., Mannhaupt,G., Haase,D., Schoof,H., Rudd,S.,
            Zaccaria,P., Mewes,H.W., Mayer,K.F., Kaul,S., Town,C.D., Koo,H.L.,
            Tallon,L.J., Jenkins,J., Rooney,T., Rizzo,M., Walts,A.,
            Utterback,T., Fujii,C.Y., Shea,T.P., Creasy,T.H., Haas,B.,
            Maiti,R., Wu,D., Peterson,J., Van Aken,S., Pai,G., Militscher,J.,
            Sellers,P., Gill,J.E., Feldblyum,T.V., Preuss,D., Lin,X.,
            Nierman,W.C., Salzberg,S.L., White,O., Venter,J.C., Fraser,C.M.,
            Kaneko,T., Nakamura,Y., Sato,S., Kato,T., Asamizu,E., Sasamoto,S.,
            Kimura,T., Idesawa,K., Kawashima,K., Kishida,Y., Kiyokawa,C.,
            Kohara,M., Matsumoto,M., Matsuno,A., Muraki,A., Nakayama,S.,
            Nakazaki,N., Shinpo,S., Takeuchi,C., Wada,T., Watanabe,A.,
            Yamada,M., Yasuda,M. and Tabata,S.
  CONSRTM   European Union Chromosome 3 Arabidopsis Sequencing Consortium;
            Institute for Genomic Research; Kazusa DNA Research Institute
  TITLE     Sequence and analysis of chromosome 3 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 408 (6814), 820-822 (2000)
   PUBMED   11130713
REFERENCE   2  (bases 1 to 23459830)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 23459830)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="3"
                     /ecotype="Columbia"
     protein         /locus_tag="AT3G54200"
                     /inference="Similar to RNA sequence,
                     EST:INSD:CB255940.1,INSD:BP621914.1,INSD:DR290131.1,
                     INSD:BE523535.1,INSD:EL069234.1,INSD:T21917.1,
                     INSD:AI996410.1,INSD:BX838078.1,INSD:EL990354.1,
                     INSD:ES187239.1,INSD:AV543884.1,INSD:AU228707.1,
                     INSD:EL087799.1,INSD:EL081712.1,INSD:BE528613.1,
                     INSD:EL004489.1,INSD:EL288019.1,INSD:EL081570.1,
                     INSD:EL121260.1,INSD:DR290132.1,INSD:EL238292.1,
                     INSD:CF651526.1,INSD:ES123906.1,INSD:CF651525.1,
                     INSD:AV552328.1,INSD:BP808728.1,INSD:EL194762.1,
                     INSD:BP623532.1,INSD:EL256399.1,INSD:ES146619.1,
                     INSD:AU237627.1,INSD:DR290130.1,INSD:EL167379.1,
                     INSD:EG487961.1,INSD:AV556441.1,INSD:EH924015.1"
                     /inference="Similar to RNA sequence,
                     mRNA:INSD:AY085665.1,INSD:AK229134.1,INSD:BX825919.1,
                     INSD:BX826211.1,INSD:BX825887.1,INSD:BX825406.1"
                     /note="Late embryogenesis abundant (LEA)
                     hydroxyproline-rich glycoprotein family; FUNCTIONS IN:
                     molecular_function unknown; INVOLVED IN:
                     biological_process unknown; LOCATED IN: anchored to plasma
                     membrane, plasma membrane; EXPRESSED IN: 23 plant
                     structures; EXPRESSED DURING: 14 growth stages; CONTAINS
                     InterPro DOMAIN/s: Late embryogenesis abundant protein,
                     group 2 (InterPro:IPR004864); BEST Arabidopsis thaliana
                     protein match is: Late embryogenesis abundant (LEA)
                     hydroxyproline-rich glycoprotein family
                     (TAIR:AT3G05975.1); Has 631 Blast hits to 630 proteins in
                     23 species: Archae - 0; Bacteria - 0; Metazoa - 0; Fungi -
                     0; Plants - 631; Viruses - 0; Other Eukaryotes - 0
                     (source: NCBI BLink)."
                     /db_xref="TAIR:AT3G54200"
                     /db_xref="Araport:AT3G54200"
BEGIN
        1 MSDFSIKPDD KKEEEKPATA MLPPPKPNAS SMETQSANTG TAKKLRRKRN CKICICFTIL
       61 LILLIAIVIV ILAFTLFKPK RPTTTIDSVT VDRLQASVNP LLLKVLLNLT LNVDLSLKNP
      121 NRIGFSYDSS SALLNYRGQV IGEAPLPANR IAARKTVPLN ITLTLMADRL LSETQLLSDV
      181 MAGVIPLNTF VKVTGKVTVL KIFKIKVQSS SSCDLSISVS DRNVTSQHCK YSTKL
//