LOCUS       AEE78022.1               357 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana Cysteine proteinases superfamily
            protein.
ACCESSION   CP002686-6114
PROTEIN_ID  AEE78022.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 23459830)
  AUTHORS   Salanoubat,M., Lemcke,K., Rieger,M., Ansorge,W., Unseld,M.,
            Fartmann,B., Valle,G., Blocker,H., Perez-Alonso,M., Obermaier,B.,
            Delseny,M., Boutry,M., Grivell,L.A., Mache,R., Puigdomenech,P., De
            Simone,V., Choisne,N., Artiguenave,F., Robert,C., Brottier,P.,
            Wincker,P., Cattolico,L., Weissenbach,J., Saurin,W., Quetier,F.,
            Schafer,M., Muller-Auer,S., Gabel,C., Fuchs,M., Benes,V.,
            Wurmbach,E., Drzonek,H., Erfle,H., Jordan,N., Bangert,S.,
            Wiedelmann,R., Kranz,H., Voss,H., Holland,R., Brandt,P.,
            Nyakatura,G., Vezzi,A., D'Angelo,M., Pallavicini,A., Toppo,S.,
            Simionati,B., Conrad,A., Hornischer,K., Kauer,G., Lohnert,T.H.,
            Nordsiek,G., Reichelt,J., Scharfe,M., Schon,O., Bargues,M.,
            Terol,J., Climent,J., Navarro,P., Collado,C., Perez-Perez,A.,
            Ottenwalder,B., Duchemin,D., Cooke,R., Laudie,M., Berger-Llauro,C.,
            Purnelle,B., Masuy,D., de Haan,M., Maarse,A.C., Alcaraz,J.P.,
            Cottet,A., Casacuberta,E., Monfort,A., Argiriou,A., Flores,M.,
            Liguori,R., Vitale,D., Mannhaupt,G., Haase,D., Schoof,H., Rudd,S.,
            Zaccaria,P., Mewes,H.W., Mayer,K.F., Kaul,S., Town,C.D., Koo,H.L.,
            Tallon,L.J., Jenkins,J., Rooney,T., Rizzo,M., Walts,A.,
            Utterback,T., Fujii,C.Y., Shea,T.P., Creasy,T.H., Haas,B.,
            Maiti,R., Wu,D., Peterson,J., Van Aken,S., Pai,G., Militscher,J.,
            Sellers,P., Gill,J.E., Feldblyum,T.V., Preuss,D., Lin,X.,
            Nierman,W.C., Salzberg,S.L., White,O., Venter,J.C., Fraser,C.M.,
            Kaneko,T., Nakamura,Y., Sato,S., Kato,T., Asamizu,E., Sasamoto,S.,
            Kimura,T., Idesawa,K., Kawashima,K., Kishida,Y., Kiyokawa,C.,
            Kohara,M., Matsumoto,M., Matsuno,A., Muraki,A., Nakayama,S.,
            Nakazaki,N., Shinpo,S., Takeuchi,C., Wada,T., Watanabe,A.,
            Yamada,M., Yasuda,M. and Tabata,S.
  CONSRTM   European Union Chromosome 3 Arabidopsis Sequencing Consortium;
            Institute for Genomic Research; Kazusa DNA Research Institute
  TITLE     Sequence and analysis of chromosome 3 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 408 (6814), 820-822 (2000)
   PUBMED   11130713
REFERENCE   2  (bases 1 to 23459830)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 23459830)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="3"
                     /ecotype="Columbia"
     protein         /locus_tag="AT3G45310"
                     /inference="Similar to RNA sequence,
                     EST:INSD:EL996201.1,INSD:Z30859.1,INSD:R90500.1,
                     INSD:T45255.1,INSD:EL071759.1,INSD:EG439763.1,
                     INSD:EL010249.1,INSD:T88043.1,INSD:T45293.1,
                     INSD:AV553227.1,INSD:AV831219.1,INSD:DR216931.1,
                     INSD:AV442597.1,INSD:H76998.1,INSD:AV551895.1,
                     INSD:BP798494.1,INSD:N97010.1,INSD:AV823103.1,
                     INSD:EL006316.1,INSD:EL195492.1,INSD:BU635243.1,
                     INSD:BP590573.1,INSD:H76621.1,INSD:AV553931.1,
                     INSD:EH976726.1,INSD:CA781230.1,INSD:EL094269.1"
                     /note="Cysteine proteinases superfamily protein; FUNCTIONS
                     IN: cysteine-type endopeptidase activity, cysteine-type
                     peptidase activity; INVOLVED IN: proteolysis; LOCATED IN:
                     endomembrane system; EXPRESSED IN: 22 plant structures;
                     EXPRESSED DURING: 13 growth stages; CONTAINS InterPro
                     DOMAIN/s: Peptidase C1A, papain (InterPro:IPR013128),
                     Proteinase inhibitor I29, cathepsin propeptide
                     (InterPro:IPR013201), Peptidase C1A, papain C-terminal
                     (InterPro:IPR000668), Peptidase, cysteine peptidase active
                     site (InterPro:IPR000169); BEST Arabidopsis thaliana
                     protein match is: aleurain-like protease
                     (TAIR:AT5G60360.2); Has 35333 Blast hits to 34131 proteins
                     in 2444 species: Archaea - 798; Bacteria - 22429; Metazoa -
                     974; Fungi - 991; Plants - 531; Viruses - 0; Other
                     Eukaryotes - 9610 (source: NCBI BLink)."
                     /db_xref="TAIR:AT3G45310"
                     /db_xref="Araport:AT3G45310"
     intron_pos      65:2 (1/7)
     intron_pos      106:1 (2/7)
     intron_pos      145:0 (3/7)
     intron_pos      169:2 (4/7)
     intron_pos      258:0 (5/7)
     intron_pos      302:0 (6/7)
     intron_pos      346:1 (7/7)
BEGIN
        1 MSVKLNLSSS ILLILFAAAA SKEIGFDESN PIKMVSDNLH ELEDTVVQIL GQSRHVLSFS
       61 RFTHRYGKKY QSVEEMKLRF SVFKENLDLI RSTNKKGLSY KLSLNQFADL TWQEFQRYKL
      121 GAAQNCSATL KGSHKITEAT VPDTKDWRED GIVSPVKEQG HCGSCWTFST TGALEAAYHQ
      181 AFGKGISLSE QQLVDCAGTF NNFGCHGGLP SQAFEYIKYN GGLDTEEAYP YTGKDGGCKF
      241 SAKNIGVQVR DSVNITLGAE DELKHAVGLV RPVSVAFEVV HEFRFYKKGV FTSNTCGNTP
      301 MDVNHAVLAV GYGVEDDVPY WLIKNSWGGE WGDNGYFKME MGKNMCVATC SSYPVVA
//