LOCUS       AEE77849.1               376 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana Cysteine proteinases superfamily
            protein protein.
ACCESSION   CP002686-5865
PROTEIN_ID  AEE77849.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 23459830)
  AUTHORS   Salanoubat,M., Lemcke,K., Rieger,M., Ansorge,W., Unseld,M.,
            Fartmann,B., Valle,G., Blocker,H., Perez-Alonso,M., Obermaier,B.,
            Delseny,M., Boutry,M., Grivell,L.A., Mache,R., Puigdomenech,P., De
            Simone,V., Choisne,N., Artiguenave,F., Robert,C., Brottier,P.,
            Wincker,P., Cattolico,L., Weissenbach,J., Saurin,W., Quetier,F.,
            Schafer,M., Muller-Auer,S., Gabel,C., Fuchs,M., Benes,V.,
            Wurmbach,E., Drzonek,H., Erfle,H., Jordan,N., Bangert,S.,
            Wiedelmann,R., Kranz,H., Voss,H., Holland,R., Brandt,P.,
            Nyakatura,G., Vezzi,A., D'Angelo,M., Pallavicini,A., Toppo,S.,
            Simionati,B., Conrad,A., Hornischer,K., Kauer,G., Lohnert,T.H.,
            Nordsiek,G., Reichelt,J., Scharfe,M., Schon,O., Bargues,M.,
            Terol,J., Climent,J., Navarro,P., Collado,C., Perez-Perez,A.,
            Ottenwalder,B., Duchemin,D., Cooke,R., Laudie,M., Berger-Llauro,C.,
            Purnelle,B., Masuy,D., de Haan,M., Maarse,A.C., Alcaraz,J.P.,
            Cottet,A., Casacuberta,E., Monfort,A., Argiriou,A., flores,M.,
            Liguori,R., Vitale,D., Mannhaupt,G., Haase,D., Schoof,H., Rudd,S.,
            Zaccaria,P., Mewes,H.W., Mayer,K.F., Kaul,S., Town,C.D., Koo,H.L.,
            Tallon,L.J., Jenkins,J., Rooney,T., Rizzo,M., Walts,A.,
            Utterback,T., Fujii,C.Y., Shea,T.P., Creasy,T.H., Haas,B.,
            Maiti,R., Wu,D., Peterson,J., Van Aken,S., Pai,G., Militscher,J.,
            Sellers,P., Gill,J.E., Feldblyum,T.V., Preuss,D., Lin,X.,
            Nierman,W.C., Salzberg,S.L., White,O., Venter,J.C., Fraser,C.M.,
            Kaneko,T., Nakamura,Y., Sato,S., Kato,T., Asamizu,E., Sasamoto,S.,
            Kimura,T., Idesawa,K., Kawashima,K., Kishida,Y., Kiyokawa,C.,
            Kohara,M., Matsumoto,M., Matsuno,A., Muraki,A., Nakayama,S.,
            Nakazaki,N., Shinpo,S., Takeuchi,C., Wada,T., Watanabe,A.,
            Yamada,M., Yasuda,M. and Tabata,S.
  CONSRTM   European Union Chromosome 3 Arabidopsis Sequencing Consortium;
            Institute for Genomic Research; Kazusa DNA Research Institute
  TITLE     Sequence and analysis of chromosome 3 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 408 (6814), 820-822 (2000)
   PUBMED   11130713
REFERENCE   2  (bases 1 to 23459830)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 23459830)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="3"
                     /ecotype="Columbia"
     protein         /locus_tag="AT3G43960"
                     /inference="Similar to RNA sequence,
                     EST:INSD:T44367.1,INSD:DR264337.1,INSD:DR376486.1,
                     INSD:AI998461.1,INSD:AA721852.1,INSD:DR264332.1,
                     INSD:AU239508.1,INSD:AU230822.1,INSD:EL039522.1,
                     INSD:EL097541.1,INSD:BP816916.1,INSD:DR264333.1,
                     INSD:DR264340.1,INSD:DR264331.1,INSD:DR264335.1,
                     INSD:DR264338.1,INSD:DR264334.1,INSD:DR264336.1,
                     INSD:DR264341.1,INSD:EL204705.1,INSD:ES135191.1,
                     INSD:DR264342.1,INSD:DR264339.1,INSD:ES198725.1"
                     /inference="Similar to RNA sequence,
                     mRNA:INSD:AY087918.1,INSD:AK118634.1"
                     /note="Cysteine proteinases superfamily protein; FUNCTIONS
                     IN: cysteine-type peptidase activity, cysteine-type
                     endopeptidase activity; INVOLVED IN: proteolysis; LOCATED
                     IN: anchored to membrane; EXPRESSED IN: 22 plant
                     structures; EXPRESSED DURING: 13 growth stages; CONTAINS
                     InterPro DOMAIN/s: Peptidase C1A, papain
                     (InterPro:IPR013128), Proteinase inhibitor I29, cathepsin
                     propeptide (InterPro:IPR013201), Peptidase C1A, papain
                     C-terminal (InterPro:IPR000668), Peptidase, cysteine
                     peptidase active site (InterPro:IPR000169); BEST
                     Arabidopsis thaliana protein match is: Cysteine
                     proteinases superfamily protein (TAIR:AT3G19400.1); Has
                     7750 Blast hits to 7646 proteins in 706 species: Archae -
                     41; Bacteria - 178; Metazoa - 3340; Fungi - 4; Plants -
                     1867; Viruses - 137; Other Eukaryotes - 2183 (source: NCBI
                     BLink)."
                     /db_xref="TAIR:AT3G43960"
                     /db_xref="Araport:AT3G43960"
     intron_pos      150:1 (1/3)
     intron_pos      231:0 (2/3)
     intron_pos      277:0 (3/3)
BEGIN
        1 MAISFRTLAL LTLSVLLISI SLGVVTATES QRNEGEVLTM YEQWLVENGK NYNGLGEKER
       61 RFKIFKDNLK RIEEHNSDPN RSYERGLNKF SDLTADEFQA SYLGGKMEKK SLSDVAERYQ
      121 YKEGDVLPDE VDWRERGAVV PRVKRQGECG SCWAFAATGA VEGINQITTG ELVSLSEQEL
      181 IDCDRGNDNF GCAGGGAVWA FEFIKENGGI VSDEVYGYTG EDTAACKAIE MKTTRVVTIN
      241 GHEVVPVNDE MSLKKAVAYQ PISVMISAAN MSDYKSGVYK GACSNLWGDH NVLIVGYGTS
      301 SDEGDYWLIR NSWGPEWGEG GYLRLQRNFH EPTGKCAVAV APVYPIKSNS SSHLLSPSVF
      361 KLVVLFVFQL ISLALL
//