LOCUS       AEE76201.1              1080 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana presequence protease 1 protein.
ACCESSION   CP002686-3583
PROTEIN_ID  AEE76201.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 23459830)
  AUTHORS   Salanoubat,M., Lemcke,K., Rieger,M., Ansorge,W., Unseld,M.,
            Fartmann,B., Valle,G., Blocker,H., Perez-Alonso,M., Obermaier,B.,
            Delseny,M., Boutry,M., Grivell,L.A., Mache,R., Puigdomenech,P., De
            Simone,V., Choisne,N., Artiguenave,F., Robert,C., Brottier,P.,
            Wincker,P., Cattolico,L., Weissenbach,J., Saurin,W., Quetier,F.,
            Schafer,M., Muller-Auer,S., Gabel,C., Fuchs,M., Benes,V.,
            Wurmbach,E., Drzonek,H., Erfle,H., Jordan,N., Bangert,S.,
            Wiedelmann,R., Kranz,H., Voss,H., Holland,R., Brandt,P.,
            Nyakatura,G., Vezzi,A., D'Angelo,M., Pallavicini,A., Toppo,S.,
            Simionati,B., Conrad,A., Hornischer,K., Kauer,G., Lohnert,T.H.,
            Nordsiek,G., Reichelt,J., Scharfe,M., Schon,O., Bargues,M.,
            Terol,J., Climent,J., Navarro,P., Collado,C., Perez-Perez,A.,
            Ottenwalder,B., Duchemin,D., Cooke,R., Laudie,M., Berger-Llauro,C.,
            Purnelle,B., Masuy,D., de Haan,M., Maarse,A.C., Alcaraz,J.P.,
            Cottet,A., Casacuberta,E., Monfort,A., Argiriou,A., flores,M.,
            Liguori,R., Vitale,D., Mannhaupt,G., Haase,D., Schoof,H., Rudd,S.,
            Zaccaria,P., Mewes,H.W., Mayer,K.F., Kaul,S., Town,C.D., Koo,H.L.,
            Tallon,L.J., Jenkins,J., Rooney,T., Rizzo,M., Walts,A.,
            Utterback,T., Fujii,C.Y., Shea,T.P., Creasy,T.H., Haas,B.,
            Maiti,R., Wu,D., Peterson,J., Van Aken,S., Pai,G., Militscher,J.,
            Sellers,P., Gill,J.E., Feldblyum,T.V., Preuss,D., Lin,X.,
            Nierman,W.C., Salzberg,S.L., White,O., Venter,J.C., Fraser,C.M.,
            Kaneko,T., Nakamura,Y., Sato,S., Kato,T., Asamizu,E., Sasamoto,S.,
            Kimura,T., Idesawa,K., Kawashima,K., Kishida,Y., Kiyokawa,C.,
            Kohara,M., Matsumoto,M., Matsuno,A., Muraki,A., Nakayama,S.,
            Nakazaki,N., Shinpo,S., Takeuchi,C., Wada,T., Watanabe,A.,
            Yamada,M., Yasuda,M. and Tabata,S.
  CONSRTM   European Union Chromosome 3 Arabidopsis Sequencing Consortium;
            Institute for Genomic Research; Kazusa DNA Research Institute
  TITLE     Sequence and analysis of chromosome 3 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 408 (6814), 820-822 (2000)
   PUBMED   11130713
REFERENCE   2  (bases 1 to 23459830)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 23459830)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="3"
                     /ecotype="Columbia"
     protein         /gene="PREP1"
                     /locus_tag="AT3G19170"
                     /gene_synonym="ATPREP1"
                     /gene_synonym="ATZNMP"
                     /gene_synonym="presequence protease 1"
                     /inference="Similar to RNA sequence,
                     EST:INSD:H36243.1,INSD:BX836142.1,INSD:ES043114.1,
                     INSD:EH830848.1,INSD:ES190429.1,INSD:EH990006.1,
                     INSD:EL097116.1,INSD:BP606677.1,INSD:EL213161.1,
                     INSD:EH827429.1,INSD:EL101242.1,INSD:AV528916.1,
                     INSD:EH799953.1,INSD:EL249634.1,INSD:ES176517.1,
                     INSD:AV523448.1,INSD:AV809299.1,INSD:AV523419.1,
                     INSD:AV528942.1,INSD:BP618402.1,INSD:BP659370.1,
                     INSD:BP618190.1,INSD:EG445696.1,INSD:EG469572.1,
                     INSD:AA713104.1,INSD:EL989402.1,INSD:EL991595.1,
                     INSD:EL257628.1,INSD:BP816853.1,INSD:EH898640.1,
                     INSD:EG445610.1,INSD:EL183680.1,INSD:EL131153.1,
                     INSD:EH962962.1,INSD:AV523274.1,INSD:BP652065.1,
                     INSD:EG426319.1,INSD:AV523158.1,INSD:EG476897.1,
                     INSD:EH872744.1,INSD:AV547903.1,INSD:AV831408.1,
                     INSD:BP640238.1,INSD:BP810479.2,INSD:EL115680.1,
                     INSD:EH873050.1,INSD:ES051808.1,INSD:EL065762.1,
                     INSD:AV550604.1,INSD:EH846555.1,INSD:EL319034.1,
                     INSD:EH799364.1,INSD:EL286103.1,INSD:ES152228.1,
                     INSD:EH805559.1,INSD:BP607446.1,INSD:EL255373.1,
                     INSD:AV529086.1,INSD:AV828839.1,INSD:CB261206.1,
                     INSD:BP807564.1,INSD:BP855278.1,INSD:BP645635.1,
                     INSD:BP598231.1,INSD:EG476908.1,INSD:EG481853.1,
                     INSD:EL082155.1,INSD:EG481808.1,INSD:EG525844.1,
                     INSD:EG426308.1,INSD:BP814761.1,INSD:EG525833.1,
                     INSD:AV803014.1,INSD:EL119292.1,INSD:EL986641.1,
                     INSD:EL143898.1,INSD:AV815988.1,INSD:EG445607.1,
                     INSD:EH832380.1,INSD:EL015168.1,INSD:AV523294.1,
                     INSD:EL214183.1,INSD:EL042307.1,INSD:EL135654.1,
                     INSD:EG481842.1,INSD:AV818366.1,INSD:EH947620.1,
                     INSD:EG445695.1,INSD:EH903115.1,INSD:EL172866.1,
                     INSD:BP613458.1,INSD:AV526607.1,INSD:EG469571.1,
                     INSD:EL226036.1,INSD:EL260034.1,INSD:DR355017.1,
                     INSD:AV528774.1,INSD:BU635291.1,INSD:AV547714.1,
                     INSD:EH918719.1,INSD:AV806003.1"
                     /inference="Similar to RNA sequence,
                     mRNA:INSD:AY091051.1,INSD:BT006362.1,INSD:AY090240.1,
                     INSD:BT002372.1"
                     /note="presequence protease 1 (PREP1); FUNCTIONS IN:
                     metalloendopeptidase activity; INVOLVED IN: response to
                     cadmium ion, proteolysis, protein maturation by peptide
                     bond cleavage; LOCATED IN: mitochondrion, apoplast,
                     chloroplast stroma, chloroplast, chloroplast envelope;
                     EXPRESSED IN: 26 plant structures; EXPRESSED DURING: 13
                     growth stages; CONTAINS InterPro DOMAIN/s: Peptidase M16,
                     C-terminal (InterPro:IPR007863), Peptidase M16C associated
                     (InterPro:IPR013578), Peptidase M16, N-terminal
                     (InterPro:IPR011765), Metalloenzyme, LuxS/M16
                     peptidase-like, metal-binding (InterPro:IPR011249),
                     Peptidase M16, core (InterPro:IPR011237); BEST Arabidopsis
                     thaliana protein match is: presequence protease 2
                     (TAIR:AT1G49630.2); Has 4222 Blast hits to 4196 proteins
                     in 1321 species: Archae - 9; Bacteria - 2812; Metazoa -
                     224; Fungi - 268; Plants - 81; Viruses - 0; Other
                     Eukaryotes - 828 (source: NCBI BLink)."
                     /db_xref="TAIR:AT3G19170"
                     /db_xref="Araport:AT3G19170"
     intron_pos      96:1 (1/18)
     intron_pos      154:2 (2/18)
     intron_pos      213:0 (3/18)
     intron_pos      257:1 (4/18)
     intron_pos      281:0 (5/18)
     intron_pos      309:0 (6/18)
     intron_pos      339:1 (7/18)
     intron_pos      513:0 (8/18)
     intron_pos      568:0 (9/18)
     intron_pos      641:0 (10/18)
     intron_pos      683:2 (11/18)
     intron_pos      747:0 (12/18)
     intron_pos      775:0 (13/18)
     intron_pos      807:2 (14/18)
     intron_pos      896:0 (15/18)
     intron_pos      950:1 (16/18)
     intron_pos      1010:2 (17/18)
     intron_pos      1034:2 (18/18)
BEGIN
        1 MLRTVSCLAS RSSSSLFFRF FRQFPRSYMS LTSSTAALRV PSRNLRRISS PSVAGRRLLL
       61 RRGLRIPSAA VRSVNGQFSR LSVRAVATQP APLYPDVGQD EAEKLGFEKV SEEFISECKS
      121 KAILFKHKKT GCEVMSVSNE DENKVFGVVF RTPPKDSTGI PHILEHSVLC GSRKYPVKEP
      181 FVELLKGSLH TFLNAFTYPD RTCYPVASTN TKDFYNLVDV YLDAVFFPKC VDDAHTFQQE
      241 GWHYELNDPS EDISYKGVVF NEMKGVYSQP DNILGRIAQQ ALSPENTYGV DSGGDPKDIP
      301 NLTFEEFKEF HRQYYHPSNA RIWFYGDDDP VHRLRVLSEY LDMFEASPSP NSSKIKFQKL
      361 FSEPVRLVEK YPAGRDGDLK KKHMLCVNWL LSEKPLDLQT QLALGFLDHL MLGTPASPLR
      421 KILLESGLGE ALVSSGLSDE LLQPQFGIGL KGVSEENVQK VEELIMDTLK KLAEEGFDND
      481 AVEASMNTIE FSLRENNTGS FPRGLSLMLQ SISKWIYDMD PFEPLKYTEP LKALKTRIAE
      541 EGSKAVFSPL IEKLILNNSH RVTIEMQPDP EKATQEEVEE KNILEKVKAA MTEEDLAELA
      601 RATEELKLKQ ETPDPPEALR CVPSLNLGDI PKEPTYVPTE VGDINGVKVL RHDLFTNDII
      661 YTEVVFDIGS LKHELLPLVP LFCQSLLEMG TKDLTFVQLN QLIGRKTGGI SVYPLTSSVR
      721 GKDEPCSKII VRGKSMAGRA DDLFNLMNCL LQEVQFTDQQ RFKQFVSQSR ARMENRLRGS
      781 GHGIAAARMD AMLNIAGWMS EQMGGLSYLE FLHTLEKKVD EDWEGISSSL EEIRRSLLAR
      841 NGCIVNMTAD GKSLTNVEKS VAKFLDLLPE NPSGGLVTWD GRLPLRNEAI VIPTQVNYVG
      901 KAGNIYSTGY ELDGSAYVIS KHISNTWLWD RVRVSGGAYG GFCDFDSHSG VFSYLSYRDP
      961 NLLKTLDIYD GTGDFLRGLD VDQETLTKAI IGTIGDVDSY QLPDAKGYSS LLRHLLGVTD
     1021 EERQRKREEI LTTSLKDFKD FAQAIDVVRD KGVAVAVASA EDIDAANNER SNFFEVKKAL
//