LOCUS       AEC09074.1               579 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana Trypsin family protein protein.
ACCESSION   CP002685-5046
PROTEIN_ID  AEC09074.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /locus_tag="AT2G35155"
                     /inference="Similar to RNA sequence,
                     EST:INSD:EG463140.1,INSD:AV825453.1,INSD:EG463207.1,
                     INSD:EH968876.1,INSD:EL993415.1,INSD:ES163107.1,
                     INSD:AV803836.1,INSD:EL036053.1,INSD:ES192527.1,
                     INSD:AI999157.1,INSD:BP778459.1,INSD:AV791321.1,
                     INSD:EL128075.1,INSD:AV795686.1,INSD:BX841041.1"
                     /inference="similar to RNA sequence,
                     mRNA:INSD:BX819153.1,INSD:AY059774.1,INSD:AY150434.1,
                     INSD:BX820331.1"
                     /note="Trypsin family protein; FUNCTIONS IN: catalytic
                     activity; INVOLVED IN: biological_process unknown; LOCATED
                     IN: cellular_component unknown; EXPRESSED IN: 22 plant
                     structures; EXPRESSED DURING: 13 growth stages; CONTAINS
                     InterPro DOMAIN/s: Serine/cysteine peptidase, trypsin-like
                     (InterPro:IPR009003); BEST Arabidopsis thaliana protein
                     match is: Trypsin family protein (TAIR:AT5G45030.2); Has
                     136 Blast hits to 136 proteins in 33 species: Archae - 0;
                     Bacteria - 53; Metazoa - 0; Fungi - 2; Plants - 81;
                     Viruses - 0; Other Eukaryotes - 0 (source: NCBI BLink)."
                     /db_xref="Araport:AT2G35155"
                     /db_xref="TAIR:AT2G35155"
     intron_pos      169:0 (1/4)
     intron_pos      217:0 (2/4)
     intron_pos      297:1 (3/4)
     intron_pos      464:1 (4/4)
BEGIN
        1 MNLGAWGQRF IQAAASSESE DSALDLERNH HCNHLSLPSS SSPSPLQPFT LNIQHAESNA
       61 PYFSWPTLSR LNDTVEDRAN YFGNLQKGVL PETVGRLPSG QQATTLLELM TIRAFHSKIL
      121 RRFSLGTAVG FRISRGVLTN VPAILVFVAR KVHRQWLNPM QCLPSALEGP GGVWCDVDVV
      181 EFQYYGAPAA TPKEQVYNEL VDGLRGSDPC IGSGSQVASQ ETYGTLGAIV KSRTGNHQVG
      241 FLTNRHVAVD LDYPSQKMFH PLPPSLGPGV YLGAVERATS FITDDQWYGI FAGTNPETFV
      301 RADGAFIPFA EDFNTSNVTT LIKGIGEIGD VHVIDLQSPI DSLIGKQVVK VGRSSGYTTG
      361 TIMAYALEYN DEKGICFLTD FLVIGENQQT FDLEGDSGSL ILLTGPNGQK PRPVGIIWGG
      421 TANRGRLKLI AGQEPENWTS GVDLGRLLDL LELDLITSNH ELEAAAAARE ERNTSVTALD
      481 STVSQSSPPD PVPSGDKQDE SFEPFIPPEF HIEEAIKPTL EVEEHIFIAP ISVNESTSAI
      541 KGQEIPKLDN LMALKNSSEE EVNISLHLGE PKLKKPKFF
//