LOCUS       AEC10033.1               970 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana Insulinase (Peptidase family M16)
            family protein.
ACCESSION   CP002685-6353
PROTEIN_ID  AEC10033.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /locus_tag="AT2G41790"
                     /gene_synonym="T11A7.11"
                     /gene_synonym="T11A7_11"
                     /inference="Similar to RNA sequence,
                     EST:INSD:EG512623.1,INSD:ES181559.1,INSD:AV562337.1,
                     INSD:DR233760.1,INSD:EL106158.1,INSD:EL230783.1,
                     INSD:T44512.1,INSD:EH891838.1,INSD:ES115149.1,
                     INSD:EL076444.1,INSD:EG439465.1,INSD:EH944854.1,
                     INSD:EL104669.1,INSD:AV541578.1,INSD:EL160175.1,
                     INSD:AV555779.1,INSD:ES184184.1,INSD:EH877251.1,
                     INSD:EH860864.1,INSD:EG473109.1,INSD:EG473098.1,
                     INSD:ES177945.1,INSD:EL291249.1,INSD:DR381034.1,
                     INSD:EL260030.1"
                     /inference="similar to RNA sequence, mRNA:INSD:AK226643.1"
                     /note="Insulinase (Peptidase family M16) family protein;
                     FUNCTIONS IN: metalloendopeptidase activity, zinc ion
                     binding, catalytic activity, metal ion binding; INVOLVED
                     IN: proteolysis; LOCATED IN: cellular_component unknown;
                     EXPRESSED IN: 23 plant structures; EXPRESSED DURING: 13
                     growth stages; CONTAINS InterPro DOMAIN/s: Peptidase M16,
                     zinc-binding site (InterPro:IPR001431), Peptidase M16,
                     C-terminal (InterPro:IPR007863), Peptidase M16, N-terminal
                     (InterPro:IPR011765), Metalloenzyme, LuxS/M16
                     peptidase-like, metal-binding (InterPro:IPR011249),
                     Peptidase M16, core (InterPro:IPR011237); BEST Arabidopsis
                     thaliana protein match is: Insulinase (Peptidase family
                     M16) family protein (TAIR:AT3G57470.2); Has 9660 Blast
                     hits to 9541 proteins in 2186 species: Archaea - 9;
                     Bacteria - 6247; Metazoa - 831; Fungi - 633; Plants - 271;
                     Viruses - 3; Other Eukaryotes - 1666 (source: NCBI
                     BLink)."
                     /db_xref="Araport:AT2G41790"
                     /db_xref="TAIR:AT2G41790"
     intron_pos      47:0 (1/25)
     intron_pos      72:1 (2/25)
     intron_pos      95:0 (3/25)
     intron_pos      125:2 (4/25)
     intron_pos      150:1 (5/25)
     intron_pos      165:0 (6/25)
     intron_pos      182:1 (7/25)
     intron_pos      223:1 (8/25)
     intron_pos      261:0 (9/25)
     intron_pos      315:1 (10/25)
     intron_pos      346:1 (11/25)
     intron_pos      375:0 (12/25)
     intron_pos      404:0 (13/25)
     intron_pos      438:2 (14/25)
     intron_pos      473:0 (15/25)
     intron_pos      505:0 (16/25)
     intron_pos      568:1 (17/25)
     intron_pos      589:0 (18/25)
     intron_pos      624:0 (19/25)
     intron_pos      691:1 (20/25)
     intron_pos      761:0 (21/25)
     intron_pos      802:2 (22/25)
     intron_pos      820:0 (23/25)
     intron_pos      849:0 (24/25)
     intron_pos      890:0 (25/25)
BEGIN
        1 MAVEKSNTTV GGVEILKPRT DNREYRMIVL KNLLQVLLIS DPDTDKCAAS MSVSVGSFSD
       61 PQGLEGLAHF LEHMLFYASE KYPEEDSYSK YITEHGGSTN AYTASEETNY HFDVNADCFD
      121 EALDRFAQFF IKPLMSADAT MREIKAVDSE NQKNLLSDGW RIRQLQKHLS KEDHPYHKFS
      181 TGNMDTLHVR PQAKGVDTRS ELIKFYEEHY SANIMHLVVY GKESLDKIQD LVERMFQEIQ
      241 NTNKVVPRFP GQPCTADHLQ ILVKAIPIKQ GHKLGVSWPV TPSIHHYDEA PSQYLGHLIG
      301 HEGEGSLFHA LKTLGWATGL SAGEGEWTLD YSFFKVSIDL TDAGHEHMQE ILGLLFNYIQ
      361 LLQQTGVCQW IFDELSAICE TKFHYQDKIP PMSYIVDIAS NMQIYPTKDW LVGSSLPTKF
      421 NPAIVQKVVD ELSPSNFRIF WESQKFEGQT DKAEPWYNTA YSLEKITSST IQEWVQSAPD
      481 VHLHLPAPNV FIPTDLSLKD ADDKETVPVL LRKTPFSRLW YKPDTMFSKP KAYVKMDFNC
      541 PLAVSSPDAA VLTDIFTRLL MDYLNEYAYY AQVAGLYYGV SLSDNGFELT LLGYNHKLRI
      601 LLETVVGKIA NFEVKPDRFA VIKETVTKEY QNYKFRQPYH QAMYYCSLIL QDQTWPWTEE
      661 LDVLSHLEAE DVAKFVPMLL SRTFIECYIA GNVENNEAES MVKHIEDVLF NDPKPICRPL
      721 FPSQHLTNRV VKLGEGMKYF YHQDGSNPSD ENSALVHYIQ VHRDDFSMNI KLQLFGLVAK
      781 QATFHQLRTV EQLGYITALA QRNDSGIYGV QFIIQSSVKG PGHIDSRVES LLKNFESKLY
      841 EMSNEDFKSN VTALIDMKLE KHKNLKEESR FYWREIQSGT LKFNRKEAEV SALKQLQKQE
      901 LIDFFDEYIK VGAARKKSLS IRVYGSQHLK EMASDKDEVP SPSVEIEDIV GFRKSQPLHG
      961 SFRGCGQPKL
//