LOCUS       AEC10342.1              1316 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana Endonuclease/exonuclease/phosphatase
            family protein.
ACCESSION   CP002685-6776
PROTEIN_ID  AEC10342.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /gene="5PTase12"
                     /locus_tag="AT2G43900"
                     /gene_synonym="F6E13.3"
                     /gene_synonym="inositol-polyphosphate 5-phosphatase 12"
                     /inference="similar to RNA sequence,
                     EST:INSD:AV785870.1,INSD:EH975168.1,INSD:EL306267.1,
                     INSD:ES036208.1,INSD:EH948051.1,INSD:BX839129.1,
                     INSD:EL219463.1,INSD:EH867586.1,INSD:AV824367.1"
                     /inference="similar to RNA sequence,
                     mRNA:INSD:AY080628.1,INSD:AY761187.1"
                     /note="Endonuclease/exonuclease/phosphatase family
                     protein; FUNCTIONS IN: inositol-polyphosphate
                     5-phosphatase activity, inositol or phosphatidylinositol
                     phosphatase activity; INVOLVED IN: biological_process
                     unknown; LOCATED IN: CUL4 RING ubiquitin ligase complex;
                     EXPRESSED IN: sperm cell, male gametophyte, flower,
                     cultured cell, pollen tube; EXPRESSED DURING: L mature
                     pollen stage, M germinated pollen stage, 4 anthesis;
                     CONTAINS InterPro DOMAIN/s: WD40 repeat-like-containing
                     domain (InterPro:IPR011046), Inositol polyphosphate
                     related phosphatase (InterPro:IPR000300), WD40/YVTN
                     repeat-like-containing domain (InterPro:IPR015943), WD40
                     repeat (InterPro:IPR001680),
                     Endonuclease/exonuclease/phosphatase (InterPro:IPR005135);
                     BEST Arabidopsis thaliana protein match is:
                     Endonuclease/exonuclease/phosphatase family protein
                     (TAIR:AT1G05630.2); Has 8064 Blast hits to 7016 proteins
                     in 490 species: Archaea - 18; Bacteria - 518; Metazoa -
                     2458; Fungi - 805; Plants - 729; Viruses - 32; Other
                     Eukaryotes - 3504 (source: NCBI BLink)."
                     /db_xref="Araport:AT2G43900"
                     /db_xref="TAIR:AT2G43900"
     intron_pos      278:1 (1/10)
     intron_pos      362:2 (2/10)
     intron_pos      632:0 (3/10)
     intron_pos      674:2 (4/10)
     intron_pos      703:0 (5/10)
     intron_pos      758:1 (6/10)
     intron_pos      772:0 (7/10)
     intron_pos      861:1 (8/10)
     intron_pos      902:2 (9/10)
     intron_pos      1023:0 (10/10)
BEGIN
        1 MDIINNNHRD ENDDDEEEAL SAMSSVPPPR KIHSYSHQLR ATGQKGHHRQ RQHSLDDIPK
       61 ITEIVSGCGI SGDSSDDEFY PYATTTNSSS FPFTGGDTGD SDDYLHQPEI GEDFQPLPEF
      121 VGSGGGVGMF KVPTRSPLHS ARPPCLELRP HPLKETQVGR FLRNIACTET QLWAGQESGV
      181 RFWNFDDAFE PGCGLSGRVQ RGDEDAAPFQ ESASTSPTTC LMVDNGNRLV WSGHKDGKIR
      241 SWKMDYVLDD GDDSPFKEGL AWQAHKGPVN SVIMSSYGDL WSCSEGGVIK IWTWESMEKS
      301 LSLRLEEKHM AALLVERSGI DLRAQVTVNG TCNISSSEVK CLLADNVRSK VWAAQLQTFS
      361 LWDGRTKELL KVFNSEGQTE NRVDMPLGQD QPAAEDEMKA KIASTSKKEK PHGFLQRSRN
      421 AIMGAADAVR RVATRGGGAY EDAKRTEAMV LAGDGMIWTG CTNGLLIQWD GNGNRLQDFR
      481 HHQCAVLCFC TFGERIYIGY VSGHIQIIDL EGNLIAGWVA HNNAVIKMAA ADGYIFSLAT
      541 HGGIRGWPVI SPGPLDGIIR SELAEKERTY AQTDSVRILT GSWNVGQGKA SHDALMSWLG
      601 SVASDVGILV VGLQEVEMGA GFLAMSAAKE SVGGNEGSTI GQYWIDTIGK TLDEKAVFER
      661 MGSRQLAGLL ISLWVRKNLR THVGDIDVAA VPCGFGRAIG NKGGVGLRIR VFDRIMCFIN
      721 CHLAAHLEAV NRRNADFDHI YKTMSFTRSS NAHNAPAAGV STGSHTTKSA NNANVNTEET
      781 KQDLAEADMV VFFGDFNYRL FGISYDEARD FVSQRSFDWL REKDQLRAEM KAGRVFQGMR
      841 EAIITFPPTY KFERHRPGLG GYDSGEKKRI PAWCDRVIFR DTRTSPESEC SLDCPVVASI
      901 MLYDACMDVT ESDHKPVRCK FHVKIEHVDR SVRRQEFGRI IKTNEKVRAL LNDLRYVPET
      961 IVSSNSIVLQ NQDTFVLRIT NKCVKENAVF RILCEGQSTV REDEDTLELH PLGSFGFPRW
     1021 LEVMPAAGTI KPDSSVEVSV HHEEFHTLEE FVDGIPQNWW CEDTRDKEAI LVVNVQGGCS
     1081 TETVCHRVHV RHCFSAKNLR IDSNPSNSKS QSLKKNEGDS NSKSSKKSDG DSNSKSSKKS
     1141 DGDSNSKSSK KSDGDSNSKS SKKSDGDSNS KSSKKSDGDS NSKSSKKSDG DSNSKSSKKS
     1201 DGDSCSKSQK KSDGDTNSKS QKKGDGDSSS KSHKKNDGDS SSKSHKKNDG DSSSKSHKKS
     1261 DGDSSSKSHK KSEGDSSSKS HKKNDGDSSS SYKSQSGKKN SNSSTVEESR NNHNKR
//