LOCUS       AEC06532.1               848 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana glycosyl hydrolase family 35 protein.
ACCESSION   CP002685-1546
PROTEIN_ID  AEC06532.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /locus_tag="AT2G16730"
                     /gene_synonym="beta-galactosidase 13"
                     /gene_synonym="BGAL13"
                     /gene_synonym="T24I21.14"
                     /gene_synonym="T24I21_14"
                     /inference="similar to RNA sequence,
                     EST:INSD:AU228003.1,INSD:BP562897.2"
                     /inference="similar to RNA sequence,
                     mRNA:INSD:BT004177.1,INSD:AJ270309.1"
                     /note="glycosyl hydrolase family 35 protein; FUNCTIONS IN:
                     beta-galactosidase activity; INVOLVED IN: lactose
                     catabolic process, using glucoside 3-dehydrogenase,
                     carbohydrate metabolic process, lactose catabolic process
                     via UDP-galactose, lactose catabolic process; LOCATED IN:
                     endomembrane system; EXPRESSED IN: 14 plant structures;
                     EXPRESSED DURING: L mature pollen stage, M germinated
                     pollen stage, 4 anthesis, C globular stage, petal
                     differentiation and expansion stage; CONTAINS InterPro
                     DOMAIN/s: Glycoside hydrolase, family 35, conserved site
                     (InterPro:IPR019801), Glycoside hydrolase family 2,
                     carbohydrate-binding (InterPro:IPR006104), Glycoside
                     hydrolase, family 35 (InterPro:IPR001944),
                     D-galactoside/L-rhamnose binding SUEL lectin
                     (InterPro:IPR000922), Glycoside hydrolase, catalytic core
                     (InterPro:IPR017853), Glycoside hydrolase, subgroup,
                     catalytic core (InterPro:IPR013781), Galactose-binding
                     domain-like (InterPro:IPR008979); BEST Arabidopsis
                     thaliana protein match is: beta-galactosidase 11
                     (TAIR:AT4G35010.1); Has 2592 Blast hits to 2188 proteins
                     in 502 species: Archaea - 15; Bacteria - 1202; Metazoa -
                     413; Fungi - 220; Plants - 636; Viruses - 0; Other
                     Eukaryotes - 106 (source: NCBI BLink)."
                     /db_xref="Araport:AT2G16730"
                     /db_xref="TAIR:AT2G16730"
     intron_pos      74:0 (1/17)
     intron_pos      106:0 (2/17)
     intron_pos      143:2 (3/17)
     intron_pos      166:0 (4/17)
     intron_pos      197:0 (5/17)
     intron_pos      245:0 (6/17)
     intron_pos      276:2 (7/17)
     intron_pos      312:0 (8/17)
     intron_pos      340:1 (9/17)
     intron_pos      380:0 (10/17)
     intron_pos      436:0 (11/17)
     intron_pos      494:2 (12/17)
     intron_pos      531:1 (13/17)
     intron_pos      568:0 (14/17)
     intron_pos      605:0 (15/17)
     intron_pos      640:0 (16/17)
     intron_pos      805:0 (17/17)
BEGIN
        1 MKIHSSDHSW LLLAVLVILL SFSGALSSDD KEKKTKSVDK KKEVTYDGTS LIINGNRELL
       61 YSGSIHYPRS TPEMWPNIIK RAKQGGLNTI QTYVFWNVHE PEQGKFNFSG RADLVKFIKL
      121 IEKNGLYVTL RLGPFIQAEW THGGLPYWLR EVPGIFFRTD NEPFKEHTER YVKVVLDMMK
      181 EEKLFASQGG PIILGQIENE YSAVQRAYKE DGLNYIKWAS KLVHSMDLGI PWVMCKQNDA
      241 PDPMINACNG RHCGDTFPGP NKDNKPSLWT ENWTTQFRVF GDPPAQRSVE DIAYSVARFF
      301 SKNGTHVNYY MYHGGTNFGR TSAHYVTTRY YDDAPLDEFG LEREPKYGHL KHLHNALNLC
      361 KKALLWGQPR VEKPSNETEI RYYEQPGTKV CAAFLANNNT EAAEKIKFRG KEYLIPHRSI
      421 SILPDCKTVV YNTGEIISHH TSRNFMKSKK ANKNFDFKVF TESVPSKIKG DSFIPVELYG
      481 LTKDESDYGW YTTSFKIDDN DLSKKKGGKP NLRIASLGHA LHVWLNGEYL GNGHGSHEEK
      541 SFVFQKPVTL KEGENHLTML GVLTGFPDSG SYMEHRYTGP RSVSILGLGS GTLDLTEENK
      601 WGNKVGMEGE RLGIHAEEGL KKVKWEKASG KEPGMTWYQT YFDAPESQSA AAIRMNGMGK
      661 GLIWVNGEGV GRYWMSFLSP LGQPTQIEYH IPRSFLKPKK NLLVIFEEEP NVKPELIDFV
      721 IVNRDTVCSY IGENYTPSVR HWTRKNDQVQ AITDDVHLTA NLKCSGTKKI SAVEFASFGN
      781 PNGTCGNFTL GSCNAPVSKK VVEKYCLGKA ECVIPVNKST FEQDKKDSCP KVEKKLAVQV
      841 KCGRDKKN
//