LOCUS       AEE79230.1              1107 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana glycoside hydrolase family 2 protein.
ACCESSION   CP002686-7722
PROTEIN_ID  AEE79230.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 23459830)
  AUTHORS   Salanoubat,M., Lemcke,K., Rieger,M., Ansorge,W., Unseld,M.,
            Fartmann,B., Valle,G., Blocker,H., Perez-Alonso,M., Obermaier,B.,
            Delseny,M., Boutry,M., Grivell,L.A., Mache,R., Puigdomenech,P., De
            Simone,V., Choisne,N., Artiguenave,F., Robert,C., Brottier,P.,
            Wincker,P., Cattolico,L., Weissenbach,J., Saurin,W., Quetier,F.,
            Schafer,M., Muller-Auer,S., Gabel,C., Fuchs,M., Benes,V.,
            Wurmbach,E., Drzonek,H., Erfle,H., Jordan,N., Bangert,S.,
            Wiedelmann,R., Kranz,H., Voss,H., Holland,R., Brandt,P.,
            Nyakatura,G., Vezzi,A., D'Angelo,M., Pallavicini,A., Toppo,S.,
            Simionati,B., Conrad,A., Hornischer,K., Kauer,G., Lohnert,T.H.,
            Nordsiek,G., Reichelt,J., Scharfe,M., Schon,O., Bargues,M.,
            Terol,J., Climent,J., Navarro,P., Collado,C., Perez-Perez,A.,
            Ottenwalder,B., Duchemin,D., Cooke,R., Laudie,M., Berger-Llauro,C.,
            Purnelle,B., Masuy,D., de Haan,M., Maarse,A.C., Alcaraz,J.P.,
            Cottet,A., Casacuberta,E., Monfort,A., Argiriou,A., Flores,M.,
            Liguori,R., Vitale,D., Mannhaupt,G., Haase,D., Schoof,H., Rudd,S.,
            Zaccaria,P., Mewes,H.W., Mayer,K.F., Kaul,S., Town,C.D., Koo,H.L.,
            Tallon,L.J., Jenkins,J., Rooney,T., Rizzo,M., Walts,A.,
            Utterback,T., Fujii,C.Y., Shea,T.P., Creasy,T.H., Haas,B.,
            Maiti,R., Wu,D., Peterson,J., Van Aken,S., Pai,G., Militscher,J.,
            Sellers,P., Gill,J.E., Feldblyum,T.V., Preuss,D., Lin,X.,
            Nierman,W.C., Salzberg,S.L., White,O., Venter,J.C., Fraser,C.M.,
            Kaneko,T., Nakamura,Y., Sato,S., Kato,T., Asamizu,E., Sasamoto,S.,
            Kimura,T., Idesawa,K., Kawashima,K., Kishida,Y., Kiyokawa,C.,
            Kohara,M., Matsumoto,M., Matsuno,A., Muraki,A., Nakayama,S.,
            Nakazaki,N., Shinpo,S., Takeuchi,C., Wada,T., Watanabe,A.,
            Yamada,M., Yasuda,M. and Tabata,S.
  CONSRTM   European Union Chromosome 3 Arabidopsis Sequencing Consortium;
            Institute for Genomic Research; Kazusa DNA Research Institute
  TITLE     Sequence and analysis of chromosome 3 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 408 (6814), 820-822 (2000)
   PUBMED   11130713
REFERENCE   2  (bases 1 to 23459830)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 23459830)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="3"
                     /ecotype="Columbia"
     protein         /locus_tag="AT3G54440"
                     /inference="Similar to RNA sequence,
                     EST:INSD:CF651717.1,INSD:ES003707.1,INSD:BP817836.1,
                     INSD:AA651372.1,INSD:H37478.1,INSD:EG524111.1,
                     INSD:AV806096.1,INSD:BP818269.1,INSD:AV795844.1,
                     INSD:AV826072.1,INSD:EL974056.1,INSD:EL994734.1,
                     INSD:EL200646.1,INSD:EL296052.1,INSD:BP791834.1,
                     INSD:EL099840.1,INSD:AI994249.1,INSD:EH941101.1,
                     INSD:EL972477.1,INSD:BP783603.1,INSD:EG524123.1,
                     INSD:EH866052.1,INSD:BP655313.1,INSD:ES182563.1,
                     INSD:AV807647.1,INSD:EH963988.1,INSD:BP615570.1,
                     INSD:EH838698.1,INSD:AV793471.1,INSD:BE527892.1,
                     INSD:BP659401.1,INSD:EL283446.1,INSD:BP787741.1,
                     INSD:ES159969.1,INSD:EL081249.1"
                     /inference="Similar to RNA sequence,
                     mRNA:INSD:AY091780.1,INSD:AK222134.1"
                     /note="glycoside hydrolase family 2 protein; FUNCTIONS IN:
                     carbohydrate binding, cation binding, beta-galactosidase
                     activity, hydrolase activity, hydrolyzing O-glycosyl
                     compounds, catalytic activity; INVOLVED IN: carbohydrate
                     metabolic process; LOCATED IN: chloroplast; EXPRESSED IN:
                     male gametophyte, guard cell; CONTAINS InterPro DOMAIN/s:
                     Glycoside hydrolase family 2, immunoglobulin-like
                     beta-sandwich (InterPro:IPR006102), Glycoside hydrolase,
                     catalytic core (InterPro:IPR017853), Glycoside hydrolase,
                     family 42, domain 5 (InterPro:IPR004199), Glycoside
                     hydrolase family 2, TIM barrel (InterPro:IPR006103),
                     Glycoside hydrolase, family 2 (InterPro:IPR006101),
                     Glycoside hydrolase-type carbohydrate-binding
                     (InterPro:IPR011013), Glycoside hydrolase-type
                     carbohydrate-binding, subgroup (InterPro:IPR014718),
                     Glycoside hydrolase family 2, carbohydrate-binding
                     (InterPro:IPR006104), Glycoside hydrolase, subgroup,
                     catalytic core (InterPro:IPR013781), Glycoside hydrolase,
                     family 2/20, immunoglobulin-like beta-sandwich domain
                     (InterPro:IPR013812), Galactose-binding domain-like
                     (InterPro:IPR008979); Has 7598 Blast hits to 7490 proteins
                     in 1389 species: Archae - 50; Bacteria - 5980; Metazoa -
                     182; Fungi - 208; Plants - 51; Viruses - 3; Other
                     Eukaryotes - 1124 (source: NCBI BLink)."
                     /db_xref="TAIR:AT3G54440"
                     /db_xref="Araport:AT3G54440"
     intron_pos      44:1 (1/16)
     intron_pos      124:1 (2/16)
     intron_pos      173:1 (3/16)
     intron_pos      199:2 (4/16)
     intron_pos      261:0 (5/16)
     intron_pos      283:0 (6/16)
     intron_pos      363:0 (7/16)
     intron_pos      432:0 (8/16)
     intron_pos      533:1 (9/16)
     intron_pos      586:2 (10/16)
     intron_pos      623:0 (11/16)
     intron_pos      668:1 (12/16)
     intron_pos      687:0 (13/16)
     intron_pos      787:0 (14/16)
     intron_pos      828:0 (15/16)
     intron_pos      1052:0 (16/16)
BEGIN
        1 MVSLATQMIL PSENGYRVWE DQTLFKWRKR DPHVTLRCHE SVQGALRYWY QRNNVDLTVS
       61 KSAVWNDDAV QAALDSAAFW VDGLPFVKSL SGYWKFFLAP KPANVPDKFY DAAFSDSDWN
      121 ALQVPSNWQC HGFDRPIYTN VVYPFPNDPP YVPEDNPTGC YRTYFQIPKE WKDRRILLHF
      181 EAVDSAFFAW INGNPVGYSQ DSRLPAEFEI SDYCYPWDSG KQNVLAVQVF RWSDGSYLED
      241 QDHWWLSGIH RDVLLLAKPK VFIADYFFKS KLADDFSYAD IQVEVKIDNM QESSKDLVLS
      301 NFIIEAAIFD TKNWYNSEGF SCELSPKVAN LKLNPSPSPT LGFHGYLLEG KLDSPNLWSA
      361 EQPNVYILVL TLKDTSGKVL DSESSIVGIR QVSKAFKQLL VNGHPVVIKG VNRHEHHPRV
      421 GKTNIEACMV KDLIMMKEYN INAVRNSHYP QHPRWYELCD LFGMYMIDEA NIETHGFDLS
      481 GHLKHPAKEP SWAAAMLDRV VGMVERDKNH TCIISWSLGN EAGYGPNHSA MAGWIREKDP
      541 SRLVHYEGGG SRTSSTDIVC PMYMRVWDII KIALDQNESR PLILCEYQHA MGNSNGNIDE
      601 YWEAIDNTFG LQGGFIWDWV DQGLLKLGSD GIKRWAYGGD FGDQPNDLNF CLNGLIWPDR
      661 TPHPALHEVK HCYQPIKVSL TDGMIKVANT YFFNTTEELE FSWTIHGDGL ELGSGTLSIP
      721 VIKPQNSFEM EWKSGPWFSF WNDSNAGELF LTINAKLLNL TRSLEAGHLL SSTQIPLPAK
      781 GQIIPQAIKK TDTSITCETV GDFIKISQKD SWELMVNVRK GTIEGWKIQG VLLMNEAILP
      841 CFWRAPTDND KGGGDSSYFS RWKAAQLDNV EFLVESCSVK SITDKSVEIE FIYLGSSASG
      901 SSKSDALFKV NVTYLIYGSG DIITNWFVEP NSDLPPLPRV GIEFHIEKTL DRVEWYGKGP
      961 FECYPDRKAA AHVAIYEHNV GDMHVPYIVP GENGGRTDVR WVTFRNKDGV GIYASTYGSS
     1021 SLMQMNASYY TTGELHRATH EEDLIKGQNI EVHLDHKHMG LGGDDSWTPC VHDKFLIPPA
     1081 QYSFSLRLCP ITASTSGLNI YKDQLPC
//