LOCUS       AEE76793.1               991 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana heteroglycan glucosidase 1 protein.
ACCESSION   CP002686-4419
PROTEIN_ID  AEE76793.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 23459830)
  AUTHORS   Salanoubat,M., Lemcke,K., Rieger,M., Ansorge,W., Unseld,M.,
            Fartmann,B., Valle,G., Blocker,H., Perez-Alonso,M., Obermaier,B.,
            Delseny,M., Boutry,M., Grivell,L.A., Mache,R., Puigdomenech,P., De
            Simone,V., Choisne,N., Artiguenave,F., Robert,C., Brottier,P.,
            Wincker,P., Cattolico,L., Weissenbach,J., Saurin,W., Quetier,F.,
            Schafer,M., Muller-Auer,S., Gabel,C., Fuchs,M., Benes,V.,
            Wurmbach,E., Drzonek,H., Erfle,H., Jordan,N., Bangert,S.,
            Wiedelmann,R., Kranz,H., Voss,H., Holland,R., Brandt,P.,
            Nyakatura,G., Vezzi,A., D'Angelo,M., Pallavicini,A., Toppo,S.,
            Simionati,B., Conrad,A., Hornischer,K., Kauer,G., Lohnert,T.H.,
            Nordsiek,G., Reichelt,J., Scharfe,M., Schon,O., Bargues,M.,
            Terol,J., Climent,J., Navarro,P., Collado,C., Perez-Perez,A.,
            Ottenwalder,B., Duchemin,D., Cooke,R., Laudie,M., Berger-Llauro,C.,
            Purnelle,B., Masuy,D., de Haan,M., Maarse,A.C., Alcaraz,J.P.,
            Cottet,A., Casacuberta,E., Monfort,A., Argiriou,A., flores,M.,
            Liguori,R., Vitale,D., Mannhaupt,G., Haase,D., Schoof,H., Rudd,S.,
            Zaccaria,P., Mewes,H.W., Mayer,K.F., Kaul,S., Town,C.D., Koo,H.L.,
            Tallon,L.J., Jenkins,J., Rooney,T., Rizzo,M., Walts,A.,
            Utterback,T., Fujii,C.Y., Shea,T.P., Creasy,T.H., Haas,B.,
            Maiti,R., Wu,D., Peterson,J., Van Aken,S., Pai,G., Militscher,J.,
            Sellers,P., Gill,J.E., Feldblyum,T.V., Preuss,D., Lin,X.,
            Nierman,W.C., Salzberg,S.L., White,O., Venter,J.C., Fraser,C.M.,
            Kaneko,T., Nakamura,Y., Sato,S., Kato,T., Asamizu,E., Sasamoto,S.,
            Kimura,T., Idesawa,K., Kawashima,K., Kishida,Y., Kiyokawa,C.,
            Kohara,M., Matsumoto,M., Matsuno,A., Muraki,A., Nakayama,S.,
            Nakazaki,N., Shinpo,S., Takeuchi,C., Wada,T., Watanabe,A.,
            Yamada,M., Yasuda,M. and Tabata,S.
  CONSRTM   European Union Chromosome 3 Arabidopsis Sequencing Consortium;
            Institute for Genomic Research; Kazusa DNA Research Institute
  TITLE     Sequence and analysis of chromosome 3 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 408 (6814), 820-822 (2000)
   PUBMED   11130713
REFERENCE   2  (bases 1 to 23459830)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 23459830)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="3"
                     /ecotype="Columbia"
     protein         /gene="HGL1"
                     /locus_tag="AT3G23640"
                     /gene_synonym="heteroglycan glucosidase 1"
                     /inference="Similar to RNA sequence,
                     EST:INSD:AV522931.1,INSD:ES196596.1,INSD:CB261795.1,
                     INSD:BP611408.1,INSD:AV804127.1,INSD:AV813735.1,
                     INSD:AV830895.1,INSD:EL185783.1,INSD:BP608793.1,
                     INSD:EL297482.1,INSD:EH891474.1,INSD:AV822916.1,
                     INSD:EL320928.1,INSD:EG431954.1,INSD:EL235127.1,
                     INSD:EG431953.1,INSD:AV803454.1,INSD:EH923780.1,
                     INSD:AV813955.1,INSD:AV807498.1,INSD:EH826146.1,
                     INSD:BP606813.1,INSD:CB262944.1,INSD:AV783788.1,
                     INSD:EL312740.1,INSD:EH973080.1,INSD:ES140056.1,
                     INSD:AV798831.1,INSD:EL222398.1,INSD:BE529834.1,
                     INSD:AV792653.1,INSD:EG521804.1"
                     /note="heteroglycan glucosidase 1 (HGL1); FUNCTIONS IN:
                     hydrolase activity, hydrolyzing O-glycosyl compounds;
                     INVOLVED IN: carbohydrate metabolic process; LOCATED IN:
                     chloroplast; EXPRESSED IN: 22 plant structures; EXPRESSED
                     DURING: 13 growth stages; CONTAINS InterPro DOMAIN/s:
                     Glycoside hydrolase, family 31 (InterPro:IPR000322),
                     Glycoside hydrolase, catalytic core (InterPro:IPR017853);
                     BEST Arabidopsis thaliana protein match is: Glycosyl
                     hydrolases family 31 protein (TAIR:AT5G63840.1); Has 5349
                     Blast hits to 5021 proteins in 1110 species: Archae - 88;
                     Bacteria - 3100; Metazoa - 761; Fungi - 803; Plants - 278;
                     Viruses - 0; Other Eukaryotes - 319 (source: NCBI BLink)."
                     /db_xref="TAIR:AT3G23640"
                     /db_xref="Araport:AT3G23640"
     intron_pos      82:0 (1/21)
     intron_pos      105:0 (2/21)
     intron_pos      151:0 (3/21)
     intron_pos      190:1 (4/21)
     intron_pos      218:0 (5/21)
     intron_pos      250:0 (6/21)
     intron_pos      306:1 (7/21)
     intron_pos      354:0 (8/21)
     intron_pos      383:0 (9/21)
     intron_pos      445:0 (10/21)
     intron_pos      501:0 (11/21)
     intron_pos      541:1 (12/21)
     intron_pos      564:2 (13/21)
     intron_pos      594:0 (14/21)
     intron_pos      634:1 (15/21)
     intron_pos      699:0 (16/21)
     intron_pos      735:1 (17/21)
     intron_pos      787:1 (18/21)
     intron_pos      821:2 (19/21)
     intron_pos      879:2 (20/21)
     intron_pos      928:1 (21/21)
BEGIN
        1 MTLSGDSSET VEMTSTDMIF EPILEHGVFR FDCSVDHRKA AFPSVSFKNS KDREVPIVSH
       61 IVPAYIPTCG CLQDQQVVTF EFSPGTSFYG TGEVSGQLER TGKRVFTWNT DAWGYGSGTT
      121 SLYQSHPWVL VVLPTGETLG VLADTTRKCE IDLRKEGIIR IISPASYPII TFGPFSSPTA
      181 VLESLSHAIG TVFMPPKWAL GYHQCRWSYM SDKRVAEIAQ TFRDKKIPSD VIWMDIDYMD
      241 GFRCFTFDKE RFPDPSALAK DLHSNGFKAI WMLDPGIKQE EGYYVYDSGS KNDVWISRAD
      301 GKPFTGEVWP GPCVFPDYTN SKARSWWANL VKEFVSNGVD GIWNDMNEPA VFKVVTKTMP
      361 ENNIHHGDDE LGGVQNHSHY HNVYGMLMAR STYEGMELAD KNKRPFVLTR AGFIGSQRYA
      421 ATWTGDNLSN WEHLHMSISM VLQLGLSGQP LSGPDIGGFA GNATPRLFGR WMGVGAMFPF
      481 CRGHSEAGTD DHEPWSFGEE CEEVCRAALK RRYQLLPHFY TLFYIAHTTG APVAAPIFFA
      541 DPIDSRLRAV ENGFLLGPLL IYASTLSSQG SHELQHILPR GIWHRFDFAD SHPDLPTLYL
      601 QGGSIISLAP PHLHVGEFSL SDDLTLLVSL DENGKAKGLL FEDDGDGYGY TKGRFLVTHY
      661 IAERDSSTVT VKVSKTEGDW QRPNRRVHVQ LLLGGGAMLD AWGMDGEFIH IKVPSESGIS
      721 ELISTSNERF KLHMENTKLI PEKEVVPGQK GMELSKEPVE LSSGDWKLNI VPWVGGRILS
      781 MTHVPSGIQW LHSRIDINGY EEYSGTEYRS AGCTEEYNVI ERDLEHAGEE ESLILEGDVG
      841 GGLVLRRKIS IAKDNQRVFR IASSIEARSV GAGSGGFSRL VCLRVHPTFT LLHPTESFVS
      901 FTSIDGSKHE VWPDSGDQIY EGNNLPHGKW MLVDKSLNLR MVNRFDVSQV FKCIIHWDCG
      961 TVNLELWSKE RPVSKESPLK IEHEYEVTSF P
//