LOCUS       AEC07904.1              2554 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana DNAJ heat shock N-terminal domain-
            containing protein.
ACCESSION   CP002685-3467
PROTEIN_ID  AEC07904.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /gene="GRV2"
                     /locus_tag="AT2G26890"
                     /gene_synonym="F12C20.7"
                     /gene_synonym="F12C20_7"
                     /gene_synonym="GRAVITROPISM DEFECTIVE 2"
                     /gene_synonym="KAM2"
                     /gene_synonym="KATAMARI2"
                     /inference="similar to RNA sequence,
                     EST:INSD:EH895605.1,INSD:EG454221.1,INSD:AV529500.1,
                     INSD:EL244502.1,INSD:AV545598.1,INSD:EL336673.1,
                     INSD:ES051444.1,INSD:EH876496.1,INSD:AV526189.1,
                     INSD:EL259542.1,INSD:EG454225.1,INSD:AV554925.1,
                     INSD:ES028881.1,INSD:AA598182.1,INSD:AV547657.1,
                     INSD:EG482015.1,INSD:BX840725.1,INSD:AV554366.1,
                     INSD:AV439552.1,INSD:AV548707.1,INSD:AV520094.1,
                     INSD:AV545902.1,INSD:BX840516.1,INSD:EL335256.1,
                     INSD:EL971841.1,INSD:AA650872.1,INSD:EH985772.1,
                     INSD:DR352722.1,INSD:BX840706.1,INSD:EL307207.1,
                     INSD:EG482016.1,INSD:ES071958.1,INSD:AV548168.1,
                     INSD:AA394797.1,INSD:EL985544.1,INSD:EG454222.1,
                     INSD:EG454226.1,INSD:EL140111.1,INSD:ES048328.1,
                     INSD:EG454209.1,INSD:AA394406.1,INSD:BP791831.1"
                     /inference="similar to RNA sequence, mRNA:INSD:BX821814.1"
                     /note="GRAVITROPISM DEFECTIVE 2 (GRV2); FUNCTIONS IN:
                     binding, heat shock protein binding; INVOLVED IN: in 10
                     processes; LOCATED IN: in 6 components; EXPRESSED IN: 30
                     plant structures; EXPRESSED DURING: 14 growth stages;
                     CONTAINS InterPro DOMAIN/s: Molecular chaperone, heat
                     shock protein, Hsp40, DnaJ (InterPro:IPR015609), Heat
                     shock protein DnaJ, N-terminal (InterPro:IPR001623),
                     Armadillo-type fold (InterPro:IPR016024); Has 35333 Blast
                     hits to 34131 proteins in 2444 species: Archaea - 798;
                     Bacteria - 22429; Metazoa - 974; Fungi - 991; Plants -
                     531; Viruses - 0; Other Eukaryotes - 9610 (source: NCBI
                     BLink)."
                     /db_xref="Araport:AT2G26890"
                     /db_xref="TAIR:AT2G26890"
     intron_pos      147:0 (1/21)
     intron_pos      225:0 (2/21)
     intron_pos      254:1 (3/21)
     intron_pos      324:0 (4/21)
     intron_pos      358:0 (5/21)
     intron_pos      379:0 (6/21)
     intron_pos      1114:0 (7/21)
     intron_pos      1235:0 (8/21)
     intron_pos      1282:0 (9/21)
     intron_pos      1413:0 (10/21)
     intron_pos      1578:0 (11/21)
     intron_pos      1652:2 (12/21)
     intron_pos      1767:2 (13/21)
     intron_pos      1866:0 (14/21)
     intron_pos      2015:0 (15/21)
     intron_pos      2130:1 (16/21)
     intron_pos      2245:0 (17/21)
     intron_pos      2401:0 (18/21)
     intron_pos      2442:2 (19/21)
     intron_pos      2484:0 (20/21)
     intron_pos      2507:0 (21/21)
BEGIN
        1 MDSVSRGAVA STTGGAVEEP EYLARYLVVK HSWRGRYKRI LCISSGGIVT LDPNTLAVTN
       61 SYDTGSNFDG ASPLVGRDEN TESVGGEFTV NVRTDGKGKF KAMKFSSRCR ASILTELYRL
      121 RWNQIRPVAE FQVLHLRRRN AEWVPYKLKI TFVGLELVDS KSGNSRWILD FRDMGSPAII
      181 LLSDAYRTKS ADSAGFVLCP MYGRKSKAFR AAPGTTNSSI VASLAKTAKS MVGVFLSVDD
      241 SQLLTVSEYM TRRAKEAVGA EETPNGWWSV TRLRSAAHGT LNMPGLSLAI GPKGGLGEHG
      301 DAVALQLILT KASLVERRID NYEVVIVRPL SSVSSLVRFA EEPQMFAIEF SDGCPVLVYA
      361 SISRDNLLAA ILDTLQTEGH CPIPVLPRLT MPGHRIDPPC GRVSLISGPQ HLVADLETCS
      421 LHLKHLAAAA KDAVAEGGSV PGCRARLWRR IREFNACIPY TGVPANSEVP EVTLMALITM
      481 LPSTPNLPVD APPLPPPSPK AAATVIGFVT CLRRLLSSRS AASHIMSFPA AVNRIMGLLR
      541 NGSEGVAAEA AGLIASLIGG WSADLSTAPD SRGEKHATIM HTKSVLFAQQ GYVTILVNRL
      601 KPMSVSPLFS MAIVEVFEAM VCDPHGETTQ YTVFVELLRQ IAALRRRLFA LFAHPAESVR
      661 ETIAVIMRTI AEEDAIAAES MRDAALRDGA LLRHLLNAFS LPASERREVS RQLVALWADS
      721 YQPALDLLSR VLPPGLVAYL HTRPDDVVDD TDQEGSSTNR RQKRLLQQRR GRIAKGMGAQ
      781 DIPLPPGNNV EAGDAAKHMS ANASVPDNFQ RRAADSSSEA SNPQASAFPG VDSTIAGVSQ
      841 NGYPAFASVT TNANGHEQPE TNASDVVGSD PNLYGIQNSV LPAPAQVIVE STAVGSGKLL
      901 LNWREFWRAF GLDHNRADLI WNERTRQELI EALKAEVHNL DVEKERTEDI SPGDVEATTG
      961 QEIIPRISWN YSEFSVSYRS LSKEVCVGQY YLRLLLESGN AGKAQDFPLR DPVAFFRALY
     1021 HRFQCDADMG LTIDGAVPDE LGSSGDWCDM SRLDGFGGGG GASVRELCAR AMAIVYEQHY
     1081 NTIGPFEGTA HITALIDRTN DRALRHRLLL LLKALVKVLL NVEGCVVVGG CVLAVDLLTV
     1141 VHENSERTPI PLQSNLIAAT AFMEPPKEWM YIDKGGAEVG PVEKDVIRSL WSKKDIDWTT
     1201 KCRALGMSDW KKLRDIRELR WAVAVRVPVL TPSQVGDAAL SILHSMVSAH SDLDDAGEIV
     1261 TPTPRVKRIL SSTRCLPHIA QALLSGEPVI VEAGAALLKD VVTRNSKAMI RLYSTGAFYF
     1321 ALAYPGSNLY SIAQLFSVTH VHQAFHGGEE ATVSSSLPLA KRSVLGGLLP ESLLYVLERS
     1381 GPAAFAAGMV SDSDTPEIIW THKMRAENLI CQVLQHLGDY PQKLSQHCHS LYDYAPMPPV
     1441 TYPELRDEMW CHRYYLRNLC DEIQFPNWPI VEHVEFLQSL LVMWREELTR KPMDLSEGEA
     1501 CKILEISLNN VSSDDLNRTA SVELNEEISN ISKQIQNLDE EKLKRQYRKL AMRYHPDKNP
     1561 EGREKFLAVQ KAYECLQATM QGLQGPQPWR LLLLLKAQCI LYRRYGHVLR PFKYAGYPML
     1621 LDAVTVDKDD NNFLSNDRSP LLVAASELVS LTCAASSLNG EELVRDGGVQ LLSTLLSRCM
     1681 CVVQPTTSQH EPAAIIVTNV MRTLSVISQF ESARAGFLEL PSLIEDIVHC TELERVPAAV
     1741 DAALQSIAKV SVFPELQHGL LKAGALWYIL PLLLQYDSTA EESNSVESHG VGVSIQIAKN
     1801 EHALQASQAL SRLTGLCADE SLTPYNATAA DVLKALLTPK LASLLKDEVA KDLLSKLNTN
     1861 LETPEIIWNS ATRSELLNFV DEQRACQCPD GSYDLKNAQS FSYDALSKEV FVGNVYLKVY
     1921 NDQPDSEISE PESFCNALID FISSLVHTEL PSVSEDQNLI EDRNSSNDTP ELQSSVAEPS
     1981 LIEEHSDHQP SSEGMKNEEC FLIDHLQLGL TALQNLLTKY PDLASVFSSK ERLLPLFECF
     2041 SVAIASKTDI PKLCLNVLSR LTAYAPCLET MVSDGSSLLL LLQMLHSAPS FREGALHVLY
     2101 ALASTPELAW AAAKHGGVVY ILELLLPLQK EIPLQQRAAA ASLLGKLVAQ PMHGPRVAIT
     2161 LVRFLPDGLV SIIRDGPGEA VVHALERTTE TPELVWTPAM AASLSAQIAT MASDIYREQQ
     2221 KGSVIEWDVP EQSAGQQEMR DEPQVGGIYV RRFLKDPKFP LRNPKRFLEG LLDQYLSAMA
     2281 ATHYEQHPVD PELPLLLSAA LVSLLRVHPA LADHIGHLGY VPKLVAAVAY EGRRETMSSG
     2341 EVKAEEIGSD GVNESTDPSS LPGQTPQERV RLSCLRVLHQ LAASTTCAEA MAATSAGNAQ
     2401 VVPLLMKAIG WLGGSILALE TLKRVVVAGN RARDALVAQG LKVGLIEVLL GLLDWRTGGR
     2461 YGLSSHMKWN ESEASIGRVL AVEVLHGFAT EGAHCSKVRE ILDASEVWSA YKDQKHDLFL
     2521 PSNTQSAAGV AGFIENSSNS LTYALTAPPP PSHP
//