LOCUS       AEC09066.1              1396 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana transcription activator protein.
ACCESSION   CP002685-5032
PROTEIN_ID  AEC09066.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /gene="GRL"
                     /locus_tag="AT2G35110"
                     /gene_synonym="GNARLED"
                     /gene_synonym="NAP1"
                     /gene_synonym="NAPP"
                     /gene_synonym="NCK-ASSOCIATED PROTEIN 1"
                     /gene_synonym="T4C15.22"
                     /gene_synonym="T4C15_22"
                     /inference="Similar to RNA sequence,
                     EST:INSD:AV545854.1,INSD:BP839997.1,INSD:AV547935.1,
                     INSD:AV546555.1,INSD:ES206891.1,INSD:AV547490.1,
                     INSD:ES206183.1,INSD:EG462444.1,INSD:AV548139.1,
                     INSD:AV554853.1,INSD:AV554801.1,INSD:EH814037.1,
                     INSD:EL170195.1,INSD:EG460151.1,INSD:EG460262.1,
                     INSD:EG457858.1,INSD:EH980384.1,INSD:T88379.1,
                     INSD:EG457857.1,INSD:EH891048.1,INSD:ES117004.1,
                     INSD:EH832775.1,INSD:AV556813.1,INSD:EL110727.1,
                     INSD:EL044235.1,INSD:ES136757.1,INSD:EG462443.1,
                     INSD:AA394638.1,INSD:AV548158.1,INSD:BP812495.2"
                     /inference="similar to RNA sequence,
                     mRNA:INSD:AY662956.1,INSD:AY496700.1,INSD:AK229925.1"
                     /note="GNARLED (GRL); CONTAINS InterPro DOMAIN/s:
                     Nck-associated protein 1 (InterPro:IPR019137); Has 35333
                     Blast hits to 34131 proteins in 2444 species: Archae -
                     798; Bacteria - 22429; Metazoa - 974; Fungi - 991; Plants
                     - 531; Viruses - 0; Other Eukaryotes - 9610 (source: NCBI
                     BLink)."
                     /db_xref="Araport:AT2G35110"
                     /db_xref="TAIR:AT2G35110"
     intron_pos      135:0 (1/21)
     intron_pos      160:0 (2/21)
     intron_pos      187:0 (3/21)
     intron_pos      214:0 (4/21)
     intron_pos      241:2 (5/21)
     intron_pos      270:0 (6/21)
     intron_pos      312:0 (7/21)
     intron_pos      348:0 (8/21)
     intron_pos      363:0 (9/21)
     intron_pos      410:2 (10/21)
     intron_pos      455:0 (11/21)
     intron_pos      492:0 (12/21)
     intron_pos      518:1 (13/21)
     intron_pos      583:0 (14/21)
     intron_pos      631:2 (15/21)
     intron_pos      659:0 (16/21)
     intron_pos      696:0 (17/21)
     intron_pos      738:0 (18/21)
     intron_pos      784:2 (19/21)
     intron_pos      817:0 (20/21)
     intron_pos      1222:2 (21/21)
BEGIN
        1 MANSRQYYPS QDESMSPTSV RSREWEGPSR WTEYLGPEMA ASVSSTRSSK QIDGHVGGST
       61 KALNIQWVVQ MIEVADGLMA KMYRLNQILE YPDPVGHVFS EAFWKAGVFP NHPRICTLLS
      121 KKFPEHFSKL QLERIDKFSL DSLHDGAELH LQSLEPWIQL LLDLMAFREQ ALRLILDLSS
      181 TVITLLPHQN SLILHAFMDL FCAFVRVNLF AEKIPRKMLL QVYNLLHALS RNDRDCDFYH
      241 RLVQFIDSYD PPLKGLQEDL NFVSPRIGEV LEAVGPSIFL SADTRKLRNE GFLSPYHPRF
      301 PDILTNSAHP MRAQDLANVT SYREWVLLGY LVCPDELLRV TSIDIALVVL KENLVVTLFR
      361 DEYILLHEDY QLYVLPRVLE SKKMAKSGRT KQKEADLEYS VAKQVEKMIS EVHEQALQLC
      421 DTIHRERRIL LKQEIGRMVL FFTDQPSLLA PNIQMVFSAL ALAQSEVLWY FQHAGIASSR
      481 SKAARVIPVD IDPNDPTIGF LLDGMDRLCC LVRKYISAAR GYALSYLSSS AGRIRYLMGT
      541 PGIVALDLDP TLKGLFQRIV QHLESIPKAQ GENVSAITCD LSDFRKDWLS ILMIVTSSRS
      601 SINIRHLEKA TVSTGKEGLL SEGNAAYNWS RCVDELESQL SKHGSLKKLY FYHQHLTTVF
      661 RNTMFGPEGR PQHCCAWLSV ASSFPECASL IIPEEVTKFG RDAVLYVESL IESIMGGLEG
      721 LINILDSEGG FGALESQLLP EQAAAYLNNA SRISAPSVKS PRVVGGFTLP GHESYPENNK
      781 SIKMLEAAIQ RLTNLCSILN DMEPICVINH VFVLREYMRE CILGNFKRRF LTALQTDNDL
      841 QRPSVLESLI RRHMGIVHLA EQHVSMDLTQ GIREILLTEA FSGPVSSLHT FEKPAEQQQT
      901 TGSAVEVVCN WYMDNIIKDV SGAGILFAPR HKYFKSTRPV GGYFAESVTD LKELQAFVRI
      961 FGGYGVDRLD RMMKVHTAAL VNCIETSLRS NRELIEAAAA SMHSGDRVER DASVRQIVDL
     1021 DTVIGFCIEA GQALAFDDLL AEASGAVLED NASLIHSMIS GIVEHIPEEI PEKKEIRRIK
     1081 GVANGVGVAG DHDSEWVRLI LEEVGGANDN SWSLLPYFFA SFMTSNAWNT TGFNIETGGF
     1141 SNNIHCLARC ISAVIAGSEY VRLQREYQQQ HQSLSNGHHS SENLDSEFPP RVTAEASIKS
     1201 SMLLFVKFAA SIVLDSWSEA NRSHLVAKLI FLDQLCEISP YLPRSSLESH VPYTILRSIY
     1261 TQYYSNTPST PLSTASPYHS PSVSLIHASP SMKNSTTPQR GSGSGSSSTA APDSGYFKGS
     1321 SSSLYGQEHY TESETGNSRN NENNNNNKQR GSSRRSGPLD YSSSHKGGSG SNSTGPSPLP
     1381 RFAVSRSGPI SYKQHN
//