LOCUS       AEC07449.1               902 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana SET domain-containing protein.
ACCESSION   CP002685-2786
PROTEIN_ID  AEC07449.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /gene="CLF"
                     /locus_tag="AT2G23380"
                     /gene_synonym="CURLY LEAF"
                     /gene_synonym="F26B6.3"
                     /gene_synonym="F26B6_3"
                     /gene_synonym="ICU1"
                     /gene_synonym="INCURVATA 1"
                     /gene_synonym="SDG1"
                     /gene_synonym="SET1"
                     /gene_synonym="SETDOMAIN 1"
                     /gene_synonym="SETDOMAIN GROUP 1"
                     /inference="similar to RNA sequence,
                     EST:INSD:EL216881.1,INSD:DR750719.1,INSD:EL138999.1,
                     INSD:EL240094.1,INSD:ES106056.1,INSD:BP795333.1,
                     INSD:EL333045.1,INSD:BP817523.1,INSD:EH812023.1,
                     INSD:EL982461.1,INSD:EL082413.1,INSD:EL988692.1,
                     INSD:EH930611.1,INSD:DR750720.1,INSD:EL242048.1"
                     /inference="similar to RNA sequence, mRNA:INSD:Y10580.1"
                     /note="CURLY LEAF (CLF); FUNCTIONS IN: protein binding,
                     sequence-specific DNA binding transcription factor
                     activity; INVOLVED IN: 7 processes; LOCATED IN:
                     chloroplast; EXPRESSED IN: 15 plant structures; EXPRESSED
                     DURING: 7 growth stages; CONTAINS InterPro DOMAIN/s: SET
                     domain (InterPro:IPR001214); BEST Arabidopsis thaliana
                     protein match is: SET domain-containing protein
                     (TAIR:AT4G02020.1); Has 5951 Blast hits to 5285 proteins
                     in 534 species: Archaea - 0; Bacteria - 530; Metazoa -
                     2584; Fungi - 730; Plants - 989; Viruses - 16; Other
                     Eukaryotes - 1102 (source: NCBI BLink)."
                     /db_xref="Araport:AT2G23380"
                     /db_xref="TAIR:AT2G23380"
     intron_pos      22:0 (1/16)
     intron_pos      53:0 (2/16)
     intron_pos      153:2 (3/16)
     intron_pos      207:2 (4/16)
     intron_pos      236:0 (5/16)
     intron_pos      281:0 (6/16)
     intron_pos      297:0 (7/16)
     intron_pos      321:0 (8/16)
     intron_pos      554:2 (9/16)
     intron_pos      605:0 (10/16)
     intron_pos      679:2 (11/16)
     intron_pos      723:2 (12/16)
     intron_pos      754:0 (13/16)
     intron_pos      770:0 (14/16)
     intron_pos      813:0 (15/16)
     intron_pos      839:0 (16/16)
BEGIN
        1 MASEASPSSS ATRSEPPKDS PAEERGPASK EVSEVIESLK KKLAADRCIS IKKRIDENKK
       61 NLFAITQSFM RSSMERGGSC KDGSDLLVKR QRDSPGMKSG IDESNNNRYV EDGPASSGMV
      121 QGSSVPVKIS LRPIKMPDIK RLSPYTTWVF LDRNQRMTED QSVVGRRRIY YDQTGGEALI
      181 CSDSEEEAID DEEEKRDFLE PEDYIIRMTL EQLGLSDSVL AELASFLSRS TSEIKARHGV
      241 LMKEKEVSES GDNQAESSLL NKDMEGALDS FDNLFCRRCL VFDCRLHGCS QDLIFPAEKP
      301 APWCPPVDEN LTCGANCYKT LLKSGRFPGY GTIEGKTGTS SDGAGTKTTP TKFSSKLNGR
      361 KPKTFPSESA SSNEKCALET SDSENGLQQD TNSDKVSSSP KVKGSGRRVG RKRNKNRVAE
      421 RVPRKTQKRQ KKTEASDSDS IASGSCSPSD AKHKDNEDAT SSSQKHVKSG NSGKSRKNGT
      481 PAEVSNNSVK DDVPVCQSNE VASELDAPGS DESLRKEEFM GETVSRGRLA TNKLWRPLEK
      541 SLFDKGVEIF GMNSCLIARN LLSGFKSCWE VFQYMTCSEN KASFFGGDGL NPDGSSKFDI
      601 NGNMVNNQVR RRSRFLRRRG KVRRLKYTWK SAAYHSIRKR ITEKKDQPCR QFNPCNCKIA
      661 CGKECPCLLN GTCCEKYCGC PKSCKNRFRG CHCAKSQCRS RQCPCFAADR ECDPDVCRNC
      721 WVIGGDGSLG VPSQRGDNYE CRNMKLLLKQ QQRVLLGISD VSGWGAFLKN SVSKHEYLGE
      781 YTGELISHKE ADKRGKIYDR ENCSFLFNLN DQFVLDAYRK GDKLKFANHS PEPNCYAKVI
      841 MVAGDHRVGI FAKERILAGE ELFYDYRYEP DRAPAWAKKP EAPGSKKDEN VTPSVGRPKK
      901 LA
//