LOCUS       AEC05423.1               324 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana hypothetical protein (DUF789) protein.
ACCESSION   CP002685-49
PROTEIN_ID  AEC05423.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /locus_tag="AT2G01260"
                     /gene_synonym="F10A8.14"
                     /gene_synonym="F10A8_14"
                     /inference="Similar to RNA sequence,
                     EST:INSD:EL057964.1,INSD:DR231737.1,INSD:BP572320.1,
                     INSD:BP600925.1,INSD:EH990366.1,INSD:AV522477.1,
                     INSD:DR231738.1,INSD:EL171190.1,INSD:BP607439.1,
                     INSD:EL043699.1,INSD:EL062481.1,INSD:EL321270.1,
                     INSD:AV533382.1,INSD:DR231741.1,INSD:AU226714.1,
                     INSD:BP611710.1,INSD:DR231740.1,INSD:BP590301.1,
                     INSD:EL176718.1,INSD:EL218259.1,INSD:BP847570.1,
                     INSD:EH895024.1,INSD:DR231739.1,INSD:BP779285.1"
                     /inference="similar to RNA sequence, mRNA:INSD:BX820744.1"
                     /note="Protein of unknown function (DUF789); CONTAINS
                     InterPro DOMAIN/s: Protein of unknown function DUF789
                     (InterPro:IPR008507); BEST Arabidopsis thaliana protein
                     match is: Protein of unknown function (DUF789)
                     (TAIR:AT1G15030.1); Has 35333 Blast hits to 34131 proteins
                     in 2444 species: Archae - 798; Bacteria - 22429; Metazoa -
                     974; Fungi - 991; Plants - 531; Viruses - 0; Other
                     Eukaryotes - 9610 (source: NCBI BLink)."
                     /db_xref="Araport:AT2G01260"
                     /db_xref="TAIR:AT2G01260"
     intron_pos      85:0 (1/4)
     intron_pos      160:2 (2/4)
     intron_pos      237:0 (3/4)
     intron_pos      265:2 (4/4)
BEGIN
        1 MLGAGFQLTR GRHGDDPFYT SAKTRRANQR IDQLRRAQSD VSNVPSSAPS PHKQQLEPSD
       61 LSSSNLDRFL ESVTPSVPAQ FLSKTLLRER RADDDYNKLV PYFVLGDIWD SFAEWSAYGT
      121 GVPLVLNNNK DRVIQYYVPS LSAIQIYAHS HALDSSLKSR RPGDSSDSDF RDSSSDVSSD
      181 SDSERVSARV DCISLRDQHQ EDSSSDDGEP LGSQGRLMFE YLERDLPYIR EPFADKVLDL
      241 AAQFPELMTL RSCDLLRSSW FSVAWYPIYR IPTGPTLKDL DACFLTYHSL HTSFGGKPKL
      301 FYLSKQQVVG LHCSTTYTIS NQNT
//