LOCUS       AEE76415.1              1122 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana amino-terminal region of chorein protein.
ACCESSION   CP002686-3898
PROTEIN_ID  AEE76415.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 23459830)
  AUTHORS   Salanoubat,M., Lemcke,K., Rieger,M., Ansorge,W., Unseld,M.,
            Fartmann,B., Valle,G., Blocker,H., Perez-Alonso,M., Obermaier,B.,
            Delseny,M., Boutry,M., Grivell,L.A., Mache,R., Puigdomenech,P., De
            Simone,V., Choisne,N., Artiguenave,F., Robert,C., Brottier,P.,
            Wincker,P., Cattolico,L., Weissenbach,J., Saurin,W., Quetier,F.,
            Schafer,M., Muller-Auer,S., Gabel,C., Fuchs,M., Benes,V.,
            Wurmbach,E., Drzonek,H., Erfle,H., Jordan,N., Bangert,S.,
            Wiedelmann,R., Kranz,H., Voss,H., Holland,R., Brandt,P.,
            Nyakatura,G., Vezzi,A., D'Angelo,M., Pallavicini,A., Toppo,S.,
            Simionati,B., Conrad,A., Hornischer,K., Kauer,G., Lohnert,T.H.,
            Nordsiek,G., Reichelt,J., Scharfe,M., Schon,O., Bargues,M.,
            Terol,J., Climent,J., Navarro,P., Collado,C., Perez-Perez,A.,
            Ottenwalder,B., Duchemin,D., Cooke,R., Laudie,M., Berger-Llauro,C.,
            Purnelle,B., Masuy,D., de Haan,M., Maarse,A.C., Alcaraz,J.P.,
            Cottet,A., Casacuberta,E., Monfort,A., Argiriou,A., flores,M.,
            Liguori,R., Vitale,D., Mannhaupt,G., Haase,D., Schoof,H., Rudd,S.,
            Zaccaria,P., Mewes,H.W., Mayer,K.F., Kaul,S., Town,C.D., Koo,H.L.,
            Tallon,L.J., Jenkins,J., Rooney,T., Rizzo,M., Walts,A.,
            Utterback,T., Fujii,C.Y., Shea,T.P., Creasy,T.H., Haas,B.,
            Maiti,R., Wu,D., Peterson,J., Van Aken,S., Pai,G., Militscher,J.,
            Sellers,P., Gill,J.E., Feldblyum,T.V., Preuss,D., Lin,X.,
            Nierman,W.C., Salzberg,S.L., White,O., Venter,J.C., Fraser,C.M.,
            Kaneko,T., Nakamura,Y., Sato,S., Kato,T., Asamizu,E., Sasamoto,S.,
            Kimura,T., Idesawa,K., Kawashima,K., Kishida,Y., Kiyokawa,C.,
            Kohara,M., Matsumoto,M., Matsuno,A., Muraki,A., Nakayama,S.,
            Nakazaki,N., Shinpo,S., Takeuchi,C., Wada,T., Watanabe,A.,
            Yamada,M., Yasuda,M. and Tabata,S.
  CONSRTM   European Union Chromosome 3 Arabidopsis Sequencing Consortium;
            Institute for Genomic Research; Kazusa DNA Research Institute
  TITLE     Sequence and analysis of chromosome 3 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 408 (6814), 820-822 (2000)
   PUBMED   11130713
REFERENCE   2  (bases 1 to 23459830)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 23459830)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="3"
                     /ecotype="Columbia"
     protein         /locus_tag="AT3G20720"
                     /inference="Similar to RNA sequence,
                     EST:INSD:AA395038.1,INSD:ES113869.1,INSD:R90256.1,
                     INSD:AV548156.1,INSD:EH916439.1,INSD:ES096348.1,
                     INSD:AI099894.1,INSD:AV546068.1,INSD:BP858193.1,
                     INSD:AI993195.1,INSD:EL119311.1,INSD:T42350.1,
                     INSD:T46572.1,INSD:AU237098.1,INSD:AV441469.1,
                     INSD:EH920770.1,INSD:AI992928.1,INSD:AU228119.1,
                     INSD:AA651437.1"
                     /inference="Similar to RNA sequence, mRNA:INSD:AK176813.1"
                     /note="unknown protein; Has 184 Blast hits to 181 proteins
                     in 66 species: Archae - 0; Bacteria - 2; Metazoa - 137;
                     Fungi - 0; Plants - 40; Viruses - 0; Other Eukaryotes - 5
                     (source: NCBI BLink)."
                     /db_xref="TAIR:AT3G20720"
                     /db_xref="Araport:AT3G20720"
     intron_pos      38:1 (1/19)
     intron_pos      68:0 (2/19)
     intron_pos      104:2 (3/19)
     intron_pos      123:0 (4/19)
     intron_pos      152:2 (5/19)
     intron_pos      175:0 (6/19)
     intron_pos      196:0 (7/19)
     intron_pos      235:0 (8/19)
     intron_pos      266:1 (9/19)
     intron_pos      293:0 (10/19)
     intron_pos      317:1 (11/19)
     intron_pos      332:0 (12/19)
     intron_pos      354:2 (13/19)
     intron_pos      382:1 (14/19)
     intron_pos      435:0 (15/19)
     intron_pos      809:1 (16/19)
     intron_pos      904:0 (17/19)
     intron_pos      975:0 (18/19)
     intron_pos      1027:1 (19/19)
BEGIN
        1 MESILARALE YTLKYWLKSF TRDQFKLQGR TAQLSNLDIN GEAIHASMGL PPALSVTTAK
       61 VGKLEIMLPY VSNVQTEPIV VQIDKLDLVL EENPDADVTK GPSSSQSPTA SAKSNGYGFA
      121 DKIADGMTLQ VKVVNLLLET GGGANREGGA AWAAPLASIT IRNLVLYTTN ESWKVVNLKE
      181 ARDFSTNTGF IYLFKKLEWE ALSIDLLPHP DMFTEANLAR SEEANLRDED GAKRITVQRT
      241 ALNSPLGLEV QLHIPEAVCP ALSEPGLRAL LRFLTGMYLC LNRGDVDPKS QQSAEAAGRS
      301 LVSVLVDHVF LCIKDAEFQL ELLMQSLLFS RACVSDGESA NYLTKILIGG LFLRDAFSRS
      361 PCALIQPSMK AAAEDLAIPD FAKNFCPLIY PLDSGPWQIV QDVPLISLHS LQVKPSPKPP
      421 HFFSKTVIQC QPLMVHLQEE ACLRISSFLA DGIVVNPGDV LPDNSVNSLL FTLKELDVSV
      481 PLDMSNLQDS AIEEDLSVKK SFVGARLHIE NLSFAESPTL KVRLLNLEKD PACFCLWPGQ
      541 PIDASQKKWT AGASHFSLAL ETSPNSTQLQ SPRGPEMGLW NCVEGKDVSI EVAMVSADGK
      601 PLITIPPPGG IVRIGVACEQ YISRASVEQL FFVLDLYSYF GKVSEKISIV KESKRQNTVS
      661 LTGGLLEKVP SDTAVKLALK DLQLKFLESS FTSTQDMPLV QFLGKDLSVK VTHRTLGGAI
      721 AVSSNIYWEN IEVDCVDTDV EHEHENSWNG HLVSCNGSTP LRRVFWVVNG RHDEHSGSTL
      781 TPFLDISITH VIPLSEKDME CHSVSIVAYG TPGNWNGDGF PHLGRPDDID VSVELRDWLF
      841 ALEGREGVGT RILNNEDIGR EERCWHTNFR TFRVIAKSTP KNVDSNGTEN QCDAHKYPVD
      901 SIIVSVEGLQ TVKPQMQKGT DSCNGLSTNG VHENGQMHGG VNIEANIVAS EDKSVHDDLL
      961 NWVAESLKFS VKQPVEAVVT KDELQHLTFL CKSEIDAMGR IVAGVLRVLK LEESIGQATL
     1021 NQLSNLGSEG FDKMFSPKAS RAGSPKSSPF AASLDSMREI SLRANLESTI SSIEEASMEL
     1081 EAKCSALVSD LNDSESSAKH ANELKQKLES LQSLMAKLRT QI
//