LOCUS       AEE79861.1              1029 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana ARM repeat superfamily protein protein.
ACCESSION   CP002686-8601
PROTEIN_ID  AEE79861.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 23459830)
  AUTHORS   Salanoubat,M., Lemcke,K., Rieger,M., Ansorge,W., Unseld,M.,
            Fartmann,B., Valle,G., Blocker,H., Perez-Alonso,M., Obermaier,B.,
            Delseny,M., Boutry,M., Grivell,L.A., Mache,R., Puigdomenech,P., De
            Simone,V., Choisne,N., Artiguenave,F., Robert,C., Brottier,P.,
            Wincker,P., Cattolico,L., Weissenbach,J., Saurin,W., Quetier,F.,
            Schafer,M., Muller-Auer,S., Gabel,C., Fuchs,M., Benes,V.,
            Wurmbach,E., Drzonek,H., Erfle,H., Jordan,N., Bangert,S.,
            Wiedelmann,R., Kranz,H., Voss,H., Holland,R., Brandt,P.,
            Nyakatura,G., Vezzi,A., D'Angelo,M., Pallavicini,A., Toppo,S.,
            Simionati,B., Conrad,A., Hornischer,K., Kauer,G., Lohnert,T.H.,
            Nordsiek,G., Reichelt,J., Scharfe,M., Schon,O., Bargues,M.,
            Terol,J., Climent,J., Navarro,P., Collado,C., Perez-Perez,A.,
            Ottenwalder,B., Duchemin,D., Cooke,R., Laudie,M., Berger-Llauro,C.,
            Purnelle,B., Masuy,D., de Haan,M., Maarse,A.C., Alcaraz,J.P.,
            Cottet,A., Casacuberta,E., Monfort,A., Argiriou,A., flores,M.,
            Liguori,R., Vitale,D., Mannhaupt,G., Haase,D., Schoof,H., Rudd,S.,
            Zaccaria,P., Mewes,H.W., Mayer,K.F., Kaul,S., Town,C.D., Koo,H.L.,
            Tallon,L.J., Jenkins,J., Rooney,T., Rizzo,M., Walts,A.,
            Utterback,T., Fujii,C.Y., Shea,T.P., Creasy,T.H., Haas,B.,
            Maiti,R., Wu,D., Peterson,J., Van Aken,S., Pai,G., Militscher,J.,
            Sellers,P., Gill,J.E., Feldblyum,T.V., Preuss,D., Lin,X.,
            Nierman,W.C., Salzberg,S.L., White,O., Venter,J.C., Fraser,C.M.,
            Kaneko,T., Nakamura,Y., Sato,S., Kato,T., Asamizu,E., Sasamoto,S.,
            Kimura,T., Idesawa,K., Kawashima,K., Kishida,Y., Kiyokawa,C.,
            Kohara,M., Matsumoto,M., Matsuno,A., Muraki,A., Nakayama,S.,
            Nakazaki,N., Shinpo,S., Takeuchi,C., Wada,T., Watanabe,A.,
            Yamada,M., Yasuda,M. and Tabata,S.
  CONSRTM   European Union Chromosome 3 Arabidopsis Sequencing Consortium;
            Institute for Genomic Research; Kazusa DNA Research Institute
  TITLE     Sequence and analysis of chromosome 3 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 408 (6814), 820-822 (2000)
   PUBMED   11130713
REFERENCE   2  (bases 1 to 23459830)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 23459830)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="3"
                     /ecotype="Columbia"
     protein         /locus_tag="AT3G59020"
                     /inference="Similar to RNA sequence,
                     EST:INSD:AV791346.1,INSD:BP603766.1,INSD:CF652269.1,
                     INSD:BP614330.1,INSD:CF652270.1,INSD:BP607242.1,
                     INSD:EG508333.1,INSD:Z33990.1,INSD:EL206613.1,
                     INSD:EH923324.1,INSD:EL113418.1,INSD:AV828478.1,
                     INSD:EL105003.1,INSD:AV801533.1,INSD:BE523364.1,
                     INSD:EL157407.1,INSD:ES086219.1,INSD:EL173265.1,
                     INSD:BP612769.1,INSD:EL982664.1,INSD:AV530150.1,
                     INSD:EL243856.1,INSD:H76195.1,INSD:ES067417.1,
                     INSD:AV812836.1,INSD:BP783546.1,INSD:CB254333.1,
                     INSD:AV547530.1,INSD:AV812756.1,INSD:ES215788.1,
                     INSD:EL967941.1,INSD:ES051271.1,INSD:BP808036.1,
                     INSD:BP806451.1,INSD:EG508334.1,INSD:BP805394.1,
                     INSD:AV807817.1,INSD:EG510702.1,INSD:EL151983.1,
                     INSD:ES067392.1,INSD:ES132345.1,INSD:BP808879.1,
                     INSD:AV554894.1,INSD:BP609786.1,INSD:EL198533.1,
                     INSD:EG510701.1,INSD:EH959512.1,INSD:EH815699.1"
                     /inference="Similar to RNA sequence, mRNA:INSD:AY056143.2"
                     /note="ARM repeat superfamily protein; FUNCTIONS IN:
                     protein transporter activity, importin-alpha export
                     receptor activity, binding; INVOLVED IN: intracellular
                     protein transport, cell proliferation, protein import into
                     nucleus, docking; LOCATED IN: nucleus, nuclear pore,
                     cytoplasm; EXPRESSED IN: 24 plant structures; EXPRESSED
                     DURING: 13 growth stages; CONTAINS InterPro DOMAIN/s:
                     Importin-beta, N-terminal (InterPro:IPR001494), CAS/CSE,
                     C-terminal (InterPro:IPR005043), Armadillo-like helical
                     (InterPro:IPR011989), Armadillo-type fold
                     (InterPro:IPR016024), Exportin/Importin, Cse1-like
                     (InterPro:IPR013713); BEST Arabidopsis thaliana protein
                     match is: ARM repeat superfamily protein
                     (TAIR:AT2G31660.1); Has 8110 Blast hits to 5178 proteins
                     in 456 species: Archae - 41; Bacteria - 603; Metazoa -
                     2454; Fungi - 1580; Plants - 679; Viruses - 179; Other
                     Eukaryotes - 2574 (source: NCBI BLink)."
                     /db_xref="TAIR:AT3G59020"
                     /db_xref="Araport:AT3G59020"
     intron_pos      32:0 (1/21)
     intron_pos      76:1 (2/21)
     intron_pos      105:2 (3/21)
     intron_pos      155:2 (4/21)
     intron_pos      210:0 (5/21)
     intron_pos      271:2 (6/21)
     intron_pos      329:2 (7/21)
     intron_pos      378:1 (8/21)
     intron_pos      419:2 (9/21)
     intron_pos      480:0 (10/21)
     intron_pos      533:1 (11/21)
     intron_pos      547:1 (12/21)
     intron_pos      587:0 (13/21)
     intron_pos      653:1 (14/21)
     intron_pos      697:1 (15/21)
     intron_pos      732:0 (16/21)
     intron_pos      792:0 (17/21)
     intron_pos      838:2 (18/21)
     intron_pos      885:1 (19/21)
     intron_pos      934:0 (20/21)
     intron_pos      976:1 (21/21)
BEGIN
        1 MDLPSLALIV GAAAFSPNPD ERRAAEQSLN QLQHTPQHLI RILQIIVDGG SDLSVRQSAS
       61 IHFKNFIAKH WEPHSGDQNI ILPSDKNVVR NQILVFVSQV PPILRVQMGE CLKTIIYADY
      121 PEQWPELLDW VKQNLQKPQV YGALFVLRIL SSKYEFKSDE DRAPIHRVVE ETFPHLLNIF
      181 NNLVHVENPS LEVADHIKLI CKIFWSCIYL ELPRPLFDPN FFNAWMGLFL NILERPVPVE
      241 GQPEDPELRK SWGWWKAKKW IAHILNRLYT RFGDLKLQNP DNKAFAQMFQ INYAAKILEC
      301 HLKLLNAIRI GGYLPDRVIN LILQYLSNSI SKSSMYNLLQ PHLNTLLFEI VFPLMCFNDN
      361 DQMLWDEDPH EYVRKGYDII EDLYSPRTAS MDFVTELVRK RGKENFPKFI QFVVDIFKRY
      421 NEASLENKPY RLKDGALLAV GTLCDKLRQT EPYKSELENM LVQHVFPEFS SPAGHLRAKA
      481 AWVAGQYANI DFSDQSNFSK ALHCVISGMC DLELPVRVDS VFALRSFIEA CKDLDEIRPV
      541 LPQLLDEFFK LMKEVENEDL AFTLETIVYK FGEEISPYAL GLCQNLASAF WRCIDTDNGD
      601 DETDDAGALA AVGCLRAIST ILESISSLPH LYGQIEPQLL PIMRKMLTTD GQDVFEEVLE
      661 IVSYITTFSP TISLEMWSLW PLMMEALVDW AIDFFPNILV PLHNYISRGT GHYLTCKEPD
      721 YQQNLWNVIS VLMANKNIDD SDLEPAPKLL GIVLQTCKGQ VDQWVEPYLR ITLDRLRGAE
      781 KSSFKCLLVE VVANAFYYNT PLALGILQRF GIATEIFTLW FQMLQEKKKS GARSNFKREH
      841 DKKVCILGLT SLFSLPAGQL PGEVLPHVFR ALLELLVAYK DQLAAAKAEE EEEDEDGDDD
      901 DMDEFQTDDE DEDGDDENPD ETDGSTLRKL AAQAKDFRSY SDDDDFSDDD FSDDEELESP
      961 IDEVDPFVLF MDAVTAMQVS DSPRFQSLTQ TLDPHYHGLA STIAQHTELR RAEILKEKLE
     1021 KQSSATVAS
//