LOCUS       AEC09571.1               212 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana Gag-Pol polyprotein/retrotransposon protein.
ACCESSION   CP002685-5695
PROTEIN_ID  AEC09571.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /locus_tag="AT2G38695"
                     /inference="Similar to RNA sequence,
                     EST:INSD:EG516425.1,INSD:EG427118.1,INSD:EG427122.1,
                     INSD:EG427120.1,INSD:ES091188.1,INSD:EG427123.1,
                     INSD:ES172511.1,INSD:EG427114.1,INSD:EH912939.1,
                     INSD:EG427115.1,INSD:EG427124.1,INSD:EG516424.1,
                     INSD:EG427117.1,INSD:EG426640.1,INSD:EG426644.1,
                     INSD:EL328977.1,INSD:EL247257.1"
                     /inference="similar to RNA sequence,
                     mRNA:INSD:AY773866.1,INSD:AY648329.1"
                     /note="unknown protein; Has 65 Blast hits to 65 proteins
                     in 18 species: Archae - 0; Bacteria - 0; Metazoa - 0;
                     Fungi - 0; Plants - 62; Viruses - 0; Other Eukaryotes - 3
                     (source: NCBI BLink)."
                     /db_xref="Araport:AT2G38695"
                     /db_xref="TAIR:AT2G38695"
     intron_pos      16:0 (1/8)
     intron_pos      56:0 (2/8)
     intron_pos      71:1 (3/8)
     intron_pos      89:2 (4/8)
     intron_pos      121:2 (5/8)
     intron_pos      139:2 (6/8)
     intron_pos      161:2 (7/8)
     intron_pos      188:0 (8/8)
BEGIN
        1 MSVAGVHRFS LPLPPKCSLR TFSVLANGKR TQSLLPHHFS VFNQSHRLVT SLSHNVSNKS
       61 DAEAERSCDE GEMLDKNRIS KKNPFVSEEL LKKLKRYGLS GILSYGLLNT VYYSTAFLLV
      121 WFYVAPAPGK MGYLAAAERF LKVMAMVWAG SQVTKLIRIG GAVALAPIVD RGLSWFTVKC
      181 NFESQGKAFG ALVGICLGMA LMLFIVVTLL WA
//