LOCUS       AEC07498.1               284 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana HNH endonuclease protein.
ACCESSION   CP002685-2854
PROTEIN_ID  AEC07498.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /locus_tag="AT2G23840"
                     /gene_synonym="T29E15.4"
                     /gene_synonym="T29E15_4"
                     /inference="Similar to RNA sequence,
                     EST:INSD:AV521815.1,INSD:EL092962.1,INSD:BU636214.1,
                     INSD:EH907904.1,INSD:EH962054.1,INSD:AV564010.1,
                     INSD:DR369103.1,INSD:EH976518.1,INSD:EL214834.1,
                     INSD:EH868566.1,INSD:AV535369.1"
                     /inference="similar to RNA sequence,
                     mRNA:INSD:BT010946.1,INSD:BT011660.1"
                     /note="HNH endonuclease; FUNCTIONS IN: endonuclease
                     activity, nucleic acid binding; INVOLVED IN:
                     biological_process unknown; LOCATED IN: cellular_component
                     unknown; EXPRESSED IN: 21 plant structures; EXPRESSED
                     DURING: 13 growth stages; CONTAINS InterPro DOMAIN/s: HNH
                     nuclease (InterPro:IPR003615), HNH endonuclease
                     (InterPro:IPR002711); Has 4176 Blast hits to 4176 proteins
                     in 656 species: Archae - 6; Bacteria - 1679; Metazoa - 0;
                     Fungi - 0; Plants - 37; Viruses - 29; Other Eukaryotes -
                     2425 (source: NCBI BLink)."
                     /db_xref="Araport:AT2G23840"
                     /db_xref="TAIR:AT2G23840"
     intron_pos      114:2 (1/6)
     intron_pos      133:0 (2/6)
     intron_pos      158:0 (3/6)
     intron_pos      188:2 (4/6)
     intron_pos      216:0 (5/6)
     intron_pos      244:0 (6/6)
BEGIN
        1 MAHFSARLKL LSSNDGLSFG VDSRDQFRQS LYMAGGGSPL VPIRMSRLKF CARIFSSYSF
       61 PYKRKKIRDL DNTEKNLDID EDNDEWDFDG DDDGLETDDH LSCFRGLVLD ISYRPVNVVC
      121 WKRAICLEYM DKADVLEYYD QTVSSPTGSF YIPAVLRVPH LLQVVKRRRV KNSLSRKNIL
      181 LRDDYTCQYC SSRENLTIDH VMPVSRGGEW TWQNLVAACS RCNSRKGQKT ADEAHMKLLK
      241 VPKEPKDYDI VAIPLTNAAI RMLRSNKGMP EEWRQYLAKP LSET
//