LOCUS       AEC08620.1               838 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana DNA topoisomerase, type IA, core protein.
ACCESSION   CP002685-4429
PROTEIN_ID  AEC08620.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /locus_tag="AT2G32000"
                     /gene_synonym="F22D22.25"
                     /gene_synonym="F22D22_25"
                     /inference="Similar to RNA sequence,
                     EST:INSD:DR363694.1,INSD:BP821580.1,INSD:BP815012.1,
                     INSD:BX836041.1,INSD:EL983284.1,INSD:EL995232.1,
                     INSD:EH947278.1,INSD:EL990476.1,INSD:ES176397.1"
                     /inference="similar to RNA sequence,
                     mRNA:INSD:AK175789.1,INSD:AK175923.1"
                     /note="DNA topoisomerase, type IA, core; FUNCTIONS IN: DNA
                     topoisomerase activity, DNA topoisomerase type I activity,
                     DNA binding, nucleic acid binding; INVOLVED IN: DNA
                     topological change, DNA unwinding involved in replication,
                     DNA metabolic process; LOCATED IN: endomembrane system,
                     chromosome; EXPRESSED IN: 22 plant structures; EXPRESSED
                     DURING: 13 growth stages; CONTAINS InterPro DOMAIN/s:
                     Toprim domain, subgroup (InterPro:IPR006154), DNA
                     topoisomerase, type IA, central region, subdomain 1
                     (InterPro:IPR013824), DNA topoisomerase, type IA, core
                     (InterPro:IPR000380), Toprim domain (InterPro:IPR006171),
                     DNA topoisomerase, type IA, DNA-binding
                     (InterPro:IPR003602), DNA topoisomerase, type IA, domain 2
                     (InterPro:IPR003601), DNA topoisomerase, type IA, central
                     (InterPro:IPR013497), DNA topoisomerase, type IA, central
                     region, subdomain 3 (InterPro:IPR013826); BEST Arabidopsis
                     thaliana protein match is: topoisomerase 3alpha
                     (TAIR:AT5G63920.1); Has 35333 Blast hits to 34131 proteins
                     in 2444 species: Archae - 798; Bacteria - 22429; Metazoa -
                     974; Fungi - 991; Plants - 531; Viruses - 0; Other
                     Eukaryotes - 9610 (source: NCBI BLink)."
                     /db_xref="Araport:AT2G32000"
                     /db_xref="TAIR:AT2G32000"
     intron_pos      3:2 (1/13)
     intron_pos      38:1 (2/13)
     intron_pos      68:0 (3/13)
     intron_pos      101:1 (4/13)
     intron_pos      182:2 (5/13)
     intron_pos      237:0 (6/13)
     intron_pos      277:0 (7/13)
     intron_pos      303:2 (8/13)
     intron_pos      396:2 (9/13)
     intron_pos      453:0 (10/13)
     intron_pos      496:0 (11/13)
     intron_pos      567:0 (12/13)
     intron_pos      627:0 (13/13)
BEGIN
        1 MARCLQGEAV QRCMNLMACF EASKHIIELH LLSVMFSDFP EKYQNWATID PQDLFDAPII
       61 KKESNPKAHI CRHLSNEARG CSYMVLWLDC DREGENICFE VIESTGFDMK DSKRKVYRAR
      121 FSSVTEKDIS KAMDNLVEPN RDEALAVDAR QEIDLKVGVA FSRFQTSYFQ GKYQNLDCRV
      181 ISYGPCQTPT LGFCVQRYMH INTFKPEKFW ALRPYIRKDG YELQLEWERR RLFDLEAATV
      241 FQKLVVEGRT AKVMDVSEKQ EVKGRPAGLN TVNLLKVASS ALGFGPQTAM HLAERLYTQG
      301 FISYPRTEST AYPSSFDFTD TLRAQVSNPV WGGYVQRLLS DGFHMPKSGT DAGDHPPITP
      361 MRAATEVMVG GDAWRLYQYV CQHFLGTVSP NCKYIRTKVE LSIGGETFHC TGQRVTEKGF
      421 TAIMPWSAVD EKKLPSFLKG ERIEVLRVEL YEGNTAPPDY LTESELISLM EKHGIGTDAS
      481 IAVHINNIGE RNYVQVQSGR KMVPTALGIT LIRGYQCIDP DLCLPDIRSF IEQQITLVAK
      541 GQADHSHVVQ HVIQQFRRKF SYFVQQIEHM DALFEAQFSP LADSGRALSK CGKCLRYMKH
      601 ITAVPPRLFC GTCEEVYYLP QKGTVKLYKE LTCPLDNFEL VIYSVPGPEG KSFPLCPYCY
      661 NSPPFEGIDT LFGASKTPNA PAKTKTGAGM PCSLCPHPTC QHSVRNQGVC ACPECEGTLV
      721 LDPVSFPKWK LNCNLCSCIV LLPEGAHRIT TTSNRCPECD SAIIEIDFNK KTTPLENGAT
      781 LHQGCVLCDE LLLSLVEVKH GRSFVRRGGR GRGRGRGRGR GGRRGSKSVD PKMSFRDF
//