LOCUS       AEC10098.1              2172 aa    PRT              PLN 23-MAR-2023
DEFINITION  Arabidopsis thaliana U5 small nuclear ribonucleoprotein
            helicase protein.
ACCESSION   CP002685-6441
PROTEIN_ID  AEC10098.1
SOURCE      Arabidopsis thaliana (thale cress)
  ORGANISM  Arabidopsis thaliana
            Eukaryota; Viridiplantae; Streptophyta; Embryophyta; Tracheophyta;
            Spermatophyta; Magnoliopsida; eudicotyledons; Gunneridae;
            Pentapetalae; rosids; malvids; Brassicales; Brassicaceae;
            Camelineae; Arabidopsis.
REFERENCE   1  (bases 1 to 19698289)
  AUTHORS   Lin,X., Kaul,S., Rounsley,S., Shea,T.P., Benito,M.I., Town,C.D.,
            Fujii,C.Y., Mason,T., Bowman,C.L., Barnstead,M., Feldblyum,T.V.,
            Buell,C.R., Ketchum,K.A., Lee,J., Ronning,C.M., Koo,H.L.,
            Moffat,K.S., Cronin,L.A., Shen,M., Pai,G., Van Aken,S., Umayam,L.,
            Tallon,L.J., Gill,J.E., Adams,M.D., Carrera,A.J., Creasy,T.H.,
            Goodman,H.M., Somerville,C.R., Copenhaver,G.P., Preuss,D.,
            Nierman,W.C., White,O., Eisen,J.A., Salzberg,S.L., Fraser,C.M. and
            Venter,J.C.
  TITLE     Sequence and analysis of chromosome 2 of the plant Arabidopsis
            thaliana
  JOURNAL   Nature 402 (6763), 761-768 (1999)
   PUBMED   10617197
REFERENCE   2  (bases 1 to 19698289)
  AUTHORS   Swarbreck,D., Lamesch,P., Wilks,C. and Huala,E.
  CONSRTM   TAIR
  TITLE     Direct Submission
  JOURNAL   Submitted (18-FEB-2011) Department of Plant Biology, Carnegie
            Institution, 260 Panama Street, Stanford, CA, USA
REFERENCE   3  (bases 1 to 19698289)
  AUTHORS   Krishnakumar,V., Cheng,C.-Y., Chan,A.P., Schobel,S., Kim,M.,
            Ferlanti,E.S., Belyaeva,I., Rosen,B.D., Micklem,G., Miller,J.R.,
            Vaughn,M. and Town,C.D.
  TITLE     Direct Submission
  JOURNAL   Submitted (17-MAY-2016) Plant Genomics, J. Craig Venter Institute,
            9704 Medical Center Dr, Rockville, MD 20850, USA
  REMARK    Protein update by submitter
FEATURES             Qualifiers
     source          /organism="Arabidopsis thaliana"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:3702"
                     /chromosome="2"
                     /ecotype="Columbia"
     protein         /locus_tag="AT2G42270"
                     /gene_synonym="T24P15.18"
                     /gene_synonym="T24P15_18"
                     /inference="Similar to RNA sequence,
                     EST:INSD:AV526074.1,INSD:AI996341.1,INSD:EG496367.1,
                     INSD:AV826262.1,INSD:EL198497.1,INSD:EG478781.1,
                     INSD:EG478782.1,INSD:EG493774.1,INSD:EG522812.1,
                     INSD:EG496368.1,INSD:ES107038.1,INSD:EG522823.1,
                     INSD:EG510772.1,INSD:EG477004.1,INSD:AV794199.1,
                     INSD:EG526949.1,INSD:EG522801.1,INSD:EG504719.1,
                     INSD:BE529039.1,INSD:EG496811.1,INSD:EG496580.1,
                     INSD:EG493719.1,INSD:EG496579.1,INSD:EL977521.1,
                     INSD:EG510773.1,INSD:EG487018.1,INSD:EG510010.1,
                     INSD:EG508331.1,INSD:AV557979.1,INSD:BP793744.1,
                     INSD:EG512994.1,INSD:EG508353.1,INSD:EG496846.1,
                     INSD:EG496366.1,INSD:AI996854.1,INSD:EG498042.1,
                     INSD:EG526950.1,INSD:EG512365.1,INSD:EG522420.1,
                     INSD:EG510012.1,INSD:AU228545.1"
                     /inference="similar to RNA sequence, mRNA:INSD:AY059740.1"
                     /note="U5 small nuclear ribonucleoprotein helicase;
                     FUNCTIONS IN: in 6 functions; EXPRESSED IN: 24 plant
                     structures; EXPRESSED DURING: 15 growth stages; CONTAINS
                     InterPro DOMAIN/s: ATPase, AAA+ type, core
                     (InterPro:IPR003593), DNA/RNA helicase, DEAD/DEAH box
                     type, N-terminal (InterPro:IPR011545), Sec63 domain
                     (InterPro:IPR004179), Sec63 domain, subgroup
                     (InterPro:IPR018127), DEAD-like helicase, N-terminal
                     (InterPro:IPR014001), DNA/RNA helicase, C-terminal
                     (InterPro:IPR001650), Helicase, superfamily 1/2,
                     ATP-binding domain (InterPro:IPR014021); BEST Arabidopsis
                     thaliana protein match is: U5 small nuclear
                     ribonucleoprotein helicase, putative (TAIR:AT1G20960.2);
                     Has 20124 Blast hits to 12378 proteins in 1898 species:
                     Archae - 1780; Bacteria - 8009; Metazoa - 2781; Fungi -
                     2333; Plants - 1088; Viruses - 52; Other Eukaryotes - 4081
                     (source: NCBI BLink)."
                     /db_xref="Araport:AT2G42270"
                     /db_xref="TAIR:AT2G42270"
BEGIN
        1 MTNLGGGGAE EQARLKQYGY KVNSSLVLNS DERRRDTHES SGEPESLRGR IDPKSFGDRV
       61 VRGRPHELDE RLNKSKKKKE RCDDLVSARE SKRVRLREVS VLNDTEDGVY QPKTKETRVA
      121 FEIMLGLIQQ QLGGQPLDIV CGAADEILAV LKNESVKNHE KKVEIEKLLN VITDQVFSQF
      181 VSIGKLITDY EEGGDSLSGK ASEDGGLDYD IGVALECEED DDESDLDMVQ DEKDEEDEDV
      241 VELNKTGVVQ VGVAINGEDA RQAKEDTSLN VLDIDAYWLQ RKISQEYEQK IDAQECQELA
      301 EELLKILAEG NDRDVEIKLL EHLQFEKFSL VKFLLQNRLK VVWCTRLARG RDQEERNQIE
      361 EEMLGLGSEL AAIVKELHAK RATAKEREEK REKDIKEEAQ HLMDDDSGVD GDRGMRDVDD
      421 LDLENGWLKG QRQVMDLESL AFNQGGFTRE NNKCELPDRS FRIRGKEFDE VHVPWVSKKF
      481 DSNEKLVKIS DLPEWAQPAF RGMQQLNRVQ SKVYGTALFK ADNILLCAPT GAGKTNVAVL
      541 TILHQLGLNM NPGGTFNHGN YKIVYVAPMK ALVAEVVDSL SQRLKDFGVT VKELSGDQSL
      601 TGQEIKETQI IVTTPEKWDI ITRKSGDRTY TQLVRLLIID EIHLLDDNRG PVLESIVART
      661 LRQIESTKEH IRLVGLSATL PNCDDVASFL RVDLKNGLFI FDRSYRPVPL GQQYIGINVK
      721 KPLRRFQLMN DICYQKVVAV AGKHQVLIFV HSRKETAKTA RAIRDTAMAN DTLSRFLKED
      781 SQSREILKCL AGLLKNNDLK ELLPYGFAIH HAGLTRTDRE IVENQFRWGN LQVLISTATL
      841 AWGVNLPAHT VIIKGTQVYN PERGEWMELS PLDVMQMIGR AGRPQYDQQG EGIIITGYSK
      901 LQYYLRLMNE QLPIESQFIS KLADQLNAEI VLGTIQNARE ACHWLGYTYL YVRMVRNPTL
      961 YGVSPDALAK DLLLEERRAD LIHSAATILD KNNLIKYDRK SGHFQVTDLG RIASYYYISH
     1021 GTIAAYNENL KPTMNDIELC RLFSLSEEFK YVTVRQDEKM ELAKLLDRVP IPVKETLEDP
     1081 SAKINVLLQV YISKLKLEGL SLTSDMVYIT QSAGRLLRAI FEIVLKRGWA QLSQKALNLS
     1141 KMVGKRMWSV QTPLWQFPGI PKEILMKLEK NDLVWERYYD LSSQELGELI CNPKMGRPLH
     1201 KYIHQFPKLK LAAHVQPISR SVLQVELTVT PDFHWDDKAN KYVEPFWIIV EDNDGEKILH
     1261 HEYFLFKKRV IDEDHTLNFT VPISEPIPPQ YFIRVVSDKW LDSPTVLPVS FRHLILPEKY
     1321 PPPTELLDLQ PLPVMALRNP SYETLYQDFK HFNPVQTQVF TVLYNTSDNV VVAAPTGSGK
     1381 TICAEFAILR NHLEGPDSAM RVVYIAPLEA IAKEQFRDWE KKFGKGLGLR VVELTGETLL
     1441 DLKLLEKGQI IISTPEKWDA LSRRWKQRKY IQQVSLFIVD ELHLIGGQGG QVLEVIVSRM
     1501 RYISSQVGNK IRIVALSTSL ANAKDLGEWI GASSCGVFNF PPNVRPVPLE IHIHGVDILS
     1561 FEARMQAMTK PTYTAIVQHA KNKKPAIVFV PTRKHVRLTA VDLIAYSHMD NMKSPDFLLG
     1621 NLEELEPFLI QICEETLKET LRHGIGYLHE GLSNLDQEIV TQLFEAGRIQ VCVMSSSLCW
     1681 GTPLKAHLVV VMGTHFYDGR ENSHSDYPIS NLLQMMGRGS RPLLDDAGKC VIFCHAPRKE
     1741 YYKKFLYEAL PVESHLQHFL HDNFNAEVVA RVIENKQDAV DYLTWSFMYR RLPQNPNYYN
     1801 LLGVSHRHLS DHLSELVENT LSDLEVSKCI EIDNELDLSP LNLGMIASYY YINYTTIERF
     1861 SSLLASKTKM KGLLEILTSA SEYDLIPIRP GEEDAVRRLI NHQRFSFQNP RCTDPRVKTS
     1921 ALLQAHFSRQ KISGNLVMDQ CEVLLSATRL LQAMVDVISS NGCLNLALLA MEVSQMVTQG
     1981 MWDRDSMLLQ LPHFTKDLAK RCHENPGNNI ETIFDLVEME DDKRQELLQM SDAQLLDIAR
     2041 FCNRFPNIDL TYEIVGSNEV SPGKDITLQV LLERDMEGRT EVGPVDAPRY PKTKEEGWWL
     2101 VVGEAKTNQL MAIKRISLQR KAQVKLEFAV PTETGEKSYT LYFMCDSYLG CDQEYSFTVD
     2161 VKDSDAADHM EE
//