LOCUS       BC047790                2658 bp    mRNA    linear   HUM 22-APR-2003
DEFINITION  Homo sapiens GATA binding protein 5, mRNA (cDNA clone
            IMAGE:6464800), partial cds.
ACCESSION   BC047790
VERSION     BC047790.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 2658)
  AUTHORS   Strausberg,R.L., Feingold,E.A., Grouse,L.H., Derge,J.G.,
            Klausner,R.D., Collins,F.S., Wagner,L., Shenmen,C.M., Schuler,G.D.,
            Altschul,S.F., Zeeberg,B., Buetow,K.H., Schaefer,C.F., Bhat,N.K.,
            Hopkins,R.F., Jordan,H., Moore,T., Max,S.I., Wang,J., Hsieh,F.,
            Diatchenko,L., Marusina,K., Farmer,A.A., Rubin,G.M., Hong,L.,
            Stapleton,M., Soares,M.B., Bonaldo,M.F., Casavant,T.L.,
            Scheetz,T.E., Brownstein,M.J., Usdin,T.B., Toshiyuki,S.,
            Carninci,P., Prange,C., Raha,S.S., Loquellano,N.A., Peters,G.J.,
            Abramson,R.D., Mullahy,S.J., Bosak,S.A., McEwan,P.J.,
            McKernan,K.J., Malek,J.A., Gunaratne,P.H., Richards,S.,
            Worley,K.C., Hale,S., Garcia,A.M., Gay,L.J., Hulyk,S.W.,
            Villalon,D.K., Muzny,D.M., Sodergren,E.J., Lu,X., Gibbs,R.A.,
            Fahey,J., Helton,E., Ketteman,M., Madan,A., Rodrigues,S.,
            Sanchez,A., Whiting,M., Madan,A., Young,A.C., Shevchenko,Y.,
            Bouffard,G.G., Blakesley,R.W., Touchman,J.W., Green,E.D.,
            Dickson,M.C., Rodriguez,A.C., Grimwood,J., Schmutz,J., Myers,R.M.,
            Butterfield,Y.S., Krzywinski,M.I., Skalska,U., Smailus,D.E.,
            Schnerch,A., Schein,J.E., Jones,S.J. and Marra,M.A.
  TITLE     Generation and initial analysis of more than 15,000 full-length
            human and mouse cDNA sequences
  JOURNAL   Proc. Natl. Acad. Sci. U.S.A. 99 (26), 16899-16903 (2002)
   PUBMED   12477932
REFERENCE   2  (bases 1 to 2658)
  AUTHORS   Strausberg,R.
  TITLE     Direct Submission
  JOURNAL   Submitted (03-MAR-2003) National Institutes of Health, Mammalian
            Gene Collection (MGC), Cancer Genomics Office, National Cancer
            Institute, 31 Center Drive, Room 11A03, Bethesda, MD 20892-2590,
            USA
  REMARK    NIH-MGC Project URL: http://mgc.nci.nih.gov
COMMENT     Contact: MGC help desk
            Email: cgapbs-r@mail.nih.gov
            Tissue Procurement: ATCC
            cDNA Library Preparation: Life Technologies, Inc.
            cDNA Library Arrayed by: The I.M.A.G.E. Consortium (LLNL)
            DNA Sequencing by: Sequencing Group at the Stanford Human Genome
            Center, Stanford University School of Medicine, Stanford, CA  94305
            Web site:       http://www-shgc.stanford.edu
            Contact:  (Dickson, Mark) mcd@paxil.stanford.edu
            Dickson, M., Schmutz, J., Grimwood, J., Rodriquez, A., and Myers,
            R. M.
            
            Clone distribution: MGC clone distribution information can be found
            through the I.M.A.G.E. Consortium/LLNL at: http://image.llnl.gov
            Series: IRAK Plate: 98 Row: o Column: 16
            This clone was selected for full length sequencing because it
            passed the following selection criteria: Similarity but not
            identity to protein.
FEATURES             Location/Qualifiers
     source          1..2658
                     /db_xref="H-InvDB:HIT000098800"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /clone="IMAGE:6464800"
                     /tissue_type="Uterus, leiomyosarcoma"
                     /clone_lib="NIH_MGC_71"
                     /lab_host="DH10B"
                     /note="Vector: pCMV-SPORT6"
     gene            <1..2658
                     /gene="GATA5"
                     /gene_synonym="bB379O24.1"
                     /db_xref="GeneID:140628"
     CDS             <1..1256
                     /gene="GATA5"
                     /gene_synonym="bB379O24.1"
                     /codon_start=3
                     /product="GATA5 protein"
                     /protein_id="AAH47790.1"
                     /db_xref="GeneID:140628"
                     /translation="TATAVPCRPPCPLVKTTPGRMYQSLALAASPRQAAYADSGSFLH
                     APGAGSPMFVPPARVPSMLSYLSGCEPSPQPPELAARPGWAQTATADSSAFGPGSPHP
                     PAAHPPGATTFPFAHSPSGPGSGGSAGGRDGSAYQGALLPREQFAAPLGRPVGTSYSA
                     TYPAYVSPDVAQSWTAGPFDGSVLHGLPGRRPTFVSDFLEEFPGEGRECVNCGALSTP
                     LWRRDGTGHYLCNACGLYHKMNGVNRPLVRPQKRLSSSRRAGLCCTNCHTTNTTLWRR
                     NSEGEPVCNACGLYMKLHGVPRPLAMKKESIQTRKRKPKTIAKARGSSGSTRNASASP
                     SAVASTDSSAATSKAKPSLASPVCPGPSMAPQASGQEDDSLAPGHLEFKFEPEDFAFP
                     STAPSPQAGLRGALRQEAWCALALA"
BASE COUNT          532 a          885 c          782 g          459 t
ORIGIN      
        1 ccaccgccac cgccgtgccc tgccgccctc cctgcccgct ggtcaagacc acgcctggga
       61 ggatgtacca gagcctggcg ctggccgcga gcccccgcca ggccgcctac gccgactcgg
      121 gctccttcct gcacgctccg ggcgccggct ctccgatgtt tgtgccgccg gcgcgcgtcc
      181 cctcgatgct gtcctacctg tccgggtgtg agccgagccc gcagcccccc gagctcgctg
      241 cgcgccccgg ctgggcgcag acagccaccg cggattcgtc ggccttcggc ccgggcagtc
      301 cgcacccccc agccgcgcac ccgcccgggg ccaccacctt ccctttcgcg cacagcccct
      361 cggggcccgg cagcggcggc agcgcggggg gccgagacgg cagtgcctac cagggcgcgc
      421 tgttgcctcg agaacagttc gcggccccgc ttgggcggcc ggtggggacc tcgtactccg
      481 ccacctaccc ggcctacgtg agccccgacg tggcccagtc ctggactgcc gggcccttcg
      541 atggcagcgt cctgcacggc ctcccaggcc gcaggcccac cttcgtgtcc gacttcttgg
      601 aggagttccc gggtgagggt cgtgagtgtg tcaactgcgg ggccctgtcc acaccgctgt
      661 ggcgccgaga tggcaccggc cactacctgt gcaatgcctg cggcctctac cacaagatga
      721 atggcgtcaa ccggccgctc gttcggcctc agaagcgcct gtcctcgtcc cgccgcgccg
      781 gcctctgctg caccaactgc cacacgacca acaccacgct gtggcggcgg aactcggagg
      841 gggagcccgt gtgcaatgcc tgcggcctct acatgaagct gcacggggtg ccgcggcctc
      901 tggctatgaa gaaagaaagc atccagacac ggaagcggaa gccaaagacc atcgccaagg
      961 ccaggggctc ctcaggatcc acaaggaatg cctcggcctc cccatctgct gtcgccagca
     1021 ctgacagctc agcagccact tccaaagcca agcccagcct ggcgtcccca gtgtgccctg
     1081 ggcccagcat ggccccccag gcctctggcc aggaggatga ctctcttgcc cccggccact
     1141 tggagttcaa gttcgagcct gaggactttg ccttcccctc cacggccccg agcccccagg
     1201 ctggcctcag gggggctctg cgccaagagg cctggtgtgc gctggccttg gcctaggtcc
     1261 ccaggccagc ccatgtcagg ggaacagcct ggaacagacc acccactgag tcacctccgt
     1321 gcctgctttg ctccagcaca gcagagacca gcaggccccc caacccagag actgggtctg
     1381 ctggagtctc cacacagtgg tggggaggcc ttctggacag acggcagtcg ggccccagag
     1441 caagaaggct ggtgagggaa gggctcagct tcccacccca cgtacagcaa gggactcccc
     1501 aggtgcggcc caaggctccg gaccacactg gccccctgcg gcggaggcca acgcagggca
     1561 ccaccaccac caacttgaat tccgtcatca atgctcaccg tcaatatgtt tacaagttgt
     1621 agcagttggg ggaaaacagt caacctccca gtgtaaaacc aagattccca gtgaagcacc
     1681 tgaggccaag caggggagag gaatgagggg agcagctgga catgggcctc ctgaggcctc
     1741 ggggctgtcc ttcattgccc acatggatag acggagctgt ggtgcagaga acttttcccg
     1801 caacaggtgc aggactgcca gggatcggag tgcgggccgc gcacggtgcc aggattccgc
     1861 cgaggggaag ccgctcacat tgcagtcatc acagacttac gcacttgttt ggacagtttt
     1921 tccagagggg atgggaaagg gccttgttct agctgaatct gtgtatcatg accatttctg
     1981 acaggcagaa tgaattgtct ggtagccctg tcctgaccca tccaagcgct gttggggctg
     2041 gtggtgacgt ggtcacatgt cctggcatat ctggggccac gcagtttagt ctcttgtccc
     2101 aggagaattg ttagtgaccc ctctttctct tgcaagcccc ctccacactg ggttggatga
     2161 taccttaatg agtgacgctg gcgagaggca ccctacccga cgcagctgtg aatggccggt
     2221 gatgtatgtc aggaggccac agggagcgga ggagcggggc aggcagccac agggagcgga
     2281 ggagcggggc aggcagccac agggccctgc ggggagcaca tcctcgcctc cgtccggctg
     2341 ctgcccttca acaacaagcc ctgatttttc cagcaatgcc agaaacctgg attttaagtc
     2401 ttccaatttg attcaaaaat atttttaaca ttgtgagcca gctagacccc cagtgcacca
     2461 ccccatattg aaaaacagtt gtctggcatc agcttcagga gcggtccggt cattctgaaa
     2521 ctgtccctcc agaggttctt ccagccccac ttctatgcga tgtcatcttt tctaaaagag
     2581 acaaatgaag ccacagggaa agtgaaataa agccttgaac ctcaaaaaaa aaaaaaaaaa
     2641 aaaaaaaaaa aaaaaaaa
//