LOCUS       BC006545                1891 bp    mRNA    linear   HUM 08-OCT-2003
DEFINITION  Homo sapiens forkhead box A2, mRNA (cDNA clone IMAGE:2821244),
            partial cds.
ACCESSION   BC006545
VERSION     BC006545.2
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 1891)
  AUTHORS   Strausberg,R.L., Feingold,E.A., Grouse,L.H., Derge,J.G.,
            Klausner,R.D., Collins,F.S., Wagner,L., Shenmen,C.M., Schuler,G.D.,
            Altschul,S.F., Zeeberg,B., Buetow,K.H., Schaefer,C.F., Bhat,N.K.,
            Hopkins,R.F., Jordan,H., Moore,T., Max,S.I., Wang,J., Hsieh,F.,
            Diatchenko,L., Marusina,K., Farmer,A.A., Rubin,G.M., Hong,L.,
            Stapleton,M., Soares,M.B., Bonaldo,M.F., Casavant,T.L.,
            Scheetz,T.E., Brownstein,M.J., Usdin,T.B., Toshiyuki,S.,
            Carninci,P., Prange,C., Raha,S.S., Loquellano,N.A., Peters,G.J.,
            Abramson,R.D., Mullahy,S.J., Bosak,S.A., McEwan,P.J.,
            McKernan,K.J., Malek,J.A., Gunaratne,P.H., Richards,S.,
            Worley,K.C., Hale,S., Garcia,A.M., Gay,L.J., Hulyk,S.W.,
            Villalon,D.K., Muzny,D.M., Sodergren,E.J., Lu,X., Gibbs,R.A.,
            Fahey,J., Helton,E., Ketteman,M., Madan,A., Rodrigues,S.,
            Sanchez,A., Whiting,M., Madan,A., Young,A.C., Shevchenko,Y.,
            Bouffard,G.G., Blakesley,R.W., Touchman,J.W., Green,E.D.,
            Dickson,M.C., Rodriguez,A.C., Grimwood,J., Schmutz,J., Myers,R.M.,
            Butterfield,Y.S., Krzywinski,M.I., Skalska,U., Smailus,D.E.,
            Schnerch,A., Schein,J.E., Jones,S.J. and Marra,M.A.
  TITLE     Generation and initial analysis of more than 15,000 full-length
            human and mouse cDNA sequences
  JOURNAL   Proc. Natl. Acad. Sci. U.S.A. 99 (26), 16899-16903 (2002)
   PUBMED   12477932
REFERENCE   2  (bases 1 to 1891)
  AUTHORS   Strausberg,R.
  TITLE     Direct Submission
  JOURNAL   Submitted (24-APR-2001) National Institutes of Health, Mammalian
            Gene Collection (MGC), Cancer Genomics Office, National Cancer
            Institute, 31 Center Drive, Room 11A03, Bethesda, MD 20892-2590,
            USA
  REMARK    NIH-MGC Project URL: http://mgc.nci.nih.gov
COMMENT     On Oct 8, 2003 this sequence version replaced BC006545.1.
            Contact: MGC help desk
            Email: cgapbs-r@mail.nih.gov
            Tissue Procurement: DCTD/DTP
            cDNA Library Preparation: Rubin Laboratory
            cDNA Library Arrayed by: The I.M.A.G.E. Consortium (LLNL)
            DNA Sequencing by: Institute for Systems Biology
            http://www.systemsbiology.org
            contact: amadan@systemsbiology.org
            Anup Madan, Jessica Fahey, Erin Helton, Mark Ketteman, Anuradha
            Madan, Stephanie Rodrigues, Amy Sanchez and Michelle Whiting
            
            Clone distribution: MGC clone distribution information can be found
            through the I.M.A.G.E. Consortium/LLNL at: http://image.llnl.gov
            Series: IRAL Plate: 2 Row: g Column: 19.
FEATURES             Location/Qualifiers
     source          1..1891
                     /db_xref="H-InvDB:HIT000086688"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /clone="IMAGE:2821244"
                     /tissue_type="Lung, small cell carcinoma"
                     /clone_lib="NIH_MGC_7"
                     /lab_host="DH10B-R"
                     /note="Vector: pOTB7"
     gene            <1..1891
                     /gene="FOXA2"
                     /gene_synonym="HNF3B"
                     /gene_synonym="MGC19807"
                     /gene_synonym="TCF3B"
                     /db_xref="GeneID:3170"
                     /db_xref="MIM:600288"
     CDS             <1..1370
                     /gene="FOXA2"
                     /gene_synonym="HNF3B"
                     /gene_synonym="MGC19807"
                     /gene_synonym="TCF3B"
                     /codon_start=3
                     /product="FOXA2 protein"
                     /protein_id="AAH06545.2"
                     /db_xref="GeneID:3170"
                     /db_xref="MIM:600288"
                     /translation="GAVKMEGHEPSDWSSYYAEPEGYSSVSNMNAGLGMNGMNTYMSM
                     SAAAMGSGSGNMSAGSMNMSSYVGAGMSPSLAGMSPGAGAMAGMGGSAGAAGVAGMGP
                     HLSPSLSPLGGQAAGAMGGLAPYANMNSMSPMYGQAGLSRARDPKTYRRSYTHAKPPY
                     SYISLITMAIQQSPNKMLTLSEIYQWIMDLFPFYRQNQQRWQNSIRHSLSFNDCFLKV
                     PRSPDKPGKGSFWTLHPDSGNMFENGCYLRRQKRFKCEKQLALKEAAGAAGSGKKAAA
                     GAQASQAQLGEAAGPASETPAGTESPHSSASPCQEHKRGGLGELKGTPAAALSPPEPA
                     PSPGQQQQAAAHLLGPPHHPGLPPEAHLKPEHHYAFNHPFSINNLMSSEQQHHHSHHH
                     HQPHKMDLKAYEQVMHYPGYGSPMPGSLAMGPVTNKTGLDASPLAADTSYYQGVYSRP
                     IMNSS"
     misc_feature    471..758
                     /gene="FOXA2"
                     /gene_synonym="HNF3B"
                     /gene_synonym="MGC19807"
                     /gene_synonym="TCF3B"
                     /note="Fork_head; Region: Fork head domain"
                     /db_xref="CDD:pfam00250"
BASE COUNT          432 a          617 c          546 g          296 t
ORIGIN      
        1 tgggagcggt gaagatggaa gggcacgagc cgtccgactg gagcagctac tatgcagagc
       61 ccgagggcta ctcctccgtg agcaacatga acgccggcct ggggatgaac ggcatgaaca
      121 cgtacatgag catgtcggcg gccgccatgg gcagcggctc gggcaacatg agcgcgggct
      181 ccatgaacat gtcgtcgtac gtgggcgctg gcatgagccc gtccctggcg gggatgtccc
      241 ccggcgcggg cgccatggcg ggcatgggcg gctcggccgg ggcggctggc gtggcgggca
      301 tggggccgca cttgagtccc agcctgagcc cgctcggggg gcaggcggcc ggggccatgg
      361 gcggcctggc cccctacgcc aacatgaact ccatgagccc catgtacggg caggcgggcc
      421 tgagccgcgc ccgcgacccc aagacctaca ggcgcagcta cacgcacgca aagccgccct
      481 actcgtacat ctcgctcatc accatggcca tccagcagag ccccaacaag atgctgacgc
      541 tgagcgagat ctaccagtgg atcatggacc tcttcccctt ctaccggcag aaccagcagc
      601 gctggcagaa ctccatccgc cactcgctct ccttcaacga ctgtttcctg aaggtgcccc
      661 gctcgcccga caagcccggc aagggctcct tctggaccct gcaccctgac tcgggcaaca
      721 tgttcgagaa cggctgctac ctgcgccgcc agaagcgctt caagtgcgag aagcagctgg
      781 cgctgaagga ggccgcaggc gccgccggca gcggcaagaa ggcggccgcc ggggcccagg
      841 cctcacaggc tcaactcggg gaggccgccg ggccggcctc cgagactccg gcgggcaccg
      901 agtcgcctca ctcgagcgcc tccccgtgcc aggagcacaa gcgagggggc ctgggagagc
      961 tgaaggggac gccggctgcg gcgctgagcc ccccagagcc ggcgccctct cccgggcagc
     1021 agcagcaggc cgcggcccac ctgctgggcc cgccccacca cccgggcctg ccgcctgagg
     1081 cccacctgaa gccggaacac cactacgcct tcaaccaccc gttctccatc aacaacctca
     1141 tgtcctcgga gcagcagcac caccacagcc accaccacca ccagccccac aaaatggacc
     1201 tcaaggccta cgaacaggtg atgcactacc ccggctacgg ttcccccatg cctggcagct
     1261 tggccatggg cccggtcacg aacaaaacgg gcctggacgc ctcgcccctg gccgcagata
     1321 cctcctacta ccagggggtg tactcccggc ccattatgaa ctcctcttaa gaagacgacg
     1381 gcttcaggcc cggctaactc tggcaccccg gatcgaggat aagtgagaga gcaagtgggg
     1441 gtcgagactt tggggagacg gtgttgcaga gacgcaaggg agaagaaatc cataacaccc
     1501 ccaccccaac acccccaaga cagcagtctt ccttcacccg ctgcagctgt tccgtcccaa
     1561 acagagggcc acacagatac cccacgttct atataaggag gaaaacggga aagaatataa
     1621 agttaaaaaa aagcctccgg tttccactac tgtgtagact cctgcttctt caagcacctg
     1681 cagattctga tttttttgtt gttgttgttc tcctccattg ctgttgttgc agggaagtct
     1741 tacttaaaaa aaaaaaaaaa cttttgtgag tgactcggtg taaaaccatg tagttttaac
     1801 agaaccagag ggttgtacta ttgtttaaaa acaggaaaaa aaataatgta agggtctgtt
     1861 gtaaatgacc aagaaaaaaa aaaaaaaaaa a
//