LOCUS       BC001138                1440 bp    mRNA    linear   HUM 30-SEP-2003
DEFINITION  Homo sapiens hexosaminidase A (alpha polypeptide), mRNA (cDNA clone
            IMAGE:2989846), partial cds.
ACCESSION   BC001138
VERSION     BC001138.2
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 1440)
  AUTHORS   Strausberg,R.L., Feingold,E.A., Grouse,L.H., Derge,J.G.,
            Klausner,R.D., Collins,F.S., Wagner,L., Shenmen,C.M., Schuler,G.D.,
            Altschul,S.F., Zeeberg,B., Buetow,K.H., Schaefer,C.F., Bhat,N.K.,
            Hopkins,R.F., Jordan,H., Moore,T., Max,S.I., Wang,J., Hsieh,F.,
            Diatchenko,L., Marusina,K., Farmer,A.A., Rubin,G.M., Hong,L.,
            Stapleton,M., Soares,M.B., Bonaldo,M.F., Casavant,T.L.,
            Scheetz,T.E., Brownstein,M.J., Usdin,T.B., Toshiyuki,S.,
            Carninci,P., Prange,C., Raha,S.S., Loquellano,N.A., Peters,G.J.,
            Abramson,R.D., Mullahy,S.J., Bosak,S.A., McEwan,P.J.,
            McKernan,K.J., Malek,J.A., Gunaratne,P.H., Richards,S.,
            Worley,K.C., Hale,S., Garcia,A.M., Gay,L.J., Hulyk,S.W.,
            Villalon,D.K., Muzny,D.M., Sodergren,E.J., Lu,X., Gibbs,R.A.,
            Fahey,J., Helton,E., Ketteman,M., Madan,A., Rodrigues,S.,
            Sanchez,A., Whiting,M., Madan,A., Young,A.C., Shevchenko,Y.,
            Bouffard,G.G., Blakesley,R.W., Touchman,J.W., Green,E.D.,
            Dickson,M.C., Rodriguez,A.C., Grimwood,J., Schmutz,J., Myers,R.M.,
            Butterfield,Y.S., Krzywinski,M.I., Skalska,U., Smailus,D.E.,
            Schnerch,A., Schein,J.E., Jones,S.J. and Marra,M.A.
  TITLE     Generation and initial analysis of more than 15,000 full-length
            human and mouse cDNA sequences
  JOURNAL   Proc. Natl. Acad. Sci. U.S.A. 99 (26), 16899-16903 (2002)
   PUBMED   12477932
REFERENCE   2  (bases 1 to 1440)
  AUTHORS   Strausberg,R.
  TITLE     Direct Submission
  JOURNAL   Submitted (11-DEC-2000) National Institutes of Health, Mammalian
            Gene Collection (MGC), Cancer Genomics Office, National Cancer
            Institute, 31 Center Drive, Room 11A03, Bethesda, MD 20892-2590,
            USA
  REMARK    NIH-MGC Project URL: http://mgc.nci.nih.gov
COMMENT     On Aug 19, 2003 this sequence version replaced BC001138.1.
            Contact: MGC help desk
            Email: cgapbs-r@mail.nih.gov
            Tissue Procurement: DCTD/DTP
            cDNA Library Preparation: Rubin Laboratory
            cDNA Library Arrayed by: The I.M.A.G.E. Consortium (LLNL)
            DNA Sequencing by: Institute for Systems Biology
            http://www.systemsbiology.org
            contact: amadan@systemsbiology.org
            Anup Madan, Jessica Fahey, Erin Helton, Mark Ketteman, Anuradha
            Madan, Stephanie Rodrigues, Amy Sanchez and Michelle Whiting
            
            Clone distribution: MGC clone distribution information can be found
            through the I.M.A.G.E. Consortium/LLNL at: http://image.llnl.gov
            Series: IRAL Plate: 3 Row: k Column: 16.
FEATURES             Location/Qualifiers
     source          1..1440
                     /db_xref="H-InvDB:HIT000085962"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /clone="IMAGE:2989846"
                     /tissue_type="Ovary, adenocarcinoma"
                     /clone_lib="NIH_MGC_9"
                     /lab_host="DH10B-R"
                     /note="Vector: pOTB7"
     gene            <1..1440
                     /gene="HEXA"
                     /gene_synonym="TSD"
                     /db_xref="GeneID:3073"
                     /db_xref="MIM:606869"
     CDS             <1..1231
                     /gene="HEXA"
                     /gene_synonym="TSD"
                     /codon_start=2
                     /product="HEXA protein"
                     /protein_id="AAH01138.2"
                     /db_xref="GeneID:3073"
                     /db_xref="MIM:606869"
                     /translation="NDDQCLLLSETVWGALRGLETFSQLVWKSAEGTFFINKTEIEDF
                     PRFPHRGLLLDTSRHYLPLSSILDTLDVMAYNKLNVFHWHLVDDPSFPYESFTFPELM
                     RKGSYNPVTHIYTAQDVKEVIEYARLRGIRVLAEFDTPGHTLSWGPGIPGLLTPCYSG
                     SEPSGTFGPVNPSLNNTYEFMSTFFLEVSSVFPDFYLHLGGDEVDFTCWKSNPEIQDF
                     MRKKGFGEDFKQLESFYIQTLLDIVSSYGKGYVVWQEVFDNKVKIQPDTIIQVWREDI
                     PVNYMKELELVTKAGFRALLSAPWYLNRISYGPDWKDFYVVEPLAFEGTPEQKALVIG
                     GEACMWGEYVDNTNLVPRLWPRAGAVAERLWSNKLTSDLTFAYERLSHFRCELLRRGV
                     QAQPLNVGFCEQEFEQT"
     misc_feature    140..1105
                     /gene="HEXA"
                     /gene_synonym="TSD"
                     /note="Glyco_hydro_20; Region: Glycosyl hydrolase family
                     20, catalytic domain. This domain has a TIM barrel fold"
                     /db_xref="CDD:pfam00728"
BASE COUNT          334 a          355 c          383 g          368 t
ORIGIN      
        1 aaatgatgac cagtgtttac tcctctctga gactgtctgg ggagctctcc gaggtctgga
       61 gacttttagc cagcttgttt ggaaatctgc tgagggcaca ttctttatca acaagactga
      121 gattgaggac tttccccgct ttcctcaccg gggcttgctg ttggatacat ctcgccatta
      181 cctgccactc tctagcatcc tggacactct ggatgtcatg gcgtacaata aattgaacgt
      241 gttccactgg catctggtag atgatccttc cttcccatat gagagcttca cttttccaga
      301 gctcatgaga aaggggtcct acaaccctgt cacccacatc tacacagcac aggatgtgaa
      361 ggaggtcatt gaatacgcac ggctccgggg tatccgtgtg cttgcagagt ttgacactcc
      421 tggccacact ttgtcctggg gaccaggtat ccctggatta ctgactcctt gctactctgg
      481 gtctgagccc tctggcacct ttggaccagt gaatcccagt ctcaataata cctatgagtt
      541 catgagcaca ttcttcttag aagtcagctc tgtcttccca gatttttatc ttcatcttgg
      601 aggagatgag gttgatttca cctgctggaa gtccaaccca gagatccagg actttatgag
      661 gaagaaaggc ttcggtgagg acttcaagca gctggagtcc ttctacatcc agacgctgct
      721 ggacatcgtc tcttcttatg gcaagggcta tgtggtgtgg caggaggtgt ttgataataa
      781 agtaaagatt cagccagaca caatcataca ggtgtggcga gaggatattc cagtgaacta
      841 tatgaaggag ctggaattgg tcaccaaggc cggcttccgg gcccttctct ctgccccctg
      901 gtacctgaac cgtatatcct atggccctga ctggaaggat ttctacgtag tggaacccct
      961 ggcatttgaa ggtacccctg agcagaaggc tctggtgatt ggtggagagg cttgtatgtg
     1021 gggagaatat gtggacaaca caaacctggt ccccaggctc tggcccagag caggggctgt
     1081 tgccgaaagg ctgtggagca acaagttgac atctgacctg acatttgcct atgaacgttt
     1141 gtcacacttc cgctgtgagt tgctgaggcg aggtgtccag gcccaacccc tcaatgtagg
     1201 cttctgtgag caggagtttg aacagacctg agccccaggc accgaggagg gtgctggctg
     1261 taggtgaatg gtagtggagc caggcttcca ctgcatcctg gccaggggac ggagcccctt
     1321 gccttcgtgc cccttgcctg cgtgcccctg tgcttggaga gaaaggggcc ggtgctggcg
     1381 ctcgcattca ataaagagta atgtggcatt tttctataat aaaaaaaaaa aaaaaaaaaa
//