LOCUS       X05344                  1988 bp    mRNA    linear   HUM 07-OCT-2008
DEFINITION  Human mRNA for cathepsin D from oestrogen responsive breast cancer
            cells.
ACCESSION   X05344
VERSION     X05344.1
KEYWORDS    cathepsin D.
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 1988)
  AUTHORS   Westley B.R., May F.E.B.
  TITLE     Oestrogen regulates cathepsin D mRNA levels in oestrogen responsive
            human breast cancer cells
  JOURNAL   Nucleic Acids Res. 15(9), 3773-3786(1987).
   PUBMED   3588310
COMMENT     Data kindly reviewed (8.1.88 ) by Westley
FEATURES             Location/Qualifiers
     source          1..1988
                     /db_xref="H-InvDB:HIT000321128"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /cell_line="ZR-75"
                     /db_xref="taxon:9606"
     prim_transcript <1..1988
     CDS             3..1241
                     /product="cathepsin D"
                     /db_xref="GOA:P07339"
                     /db_xref="H-InvDB:HIT000321128.12"
                     /db_xref="HGNC:HGNC:2529"
                     /db_xref="InterPro:IPR001461"
                     /db_xref="InterPro:IPR001969"
                     /db_xref="InterPro:IPR012848"
                     /db_xref="InterPro:IPR021109"
                     /db_xref="InterPro:IPR033121"
                     /db_xref="InterPro:IPR033144"
                     /db_xref="PDB:1LYA"
                     /db_xref="PDB:1LYB"
                     /db_xref="PDB:1LYW"
                     /db_xref="PDB:4OBZ"
                     /db_xref="PDB:4OC6"
                     /db_xref="PDB:4OD9"
                     /db_xref="UniProtKB/Swiss-Prot:P07339"
                     /protein_id="CAA28955.1"
                     /translation="MQPSSLLPLALCLLAAPASALVRIPLHKFTSIRRTMSEVGGSVE
                     DLIAKGPVSKYSQAVPAVTEGPIPEVLKNYMDAQYYGEIGIGTPPQCFTVVFDTGSSN
                     LWVPSIHCKLLDIACWIHHKYNSDKSSTYVKNGTSFDIHYGSGSLSGYLSQDTVSVPC
                     QSASSASALGGVKVERQVFGEATKQPGITFIAAKFDGILGMAYPRISVNNVLPVFDNL
                     MQQKLVDQNIFSFYLSRDPDAQPGGELMLGGTDSKYYKGSLSYLNVTRKAYWQVHLDQ
                     VEVASGLTLCKEGCEAIVDTGTSLMVGPVDEVRELQKAIGAVPLIQGEYMIPCEKVST
                     LPAITLKLGGKGYKLSPEDYTLKVSQAGKTLCLSGFMGMDIPPPSGPLWILGDVFIGR
                     YYTVFDRDNNRVGFAEAARL"
     sig_peptide     3..62
     misc_feature    63..194
                     /note="propeptide (AA 1-44)"
     mat_peptide     195..1238
                     /note="mature cathepsin D (AA 45-392)"
     variation       1308..1308
                     /replace="g"
     regulatory      1959..1964
                     /regulatory_class="polyA_signal_sequence"
     variation       1979..1979
                     /replace="a"
     polyA_site      1988..1988
BASE COUNT          350 a          666 c          590 g          382 t
ORIGIN      
        1 ccatgcagcc ctccagcctt ctgccgctcg ccctctgcct gctggctgca cccgcctccg
       61 cgctcgtcag gatcccgctg cacaagttca cgtccatccg ccggaccatg tcggaggttg
      121 ggggctctgt ggaggacctg attgccaaag gccccgtctc aaagtactcc caggcggtgc
      181 cagccgtgac cgaggggccc attcccgagg tgctcaagaa ctacatggac gcccagtact
      241 acggggagat tggcatcggg acgccccccc agtgcttcac agtcgtcttc gacacgggct
      301 cctccaacct gtgggtcccc tccatccact gcaaactgct ggacatcgct tgctggatcc
      361 accacaagta caacagcgac aagtccagca cctacgttaa gaatggtacc tcgtttgaca
      421 tccactatgg ctcgggcagc ctctccgggt acctgagcca ggacactgtg tcggtgccct
      481 gccagtcagc gtcgtcagcc tctgccctgg gcggtgtcaa agtggagagg caggtctttg
      541 gggaggccac caagcagcca ggcatcacct tcatcgcagc caagttcgat ggcatcctgg
      601 gcatggccta cccccgcatc tccgtcaaca acgtgctgcc cgtcttcgac aacctgatgc
      661 agcagaagct ggtggaccag aacatcttct ccttctacct gagcagggac ccagatgcgc
      721 agcctggggg tgagctgatg ctgggtggca cagactccaa gtattacaag ggttctctgt
      781 cctacctgaa tgtcacccgc aaggcctact ggcaggtcca cctggaccag gtggaggtgg
      841 ccagcgggct gaccctgtgc aaggagggct gtgaggccat tgtggacaca ggcacttccc
      901 tcatggtggg cccggtggat gaggtgcgcg agctgcagaa ggccatcggg gccgtgccgc
      961 tgattcaggg cgagtacatg atcccctgtg agaaggtgtc caccctgccc gcgatcacac
     1021 tgaagctggg aggcaaaggc tacaagctgt ccccagagga ctacacgctc aaggtgtcgc
     1081 aggccgggaa gaccctctgc ctgagcggct tcatgggcat ggacatcccg ccacccagcg
     1141 ggccactctg gatcctgggc gacgtcttca tcggccgcta ctacactgtg tttgaccgtg
     1201 acaacaacag ggtgggcttc gccgaggctg cccgcctcta gttcccaagg cgtccgcgcg
     1261 ccagcacaga aacagaggag agtcccagag caggaggccc ctggcccagc ggcccctccc
     1321 acacacaccc acacactcgc ccgcccactg tcctgggcgc cctggaagcc ggcggcccaa
     1381 gcccgacttg ctgttttgtt ctgtggtttt cccctccctg ggttcagaaa tgctgcctgc
     1441 ctgtctgtct ctccatctgt ttggtggggg tagagctgat ccagagcaca gatctgtttc
     1501 gtgcattgga agaccccacc caagcttggc agccgagctc gtgtatcctg gggctccctt
     1561 catctccagg gagtcccctc cccggcccta ccagcgcccg ctggctgagc ccctacccca
     1621 caccaggccg tcctcccggg ccctcccttg gaaacctgcc ctgcctgagg gcccctctgc
     1681 ccagcttggg cccagctggg ctctgccacc ctacctgttc agtgtcccgg gcccgttgag
     1741 gatgaggccg ctagaggcct gaggatgagc tggaaggagt gagaggggac aaaacccacc
     1801 ttgttggagc ctgcagggtg gtgctgggac tgagccagtc ccaggggcat gtattggcct
     1861 ggaggtgggg ttgggattgg gggctggtgc cagccttcct ctgcagctga cctctgttgt
     1921 cctccccttg ggcggctgag agccccagct gacatggaaa tacagttgtt ggcctccggc
     1981 ctcccctc
//