LOCUS       X07549                  1106 bp    mRNA    linear   HUM 17-NOV-2004
DEFINITION  Human mRNA for cathepsin H (E.C.3.4.22.16.).
ACCESSION   X07549
VERSION     X07549.1
KEYWORDS    cathepsin; cysteine proteinase; glycoprotein; lysosomal enzyme.
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 1106)
  AUTHORS   Fuchs R.
  JOURNAL   Submitted (03-MAY-1988) to the INSDC. Fuchs R., Institut f.
            Biochemie, TH Darmstadt, Petersenstr. 22, D-6100 Darmstadt, FRG.
REFERENCE   2
  AUTHORS   Fuchs R., Machleidt W., Gassen H.G.
  TITLE     Molecular cloning and sequencing of a cDNA coding for mature human
            kidney cathepsin H
  JOURNAL   Biol. Chem. Hoppe-Seyler 369(6), 469-475(1988).
   PUBMED   2849458
COMMENT     Data kindly reviewed (13-Dec-1989) by Gassen H.G.
FEATURES             Location/Qualifiers
     source          1..1106
                     /db_xref="H-InvDB:HIT000321264"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /clone_lib="pUC9"
                     /clone="pRF15"
                     /tissue_type="kidney"
                     /db_xref="taxon:9606"
     CDS             <1..749
                     /codon_start=3
                     /product="cathepsin H"
                     /db_xref="GOA:P09668"
                     /db_xref="H-InvDB:HIT000321264.12"
                     /db_xref="HGNC:HGNC:2535"
                     /db_xref="InterPro:IPR000169"
                     /db_xref="InterPro:IPR000668"
                     /db_xref="InterPro:IPR013201"
                     /db_xref="InterPro:IPR025660"
                     /db_xref="InterPro:IPR025661"
                     /db_xref="InterPro:IPR038765"
                     /db_xref="InterPro:IPR039417"
                     /db_xref="PDB:1BZN"
                     /db_xref="PDB:6CZK"
                     /db_xref="PDB:6CZS"
                     /db_xref="UniProtKB/Swiss-Prot:P09668"
                     /protein_id="CAA30428.1"
                     /translation="AEIKHKYLWSEPQNCSATKSNYLRGTGPYPPSVDWRKKGNFVSP
                     VKNQGACGSCWTFSTTGALESAIAIATGKMLSLAEQQLVDCAQDFNNYGCQGGLPSQA
                     FEYILYNKGIMGEDTYPYQGKDGYCKFQPGKAIGFVKDVANITIYDEEAMVEAVALYN
                     PVSFAFEVTQDFMMYRTGIYSSTSCHKTPDKVNHAVLAVGYGEKNGIPYWIVKNSWGP
                     QWGMNGYFLIERGKNMCGLAACASYPIPLV"
     CDS             <33..>56
                     /note="minichain"
                     /db_xref="GOA:P09668"
                     /db_xref="HGNC:HGNC:2535"
                     /db_xref="InterPro:IPR000169"
                     /db_xref="InterPro:IPR000668"
                     /db_xref="InterPro:IPR013201"
                     /db_xref="InterPro:IPR025660"
                     /db_xref="InterPro:IPR025661"
                     /db_xref="InterPro:IPR038765"
                     /db_xref="InterPro:IPR039417"
                     /db_xref="PDB:1BZN"
                     /db_xref="PDB:6CZK"
                     /db_xref="PDB:6CZS"
                     /db_xref="UniProtKB/Swiss-Prot:P09668"
                     /protein_id="CAA30429.1"
                     /translation="EPQNCSAT"
     mat_peptide     87..248
                     /product="cathepsin H"
     regulatory      1082..1087
                     /regulatory_class="polyA_signal_sequence"
BASE COUNT          277 a          296 c          288 g          245 t
ORIGIN      
        1 ttgctgaaat aaaacacaag tatctctggt cagagcctca gaattgctca gccaccaaaa
       61 gtaactacct tcgaggtact ggtccctacc caccttccgt ggactggcgg aaaaaaggaa
      121 attttgtctc acctgtgaaa aatcagggtg cctgcggcag ttgctggact ttctccacca
      181 ctggggccct ggagtctgca atcgccatcg caaccggaaa gatgctgtcc ttggcggaac
      241 agcagctggt ggactgcgcc caggacttca ataattacgg ctgccaaggg ggtctcccca
      301 gccaggcttt cgagtatatc ctgtacaaca aggggatcat gggtgaagac acctacccct
      361 accagggcaa ggatggttat tgcaagttcc aacctggaaa ggccatcggc tttgtcaagg
      421 atgtagccaa catcacaatc tatgacgagg aagcgatggt ggaggctgtg gccctctaca
      481 accctgtgag ctttgccttt gaggtgactc aggacttcat gatgtataga acgggcatct
      541 actccagtac ttcctgccat aaaactccag ataaagtaaa ccatgcagta ctggctgttg
      601 ggtatggaga aaaaaatggg atcccttact ggatcgtgaa aaactcttgg ggtccccagt
      661 ggggaatgaa cgggtacttc ctcatcgagc gcggaaagaa catgtgtggc ctggctgcct
      721 gcgcctccta ccccatccct ctggtgtgag ccgtggcagc cgcagcgcag actggcggag
      781 aaggagagga acgggcagcc tgggcctggg tggaaatcct gccctggagg aagttgtggg
      841 gagatccact gggaccccca acattctgcc ctcacctctg tgcccagcct ggaaacctac
      901 agacaaggag gagttccacc atgagctcac ccgtgtctat gacgcaaaga tcaccagcca
      961 tgtgccttag tgtccttctt aacagactca aaccacatgg accacgaata ttctttctgt
     1021 ccagaagggc tactttccac atatagagct ccagggactg tcttttctgt attcgctgtt
     1081 caataaacat tgagtgagca cctcca
//