LOCUS       AF088886                2039 bp    mRNA    linear   HUM 13-FEB-2004
DEFINITION  Homo sapiens cathepsin F precursor, mRNA, complete cds.
ACCESSION   AF088886
VERSION     AF088886.2
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 2039)
  AUTHORS   Nagler,D.K., Sulea,T. and Menard,R.
  TITLE     Full-length cDNA of human cathepsin F predicts the presence of a
            cystatin domain at the N-terminus of the cysteine protease zymogen
  JOURNAL   Biochem. Biophys. Res. Commun. 257 (2), 313-318 (1999)
   PUBMED   10198209
REFERENCE   2  (bases 1 to 2039)
  AUTHORS   Nagler,D.K. and Menard,R.
  TITLE     Direct Submission
  JOURNAL   Submitted (01-SEP-1998) Biopharmaceutical sector, Biotechnology
            Research Institute, 6100 Royalmount Avenue, Montreal, Quebec H4P
            2R2, Canada
REFERENCE   3  (bases 1 to 2039)
  AUTHORS   Nagler,D.K. and Menard,R.
  TITLE     Direct Submission
  JOURNAL   Submitted (05-NOV-1998) Biopharmaceutical sector, Biotechnology
            Research Institute, 6100 Royalmount Avenue, Montreal, Quebec H4P
            2R2, Canada
  REMARK    Sequence update submitted by submitter
REFERENCE   4  (bases 1 to 2039)
  AUTHORS   Nagler,D.K. and Menard,R.
  TITLE     Direct Submission
  JOURNAL   Submitted (03-MAY-1999) Biopharmaceutical sector, Biotechnology
            Research Institute, 6100 Royalmount Avenue, Montreal, Quebec H4P
            2R2, Canada
  REMARK    Sequence update by submitter
COMMENT     On May 3, 1999 this sequence version replaced AF088886.1.
            Name: cathepsin F.
FEATURES             Location/Qualifiers
     source          1..2039
                     /db_xref="H-InvDB:HIT000068140"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /clone="#3, #26, #9"
                     /tissue_type="ovary"
     CDS             91..1545
                     /note="preproprotein; cysteine protease of the papain
                     family"
                     /codon_start=1
                     /product="cathepsin F precursor"
                     /protein_id="AAD26616.2"
                     /translation="MAPWLQLLSLLGLLPGAVAAPAQPRAASFQAWGPPSPELLAPTR
                     FALEMFNRGRAAGTRAVLGLVRGRVRRAGQGSLYSLEATLEEPPCNDPMVCRLPVSKK
                     TLLCSFQVLDELGRHVLLRKDCGPVDTKVPGAGEPKSAFTQGSAMISSLSQNHPDNRN
                     ETFSSVISLLNEDPLSQDLPVKMASIFKNFVITYNRTYESKEEARWRLSVFVNNMVRA
                     QKIQALDRGTAQYGVTKFSDLTEEEFRTIYLNTLLRKEPGNKMKQAKSVGDLAPPEWD
                     WRSKGAVTKVKDQGMCGSCWAFSVTGNVEGQWFLNQGTLLSLSEQELLDCDKMDKACM
                     GGLPSNAYSAIKNLGGLETEDDYSYQGHMQSCNFSAEKAKVYINDSVELSQNEQKLAA
                     WLAKRGPISVAINAFGMQFYRHGISRPLRPLCSPWLIDHAVLLVGYGNRSDVPFWAIK
                     NSWGTDWGEKGYYYLHRGSGACGVNTMASSAVVD"
     sig_peptide     91..147
     misc_feature    148..1542
                     /note="encodes cathepsin F proprotein"
     misc_feature    148..465
                     /note="Region: cystatin-like domain"
     misc_feature    568..576
                     /note="glycosylation site"
     misc_feature    673..681
                     /note="glycosylation site"
     mat_peptide     901..1542
                     /product="cathepsin F"
     misc_feature    1189..1197
                     /note="glycosylation site"
     misc_feature    1222..1230
                     /note="glycosylation site"
     misc_feature    1408..1416
                     /note="glycosylation site"
     variation       455
                     /replace="g"
     variation       565
                     /replace="g"
     regulatory      1991..1996
                     /regulatory_class="polyA_signal_sequence"
BASE COUNT          421 a          592 c          609 g          417 t
ORIGIN      
        1 ggaggactca ggccccgctg gccgcgggct cggtacccgg tgggtcggtg gagcgtctgt
       61 tgggtccggg ccgccggctt cgccctcgcc atggcgccct ggctgcagct cctgtcgctg
      121 ctggggctgc tcccgggcgc agtggccgcc cccgcccagc cccgagccgc cagctttcag
      181 gcctgggggc cgccgtcccc ggagctgctg gcgcctaccc gcttcgcgct ggagatgttc
      241 aaccgcggcc gggctgcggg gacgcgggcc gtgctgggcc ttgtgcgcgg ccgcgtccgc
      301 cgggcgggcc aagggtcgct gtactccctg gaggccaccc tggaggagcc accctgcaac
      361 gaccccatgg tgtgccggct ccccgtgtcc aagaaaaccc tgctctgcag cttccaagtc
      421 ctggatgagc tcggaagaca cgtgctgctg cggaaggact gtggcccagt ggacaccaag
      481 gttccaggtg ctggggagcc caagtcagcc ttcactcagg gctcagccat gatttcttct
      541 ctgtcccaaa accatccaga caacagaaac gagactttca gctcagtcat ttccctgttg
      601 aatgaggatc ccctgtccca ggacttgcct gtgaagatgg cttcaatctt caagaacttt
      661 gtcattacct ataaccggac atatgagtca aaggaagaag cccggtggcg cctgtccgtc
      721 tttgtcaata acatggtgcg agcacagaag atccaggccc tggaccgtgg cacagctcag
      781 tatggagtca ccaagttcag tgatctcaca gaggaggagt tccgcactat ctacctgaat
      841 actctcctga gaaaagagcc tggcaacaag atgaagcaag ccaagtctgt gggtgacctc
      901 gccccacctg aatgggactg gaggagtaag ggggctgtca caaaagtcaa agaccagggc
      961 atgtgtggct cctgctgggc cttctcagtc acaggcaatg tggagggcca gtggtttctc
     1021 aaccagggga ccctgctctc cctctctgaa caggagctct tggactgtga caagatggac
     1081 aaggcctgca tgggcggctt gccctccaat gcctactcgg ccataaagaa tttgggaggg
     1141 ctggagacag aggatgacta cagctaccag ggtcacatgc agtcctgcaa cttctcagca
     1201 gagaaggcca aggtctacat caatgactcc gtggagctga gccagaacga gcagaagctg
     1261 gcagcctggc tggccaagag aggcccaatc tccgtggcca tcaatgcctt tggcatgcag
     1321 ttttaccgcc acgggatctc ccgccctctc cggcccctct gcagcccttg gctcattgac
     1381 catgcggtgt tgcttgtggg ctacggcaac cgctctgacg ttcccttttg ggccatcaag
     1441 aacagctggg gcactgactg gggtgagaag ggttactact acttgcatcg cgggtccggg
     1501 gcctgtggcg tgaacaccat ggccagctcg gcggtggtgg actgaagagg ggcccccagc
     1561 tcgggacctg gtgctgatca gagtggctgc tgccccagcc tgacatgtgt ccaggcccct
     1621 ccccgggagg tacagctggc agagggaaag gcactgggta cctcagggtg agcagagggc
     1681 actgggctgg ggcacagccc ctgcttccct gcaccccatt cccaccctga agttctgcac
     1741 ctgcaccttt gttgaattgt ggtagcttag gaggatgtcg gggtgaaggg tggtatcttg
     1801 gcagttgaag ctggggcaag aactctgggc ttgggtaatg agcaggaaga aaattttctg
     1861 atcttaagcc cagctctgtt ctgcccccgc tttcctctgt ttgatactat aaattttctg
     1921 gttcccttgg atttagggat agtgtccctc tccatgtcca ggaaacttgt aaccaccctt
     1981 ttctaacagc aataaagagg tgtccttgta aaaaaaaaaa aaaaaaaaaa aaaaaaaaa
//