LOCUS       HSU40434                2114 bp    mRNA    linear   HUM 19-JAN-1996
DEFINITION  Human mesothelin or CAK1 antigen precursor mRNA, complete cds.
ACCESSION   U40434
VERSION     U40434.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 2114)
  AUTHORS   Chang,K. and Pastan,I.
  TITLE     Molecular cloning of mesothelin, a differentiation antigen present
            on mesothelium, mesotheliomas, and ovarian cancers
  JOURNAL   Proc. Natl. Acad. Sci. U.S.A. 93 (1), 136-140 (1996)
   PUBMED   8552591
REFERENCE   2  (bases 1 to 2114)
  AUTHORS   Chang,K.
  TITLE     Direct Submission
  JOURNAL   Submitted (09-NOV-1995) Kai Chang, Laboratory of Molecular Biology,
            National Cancer Institute, Building 37, Room 4B19, 37 Convent
            Drive, MSC4255, Bethesda, MD MD20892-4255, USA
FEATURES             Location/Qualifiers
     source          1..2114
                     /db_xref="H-InvDB:HIT000219720"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /chromosome="16"
                     /clone="pcD3CAK1-9"
                     /cell_line="KB, HeLa, OVCAR-3"
                     /cell_type="HeLa"
                     /tissue_type="ovarian cancers and squamous cell
                     carcinoma."
     CDS             100..1986
                     /codon_start=1
                     /product="mesothelin or CAK1 antigen precursor"
                     /protein_id="AAC50348.1"
                     /translation="MALQRLDPCWSCGDRPGSLLFLLFSLGWVHPARTLAGETGTESA
                     PLGGVLTTPHNISSLSPRQLLGFPCAEVSGLSTERVRELAVALAQKNVKLSTEQLRCL
                     AHRLSEPPEDLDALPLDLLLFLNPDAFSGPQACTRFFSRITKANVDLLPRGAPERQRL
                     LPAALACWGVRGSLLSEADVRALGGLACDLPGRFVAESAEVLLPRLVSCPGPLDQDQQ
                     EAARAALQGGGPPYGPPSTWSVSTMDALRGLLPVLGQPIIRSIPQGIVAAWRQRSSRD
                     PSWRQPERTILRPRFRREVEKTACPSGKKAREIDESLIFYKKWELEACVDAALLATQM
                     DRVNAIPFTYEQLDVLKHKLDELYPQGYPESVIQHLGYLFLKMSPEDIRKWNVTSLET
                     LKALLEVDKGHEMSPQAPRRPLPQVATLIDRFVKGRGQLDKDTLDTLTAFYPGYLCSL
                     SPEELSSVPPSSIWAVRPQDLDTCDPRQLDVLYPKARLAFQNMNGSEYFVKIQSFLGG
                     APTEDLKALSQQNVSMDLATFMKLRTDAVLPLTVAEVQKLLGPHVEGLKAEERHRPVR
                     DWILRQRQDDLDTLGLGLQGGIPNGYLVLDLSVQETLSGTPCLLGPGPVLTVLALLLA
                     STLA"
     sig_peptide     100..192
     mat_peptide     193..1857
                     /product="mesothelin"
     misc_feature    193..978
                     /note="encodes putative cleaved N-terminal portion of
                     mesothelin"
     misc_feature    973..978
                     /note="encodes putative proteolytic site"
     misc_feature    979..1983
                     /note="encodes putative membrane bound portion of
                     mesothelin, bearing epitope(s) recognized by MAb K1"
     misc_feature    1858..1983
                     /note="encodes putative hydrophobic region for GPI
                     anchorage"
     regulatory      2087..2093
                     /regulatory_class="polyA_signal_sequence"
                     /note="putative"
     polyA_site      2114
BASE COUNT          361 a          722 c          661 g          370 t
ORIGIN      
        1 aggaattccg gtggccggcc actcccgtct gctgtgacgc gcggacagag agctaccggt
       61 ggacccacgg tgcctccctc cctgggatct acacagacca tggccttgca acggctcgac
      121 ccctgttggt cctgtgggga ccgccctggc agcctcctgt tcctgctctt cagcctcgga
      181 tgggtgcatc ccgcgaggac cctggctgga gagacaggga cggagtctgc ccccctgggg
      241 ggagtcctga caacccccca taacatttcc agcctctccc ctcgccaact ccttggcttc
      301 ccgtgtgcgg aggtgtccgg cctgagcacg gagcgtgtcc gggagctggc tgtggccttg
      361 gcacagaaga atgtcaagct ctcaacagag cagctgcgct gtctggctca ccggctctct
      421 gagccccccg aggacctgga cgccctccca ttggacctgc tgctattcct caacccagat
      481 gcgttctcgg ggccccaggc ctgcacccgt ttcttctccc gcatcacgaa ggccaatgtg
      541 gacctgctcc cgaggggggc tcccgagcga cagcggctgc tgcctgcggc tctggcctgc
      601 tggggtgtgc gggggtctct gctgagcgag gctgatgtgc gggctctggg aggcctggct
      661 tgcgacctgc ctgggcgctt tgtggccgag tcggccgaag tgctgctacc ccggctggtg
      721 agctgcccgg gacccctgga ccaggaccag caggaggcag ccagggcggc tctgcagggc
      781 gggggacccc cctacggccc cccgtcgaca tggtctgtct ccacgatgga cgctctgcgg
      841 ggcctgctgc ccgtgctggg ccagcccatc atccgcagca tcccgcaggg catcgtggcc
      901 gcgtggcggc aacgctcctc tcgggaccca tcctggcggc agcctgaacg gaccatcctc
      961 cggccgcggt tccggcggga agtggagaag acagcctgtc cttcaggcaa gaaggcccgc
     1021 gagatagacg agagcctcat cttctacaag aagtgggagc tggaagcctg cgtggatgcg
     1081 gccctgctgg ccacccagat ggaccgcgtg aacgccatcc ccttcaccta cgagcagctg
     1141 gacgtcctaa agcataaact ggatgagctc tacccacaag gttaccccga gtctgtgatc
     1201 cagcacctgg gctacctctt cctcaagatg agccctgagg acattcgcaa gtggaatgtg
     1261 acgtccctgg agaccctgaa ggctttgctt gaagtcgaca aagggcacga aatgagtcct
     1321 caggctcctc ggcggcccct cccacaggtg gccaccctga tcgaccgctt tgtgaaggga
     1381 aggggccagc tagacaaaga caccctagac accctgaccg ccttctaccc tgggtacctg
     1441 tgctccctca gccccgagga gctgagctcc gtgcccccca gcagcatctg ggcggtcagg
     1501 ccccaggacc tggacacgtg tgacccaagg cagctggacg tcctctatcc caaggcccgc
     1561 cttgctttcc agaacatgaa cgggtccgaa tacttcgtga agatccagtc cttcctgggt
     1621 ggggccccca cggaggattt gaaggcgctc agtcagcaga atgtgagcat ggacttggcc
     1681 acgttcatga agctgcggac ggatgcggtg ctgccgttga ctgtggctga ggtgcagaaa
     1741 cttctgggac cccacgtgga gggcctgaag gcggaggagc ggcaccgccc ggtgcgggac
     1801 tggatcctac ggcagcggca ggacgacctg gacacgctgg ggctggggct acagggcggc
     1861 atccccaacg gctacctggt cctagacctc agcgtgcaag agaccctctc ggggacgccc
     1921 tgcctcctag gacctggacc tgttctcacc gtcctggcac tgctcctagc ctccaccctg
     1981 gcctgagggc cccactccct tgctggcccc agccctgctg gggatccccg cctggccagg
     2041 agcaggcacg ggtgatcccc gttccacccc aagagaactc gcgctcagta aacgggaaca
     2101 tgccccctgc agac
//