LOCUS       HSU79725                2793 bp    mRNA    linear   HUM 04-FEB-1997
DEFINITION  Human A33 antigen precursor mRNA, complete cds.
ACCESSION   U79725
VERSION     U79725.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 2793)
  AUTHORS   Heath,J.K., White,S.J., Johnstone,C.N., Catimel,B., Simpson,R.J.,
            Moritz,R.L., Tu,G.-F., Ji,H., Whitehead,R.H., Groenen,L.C.,
            Scott,A.M., Ritter,G., Cohen,L., Welt,S., Old,L.J., Nice,E.C. and
            Burgess,A.W.
  TITLE     The human A33 antigen is a transmembrane glycoprotein and a novel
            member of the immunoglobulin superfamily
  JOURNAL   Proc. Natl. Acad. Sci. U.S.A. 94 (2), 469-474 (1997)
   PUBMED   9012807
REFERENCE   2  (bases 1 to 2793)
  AUTHORS   Heath,J.K. and White,S.J.
  TITLE     Direct Submission
  JOURNAL   Submitted (26-NOV-1996) Melbourne Branch, Ludwig Institute for
            Cancer Research, Post Office Royal Melbourne Hospital, Parkville,
            Victoria 3050, Australia
FEATURES             Location/Qualifiers
     source          1..2793
                     /db_xref="H-InvDB:HIT000221550"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /cell_line="LIM1215"
                     /tissue_type="colon carcinoma"
     5'UTR           1..344
     CDS             345..1304
                     /note="intestine-specific antigen; novel member of the
                     immunoglobulin superfamily; transmembrane protein;
                     contains an extracellular domain, a transmembrane domain,
                     and an intracellular domain"
                     /codon_start=1
                     /product="A33 antigen precursor"
                     /protein_id="AAC50957.1"
                     /translation="MVGKMWPVLWTLCAVRVTVDAISVETPQDVLRASQGKSVTLPCT
                     YHTSTSSREGLIQWDKLLLTHTERVVIWPFSNKNYIHGELYKNRVSISNNAEQSDASI
                     TIDQLTMADNGTYECSVSLMSDLEGNTKSRVRLLVLVPPSKPECGIEGETIIGNNIQL
                     TCQSKEGSPTPQYSWKRYNILNQEQPLAQPASGQPVSLKNISTDTSGYYICTSSNEEG
                     TQFCNITVAVRSPSMNVALYVGIAVGVVAALIIIGIIIYCCCCRGKDDNTEDKEDARP
                     NREAYEEPPEQLRELSREREEEDDYRQEEQRSTGRESPDHLDQ"
     sig_peptide     345..407
     mat_peptide     408..1301
                     /product="A33 antigen"
     3'UTR           1305..2793
     regulatory      2777..2782
                     /regulatory_class="polyA_signal_sequence"
BASE COUNT          620 a          781 c          730 g          662 t
ORIGIN      
        1 ctaccccttt gtgagcagtc taggactttg tacacctgtt aagtagggag aaggcagggg
       61 aggtggctgg tttaagggga acttgaggga agtagggaag actcctcttg ggacctttgg
      121 agtaggtgac acatgagccc agccccagct cacctgccaa tccagctgag gagctcacct
      181 gccaatccag ctgaggctgg gcagaggtgg gtgagaagag ggaaaattgc agggacctcc
      241 agttgggcca ggccagaagc tgctgtagct ttaaccagac agctcagacc tgtctggagg
      301 ctgccagtga caggttaggt ttagggcaga gaagaagcaa gaccatggtg gggaagatgt
      361 ggcctgtgtt gtggacactc tgtgcagtca gggtgaccgt cgatgccatc tctgtggaaa
      421 ctccgcagga cgttcttcgg gcttcgcagg gaaagagtgt caccctgccc tgcacctacc
      481 acacttccac ctccagtcga gagggactta ttcaatggga taagctcctc ctcactcata
      541 cggaaagggt ggtcatctgg ccgttttcaa acaaaaacta catccatggt gagctttata
      601 agaatcgcgt cagcatatcc aacaatgctg agcagtccga tgcctccatc accattgatc
      661 agctgaccat ggctgacaac ggcacctacg agtgttctgt ctcgctgatg tcagacctgg
      721 agggcaacac caagtcacgt gtccgcctgt tggtcctcgt gccaccctcc aaaccagaat
      781 gcggcatcga gggagagacc ataattggga acaacatcca gctgacctgc caatcaaagg
      841 agggctcacc aacccctcag tacagctgga agaggtacaa catcctgaat caggagcagc
      901 ccctggccca gccagcctca ggtcagcctg tctccctgaa gaatatctcc acagacacat
      961 cgggttacta catctgtacc tccagcaatg aggaggggac gcagttctgc aacatcacgg
     1021 tggccgtcag atctccctcc atgaacgtgg ccctgtatgt gggcatcgcg gtgggcgtgg
     1081 ttgcagccct cattatcatt ggcatcatca tctactgctg ctgctgccga gggaaggacg
     1141 acaacactga agacaaggag gatgcaaggc cgaaccggga agcctatgag gagccaccag
     1201 agcagctaag agaactttcc agagagaggg aggaggagga tgactacagg caagaagagc
     1261 agaggagcac tgggcgtgaa tccccggacc acctcgacca gtgacaggcc agcagcagag
     1321 ggcggcggag gaagggttag gggttcattc tcccgcttcc tggcctccct tctcctttct
     1381 aagccctgtt ctcctgtccc tccatcccag acattgatgg ggacatttct tccccagtgt
     1441 cagctgtggg gaacatggct ggcctggtaa gggggtccct gtgctgatcc tgctgacctc
     1501 actgtcctgt gaagtaaccc ctcctggctg tgacacctgg tgcgggcctg gccctcactc
     1561 aagaccaggc tgcagcctcc acttccctcg tagttggcag gagctcctgg aagcacagcg
     1621 ctgagcatgg ggcgctccca ctcagaactc tccagggagg cgatgccagc cttggggggt
     1681 gggggctgtc ctgctcacct gtgtgcccag cacctggagg ggcaccaggt ggagggtttg
     1741 cactccacac atctttcttg aatgaatgaa agaataagtg agtatgcttg ggccctgcat
     1801 tggcctggcc tccagctccc actccctttc caacctcact tcccgtagct gccagtatgt
     1861 tccaaaccct cctgggaagg ccacctccca ctcctgctgc acaggccctg gggagctttt
     1921 gcccacacac tttccatctc tgcctgtcaa tatcgtacct gtccctccag gcccatctca
     1981 aatcacaagg atttctctaa ccctatccta attgtccaca tacgtggaaa caatcctgtt
     2041 actctgtccc acgtccaatc atgggccaca aggcacagtc ttctgagcga gtgctctcac
     2101 tgtattagag cgccagctcc ttggggcagg gcctgggcct catggctttt gctttccctg
     2161 aagccctagt agctggcgcc catcctagtg ggcacttaag cttaattggg gaaactgctt
     2221 tgattggttg tgccttccct tctctggtct ccttgagatg atcgtagaca cagggatgat
     2281 tcccacccaa acccacgtat tcattcagtg agttaaacac gaattgattt aaagtgaaca
     2341 cacacaaggg agcttgcttg cagatggtct gagttcttgt gtcctggtaa ttcctctcca
     2401 ggccagaata attggcatgt ctcctcaacc cacatggggt tcctggttgt tcctgcatcc
     2461 cgatacctca gccctggccc tgcccagccc atttgggctc tggttttctg gtggggctgt
     2521 cctgctgccc tcccacagcc tccttctgtt tgtcgagcat ttcttctact cttgagagct
     2581 caggcagcgt tagggctgct taggtctcat ggaccagtgg ctggtctcac ccaactgcag
     2641 tttactattg ctatcttttc tggatgatca gaaaaataat tccataaatc tattgtctac
     2701 ttgcgatttt ttaaaaaatg tatattttta tatatattgt taaatccttt gcttcattcc
     2761 aaatgctttc agtaataata aaattgtggg tgg
//