LOCUS       HSU07343                2484 bp    mRNA    linear   HUM 03-FEB-2003
DEFINITION  Homo sapiens DNA mismatch repair protein homolog (MLH1) mRNA,
            complete cds.
ACCESSION   U07343
VERSION     U07343.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 2484)
  AUTHORS   Bronner,C.E., Baker,S.M., Morrison,P.T., Warren,G., Smith,L.G.,
            Lescoe,M.K., Kane,M., Earibino,C., Lipford,J., Linblom,A.,
            Tannergard,P., Bollag,R.J., Godwin,A.R., Ward,D.C.,
            Nordenskjold,M., Fishel,R., Kolodner,R.D. and Liskay,R.M.
  TITLE     Mutation in the DNA mismatch repair gene homologue hMLH1 is
            associated with hereditary non-polyposis colon cancer
  JOURNAL   Nature 368 (6468), 258-261 (1994)
   PUBMED   8145827
REFERENCE   2  (bases 1 to 2484)
  AUTHORS   Morrison,P.T.
  TITLE     Direct Submission
  JOURNAL   Submitted (02-MAR-1994) Paul T. Morrison, Molecular Biology Core
            Facility, Dana-Farber Cancer Institute, 44 Binney Street, Boston,
            MA 002115, USA
FEATURES             Location/Qualifiers
     source          1..2484
                     /db_xref="H-InvDB:HIT000217657"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /chromosome="3"
                     /map="3p22-p23"
     gene            1..2484
                     /gene="MLH1"
     CDS             22..2292
                     /gene="MLH1"
                     /note="homolog of S. cerevisiae PMS1 (Swiss-Prot Accession
                     Number P14242), S. cerevisiae MLH1 (GenBank Accession
                     Number U07187), E. coli MUTL (Swiss-Prot Accession Number
                     P23367), Salmonella typhimurium MUTL (Swiss-Prot Accession
                     Number P14161) and Streptococcus pneumoniae (Swiss-Prot
                     Accession Number P14160)"
                     /codon_start=1
                     /product="DNA mismatch repair protein homolog"
                     /protein_id="AAC50285.1"
                     /translation="MSFVAGVIRRLDETVVNRIAAGEVIQRPANAIKEMIENCLDAKS
                     TSIQVIVKEGGLKLIQIQDNGTGIRKEDLDIVCERFTTSKLQSFEDLASISTYGFRGE
                     ALASISHVAHVTITTKTADGKCAYRASYSDGKLKAPPKPCAGNQGTQITVEDLFYNIA
                     TRRKALKNPSEEYGKILEVVGRYSVHNAGISFSVKKQGETVADVRTLPNASTVDNIRS
                     IFGNAVSRELIEIGCEDKTLAFKMNGYISNANYSVKKCIFLLFINHRLVESTSLRKAI
                     ETVYAAYLPKNTHPFLYLSLEISPQNVDVNVHPTKHEVHFLHEESILERVQQHIESKL
                     LGSNSSRMYFTQTLLPGLAGPSGEMVKSTTSLTSSSTSGSSDKVYAHQMVRTDSREQK
                     LDAFLQPLSKPLSSQPQAIVTEDKTDISSGRARQQDEEMLELPAPAEVAAKNQSLEGD
                     TTKGTSEMSEKRGPTSSNPRKRHREDSDVEMVEDDSRKEMTAACTPRRRIINLTSVLS
                     LQEEINEQGHEVLREMLHNHSFVGCVNPQWALAQHQTKLYLLNTTKLSEELFYQILIY
                     DFANFGVLRLSEPAPLFDLAMLALDSPESGWTEEDGPKEGLAEYIVEFLKKKAEMLAD
                     YFSLEIDEEGNLIGLPLLIDNYVPPLEGLPIFILRLATEVNWDEEKECFESLSKECAM
                     FYSIRKQYISEESTLSGQQSEVPGSIPNSWKWTVEHIVYKALRSHILPPKHFTEDGNI
                     LQLANLPDLYKVFERC"
BASE COUNT          720 a          535 c          594 g          635 t
ORIGIN      
        1 cttggctctt ctggcgccaa aatgtcgttc gtggcagggg ttattcggcg gctggacgag
       61 acagtggtga accgcatcgc ggcgggggaa gttatccagc ggccagctaa tgctatcaaa
      121 gagatgattg agaactgttt agatgcaaaa tccacaagta ttcaagtgat tgttaaagag
      181 ggaggcctga agttgattca gatccaagac aatggcaccg ggatcaggaa agaagatctg
      241 gatattgtat gtgaaaggtt cactactagt aaactgcagt cctttgagga tttagccagt
      301 atttctacct atggctttcg aggtgaggct ttggccagca taagccatgt ggctcatgtt
      361 actattacaa cgaaaacagc tgatggaaag tgtgcataca gagcaagtta ctcagatgga
      421 aaactgaaag cccctcctaa accatgtgct ggcaatcaag ggacccagat cacggtggag
      481 gacctttttt acaacatagc cacgaggaga aaagctttaa aaaatccaag tgaagaatat
      541 gggaaaattt tggaagttgt tggcaggtat tcagtacaca atgcaggcat tagtttctca
      601 gttaaaaaac aaggagagac agtagctgat gttaggacac tacccaatgc ctcaaccgtg
      661 gacaatattc gctccatctt tggaaatgct gttagtcgag aactgataga aattggatgt
      721 gaggataaaa ccctagcctt caaaatgaat ggttacatat ccaatgcaaa ctactcagtg
      781 aagaagtgca tcttcttact cttcatcaac catcgtctgg tagaatcaac ttccttgaga
      841 aaagccatag aaacagtgta tgcagcctat ttgcccaaaa acacacaccc attcctgtac
      901 ctcagtttag aaatcagtcc ccagaatgtg gatgttaatg tgcaccccac aaagcatgaa
      961 gttcacttcc tgcacgagga gagcatcctg gagcgggtgc agcagcacat cgagagcaag
     1021 ctcctgggct ccaattcctc caggatgtac ttcacccaga ctttgctacc aggacttgct
     1081 ggcccctctg gggagatggt taaatccaca acaagtctga cctcgtcttc tacttctgga
     1141 agtagtgata aggtctatgc ccaccagatg gttcgtacag attcccggga acagaagctt
     1201 gatgcatttc tgcagcctct gagcaaaccc ctgtccagtc agccccaggc cattgtcaca
     1261 gaggataaga cagatatttc tagtggcagg gctaggcagc aagatgagga gatgcttgaa
     1321 ctcccagccc ctgctgaagt ggctgccaaa aatcagagct tggaggggga tacaacaaag
     1381 gggacttcag aaatgtcaga gaagagagga cctacttcca gcaaccccag aaagagacat
     1441 cgggaagatt ctgatgtgga aatggtggaa gatgattccc gaaaggaaat gactgcagct
     1501 tgtacccccc ggagaaggat cattaacctc actagtgttt tgagtctcca ggaagaaatt
     1561 aatgagcagg gacatgaggt tctccgggag atgttgcata accactcctt cgtgggctgt
     1621 gtgaatcctc agtgggcctt ggcacagcat caaaccaagt tataccttct caacaccacc
     1681 aagcttagtg aagaactgtt ctaccagata ctcatttatg attttgccaa ttttggtgtt
     1741 ctcaggttat cggagccagc accgctcttt gaccttgcca tgcttgcctt agatagtcca
     1801 gagagtggct ggacagagga agatggtccc aaagaaggac ttgctgaata cattgttgag
     1861 tttctgaaga agaaggctga gatgcttgca gactatttct ctttggaaat tgatgaggaa
     1921 gggaacctga ttggattacc ccttctgatt gacaactatg tgcccccttt ggagggactg
     1981 cctatcttca ttcttcgact agccactgag gtgaattggg acgaagaaaa ggaatgtttt
     2041 gaaagcctca gtaaagaatg cgctatgttc tattccatcc ggaagcagta catatctgag
     2101 gagtcgaccc tctcaggcca gcagagtgaa gtgcctggct ccattccaaa ctcctggaag
     2161 tggactgtgg aacacattgt ctataaagcc ttgcgctcac acattctgcc tcctaaacat
     2221 ttcacagaag atggaaatat cctgcagctt gctaacctgc ctgatctata caaagtcttt
     2281 gagaggtgtt aaatatggtt atttatgcac tgtgggatgt gttcttcttt ctctgtattc
     2341 cgatacaaag tgttgtatca aagtgtgata tacaaagtgt accaacataa gtgttggtag
     2401 cacttaagac ttatacttgc cttctgatag tattccttta tacacagtgg attgattata
     2461 aataaataga tgtgtcttaa cata
//