LOCUS       BC020982                1416 bp    mRNA    linear   HUM 15-JUL-2006
DEFINITION  Homo sapiens keratin 18, mRNA (cDNA clone MGC:9716 IMAGE:3850724),
            complete cds.
ACCESSION   BC020982
VERSION     BC020982.1
KEYWORDS    MGC.
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 1416)
  AUTHORS   Strausberg,R.L., Feingold,E.A., Grouse,L.H., Derge,J.G.,
            Klausner,R.D., Collins,F.S., Wagner,L., Shenmen,C.M., Schuler,G.D.,
            Altschul,S.F., Zeeberg,B., Buetow,K.H., Schaefer,C.F., Bhat,N.K.,
            Hopkins,R.F., Jordan,H., Moore,T., Max,S.I., Wang,J., Hsieh,F.,
            Diatchenko,L., Marusina,K., Farmer,A.A., Rubin,G.M., Hong,L.,
            Stapleton,M., Soares,M.B., Bonaldo,M.F., Casavant,T.L.,
            Scheetz,T.E., Brownstein,M.J., Usdin,T.B., Toshiyuki,S.,
            Carninci,P., Prange,C., Raha,S.S., Loquellano,N.A., Peters,G.J.,
            Abramson,R.D., Mullahy,S.J., Bosak,S.A., McEwan,P.J.,
            McKernan,K.J., Malek,J.A., Gunaratne,P.H., Richards,S.,
            Worley,K.C., Hale,S., Garcia,A.M., Gay,L.J., Hulyk,S.W.,
            Villalon,D.K., Muzny,D.M., Sodergren,E.J., Lu,X., Gibbs,R.A.,
            Fahey,J., Helton,E., Ketteman,M., Madan,A., Rodrigues,S.,
            Sanchez,A., Whiting,M., Madan,A., Young,A.C., Shevchenko,Y.,
            Bouffard,G.G., Blakesley,R.W., Touchman,J.W., Green,E.D.,
            Dickson,M.C., Rodriguez,A.C., Grimwood,J., Schmutz,J., Myers,R.M.,
            Butterfield,Y.S., Krzywinski,M.I., Skalska,U., Smailus,D.E.,
            Schnerch,A., Schein,J.E., Jones,S.J. and Marra,M.A.
  CONSRTM   Mammalian Gene Collection Program Team
  TITLE     Generation and initial analysis of more than 15,000 full-length
            human and mouse cDNA sequences
  JOURNAL   Proc. Natl. Acad. Sci. U.S.A. 99 (26), 16899-16903 (2002)
   PUBMED   12477932
REFERENCE   2  (bases 1 to 1416)
  CONSRTM   NIH MGC Project
  TITLE     Direct Submission
  JOURNAL   Submitted (03-JAN-2002) National Institutes of Health, Mammalian
            Gene Collection (MGC), Bethesda, MD 20892-2590, USA
  REMARK    NIH-MGC Project URL: http://mgc.nci.nih.gov
COMMENT     Contact: MGC help desk
            Email: cgapbs-r@mail.nih.gov
            Tissue Procurement: ATCC
            cDNA Library Preparation: Life Technologies, Inc.
            cDNA Library Arrayed by: The I.M.A.G.E. Consortium (LLNL)
            DNA Sequencing by: Sequencing Group at the Stanford Human Genome
            Center, Stanford University School of Medicine, Stanford, CA  94305
            Web site:       http://www-shgc.stanford.edu
            Contact:  (Dickson, Mark) mcd@paxil.stanford.edu
            Dickson, M., Schmutz, J., Grimwood, J., Rodriquez, A., and Myers,
            R. M.
            
            Clone distribution: MGC clone distribution information can be found
            through the I.M.A.G.E. Consortium/LLNL at: http://image.llnl.gov
            Series: IRAK Plate: 20 Row: m Column: 12
            This clone was selected for full length sequencing because it
            passed the following selection criteria: Hexamer frequency ORF
            analysis.
FEATURES             Location/Qualifiers
     source          1..1416
                     /db_xref="H-InvDB:HIT000039066"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /clone="MGC:9716 IMAGE:3850724"
                     /tissue_type="Colon, adenocarcinoma"
                     /clone_lib="NIH_MGC_65"
                     /lab_host="DH10B"
                     /note="Vector: pCMV-SPORT6"
     gene            1..1416
                     /gene="KRT18"
                     /gene_synonym="CYK18"
                     /gene_synonym="K18"
                     /db_xref="GeneID:3875"
                     /db_xref="HGNC:HGNC:6430"
                     /db_xref="MIM:148070"
     CDS             50..1342
                     /gene="KRT18"
                     /gene_synonym="CYK18"
                     /gene_synonym="K18"
                     /codon_start=1
                     /product="keratin 18"
                     /protein_id="AAH20982.1"
                     /db_xref="GeneID:3875"
                     /db_xref="HGNC:HGNC:6430"
                     /db_xref="MIM:148070"
                     /translation="MSFTTRSTFSTNYRSLGSVQAPSYGARPVSSAASVYAGAGGSGS
                     RISVSRSTSFRGGMGSGGLATGIAGGLAGMGGIQNEKETMQSLNDRLASYLDRVRSLE
                     TENRRLESKIREHLEKKGPQVRDWSHYFKIIEDLRAQIFANTVDNARIVLQIDNARLA
                     ADDFRVKYETELAMRQSVENDIHGLRKVIDDTNITRLQLETEIEALKEELLFMKKNHE
                     EEVKGLQAQIASSGLTVEVDAPKSQDLAKIMADIRAQYDELARKNREELDKYWSQQIE
                     ESTTVVTTQSAEVGAAETTLTELRRTVQSLEIDLDSMRNLKASLENSLREVEARYALQ
                     MEQLNGILLHLESELAQTRAEGQRQAQEYEALLNIKVKLEAEIATYRRLLEDGEDFNL
                     GDALDSSNSMQTIQKTTTRRIVDGKVVSETNDTKVLRH"
BASE COUNT          364 a          392 c          423 g          237 t
ORIGIN      
        1 ccgtcgtccg caaagcctga gtcctgtcct ttctctctcc ccggacagca tgagcttcac
       61 cactcgctcc accttctcca ccaactaccg gtccctgggc tctgtccagg cgcccagcta
      121 cggcgcccgg ccggtcagca gcgcggccag cgtctatgca ggcgctgggg gctctggttc
      181 ccggatctcc gtgtcccgct ccaccagctt caggggcggc atggggtccg ggggcctggc
      241 caccgggata gccgggggtc tggcaggaat gggaggcatc cagaacgaga aggagaccat
      301 gcaaagcctg aacgaccgcc tggcctctta cctggacaga gtgaggagcc tggagaccga
      361 gaaccggagg ctggagagca aaatccggga gcacttggag aagaagggac cccaggtcag
      421 agactggagc cattacttca agatcatcga ggacctgagg gctcagatct tcgcaaatac
      481 tgtggacaat gcccgcatcg ttctgcagat tgacaatgcc cgtcttgctg ctgatgactt
      541 tagagtcaag tatgagacag agctggccat gcgccagtct gtggagaacg acatccatgg
      601 gctccgcaag gtcattgatg acaccaatat cacacgactg cagctggaga cagagatcga
      661 ggctctcaag gaggagctgc tcttcatgaa gaagaaccac gaagaggaag taaaaggcct
      721 acaagcccag attgccagct ctgggttgac cgtggaggta gatgccccca aatctcagga
      781 cctcgccaag atcatggcag acatccgggc ccaatatgac gagctggctc ggaagaaccg
      841 agaggagcta gacaagtact ggtctcagca gattgaggag agcaccacag tggtcaccac
      901 acagtctgct gaggttggag ctgctgagac gacgctcaca gagctgagac gtacagtcca
      961 gtccttggag atcgacctgg actccatgag aaatctgaag gccagcttgg agaacagcct
     1021 gagggaggtg gaggcccgct acgccctaca gatggagcag ctcaacggga tcctgctgca
     1081 ccttgagtca gagctggcac agacccgggc agagggacag cgccaggccc aggagtatga
     1141 ggccctgctg aacatcaagg tcaagctgga ggctgagatc gccacctacc gccgcctgct
     1201 ggaagatggc gaggacttta atcttggtga tgccttggac agcagcaact ccatgcaaac
     1261 catccaaaag accaccaccc gccggatagt ggatggcaaa gtggtgtctg agaccaatga
     1321 caccaaagtt ctgaggcatt aagccagcag aagcagggta ccctttgggg agcaggaggc
     1381 caataaaaag ttcagagttc aaaaaaaaaa aaaaaa
//