LOCUS       X04571                  4871 bp    mRNA    linear   HUM 07-OCT-2008
DEFINITION  Human mRNA for kidney epidermal growth factor (EGF) precursor.
ACCESSION   X04571
VERSION     X04571.1
KEYWORDS    epidermal growth factor; glycoprotein; growth factor; membrane
            protein; signal peptide.
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 4871)
  AUTHORS   Bell G.I., Fong N.M., Stempien M.M., Wormsted M.A., Caput D.,
            Ku L., Urdea M.S., Rall L.B., Sanchez-Pescador R.
  TITLE     Human epidermal growth factor precursor: cDNA sequence, expression
            in vitro and gene organization
  JOURNAL   Nucleic Acids Res. 14(21), 8427-8446(1986).
   PUBMED   3491360
REFERENCE   2  (bases 4242 to 4243)
  AUTHORS   Bell G.I.
  JOURNAL   Submitted (21-MAY-1987) to the INSDC.
FEATURES             Location/Qualifiers
     source          1..4871
                     /db_xref="H-InvDB:HIT000321049"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /dev_stage="adult"
                     /tissue_type="kidney"
                     /db_xref="taxon:9606"
     CDS             437..4060
                     /note="precursor polypeptide (AA -22 to 1185)"
                     /db_xref="GOA:P01133"
                     /db_xref="H-InvDB:HIT000321049.15"
                     /db_xref="HGNC:HGNC:3229"
                     /db_xref="InterPro:IPR000033"
                     /db_xref="InterPro:IPR000152"
                     /db_xref="InterPro:IPR000742"
                     /db_xref="InterPro:IPR001881"
                     /db_xref="InterPro:IPR009030"
                     /db_xref="InterPro:IPR011042"
                     /db_xref="InterPro:IPR013032"
                     /db_xref="InterPro:IPR016317"
                     /db_xref="InterPro:IPR018097"
                     /db_xref="PDB:1IVO"
                     /db_xref="PDB:1JL9"
                     /db_xref="PDB:1NQL"
                     /db_xref="PDB:1P9J"
                     /db_xref="PDB:2KV4"
                     /db_xref="PDB:3NJP"
                     /db_xref="UniProtKB/Swiss-Prot:P01133"
                     /protein_id="CAA28240.1"
                     /translation="MLLTLIILLPVVSKFSFVSLSAPQHWSCPEGTLAGNGNSTCVGP
                     APFLIFSHGNSIFRIDTEGTNYEQLVVDAGVSVIMDFHYNEKRIYWVDLERQLLQRVF
                     LNGSRQERVCNIEKNVSGMAINWINEEVIWSNQQEGIITVTDMKGNNSHILLSALKYP
                     ANVAVDPVERFIFWSSEVAGSLYRADLDGVGVKALLETSEKITAVSLDVLDKRLFWIQ
                     YNREGSNSLICSCDYDGGSVHISKHPTQHNLFAMSLFGDRIFYSTWKMKTIWIANKHT
                     GKDMVRINLHSSFVPLGELKVVHPLAQPKAEDDTWEPEQKLCKLRKGNCSSTVCGQDL
                     QSHLCMCAEGYALSRDRKYCEDVNECAFWNHGCTLGCKNTPGSYYCTCPVGFVLLPDG
                     KRCHQLVSCPRNVSECSHDCVLTSEGPLCFCPEGSVLERDGKTCSGCSSPDNGGCSQL
                     CVPLSPVSWECDCFPGYDLQLDEKSCAASGPQPFLLFANSQDIRHMHFDGTDYGTLLS
                     QQMGMVYALDHDPVENKIYFAHTALKWIERANMDGSQRERLIEEGVDVPEGLAVDWIG
                     RRFYWTDRGKSLIGRSDLNGKRSKIITKENISQPRGIAVHPMAKRLFWTDTGINPRIE
                     SSSLQGLGRLVIASSDLIWPSGITIDFLTDKLYWCDAKQSVIEMANLDGSKRRRLTQN
                     DVGHPFAVAVFEDYVWFSDWAMPSVIRVNKRTGKDRVRLQGSMLKPSSLVVVHPLAKP
                     GADPCLYQNGGCEHICKKRLGTAWCSCREGFMKASDGKTCLALDGHQLLAGGEVDLKN
                     QVTPLDILSKTRVSEDNITESQHMLVAEIMVSDQDDCAPVGCSMYARCISEGEDATCQ
                     CLKGFAGDGKLCSDIDECEMGVPVCPPASSKCINTEGGYVCRCSEGYQGDGIHCLDID
                     ECQLGVHSCGENASCTNTEGGYTCMCAGRLSEPGLICPDSTPPPHLREDDHHYSVRNS
                     DSECPLSHDGYCLHDGVCMYIEALDKYACNCVVGYIGERCQYRDLKWWELRHAGHGQQ
                     QKVIVVAVCVVVLVMLLLLSLWGAHYYRTQKLLSKNPKNPYEESSRDVRSRRPADTED
                     GMSSCPQPWFVVIKEHQDLKNGGQPVAGEDGQAADGSMQPTSWRQEPQLCGMGTEQGC
                     WIPVSSDKGSCPQVMERSFHMPSYGTQTLEGGVEKPHSLLSANPLWQQRALDPPHQME
                     LTQ"
     misc_feature    437..3532
                     /note="put. extracellular domain (AA 1 to 1010)"
     sig_peptide     437..502
                     /note="pot. signal peptide (AA -22 to -1)"
     misc_feature    548..556
                     /note="pot. N-glycosylation site"
     misc_feature    746..754
                     /note="pot. N-glycosylation site"
     misc_feature    785..793
                     /note="pot. N-glycosylation site"
     misc_feature    878..886
                     /note="pot. N-glycosylation site"
     misc_feature    1406..1414
                     /note="pot. N-glycosylation site"
     misc_feature    1646..1654
                     /note="pot. N-glycosylation site"
     misc_feature    2222..2230
                     /note="pot. N-glycosylation site"
     misc_feature    2879..2887
                     /note="pot. N-glycosylation site"
     misc_feature    3212..3220
                     /note="pot. N-glycosylation site"
     mat_peptide     3347..3505
                     /note="mature EGF (AA 949-1001)"
     misc_feature    3533..3607
                     /note="transmembrane domain (AA 1011-1035)"
     misc_feature    3608..4057
                     /note="cytoplasmic domain (AA 1036-1185)"
     old_sequence    4242..4243
                     /note="gc was cg in [1]"
                     /citation=[1]
     misc_feature    4852..4857
                     /note="pot. polyA signal"
BASE COUNT         1356 a          974 c         1187 g         1354 t
ORIGIN      
        1 gggagaggaa tcgtatctcc atatttcttc tttcagcccc aatccaaggg ttgtagctgg
       61 aactttccat cagttcttcc tttctttttc ctctctaagc ctttgccttg ctctgtcaca
      121 gtgaagtcag ccagagcagg gctgttaaac tctgtgaaat ttgtcataag ggtgtcaggt
      181 atttcttact ggcttccaaa gaaacataga taaagaaatc tttcctgtgg cttcccttgg
      241 caggctgcat tcagaaggtc tctcagttga agaaagagct tggaggacaa cagcacaaca
      301 ggagagtaaa agatgcccca gggctgaggc ctccgctcag gcagccgcat ctggggtcaa
      361 tcatactcac cttgcccggg ccatgctcca gcaaaatcaa gctgttttct tttgaaagtt
      421 caaactcatc aagattatgc tgctcactct tatcattctg ttgccagtag tttcaaaatt
      481 tagttttgtt agtctctcag caccgcagca ctggagctgt cctgaaggta ctctcgcagg
      541 aaatgggaat tctacttgtg tgggtcctgc acccttctta attttctccc atggaaatag
      601 tatctttagg attgacacag aaggaaccaa ttatgagcaa ttggtggtgg atgctggtgt
      661 ctcagtgatc atggattttc attataatga gaaaagaatc tattgggtgg atttagaaag
      721 acaacttttg caaagagttt ttctgaatgg gtcaaggcaa gagagagtat gtaatataga
      781 gaaaaatgtt tctggaatgg caataaattg gataaatgaa gaagttattt ggtcaaatca
      841 acaggaagga atcattacag taacagatat gaaaggaaat aattcccaca ttcttttaag
      901 tgctttaaaa tatcctgcaa atgtagcagt tgatccagta gaaaggttta tattttggtc
      961 ttcagaggtg gctggaagcc tttatagagc agatctcgat ggtgtgggag tgaaggctct
     1021 gttggagaca tcagagaaaa taacagctgt gtcattggat gtgcttgata agcggctgtt
     1081 ttggattcag tacaacagag aaggaagcaa ttctcttatt tgctcctgtg attatgatgg
     1141 aggttctgtc cacattagta aacatccaac acagcataat ttgtttgcaa tgtccctttt
     1201 tggtgaccgt atcttctatt caacatggaa aatgaagaca atttggatag ccaacaaaca
     1261 cactggaaag gacatggtta gaattaacct ccattcatca tttgtaccac ttggtgaact
     1321 gaaagtagtg catccacttg cacaacccaa ggcagaagat gacacttggg agcctgagca
     1381 gaaactttgc aaattgagga aaggaaactg cagcagcact gtgtgtgggc aagacctcca
     1441 gtcacacttg tgcatgtgtg cagagggata cgccctaagt cgagaccgga agtactgtga
     1501 agatgttaat gaatgtgctt tttggaatca tggctgtact cttgggtgta aaaacacccc
     1561 tggatcctat tactgcacgt gccctgtagg atttgttctg cttcctgatg ggaaacgatg
     1621 tcatcaactt gtttcctgtc cacgcaatgt gtctgaatgc agccatgact gtgttctgac
     1681 atcagaaggt cccttatgtt tctgtcctga aggctcagtg cttgagagag atgggaaaac
     1741 atgtagcggt tgttcctcac ccgataatgg tggatgtagc cagctctgcg ttcctcttag
     1801 cccagtatcc tgggaatgtg attgctttcc tgggtatgac ctacaactgg atgaaaaaag
     1861 ctgtgcagct tcaggaccac aaccattttt gctgtttgcc aattctcaag atattcgaca
     1921 catgcatttt gatggaacag actatggaac tctgctcagc cagcagatgg gaatggttta
     1981 tgccctagat catgaccctg tggaaaataa gatatacttt gcccatacag ccctgaagtg
     2041 gatagagaga gctaatatgg atggttccca gcgagaaagg cttattgagg aaggagtaga
     2101 tgtgccagaa ggtcttgctg tggactggat tggccgtaga ttctattgga cagacagagg
     2161 gaaatctctg attggaagga gtgatttaaa tgggaaacgt tccaaaataa tcactaagga
     2221 gaacatctct caaccacgag gaattgctgt tcatccaatg gccaagagat tattctggac
     2281 tgatacaggg attaatccac gaattgaaag ttcttccctc caaggccttg gccgtctggt
     2341 tatagccagc tctgatctaa tctggcccag tggaataacg attgacttct taactgacaa
     2401 gttgtactgg tgcgatgcca agcagtctgt gattgaaatg gccaatctgg atggttcaaa
     2461 acgccgaaga cttacccaga atgatgtagg tcacccattt gctgtagcag tgtttgagga
     2521 ttatgtgtgg ttctcagatt gggctatgcc atcagtaata agagtaaaca agaggactgg
     2581 caaagataga gtacgtctcc aaggcagcat gctgaagccc tcatcactgg ttgtggttca
     2641 tccattggca aaaccaggag cagatccctg cttatatcaa aacggaggct gtgaacatat
     2701 ttgcaaaaag aggcttggaa ctgcttggtg ttcgtgtcgt gaaggtttta tgaaagcctc
     2761 agatgggaaa acgtgtctgg ctctggatgg tcatcagctg ttggcaggtg gtgaagttga
     2821 tctaaagaac caagtaacac cattggacat cttgtccaag actagagtgt cagaagataa
     2881 cattacagaa tctcaacaca tgctagtggc tgaaatcatg gtgtcagatc aagatgactg
     2941 tgctcctgtg ggatgcagca tgtatgctcg gtgtatttca gagggagagg atgccacatg
     3001 tcagtgtttg aaaggatttg ctggggatgg aaaactatgt tctgatatag atgaatgtga
     3061 gatgggtgtc ccagtgtgcc cccctgcctc ctccaagtgc atcaacaccg aaggtggtta
     3121 tgtctgccgg tgctcagaag gctaccaagg agatgggatt cactgtcttg atattgatga
     3181 gtgccaactg ggggtgcaca gctgtggaga gaatgccagc tgcacaaata cagagggagg
     3241 ctatacctgc atgtgtgctg gacgcctgtc tgaaccagga ctgatttgcc ctgactctac
     3301 tccaccccct cacctcaggg aagatgacca ccactattcc gtaagaaata gtgactctga
     3361 atgtcccctg tcccacgatg ggtactgcct ccatgatggt gtgtgcatgt atattgaagc
     3421 attggacaag tatgcatgca actgtgttgt tggctacatc ggggagcgat gtcagtaccg
     3481 agacctgaag tggtgggaac tgcgccacgc tggccacggg cagcagcaga aggtcatcgt
     3541 ggtggctgtc tgcgtggtgg tgcttgtcat gctgctcctc ctgagcctgt ggggggccca
     3601 ctactacagg actcagaagc tgctatcgaa aaacccaaag aatccttatg aggagtcgag
     3661 cagagatgtg aggagtcgca ggcctgctga cactgaggat gggatgtcct cttgccctca
     3721 accttggttt gtggttataa aagaacacca agacctcaag aatgggggtc aaccagtggc
     3781 tggtgaggat ggccaggcag cagatgggtc aatgcaacca acttcatgga ggcaggagcc
     3841 ccagttatgt ggaatgggca cagagcaagg ctgctggatt ccagtatcca gtgataaggg
     3901 ctcctgtccc caggtaatgg agcgaagctt tcatatgccc tcctatggga cacagaccct
     3961 tgaagggggt gtcgagaagc cccattctct cctatcagct aacccattat ggcaacaaag
     4021 ggccctggac ccaccacacc aaatggagct gactcagtga aaactggaat taaaaggaaa
     4081 gtcaagaaga atgaactatg tcgatgcaca gtatcttttc tttcaaaagt agagcaaaac
     4141 tataggtttt ggttccacaa tctctacgac taatcaccta ctcaatgcct ggagacagat
     4201 acgtagttgt gcttttgttt gctcttttaa gcagtctcac tgcagtctta tttccaagta
     4261 agagtactgg gagaatcact aggtaactta ttagaaaccc aaattgggac aacagtgctt
     4321 tgtaaattgt gttgtcttca gcagtcaata caaatagatt tttgtttttg ttgttcctgc
     4381 agccccagaa gaaattaggg gttaaagcag acagtcacac tggtttggtc agttacaaag
     4441 taatttcttt gatctggaca gaacatttat atcagtttca tgaaatgatt ggaatattac
     4501 aataccgtta agatacagtg taggcattta actcctcatt ggcgtggtcc atgctgatga
     4561 ttttgccaaa atgagttgtg atgaatcaat gaaaaatgta atttagaaac tgatttcttc
     4621 agaattagat ggccttattt tttaaaatat ttgaatgaaa acattttatt tttaaaatat
     4681 tacacaggag gccttcggag tttcttagtc attactgtcc ttttccccta cagaattttc
     4741 cctcttggtg tgattgcaca gaatttgtat gtattttcag ttacaagatt gtaagtaaat
     4801 tgcctgattt gttttcatta tagacaacga tgaatttctt ctaattattt aaataaaatc
     4861 accaaaaaca t
//