LOCUS       HSU27109                4198 bp    mRNA    linear   HUM 04-AUG-1995
DEFINITION  Human prepromultimerin mRNA, complete cds.
ACCESSION   U27109
VERSION     U27109.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 4198)
  AUTHORS   Hayward,C.P., Hassell,J.A., Denomme,G.A., Rachubinski,R.A.,
            Brown,C. and Kelton,J.G.
  TITLE     The cDNA sequence of human endothelial cell multimerin. A unique
            protein with RGDS, coiled-coil, and epidermal growth factor-like
            domains and a carboxyl terminus similar to the globular domain of
            complement C1q and collagens type VIII and X
  JOURNAL   J. Biol. Chem. 270 (31), 18246-18251 (1995)
   PUBMED   7629143
REFERENCE   2  (bases 1 to 4198)
  AUTHORS   Hayward,C.P.
  TITLE     Direct Submission
  JOURNAL   Submitted (15-MAY-1995) Catherine P. M. Hayward, Pathology,
            McMaster University, HSC 2N32, 1200 Main St. W., Hamilton, Ontario
            L8N 3Z5, Canada
FEATURES             Location/Qualifiers
     source          1..4198
                     /db_xref="H-InvDB:HIT000218849"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /clone="overlapping clones: mmlambda 4, 5, 7, 11 & 17"
                     /cell_type="endothelial"
                     /clone_lib="Clonetech library and libraries VII-91-4 and
                     VII-91-5 (J Biol Chem 262 page 3718)"
     5'UTR           1..71
     CDS             72..3758
                     /codon_start=1
                     /product="prepromultimerin"
                     /protein_id="AAC52065.1"
                     /translation="MKGARLFVLLSSLWSGGIGLNNSKHSWTIPEDGNSQKTMPSASV
                     PPNKIQSLQILPTTRVMSAEIATTPEARTSEDSLLKSTLPPSETSAPAEGVRNQTLTS
                     TEKAEGVVKLQNLTLPTNASIKFNPGAESVVLSNSTLKFLQSFARKSNEQATSLNTVG
                     GTGGIGGVGGTGGVGNRAPRETYLSRGDSSSSQRTDYQKSNFETTRGKNWCAYVHTRL
                     SPTVTLDNQVTYVPGGKGPCGWTGGSCPQRSQKISNPVYRMQHKIVTSLDWRCCPGYS
                     GPKCQLRAQEQQSLIHTNQAESHTAVGRGVAEQQQQQGCGDPEVMQKMTDQVNYQAMK
                     LTLLQKKIDNISLTVNDVRNTYSSLEGKVSEDKSREFQSLLKGLKSKSINVLIRDIVR
                     EQFKIFQNDMQETVAQLFKTVSSLSEDLESTRQIIQKVNESVVSIAAQQKFVLVQENR
                     PTLTDIVELRNHIVNVRQEMTLTCEKPIKELEVKQTHLEGALEQEHSRSILYYESLNK
                     TLSKLKEVHEQLLSTEQVSDQKNAPAAESVSNNVTEYMSTLHENIKKQSLMMLQMFED
                     LHIQESKINNLTVSLEMEKESLRGECEDMLSKCRNDFKFQLKDTEENLHVLNQTLAEV
                     LFPMDNKMDKMSEQLNDLTYDMEILQPLLEQGASLRQTMTYEQPKEAIVIRKKIENLT
                     SAVNSLNFIIKELTKRHNLLRNEVQGRDDALERRINEYALEMEDGLNKTMTIINNAID
                     FIQDNYALKETLSTIKDNSEIHHKCTSDMETILTFIPQFHRLNDSIQTLVNDNQRYNF
                     VLQVAKTLAGIPRDEKLNQSNFQKMYQMFNETTSQVRKYQQNMSHLEEKLLLTTKISK
                     NFETRLQDIESKVTQTLIPYYISVKKGSVVTNERDQALQLQVLNSRFKALEAKSIHLS
                     INFFSLNKTLHEVLTMCHNASTSVSELNATIPKWIKHSLPDIQLLQKGLTEFVEPIIQ
                     IKTQAALSNSTCCIDRSLPGSLANVVKSQKQVKSLPKKINALKKPTVNLTTVLIGRTQ
                     RNTDNIIYPEEYSSCSRHPCQNGGTCINGRTSFTCACRHPFTGDNCTIKLVEENALAP
                     DFSKGSYRYAPMVAFFASHTYGMTIPGPILFNNLDVNYGASYTPRTGKFRIPYLGVYV
                     FKYTIESFSAHISGFLVVDGIDKLAFESENINSEIHCDRVLTGDALLELNYGQEVWLR
                     LAKGTIPAKFPPVTTFSGYLLYRT"
     sig_peptide     72..128
     mat_peptide     129..3755
                     /product="multimerin"
     misc_structure  627..638
                     /note="encodes RGDS domain"
     misc_structure  876..911
                     /note="encodes partial EGF-like domain"
     misc_structure  1020..1196
                     /note="encodes putative coiled-coil structures in protein"
     misc_feature    1173..1199
                     /note="encodes sequence confirmed from protein sequencing"
     misc_structure  1269..1406
                     /note="encodes putative coiled-coil structures in protein"
     misc_structure  2073..2285
                     /note="encodes putative coiled-coil structures in protein"
     misc_structure  2523..2690
                     /note="encodes putative coiled-coil structures in protein"
     misc_feature    3183..3185
                     /note="encodes putative tyrosine sulfation site"
     misc_feature    3243..3245
                     /note="encodes putative asparagine hydroxylation site"
     misc_structure  3264..3299
                     /note="encodes EGF-like domain"
     misc_structure  3420..3755
                     /note="encodes putative globular head domain in protein"
     3'UTR           3759..4198
     regulatory      4179..4184
                     /regulatory_class="polyA_signal_sequence"
BASE COUNT         1436 a          791 c          808 g         1163 t
ORIGIN      
        1 ctgctatcaa aaaggccata aggattttgt ccccaaattt cacatgagct accttgcttc
       61 aaactactga gatgaagggg gcaagattat ttgtccttct ttctagttta tggagtgggg
      121 gcattgggct taacaacagt aagcattctt ggactatacc tgaggatggg aactctcaga
      181 agactatgcc ttctgcttca gttcctccaa ataaaataca aagtttgcaa atactgccaa
      241 ccactcgggt catgtcggcg gagatagcta caactccaga ggcaagaact tctgaagaca
      301 gtcttcttaa atcaacactg cctccctcag aaacaagtgc acctgctgag ggtgtgagaa
      361 atcaaactct cacatccaca gagaaagcag aaggagtggt caagttacag aatcttaccc
      421 tcccaaccaa cgctagcatc aagttcaatc ctggagcaga atcagtggtc ctttccaatt
      481 ctacactgaa atttcttcag agctttgcca gaaagtcaaa tgaacaagca acttctctaa
      541 acacagttgg aggcactgga ggcattggag gcgttggagg cactggaggc gtgggaaatc
      601 gagccccacg ggaaacatac ctcagccggg gtgacagcag ttccagccaa agaactgact
      661 accaaaaatc aaatttcgaa acaactagag gaaagaattg gtgtgcttat gtacatacca
      721 ggttatctcc cacagtgaca ttggacaacc aggtcactta tgtcccaggt gggaaaggac
      781 cttgtggctg gaccggtgga tcctgtcctc agagatctca gaagatatcc aatcctgtct
      841 ataggatgca acataaaatt gtcacctcat tggattggag gtgctgtcct ggatacagtg
      901 ggccgaaatg tcaactaaga gcccaggaac agcaaagttt gatacacacc aaccaggctg
      961 aaagtcatac agctgttggc agaggagtag ctgagcagca gcagcagcaa ggctgtggtg
     1021 acccagaagt gatgcaaaaa atgactgatc aggtgaacta ccaggcaatg aaactgactc
     1081 ttctgcagaa gaagattgac aatatttctt tgactgtgaa tgatgtaagg aacacttact
     1141 cctccctaga aggaaaagtc agcgaagata aaagcagaga atttcaatct cttctaaaag
     1201 gtctaaaatc caaaagcatt aatgtactga taagagacat agtaagagaa caatttaaaa
     1261 tttttcaaaa tgacatgcaa gagactgtag cacagctctt caagactgta tcaagtctat
     1321 cagaggacct cgaaagcacc aggcaaataa ttcaaaaagt taatgaatct gtggtttcaa
     1381 tagcagccca gcaaaagttt gttttggtgc aagagaatcg gcccactttg actgatatag
     1441 tggaactaag gaatcacatt gtgaatgtaa ggcaagaaat gactcttaca tgtgagaagc
     1501 ctattaaaga actagaagta aagcagactc atttagaagg tgctctagaa caggaacact
     1561 caagaagcat tctgtattat gaatccctca ataaaactct ttctaaattg aaggaagtac
     1621 atgagcagct tttatcaact gaacaggtat cagaccagaa gaatgctcca gctgctgagt
     1681 cagttagcaa taatgtcact gagtacatgt ctactttaca tgaaaatata aagaagcaga
     1741 gtttgatgat gctgcaaatg tttgaagatt tgcacattca agaaagcaag attaacaatc
     1801 tcaccgtctc tttggagatg gagaaagagt ctctcagagg tgaatgtgaa gacatgttat
     1861 ccaaatgcag aaatgatttt aaatttcaac ttaaggacac agaagagaat ttacatgtgt
     1921 taaatcaaac attggctgaa gttctctttc caatggacaa taagatggac aaaatgagtg
     1981 agcaactaaa tgatttgact tatgatatgg agatccttca acccttgctt gagcagggag
     2041 catcactcag acagacaatg acatatgaac aaccaaagga agcaatagtg ataaggaaaa
     2101 agatagaaaa tctgactagt gctgtcaata gtctaaattt tattatcaaa gaacttacaa
     2161 aaagacacaa cttacttaga aatgaagtac agggtcgtga tgatgcctta gaaagacgta
     2221 tcaatgaata tgccttagaa atggaagatg gcctcaataa gacaatgact attataaata
     2281 atgctattga tttcattcaa gataactatg ccctaaaaga gactttaagt actattaagg
     2341 ataatagtga gatccatcat aaatgtacct ccgatatgga aactattttg acatttattc
     2401 ctcagttcca ccgtctgaat gattctattc agactttggt caatgacaat cagagatata
     2461 actttgtttt gcaagtcgcc aagacccttg caggtattcc cagagatgag aaactaaatc
     2521 agtccaactt ccaaaagatg tatcaaatgt tcaatgaaac cacttcccaa gtgagaaaat
     2581 accagcaaaa tatgagtcat ttggaagaaa aactactctt aactaccaag atttccaaaa
     2641 attttgagac tcggttgcaa gacattgagt ctaaagttac ccagacgctc ataccttatt
     2701 atatttcagt taaaaaaggc agtgtagtta caaatgagag agatcaggct cttcaactgc
     2761 aagtattaaa ttccagattt aaggcgttgg aagcaaaatc tatccatctt tcaattaact
     2821 tcttttcgct taacaaaact ctccacgaag ttttaacaat gtgtcacaat gcttctacaa
     2881 gtgtgtcaga actgaatgct accatcccta agtggataaa acattccctg ccagatattc
     2941 aacttcttca gaaaggtcta acagaatttg tggaaccaat aattcaaata aaaactcaag
     3001 ctgccctatc taattcaact tgttgtatag atcgatcgtt gcctggtagt ctggcaaatg
     3061 ttgtcaagtc tcagaagcaa gtaaaatcat tgccaaagaa aattaacgca cttaagaaac
     3121 caacggtaaa tcttaccaca gtcctgatag gccggactca aagaaacacg gacaacataa
     3181 tatatcctga ggagtattca agctgtagtc ggcatccgtg ccaaaatggg ggcacgtgca
     3241 taaatggaag aactagcttt acctgtgcct gcagacatcc ttttactggt gacaactgca
     3301 ctatcaagct tgtggaagaa aatgctttag ctccagattt ttccaaagga tcttacagat
     3361 atgcacccat ggtggcattt tttgcatctc atacgtatgg aatgactata cctggtccta
     3421 tcctgtttaa taacttggat gtcaattatg gagcttcata taccccaaga actggaaaat
     3481 ttagaattcc gtatcttgga gtatatgttt tcaagtacac catcgagtca tttagtgctc
     3541 atatttctgg atttttagtg gttgatggaa tagacaagct tgcatttgag tctgaaaata
     3601 ttaacagtga aatacactgt gatagggttt taactgggga tgccttatta gaattaaatt
     3661 atgggcagga agtctggtta cgacttgcaa aaggaacaat tccagccaag tttccccctg
     3721 ttactacatt tagtggctat ttattatatc gtacataagt tagtatgaaa aacagactat
     3781 cacctttatt gagaaacagc cagtgttttc atttatcttt gcttgcacat ctgctctgtt
     3841 ttggtttttc tacaggaaat gaaaatcaac ttgttttttt aatatgagta aacttgtatg
     3901 tctattttat aaaattattt gaatattgtt taatgtctga atatgaaaga gttcttgatc
     3961 ctaaagaaat ttagtggcac agaaaacaaa gtgaatttgt tagcataatt attcctattc
     4021 ttatttcttc attttaagtc attgcaatgg aaagtaatat tataaaacgg taattacaac
     4081 atattatcag tcacagtttt ctttccaatt aaacacttaa cttttgttat tccctgtata
     4141 taaatatata acacacattt tctagattca caaatttaaa taaattactc aaaaaatg
//