LOCUS HSU27109 4198 bp mRNA linear HUM 04-AUG-1995 DEFINITION Human prepromultimerin mRNA, complete cds. ACCESSION U27109 VERSION U27109.1 KEYWORDS . SOURCE Homo sapiens (human) ORGANISM Homo sapiens Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini; Catarrhini; Hominidae; Homo. REFERENCE 1 (bases 1 to 4198) AUTHORS Hayward,C.P., Hassell,J.A., Denomme,G.A., Rachubinski,R.A., Brown,C. and Kelton,J.G. TITLE The cDNA sequence of human endothelial cell multimerin. A unique protein with RGDS, coiled-coil, and epidermal growth factor-like domains and a carboxyl terminus similar to the globular domain of complement C1q and collagens type VIII and X JOURNAL J. Biol. Chem. 270 (31), 18246-18251 (1995) PUBMED 7629143 REFERENCE 2 (bases 1 to 4198) AUTHORS Hayward,C.P. TITLE Direct Submission JOURNAL Submitted (15-MAY-1995) Catherine P. M. Hayward, Pathology, McMaster University, HSC 2N32, 1200 Main St. W., Hamilton, Ontario L8N 3Z5, Canada FEATURES Location/Qualifiers source 1..4198 /db_xref="H-InvDB:HIT000218849" /organism="Homo sapiens" /mol_type="mRNA" /db_xref="taxon:9606" /clone="overlapping clones: mmlambda 4, 5, 7, 11 & 17" /cell_type="endothelial" /clone_lib="Clonetech library and libraries VII-91-4 and VII-91-5 (J Biol Chem 262 page 3718)" 5'UTR 1..71 CDS 72..3758 /codon_start=1 /product="prepromultimerin" /protein_id="AAC52065.1" /translation="MKGARLFVLLSSLWSGGIGLNNSKHSWTIPEDGNSQKTMPSASV PPNKIQSLQILPTTRVMSAEIATTPEARTSEDSLLKSTLPPSETSAPAEGVRNQTLTS TEKAEGVVKLQNLTLPTNASIKFNPGAESVVLSNSTLKFLQSFARKSNEQATSLNTVG GTGGIGGVGGTGGVGNRAPRETYLSRGDSSSSQRTDYQKSNFETTRGKNWCAYVHTRL SPTVTLDNQVTYVPGGKGPCGWTGGSCPQRSQKISNPVYRMQHKIVTSLDWRCCPGYS GPKCQLRAQEQQSLIHTNQAESHTAVGRGVAEQQQQQGCGDPEVMQKMTDQVNYQAMK LTLLQKKIDNISLTVNDVRNTYSSLEGKVSEDKSREFQSLLKGLKSKSINVLIRDIVR EQFKIFQNDMQETVAQLFKTVSSLSEDLESTRQIIQKVNESVVSIAAQQKFVLVQENR PTLTDIVELRNHIVNVRQEMTLTCEKPIKELEVKQTHLEGALEQEHSRSILYYESLNK TLSKLKEVHEQLLSTEQVSDQKNAPAAESVSNNVTEYMSTLHENIKKQSLMMLQMFED LHIQESKINNLTVSLEMEKESLRGECEDMLSKCRNDFKFQLKDTEENLHVLNQTLAEV LFPMDNKMDKMSEQLNDLTYDMEILQPLLEQGASLRQTMTYEQPKEAIVIRKKIENLT SAVNSLNFIIKELTKRHNLLRNEVQGRDDALERRINEYALEMEDGLNKTMTIINNAID FIQDNYALKETLSTIKDNSEIHHKCTSDMETILTFIPQFHRLNDSIQTLVNDNQRYNF VLQVAKTLAGIPRDEKLNQSNFQKMYQMFNETTSQVRKYQQNMSHLEEKLLLTTKISK NFETRLQDIESKVTQTLIPYYISVKKGSVVTNERDQALQLQVLNSRFKALEAKSIHLS INFFSLNKTLHEVLTMCHNASTSVSELNATIPKWIKHSLPDIQLLQKGLTEFVEPIIQ IKTQAALSNSTCCIDRSLPGSLANVVKSQKQVKSLPKKINALKKPTVNLTTVLIGRTQ RNTDNIIYPEEYSSCSRHPCQNGGTCINGRTSFTCACRHPFTGDNCTIKLVEENALAP DFSKGSYRYAPMVAFFASHTYGMTIPGPILFNNLDVNYGASYTPRTGKFRIPYLGVYV FKYTIESFSAHISGFLVVDGIDKLAFESENINSEIHCDRVLTGDALLELNYGQEVWLR LAKGTIPAKFPPVTTFSGYLLYRT" sig_peptide 72..128 mat_peptide 129..3755 /product="multimerin" misc_structure 627..638 /note="encodes RGDS domain" misc_structure 876..911 /note="encodes partial EGF-like domain" misc_structure 1020..1196 /note="encodes putative coiled-coil structures in protein" misc_feature 1173..1199 /note="encodes sequence confirmed from protein sequencing" misc_structure 1269..1406 /note="encodes putative coiled-coil structures in protein" misc_structure 2073..2285 /note="encodes putative coiled-coil structures in protein" misc_structure 2523..2690 /note="encodes putative coiled-coil structures in protein" misc_feature 3183..3185 /note="encodes putative tyrosine sulfation site" misc_feature 3243..3245 /note="encodes putative asparagine hydroxylation site" misc_structure 3264..3299 /note="encodes EGF-like domain" misc_structure 3420..3755 /note="encodes putative globular head domain in protein" 3'UTR 3759..4198 regulatory 4179..4184 /regulatory_class="polyA_signal_sequence" BASE COUNT 1436 a 791 c 808 g 1163 t ORIGIN 1 ctgctatcaa aaaggccata aggattttgt ccccaaattt cacatgagct accttgcttc 61 aaactactga gatgaagggg gcaagattat ttgtccttct ttctagttta tggagtgggg 121 gcattgggct taacaacagt aagcattctt ggactatacc tgaggatggg aactctcaga 181 agactatgcc ttctgcttca gttcctccaa ataaaataca aagtttgcaa atactgccaa 241 ccactcgggt catgtcggcg gagatagcta caactccaga ggcaagaact tctgaagaca 301 gtcttcttaa atcaacactg cctccctcag aaacaagtgc acctgctgag ggtgtgagaa 361 atcaaactct cacatccaca gagaaagcag aaggagtggt caagttacag aatcttaccc 421 tcccaaccaa cgctagcatc aagttcaatc ctggagcaga atcagtggtc ctttccaatt 481 ctacactgaa atttcttcag agctttgcca gaaagtcaaa tgaacaagca acttctctaa 541 acacagttgg aggcactgga ggcattggag gcgttggagg cactggaggc gtgggaaatc 601 gagccccacg ggaaacatac ctcagccggg gtgacagcag ttccagccaa agaactgact 661 accaaaaatc aaatttcgaa acaactagag gaaagaattg gtgtgcttat gtacatacca 721 ggttatctcc cacagtgaca ttggacaacc aggtcactta tgtcccaggt gggaaaggac 781 cttgtggctg gaccggtgga tcctgtcctc agagatctca gaagatatcc aatcctgtct 841 ataggatgca acataaaatt gtcacctcat tggattggag gtgctgtcct ggatacagtg 901 ggccgaaatg tcaactaaga gcccaggaac agcaaagttt gatacacacc aaccaggctg 961 aaagtcatac agctgttggc agaggagtag ctgagcagca gcagcagcaa ggctgtggtg 1021 acccagaagt gatgcaaaaa atgactgatc aggtgaacta ccaggcaatg aaactgactc 1081 ttctgcagaa gaagattgac aatatttctt tgactgtgaa tgatgtaagg aacacttact 1141 cctccctaga aggaaaagtc agcgaagata aaagcagaga atttcaatct cttctaaaag 1201 gtctaaaatc caaaagcatt aatgtactga taagagacat agtaagagaa caatttaaaa 1261 tttttcaaaa tgacatgcaa gagactgtag cacagctctt caagactgta tcaagtctat 1321 cagaggacct cgaaagcacc aggcaaataa ttcaaaaagt taatgaatct gtggtttcaa 1381 tagcagccca gcaaaagttt gttttggtgc aagagaatcg gcccactttg actgatatag 1441 tggaactaag gaatcacatt gtgaatgtaa ggcaagaaat gactcttaca tgtgagaagc 1501 ctattaaaga actagaagta aagcagactc atttagaagg tgctctagaa caggaacact 1561 caagaagcat tctgtattat gaatccctca ataaaactct ttctaaattg aaggaagtac 1621 atgagcagct tttatcaact gaacaggtat cagaccagaa gaatgctcca gctgctgagt 1681 cagttagcaa taatgtcact gagtacatgt ctactttaca tgaaaatata aagaagcaga 1741 gtttgatgat gctgcaaatg tttgaagatt tgcacattca agaaagcaag attaacaatc 1801 tcaccgtctc tttggagatg gagaaagagt ctctcagagg tgaatgtgaa gacatgttat 1861 ccaaatgcag aaatgatttt aaatttcaac ttaaggacac agaagagaat ttacatgtgt 1921 taaatcaaac attggctgaa gttctctttc caatggacaa taagatggac aaaatgagtg 1981 agcaactaaa tgatttgact tatgatatgg agatccttca acccttgctt gagcagggag 2041 catcactcag acagacaatg acatatgaac aaccaaagga agcaatagtg ataaggaaaa 2101 agatagaaaa tctgactagt gctgtcaata gtctaaattt tattatcaaa gaacttacaa 2161 aaagacacaa cttacttaga aatgaagtac agggtcgtga tgatgcctta gaaagacgta 2221 tcaatgaata tgccttagaa atggaagatg gcctcaataa gacaatgact attataaata 2281 atgctattga tttcattcaa gataactatg ccctaaaaga gactttaagt actattaagg 2341 ataatagtga gatccatcat aaatgtacct ccgatatgga aactattttg acatttattc 2401 ctcagttcca ccgtctgaat gattctattc agactttggt caatgacaat cagagatata 2461 actttgtttt gcaagtcgcc aagacccttg caggtattcc cagagatgag aaactaaatc 2521 agtccaactt ccaaaagatg tatcaaatgt tcaatgaaac cacttcccaa gtgagaaaat 2581 accagcaaaa tatgagtcat ttggaagaaa aactactctt aactaccaag atttccaaaa 2641 attttgagac tcggttgcaa gacattgagt ctaaagttac ccagacgctc ataccttatt 2701 atatttcagt taaaaaaggc agtgtagtta caaatgagag agatcaggct cttcaactgc 2761 aagtattaaa ttccagattt aaggcgttgg aagcaaaatc tatccatctt tcaattaact 2821 tcttttcgct taacaaaact ctccacgaag ttttaacaat gtgtcacaat gcttctacaa 2881 gtgtgtcaga actgaatgct accatcccta agtggataaa acattccctg ccagatattc 2941 aacttcttca gaaaggtcta acagaatttg tggaaccaat aattcaaata aaaactcaag 3001 ctgccctatc taattcaact tgttgtatag atcgatcgtt gcctggtagt ctggcaaatg 3061 ttgtcaagtc tcagaagcaa gtaaaatcat tgccaaagaa aattaacgca cttaagaaac 3121 caacggtaaa tcttaccaca gtcctgatag gccggactca aagaaacacg gacaacataa 3181 tatatcctga ggagtattca agctgtagtc ggcatccgtg ccaaaatggg ggcacgtgca 3241 taaatggaag aactagcttt acctgtgcct gcagacatcc ttttactggt gacaactgca 3301 ctatcaagct tgtggaagaa aatgctttag ctccagattt ttccaaagga tcttacagat 3361 atgcacccat ggtggcattt tttgcatctc atacgtatgg aatgactata cctggtccta 3421 tcctgtttaa taacttggat gtcaattatg gagcttcata taccccaaga actggaaaat 3481 ttagaattcc gtatcttgga gtatatgttt tcaagtacac catcgagtca tttagtgctc 3541 atatttctgg atttttagtg gttgatggaa tagacaagct tgcatttgag tctgaaaata 3601 ttaacagtga aatacactgt gatagggttt taactgggga tgccttatta gaattaaatt 3661 atgggcagga agtctggtta cgacttgcaa aaggaacaat tccagccaag tttccccctg 3721 ttactacatt tagtggctat ttattatatc gtacataagt tagtatgaaa aacagactat 3781 cacctttatt gagaaacagc cagtgttttc atttatcttt gcttgcacat ctgctctgtt 3841 ttggtttttc tacaggaaat gaaaatcaac ttgttttttt aatatgagta aacttgtatg 3901 tctattttat aaaattattt gaatattgtt taatgtctga atatgaaaga gttcttgatc 3961 ctaaagaaat ttagtggcac agaaaacaaa gtgaatttgt tagcataatt attcctattc 4021 ttatttcttc attttaagtc attgcaatgg aaagtaatat tataaaacgg taattacaac 4081 atattatcag tcacagtttt ctttccaatt aaacacttaa cttttgttat tccctgtata 4141 taaatatata acacacattt tctagattca caaatttaaa taaattactc aaaaaatg //