LOCUS       X04665                  4434 bp    mRNA    linear   HUM 21-OCT-2008
DEFINITION  Human mRNA for thrombospondin.
ACCESSION   X04665
VERSION     X04665.1
KEYWORDS    glycoprotein; signal peptide; thrombospondin.
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 4434)
  AUTHORS   Lawler J., Hynes R.O.
  TITLE     The structure of human thrombospondin, an adhesive glycoprotein
            with multiple calcium-binding sites and homologies with several
            different proteins
  JOURNAL   J. Cell Biol. 103(5), 1635-1648(1986).
   PUBMED   2430973
COMMENT     Three types of repeating amino acid sequence are present in
            thrombospondin. The first is 57 amino acids long and shows homology
            with circumsporozoite protein from Plasmodium falciparum. The
            second is 50-60 amino acids long and shows homology with epidermal
            growth factor precursor. The third occurs as a continuous eightfold
            repeat of a 38-residue sequence; structural homology with
            parvalbumin and calmodulin indicates that these repeats constitute
            the multiple calcium-binding sites of thrombospondin.
            
            Data kindly reviewed (15-SEP-1987) by Lawler J.
FEATURES             Location/Qualifiers
     source          1..4434
                     /db_xref="H-InvDB:HIT000321055"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /cell_type="umbilical vein endothelial cells"
                     /db_xref="taxon:9606"
     CDS             76..3588
                     /note="precursor polypeptide (AA -18 to 1152)"
                     /db_xref="GOA:P07996"
                     /db_xref="H-InvDB:HIT000321055.14"
                     /db_xref="HGNC:HGNC:11785"
                     /db_xref="InterPro:IPR000742"
                     /db_xref="InterPro:IPR000884"
                     /db_xref="InterPro:IPR001007"
                     /db_xref="InterPro:IPR001791"
                     /db_xref="InterPro:IPR001881"
                     /db_xref="InterPro:IPR003367"
                     /db_xref="InterPro:IPR008859"
                     /db_xref="InterPro:IPR013032"
                     /db_xref="InterPro:IPR013320"
                     /db_xref="InterPro:IPR017897"
                     /db_xref="InterPro:IPR028499"
                     /db_xref="InterPro:IPR028974"
                     /db_xref="InterPro:IPR036383"
                     /db_xref="PDB:1LSL"
                     /db_xref="PDB:1UX6"
                     /db_xref="PDB:1Z78"
                     /db_xref="PDB:1ZA4"
                     /db_xref="PDB:2ERF"
                     /db_xref="PDB:2ES3"
                     /db_xref="PDB:2OUH"
                     /db_xref="PDB:2OUJ"
                     /db_xref="PDB:3R6B"
                     /db_xref="PDB:5FOE"
                     /db_xref="UniProtKB/Swiss-Prot:P07996"
                     /protein_id="CAA28370.1"
                     /translation="MGLAWGLGVLFLMHVCGTNRIPESGGDNSVFDIFELTGAARKGS
                     GRRLVKGPDPSSPAFRIEDANLIPPVPDDKFQDLVDAVRTEKGFLLLASLRQMKKTRG
                     TLLALERKDHSGQVFSVVSNGKAGTLDLSLTVQGKQHVVSVEEALLATGQWKSITLFV
                     QEDRAQLYIDCEKMENAELDVPIQSVFTRDLASIARLRIAKGGVNDNFQGVLQNVRFV
                     FGTTPEDILRNKGCSSSTSVLLTLDNNVVNGSSPAIRTNYIGHKTKDLQAICGISCDE
                     LSSMVLELRGLRTIVTTLQDSIRKVTEENKELANELRRPPLCYHNGVQYRNNEEWTVD
                     SCTECHCQNSVTICKKVSCPIMPCSNATVPDGECCPRCWPSDSADDGWSPWSEWTSCS
                     TSCGNGIQQRGRSCDSLNNRCEGSSVQTRTCHIQECDKRFKQDGGWSHWSPWSSCSVT
                     CGDGVITRIRLCNSPSPQMNGKPCEGEARETKACKKDACPINGGWGPWSPWDICSVTC
                     GGGVQKRSRLCNNPTPQFGGKDCVGDVTENQICNKQDCPIDGCLSNPCFAGVKCTSYP
                     DGSWKCGACPPGYSGNGIQCTDVDECKEVPDACFNHNGEHRCENTDPGYNCLPCPPRF
                     TGSQPFGQGVEHATANKQVCKPRNPCTDGTHDCNKNAKCNYLGHYSDPMYRCECKPGY
                     AGNGIICGEDTDLDGWPNENLVCVANATYHCKKDNCPNLPNSGQEDYDKDGIGDACDD
                     DDDNDKIPDDRDNCPFHYNPAQYDYDRDDVGDRCDNCPYNHNPDQADTDNNGEGDACA
                     ADIDGDGILNERDNCQYVYNVDQRDTDMDGVGDQCDNCPLEHNPDQLDSDSDRIGDTC
                     DNNQDIDEDGHQNNLDNCPYVPNANQADHDKDGKGDACDHDDDNDGIPDDKDNCRLVP
                     NPDQKDSDGDGRGDACKDDFDHDSVPDIDDICPENVDISETDFRRFQMIPLDPKGTSQ
                     NDPNWVVRHQGKELVQTVNCDPGLAVGYDEFNAVDFSGTFFINTERDDDYAGFVFGYQ
                     SSSRFYVVMWKQVTQSYWDTNPTRAQGYSGLSVKVVNSTTGPGEHLRNALWHTGNTPG
                     QVRTLWHDPRHIGWKDFTAYRWRLSHRPKTGFIRVVMYEGKKIMADSGPIYDKTYAGG
                     RLGLFVFSQEMVFFSDLKYECRDP"
     sig_peptide     76..129
                     /note="put. signal peptide (AA -18 to -1)"
     mat_peptide     130..3585
                     /note="mature peptide (AA 1-1152)"
     misc_feature    817..825
                     /note="pot. N-glycosylation site"
     misc_feature    1153..1161
                     /note="pot. N-glycosylation site"
     misc_feature    1636..1644
                     /note="pot. N-glycosylation site"
     misc_feature    2197..2205
                     /note="pot. N-glycosylation site"
     misc_feature    3226..3234
                     /note="pot. N-glycosylation site"
     misc_feature    3274..3282
                     /note="pot. N-glycosylation site"
BASE COUNT         1139 a         1185 c         1177 g          933 t
ORIGIN      
        1 gccgccctcg ccaccgctcc cggccgccgc gctccggtac acacaggatc cctgctgggc
       61 accaacagct ccaccatggg gctggcctgg ggactaggcg tcctgttcct gatgcatgtg
      121 tgtggcacca accgcattcc agagtctggc ggagacaaca gcgtgtttga catctttgaa
      181 ctcaccgggg ccgcccgcaa ggggtctggg cgccgactgg tgaagggccc cgacccttcc
      241 agcccagctt tccgcatcga ggatgccaac ctgatccccc ctgtgcctga tgacaagttc
      301 caagacctgg tggatgctgt gcggacagaa aagggtttcc tccttctggc atccctgagg
      361 cagatgaaga agacccgggg cacgctgctg gccctggagc ggaaagacca ctctggccag
      421 gtcttcagcg tggtgtccaa tggcaaggcg ggcaccctgg acctcagcct gaccgtccaa
      481 ggaaagcagc acgtggtgtc tgtggaagaa gctctcctgg caaccggcca gtggaagagc
      541 atcaccctgt ttgtgcagga agacagggcc cagctgtaca tcgactgtga aaagatggag
      601 aatgctgagt tggacgtccc catccaaagc gtcttcacca gagacctggc cagcatcgcc
      661 agactccgca tcgcaaaggg gggcgtcaat gacaatttcc agggggtgct gcagaatgtg
      721 aggtttgtct ttggaaccac accagaagac atcctcagga acaaaggctg ctccagctct
      781 accagtgtcc tcctcaccct tgacaacaac gtggtgaatg gttccagccc tgccatccgc
      841 actaactaca ttggccacaa gacaaaggac ttgcaagcca tctgcggcat ctcctgtgat
      901 gagctgtcca gcatggtcct ggaactcagg ggcctgcgca ccattgtgac cacgctgcag
      961 gacagcatcc gcaaagtgac tgaagagaac aaagagttgg ccaatgagct gaggcggcct
     1021 cccctatgct atcacaacgg agttcagtac agaaataacg aggaatggac tgttgatagc
     1081 tgcactgagt gtcactgtca gaactcagtt accatctgca aaaaggtgtc ctgccccatc
     1141 atgccctgct ccaatgccac agttcctgat ggagaatgct gtcctcgctg ttggcccagc
     1201 gactctgcgg acgatggctg gtctccatgg tccgagtgga cctcctgttc tacgagctgt
     1261 ggcaatggaa ttcagcagcg cggccgctcc tgcgatagcc tcaacaaccg atgtgagggc
     1321 tcctcggtcc agacacggac ctgccacatt caggagtgtg acaagagatt taaacaggat
     1381 ggtggctgga gccactggtc cccgtggtca tcttgttctg tgacatgtgg tgatggtgtg
     1441 atcacaagga tccggctctg caactctccc agcccccaga tgaacgggaa accctgtgaa
     1501 ggcgaagcgc gggagaccaa agcctgcaag aaagacgcct gccccatcaa tggaggctgg
     1561 ggtccttggt caccatggga catctgttct gtcacctgtg gaggaggggt acagaaacgt
     1621 agtcgtctct gcaacaaccc cacaccccag tttggaggca aggactgcgt tggtgatgta
     1681 acagaaaacc agatctgcaa caagcaggac tgtccaattg atggatgcct gtccaatccc
     1741 tgctttgccg gcgtgaagtg tactagctac cctgatggca gctggaaatg tggtgcttgt
     1801 ccccctggtt acagtggaaa tggcatccag tgcacagatg ttgatgagtg caaagaagtg
     1861 cctgatgcct gcttcaacca caatggagag caccggtgtg agaacacgga ccccggctac
     1921 aactgcctgc cctgcccccc acgcttcacc ggctcacagc ccttcggcca gggtgtcgaa
     1981 catgccacgg ccaacaaaca ggtgtgcaag ccccgtaacc cctgcacgga tgggacccac
     2041 gactgcaaca agaacgccaa gtgcaactac ctgggccact atagcgaccc catgtaccgc
     2101 tgcgagtgca agcctggcta cgctggcaat ggcatcatct gcggggagga cacagacctg
     2161 gatggctggc ccaatgagaa cctggtgtgc gtggccaatg cgacttacca ctgcaaaaag
     2221 gataattgcc ccaaccttcc caactcaggg caggaagact atgacaagga tggaattggt
     2281 gatgcctgtg atgatgacga tgacaatgat aaaattccag atgacaggga caactgtcca
     2341 ttccattaca acccagctca gtatgactat gacagagatg atgtgggaga ccgctgtgac
     2401 aactgtccct acaaccacaa cccagatcag gcagacacag acaacaatgg ggaaggagac
     2461 gcctgtgctg cagacattga tggagacggt atcctcaatg aacgggacaa ctgccagtac
     2521 gtctacaatg tggaccagag agacactgat atggatgggg ttggagatca gtgtgacaat
     2581 tgccccttgg aacacaatcc ggatcagctg gactctgact cagaccgcat tggagatacc
     2641 tgtgacaaca atcaggatat tgatgaagat ggccaccaga acaatctgga caactgtccc
     2701 tatgtgccca atgccaacca ggctgaccat gacaaagatg gcaagggaga tgcctgtgac
     2761 cacgatgatg acaacgatgg cattcctgat gacaaggaca actgcagact cgtgcccaat
     2821 cccgaccaga aggactctga cggcgatggt cgaggtgatg cctgcaaaga tgattttgac
     2881 catgacagtg tgccagacat cgatgacatc tgtcctgaga atgttgacat cagtgagacc
     2941 gatttccgcc gattccagat gattcctctg gaccccaaag ggacatccca aaatgaccct
     3001 aactgggttg tacgccatca gggtaaagaa ctcgtccaga ctgtcaactg tgatcctgga
     3061 ctcgctgtag gttatgatga gtttaatgct gtggacttca gtggcacctt cttcatcaac
     3121 accgaaaggg acgatgacta tgctggattt gtctttggct accagtccag cagccgcttt
     3181 tatgttgtga tgtggaagca agtcacccag tcctactggg acaccaaccc cacgagggct
     3241 cagggatact cgggcctttc tgtgaaagtt gtaaactcca ccacagggcc tggcgagcac
     3301 ctgcggaacg ccctgtggca cacaggaaac acccctggcc aggtgcgcac cctgtggcat
     3361 gaccctcgtc acataggctg gaaagatttc accgcctaca gatggcgtct cagccacagg
     3421 ccaaagacgg gtttcattag agtggtgatg tatgaaggga agaaaatcat ggctgactca
     3481 ggacccatct atgataaaac ctatgctggt ggtagactag ggttgtttgt cttctctcaa
     3541 gaaatggtgt tcttctctga cctgaaatac gaatgtagag atccctaatc atcaaattgt
     3601 tgattgaaag actgatcata aaccaatgct ggtattgcac cttctggaac tatgggcttg
     3661 agaaaacccc caggatcact tctccttggc ttccttcttt tctgtgcttg catcagtgtg
     3721 gactcctaga acgtgcgacc tgcctcaaga aaatgcagtt ttcaaaaaca gactcagcat
     3781 tcagcctcca atgaataaga catcttccaa gcatataaac aattgctttg gtttcctttt
     3841 gaaaaagcat ctacttgctt cagttgggaa ggtgcccatt ccactctgcc tttgtcacag
     3901 agcagggtgc tattgtgagg ccatctctga gcagtggact caaaagcatt ttcaggcatg
     3961 tcagagaagg gaggactcac tagaattagc aaacaaaacc accctgacat cctccttcag
     4021 gaacacgggg agcagaggcc aaagcactaa ggggagggcg catacccgag acgattgtat
     4081 gaagaaaata tggaggaact gttacatgtt cggtactaag tcattttcag gggattgaaa
     4141 gactattgct ggatttcatg atgctgactg gcgttagctg attaacccat gtaaataggc
     4201 acttaaatag aagcaggaaa gggagacaaa gactggcttc tggacttcct ccctgatccc
     4261 cacccttact catcacctgc agtggccaga attagggaat cagaatcgaa accagtgtaa
     4321 ggcagtgctg gctgccattg cctggtcaca ttgaaattgg tggcttcatt ctagatgtag
     4381 cttgtgcaga tgtagcagga aaataggaaa acctaccatc tcagtgagca ccag
//