LOCUS       X06268                  1382 bp    mRNA    linear   HUM 13-JUL-1995
DEFINITION  Human mRNA for pro-alpha 1 (II) collagen  3'end C-term. triple
            helical and C-terminal non-helical domain.
ACCESSION   X06268 X02664 X06584
VERSION     X06268.1
KEYWORDS    collagen; collagen alpha 1 type II.
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 1382)
  AUTHORS   Vuorio E.
  JOURNAL   Submitted (19-NOV-1987) to the INSDC. Vuorio E., Univ. of Turku,
            Dept. of Medical Biochemistry, Kiinamyllynkatu 10, SF-20520 Turku,
            Finland.
REFERENCE   2  (bases 1 to 1382)
  AUTHORS   Vuorio E., Vuorio T., Elima K.
  TITLE     Determination of the single polyadenylation site of the human pro
            alpha 1(II) collagen gene.
  JOURNAL   Nucleic Acids Res. 15(22), 9499-9504(1987).
   PUBMED   2825137
REFERENCE   3  (bases 343 to 879)
  AUTHORS   Elima K., Maekelae J.K., Vuorio T., Kauppinen S., Knowles J.,
            Vuorio E.
  TITLE     Construction and identification of a cDNA clone for human type II
            procollagen mRNA
  JOURNAL   Biochem. J. 229(1), 183-188(1985).
   PUBMED   3840017
COMMENT     Data kindly reviewed (7-OCT-1988) by Elima K.
FEATURES             Location/Qualifiers
     source          1..1382
                     /db_xref="H-InvDB:HIT000321172"
                     /organism="Homo sapiens"
                     /map="12ql.31-32"
                     /mol_type="mRNA"
                     /clone="pHCAR3"
                     /tissue_type="epiphyseal cartilage"
                     /db_xref="taxon:9606"
     CDS             <1..942
                     /codon_start=1
                     /product="pro-alpha 1 (II) collagen (313 AA; AA 975-271c)"
                     /db_xref="GOA:P02458"
                     /db_xref="H-InvDB:HIT000321172.14"
                     /db_xref="HGNC:HGNC:2200"
                     /db_xref="InterPro:IPR000885"
                     /db_xref="InterPro:IPR001007"
                     /db_xref="InterPro:IPR008160"
                     /db_xref="PDB:1U5M"
                     /db_xref="PDB:2FSE"
                     /db_xref="PDB:2SEB"
                     /db_xref="PDB:5NIR"
                     /db_xref="PDB:5OCX"
                     /db_xref="PDB:5OCY"
                     /db_xref="PDB:6BIN"
                     /db_xref="UniProtKB/Swiss-Prot:P02458"
                     /protein_id="CAA29604.1"
                     /translation="DGANGIPGPIGPPGPRGRSGETGPAGPPGNPGPPGPPGPPGPGI
                     DMSAFAGLGPREKGPDPLQYMRADQAAGGLRQHDAEVDATLKSLNNQIESIRSPEGSR
                     KNPARTCRDLKLCHPEWKSGDYWIDPNQGCTLDAMKVFCNMETGETCVYPNPANVPKK
                     NWWSSKSKEKKHIWFGETINGGFHFSYGDDNLAPNTANVQMTFLRLLSTEGSQNITYH
                     CKNSIAYLDEAAGNLKKALLIQGSNDVEIRAEGNSRFTYTALKDGCTKHTGKWGKTVI
                     EYRSQKTSRLPIIDIAPMDIGGPEQEFGVDIGPVCFL"
     misc_feature    <1..120
                     /note="triple-helical domain"
     exon            <1..75
                     /note="exon 5"
     exon            76..364
                     /note="exon 4"
     misc_feature    121..201
                     /note="C-terminal telopeptide domain"
     misc_feature    202..939
                     /note="C-terminal propeptide domain"
     exon            365..552
                     /note="exon 3"
     exon            553..795
                     /note="exon 2"
     exon            796..939
                     /note="exon 1"
     regulatory      1354..1359
                     /note="polyA signal"
                     /regulatory_class="polyA_signal_sequence"
     polyA_site      1359..1359
                     /note="polyA site"
BASE COUNT          353 a          407 c          341 g          281 t
ORIGIN      
        1 gatggtgcta atggaatccc tggccccatt gggcctcctg gtccccgtgg acgatcaggc
       61 gaaaccggcc ctgctggtcc tcctggaaat cctggacccc ctggtcctcc aggtccccct
      121 ggccctggca tcgacatgtc cgcctttgct ggcttaggcc cgagagagaa gggccccgac
      181 cccctgcagt acatgcgggc cgaccaggca gccggtggcc tgagacagca tgacgccgag
      241 gtggatgcca cactcaagtc cctcaacaac cagattgaga gcatccgcag ccccgagggc
      301 tcccgcaaga accctgctcg cacctgcaga gacctgaaac tctgccaccc tgagtggaag
      361 agtggagact actggattga ccccaaccaa ggctgcacct tggacgccat gaaggttttc
      421 tgcaacatgg agactggcga gacttgcgtc taccccaatc cagcaaacgt tcccaagaag
      481 aactggtgga gcagcaagag caaggagaag aaacacatct ggtttggaga aaccatcaat
      541 ggtggcttcc atttcagcta tggagatgac aatctggctc ccaacactgc caacgtccag
      601 atgaccttcc tacgcctgct gtccacggaa ggctcccaga acatcaccta ccactgcaag
      661 aacagcattg cctatctgga cgaagcagct ggcaacctca agaaggccct gctcatccag
      721 ggctccaatg acgtggagat ccgggcagag ggcaatagca ggttcacgta cactgccctg
      781 aaggatggct gcacgaaaca taccggtaag tggggcaaga ctgttatcga gtaccggtca
      841 cagaagacct cacgcctccc catcattgac attgcaccca tggacatagg agggcccgag
      901 caggaattcg gtgtggacat agggccggtc tgcttcttgt aaaaacctga acccagaaac
      961 aacacaatcc gttgcaaacc caaaggaccc aagtactttc caatctcagt cactctagga
     1021 ctctgcactg aatggctgac ctgacctgat gtccattcat cccaccctct cacagttcgg
     1081 acttttctcc cctctctttc taagagacct gaactgggca gactgcaaaa taaaatctcg
     1141 gtgttctatt tatttattgt cttcctgtaa gaccttcggg tcaaggcaga ggcaggaaac
     1201 taactggtgt gagtcaaatg ccccctgagt gactgccccc agcccaggcc agaagacctc
     1261 ccttcaggtg ccgggcgcag gaactgtgtg tgtcctacac aatggtgcta ttctgtgtca
     1321 aacacctctg tattttttaa aacatcaatt gatattaaaa atgaaaagat tattggaaag
     1381 ta
//