LOCUS       X07173                  3089 bp    mRNA    linear   HUM 07-OCT-2008
DEFINITION  Human mRNA for second protein of inter-alpha-trypsin inhibitor
            complex.
ACCESSION   X07173
VERSION     X07173.1
KEYWORDS    inter-alpha-trypsin inhibitor.
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 3089)
  AUTHORS   Gebhard W., Schreitmueller T., Hochstrasser K.
  TITLE     Complementary DNA and derived amino acid sequence of the precursor
            of one of the three protein components of the inter-alpha-trypsin
            inhibitor complex
  JOURNAL   FEBS Lett. 229(1), 63-67(1988).
   PUBMED   2450046
COMMENT     [1] revisions partial sequence published in:
            Schreitmueller et. al. (1987) Biol. Chem. Hoppe-Seyler 368, 963-
            970; 3 differences revisioned
            
            Data kindly reviewed (17-APR-1988) by Gebhard W.
FEATURES             Location/Qualifiers
     source          1..3089
                     /db_xref="H-InvDB:HIT000321243"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /tissue_type="liver"
                     /db_xref="taxon:9606"
     CDS             64..2904
                     /product="trypsin inhibitor"
                     /note="preproprotein (AA -18 to 928)"
                     /db_xref="GOA:P19823"
                     /db_xref="H-InvDB:HIT000321243.12"
                     /db_xref="HGNC:HGNC:6167"
                     /db_xref="InterPro:IPR002035"
                     /db_xref="InterPro:IPR010600"
                     /db_xref="InterPro:IPR013694"
                     /db_xref="InterPro:IPR036465"
                     /db_xref="UniProtKB/Swiss-Prot:P19823"
                     /protein_id="CAA30160.1"
                     /translation="MKRLTCFFICFFLSEVSGFEIPINGLSEFVDYEDLVELAPGKFQ
                     LVAENRRYQRSLPGESEEMMEEVDQVTLYSYKVQSTITSRMATTMIQSKVVNNSPQPQ
                     NVVFDVQIPKGAFISNFSMTVDGKTFRSSIKEKTVGRALYAQARAKGKTAGLVRSSAL
                     DMENFRTEVNVLPGAKVQFELHYQEVKWRKLGSYEHRIYLQPGRLAKHLEVDVWVIEP
                     QGLRFLHVPDTFEGHFDGVPVISKGQQKAHVSFKPTVAQQRICPSCRETAVDGELVVL
                     YDVKREEKAGELEVFNGYFVHFFAPDNLDPIPKNILFVIDVSGSMWGVKMKQTVEAMK
                     TILDDLRAEDHFSVIDFNQNIRTWRNDLFQLQKHRLQIAKRYIEKIQPSGGTNINEAL
                     LRAIFILNEANNLGLLDPNSVSLIILVSDGDPTVGELKLSKIQKNVKENIQDNISLFS
                     LGMGFDVDYDFLKRLSNENHGIAQRIYGNQDTSSQLKKFYNQVSTPLLRNVQFNYPHT
                     SVTDVTQNNFHNYFGGSEIVVAGKFDPAKLDQIESVITATSANTQLVLETLAQMDDLQ
                     DFLSKDKHADPDFTRKLWAYLTINQLLAERSLAPTAAAKRRITRSILQMSLDHHIVTP
                     LTSLVIENEAGDERMLADAPPQDPSCCSGALYYGSKVVPDSTPSWANPSPTPVISMLA
                     QGSQVLESTPPPHVMRVENDPHFIIYLPKSQKNICFNIDSEPGKILNLVSDPESGIVV
                     NGQLVGAKKPNNGKLSTYFGKLGFYFQSEDIKIEISTETITLSHGSSTFSLSWSDTAQ
                     VTNQRVQISVKKEKVVTITLDKEMSFSVLLHRVWKKHPVNVDFLGIYIPPTNKFSPKA
                     HGLIGQFMQEPKIHIFNERPGKDPEKPEASMEVKGQKLIITRGLQKDYRTDLVFGTDV
                     TCWFVHNSGKGFIDGHYKDYFVPQLYSFLKRP"
     sig_peptide     64..117
                     /note="signal peptide (AA -18 to -1)"
     mat_peptide     118..2901
                     /note="proprotein (AA 1 - 928)"
     misc_feature    226..226
                     /note="mat. peptide N-term."
     misc_feature    2158..2159
                     /note="pot. C-terminal processing site"
     misc_feature    2307..2308
                     /note="pot. C-terminal processing site"
     polyA_site      3089..3089
                     /note="polyA site"
BASE COUNT          925 a          701 c          711 g          752 t
ORIGIN      
        1 gaaagaagtg atatcctccc cagaccatct gctttgggga gcttggcaaa actgtccagc
       61 aaaatgaaaa gactcacgtg ctttttcatc tgcttctttc tttctgaagt atcaggcttc
      121 gaaatcccca taaatggact ttctgaattt gtagactatg aagatcttgt ggaactggcc
      181 ccaggcaaat ttcaattggt ggcagagaac cggagatatc agagaagcct tccaggagaa
      241 tcggaagaaa tgatggaaga ggttgatcaa gtaactcttt atagctataa agtccagtct
      301 actattactt ctcggatggc caccaccatg atccagagca aagtggtgaa caattccccg
      361 cagcctcaga atgtcgtgtt tgatgttcag atccccaaag gagcattcat ttccaacttc
      421 tccatgactg tggacggcaa gacatttagg agctctatta aggagaaaac tgtgggccga
      481 gctctttatg cacaggccag agcaaaaggc aagacggctg gcttggtgag gagcagcgct
      541 cttgatatgg aaaacttcag aacggaagta aatgtcctcc caggagcaaa ggtgcagttc
      601 gaacttcact accaggaggt gaagtggagg aagctgggct cctatgagca caggatctat
      661 ctgcaacctg gacggctggc caaacactta gaggtagatg tgtgggttat cgaaccacag
      721 ggactgagat ttcttcatgt tcccgacaca tttgaaggcc atttcgatgg tgttccggtc
      781 atttctaaag gacaacagaa ggcgcacgtc tccttcaagc ccacggtagc acagcagaga
      841 atatgcccta gctgccggga gactgcggta gatggggaac tggtggtgct gtatgacgtg
      901 aaaagagaag agaaggctgg tgaactggag gtgtttaatg gatattttgt ccacttcttt
      961 gctcctgaca acctggaccc aattcccaaa aacatcctct ttgtcatcga tgtgagtggc
     1021 tccatgtggg gagttaaaat gaaacaaact gtggaagcaa tgaagaccat attggatgac
     1081 ctcagagcag aagaccattt ctctgtgatt gatttcaacc agaacattcg aacttggaga
     1141 aatgatttat ttcagctaca aaaacacagg ttgcagatag ccaagaggta tattgagaaa
     1201 atccagccca gtggaggcac aaacatcaac gaagcactcc tacgggcaat cttcattttg
     1261 aatgaagcca ataacttggg actgttagac cccaactccg tctcgctgat cattttggtt
     1321 tctgatggag atccaacagt gggcgaacta aaactgtcaa aaattcagaa aaacgttaag
     1381 gagaacatcc aagacaatat ctccttgttc agtttgggca tgggatttga tgtggactat
     1441 gattttttga agagactgtc caatgaaaac catggaattg cacaaaggat ttatggaaac
     1501 caggacacgt cttcccagct taagaaattc tacaaccagg tctccactcc attgctccgg
     1561 aatgttcagt tcaactatcc ccatacatca gtcacggacg tcactcaaaa caatttccat
     1621 aactactttg gaggctcaga gattgtggtg gcaggaaaat ttgaccctgc taaattggat
     1681 caaatagaga gcgttatcac ggcgacttcg gctaacacgc agttagtctt ggagaccctg
     1741 gcccagatgg acgacttgca ggattttcta tcgaaagaca agcatgcaga tcccgatttc
     1801 accaggaaac tgtgggccta tctaaccatc aaccaactgc tagctgaacg aagcctggct
     1861 cctacagctg ccgccaagag aagaattaca agatcgatcc tgcagatgtc tctagaccac
     1921 cacattgtga ctccgctgac ctcgctggtg atcgagaacg aggctgggga tgagcgcatg
     1981 ctggcggatg ccccaccgca ggatccctcc tgctgctcag gggccctgta ttacggcagc
     2041 aaagtggttc cagattccac cccgtcttgg gccaatcctt caccaacgcc cgtgatctcc
     2101 atgctggcac aaggatctca ggtgctagag tccacgccac ccccacatgt gatgagagtt
     2161 gaaaatgacc cacatttcat catttatcta ccaaaaagcc aaaagaacat ttgtttcaat
     2221 attgactcag aacctggaaa aatcctcaac ctggtttctg acccagaatc aggaattgta
     2281 gtcaacggtc agcttgttgg tgccaagaag cccaacaatg gaaaactaag cacctatttt
     2341 ggaaaactgg gattttattt ccaaagtgaa gacataaaaa tagaaatcag cactgagacc
     2401 atcaccctga gccatggttc tagcacattc tccttgtcct ggtccgacac ggctcaagtc
     2461 acgaatcaga gggtgcagat ctcagtgaag aaagaaaaag tggtaactat caccctggat
     2521 aaagagatgt ccttttctgt tttacttcat cgtgtttgga agaagcatcc cgtcaatgtt
     2581 gactttctgg gaatctacat accccctaca aacaagttct cacctaaagc ccacggacta
     2641 ataggccagt tcatgcagga accaaagata cacatcttca atgagagacc aggaaaggac
     2701 cctgagaagc cagaggccag catggaagtg aaggggcaga agctgatcat caccaggggc
     2761 ttacagaaag actacagaac ggatctagtg tttggaacgg acgttacctg ctggtttgtg
     2821 cacaacagtg gaaaaggatt cattgacggg cattacaagg attacttcgt gcctcagctc
     2881 tacagctttc tcaaacggcc ttaaaggttt atagtttggg aaattatata tattaatata
     2941 catctttccc ctgtcacttt tgcagatatt cttcggtttg aataattaaa atgaaccaga
     3001 tatcagggtg gttaattaaa atgaaccaga tatcagggtg gtttataaag cctgtaaaca
     3061 cacctaagaa aataaacatt ttacaaatg
//