LOCUS       HSU52852                8672 bp    DNA     linear   HUM 13-MAR-2001
DEFINITION  Homo sapiens TS PST1 (STP1) gene, complete cds.
ACCESSION   U52852
VERSION     U52852.2
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 8672)
  AUTHORS   Raftogianis,R.B., Her,C. and Weinshilboum,R.M.
  TITLE     Human phenol sulfotransferase pharmacogenetics: STP1 gene cloning
            and structural characterization
  JOURNAL   Pharmacogenetics 6 (6), 473-487 (1996)
   PUBMED   9014197
REFERENCE   2  (bases 1 to 8672)
  AUTHORS   Carlini,E.J., Raftogianis,R.B., Wood,T.C., Jin,F., Zheng,W.,
            Rebbeck,T.R. and Weinshilboum,R.M.
  TITLE     Sulfation pharmacogenetics: SULT1A1 and SULT1A2 allele frequencies
            in Caucasian, Chinese and African-American subjects
  JOURNAL   Pharmacogenetics 11 (1), 57-68 (2001)
   PUBMED   11207031
REFERENCE   3  (bases 1 to 8672)
  AUTHORS   Raftogianis,R.B., Her,C. and Weinshilboum,R.M.
  TITLE     Direct Submission
  JOURNAL   Submitted (26-MAR-1996) R.B. Raftogianis, Pharmacology, Mayo
            Foundation, 200 First St. SW, Rochester, MN 55905, USA
REFERENCE   4  (bases 1 to 8672)
  AUTHORS   Raftogianis,R.B., Her,C. and Weinshilboum,R.M.
  TITLE     Direct Submission
  JOURNAL   Submitted (08-JUN-2000) R.B. Raftogianis, Pharmacology, Mayo
            Foundation, 200 First St. SW, Rochester, MN 55905, USA
  REMARK    Sequence update by submitter
COMMENT     On Jun 8, 2000 this sequence version replaced U52852.1.
FEATURES             Location/Qualifiers
     source          1..8672
                     /organism="Homo sapiens"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:9606"
                     /chromosome="16"
                     /map="16p12.1"
                     /note="cloned from NIGMS Hybrid Somatic cell line Mapping
                     Panel 2, cell line #GM/NA10479"
     gene            1..7065
                     /gene="STP1"
     misc_feature    1..2628
                     /gene="STP1"
                     /note="5' flanking region"
     mRNA            join(2629..2734,3806..3957,4062..4187,4277..4374,
                     5584..5710,5806..5900,6426..6606,6729..7065)
                     /gene="STP1"
     5'UTR           2629..2734
                     /gene="STP1"
                     /note="5' UTR alternative exon IB"
     mRNA            join(3337..3957,4062..4187,4277..4374,5584..5710,
                     5806..5900,6426..6606,6729..7065)
                     /gene="STP1"
     5'UTR           3337..3606
                     /gene="STP1"
                     /note="5' UTR alternative exon IA"
     exon            3806..3957
                     /gene="STP1"
                     /note="exon II"
     CDS             join(3810..3957,4062..4187,4277..4374,5584..5710,
                     5806..5900,6426..6606,6729..6841)
                     /gene="STP1"
                     /note="thermostable (monamine) phenol sulfotransferase"
                     /codon_start=1
                     /product="TS PST1"
                     /protein_id="AAC51816.1"
                     /translation="MELIQDTSRPPLEYVKGVPLIKYFAEALGPLQSFQARPDDLLIS
                     TYPKSGTTWVSQILDMIYQGGDLEKCHRAPIFMRVPFLEFKAPGIPSGMETLKDTPAP
                     RLLKTHLPLALLPQTLLDQKVKVVYVARNAKDVAVSYYHFYHMAKVHPEPGTWDSFLE
                     KFMVGEVSYGSWYQHVQEWWELSRTHPVLYLFYEDMKENPKREIQKILEFVGHSLPEE
                     TVDFMVQHTSFKEMKKNPMTNYTTVPQEFMDHSISPFMRKGMAGDWKTTFTVAQNERF
                     DADYAEKMAGCSLSFRSEL"
     exon            4062..4187
                     /gene="STP1"
                     /note="exon III"
     exon            4277..4374
                     /gene="STP1"
                     /note="exon IV"
     exon            5584..5710
                     /gene="STP1"
                     /note="exon V"
     exon            5806..5900
                     /gene="STP1"
                     /note="exon VI"
     exon            6426..6606
                     /gene="STP1"
                     /note="exon VII"
     exon            6729..7065
                     /gene="STP1"
                     /note="exon VIII"
     3'UTR           6842..7065
                     /gene="STP1"
     misc_feature    7066..8672
                     /note="3' flanking region"
BASE COUNT         1985 a         2355 c         2374 g         1958 t
ORIGIN      
        1 ttgctgccag ctgcctctcc ctccttgtct cttacctgcc tgctgcctgg gacaggatga
       61 agcggggccc ttgtgttgcc ccaaccctgg ctgttggcta agagcccacg tgatctgcct
      121 gtgagaggag ttccttccgg aagaaccagg gcagcttctg cccctagagg gccaatgccc
      181 tagctgagtg cagtcccccg gccccagcct ggtccagctt tgggaagagg gtgcccagtt
      241 gtgcaatcca ggccggggca gccgtgtcct gatcttggta ttcagggctg agcctggagg
      301 gggcttgtga tgcctgactc tgtctctctc tctggcccca tgccttggta gctgtgaggc
      361 gtcactgctt tgggtgacct gatctggctg tgatggatga gcacggggga aatagtggaa
      421 gactcggaat tagaagacgt gagtgggctt tggccccagc ctccctaccc cactccctgt
      481 cctgggctgc ctgtgaccaa ccttgtttct gcaggcacac tggatagccc tgctggagct
      541 cagtgtccct aatcccctcc agatactggt ggcctagggg aggtcatcaa agaccggtgg
      601 gacatcgacc tcagcccgtt tccacgcttt tttttgtttt tttttttttt ttgagaccga
      661 gtttcactct tgttgcccag gctggagtgc aatggcgtga tcttggctca ccgcaacctc
      721 cgcctcctgg gttcaagcga ttctcctgcc tcagcctccc aagtagctgg gattacaggc
      781 gtgtgccacc aggcttgact aattttctat ttttagtaga gacaaggttt ctccatgttg
      841 gtcaggctgg tctcaaactc ccgacttcag gtgatctgcc tgcctcggcc tcccaaagtg
      901 ctgggattac aggagtgagc caccgtgcca ggccttctcc aggctcttgg caccttagcc
      961 agaaacaatt taaggacaag tgcaaaagtc atgaatgtag gcagatttcc tgcagagtaa
     1021 agggactcac tcaagaagag gaacgtgggg gtcctcaaga gagtgtctca tgccctacaa
     1081 ggtgtggggc tgacctttat gggcttcttc aactaaagag gggtatattc atgaagagtc
     1141 caggaaaagg taaagatttc tcaagaccgt ggtgccacaa tttacaccca aatacaggtg
     1201 ttcctggagc cgtcttggca ctggtgggtg tacggtttca tatgttactg atcatacaat
     1261 gagatcctag gtgaaaccta catcaaatac agcgccatgt tgtgtctggt tggtcgtagc
     1321 cagcttggtc ctcatcctat ttttcaggga cttattggcc cttagcgcat gcagctattt
     1381 caagtttcct tcttctcctc atgtgaaact gctgcctggg attttgtatt cacttgctac
     1441 cactctatta atctcacatt ctcgcctctt ttctgtgtca ccccgtgtgg gtccgacagg
     1501 ttgttactag agtgcaatac aaagtcttag tcaagggaac ctcctgaggg ttgctgaggg
     1561 caggggtgga gctagtagcc tgaggacctg ccagtcacgg ggattcctca tgggcacaga
     1621 ggagggagga ggggtccatg gccctagcat atgagaagcc tctcctctgc ctggaattcc
     1681 catgcctcag cttcccccac actcccacct gtccgcttgc ctctgaactc acgcatttct
     1741 tggaagtctt gggagattca cctttactca gatggttgtt tacctgtctc gtgcacagct
     1801 tgaccttgga ctttaaagtg aggataaaga acgaggagga tggggggatg ccccccttcc
     1861 acggggccct gtggcttcca aacctcggcc tcctctggtc tcttgtctgt ggagcctcct
     1921 tcaaacccag ggaaataaaa ccacctgcca cgggttgtgg ttcttctagg atcttctatc
     1981 aatgttctct gaggtcccca ggagccatga agctggggct gactcccagg gcaatgggac
     2041 tgcagtgtcc ttgttctttc ttgttctatg catccatgct ctgctccacc cctgcccctt
     2101 cactctgccc acacacatcc ctctagactg gccttgtggt cagagcctgg agtgcatggg
     2161 ctgctggggg cctgtgggct gcactgggcc agaacccctg gcaccttcaa gactggcctg
     2221 gagccagcag gtaggtgacc tttccagggc ctgcctatcc cagctttctc ctccaatccc
     2281 tcccctctct tgcctgggtc aattagagag agcttgtctg ttggctgcct ggcagggtgg
     2341 agttcagggg caggtcagga gcccagtgac agctcggaaa aaaaaaaaaa aaaaaaaaaa
     2401 acagaaaaaa aaacctacaa aaacaaaccc accattgggc ctttcccctt tcattcttct
     2461 gttttctaca cagcaaactc agtcgtggct ttggagatca ctttaagctt gtctccagct
     2521 ggcacactaa ggagggtaat ggagaagctc ccccaccccc aaccccaccc cttccttccg
     2581 gaagcaaatc taagtccagc cccggctcca gatccctccc acagtggacc taggaaaccc
     2641 tcagctcaga gaacaaccct gcattcccca cacagcaccc acaatcagcc actgcgggcg
     2701 aggagggcac gaggccaggt tcccaagagc tcaggtgagt gacacagtgg aacggcccag
     2761 ggcgccctca ccctgctcag cttgtggctc taacattcca gaagctgagg cctctggcat
     2821 ccctgccctt tccccatgga tatcccattt cagacaaccc tggcctgcgt gaatccccct
     2881 cccttccctt gtttgtttgt ttttttcccc ggggaggcca ggtcttgctg tcacccaggc
     2941 tggagtgctg tgggatcctg gccactgcag ccttgaattc ctgggctcaa gtgattctct
     3001 tgcctcagcc tctggagtag ctaggactac aggccctcat catcctgcct ggttaatgtt
     3061 taagaatttt tttaaagatt tttagagatg gggtcttgca atgctgcacc aggttggtct
     3121 ccaactcctg gcctcagcct ccctagggtc tgggattata ggtgggagcc accctgccta
     3181 ggcctgtgct tttgctgagt catcagagtt ttgttcattc ccacagcagc tctggcccct
     3241 agtagcagct cagttcctca atgggccgtg tttgtcctgg agcccagatg gactgtggcc
     3301 aggcaagtgg atcacaggcc tggctggcct gggcggtttc cacatgtgag gggctgaggg
     3361 gctcaaggag gggagcatct ccactgggtg gaggctgggg gtcccagcag gaaatggtga
     3421 gacaaagggc gctggctggc agggagacag cacaggaagg tcctagagct tcctcagtgc
     3481 agctggactc tcctggagac cttcacacac cctgatatct gggccttgcc cgacgagggt
     3541 gctttcactg gtctgcacca tggcccaggc cctgggattt tgaacagctc cgcaggtgaa
     3601 tgaaaggtga ggccaggctg gggaaccacc gcattagagc ccgacctggt tttcagcccc
     3661 agccccgcca ctgactggct ttgtgagtgc gggcaagtca ctcagcctcc ctaggcctca
     3721 gtgacttccc tgaaagcaag aattccactt tcttgctgtt gtgatggtgg taagggaacg
     3781 ggcctggctc tggcccctga cgcaggaaca tggagctgat ccaggacacc tcccgcccgc
     3841 cactggagta cgtgaagggg gtcccgctca tcaagtactt tgcagaggca ctggggcccc
     3901 tgcagagctt ccaggcccgg cctgatgacc tgctcatcag cacctacccc aagtccggta
     3961 agtgaggagg gccacccacc ctctcccagg tggcagtccc caccttggcc agcgaggtcg
     4021 tgccctcagc ctgctcaccc cccatctccc tccctctcca ggcaccacct gggtgagcca
     4081 gattctggac atgatctacc agggtggtga cctggagaag tgtcaccgag ctcccatctt
     4141 catgcgggtg cccttccttg agttcaaagc cccagggatt ccctcaggtg tgtgagtgtg
     4201 tcctgggtgc aaggggagtg gaggaagaca gggctggggc ttcagctcac cagaccttcc
     4261 ctgacccact gctcagggat ggagactctg aaagacacac cggccccacg actcctgaag
     4321 acacacctgc ccctggctct gctcccccag actctgttgg atcagaaggt caaggtgagg
     4381 cagggcacag tgtttcacat ccataatccc agcactttgg gaggctgagg caggcagatc
     4441 acctgaggtt gggagtttga gagcaccctg agcaacatag aagaaccttg tctctactaa
     4501 aaatacagaa ttagccgggt gtggtggcgg gtgcctgtaa tcccagctac tccgaagcct
     4561 gagacaggag aatcacttga acccgggaga aggaggttgt ggtgagccag agatcccacc
     4621 attgcattcc agcctgagca acaagagcaa aactcacaaa aataaataaa taaatagata
     4681 tataaataaa aataaaactg tggcacctgt ggtggctcac tgctgtaatg ccagcacttt
     4741 gggaggccaa attgggtgga tcacttgagc tcaggagtta cagaccagcc cgggaaacat
     4801 ggggaacttc catctctata aaaatgcaaa atatcagcag ggcatggtgg catggcgctg
     4861 tagttccagc tactggaaag tctgaggttg gaggattgct tgagcctggg aggtcaaggt
     4921 tgcagtgagt tattatcact ccagtgcact ccaacctggg cgacagaaaa aaagaaagac
     4981 caaggtcttt tttctttttt gagattgtct caataaataa ataaatgaat aaataaaaat
     5041 aaaataaagt aaaataaatc ccacaattaa aagaaaaagc aaaggtccag gtgtggggca
     5101 tgtgaatcca gggaaggagg ccctggctca gcccagcttt ggtcctgttc ttctgggaaa
     5161 gtcgcctcac ttcctccagc cttgtctcat cttctgcggc ggggactgtc tgcctcttgc
     5221 tctgatgacc aagaacgtaa ggctcttcag tgtagaccta agaaagctag agggtgggtc
     5281 ctcacaggcc cacaaaattt ggtggcggtg ggatcacggc tggtggagcg tgccttgctc
     5341 cagatcgggg tgtgacgcat tgatgcagat tatattgcta tagaatatga tggtctcagg
     5401 gaccaggcag gactttggct tctgagcagg gttcagatcc tgacttggcc ctaccggtgc
     5461 cgtgagatct caaacaagtc agcctctaag cctcaggttc ctcctttgcc aatccaagag
     5521 atgagctggc ctggggcagg ctgtgtggtg atggtgctgg ggttgagtct tctgcccctg
     5581 caggtggtct atgttgcccg caacgcaaag gatgtggcag tttcctacta ccacttctac
     5641 cacatggcca aggtgcaccc tgagcctggg acctgggaca gcttcctgga gaagttcatg
     5701 gtcggagaag gtgggtttga tgggaggaag gaaagtgtgg agccgagggg tggtggctac
     5761 aacgcacagc aaccctgtgt tggcacccct tgcctgcttc tccagtgtcc tacggatcct
     5821 ggtaccagca cgtgcaggag tggtgggagc tgagccgcac ccaccctgtt ctctacctct
     5881 tctatgaaga catgaaggag gtgagaccac ctgtgaagct tccctccatg tgacacctgg
     5941 gggccggcac ctcacaggga cccaccaggg tcacccagcc ccctcccttg gcagccccca
     6001 cagcaggccc ggattcccca tcctgccttc ttggcccagg cctccccgct acaggcccca
     6061 cctggcagcg ggccccacac ggctctcatc acccacatct gagtcagctg catggggggc
     6121 cacggatcag aaacttagtc ctattgctac tccctgccaa agggtgtgcc acccagggcc
     6181 acagtcatgg aagaagacca tcacggtcct cacccatagg agccaagccc agctcatgat
     6241 gggatcacag ggcagacagc aattcttttt acccccggga ctggggccct gggggttgag
     6301 gagttggctc tgcagggtct ctaggagagg tggccagatc gcctctgagg ttagagaagg
     6361 ggaccccttt tacttttcct gaatcagcaa tccgagcctc cactgaggag ccctctgctg
     6421 ctcagaaccc caaaagggag attcaaaaga tcctggagtt tgtggggcac tccctgccag
     6481 aggagaccgt ggacttcatg gttcagcaca cgtcgttcaa ggagatgaag aagaacccta
     6541 tgaccaacta caccaccgtc ccccaggagt tcatggacca cagcatctcc cccttcatga
     6601 ggaaaggtgg gtgctggcca gtacgggggt ttggggcggg tgggagcagc agctgcagcc
     6661 tccccatagg cactcggggc ctcccctggg atgagactcc agccttgctc cctgccttcc
     6721 ccccccaggc atggctgggg actggaagac caccttcacc gtggcgcaga atgagcgctt
     6781 cgatgcggac tatgcggaga agatggcagg ctgcagcctc agcttccgct ctgagctgtg
     6841 agaggggctc ctggggtcac tgcagaggga gtgtgcgaat caaacctgac caagcggctc
     6901 aagaataaaa tatgaattga gggcctggga cggtaggtca tgtctgtaat cccagcaatt
     6961 tggaggctga ggtgggagga tcatttgagc ccaggagttc gagaccaacc tgggcaacat
     7021 agtgagattc tgttaaaaaa ataaaataaa ataaaaccaa tttttaaaaa gagaataaaa
     7081 tatgattgtg ggccaggcat agtggctcat gcctgtaatc ccagcaattt gagaagttga
     7141 ggctagagga tcactggagg acaggagttt gggaccagcc tgttcaacat tacaagacat
     7201 catccctaca aaaatttgag aaaattatct gtacgtgatg gtgggcacct gtagtcccag
     7261 ctacttgaca agtgaaggca gtaggatcgc ctgagccagg gaggttatgg ctgcagtggg
     7321 ctgactgggc taatccactc aagcctgagg gacagagcaa atcttgcttg agaaataaat
     7381 aaaatacaat ttacttaaca taaattatga ttcaggacca gtctggccaa catggtgaaa
     7441 ccccgtctct actaaaaaaa aaaaaagata caaaaattag ccgggcatgg tggcagacac
     7501 ctgtaacctc agctactctg gaggctgagg caggagaatt gctcgaaccc agggacggat
     7561 gatgcagtga gccaagatca tgccacttca ctccagcctg ggcataagag caaaactctg
     7621 gcttgaaaat aaataaataa ttaaattaaa ttaaggtatt atttgacctg ggctcggtgg
     7681 cttatgcctg gaatctcagc acttcagcct ggcagatcac ttgaggtcag gagttcaaga
     7741 ccaggctggc cagcatggga aaaccccatc tctactaaaa atacaaaaat tagctgggca
     7801 tgatgatggg cgcctgtaat cccagctact ccagaggctg aggtgggaga atcgattgaa
     7861 tccatgaggt ggaggtttca ttgaaccggg atcacaccac tgcactccag tctgggcgac
     7921 agagcaagac tcagtcttaa aacaacaaca acaacaacaa caacaacaca actatgattt
     7981 gtgttcaatg cagagtctct attccaagcc aagagaaacc ctgagctgaa agagtgatcg
     8041 cccactgggg ccaaatacgg ccacctctcc gctccagctc ctcaacttga cctgtttgga
     8101 gaggggagag ggtctggaga agtaaaaccc aggagacgag tggaggggga atgtgtttaa
     8161 tcccagcaca tcctttgctg tcctgccctg tgtcgttggt ggatggcgaa gtccgccagg
     8221 cagcgtcact ttttcttggg ctccttacaa gccaccacct acctctgggc cacgctgagg
     8281 ggaggggaat gcttgaagac actcaagcat aggagtgtct tcaaacagga ccaagtagtc
     8341 atcctggggc tgtggggcag gcagacagga ggggctgctc agagatcccc aggccatgac
     8401 aggcaccccc ttcccccagc ctagaccaca ggaggctctg ggccgtggac tttcagccac
     8461 tcctgccatt gttcactctg gggtcaagaa gtcttggccc agtccctgct gctatggagc
     8521 tcttttctca gtggctggag gcccagagca gtgaaaaagg tggagggagg aagaggtgct
     8581 gactccttcc ccagtggggc catagctaga gggtctgctg cctttcaggg actctgtgtt
     8641 cagaggaccg agggcagccc agatggtggc aa
//