LOCUS       HSU18918                3901 bp    mRNA    linear   HUM 11-SEP-1995
DEFINITION  Human heparan sulfate-N-deacetylase/N-sulfotransferase mRNA, clone
            HSST, complete cds.
ACCESSION   U18918
VERSION     U18918.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 3901)
  AUTHORS   Dixon,J., Loftus,S.K., Gladwin,A.J., Scambler,P.J., Wasmuth,J.J.
            and Dixon,M.J.
  TITLE     Cloning of the human heparan
            sulfate-N-deacetylase/N-sulfotransferase gene from the Treacher
            Collins syndrome candidate region at 5q32-q33.1
  JOURNAL   Genomics 26 (2), 239-244 (1995)
   PUBMED   7601448
REFERENCE   2  (bases 1 to 3901)
  AUTHORS   Dixon,M.J.
  TITLE     Direct Submission
  JOURNAL   Submitted (20-DEC-1994) Michael J. Dixon, University of Manchester,
            School of Biological Sciences, Stopford Building, Oxford Road,
            Manchester, M13 9PT, UK
FEATURES             Location/Qualifiers
     source          1..3901
                     /db_xref="H-InvDB:HIT000218481"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /chromosome="5"
                     /map="5q32-33.1"
                     /clone="HSST"
                     /sex="female"
                     /tissue_type="placenta"
                     /dev_stage="adult"
     5'UTR           1..216
     CDS             217..2865
                     /codon_start=1
                     /product="heparan
                     sulfate-N-deacetylase/N-sulfotransferase"
                     /protein_id="AAA75281.1"
                     /translation="MPALACLRRLCRHVSPQAVLFLLFIFCLFSVFISAYYLYGWKRG
                     LEPSADAPEPDCGDPPPVAPSRLLPLKPVQAATPSRTDPLVLVFVESLYSQLGQEVVA
                     ILESSRFKYRTEIAPGKGDMPTLTDKGRGRFALIIYENILKYVNLDAWNRELLDKYCV
                     AYGVGIIGFFKANENSLLSAQLKGFPLFLHSNLGLKDCSINPKSPLLYVTRPSEVEKG
                     VLPGEDWTVFQSNHSTYEPVLLAKTRSSESIPHLGADAGLHAALHATVVQDLGLHDGI
                     QRVLFGNNLNFWLHKLVFVDAVAFLTGKRLSLPLDRYILVDIDDIFVGKEGTRMKVED
                     VKALFDTQNELRAHIPNFTFNLGYSGKFFHTGTNAEDAGDDLLLSYVKEFWWFPHMWS
                     HMQPHLFHNQSVLAEQMALNKKFAVEHGIPTDMGYAVAPHHSGVYPVHVQLYEAWKQV
                     WSIRVTSTEEYPHLKPARYRRGFIHNGIMVLPRQTCGLFTHTIFYNEYPGGSSELDKI
                     INGGELFLTVLLNPISIFMTHLSNYGNDRLGLYTFKHLVRFLHSWTNLRLQTLPPVQL
                     AQKYFQIFSEEKDPLWQDPCEDKRHKDIWSKEKTCDRFPKLLIIGPQKTGTTALYLFL
                     GMHPDLSSNYPSSETFEEIQFFNGHNYHKGIDWYMEFFPIPSNTTSDFYFEKSANYFD
                     SEVAPRRAAALLPKAKVLTILINPADRAYSWYQHQRAHDDPVALKYTFHEVITAGSDA
                     SSKLRALQNRCLVPGWYATHIERWLSAYHANQILVLDGKLLRTEPAKVMDMVQKFLGV
                     TNTIDYHKTLAFDPKKGFWCQLLEGGKTKCLGKSKGRKYPEMDLDSRAFLKDYYRDHN
                     IELSKLLYKMGQTLPTWLREDLQNTR"
     3'UTR           2866..3901
     polyA_site      3901
                     /note="12 A nucleotides"
BASE COUNT          793 a         1245 c         1050 g          813 t
ORIGIN      
        1 gaaggaagga gcgtgaccag cctgtggact gcgcccctgg ctgggaggaa ggactggggg
       61 cccagatcct ccactcccag tgccccacaa gggcgtcgct tcctaagtct ctgtgaattt
      121 gttggtcagt ggacgattct cgtgtctcct cctgtgtggg gccttggggt agccagggca
      181 ggccgggcct ccgtggccaa ggtctcggag gccaggatgc ctgccctggc atgcctccgg
      241 aggctgtgtc ggcacgtgtc cccgcaggct gtccttttcc tgctgttcat cttctgcctg
      301 ttcagcgttt tcatctcggc ctactaccta tatggctgga agcgaggcct ggagccctcg
      361 gcggatgccc ccgagcctga ctgcggggac ccgccgcctg tggcccccag tcgcctgctg
      421 ccactcaagc ctgtgcaggc agccacccct tcccgcacag acccgttggt gctggtcttt
      481 gtggagagcc tctactcgca actgggccag gaggtggtgg ccatcctgga gtccagccgc
      541 ttcaaatacc gcacagagat tgcgccgggc aagggtgaca tgcccacgct cactgacaag
      601 ggccgtggcc gcttcgccct catcatctat gagaacatcc tcaagtatgt caacctggac
      661 gcctggaacc gggagctgct ggacaagtac tgtgtggcct acggcgtggg catcattggc
      721 ttcttcaagg ccaatgagaa cagcctgctg agtgcgcagc tcaagggctt ccccctgttc
      781 ctgcactcaa acctgggcct gaaggactgc agcatcaacc ccaagtcccc gctgctctac
      841 gtgacgcgac ctagcgaggt ggagaaaggt gtgctccccg gcgaggactg gacggttttc
      901 cagtcaaatc actccaccta tgagccagtg ctgctggcca agacgcgctc gtctgagtcc
      961 atcccacacc tgggcgcaga cgccggcctg catgctgcac tgcacgccac tgtggtccag
     1021 gacctgggcc tgcacgacgg catccagcgc gtgctgtttg gcaacaacct gaacttctgg
     1081 ctgcacaagc ttgtcttcgt ggatgccgtg gccttcctca cggggaagcg cctctccctg
     1141 ccattggacc gctacatcct ggtggacatt gatgacatct tcgtgggcaa ggagggcaca
     1201 cgcatgaagg tggaggacgt gaaggccctg tttgacacac agaacgaact acgcgcacac
     1261 atcccaaact tcaccttcaa cctgggctac tcagggaaat tcttccacac aggtaccaat
     1321 gctgaggacg ctggggatga tctgctgctg tcgtatgtga aggagttctg gtggttcccc
     1381 cacatgtgga gccacatgca gccccacctt ttccacaacc agtccgtgtt ggccgagcag
     1441 atggccttga acaagaagtt cgctgtcgag catggcattc ccacagacat ggggtatgca
     1501 gtggcgcccc accactcggg cgtgtacccc gtgcacgtgc agctgtacga ggcttggaag
     1561 caggtgtgga gcatccgcgt gaccagcacg gaggagtacc cccacctgaa gccagcccgc
     1621 taccgccgtg gcttcatcca caatggcatc atggttctcc cacggcagac ctgcggcctc
     1681 ttcacacaca ccatcttcta caacgagtac cctggcggct ccagtgagct ggacaaaatc
     1741 atcaacgggg gcgagctctt cctcaccgtg ctcctcaatc ctatcagcat cttcatgacg
     1801 cacctgtcca actatgggaa tgaccgcctg ggcctgtaca ccttcaagca cctggtgcgc
     1861 ttcctgcact cctggacgaa cctccggctg cagacactgc cccctgtgca gttggcgcag
     1921 aagtacttcc agatcttctc cgaggagaag gacccgctct ggcaggaccc ctgcgaggac
     1981 aaacgtcaca aagacatctg gtccaaggag aagacgtgtg accgcttccc aaagctcctc
     2041 atcatcggcc cccagaaaac aggcaccact gccctctacc tgttcctggg catgcaccct
     2101 gacctaagca gcaactaccc cagctctgag acctttgagg agatccagtt ttttaatggc
     2161 cacaactatc acaaaggcat cgactggtac atggagttct tccccatccc ttccaacacc
     2221 acctccgact tctactttga gaaaagcgcc aactactttg attcagaagt ggcgccccgg
     2281 cgggcagcag ccctcttgcc caaagccaag gtcctgacca tcctcatcaa ccccgcggac
     2341 cgggcctatt cctggtacca gcaccagcga gcccatgacg acccagtggc cctaaagtac
     2401 accttccatg aggtgattac cgccggctct gacgcatcct cgaagctgcg tgccctccag
     2461 aaccgctgcc tggtccctgg ctggtacgcc acccacatcg agcgctggct cagtgcctat
     2521 cacgccaacc agattctggt cttggatggc aaactgcttc gcacagaacc tgccaaagtg
     2581 atggacatgg tgcagaagtt ccttggggtg accaacacca ttgactacca caaaaccttg
     2641 gcgtttgatc caaagaaagg attttggtgc caactgcttg aaggaggaaa aaccaagtgt
     2701 ctgggcaaaa gcaagggccg gaaatatccc gagatggact tggattcccg agccttcctg
     2761 aaggactatt accgggacca caacatcgag ctctccaagc tgctgtataa gatgggccag
     2821 acacttccca cttggctacg agaggacctc cagaacacca ggtagccgtg gccaccacag
     2881 ccagactgaa cgtttgtgaa agctgggaca tcccaccaca cgctgagcca gacctgcaga
     2941 gtgggaagct ggaccagggc agctgcgcac ttatgagcaa tactctgtgg aggtctggtg
     3001 gggctggggg agcacccagg cggatctgca agcacctcgg agcacccacc gctgggtctg
     3061 cggcctaagg gacctccctc gccagcagag gtccattccg ttcccagctg ctcctgggga
     3121 ggccgcttcc tggtaggagg gagtccacga gactcttttc tgtccctcac tgtgttccgc
     3181 cgactgtccc ctctcgtcac ccatcactcc ctgcttccgc agggcgcccc tcagtattcg
     3241 ctgccatatg tccctgtcct ccaggctgta ggggaggaga gcctggccgg gggagacaga
     3301 ctggacattt ccctgtttcg agccaggctc ttccaagggg ccagctgggt ccccggagtc
     3361 agtcctaggc tggatgggag ggtggccccc tcaagaggac tcccagcctc cacatctggt
     3421 tcctaccttc acatctcacc ctcccgttct ggggaagaat ttctggttcc tacagtatcc
     3481 actccatcct caaggcttcc cgcagggcct tggggcactg ccttgccatc gggcccagtt
     3541 ctccgggccc cacctgcacc cctttcttcc ccctgggata tgatgtgtgg tgtttcctgt
     3601 ggtaaaagac tgaggcaggc caggggtctg ccagtaacat gttcccatgt acagacacgg
     3661 tccccacacc ctcccagcct caggcccagg cagacatggg cgagctggtg agactgccag
     3721 ccacggcttt gcttagccac ctgtggccga gggctctcag agaccccctt aacctcccaa
     3781 atactaagaa gctaaaatat tttaatattt tgtttttttt tttcttggtg ccagagttta
     3841 taccctgggt gctggggtcg cactgtgtta tatatatata tatatatata tataatgtgt
     3901 a
//