LOCUS       HUMARSBX                2802 bp    mRNA    linear   HUM 31-OCT-1994
DEFINITION  Human arylsulfatase B (ASB) mRNA, complete cds.
ACCESSION   M32373
VERSION     M32373.1
KEYWORDS    arylsulfatase; lysosomal hydrolase.
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 2802)
  AUTHORS   Schuchman,E.H., Jackson,C.E. and Desnick,R.J.
  TITLE     Human arylsulfatase B: MOPAC cloning, nucleotide sequence of a
            full-length cDNA, and regions of amino acid identity with
            arylsulfatases A and C
  JOURNAL   Genomics 6 (1), 149-158 (1990)
   PUBMED   1968043
COMMENT     Original source text: Human liver, cDNA to mRNA.
FEATURES             Location/Qualifiers
     source          1..2802
                     /db_xref="H-InvDB:HIT000195474"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /map="5p11-q13"
     gene            1..2802
                     /gene="ARSB"
     mRNA            <1..2802
                     /gene="ARSB"
                     /product="ASB mRNA"
     CDS             560..2161
                     /gene="ARSB"
                     /note="arylsulfatase B precursor"
                     /codon_start=1
                     /protein_id="AAA51779.1"
                     /db_xref="GDB:G00-119-008"
                     /translation="MGPRGAASLPRGPGPRRLLLPVVLPLLLLLLLAPPGSGAGASRP
                     PHLVFLLADDLGWNDVGFHGSRIRTPHLDALAAGGVLLDNYYTQPLCTPSRSQLLTGR
                     YQIRTGLQHQIIWPCQPSCVPLDEKLLPQLLKEAGYTTHMVGKWHLGMYRKECLPTRR
                     GFDTYFGYLLGSEDYYSHERCTLIDALNVTRCALDFRDGEEVATGYKNMYSTNIFTKR
                     AIALITNHPPEKPLFLYLALQSVHEPLQVPEEYLKPYDFIQDKNRHHYAGMVSLMDEA
                     VGNVTAALKSSGLWNNTVFIFSTDNGGQTLAGGNNWPLRGRKWSLWEGGVRGVGFVAS
                     PLLKQKGVKNRELIHISDWLPTLVKLARGHTNGTKPLDGFDMWKTISEGSPSPRIELL
                     HNIDPNFVDSSPCPRNSMAPAKDDSSLPEYSAFNTSVHAAIRHGNWKLLTGYPGCGYW
                     FPPPSQYNVSEIPSSDPPTKTLWLFDIDRDPEERHDLSREYPHIVTKLLSRLQFYHKH
                     SVPVYFPAQDPRCDPKATGVWGPWM"
     sig_peptide     560..679
                     /gene="ARSB"
                     /note="arylsulfatase B signal peptide"
     mat_peptide     680..2158
                     /gene="ARSB"
                     /product="arylsulfatase B"
BASE COUNT          646 a          767 c          726 g          663 t
ORIGIN      
        1 catggatttc gacattgctg gacctgccac aggctgggct cttgtgctag aaatgacttg
       61 ctagctagac atcatggttc aggatctgag tcagaggttt aaccatttat aagctttttt
      121 cttatgaaaa attggcacta attataatgt ctaactgtca gagttgttgc aggctttaca
      181 ggagacgcgg gctgtgaaga tgctttgtaa attgtgaagc gttattaaag aacacatctt
      241 tttttttagg aaaccacggt gcaaatttaa ttgccgggga agataacggg ccttggtgcc
      301 ctccaagcgt cagctgagtt tccaagaagc cgggcagcgg gcgcccgcgg gttcgtctct
      361 ggctcctcct ccgccacagc agccgggggc ccgggtcgga ggcggcgggg gccgagcgcc
      421 cggcctcgca agcccacggc ccgctggggg tgccgtcccg cgccggggcg gagcaggccc
      481 cggcagccca gttcctcatt ctatcagcgg tacaaggggc tggtggcgcc acaggcgctg
      541 ggaccgcggg cggacaagga tgggtccgcg cggcgcggcg agcttgcccc gaggccccgg
      601 acctcggcgg ctgctcctcc ccgtcgtcct cccgctgctg ctgctgctgt tgttggcgcc
      661 gccgggctcg ggcgccgggg ccagccggcc gccccacctg gtcttcttgc tggcagacga
      721 cctaggctgg aacgacgtcg gcttccacgg ctcccgcatc cgcacgccgc acctggacgc
      781 gctggcggcc ggcggggtgc tcctggacaa ctactacacg cagccgctgt gcacgccgtc
      841 gcggagccag ctgctcactg gccgctacca gatccgtaca ggtttacagc accaaataat
      901 ctggccctgt cagcccagct gtgttcctct ggatgaaaaa ctcctgcccc agctcctaaa
      961 agaagcaggt tatactaccc atatggtcgg aaaatggcac ctgggaatgt accggaaaga
     1021 atgccttcca acccgccgag gatttgatac ctactttgga tatctcctgg gtagtgaaga
     1081 ttattattcc catgaacgct gtacattaat tgacgctctg aatgtcacac gatgtgctct
     1141 tgattttcga gatggcgaag aagttgcaac aggatataaa aatatgtatt caacaaacat
     1201 attcaccaaa agggctatag ccctcataac taaccatcca ccagagaagc ctctgtttct
     1261 ctaccttgct ctccagtctg tgcatgagcc ccttcaggtc cctgaggaat acttgaagcc
     1321 atatgacttt atccaagaca agaacaggca tcactatgca ggaatggtgt cccttatgga
     1381 tgaagcagta ggaaatgtca ctgcagcttt aaaaagcagt gggctctgga acaacacggt
     1441 gttcatcttt tctacagata acggagggca gactttggca gggggtaata actggcccct
     1501 tcgaggaaga aaatggagcc tgtgggaagg aggcgtccga ggggtgggct ttgtggcaag
     1561 ccccttgctg aagcagaagg gcgtgaagaa ccgggagctc atccacatct ctgactggct
     1621 gccaacactc gtgaagctgg ccaggggaca caccaatggc acaaagcctc tggatggctt
     1681 cgacatgtgg aaaaccatca gtgaaggaag cccatccccc agaattgagc tgctgcataa
     1741 tattgacccg aacttcgtgg actcttcacc gtgtcccagg aacagcatgg ctccagcaaa
     1801 ggatgactct tctcttccag aatattcagc ctttaacaca tctgtccatg ctgcaattag
     1861 acatggaaat tggaaactcc tcacgggcta cccaggctgt ggttactggt tccctccacc
     1921 gtctcaatac aatgtttctg agataccctc atcagaccca ccaaccaaga ccctctggct
     1981 ctttgatatt gatcgggacc ctgaagaaag acatgacctg tccagagaat atcctcacat
     2041 cgtcacaaag ctcctgtccc gcctacagtt ctaccataaa cactcagtcc ccgtgtactt
     2101 ccctgcacag gacccccgct gtgatcccaa ggccactggg gtgtggggcc cttggatgta
     2161 ggatttcagg gaggctagaa aacctttcaa ttggaagttg gacctcaggc cttttctcac
     2221 gactcttgtc tcatttgtta tcccaacctg ggttcacttg gcccttctct tgctcttaaa
     2281 ccacaccgag gtgtctaatt tcaaccccta atgcatttaa gaagctgata aaatctgcaa
     2341 cactcctgct gttggctgga gcatgtgtct agaggtggct ggagcatgtg tctagaggtg
     2401 ggggtggctg ggtttatccc cctttcctaa gccttgggac agctgggaac ttaacttgaa
     2461 ataggaagtt ctcactgaat cctggaggct ggaacagctg gctcttttag actcacaagt
     2521 cagacgttcg attcccctct gccaatagcc agttttattg gagtgaatca catttcttac
     2581 gcaaatgaag ggagcagaca gtgattaatg gttctgttgg caaggcttct ccctgtcggt
     2641 gaaggatcat gttcaggcac tccaagtgaa ccacccctct tggttcaccc cttactcact
     2701 tatctcatca cagagcataa ggcccatttt gttgttcagg tcaacagcaa aatgcctgca
     2761 ccatgactgt ggcttttaaa ataaagaaat gtgtttttat cg
//