LOCUS       AY035399                3357 bp    mRNA    linear   HUM 07-NOV-2001
DEFINITION  Homo sapiens UDP-N-acetyl-alpha-D-galactosamine:polypeptide
            N-acetylgalactosaminyltransferase 7 (GALNT7) mRNA, complete cds.
ACCESSION   AY035399
VERSION     AY035399.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 3357)
  AUTHORS   Kumar,S., Connor,J.R., Dodds,R.A., Halsey,W., Van Horn,M., Mao,J.,
            Sathe,G.M., Mui,P., Agarwal,P., Badger,A.M., Lee,J.C., Gowen,M. and
            Lark,M.W.
  TITLE     Identification and initial characterization of 5000 expressed
            sequenced tags (ESTs) each from adult human normal and
            osteoarthritic cartilage cDNA libraries
  JOURNAL   Osteoarthr. Cartil. 9 (7), 641-653 (2001)
   PUBMED   11597177
REFERENCE   2  (bases 1 to 3357)
  AUTHORS   Kumar,S.
  TITLE     Direct Submission
  JOURNAL   Submitted (14-MAY-2001) Musculoskeletal Diseases, UW 2109,
            GlaxoSmithKline, 709 Swedeland Rd., King of Prussia, PA 19406, USA
FEATURES             Location/Qualifiers
     source          1..3357
                     /db_xref="H-InvDB:HIT000083512"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /tissue_type="osteoarthritic cartilage"
     gene            1..3357
                     /gene="GALNT7"
     CDS             284..2203
                     /gene="GALNT7"
                     /note="GalNAc-T7"
                     /codon_start=1
                     /product="UDP-N-acetyl-alpha-D-galactosamine:polypeptide
                     N-acetylgalactosaminyltransferase 7"
                     /protein_id="AAK63127.1"
                     /translation="MLLRKRYRHRPCRLQFLLLLLMLGCVLMMVAMLHPPHHTLHQTV
                     TAQASKHSPEARYRLDFGESQDWVLEAEDEGEEYSPLEGLPPFISLREDQLLVAVALP
                     QARRNQSQGRRGGSYRLIKQPRRQDKEAPKRDWGADEDGEVSEEEELTPFSLDPRGLQ
                     EALSARIPLQRALPEVRHPLCLQQHPQDSLPTASVILCFHDEAWSTLLRTVHSILDTV
                     PRAFLKEIILVDDLSQQGQLKSALSEYVARLEGVKLLRSNKRLGAIRARMLGATRATG
                     DVLVFMDAHCECHPGWLEPLLSRIAGDRSRVVSPVIDVIDWKTFQYYPSKDLQRGVLD
                     WKLDFHWEPLPEHVRKALQSPISPIRSPVVPGEVVAMDRHYFQNTGAYDSLMSLRGGE
                     NLELSFKAWLCGGSVEILPCSRVGHIYQNQDSHSPLDQEATLRNRVRIAETWLGSFKE
                     TFYKHSPEAFSLSKAEKPDCMERLQLQRRLGCRTFHWFLANVYPELYPSEPRPSFSGK
                     LHNTGLGLCADCQAEGDILGCPMVLAPCSDSRQQQYLQHTSRKEIHFGSPQHLCFAVR
                     QEQVILQNCTEEGLAIHQQHWDFQENGMIVHILSGKCMEAVVQENNKDLYLRPCDGKA
                     RQQWRFDQINAVDER"
     misc_feature    284..322
                     /gene="GALNT7"
                     /note="Region: cytoplasmic tail"
     misc_feature    323..388
                     /gene="GALNT7"
                     /note="Region: hydrophobic domain"
     misc_feature    389..757
                     /gene="GALNT7"
                     /note="Region: stem region"
     misc_feature    758..2200
                     /gene="GALNT7"
                     /note="Region: catalytic domain"
BASE COUNT          858 a          839 c          895 g          765 t
ORIGIN      
        1 acgcgtccga tttgaagtcc ctgtgaatgg gctttcagaa ggcaattaaa gaaatccact
       61 cagagaggac ttggggtgaa acttgggtcc tgtggttttc tgattgtaag tggaagcagg
      121 tcttgcacac gctgttggca aatgtcagga ccaggttaag tgactggcag aaaaacttcc
      181 aggtggaaca agcaacccag gttctgctgc aagcttgaag gagcctggag cgggagaaag
      241 ctaacttgaa catgacctgt tgcatttggc aagttctagc aacatgctcc taaggaagcg
      301 atacaggcac agaccatgca gactccagtt cctcctgctg ctcctgatgc tgggatgcgt
      361 cctgatgatg gtggcgatgt tgcaccctcc ccaccacacc ctgcaccaga ctgtcacagc
      421 ccaagccagc aagcacagcc ctgaagccag gtaccgcctg gactttgggg aatcccagga
      481 ttgggtactg gaagctgagg atgagggtga agagtacagc cctctggagg gcctgccacc
      541 ctttatctca ctgcgggagg atcagctgct ggtggccgtg gccttacccc aggccagaag
      601 gaaccagagc cagggcagga gaggtgggag ctaccgcctc atcaagcagc caaggaggca
      661 ggataaggaa gccccaaaga gggactgggg ggctgatgag gacggggagg tgtctgaaga
      721 agaggagttg accccgttca gcctggaccc acgtggcctc caggaggcac tcagtgcccg
      781 catccccctc cagagggctc tgcccgaggt gcggcaccca ctgtgtctgc agcagcaccc
      841 tcaggacagc ctgcccacag ccagcgtcat cctctgtttc catgatgagg cctggtccac
      901 tctcctgcgg actgtacaca gcatcctcga cacagtgccc agggccttcc tgaaggagat
      961 catcctcgtg gacgacctca gccagcaagg acaactcaag tctgctctca gcgaatatgt
     1021 ggccaggctg gagggggtga agttactcag gagcaacaag aggctgggtg ccatcagggc
     1081 ccggatgctg ggggccacca gagccaccgg ggatgtgctc gtcttcatgg atgcccactg
     1141 cgagtgccac ccaggctggc tggagcccct cctcagcaga atagctggtg acaggagccg
     1201 agtggtatct ccggtgatag atgtgattga ctggaagact ttccagtatt acccctcaaa
     1261 ggacctgcag cgtggggtgt tggactggaa gctggatttc cactgggaac ctttgccaga
     1321 gcatgtgagg aaggccctcc agtcccccat aagccccatc aggagccctg tggtgcccgg
     1381 agaggtggtg gccatggaca gacattactt ccaaaacact ggagcgtatg actctcttat
     1441 gtcgctgcga ggtggtgaaa acctcgaact gtctttcaag gcctggctct gtggtggctc
     1501 tgttgaaatc cttccctgct ctcgggtagg acacatctac caaaatcagg attcccattc
     1561 ccccctcgac caggaggcca ccctgaggaa cagggttcgc attgctgaga cctggctggg
     1621 gtcattcaaa gaaaccttct acaagcatag cccagaggcc ttctccttga gcaaggctga
     1681 gaagccagac tgcatggaac gcttgcagct gcaaaggaga ctgggttgtc ggacattcca
     1741 ctggtttctg gctaatgtct accctgagct gtacccatct gaacccaggc ccagtttctc
     1801 tggaaagctc cacaacactg gacttgggct ctgtgcagac tgccaggcag aaggggacat
     1861 cctgggctgt cccatggtgt tggctccttg cagtgacagc cggcagcaac agtacctgca
     1921 gcacaccagc aggaaggaga ttcactttgg cagcccacag cacctgtgct ttgctgtcag
     1981 gcaggagcag gtgattcttc agaactgcac ggaggaaggc ctggccatcc accagcagca
     2041 ctgggacttc caggagaatg ggatgattgt ccacattctt tctgggaaat gcatggaagc
     2101 tgtggtgcaa gaaaacaata aagatttgta cctgcgtccg tgtgatggaa aagcccgcca
     2161 gcagtggcgt tttgaccaga tcaatgctgt ggatgaacga tgaatgtcaa tgtcagaagg
     2221 aaaagagaat tttggccatc aaaatccagc tccaagtgaa cttaaagagc ttatatattt
     2281 catgaagctg atccttttgt gtgtgtgctc ctggtgttag gagagaaaaa agctctatga
     2341 aagaatatag gaagtttctc cttttcacac cttatttcat tgactgctgg ctgctttaaa
     2401 aaaaaaaaaa ggatccattg taccgttgtc ttcatcactg ggaaatgatt attacatagt
     2461 acagaagatt ctttgttttt ctccactgag cacttaacaa ttgctttctc tctggcctgg
     2521 acattctctg gcagcacctc caggatacat aaattcaatg gatcaattta tttgtcttca
     2581 aatggcctta acttggattg tctgtttggc caaccatgaa aattaaagag tgaagcagat
     2641 gtaatggcct gacattccaa aaactctgaa ttgggtttat tagcacaaat gttgtgttca
     2701 tttgttgagc catatctcag aagaaggaaa gggagctaca gaaaggaggt ttaggattgc
     2761 agagaagatg caagagcact ttggcccaat tctccagctc aacccagcag ctgaaaagct
     2821 tcaagagatc taggaaaaga cattttcatg ttaatgagaa tttccaccat tgtagagaat
     2881 ttccttccta ctgagaatct acctctattc cccctgccct agctcttctc taacttggtt
     2941 aaccataacc ataaccagat tcccttgcaa tcgatttctc tttagtcgtt ggtgttagaa
     3001 gtaccagcac aatttgagca ttcccattaa caaaggtgtt cacagttgag aaactctcct
     3061 gccgggcgcg gtggctcatg cctgtaattc cagcactttg ggaggcagag ttgggaggat
     3121 cacctgatgt caggggtttg agaccagcct ggtcaacatt gcaaaacctt gtctctacta
     3181 aaaatacaaa aattagctgg gcatggtggc gcatacctgt aatcccagct acttgggagg
     3241 ctgaggcaag agaatcgctt gaacccagga ggcagaggtt gcagtgagct gagatcatgc
     3301 cattgcactc caacctgggt gacagagtga gactccatct caaaaaaaaa aaaaaaa
//