LOCUS       HSU35612                3131 bp    mRNA    linear   HUM 09-SEP-1997
DEFINITION  Homo sapiens SOX22 protein (SOX22) mRNA, complete cds.
ACCESSION   U35612
VERSION     U35612.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 3131)
  AUTHORS   Jay,P., Sahly,I., Goze,C., Taviaux,S., Poulat,F., Couly,G.,
            Abitbol,M. and Berta,P.
  TITLE     SOX22 is a new member of the SOX gene family, mainly expressed in
            human nervous tissue
  JOURNAL   Hum. Mol. Genet. 6 (7), 1069-1077 (1997)
   PUBMED   9215677
REFERENCE   2  (bases 1 to 3131)
  AUTHORS   Jay,P.
  TITLE     Direct Submission
  JOURNAL   Submitted (06-SEP-1995) Philippe Jay, Centre de Recherches de
            Biologie Macromoleculaire, CNRS/INSER, Campus CNRS, 1919 route de
            Mende, Montpellier 34033, France
FEATURES             Location/Qualifiers
     source          1..3131
                     /db_xref="H-InvDB:HIT000219432"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /dev_stage="fetus"
     gene            1..3131
                     /gene="SOX22"
     CDS             330..1277
                     /gene="SOX22"
                     /codon_start=1
                     /product="SOX22 protein"
                     /protein_id="AAB69627.1"
                     /translation="MVQQRGARAKRDGGPPPPGPGPAEEGAREPGWCKTPSGHIKRPM
                     NAFMVWSQHERRKIMDQWPDMHNAEISKRLGRRWQLLQDSEKIPFVREAERLRLKHMA
                     DYPDYKYRPRKKSKGAPAKARPRPPGGSGGGSGSSPGRSCLAAGAAEQREGLWGAGRR
                     RPRTTMKTTTRSCWKCAWSRPRGGSCGGWSRRDGPLGDKRSRAQGPSGEGAAAAAAAS
                     PTPSEDEEPEEEEEEAAAAEEGEEETVASGEESLGFLSRLPPGPAGLDCSALDRDPDL
                     QPPSGTSHFEFPDYCTPEVTEMIAGDWRPSSIADLVFTY"
BASE COUNT          532 a         1105 c          982 g          512 t
ORIGIN      
        1 ccgcggcgga gccagaggct gcaggaagag cccgcggggg cccggagggt gcgattcctc
       61 ggcccccgca aaacaatgtg tgttgtgagc caggacgcaa cttgccggag cggcgggggc
      121 gcgccgagcc cgcctgagac cgcgctgacc ttctcccccc gccgtccgtt gggcccgagc
      181 gcccagctcc tcgctcccca gttcgcgggg gccgggccga gccgcggggc ggggccgccc
      241 ctccgtcgcc gctgcctcct cccccacccc cagccgcgga ggatgcggac ggcccccggc
      301 ggcgtctagc ggccccgggc ccaggcgcga tggtgcagca gcggggcgcg agggccaagc
      361 gggacggcgg gccgccgccc ccgggacccg ggccggccga ggagggggcg cgcgagcccg
      421 gctggtgcaa gaccccgagc ggccacatca agaggccgat gaacgcattc atggtgtggt
      481 cgcagcacga acggcggaag atcatggacc agtggcccga catgcacaac gccgagatct
      541 ccaagcgcct gggccgccgc tggcagctgc tgcaggactc ggagaagatc ccgttcgtgc
      601 gggaggcgga gcggctgcgg ctcaagcaca tggcggatta cccggactac aagtaccggc
      661 cgcgcaaaaa gagcaagggg gcgcccgcca aggcgcggcc ccgccccccc ggtggtagcg
      721 gtggcggcag cggctcaagc ccgggccgca gctgcctggc cgcgggggcc gccgagcagc
      781 gggagggcct ttggggggcg gggcggcggc gcccgaggac gacgatgaag acgacgacga
      841 ggagctgctg gaagtgcgcc tggtcgagac cccggggcgg gagctgtgga ggatggtccc
      901 ggcgggacgg gccgctcggg gacaagcgga gccgcgccca agggccgtcg ggcgaggggg
      961 cggccgccgc cgccgccgcc tccccgacac cgtcggagga cgaggagccg gaggaagagg
     1021 aggaggaggc ggcagcggct gaggaaggtg aagaggagac ggtggcgtcg ggggaggagt
     1081 cgctgggctt tctgtccagg ctgccccctg gcccggccgg cctggactgc agcgccctgg
     1141 atcgcgaccc ggacctgcag cctccctcgg gcacgtcgca cttcgagttc ccggactact
     1201 gcacccccga ggttaccgag atgatcgcgg gggactggcg cccgtctagc atcgcagacc
     1261 tggttttcac ctactgagcc caccgtcagc ggggcgcgca cgcccccaaa ccagctgttt
     1321 acatacagga atcaggtatt ggggcccctc ggaggccgag gctggcaccc catctcccgc
     1381 gcagcctccc ccctcctgga cgtgcccatc ccccctcaga tccagacatc ccctcccccg
     1441 cagacacacc ccaaggcagt ccaaccccca ccccttcccc gacacccaag cccctcccca
     1501 cgtcgccccc tcctgcacag ccaccagcag ccagccccct ccgatacacc tcccgtcctc
     1561 tcctacagac ctgcacccct cccccctttt gcacacgccc ctcctcgtgg ccggaggacc
     1621 gccccctcct ttgctccgga atctctcctc cctcgcccgg cccgccttct ctgggttagg
     1681 ggggcgatgc ggccgggtgg caacgcacgc gcctcctgcg cccctccctt ccctgggggg
     1741 aggggcgcac cccttttatc cccggagcgc tagggcccgc ccctccgctg gggcccaccc
     1801 ccttcgtgcg catgcttaat gcttctgggg aggagggggc tggtcccagc ggagccgcac
     1861 tcttcgcccg ctccgggcaa aagcgggggc gagtgtagag cgatcctggg aaatcctttg
     1921 atccgggagc cctaggtttc ctctccaccc agcggggcgt cgctgcctta atgggaggag
     1981 cactcggaag ggttggtttg ggcctgaaac tctcccaagt ggcatagccc cttttccggt
     2041 atggggtctc ctacacccac gcgcaccacc tctccggtcg cgtggctgcc tctacagcct
     2101 acctatacgt ccctttttcc ccccaactgg gaattgagag gtaaggtctt tctctggaaa
     2161 tccagcagta gaggaaggga ccacccaaga aaactaaaaa ccaaggcacc ttaccagtct
     2221 gtctggggac aggatccctg ctgcaccttc cccaccccct cctgggaagt gccccctcac
     2281 ctcagggcac ccgcaacctg ggctcctccc tgagcccacc ggcccttcct gtcacccagg
     2341 tccaccctca gtactcaagc tgcagtatac agcgggaaaa actgaggcac tttggtgcta
     2401 ggggtttggg actgaggcgt ggagagcaga tctgatggca ggaagactct cgcttttaaa
     2461 catctgggtt tggggagaga catcgacttg gccagtgaga ctgagaatgg attccgagta
     2521 gtgatgggcc gttgcacctc ggtttttcca cgtgagaaat ggggagaacg ctgctgttag
     2581 gaggaagttg tgtccagttc agggtgccct cgggagccct gtccctgttg ctgtggcccc
     2641 tctcacgccg ccatctctct gccccgcccc gcccctccgg cctccccaca cccgccttgc
     2701 cctcactacc tgtatctcac cggcgtgtgt tcaccctccc gggtggctca cacactctca
     2761 ttcacacaca caaatctcag gaacaaacgg tcccagagtc ctccggaccc ctgcccaggg
     2821 tctctgcagg tctctgcccc acgcgttccc gtcgctgaca aagccaccag ctgcctcctt
     2881 taagcttggt gctccggctc tgggcctttc ttgcgctctt tctatttttt tttttttttt
     2941 tttaagaaaa acaacaacaa caaaaaaaga caatgaaaaa aaaaacgtca tgtgagtgaa
     3001 gagatgtcac tgtctgtggt cttggagaac tagtctcgta gctgaggggt ggggtccctc
     3061 tgtctggggc actggcaccc acagcaggac tccgccagtc tgatgccagg actgaataaa
     3121 gtgtatttgc g
//