LOCUS       AB033888                1339 bp    mRNA    linear   HUM 27-JUN-2001
DEFINITION  Homo sapiens SOX18 mRNA, complete cds.
ACCESSION   AB033888
VERSION     AB033888.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 1339)
  AUTHORS   Azuma,T., Seki,N., Yoshikawa,T., Masuho,Y. and Muramatsu,M.
  TITLE     Direct Submission
  JOURNAL   Submitted (25-OCT-1999) to the DDBJ/EMBL/GenBank databases.
            Contact:Takanori Azuma
            Helix Research Institute, Biological Technology Laboratory; 1532-3
            Yana, Kisarazu, Chiba 292-0812, Japan
REFERENCE   2
  AUTHORS   Azuma,T., Seki,N., Yoshikawa,T., Saito,T., Masuho,Y. and
            Muramatsu,M.
  TITLE     cDNA cloning, tissue expression, and chromosome mapping of human
            homolog of SOX18
  JOURNAL   J. Hum. Genet. 45, 192-195 (2000)
REFERENCE   3
  AUTHORS   Dunn,T.L., Mynett-Johnson,L., Wright,E.M., Hosking,B.M.,
            Koopman,P.A. and Muscat,G.E.
  TITLE     Sequence and expression of sox-18 encoding a new HMG-box
            transcription factor
  JOURNAL   Gene 161, 223-225 (1995)
COMMENT     
FEATURES             Location/Qualifiers
     source          1..1339
                     /chromosome="20"
                     /db_xref="H-InvDB:HIT000059100"
                     /db_xref="taxon:9606"
                     /dev_stage="Fetus"
                     /map="26.92 cR from D20S173"
                     /mol_type="mRNA"
                     /organism="Homo sapiens"
                     /tissue_type="Brain"
     CDS             146..1300
                     /codon_start=1
                     /gene="SOX18"
                     /note="new HMG-box transcription factor"
                     /protein_id="BAA94874.1"
                     /transl_table=1
                     /translation="MQRSPPGYGAQDDPPARRDCAWAPGHGAAADTRGLAAGPAALAA
                     PAAPASPPSPQRSPPRSPEPGRYGLSPAGRGERQAADESRIRRPMNAFMVWAKDERKR
                     LAQQNPDLHNAVLSKMLGKAWKELNAAEKRPFVEEAERLRVQHLRDHPNYKYRPRRKK
                     QARKARRLEPGLLLPGLAPPQPPPEPFPAASGSARAFRELPPLGAEFDGLGLPTPERS
                     PLDGLEPGEAAFFPPPAAPEDCALRPFRAPYAPTELSRDPGGCYGAPLAEALRTAPPA
                     APLAGLYYGTLGTPGPYPGPLSPPPEAPPLESAEPLGPAADLWADVDLTEFDQYLNCS
                     RTRPDAPGLPYHVALAKLGPRAMSCPEESSLISALSDASSAVYYSACISG"
BASE COUNT          166 a          577 c          449 g          147 t
ORIGIN      
        1 gggaggaagc gctgcaggga ccaccgccgt ccccaccgcc atccgccctc ccggcctggc
       61 ctgcccttgc gcccggctcc ccagtgcccg ccgcccgccc gccgcgctcc cgcgctccgt
      121 tccgcccagg ccgcgcccag ctggaatgca gagatcgccg cccggctacg gcgcacagga
      181 cgacccgccc gcccgccgcg actgtgcatg ggccccggga cacggggccg ccgctgacac
      241 gcgcggcctc gccgccggcc ccgccgccct cgccgcgccc gccgcgcccg cctcgccgcc
      301 cagcccgcag cgcagtcccc cgcgcagccc cgagccgggg cgctatggcc tcagcccggc
      361 cggccgcggg gaacgccagg cggcagacga gtcgcgcatc cggcggccca tgaacgcctt
      421 catggtgtgg gcaaaggacg agcgcaagcg gctggctcag cagaacccgg acctgcacaa
      481 cgcggtgctc agcaagatgc tgggcaaagc gtggaaggag ctgaacgcgg cggagaagcg
      541 gcccttcgtg gaggaagccg aacggctgcg cgtgcagcac ttgcgcgacc accccaacta
      601 caagtaccgg ccgcgccgca agaagcaggc gcgcaaggcc cggcggctgg agcccggcct
      661 cctgctcccg ggattagcgc ccccgcagcc accgcccgag cctttccccg cggcgtctgg
      721 ctcggctcgc gccttccgcg agctgccccc gctgggcgcc gagttcgacg gcctggggct
      781 gcccacgccc gagcgctcgc ctctggacgg cctggagccc ggcgaggctg ccttcttccc
      841 accgcccgcg gcgcccgagg actgcgcgct gcggcccttc cgcgcgccct acgcgcccac
      901 cgagttgtcg cgggaccccg gcggttgcta cggggctccc ctggcggagg cgctcaggac
      961 cgcgcccccc gcggcgccgc tcgctggcct gtactacggc accctgggca cgcccggccc
     1021 gtaccccggc ccgctgtcgc cgccgcccga ggccccgccg ctggagagcg ccgagccgct
     1081 ggggcccgcc gccgatctgt gggccgacgt ggacctcacc gagttcgacc agtacctcaa
     1141 ctgcagccgg actcggcccg acgcccccgg gctcccgtac cacgtggcac tggccaaact
     1201 gggcccgcgc gccatgtcct gcccagagga gagcagcctg atctccgcgc tgtcggacgc
     1261 cagcagcgcg gtctattaca gcgcgtgcat ctccggctag gccgccggcg ccgcccgggt
     1321 ccctgcagcg cttcctccc
//