LOCUS       HSU80742                3103 bp    mRNA    linear   HUM 18-DEC-1997
DEFINITION  Homo sapiens CAGH45 mRNA, complete cds.
ACCESSION   U80742
VERSION     U80742.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 3103)
  AUTHORS   Margolis,R.L., Abraham,M.R., Gatchell,S.B., Li,S.H., Kidwai,A.S.,
            Breschel,T.S., Stine,O.C., Callahan,C., McInnis,M.G. and Ross,C.A.
  TITLE     cDNAs with long CAG trinucleotide repeats from human brain
  JOURNAL   Hum. Genet. 100 (1), 114-122 (1997)
   PUBMED   9225980
REFERENCE   2  (bases 1 to 3103)
  AUTHORS   Margolis,R.L., Abraham,M.R., Gatchell,S.B., Li,S.H., Kidwai,A.S.,
            Breschel,T.S., Stine,O.C., Callahan,C., McInnis,M.G. and Ross,C.A.
  TITLE     Direct Submission
  JOURNAL   Submitted (02-DEC-1996) Psychiatry, Johns Hopkins Univ. Sch. of
            Med., 600 N. Wolfe Street, Meyer 2-181, Baltimore, MD 21205, USA
FEATURES             Location/Qualifiers
     source          1..3103
                     /db_xref="H-InvDB:HIT000221581"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /chromosome="1"
                     /tissue_type="brain"
                     /dev_stage="fetus"
     gene            1..3103
                     /gene="CAGH45"
     CDS             826..2784
                     /gene="CAGH45"
                     /note="glutamine rich"
                     /codon_start=1
                     /product="CAGH45"
                     /protein_id="AAB91440.1"
                     /translation="MHEALKLRLNLVGGMFDTVQRSTQQTTEWAMLLLEIIISGTVDM
                     QSNNELFTTVLDMLSVLINGTLAADMSSISQGSMEENKRAYMNLAKKLQKELGERQSD
                     SLEKVRQLLPLPKQTRDVITCEPQGSLIDTKGNKIAGFDSIFKKEGLQVSTKQKISPW
                     DLFEGLKPSAPLSWGWFGTVRVDRRVARGEEQQRLLLYHTHLRPRPRAYYLEPLPLPP
                     EDEEPPAPTLLEPEKKAPEPPKTDKPGAAPPSTEERKKKSTKGKKRSQPATKTEDYGM
                     GPGRSGPYGVTVPPDLLHHPNPGSITHLNYRQGSIGLYTQNQPLPAGGPRVDPYRPVR
                     LPMQKLPTRPTYPGVLPTTMTGVMGLEPSSYKTSVYRQQQPAVPQGQRLRQQLQAKIQ
                     SQGMLGQSSVHQMTPSSSYGLQTSQGYTPYVSHVGLQQHTGPAGTMVPPSYSSQPYQS
                     THPSTNPTLVDPTRHLQQRPSGYVHQQAPTYGHGLTSTQRFSHQTLQQTPMISTMTPM
                     SAQGVQAGVRSTAILPEQQQQQQQQQQQQQQQQQQQQQQQQQQYHIRQQQQQQILRQQ
                     QQQQQQQQQQQQQQQQQQQQQQQQHQQQQQQQAAPPQPQPQSQPQFQRQGLQQTQQQQ
                     QTAALVRQLQQQLSNTQPQPSTNIFGRY"
     repeat_region   2401..2508
                     /gene="CAGH45"
                     /note="interrupted CAG repeat; 25 consecutive glutamine
                     amino acids"
                     /rpt_type=tandem
                     /rpt_unit_seq="cag"
     repeat_region   2518..2619
                     /gene="CAGH45"
                     /note="interrupted CAG repeat; 25 consecutive glutamine
                     amino acids"
                     /rpt_type=tandem
                     /rpt_unit_seq="cag"
BASE COUNT          856 a          914 c          769 g          563 t
ORIGIN      
        1 ttccggtggc agtggtggtc ggaggcaggg tggccgcaac atctctgtgg agacagccag
       61 tctggatgtc tatgccaagt acgtgctgcg cagcatctgc caacaggaat gggtaggaga
      121 acgttgcctt aagtctctgt gtgaggacag caatgacctg caagacccag tgttgagtag
      181 tgcccaggcg cagcgcctca tgcagctcat ttgctatcca catcgactgc tggacaatga
      241 ggatggggaa aacccccagc ggcagcgcat aaagcgcatt ctccagaact tggaccagtg
      301 gaccatgcgc cagtcttcct tggagctgca gctcatgatc aaagcagacc cctaacaatg
      361 agattgaact ccctcttgga ggaacatcgc caaggccaca atcgaggttt tccaacagtc
      421 agcagagaca gggtcatctt cctggaagta ctgcaagcaa catgccagca gcagcaagac
      481 caagcctgtg ctcagctctc tagagcgctc tggtgtatgg ctggtggccc ccctcattgc
      541 taaactgccc acctcagtcc agggacatgt gttaaaggct gctggggaag aattggagaa
      601 gggtcagcac ctgggttcct cttcacgcaa agaacgtgat cgacaaaagc agaagagcat
      661 gtccctattg agccagcagc ccttcttatc gctggtgcta acatgtctga aagggcagga
      721 tgaacaacgc gagggactcc ttacctccct ctacagccag gtgcaccaga ttgtgaataa
      781 ttggcgagat gacagtactt agatgattgc aaaccaaagc agcttatgca tgaggcactc
      841 aaactgcggc tcaacctggt ggggggcatg tttgacacgg tgcagcgcag cacccagcag
      901 accacggagt gggccatgct cctcctggag atcatcatca gcggcactgt cgacatgcag
      961 tccaacaatg agctcttcac tactgtgttg gacatgctga gcgtgctcat caatgggaca
     1021 ttggctgcag acatgtctag catctcgcaa ggtagcatgg aggaaaacaa gcgtgcatac
     1081 atgaacctgg cgaagaagtt gcagaaggag ttgggggagc gccagtcaga cagtctggaa
     1141 aaggttcgcc agctgctgcc actgcccaag cagacccgag atgtcatcac gtgtgagcca
     1201 cagggctccc ttatcgatac caagggcaac aagattgctg gcttcgattc catcttcaag
     1261 aaggagggtc tacaggtttc caccaaacag aagatctcgc cctgggatct ttttgagggg
     1321 ttgaagccgt cagcaccact ctcttggggc tggtttggaa cagtccgagt ggaccggcga
     1381 gtggctcgag gagaggagca gcagcggttg ctgctctacc acacacacct gaggccccgg
     1441 ccccgcgcct attacctgga gccactgcca ctgcccccag aagatgagga gccgcctgct
     1501 cctaccctgc tagagcctga gaaaaaggct ccagagcccc ccaaaactga caaaccgggg
     1561 gctgctccac ccagtactga ggaacgcaag aagaagtcca ccaagggcaa gaaacgcagc
     1621 cagccagcta ccaagacaga ggactatgga atgggcccgg gtcggagcgg cccttatggt
     1681 gtgacagtgc ctccggacct cctgcaccac ccaaaccctg gttctataac acaccttaac
     1741 tacaggcaag gctccatagg cctgtacacc cagaaccagc cactacctgc aggtggccct
     1801 cgtgtggacc cataccgtcc tgtgcgctta ccaatgcaga agctgcccac ccgaccaact
     1861 taccctggag tgctgcccac aaccatgact ggcgtcatgg gtttagaacc ctcctcttat
     1921 aagacctctg tgtaccggca gcagcaacct gcggtgcccc aaggacagcg ccttcgccaa
     1981 cagctccagg caaagataca gagtcagggc atgttgggac agtcatctgt ccatcagatg
     2041 actcccagct cttcctacgg tttgcagact tcccagggct atactcctta tgtttctcat
     2101 gtgggattgc agcaacacac aggccctgca ggtaccatgg tgccccccag ctactccagc
     2161 cagccttacc agagcaccca cccttctacc aatcctactc ttgtagatcc tacccgccac
     2221 ctgcaacagc ggcccagtgg ctatgtgcac cagcaggccc ccacctatgg acatggactg
     2281 acctccactc aaaggttttc acaccagaca ctgcagcaga cacccatgat aagtaccatg
     2341 actccaatga gtgcccaggg cgtccaggca ggcgtccgtt caacagccat cctacctgag
     2401 cagcagcagc agcagcaaca gcagcaacag caacagcagc agcagcagca acagcaacag
     2461 cagcagcagc agcagcagta ccacatccgg cagcagcagc agcagcagat cctgcggcag
     2521 cagcagcaac agcaacagca gcagcagcag cagcagcaac agcaacagca gcagcagcaa
     2581 cagcaacaac agcaacacca gcagcaacag cagcaacagg cggctcctcc ccaaccccag
     2641 ccccagtccc agccccagtt ccagcgccag gggcttcagc agacccagca gcagcaacag
     2701 acagcagctt tggtccggca acttcaacaa cagctctcta atacccagcc acagcccagt
     2761 accaacatat ttggacgcta ctgagccacc tggaggarct gcttgtgcac tggatgtggc
     2821 cccacccttt cctcttaatt cccaatccca ttcctgggct agcaccagta gtggttgggg
     2881 ccctcccctc aggctccatt tttaataagt ttttagtatt tttgttaatg tgaggcattg
     2941 agctgttggg ttttgtatat tatttatata gagaccccag agctgttgca cccaatacac
     3001 agagcttctt tgcaaaaaaa aaaaaaaaaa aaaaaaaaaa aaaaaaaaaa aaaaaaaaaa
     3061 aaaaaaaaaa aaaaaaaaaa aaaaaaaaaa aaaaaaaaaa aaa
//