LOCUS       BC006083                2504 bp    mRNA    linear   HUM 16-SEP-2003
DEFINITION  Homo sapiens tyrosyl-DNA phosphodiesterase 1, mRNA (cDNA clone
            IMAGE:2961386), complete cds.
ACCESSION   BC006083
VERSION     BC006083.1
KEYWORDS    .
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 2504)
  AUTHORS   Strausberg,R.L., Feingold,E.A., Grouse,L.H., Derge,J.G.,
            Klausner,R.D., Collins,F.S., Wagner,L., Shenmen,C.M., Schuler,G.D.,
            Altschul,S.F., Zeeberg,B., Buetow,K.H., Schaefer,C.F., Bhat,N.K.,
            Hopkins,R.F., Jordan,H., Moore,T., Max,S.I., Wang,J., Hsieh,F.,
            Diatchenko,L., Marusina,K., Farmer,A.A., Rubin,G.M., Hong,L.,
            Stapleton,M., Soares,M.B., Bonaldo,M.F., Casavant,T.L.,
            Scheetz,T.E., Brownstein,M.J., Usdin,T.B., Toshiyuki,S.,
            Carninci,P., Prange,C., Raha,S.S., Loquellano,N.A., Peters,G.J.,
            Abramson,R.D., Mullahy,S.J., Bosak,S.A., McEwan,P.J.,
            McKernan,K.J., Malek,J.A., Gunaratne,P.H., Richards,S.,
            Worley,K.C., Hale,S., Garcia,A.M., Gay,L.J., Hulyk,S.W.,
            Villalon,D.K., Muzny,D.M., Sodergren,E.J., Lu,X., Gibbs,R.A.,
            Fahey,J., Helton,E., Ketteman,M., Madan,A., Rodrigues,S.,
            Sanchez,A., Whiting,M., Madan,A., Young,A.C., Shevchenko,Y.,
            Bouffard,G.G., Blakesley,R.W., Touchman,J.W., Green,E.D.,
            Dickson,M.C., Rodriguez,A.C., Grimwood,J., Schmutz,J., Myers,R.M.,
            Butterfield,Y.S., Krzywinski,M.I., Skalska,U., Smailus,D.E.,
            Schnerch,A., Schein,J.E., Jones,S.J. and Marra,M.A.
  TITLE     Generation and initial analysis of more than 15,000 full-length
            human and mouse cDNA sequences
  JOURNAL   Proc. Natl. Acad. Sci. U.S.A. 99 (26), 16899-16903 (2002)
   PUBMED   12477932
REFERENCE   2  (bases 1 to 2504)
  AUTHORS   Strausberg,R.
  TITLE     Direct Submission
  JOURNAL   Submitted (02-APR-2001) National Institutes of Health, Mammalian
            Gene Collection (MGC), Cancer Genomics Office, National Cancer
            Institute, 31 Center Drive, Room 11A03, Bethesda, MD 20892-2590,
            USA
  REMARK    NIH-MGC Project URL: http://mgc.nci.nih.gov
COMMENT     Contact: MGC help desk
            Email: cgapbs-r@mail.nih.gov
            Tissue Procurement: ATCC
            cDNA Library Preparation: Rubin Laboratory
            cDNA Library Arrayed by: The I.M.A.G.E. Consortium (LLNL)
            DNA Sequencing by: Genome Sequence Centre,
            BC Cancer Agency, Vancouver, BC, Canada
            info@bcgsc.bc.ca
            Steven Jones, Jennifer Asano, Ian Bosdet, Yaron Butterfield,
            Susanna Chan, Readman Chiu, Chris Fjell, Erin Garland, Ran Guin,
            Letticia Hsiao, Martin Krzywinski, Reta Kutsche, Oliver Lee, Soo
            Sen Lee, Victor Ling, Carrie Mathewson, Candice McLeavy, Steven
            Ness, Pawan Pandoh, Anna-Liisa Prabhu, Parvaneh Saeedi, Jacqueline
            Schein, Duane Smailus, Michael Smith, Lorraine Spence, Jeff Stott,
            Michael Thorne, Miranada Tsai, Natasja van den Bosch, Jill Vardy,
            George Yang, Scott Zuyderduyn, Marco Marra.
            
            Clone distribution: MGC clone distribution information can be found
            through the I.M.A.G.E. Consortium/LLNL at: http://image.llnl.gov
            Series: IRAL Plate: 18 Row: b Column: 23
            This clone was selected for full length sequencing because it
            passed the following selection criteria: matched mRNA gi: 20127585
            This clone has the following problem: The cds is short compared to
            the longest cds in the locus.
FEATURES             Location/Qualifiers
     source          1..2504
                     /db_xref="H-InvDB:HIT000032592"
                     /organism="Homo sapiens"
                     /mol_type="mRNA"
                     /db_xref="taxon:9606"
                     /clone="IMAGE:2961386"
                     /tissue_type="Muscle, rhabdomyosarcoma"
                     /clone_lib="NIH_MGC_17"
                     /lab_host="DH10B-R"
                     /note="Vector: pOTB7"
     gene            1..2504
                     /gene="TDP1"
                     /gene_synonym="FLJ11090"
                     /gene_synonym="SCAN1"
                     /db_xref="GeneID:55775"
                     /db_xref="MIM:607198"
     CDS             244..1140
                     /gene="TDP1"
                     /gene_synonym="FLJ11090"
                     /gene_synonym="SCAN1"
                     /codon_start=1
                     /product="TDP1 protein"
                     /protein_id="AAH06083.1"
                     /db_xref="GeneID:55775"
                     /db_xref="MIM:607198"
                     /translation="MSQEGDYGRWTISSSDESEEEKPKPDKPSTSSLLCARQGAANEP
                     RYTCSEAQKAAHKRKISPVKFSNTDSVLPPKRQKSGSQEDLGWCLSSSDDELQPEMPQ
                     KQAEKVVIKKEKDISAPNDGTAQRTENHGAPACHRLKEEEDEYETSGEGQDIWDMLDK
                     GNPFQFYLTRVSGVKPKYNSGALHIKDILSPLFGTLVSSAQFNYCFDVDWLVKQYPPE
                     FRKKPILLVHGDKREAKAHLHAQAKPYENISLCQAKLDIAFGTHHTKMMLLLYEEGLR
                     VVIHTSNLIHADWHQKTQGTHL"
BASE COUNT          714 a          590 c          591 g          609 t
ORIGIN      
        1 ccattctccg cagagttgga gcacacagct gtattaaaaa ggcaaatcga aggccgggcg
       61 cggtgactca cgcctgtcat cctagcactt tgggaggccg aggcggctga atcacttgag
      121 gttaggagtt tgagatcagc ccgggcaaca tggtgaaacc ccgtctctac aaaaatagaa
      181 aaattagccg agcgtgatgg tggatgcctg taatcctagc tcttcgggag gctaaggagt
      241 ataatgtctc aggaaggcga ttatgggagg tggaccatat ctagtagtga tgaaagtgag
      301 gaagaaaagc caaaaccaga caagccatct acctcttctc ttctctgtgc caggcaagga
      361 gcagcaaatg agcccaggta cacctgttcc gaggcccaga aagctgcaca caagaggaaa
      421 atatcacctg tgaaattcag caatacagat tcagttttac ctcccaaaag gcagaaaagc
      481 ggttcccagg aggacctcgg ctggtgtctg tccagcagtg atgatgagct gcaaccagaa
      541 atgccgcaga agcaggctga gaaagtggtg atcaaaaagg agaaagacat ctctgctccc
      601 aatgacggca ctgcccaaag aactgaaaat catggcgctc ccgcctgcca caggctcaaa
      661 gaggaggaag acgagtatga gacatcaggg gagggccagg acatttggga catgctggat
      721 aaagggaacc ccttccagtt ttacctcact agagtctctg gagttaagcc aaagtataac
      781 tctggagccc tccacatcaa ggatatttta tctcctttat ttgggacgct tgtttcttca
      841 gctcagttta actactgctt tgacgtggac tggctcgtaa aacagtatcc accagagttc
      901 aggaagaagc caatcctgct tgtgcatggt gataagcgag aggctaaggc tcacctccat
      961 gcccaggcca agccttacga gaacatctct ctctgccagg caaagttgga tattgcgttt
     1021 ggaacacacc acacgaaaat gatgctgctg ctctatgaag aaggcctccg ggttgtcata
     1081 cacacctcca acctcatcca tgctgactgg caccagaaaa ctcaaggaac tcacctgtga
     1141 gtgaatctct gatccaggag gagcctcact cagcctggga actttgaggt gctattgcaa
     1201 ggggaggtcc tccacgtctg tccagcccaa cctggtcatt ttacacacgg aggcaaaggc
     1261 ccagagagat cacagagctt acccaaaatg aatatggttg agccccttat acccacgaat
     1321 tgctgatgga acccacaaat ctggagagtc gccaacacat tttaaagctg atctcatcag
     1381 ttacttgatg gcttataatg ccccttctct caaggagtgg atagatgtca ttcacaagca
     1441 cgatctctct gaaacaaatg tttatcttat tggttcaacc ccaggacgct ttcaaggaag
     1501 tcaaaaagat aattggggac attttagact taagaagctt tgcataatta tcaaagcagg
     1561 aaatgcagat cagtcttctg cagtgtttta gctgcttctg aaagaccatg cctcatccat
     1621 gcctaacgca gagtcctggc ctgtcgtagg tcagttttca agcgttggct ccttgggagc
     1681 cgatgaatca aagtggttat gttctgagtt taaagagagc atgctgacac tggggaagga
     1741 aagcaagact ccaggaaaaa gctctgttcc tctttacttg atctatcctt ctgtggaaaa
     1801 tgtgcggacc agtttagaag gatatcctgc tgggggctct cttccctata gcatccagac
     1861 agctgaaaaa cagaattggc tgcattccta ttttcacaaa tggtcagctg agacttctgg
     1921 ccgcagcaat gccatgccac atattaagac atatatgagg ccttctccag acttcagtaa
     1981 aattgcttgg ttccttgtca caagcgcaaa tctgtccaag gctgcctggg gagcattgga
     2041 gaagaatggc acccagctga tgatccgctc ctacgagctc ggggtccttt tcctcccttc
     2101 agcatttggt ctagacagtt tcaaagtgaa acagaagttc ttcgctggca gccaggagcc
     2161 aatggccacc tttcctgtgc catatgattt gcctccagaa ctgtatggaa gtaaagatcg
     2221 gccatggata tggaacattc cttatgtcaa agcaccggat acgcatggga acatgtgggt
     2281 gccctcctga gaatcttgag gcactgtgaa atttaagtgt aagacattga gccacaaaca
     2341 tggaatctct tctttgtact ggatgtccac ttcccttaaa gtcttatttg cacccttaca
     2401 aaatctttcc aaaggtcact cttatgaatg gatgttggtt atacttttaa tggacattaa
     2461 cattcctaat aaagtattag tttcttaaaa aaaaaaaaaa aaaa
//