LOCUS       CAG33200.1               227 aa    PRT              HUM 16-OCT-2008
DEFINITION  Homo sapiens CPSF5 protein.
ACCESSION   CR456919-1
PROTEIN_ID  CAG33200.1
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 684)
  AUTHORS   Ebert L., Schick M., Neubert P., Schatten R., Henze S., Korn B.
  TITLE     Cloning of human full open reading frames in Gateway(TM) system
            entry vector (pDONR201)
  JOURNAL   Unpublished.
REFERENCE   2  (bases 1 to 684)
  AUTHORS   Ebert L., Schick M., Neubert P., Schatten R., Henze S., Korn B.
  JOURNAL   Submitted (03-JUN-2004) to the INSDC. RZPD Deutsches
            Ressourcenzentrum fuer Genomforschung GmbH, Im Neuenheimer Feld
            580, D-69120 Heidelberg, Germany
COMMENT     RZPD; RZPDo834F1115D, ORFNo 1285
            www.rzpd.de/cgi-bin/products/cl.cgi?CloneID=RZPDo834F1115D
            RZPDLIB; Human Full ORF Clones Gateway(TM) - RZPD (kan-resist.)
            RZPD LIB No. 834
            www.rzpd.de/cgi-bin/products/showLib.pl.cgi/response?libNo=834
            www.rzpd.de/products/orfclones/
            Contact: Inge Arlart
            RZPD Deutsches Ressourcenzentrum fuer Genomforschung GmbH,
            Heubnerweg 6, D-14059 Berlin, Germany
            Tel: +49 30 32639 100
            Fax: +49 30 32639 111
            www.rzpd.de
            This clone is available from RZPD;
            contact RZPD (customer.service@rzpd.de) for further information.
            
            This CDS clone is a part of a collection of human full length
            expression clones generated by RZPD.
            This CDS has been cloned incl. stopcodon.
            The CDS has been inserted into pDONR201 via a BP Clonase(TM)
            reaction.
            Additional sequence has been added in front of the start codon:
            att..AAAAAA GCA GGC (ATG).
            The last base of the last coding triplett has been changed to T,
            which might lead to an amino acid change at the C terminus of the
            polypeptide.
            The stop codon has been set to TAA followed by
            TTAACCCAGCTTTCTT..att.
            Compared to the reference sequence NM_007006 we found amino acid
            exchange(s) at position (first base of changed triplet):
            169(asp->gly)
            Clone distribution: http://www.rzpd.de/products/orfclones/
FEATURES             Qualifiers
     source          /db_xref="H-InvDB:HIT000267769"
                     /organism="Homo sapiens"
                     /lab_host="DH10B"
                     /mol_type="mRNA"
                     /clone_lib="Human Full ORF Clones Gateway(TM) - RZPD"
                     /clone="RZPDo834F1115D"
                     /note="Vector: pDONR201, Site_1: attP1; Site_2: attP2"
                     /db_xref="taxon:9606"
     protein         /gene="CPSF5"
                     /db_xref="GOA:O43809"
                     /db_xref="H-InvDB:HIT000267769.13"
                     /db_xref="HGNC:HGNC:13870"
                     /db_xref="InterPro:IPR000086"
                     /db_xref="InterPro:IPR015797"
                     /db_xref="InterPro:IPR016706"
                     /db_xref="PDB:2CL3"
                     /db_xref="PDB:2J8Q"
                     /db_xref="PDB:3BAP"
                     /db_xref="PDB:3BHO"
                     /db_xref="PDB:3MDG"
                     /db_xref="PDB:3MDI"
                     /db_xref="PDB:3N9U"
                     /db_xref="PDB:3P5T"
                     /db_xref="PDB:3P6Y"
                     /db_xref="PDB:3Q2S"
                     /db_xref="PDB:3Q2T"
                     /db_xref="UniProtKB/Swiss-Prot:O43809"
BEGIN
        1 MSVVPPNRSQ TGWPRGVTQF GNKYIQQTKP LTLERTINLY PLTNYTFGTK EPLYEKGSSV
       61 AARFQRMREE FDKIGMRRTV EGVLIVHEHR LPHVLLLQLG TTFFKLPGGE LNPGEDEVEG
      121 LKRLMTEILG RQDGVLQDWV IDDCIGNWWR PNFEPPQYPY IPAHITKPKE HKKLFLVQLQ
      181 EKALFAVPKN YKLVAAPLFE LYDNAPGYGP IISSLPQLLS RFNFIYN
//