LOCUS       AH002817                5440 bp    DNA     linear   HUM 10-JUN-2016
DEFINITION  Homo sapiens clone lambda-601 eosinophil peroxidase (EPP) gene,
            complete cds.
ACCESSION   AH002817 J05050 M26515 M29904 M29905 M29906 M29907 M29908 M29909
            M29910 M29911 M29912 M29913
VERSION     AH002817.2
KEYWORDS    eosinophil peroxidase.
SOURCE      Homo sapiens (human)
  ORGANISM  Homo sapiens
            Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi;
            Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini;
            Catarrhini; Hominidae; Homo.
REFERENCE   1  (bases 1 to 5440)
  AUTHORS   Sakamaki,K., Tomonaga,M., Tsukui,K. and Nagata,S.
  TITLE     Molecular cloning and characterization of a chromosomal gene for
            human eosinophil peroxidase
  JOURNAL   J. Biol. Chem. 264 (28), 16828-16836 (1989)
   PUBMED   2550461
COMMENT     On or before Jun 10, 2016 this sequence version replaced M29904.1,
            M29905.1, M29906.1, M29907.1, M29908.1, M29909.1, M29910.1,
            M29911.1, M29912.1, M29913.1, AH002817.1.
FEATURES             Location/Qualifiers
     source          1..5440
                     /organism="Homo sapiens"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:9606"
                     /chromosome="17"
                     /clone="lambda-601"
                     /tissue_type="placenta"
                     /tissue_lib="M.Shibuya"
     gene            274..5440
                     /gene="EPP"
     regulatory      274..280
                     /regulatory_class="TATA_box"
                     /gene="EPP"
     mRNA            join(306..500,616..709,1030..1205,1323..1440,1572..1701,
                     1896..2102,2365..2683,3059..3219,3494..3749,4074..4244,
                     4542..4779,5018..>5219)
                     /gene="EPP"
                     /product="eosinophil peroxidase"
     exon            306..500
                     /gene="EPP"
                     /number=1
     CDS             join(425..500,616..709,1030..1205,1323..1440,1572..1701,
                     1896..2102,2365..2683,3059..3219,3494..3749,4074..4244,
                     4542..4779,5018..5219)
                     /gene="EPP"
                     /note="precursor"
                     /codon_start=1
                     /product="eosinophil peroxidase"
                     /protein_id="AAA58458.1"
                     /translation="MHLLPALAGVLATLVLAQPCEGTDPASPGAVETSVLRDCIAEAK
                     LLVDAAYNWTQKSIKQRLRSGSASPMDLLSYFKQPVAATRTVVRAADYMHVALGLLEE
                     KLQPQRSGPFNVTDVLTEPQLRLLSQASGCALRDQAERCSDKYRTITGRCNNKRRPLL
                     GASNQALARWLPAEYEDGLSLPFGWTPSRRRNGFLLPLVRAVSNQIVRFPNERLTSDR
                     GRALMFMQWGQFIDHDLDFSPESPARVAFTAGVDCERTCAQLPPCFPIKIPPNDPRIK
                     NQRDCIPFFRSAPSCPQNKNRVRNQINALTSFVDASMVYGSEVSLSLRLRNRTNYLGL
                     LAINQRFQDNGRALLPFDNLHDDPCLLTNRSARIPCFLAGDTRSTETPKLAAMHTLFM
                     REHNRLATELRRLNPRWNGDKLYNEARKIMGAMVQIITYRDFLPLVLGKARARRTLGH
                     YRGYCSNVDPRVANVFTLAFRFGHTMLQPFMFRLDSQYRASAPNSHVPLSSAFFASWR
                     IVYEGGIDPILRGLMATPAKLNRQDAMLVDELRDRLFRQVRRIGLDLAALNMQRSRDH
                     GLPGYNAWRRFCGLSQPRNLAQLSRVLKNQDLARKFLNLYGTPDNIDIWIGAIAEPLL
                     PGARVGPLLACLFENQFRRARDGDRFWWQKRGVFTKRQRKALSRISLSRIICDNTGIT
                     TVSRDIFRANIYPRGFVNCSRIPRLNLSAWRGT"
     mat_peptide     join(1367..1440,1572..1701,1896..2051)
                     /gene="EPP"
                     /product="eosinophil peroxidase"
                     /note="light chain"
     mat_peptide     join(2052..2102,2365..2683,3059..3219,3494..3749,
                     4074..4244,4542..4779,5018..5216)
                     /gene="EPP"
                     /product="eosinophil peroxidase"
                     /note="heavy chain"
     intron          501..615
                     /gene="EPP"
                     /number=1
     exon            616..709
                     /gene="EPP"
                     /number=2
     intron          710..>752
                     /gene="EPP"
                     /number=2
     gap             753..852
                     /estimated_length=unknown
     intron          <853..1029
                     /gene="EPP"
                     /number=2
     exon            1030..1205
                     /gene="EPP"
                     /number=3
     intron          1206..>1209
                     /gene="EPP"
                     /number=3
     gap             1210..1309
                     /estimated_length=unknown
     intron          <1310..1322
                     /gene="EPP"
                     /number=3
     exon            1323..1440
                     /gene="EPP"
                     /number=4
     intron          1441..1571
                     /gene="EPP"
                     /number=4
     exon            1572..1701
                     /gene="EPP"
                     /number=5
     intron          1702..>1738
                     /gene="EPP"
                     /number=5
     gap             1739..1838
                     /estimated_length=unknown
     intron          <1839..1895
                     /gene="EPP"
                     /number=5
     exon            1896..2102
                     /gene="EPP"
                     /number=6
     intron          2103..>2241
                     /gene="EPP"
                     /number=6
     gap             2242..2341
                     /estimated_length=unknown
     intron          <2342..2364
                     /gene="EPP"
                     /number=6
     exon            2365..2683
                     /gene="EPP"
                     /number=7
     intron          2684..>2823
                     /gene="EPP"
                     /number=7
     gap             2824..2923
                     /estimated_length=unknown
     intron          <2924..3058
                     /gene="EPP"
                     /number=7
     exon            3059..3219
                     /gene="EPP"
                     /number=8
     intron          3220..>3248
                     /gene="EPP"
                     /number=8
     gap             3249..3348
                     /estimated_length=unknown
     intron          <3349..3493
                     /gene="EPP"
                     /number=8
     exon            3494..3749
                     /gene="EPP"
                     /number=9
     intron          3750..>3812
                     /gene="EPP"
                     /number=9
     gap             3813..3912
                     /estimated_length=unknown
     intron          <3913..4073
                     /gene="EPP"
                     /number=9
     exon            4074..4244
                     /gene="EPP"
                     /number=10
     intron          4245..>4322
                     /gene="EPP"
                     /number=10
     gap             4323..4422
                     /estimated_length=unknown
     intron          <4423..4541
                     /gene="EPP"
                     /number=10
     exon            4542..4779
                     /gene="EPP"
                     /number=11
     intron          4780..>4903
                     /gene="EPP"
                     /number=11
     gap             4904..5003
                     /estimated_length=unknown
     intron          <5004..5017
                     /gene="EPP"
                     /number=11
     exon            5018..>5219
                     /gene="EPP"
                     /number=12
BASE COUNT          945 a         1357 c         1267 g          971 t
ORIGIN      
        1 caccgctcct gtcagccaac aaatatccat tgagcgacac ctgtgtccca ggtgctgctc
       61 tgggccctgg gagaagtgca tcagtgggct tggtagtaga gggtagggat ggagtgaagg
      121 gtaggcagga agaatgtccc caggctggta ggaggtgggg tggggggttt cagtctcaaa
      181 actcccatga aaaccagaga gaagtttcag aactccaccc aagaggctgg gtttctaggg
      241 cccagagctg ccctccccca ccctagaatg ggctataaaa gtcccttccc agctacgtcc
      301 agagaagagc tggaggaagt gagaggtcgg ctgggggtcc tcaaagtgag aggggagcag
      361 aggatcctcc cgtgcaggct gtggatgtca ctcacttccc agctggtgaa gcctcgctgc
      421 agagatgcat ctgctcccag ccctggcagg ggtcctggcc acactcgtcc tcgcccagcc
      481 ctgtgagggc actgacccag gtaatagtcc cctagacagg caaggaggag ggaggggaaa
      541 tggaagggga agcacttggg tcttggaggg ggtcttgtgg cttgctgaac cctgagtccc
      601 catctctttg aacagcctcc cctggggcag tggagacctc ggtcctgcga gactgcatag
      661 cagaggccaa gttgctggtg gatgctgcct acaattggac ccagaagagg tggacttggg
      721 tctgggggct gcatgggcct gggaggatca gtnnnnnnnn nnnnnnnnnn nnnnnnnnnn
      781 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn
      841 nnnnnnnnnn nncaagttca tctcactcat cagccacctc tggaccccat gaacatttcc
      901 tgttggtaga gcctcccttc catccatcct tctgtccgct tgccctgtcc tgactgtgcc
      961 ccaggactgg gtctctgctg ggtgggtctg caccctctct ccagccctca ctcctcctct
     1021 cctgggcagc atcaagcagc ggcttcgcag cggttcagcc agccccatgg acctcctgtc
     1081 ctacttcaaa caaccggtag cagccaccag gacagttgtt cgggccgcag attatatgca
     1141 tgtggctttg gggctgcttg aagagaagtt acaaccccag cggtccggac ccttcaatgt
     1201 cactggtacn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn
     1261 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnt gccttcccac
     1321 agatgtgcta acagaaccac agctgcggct gctgtcccag gccagtggct gtgctctccg
     1381 ggaccaggcc gagcgctgca gcgacaagta ccgcaccatc actggacggt gcaacaacaa
     1441 gtgcgtgcgg ggcggcagga ggggctgccc ctgcctgggg gacctctccc ttcctgcacc
     1501 caccctctcc ctccatgctg agccatctcc aggccctgcc ccctgctaac ctatcccacc
     1561 catggctgca ggaggagacc cttgctaggg gcctccaacc aggctctggc tcgctggctg
     1621 cccgccgagt atgaggatgg gctgtcgctc cccttcggct ggacccccag caggaggcgc
     1681 aatggcttcc ttctccctct tgtgagttgg ggctgagggt ttgggaggtt gcttgatcnn
     1741 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn
     1801 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnta ataccttgtg gggtcaggga
     1861 gcccatgtcc cgtgctgatg ttatttcccc accaggtccg ggctgtctcc aaccagattg
     1921 tgcgcttccc caatgagaga ctgacctccg accgtggccg agccctcatg ttcatgcagt
     1981 ggggccagtt cattgaccat gacctggact tctccccgga gtccccggcc agagtggcct
     2041 tcactgcagg cgttgactgt gagaggacct gcgcccagct gcccccctgc tttcccatca
     2101 aggtacctac cctcagccaa tctcccatgc ccttgtgtgg cctcccccaa aggcaaggtg
     2161 ctgggggtgg ggatctggaa gactggagca ccatccttaa ggagctgcct gtggagctag
     2221 ggtatgagac agagacacaa gnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn
     2281 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn
     2341 ncactgtctc ctcttccatc tcagatccca cccaatgacc cccgcatcaa gaaccagcgt
     2401 gactgcatcc ctttcttccg ctcggcaccc tcatgccccc aaaacaagaa cagagtccgc
     2461 aaccagatca acgcgctcac ctcctttgtg gacgccagca tggtgtatgg cagtgaggtc
     2521 tccctctcgc tgcggctccg caaccggacc aactacctgg ggctgctggc catcaaccag
     2581 cgctttcaag acaacggccg ggccctgctg cccttcgaca acctgcacga tgacccctgt
     2641 ctcctcacca accgctcggc gcgcatcccc tgcttcctgg caggtcagac agggaggaag
     2701 gtggtgtctt cccaggaaac agccatccct ggggtcccaa ctgggaagca atggtgggat
     2761 gtggtgaagg tacatggttt gggacctcag tattaggcac accataagca tggatctgtg
     2821 cacnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn
     2881 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnntgaagag atggaggtcc
     2941 agtgagggcc aggagtttgg cccaccccgt ctctcccatc cccagccctg ggtctaccct
     3001 ggtagaaaga catttctctg ggaaaggctg cagtaaatct gagcttgggg ttttcaaggt
     3061 gacacccgat caacggaaac ccccaaactg gcagccatgc acaccctctt tatgcgagag
     3121 cacaaccggc tggccaccga gctgagacgc ctgaatcccc ggtggaatgg agacaaactg
     3181 tacaatgagg ctcggaagat catgggggcc atggtccagg taaggagctc tgcatcccag
     3241 catcccccnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn
     3301 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnct ttgtatctcc
     3361 acccaccaat agtaaattaa tgttgtcaca tttgacgtga tgacaataaa gaatatgtct
     3421 gagccaccct ttgaaaaggc aagggtatgg gtgagtagcc tctggggaat gttcctcctg
     3481 tcttcccttc cagatcatca cctaccgaga ctttctgccc ctggttctgg gcaaggcccg
     3541 ggccaggaga accctggggc actacagggg gtactgctcc aatgtggacc cacgggtggc
     3601 caatgtcttc accctggcct tccgctttgg ccacacaatg ctccagccct tcatgttccg
     3661 cttggacagt cagtaccggg cctccgcacc caactcgcat gtcccactta gctctgcctt
     3721 ctttgccagc tggcggatcg tgtatgaagg tgaccaggtt ttccaggggg caaatggggg
     3781 tgagggtggg gagcatgccc tcccctaggt ggnnnnnnnn nnnnnnnnnn nnnnnnnnnn
     3841 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn
     3901 nnnnnnnnnn nntccagctg cttcatgtct ctccagaact ctgtttcctg acaaacgtta
     3961 ctaacatacc cgactggctt gtccagctct gggctagctt ggcatcatgt gataacccaa
     4021 gtagcttccc agaggctggt ccaatctgtg ctgctcacat tccctgccac cagggggcat
     4081 cgaccccatc ctccggggcc tcatggccac ccctgccaag ctgaaccgtc aggatgccat
     4141 gttagtggat gagctccggg accggctgtt tcggcaagtg aggaggattg ggctggacct
     4201 ggcagctctc aacatgcaac gaagccggga ccacggcctt ccaggtgagg gggctgtcca
     4261 cctcttctcc cagctttgct cgggccaggc tgctcaaggg gttctgggaa gaccctggta
     4321 ccnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn
     4381 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnccgtctgg ttctgcccaa
     4441 tattgactgg ccacagcttc cccccagagg actggtggag aaaaacagaa gctaatggga
     4501 gatcagcaag actgaagctg cttctccccg ttcccctgca gggtacaatg cttggaggcg
     4561 cttctgtggg ctctcccagc cccggaattt ggcacagctt agccgggtgc tgaaaaacca
     4621 ggacttggca aggaagttcc tgaatttgta tggaacacct gacaacattg acatctggat
     4681 tggggccatc gctgagcctc ttttgccggg ggctcgagtg gggcctcttc tggcttgtct
     4741 gttcgagaac cagttcagaa gagcccgaga cggagacagg taagtgaccc tatcataaaa
     4801 gacatcagca ccagaggcag agcagaaaaa cactagcatt tcaagactaa acattgaaga
     4861 acactgctct ttttagtatc atttcttcca agttcacagg atcnnnnnnn nnnnnnnnnn
     4921 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn
     4981 nnnnnnnnnn nnnnnnnnnn nnncgactgc ctggtaggtt ctggtggcag aaacgaggtg
     5041 ttttcaccaa aagacagcgc aaggccctga gcagaatttc cttgtctcga attatatgtg
     5101 acaataccgg tatcaccacg gtttcaaggg acatcttcag agccaacatc taccctcggg
     5161 gctttgtgaa ctgcagccgt atccccaggt tgaacctatc agcctggcga gggacatgag
     5221 gcttctgcag gtaaggggag gccacctcca gcaccctggg ctggttaagc ctcacatcct
     5281 tccctggatg gatggctgag tcctcttagg tctctaagca gagaaaacag aacttgtcac
     5341 taggtactct ttccaagtgg cttcccaatg tgctagtttc tgggctgaca gtcaattcca
     5401 ggccctagga ctttgggggg aaattaggag catccaacta
//