LOCUS AH002817 5440 bp DNA linear HUM 10-JUN-2016 DEFINITION Homo sapiens clone lambda-601 eosinophil peroxidase (EPP) gene, complete cds. ACCESSION AH002817 J05050 M26515 M29904 M29905 M29906 M29907 M29908 M29909 M29910 M29911 M29912 M29913 VERSION AH002817.2 KEYWORDS eosinophil peroxidase. SOURCE Homo sapiens (human) ORGANISM Homo sapiens Eukaryota; Metazoa; Chordata; Craniata; Vertebrata; Euteleostomi; Mammalia; Eutheria; Euarchontoglires; Primates; Haplorrhini; Catarrhini; Hominidae; Homo. REFERENCE 1 (bases 1 to 5440) AUTHORS Sakamaki,K., Tomonaga,M., Tsukui,K. and Nagata,S. TITLE Molecular cloning and characterization of a chromosomal gene for human eosinophil peroxidase JOURNAL J. Biol. Chem. 264 (28), 16828-16836 (1989) PUBMED 2550461 COMMENT On or before Jun 10, 2016 this sequence version replaced M29904.1, M29905.1, M29906.1, M29907.1, M29908.1, M29909.1, M29910.1, M29911.1, M29912.1, M29913.1, AH002817.1. FEATURES Location/Qualifiers source 1..5440 /organism="Homo sapiens" /mol_type="genomic DNA" /db_xref="taxon:9606" /chromosome="17" /clone="lambda-601" /tissue_type="placenta" /tissue_lib="M.Shibuya" gene 274..5440 /gene="EPP" regulatory 274..280 /regulatory_class="TATA_box" /gene="EPP" mRNA join(306..500,616..709,1030..1205,1323..1440,1572..1701, 1896..2102,2365..2683,3059..3219,3494..3749,4074..4244, 4542..4779,5018..>5219) /gene="EPP" /product="eosinophil peroxidase" exon 306..500 /gene="EPP" /number=1 CDS join(425..500,616..709,1030..1205,1323..1440,1572..1701, 1896..2102,2365..2683,3059..3219,3494..3749,4074..4244, 4542..4779,5018..5219) /gene="EPP" /note="precursor" /codon_start=1 /product="eosinophil peroxidase" /protein_id="AAA58458.1" /translation="MHLLPALAGVLATLVLAQPCEGTDPASPGAVETSVLRDCIAEAK LLVDAAYNWTQKSIKQRLRSGSASPMDLLSYFKQPVAATRTVVRAADYMHVALGLLEE KLQPQRSGPFNVTDVLTEPQLRLLSQASGCALRDQAERCSDKYRTITGRCNNKRRPLL GASNQALARWLPAEYEDGLSLPFGWTPSRRRNGFLLPLVRAVSNQIVRFPNERLTSDR GRALMFMQWGQFIDHDLDFSPESPARVAFTAGVDCERTCAQLPPCFPIKIPPNDPRIK NQRDCIPFFRSAPSCPQNKNRVRNQINALTSFVDASMVYGSEVSLSLRLRNRTNYLGL LAINQRFQDNGRALLPFDNLHDDPCLLTNRSARIPCFLAGDTRSTETPKLAAMHTLFM REHNRLATELRRLNPRWNGDKLYNEARKIMGAMVQIITYRDFLPLVLGKARARRTLGH YRGYCSNVDPRVANVFTLAFRFGHTMLQPFMFRLDSQYRASAPNSHVPLSSAFFASWR IVYEGGIDPILRGLMATPAKLNRQDAMLVDELRDRLFRQVRRIGLDLAALNMQRSRDH GLPGYNAWRRFCGLSQPRNLAQLSRVLKNQDLARKFLNLYGTPDNIDIWIGAIAEPLL PGARVGPLLACLFENQFRRARDGDRFWWQKRGVFTKRQRKALSRISLSRIICDNTGIT TVSRDIFRANIYPRGFVNCSRIPRLNLSAWRGT" mat_peptide join(1367..1440,1572..1701,1896..2051) /gene="EPP" /product="eosinophil peroxidase" /note="light chain" mat_peptide join(2052..2102,2365..2683,3059..3219,3494..3749, 4074..4244,4542..4779,5018..5216) /gene="EPP" /product="eosinophil peroxidase" /note="heavy chain" intron 501..615 /gene="EPP" /number=1 exon 616..709 /gene="EPP" /number=2 intron 710..>752 /gene="EPP" /number=2 gap 753..852 /estimated_length=unknown intron <853..1029 /gene="EPP" /number=2 exon 1030..1205 /gene="EPP" /number=3 intron 1206..>1209 /gene="EPP" /number=3 gap 1210..1309 /estimated_length=unknown intron <1310..1322 /gene="EPP" /number=3 exon 1323..1440 /gene="EPP" /number=4 intron 1441..1571 /gene="EPP" /number=4 exon 1572..1701 /gene="EPP" /number=5 intron 1702..>1738 /gene="EPP" /number=5 gap 1739..1838 /estimated_length=unknown intron <1839..1895 /gene="EPP" /number=5 exon 1896..2102 /gene="EPP" /number=6 intron 2103..>2241 /gene="EPP" /number=6 gap 2242..2341 /estimated_length=unknown intron <2342..2364 /gene="EPP" /number=6 exon 2365..2683 /gene="EPP" /number=7 intron 2684..>2823 /gene="EPP" /number=7 gap 2824..2923 /estimated_length=unknown intron <2924..3058 /gene="EPP" /number=7 exon 3059..3219 /gene="EPP" /number=8 intron 3220..>3248 /gene="EPP" /number=8 gap 3249..3348 /estimated_length=unknown intron <3349..3493 /gene="EPP" /number=8 exon 3494..3749 /gene="EPP" /number=9 intron 3750..>3812 /gene="EPP" /number=9 gap 3813..3912 /estimated_length=unknown intron <3913..4073 /gene="EPP" /number=9 exon 4074..4244 /gene="EPP" /number=10 intron 4245..>4322 /gene="EPP" /number=10 gap 4323..4422 /estimated_length=unknown intron <4423..4541 /gene="EPP" /number=10 exon 4542..4779 /gene="EPP" /number=11 intron 4780..>4903 /gene="EPP" /number=11 gap 4904..5003 /estimated_length=unknown intron <5004..5017 /gene="EPP" /number=11 exon 5018..>5219 /gene="EPP" /number=12 BASE COUNT 945 a 1357 c 1267 g 971 t ORIGIN 1 caccgctcct gtcagccaac aaatatccat tgagcgacac ctgtgtccca ggtgctgctc 61 tgggccctgg gagaagtgca tcagtgggct tggtagtaga gggtagggat ggagtgaagg 121 gtaggcagga agaatgtccc caggctggta ggaggtgggg tggggggttt cagtctcaaa 181 actcccatga aaaccagaga gaagtttcag aactccaccc aagaggctgg gtttctaggg 241 cccagagctg ccctccccca ccctagaatg ggctataaaa gtcccttccc agctacgtcc 301 agagaagagc tggaggaagt gagaggtcgg ctgggggtcc tcaaagtgag aggggagcag 361 aggatcctcc cgtgcaggct gtggatgtca ctcacttccc agctggtgaa gcctcgctgc 421 agagatgcat ctgctcccag ccctggcagg ggtcctggcc acactcgtcc tcgcccagcc 481 ctgtgagggc actgacccag gtaatagtcc cctagacagg caaggaggag ggaggggaaa 541 tggaagggga agcacttggg tcttggaggg ggtcttgtgg cttgctgaac cctgagtccc 601 catctctttg aacagcctcc cctggggcag tggagacctc ggtcctgcga gactgcatag 661 cagaggccaa gttgctggtg gatgctgcct acaattggac ccagaagagg tggacttggg 721 tctgggggct gcatgggcct gggaggatca gtnnnnnnnn nnnnnnnnnn nnnnnnnnnn 781 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 841 nnnnnnnnnn nncaagttca tctcactcat cagccacctc tggaccccat gaacatttcc 901 tgttggtaga gcctcccttc catccatcct tctgtccgct tgccctgtcc tgactgtgcc 961 ccaggactgg gtctctgctg ggtgggtctg caccctctct ccagccctca ctcctcctct 1021 cctgggcagc atcaagcagc ggcttcgcag cggttcagcc agccccatgg acctcctgtc 1081 ctacttcaaa caaccggtag cagccaccag gacagttgtt cgggccgcag attatatgca 1141 tgtggctttg gggctgcttg aagagaagtt acaaccccag cggtccggac ccttcaatgt 1201 cactggtacn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 1261 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnt gccttcccac 1321 agatgtgcta acagaaccac agctgcggct gctgtcccag gccagtggct gtgctctccg 1381 ggaccaggcc gagcgctgca gcgacaagta ccgcaccatc actggacggt gcaacaacaa 1441 gtgcgtgcgg ggcggcagga ggggctgccc ctgcctgggg gacctctccc ttcctgcacc 1501 caccctctcc ctccatgctg agccatctcc aggccctgcc ccctgctaac ctatcccacc 1561 catggctgca ggaggagacc cttgctaggg gcctccaacc aggctctggc tcgctggctg 1621 cccgccgagt atgaggatgg gctgtcgctc cccttcggct ggacccccag caggaggcgc 1681 aatggcttcc ttctccctct tgtgagttgg ggctgagggt ttgggaggtt gcttgatcnn 1741 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 1801 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnta ataccttgtg gggtcaggga 1861 gcccatgtcc cgtgctgatg ttatttcccc accaggtccg ggctgtctcc aaccagattg 1921 tgcgcttccc caatgagaga ctgacctccg accgtggccg agccctcatg ttcatgcagt 1981 ggggccagtt cattgaccat gacctggact tctccccgga gtccccggcc agagtggcct 2041 tcactgcagg cgttgactgt gagaggacct gcgcccagct gcccccctgc tttcccatca 2101 aggtacctac cctcagccaa tctcccatgc ccttgtgtgg cctcccccaa aggcaaggtg 2161 ctgggggtgg ggatctggaa gactggagca ccatccttaa ggagctgcct gtggagctag 2221 ggtatgagac agagacacaa gnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 2281 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 2341 ncactgtctc ctcttccatc tcagatccca cccaatgacc cccgcatcaa gaaccagcgt 2401 gactgcatcc ctttcttccg ctcggcaccc tcatgccccc aaaacaagaa cagagtccgc 2461 aaccagatca acgcgctcac ctcctttgtg gacgccagca tggtgtatgg cagtgaggtc 2521 tccctctcgc tgcggctccg caaccggacc aactacctgg ggctgctggc catcaaccag 2581 cgctttcaag acaacggccg ggccctgctg cccttcgaca acctgcacga tgacccctgt 2641 ctcctcacca accgctcggc gcgcatcccc tgcttcctgg caggtcagac agggaggaag 2701 gtggtgtctt cccaggaaac agccatccct ggggtcccaa ctgggaagca atggtgggat 2761 gtggtgaagg tacatggttt gggacctcag tattaggcac accataagca tggatctgtg 2821 cacnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 2881 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnntgaagag atggaggtcc 2941 agtgagggcc aggagtttgg cccaccccgt ctctcccatc cccagccctg ggtctaccct 3001 ggtagaaaga catttctctg ggaaaggctg cagtaaatct gagcttgggg ttttcaaggt 3061 gacacccgat caacggaaac ccccaaactg gcagccatgc acaccctctt tatgcgagag 3121 cacaaccggc tggccaccga gctgagacgc ctgaatcccc ggtggaatgg agacaaactg 3181 tacaatgagg ctcggaagat catgggggcc atggtccagg taaggagctc tgcatcccag 3241 catcccccnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 3301 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnct ttgtatctcc 3361 acccaccaat agtaaattaa tgttgtcaca tttgacgtga tgacaataaa gaatatgtct 3421 gagccaccct ttgaaaaggc aagggtatgg gtgagtagcc tctggggaat gttcctcctg 3481 tcttcccttc cagatcatca cctaccgaga ctttctgccc ctggttctgg gcaaggcccg 3541 ggccaggaga accctggggc actacagggg gtactgctcc aatgtggacc cacgggtggc 3601 caatgtcttc accctggcct tccgctttgg ccacacaatg ctccagccct tcatgttccg 3661 cttggacagt cagtaccggg cctccgcacc caactcgcat gtcccactta gctctgcctt 3721 ctttgccagc tggcggatcg tgtatgaagg tgaccaggtt ttccaggggg caaatggggg 3781 tgagggtggg gagcatgccc tcccctaggt ggnnnnnnnn nnnnnnnnnn nnnnnnnnnn 3841 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 3901 nnnnnnnnnn nntccagctg cttcatgtct ctccagaact ctgtttcctg acaaacgtta 3961 ctaacatacc cgactggctt gtccagctct gggctagctt ggcatcatgt gataacccaa 4021 gtagcttccc agaggctggt ccaatctgtg ctgctcacat tccctgccac cagggggcat 4081 cgaccccatc ctccggggcc tcatggccac ccctgccaag ctgaaccgtc aggatgccat 4141 gttagtggat gagctccggg accggctgtt tcggcaagtg aggaggattg ggctggacct 4201 ggcagctctc aacatgcaac gaagccggga ccacggcctt ccaggtgagg gggctgtcca 4261 cctcttctcc cagctttgct cgggccaggc tgctcaaggg gttctgggaa gaccctggta 4321 ccnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 4381 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnccgtctgg ttctgcccaa 4441 tattgactgg ccacagcttc cccccagagg actggtggag aaaaacagaa gctaatggga 4501 gatcagcaag actgaagctg cttctccccg ttcccctgca gggtacaatg cttggaggcg 4561 cttctgtggg ctctcccagc cccggaattt ggcacagctt agccgggtgc tgaaaaacca 4621 ggacttggca aggaagttcc tgaatttgta tggaacacct gacaacattg acatctggat 4681 tggggccatc gctgagcctc ttttgccggg ggctcgagtg gggcctcttc tggcttgtct 4741 gttcgagaac cagttcagaa gagcccgaga cggagacagg taagtgaccc tatcataaaa 4801 gacatcagca ccagaggcag agcagaaaaa cactagcatt tcaagactaa acattgaaga 4861 acactgctct ttttagtatc atttcttcca agttcacagg atcnnnnnnn nnnnnnnnnn 4921 nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn nnnnnnnnnn 4981 nnnnnnnnnn nnnnnnnnnn nnncgactgc ctggtaggtt ctggtggcag aaacgaggtg 5041 ttttcaccaa aagacagcgc aaggccctga gcagaatttc cttgtctcga attatatgtg 5101 acaataccgg tatcaccacg gtttcaaggg acatcttcag agccaacatc taccctcggg 5161 gctttgtgaa ctgcagccgt atccccaggt tgaacctatc agcctggcga gggacatgag 5221 gcttctgcag gtaaggggag gccacctcca gcaccctggg ctggttaagc ctcacatcct 5281 tccctggatg gatggctgag tcctcttagg tctctaagca gagaaaacag aacttgtcac 5341 taggtactct ttccaagtgg cttcccaatg tgctagtttc tgggctgaca gtcaattcca 5401 ggccctagga ctttgggggg aaattaggag catccaacta //