LOCUS       HUMHPVME18              6042 bp    DNA     linear   VRL 30-NOV-1999
DEFINITION  Human cellular DNA/Human papillomavirus proviral DNA.
ACCESSION   M73258
VERSION     M73258.1
KEYWORDS    proviral gene.
SOURCE      Human papillomavirus
  ORGANISM  Human papillomavirus
            Viruses; dsDNA viruses, no RNA stage; Papillomaviridae;
            unclassified Papillomaviridae.
REFERENCE   1  (bases 1 to 6042)
  AUTHORS   Reuter,S., Delius,H., Kahn,T., Hofmann,B., zur Hausen,H. and
            Schwarz,E.
  TITLE     Characterization of a novel human papillomavirus DNA in the
            cervical carcinoma cell line ME180
  JOURNAL   J. Virol. 65 (10), 5564-5568 (1991)
   PUBMED   1716694
FEATURES             Location/Qualifiers
     source          1..5993
                     /organism="Human papillomavirus"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:10566"
                     /focus
     source          5994..6042
                     /organism="Homo sapiens"
                     /mol_type="genomic DNA"
                     /db_xref="taxon:9606"
                     /cell_line="ME180"
                     /cell_type="carcinoma"
                     /tissue_type="cervix"
     CDS             227..1636
                     /codon_start=1
                     /product="L2"
                     /protein_id="AAF14009.1"
                     /translation="MVSHRAARRKRASATELYKTCKQSGTCPPDVINKVEGTTLADKL
                     LQWTSLGIFLGGLGIGTGSGTGGRTGYIPLGGKPNTVVDVSPARPPVVIEPVGPTEPS
                     IVQLVEDSSVITSGTPVPTFTGTSGFEITSSSTTTPAVLDITPSSGSVQVSSTSFTNP
                     AFADPTIIEVPQTGEVSGNVFVSTPTSGTHGYEEIPMQVFATHGTGTEPISSTPIPGV
                     SRVAGPRLYSRAHQQVRVSNFDFVTHPSSFVTFDNPAFEPVDTTLTYEPADIAPDPDF
                     LDIVRLHRPALTSRRGTVRFSRVGKKATMFTRRGTQIGAQVHYYHDISGIAPADSIEL
                     QPLVAPEQSDPMDTLYDIYAPDTDNTTVLDTAFHNATFTSRSHISVPSLASTASTTYA
                     NTTIPIGTAWNTPVNTGPDVVLPATSPQLPLTPSTPIDTTYAITIYGTNYYLLPLLFF
                     LLKKRKRLPYFFADGIVAL"
     CDS             1617..3134
                     /codon_start=1
                     /product="L1"
                     /protein_id="AAF14010.1"
                     /translation="MALWRSSDNMVYLPPPSVAKVVNTDDYVTRTGIYYYAGTSRLLT
                     VGHPYFKVPMSGGRKQDIPKVSAYQYRVFRISLPDPNKFSLPESTLYNPDTQRLVWAC
                     VGVEIGRGQPLGVGLSGHPLYNRLDDTENSPFSSNKNPKDSRDNVSVDYKQTQLCIIG
                     CVPAIGEHWAKGKSCKPSNVQPGDCPPLELVNTPIQDGDMIDTGYGAMDFSTLQETKS
                     EVPLDICQSVCKYPDYLQMSADVYGDSMFFCLRREQLFARHFWNRGGMVGDTIPTELY
                     IKGTDIRDSPSSYVYAPSPSGSMVSSDSQLFNKPYWLHKAQGHNNGICWHNQLFLTVV
                     DTTRSTNFTLSTTTESAVPNIYDPNKFKEYIRHVEEYDLQFIFQLCTITLSTDVMSYI
                     HTMNPAILDDWNFGVAPPPSASLVDTYRYLQSAAITCQKDAPAPTKKDPYDGLNFWNV
                     NLKEKFSSELDQFPLGRKFLLQAGVRRRPTIGPRKRPATATTASTSKHKRKRVSK"
     CDS             3934..4422
                     /codon_start=1
                     /product="E6"
                     /protein_id="AAF14011.1"
                     /translation="MSIPMALFHNPEERPYKLPDLCRTLDTTLHDVTIDCVYCRRQLQ
                     RTEVYEFAFGDLNVVYRDGVPLAACQSCIKFYAKIRELRYYSESVYATTLETITNTKL
                     YDLSIRCMCCLKPLSPAEKLRHLNSKRRFHKIAGNFTGQCRHCWTSKREDRRRTRQET
                     QV"
     CDS             4430..4762
                     /codon_start=1
                     /product="E7"
                     /protein_id="AAF14012.1"
                     /translation="MHGPKPTVQEIVLELCPCNEIEPVDLVCHEQLGDSDDEIDEPDH
                     AVNHHQHQLLARRDEQQRHTIQCTCCKCNNLLQLVVEASRENLRNVELLFMDSLNFVC
                     PWCATETQ"
     CDS             4769..5119
                     /codon_start=1
                     /product="E1a"
                     /protein_id="AAF14013.1"
                     /translation="MANCEGTDGDGTGCNGWFFVQAIVDKQTGDTVSEDEDENATDTG
                     SDMVDFIDDATDICIQAERETAQVLLNMQQAQRDAQTVRALKRKYTDSIESSPLAKSP
                     LQELSIWKWKLTRR"
     CDS             5092..6042
                     /codon_start=1
                     /product="E1b"
                     /protein_id="AAF14014.1"
                     /translation="MEVETNSEVTVATNTNGADGEDEGENGDSIREDCSSVDSAIDSE
                     NQDPKSPTTQLKVLLQCNNKKAAMLTEFKKVYGLSFNDLVRTFKSDKTTCTDWVAAIF
                     GVNPTIAEGFKTLIKQYALYTHIQCLDTKNGILILMLIRYKCGKNRITVGKGLSTLLH
                     VPDSCMLLQPPKLRSPVAALYWYRTGISNISEVCGDTPEWIKRLTIIQHGIDDSVFDL
                     SDMVQWAFDNELTDESDIAFSYAMLADCNSNAAAFLKSNCQAKYVKDCATMCRHYKRA
                     QKRQMSMPQWIKFRCSKCDEGGDWRMDCRIYYLCLLQAIS"
BASE COUNT         1810 a         1155 c         1279 g         1798 t
ORIGIN      
        1 tatgtatgtt gcactgtccc gcttctgcag tccatgcatg tgtgtgtgta tgtgtggata
       61 cttgtgtttg tgtttatatt agtacgtacc acaccattgg aggtctttgc tgtatatata
      121 cttttttttt tactgcctat gtgggtatta cacagttttg ctcgttatag tatgccttaa
      181 gttttgtatt gtgcatttgt attggtgtat atttttataa ataaatatgg tatcacaccg
      241 tgctgccagg cgcaagcgtg catctgcaac tgaattatat aaaacatgca aacaatcagg
      301 cacatgtcct cctgatgtta taaataaggt tgaaggcacc acacttgcag acaaactatt
      361 gcaatggacc agtttaggta tttttttggg tggcctaggc attggtactg ggtcaggaac
      421 cgggggtcgt actgggtaca ttcctttagg tggtaaacct aatactgttg tagatgtttc
      481 gcctgcacgt ccacctgtgg ttattgaacc tgtgggtcct acagaaccct ccattgtgca
      541 attggtggaa gattccagtg ttattacatc tggcacaccg gtaccaacat ttacaggcac
      601 ttctgggttt gaaattacat cttcttctac cactacacct gctgtgttag acattacccc
      661 ttcgtctggg tctgtgcaag taagcagtac tagttttact aaccctgcat ttgcagaccc
      721 cactattata gaagtgcctc aaacaggtga agtctctggt aatgtgtttg taagtacccc
      781 cacatcggga acacatggat atgaagaaat acctatgcag gtatttgcaa cacatggcac
      841 tggtacagaa cctattagta gtacacctat acctggggtt agtcgtgtgg cagggccacg
      901 tttatatagt agggcacatc aacaggttcg tgttagtaat tttgattttg taactcaccc
      961 ttcatcattt gtaacatttg ataatcctgc ttttgagcct gttgatacta cacttacata
     1021 tgaacctgct gacatagctc ctgatccgga ttttctggac attgttcgtt tacataggcc
     1081 tgccttaact tcccgaagag gcacagtacg ttttagcaga gtaggcaaaa aggcaactat
     1141 gtttacacgc cggggtacac aaattggggc acaggtgcac tattatcatg atattagtgg
     1201 cattgctcct gctgacagca ttgaactaca acctttggtt gccccagagc agtctgaccc
     1261 tatggatact ttatatgata tatatgcacc agatactgac aatactacag tattggatac
     1321 tgcattccat aatgctacat ttacctcccg ttcccatata tctgttcctt cattagcgtc
     1381 tacagcatct actacatatg ctaacactac tattcctatt ggtactgctt ggaacacgcc
     1441 tgtaaatact ggtcctgatg ttgtgttacc agcaacgtct ccacagttgc ctttaacacc
     1501 ctctacacca attgatacaa cctatgccat aactatatat ggcaccaatt attatttatt
     1561 accattattg ttctttttat taaaaaaacg taaacgcctt ccttattttt ttgcagatgg
     1621 cattgtggcg ctctagcgac aacatggtgt atttgcctcc cccctcagtg gcgaaggttg
     1681 tcaatacaga tgattacgta acacgcactg gcatttatta ctatgctggt acatctaggt
     1741 tattaactgt aggccatcca tattttaagg tccctatgtc tgggggccgc aagcaggaca
     1801 ttcctaaggt gtctgcatat caatacaggg tgtttaggat ttccctacct gatcctaata
     1861 aatttagtct tcctgagtct acattatata accctgatac gcagcgattg gtatgggcct
     1921 gtgttggtgt tgaaataggt agggggcagc cattaggtgt tggccttagt gggcatccat
     1981 tatataatag gctagatgat actgaaaatt ccccgttttc ctccaacaaa aatcctaagg
     2041 acagtaggga caatgtttca gtggactata aacaaacgca actatgtatt ataggctgtg
     2101 ttcctgccat tggggagcac tgggccaaag gtaaatcttg taagcctagc aatgtgcagc
     2161 ccggggactg tccaccattg gaattagtaa atacacctat tcaggatggc gatatgattg
     2221 atacaggata tggtgctatg gactttagta cattacaaga aacaaaaagc gaggtgcctt
     2281 tagatatatg tcaatcagtc tgcaaatatc ctgactattt acaaatgtct gcagatgtat
     2341 atggagacag tatgttcttt tgtttacgta gggaacagtt atttgctagg catttttgga
     2401 atagaggggg catggtaggg gacactatac ctactgaatt gtatattaag ggcactgaca
     2461 tacgtgacag tcctagtagt tatgtatatg ccccctcgcc tagtgggtct atggtatcct
     2521 cagactccca gttatttaac aagccctatt ggctgcacaa ggcacaggga cacaacaatg
     2581 gtatttgttg gcataatcaa ttatttctta ctgttgtgga taccactcgc agtaccaatt
     2641 ttactttgtc tactactact gaatcagctg taccaaatat ttatgatcct aataaattta
     2701 aggaatatat taggcatgtt gaggaatatg atttgcaatt tatatttcag ttgtgtacta
     2761 taacattgtc cactgatgta atgtcctata tacatactat gaatcctgct attttggatg
     2821 attggaattt tggtgttgcc cctccaccat ctgctagtct tgtagataca taccgctatc
     2881 tgcaatcagc agcaattaca tgtcaaaaag acgcccctgc acctactaaa aaggatccat
     2941 atgatggctt aaacttttgg aatgtaaatt taaaggaaaa gtttagttct gaactggacc
     3001 agtttccttt aggacgcaaa tttcttttac aggcaggtgt ccgccgacga cccactatag
     3061 gcccccgtaa acgccctgcc acagcaacta ctgcatctac ctctaagcac aaacgtaaac
     3121 gtgtgtcaaa gtaattgttg tatgttttgt tttgtatgtt ggttgtatgt gtggttgtat
     3181 atgtgtcatg ttgttgttgg tatgttgtgc atgtatgtgt atatgtatat gtgtatgttt
     3241 gcaggtatgt ttgtataatc tgtttttgtt aataaagtat gtatgtcagt ttactttgtg
     3301 gttgcaccct gtgactaaca tatgtccttg ttttacatat cataggactg caacatttcc
     3361 tacataattt gtagccctac cctaaggtgt gttacagtac atgtaatata tatatagttc
     3421 tatattatac caagtggcca ttttgtaagg ccattttgtg tgcaaccgtt ttcggtcggt
     3481 ggtgctattt ccttctatac agtattaaaa actatgtgtt tcagcaaaaa catgtttcac
     3541 cttggtttac ccacatagtt ggcaccggta acagtatgta ctggcgcacc ttacttagtc
     3601 atcatcctgt ccaggtgcag tgcaacaata gtttggcagc ctatatatct ccacccttgt
     3661 aataaaactg cttttaggca taggttttta actgttttta cttgcctaat agcatagttg
     3721 gcctgtataa ctacttttgc attcaagaat gtgtcttgta gtgtaagtta tacagtgact
     3781 aataccacat ccataaattt gtgcaaccga aataggttgg gcacacatac caatactttt
     3841 acttataaca ttttacaatc attttatagt ataaagggag tgaccgaaaa cggtcatgac
     3901 cgaaaacggt gtatataaag ctgaacacag cagttgtcta taccaatggc gctatttcac
     3961 aaccctgagg aacggccata caaattgcca gacctgtgca ggacattgga caccacattg
     4021 catgacgtta caatagactg tgtctattgc agaaggcaac tacaacggac agaggtatat
     4081 gaatttgcct ttggtgactt aaatgtagta tatagggacg gggtaccatt agctgcatgc
     4141 caatcatgta ttaaatttta tgcgaaaata cgggaactac gatattactc agaatcggtg
     4201 tatgcaacaa cattagaaac cataactaat acaaagttat atgatttatc aataaggtgc
     4261 atgtgttgcc tgaaaccatt gagtcctgct gaaaaactaa ggcacctaaa ttcaaaacga
     4321 agatttcata aaatagcagg aaactttaca ggacagtgtc gccactgctg gaccagtaaa
     4381 cgagaggacc gcagacgcac acggcaggaa acacaagtat aaactaacta tgcatggacc
     4441 aaagcccacc gtgcaggaaa ttgtgttaga gttatgtcca tgcaatgaaa tagagccggt
     4501 cgaccttgta tgtcacgagc aattaggaga ttcagacgat gaaatagatg aacccgacca
     4561 tgcagttaat caccaccaac atcaactact agccagacgg gacgaacaac agcgtcacac
     4621 aattcagtgt acgtgttgta agtgtaacaa cctactgcaa ctagtagtag aagcgtcgcg
     4681 ggagaacctg cggaacgtag aactgctgtt tatggactca ctaaattttg tgtgtccgtg
     4741 gtgtgcaacg gaaacccagt aatctgcaat ggccaattgt gaaggtacag atggggacgg
     4801 gacggggtgt aacggatggt tttttgtaca agcaatagta gataaacaaa caggtgacac
     4861 agtctcagag gatgaggatg aaaacgcgac agatacaggt tcagacatgg tagatttcat
     4921 tgatgatgct acagatattt gtatacaggc agagcgtgag acagcacagg tactgttaaa
     4981 tatgcaacag gcccaaaggg atgcacaaac agtgcgtgcc ctaaaacgaa agtatacaga
     5041 cagtatagaa agcagccctt tagcaaagtc gccattacag gaactatcaa tatggaagtg
     5101 gaaactaact cggaggtaac tgtagcaact aatacaaatg gggcggacgg ggaggatgaa
     5161 ggggaaaatg gcgacagcat acgggaggac tgtagtagtg tagacagtgc tatagatagt
     5221 gaaaaccagg atcctaaatc acctactacg caactaaaag tattattaca atgtaataat
     5281 aaaaaagctg caatgttaac agaatttaaa aaagtatatg gattgtcctt taatgaccta
     5341 gtacgtacat ttaaaagtga taagaccaca tgtacggact gggtagcagc aatattcgga
     5401 gtaaatccaa ccattgccga agggtttaaa acactaatta aacaatatgc attatatacc
     5461 catatacaat gtttagatac aaaaaacgga atattaatat taatgttaat aagatacaaa
     5521 tgtgggaaaa atagaataac agtaggaaaa ggattaagta cattgttgca tgttccagac
     5581 agctgtatgc ttttgcagcc accaaaattg cgtagccctg ttgcagcatt gtattggtat
     5641 agaacaggaa tatctaatat tagtgaggtg tgtggagaca cgccagaatg gataaaaaga
     5701 ttaactataa tacaacatgg aatagatgat agtgtatttg atctatcaga catggtacaa
     5761 tgggcatttg ataatgagtt aacagatgaa agtgatatag cattttcata tgctatgttg
     5821 gcagattgta atagtaatgc tgcagcgttt ttaaaaagca actgtcaagc aaaatatgta
     5881 aaagattgtg caacaatgtg tagacattac aaacgggcac aaaaacgaca aatgtcaatg
     5941 ccgcaatgga ttaaatttag atgcagtaaa tgtgatgaag gcggtgattg gcgcatggac
     6001 tgcagaattt actacttgtg tttattacag gcgatttcct ga
//