LOCUS       AF043239                6125 bp    DNA     linear   BCT 04-OCT-1999
DEFINITION  Salmonella typhimurium SopE (sopE) gene, complete cds.
ACCESSION   AF043239
VERSION     AF043239.1
KEYWORDS    .
SOURCE      Salmonella enterica subsp. enterica serovar Typhimurium str. SL1344
  ORGANISM  Salmonella enterica subsp. enterica serovar Typhimurium str. SL1344
            Bacteria; Proteobacteria; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Salmonella.
REFERENCE   1  (bases 1 to 6125)
  AUTHORS   Hardt,W.D., Urlaub,H. and Galan,J.E.
  TITLE     A substrate of the centisome 63 type III protein secretion system
            of Salmonella typhimurium is encoded by a cryptic bacteriophage
  JOURNAL   Proc. Natl. Acad. Sci. U.S.A. 95 (5), 2574-2579 (1998)
   PUBMED   9482928
REFERENCE   2  (bases 1 to 6125)
  AUTHORS   Galan,J.E.
  TITLE     Direct Submission
  JOURNAL   Submitted (15-JAN-1998) Molecular Genetics and Microbiology, School
            of Medicine, State University of New York at Stony Brook, Stony
            Brook, NY 11794-5222, USA
FEATURES             Location/Qualifiers
     source          1..6125
                     /organism="Salmonella enterica subsp. enterica serovar
                     Typhimurium str. SL1344"
                     /mol_type="genomic DNA"
                     /strain="SL1344"
                     /serovar="Typhimurium"
                     /sub_species="enterica"
                     /db_xref="taxon:216597"
     CDS             <1..950
                     /note="OrfK; similar to OrfK protein of bacteriophage 186
                     and other P2-like bacteriophages"
                     /codon_start=3
                     /transl_table=11
                     /product="unknown"
                     /protein_id="AAC02069.1"
                     /translation="AALDTLNELAAALGNDPNFATTMLNALGGKQPLDNTLTNLSGKD
                     VAGLLAYLCLGETINRAADALQKSQNGADIPDKPRFVQNIGLKETLNPTKRVSIGNIG
                     TGVFDGSTPCINIGDSDSGFIGSADGVLDIYCNGAKVGYINGNGLHMLTDIHFDNARM
                     TTNGDIFSSVWGDNWLSIWITNQLNTRGTIDWINSELAIRDNNINTRATIDYVNQTFA
                     RKNTGSIQDWGWILDDSTGFIMQWGTLGNSNGTYNFPRAFPVGCFAVFVTNTNAQGTQ
                     VDNAFGYPVSNSQFFAATKSSAIANMVNNFPVAWFAIGR"
     CDS             957..1241
                     /note="Orf45; similar to Orf45 protein of bacteriophage
                     186 and other P2-like bacteriophages"
                     /codon_start=1
                     /transl_table=11
                     /product="unknown"
                     /protein_id="AAC02070.1"
                     /translation="MSDYYYSFKEKGFFWQPDTESDNYPDDLIPLTDEYYRELMQGQV
                     DGKYIEHRKGGPVLVEHRNIRLKSWLHRLKPEKRNFLLRQSQLLRHWRGR"
     gene            complement(1560..2282)
                     /gene="sopE"
     CDS             complement(1560..2282)
                     /gene="sopE"
                     /note="similar to Salmonella dublin SopE protein;
                     substrate of the centisome 63 type III protein secretion
                     system"
                     /codon_start=1
                     /transl_table=11
                     /product="SopE"
                     /protein_id="AAC02071.1"
                     /translation="MTKITLSPQNFRIQKQETTLLKEKSTEKNSLAKSILAVKNHFIE
                     LRSKLSERFISHKNTESSATHFHRGSASEGRAVLTNKVVKDFMLQTLNDIDIRGSASK
                     DPAYASQTREAILSAVYSKNKDQCCNLLISKGINIAPFLQEIGEAAKNAGLPGTTKND
                     VFTPSGAGANPFITPLISSANSKYPRMFINQHQQASFKIYAEKIIMTEVAPLFNECAM
                     PTPQQFQLILENIANKYIQNTP"
     CDS             2496..2699
                     /note="OrfR; similar to bacterial DNA recombinases;
                     incomplete sequence; probably not expressed"
                     /codon_start=1
                     /transl_table=11
                     /product="unknown"
                     /protein_id="AAC02072.1"
                     /translation="MECELIVERTSAGLEVVRSKGRIGGRRPKLTPEQWEQAGRLLAA
                     GETRHRVGLLFDVSIPLFTRNSL"
     CDS             2816..3988
                     /note="OrfJ; similar to OrfJ protein of bacteriophage 186
                     and other P2-like bacteriophages"
                     /codon_start=1
                     /transl_table=11
                     /product="unknown"
                     /protein_id="AAC02073.1"
                     /translation="MAQDYHHGVRVVEINEGTRPITTLSTAIVGMVCTGDDADASVFP
                     LNKPVLLTDVLTASGKAGESGTLARSLDAIADQAKPVTVVVRVAQGETEAETTSNIIG
                     GVTSDGKKTGMKALLSAQSQLGVKPRILGVPGHDTQAVATELLGVAQSLRGFAYLAAN
                     GCKTVEEAIAYRENFSQREGMLIWPDFINFDTVLKADATAYASARALGLRAKIDEQIG
                     WHKTLSNVGVNGVTGISADVFWDLQDPATDAGLLNKNDVTTLIRKDGFRFWGSRCLSD
                     DPLFAFENYTRTAQVLADTMAEAHMWAVDGVLNPSLARDIIEGLRAKMRSLVNQGYLI
                     GGDCWLDESVNDKDALKAGKLTIDYDYTPVPPLENLMLRQRITDRYLVDFASRVAA"
     CDS             3998..4513
                     /note="OrfI; similar to OrfI protein of bacteriophage 186
                     and other P2-like bacteriophages"
                     /codon_start=1
                     /transl_table=11
                     /product="unknown"
                     /protein_id="AAC02074.1"
                     /translation="MALPRKLKHLNLFNDGNNWQGIVESLTLPKFTRKFEKYRGGGMP
                     GAVDVDMGLDDGALDTEFSIGGTELLLFKQMGKATVDGIQLRFTGSIQRDDTGEVQAV
                     ELVVRGRHKEVDSGEWKTGESSSTKVSSTNSYAKLTINGEVLYEVDLVNMVEIVGGVD
                     LMEAHRNALGL"
     CDS             4568..4870
                     /note="OrfH; similar to OrfH protein of bacteriophage 186
                     and other P2-like bacteriophages"
                     /codon_start=1
                     /transl_table=11
                     /product="unknown"
                     /protein_id="AAC02075.1"
                     /translation="MSDKLTEKTVELDTPIMRGKAEITEIVLRKPQSGALRGTRLQAI
                     MDMDVGAMMTVIPRISTPTLTAQEMAELDPADLTALSVEVVTFLLKKSVLAGLPTA"
     CDS             5015..>6125
                     /note="OrfG; similar to OrfG protein of bacteriophage 186"
                     /codon_start=1
                     /transl_table=11
                     /product="unknown"
                     /protein_id="AAC02076.1"
                     /translation="MSDNNLRLQVILNAVDKLTRPFRSAQASSKELAAAIQQSRARLK
                     ELDAQAGRIDGFRKASAQLAVTGNSLKAAREEAAKLATQFSATNRPTAAQARLLEQAK
                     NRVTELQSKYNGLRQSVQRQRLALNEAGLDTKKLSSAQRELRQNADETRQALDRQQKS
                     LKRLGEQQARMNAVRDQYSRRLEVRDRIAGAGATTTAAGVAMGAPVVAAVKSYASMED
                     AMKGVAKQVNGLRDDNGNRTKQFYDMQDAIKAASEQLPMENGAIDYAALVEGGARMGV
                     TNQDDPYEEQKRDLLAFASTAAKAATAFELPADELAEGLGKIAQLYKVPTRNIEQLGD
                     ALNYLDDNAMSKGGDIINVLQRMGGVADRLDFRKAA"
BASE COUNT         1525 a         1463 c         1689 g         1448 t
ORIGIN      
        1 ctgcagcact ggatacgctg aacgagctgg cagcggctct ggggaatgac ccgaattttg
       61 ccacaacgat gttaaacgct cttggtggaa agcagccgct ggacaatacg ctgacgaatt
      121 taagcggaaa agatgtcgcc ggccttctcg catacctctg tttaggagaa acgataaatc
      181 gtgccgccga tgcgctacaa aaatcacaga acggtgcaga cattcctgac aagccgcggt
      241 ttgtacaaaa tatcggttta aaagaaaccc tgaacccgac aaaacgcgtg agtatcggca
      301 atatcggaac cggcgttttt gacggcagca caccgtgtat aaatatcggt gacagtgaca
      361 gtggatttat cggcagcgcg gatggcgtac tggatattta ctgtaacggt gccaaagtgg
      421 gttatatcaa tggtaacgga ttacacatgc tcactgatat tcatttcgat aatgcgcgca
      481 tgaccactaa tggtgacatt tttagttcag tgtgggggga taactggctg agtatctgga
      541 ttactaatca gctaaatacc cgtggaacga ttgactggat caatagtgaa ctggcaattc
      601 gtgacaacaa catcaacacc cgcgccacca ttgattatgt taaccagact ttcgcccgta
      661 aaaataccgg cagcattcag gactggggct ggattctgga cgacagcacc ggatttataa
      721 tgcagtgggg aacacttggt aactcaaacg gaacctacaa tttcccgcgc gctttccctg
      781 ttggttgctt tgccgttttt gtaaccaata ccaacgctca gggcacccag gtggataacg
      841 cattcggata cccggtgagc aacagtcagt tttttgccgc caccaagtca tcagcaatag
      901 ccaatatggt caataatttt cctgtagcct ggtttgcaat tgggagataa atatcaatga
      961 gcgattatta ttacagcttt aaagaaaaag gttttttctg gcaaccggat accgaatccg
     1021 ataattaccc tgacgattta attcccctga cagatgagta ttatcgcgag ctgatgcagg
     1081 gccaggtgga cggaaaatat atcgagcaca ggaaaggagg cccggtactg gttgagcatc
     1141 ggaatatacg cctgaagagc tggttgcaca ggctgaagcc agaaaagcgg aacttcttgc
     1201 tgaggcagag tcagttattg cgccactggc gcgggcggta aaactgaaaa ttgccacaga
     1261 tgaagagatt aaacggctgg aagcatggga actttatagc gtaatggtaa accgggtgga
     1321 tacagctaac ccagactggc cggagaaacc agctcagata taaaaatata gatatgtagt
     1381 agagactgct gctatatgtt atatagcagc aatggctatt tttttgatgg ttgagtgtat
     1441 aattttagca ctggtaaatg acggtttagc tccggagtta gttcctgggg gaaattatgg
     1501 atactattgg ttcatattaa tcaggaagag gctccgcata ttttttggtt tttcagtgtt
     1561 cagggagtgt tttgtatata tttattagca atgttttcta gtatcagttg gaattgctgt
     1621 ggagtcggca tagcacactc attaaacagt ggtgcaactt ctgtcataat gatcttctcc
     1681 gcatagattt taaaggatgc ctgctgatgt tgattgataa acatacgtgg atacttactg
     1741 tttgctgatg aaatcaacgg agttataaaa ggattggccc ctgcgccgct tggcgtaaaa
     1801 acgtcatttt tggttgttcc gggcagacct gcatttttcg ctgcttcgcc aatttcctga
     1861 agaaaaggcg ctatgttgat ccctttgctg atgagcaaat tacaacactg atctttattc
     1921 ttgctgtaaa ctgccgatag tatagcttca cgggtctggc tggcgtatgc ggggtcttta
     1981 ctcgcactac ctctaatatc tatatcattg agcgtttgaa gcataaaatc tttaacgact
     2041 ttatttgtca acactgcccg gccctcagat gcgcttcctc ggtgaaagtg tgttgcagaa
     2101 gactcagtgt tcttatgcga aataaaacgt tccgataatt ttgaccttaa ttcgatgaag
     2161 tgatttttta ctgcgagaat actttttgct aaagaatttt tctcggttga tttttctttt
     2221 agtagtgtgg tttcctgttt ttggattcta aaattctggg gagataaagt tatttttgtc
     2281 acggtaatga tccttttata tgtacataat tcatttatat atagatagca ggaatgcttt
     2341 tattttttat agcaaatgct atgtccatct gattgatgaa ttagaaaaat tcggctgatt
     2401 caattaatgc tacaaatagt actattttta ttttccagaa actttcaaaa aaagtccttt
     2461 tcgctcagga ggagccttgc cgttctggca ttgaaatgga gtgtgagctg atcgttgagc
     2521 gtaccagcgc cgggttggaa gtggtgcgtt caaaaggtcg tattggtggc aggcgtccaa
     2581 agctcacccc ggaacaatgg gagcaggccg gacggttgct tgccgccggt gaaactcgtc
     2641 atcgtgttgg attgcttttt gatgttagca ttccactctt tacaagaaat tccctgtaaa
     2701 tcagtcgcgt tgaaagtggc gatattgtac cagcactgac acatcgtgaa atacgtgcgc
     2761 cgcacgcctg gcaaccagaa cataaggtac ccctgtcaac cggagagact gccttatggc
     2821 tcaggattac caccacgggg tgcgcgttgt tgaaatcaac gagggcaccc gacctattac
     2881 cacgttgagc actgccatcg tgggcatggt ctgcaccggc gatgatgctg atgcgtccgt
     2941 gttccccctc aataagccgg tcctgctgac tgatgtgctc accgccagcg gtaaagcggg
     3001 ggagtccggc acgctggccc gctcgctgga cgcgattgca gatcaggcaa aacccgtgac
     3061 tgtcgttgtg cgtgtggcgc agggcgaaac cgaagcggaa accacctcca atattatcgg
     3121 cggcgtaact tccgacggta agaaaacggg catgaaagcg ctactgtcgg cgcagtcgca
     3181 gctcggtgtc aagccgcgca ttcttggggt gccgggacat gacactcagg ccgttgctac
     3241 tgaactgctg ggcgtggcgc aaagcttgcg cgggtttgcc taccttgctg ctaatggctg
     3301 caaaacggtg gaggaagcta ttgcctatcg cgagaatttc agtcagcgcg agggaatgct
     3361 gatctggcct gacttcatca actttgacac cgtgctgaaa gcagacgcga cggcttacgc
     3421 ctccgcccgt gcgctcggcc tgcgtgccaa aatcgacgag cagatcggct ggcataaaac
     3481 cctgtccaat gtgggtgtaa acggtgtcac cggcatttcc gctgatgtgt tctgggattt
     3541 gcaggacccg gcaaccgatg cgggactgct gaacaaaaat gacgtcacca cattgatccg
     3601 caaagacggc ttccgcttct ggggttcccg ttgtctcagt gacgatccgc tgtttgcttt
     3661 tgagaactac acccgcacgg cgcaggtgct ggctgacact atggcggagg cgcacatgtg
     3721 ggcggtggat ggcgtgctta atccgtcgct ggcccgcgac attattgaag gactacgcgc
     3781 caagatgcgc agtctggtca accagggata cctgattggt ggtgactgct ggctggatga
     3841 gtctgttaac gataaagacg cccttaaagc cgggaaactg accatcgatt atgactacac
     3901 gccggtgcct ccgcttgaaa acctgatgct gcgccagcgc atcaccgatc gttatctggt
     3961 cgattttgcc agccgtgtcg ctgcataagg gggaatcatg gctttaccac gcaagttaaa
     4021 acacctgaac ctgttcaacg acgggaacaa ctggcagggg atcgttgagt ctctgaccct
     4081 gccgaaattt acccgcaagt ttgagaagta tcgcggcggc ggtatgccgg gcgcagtgga
     4141 tgtggacatg gggctggatg acggtgcact ggacacggaa ttttcaatcg gcggtaccga
     4201 gctgctgtta ttcaagcaga tgggcaaggc aaccgttgac ggcatccagc tgcgtttcac
     4261 cggttccatt cagcgtgacg ataccggcga agtgcaggcc gttgagctgg ttgtgcgcgg
     4321 gcgccataaa gaagttgatt ccggcgagtg gaaaaccggc gagagcagca gcaccaaagt
     4381 cagcagtacc aacagctacg cgaagctgac cattaatggt gaagtgctct atgaggtcga
     4441 tctggtcaac atggtagaaa tcgttggcgg cgtggacctg atggaagcac accgtaatgc
     4501 cctcggcctc tgattaacct taacggcgcg ggcagccgcg ccagtatttc attaacagga
     4561 tacgaacatg agcgacaagc tgactgaaaa gaccgtagaa ctggatactc ccatcatgcg
     4621 cggtaaagct gaaattaccg aaattgtgct gcgcaagcct cagtccggtg cactgcgtgg
     4681 cacccgtctg caggccatta tggatatgga cgtgggcgca atgatgactg tgatcccacg
     4741 aatctccacc ccgacgctga ccgcgcagga aatggcagag ctggaccccg ccgatctcac
     4801 cgcgctgtcg gtagaggtgg tgactttttt gttgaagaag tcggtgcttg ccggtttacc
     4861 gacagcctga cgattgatga tcttgtggcg gatatcgaat tcctgcagcc catcgccacc
     4921 atctttcact ggtcgccatc catcactgac gttatgccgc tgactgaggt gttggcgtgg
     4981 cggcataagg caattcagcg aagcggggcc agcgatgagt gacaataacc tgcgtctgca
     5041 ggtgattctt aatgcggttg acaagctcac ccgcccattt cgatccgcgc aggccagctc
     5101 aaaagagctg gctgcagcca ttcagcaaag ccgcgcccgt ctaaaagaat tagatgctca
     5161 ggcgggccgc attgacggtt tccgcaaggc cagcgcgcag ctggcagtca ccggtaacag
     5221 cctgaaagcc gcacgcgaag aagctgcgaa acttgccacg caattctctg ccaccaaccg
     5281 cccgacggcg gcgcaggcac ggttgcttga gcaggcaaaa aaccgcgtta cggagttaca
     5341 gagcaaatat aacggtctac gtcagtcggt gcagcgccag cgtcttgcgc tcaatgaagc
     5401 cgggctggac acgaaaaagc tcagtagtgc gcagcgggaa ctgcggcaga atgccgacga
     5461 aacccggcag gccctggacc ggcagcagaa atcccttaaa cgcctgggcg aacagcaggc
     5521 gcgaatgaac gccgtccgcg atcagtattc acgccgtctt gaggtgcggg atcgcatcgc
     5581 cggggcaggg gctaccacta cggctgcggg ggtggcaatg ggcgcacctg ttgtggcggc
     5641 agttaagagc tacgccagca tggaagatgc catgaaaggc gtggcaaagc aggtaaacgg
     5701 gctgcgggac gataatggca accgcacaaa acagttttat gacatgcagg atgccatcaa
     5761 ggccgccagc gaacagctgc cgatggagaa cggcgctata gactatgccg cgctggttga
     5821 aggtggtgct cgcatggggg tgaccaatca ggacgatcct tacgaagagc agaaacgtga
     5881 cctgctggct tttgcatcca cggcggcaaa agcggcaacg gcctttgagc tgcccgcaga
     5941 tgaactggca gaagggctgg ggaaaatcgc gcagctctat aaagttccga cgcgcaatat
     6001 tgaacaactg ggcgatgcgc tgaactacct ggacgataac gccatgtcaa agggtgggga
     6061 cattatcaac gtcctgcagc gtatgggggg cgtggctgac cgccttgact tccgaaaggc
     6121 cgcgg
//