LOCUS       BCA76770.1              1285 aa    PRT              BCT 06-NOV-2020
DEFINITION  Escherichia coli serine protease protein.
ACCESSION   AP022815-4800
PROTEIN_ID  BCA76770.1
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Pseudomonadota; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 5327513)
  AUTHORS   Kimata,K., Lee,K., Watahiki,M., Isobe,J., Ohnishi,M. and Iyoda,S.
  TITLE     Direct Submission
  JOURNAL   Submitted (21-FEB-2020) to the DDBJ/EMBL/GenBank databases.
            Contact:Ken-ichi Lee
            National Institute of Infectious Diseases, Department of
            Bacteriology I; 1-23-1,Toyama, Shinjuku, Tokyo 162-8640, Japan
REFERENCE   2
  AUTHORS   Kimata,K., Lee,K., Watahiki,M., Isobe,J., Ohnishi,M. and Iyoda,S.
  TITLE     Global distribution of epidemic-related Shiga toxin 2 encoding
            phages among enteroaggregative Escherichia coli
  JOURNAL   Sci. Rep. 10, 11738 (2020)
  REMARK    Publication Status: Online-Only
            DOI:10.1038/s41598-020-68462-9
COMMENT     ##Genome-Assembly-Data-START##
            Assembly Method       :: Unicycler v. 0.4.7
            Genome Coverage       :: 135.0X
            Sequencing Technology :: Illumina MiSeq, Oxford Nanopore MinION
            ##Genome-Assembly-Data-END##
FEATURES             Qualifiers
     source          /collection_date="2014"
                     /db_xref="taxon:562"
                     /host="Homo sapiens"
                     /mol_type="genomic DNA"
                     /organism="Escherichia coli"
                     /strain="JE86-ST05"
     protein         /EC_number="3.4.21.72"
                     /gene="sigA"
                     /inference="COORDINATES:ab initio
                     prediction:MetaGeneAnnotator"
                     /inference="similar to AA sequence:INSD:AAN44449.1"
                     /locus_tag="JE86ST05C_47990"
                     /note="DFAST-ECOLI:AAN44449.1 serine protease [pid:96.4%,
                     q_cov:100.0%, s_cov:100.0%, Eval:0.0e+00]"
                     /note="MGA_4813"
                     /transl_table=11
BEGIN
        1 MNKIYSLKYS HITGGLVAVS ELTRKVSVGT SRKKVILGII LSSIYGSYGE TAFAAMLDIN
       61 NIWTRDYLDL AQNRGEFRPG ATNVQLMMKD GKIFHFPELP VPDFSAVSNK GATTSIGGAY
      121 SVTATHNGTQ HHAITTQSWD QTAYKASNRV SSGDFSVHRL NKFVVETTGV TESADFSLSP
      181 EDAMKRYGVN YNGKEQIIGF RAGAGTTSTI LNGKQYLFGQ NYNPDLLSAS LFNLDWKNKS
      241 YIYTNRTPFK NSPIFGDSGS GSYLYDKEQQ KWVFHGVTST VGFISSTNIA WTNYALFNND
      301 RVNNLKNNFT NTMQLDGKKQ ELSSIIKDKD LSVSGGGELT LKQDTDLGIG GLIFDKNQTY
      361 KVSGKDKSYK GAGIDIDNNT TVEWNVKGVA GDNLHKIGSG TLDVKTAQGN NLKTGNGTVI
      421 LSAEKAFNKI YMAGGKGTVK INAKDALSES GNGEIYFTRN GGTLDLNGYD QSFQKIAATD
      481 AGTTVTNSNV KQSTLSLTNT DAYMYHGNVS GNISINHIIN TTQKHNNNTN LIFDGSVDIK
      541 NDISVRNAQL TLQGHATEHA IFKEGSNNCL IPLLCQKDYS AAIRDQESTV NKRYNTEYKS
      601 NNQVASFSQP DWESRKFNFR KLNLENATLS IGRDANVKGH IEAKNSQIVL GNKTAYIDMF
      661 SGRNITGEGF GFRQQVHSGD SAGESSFNGS LSAQNSKITV GDKSTVTMTG ALSLINTDLI
      721 INKGATVTAQ GKMYVDKAIE LAGTLTLTGT PTENNKYSPA IYMSDGYNMT EDGATLKAQN
      781 YAWVNGNIKS DKKASILFGV DQDKEDNLDK TTHIPLATGL LGGFDTSYTG GIDAPAASAS
      841 MYNTLWRVNG QSALQSLKTR DSLLLFSNIE NSGFHTVTVN TLDATNTAVI MRADLSQSVN
      901 QSDKLIVKNQ LTGSNNSLSV DIQKVGNNNS GLNVDLITAP KGSNKEIFKA STQAIGFSNM
      961 SPVISTKEDQ EHTTWTLTGY KVAENTASSG AAKSYMSGNY KAFLTEVNNL NKRMGDLRDT
     1021 NGEAGAWARI MSGAGSASGG YSDNYTHVQI GVDKKHELDG LDLFTGLTMT YTDSHASSNA
     1081 FSGKTKSVGA GLYASAIFDS GAYIDLIGKY VHHDNEYSAT FAGLGTKDYS SHSLYAGAEA
     1141 GYRYHVTEDA WIEPQAELVY GAVSGKRFDW QDRGMSVTMK DKDFNPVIGR AGVDVGKSFS
     1201 GKDWKVTARA GVGYQFDLLN NGETVLRDAS GEKRIKGEKD GRMLMNVGLN AEIRDNLRFG
     1261 LEFEKSAFGK YNVDNAVNAS FRYSF
//