LOCUS       BCA68236.1               464 aa    PRT              BCT 06-NOV-2020
DEFINITION  Escherichia coli invasin protein.
ACCESSION   AP022811-1560
PROTEIN_ID  BCA68236.1
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Pseudomonadota; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 5283470)
  AUTHORS   Kimata,K., Lee,K., Watahiki,M., Isobe,J., Ohnishi,M. and Iyoda,S.
  TITLE     Direct Submission
  JOURNAL   Submitted (21-FEB-2020) to the DDBJ/EMBL/GenBank databases.
            Contact:Ken-ichi Lee
            National Institute of Infectious Diseases, Department of
            Bacteriology I; 1-23-1,Toyama, Shinjuku, Tokyo 162-8640, Japan
REFERENCE   2
  AUTHORS   Kimata,K., Lee,K., Watahiki,M., Isobe,J., Ohnishi,M. and Iyoda,S.
  TITLE     Global distribution of epidemic-related Shiga toxin 2 encoding
            phages among enteroaggregative Escherichia coli
  JOURNAL   Sci. Rep. 10, 11738 (2020)
  REMARK    Publication Status: Online-Only
            DOI:10.1038/s41598-020-68462-9
COMMENT     ##Genome-Assembly-Data-START##
            Assembly Method       :: Unicycler v. 0.4.7
            Genome Coverage       :: 117.0X
            Sequencing Technology :: Illumina MiSeq, PacBio RSII
            ##Genome-Assembly-Data-END##
FEATURES             Qualifiers
     source          /collection_date="1999"
                     /db_xref="taxon:562"
                     /host="Homo sapiens"
                     /mol_type="genomic DNA"
                     /organism="Escherichia coli"
                     /strain="JE86-ST02"
     protein         /gene="ychO"
                     /inference="COORDINATES:ab initio
                     prediction:MetaGeneAnnotator"
                     /inference="similar to AA sequence:INSD:ADD56080.1"
                     /locus_tag="JE86ST02C_15600"
                     /note="DFAST-ECOLI:ADD56080.1 invasin [pid:98.3%,
                     q_cov:100.0%, s_cov:97.5%, Eval:2.1e-275]"
                     /note="MGA_1561"
                     /transl_table=11
BEGIN
        1 MSRFVPRIIP FYLLLLVAGG TANAQSTFEQ KAANPFDNNN DGLPDLGMAP ENHDGEKHFA
       61 EIVKDFGETS MNDNGLDTGE QAKAFALGKV RDALSQQVNQ HVESWLSPWG NASVDVKVDN
      121 EGHFTGSRGS WFVPLQDNDR YLTWSQLGLT QQDDGLVSNV GVGQRWARGN WLVGYNTFYD
      181 NLLDENLQRA GFGAEAWGEY LRLSANFYQP FAAWHEQTAT QEQRMARGYD LTARMRMPFY
      241 QHLNTSVSVE QYFGDRVDLF NSGTGYHNPV ALSLGLNYTP VPLVTVTAQH KQGESGENQN
      301 NLGLNLNYRF GVPLKKQLSA GEVAESQSLR GSRYDNPQRN NLPTLEYRQR KTLTVFLATP
      361 PWDLKPGETV PLKLQIRSRY GIRQLIWQGD TQILSLTPGA QANSAEGWTL IMPDWQNGER
      421 ASNHWRLSVV VEDNQGQRVS SNEITLTLVE PFDALSNDEL RWEP
//