LOCUS       BCA67051.1              1024 aa    PRT              BCT 06-NOV-2020
DEFINITION  Escherichia coli beta-D-galactosidase protein.
ACCESSION   AP022811-375
PROTEIN_ID  BCA67051.1
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Pseudomonadota; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 5283470)
  AUTHORS   Kimata,K., Lee,K., Watahiki,M., Isobe,J., Ohnishi,M. and Iyoda,S.
  TITLE     Direct Submission
  JOURNAL   Submitted (21-FEB-2020) to the DDBJ/EMBL/GenBank databases.
            Contact:Ken-ichi Lee
            National Institute of Infectious Diseases, Deaprtment of
            Bacteriology I; 1-23-1,Toyama, Shinjuku, Tokyo 162-8640, Japan
REFERENCE   2
  AUTHORS   Kimata,K., Lee,K., Watahiki,M., Isobe,J., Ohnishi,M. and Iyoda,S.
  TITLE     Global distribution of epidemic-related Shiga toxin 2 encoding
            phages among enteroaggregative Escherichia coli
  JOURNAL   Sci. Rep. 10, 11738 (2020)
  REMARK    Publication Status: Online-Only
            DOI:10.1038/s41598-020-68462-9
COMMENT     ##Genome-Assembly-Data-START##
            Assembly Method       :: Unicycler v. 0.4.7
            Genome Coverage       :: 117.0X
            Sequencing Technology :: Illumina MiSeq, PacBio RSII
            ##Genome-Assembly-Data-END##
FEATURES             Qualifiers
     source          /collection_date="1999"
                     /db_xref="taxon:562"
                     /host="Homo sapiens"
                     /mol_type="genomic DNA"
                     /organism="Escherichia coli"
                     /strain="JE86-ST02"
     protein         /EC_number="3.2.1.23"
                     /gene="lacZ"
                     /inference="COORDINATES:ab initio
                     prediction:MetaGeneAnnotator"
                     /inference="similar to AA sequence:INSD:EDU66561.1"
                     /locus_tag="JE86ST02C_03750"
                     /note="DFAST-ECOLI:EDU66561.1 beta-D-galactosidase
                     [pid:98.9%, q_cov:99.8%, s_cov:97.5%, Eval:0.0e+00]"
                     /note="MGA_376"
                     /transl_table=11
BEGIN
        1 MTMITDSLAV VLQRRDWENP GVTQLNRLAA HPPFASWRNS EEARTDRPSQ QLRSLNGEWR
       61 FAWFPAPEAV PESWLECDLP EADTVVVPSN WQMHGYDAPI YTNVTYPITV NPPFVPTENP
      121 TGCYSLTFNV DESWLQEGQT RIIFDGVNSA FHLWCNGRWV GYGQDSRLPS EFDLSAFLRA
      181 GENRLAVMVL RWSDGSYLED QDMWRMSGIF RDVSLLHKPT TQISDFHVAT RFNDDFSRAV
      241 LEAEVQMCGE LRDYLRVTVS LWQGETQVAS GTAPFGGEII DERGSYADRV TLRLNVENPK
      301 LWSAEIPNLY RAVVELHTAD GTLIEAEACD VGFREVRIEN GLLLLNGKPL LIRGVNRHEH
      361 HPLHGQVMDE QTMVQDILLM KQNNFNAVRC SHYPNHPLWY TLCDRYGLYV VDEANIETHG
      421 MVPMNRLTDD PRWLPAMSER VTRMVQRDRN HPSVIIWSLG NESGHGANHD ALYRWIKSVD
      481 PSRPVQYEGG GADTTATDII CPMYARVDED QPFPAVPKWS IKKWLSLPGE TRPLILCEYA
      541 HAMGNSLGGF AKYWQAFRQY PRLQGGFVWD WVDQSLIKYD ENGNPWSAYG GDFGDTPNDR
      601 QFCMNGLVFA DRTPHPALTE AKHQQQFFQF RLSGQTIEVT SEYLFRHSDN ELLHWMVALD
      661 GKPLASGEVP LDVAPQGKQL IELPELPQPE SAGQLWLTVR VVQPNATAWS EAGHISAWQQ
      721 WRLAENLSVT LPSASHIIPQ LTTSETDFCI ELGNKRWQFN RQSGLLSQMW IGDKKQLLTP
      781 LRDQFTRAPL DNDIGVSEAT RIDPNAWVER WKATGHYQAE AALLQCTADT LADAVLITTA
      841 HAWQHQGKTL FISRKTYRID GSGQMAITVD VEVASDTPHP ARIGLTCQLA QVAERVNWLG
      901 LGPQENYPDR LTAACFDRWD LPLSDMYTPY VFPSENGLRC GTRELNYGPH QWRGDFQFNI
      961 SRYSQQQLME TSHRHLLHAE EGTWLNIDGF HMGIGGDDSW SPSVSAEFQL SAGRYHYQLV
     1021 WCQK
//