LOCUS       BCA70636.1               429 aa    PRT              BCT 06-NOV-2020
DEFINITION  Escherichia coli arylsulfatase protein.
ACCESSION   AP022811-3960
PROTEIN_ID  BCA70636.1
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Pseudomonadota; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 5283470)
  AUTHORS   Kimata,K., Lee,K., Watahiki,M., Isobe,J., Ohnishi,M. and Iyoda,S.
  TITLE     Direct Submission
  JOURNAL   Submitted (21-FEB-2020) to the DDBJ/EMBL/GenBank databases.
            Contact:Ken-ichi Lee
            National Institute of Infectious Diseases, Department of
            Bacteriology I; 1-23-1,Toyama, Shinjuku, Tokyo 162-8640, Japan
REFERENCE   2
  AUTHORS   Kimata,K., Lee,K., Watahiki,M., Isobe,J., Ohnishi,M. and Iyoda,S.
  TITLE     Global distribution of epidemic-related Shiga toxin 2 encoding
            phages among enteroaggregative Escherichia coli
  JOURNAL   Sci. Rep. 10, 11738 (2020)
  REMARK    Publication Status: Online-Only
            DOI:10.1038/s41598-020-68462-9
COMMENT     ##Genome-Assembly-Data-START##
            Assembly Method       :: Unicycler v. 0.4.7
            Genome Coverage       :: 117.0X
            Sequencing Technology :: Illumina MiSeq, PacBio RSII
            ##Genome-Assembly-Data-END##
FEATURES             Qualifiers
     source          /collection_date="1999"
                     /db_xref="taxon:562"
                     /host="Homo sapiens"
                     /mol_type="genomic DNA"
                     /organism="Escherichia coli"
                     /strain="JE86-ST02"
     protein         /gene="arsB"
                     /inference="COORDINATES:ab initio
                     prediction:MetaGeneAnnotator"
                     /inference="similar to AA sequence:INSD:ABB63534.1"
                     /locus_tag="JE86ST02C_39600"
                     /note="DFAST-ECOLI:ABB63534.1 arylsulfatase [pid:94.9%,
                     q_cov:100.0%, s_cov:98.4%, Eval:1.9e-230]"
                     /note="MGA_3967"
                     /transl_table=11
BEGIN
        1 MLLAGAIFVL TIVLVIWQPK GLGIGWSATL GAVLALVTGV VHPGDIPVVW NIVWNATAAF
       61 IAVIIISLLL DESGFFEWAA LHVSRWGNGR GRLLFTWIVL LGAAVAALFA NDGAALILTP
      121 IVIAMLLALG FSKGTTLAFV MAAGFIADTA SLPLIVSNLV NIVSADFFGL GFREYASVMV
      181 PVDIAAIVAT LVMLHLYFRK DIPQNYDMAL LKSPAEAIKD PATFKTGWVV LLLLLVGFFV
      241 LEPLGIPVSA IAAVGALILF VVAKRGHAIN TGKVLRGAPW QIVIFSLGMY LVVYGLRNAG
      301 LTEYLSGVLN VLADNGLWAA TLGTGFLTAF LSSIMNNMPT VLVGALSIDG STASGVIKEA
      361 MVYANVIGCD LGPKITPIGS LATLLWLHVL SQKNMTISWG YYFRTGIIMT LPVLFVTLAA
      421 LALRLSFTL
//