LOCUS       BBF49997.1               429 aa    PRT              BCT 27-JUL-2018
DEFINITION  Escherichia coli arylsulfatase protein.
ACCESSION   AP018796-4357
PROTEIN_ID  BBF49997.1
SOURCE      Escherichia coli
  ORGANISM  Escherichia coli
            Bacteria; Pseudomonadota; Gammaproteobacteria; Enterobacterales;
            Enterobacteriaceae; Escherichia.
REFERENCE   1  (bases 1 to 5470440)
  AUTHORS   Kusumoto,M. and Akiba,M.
  TITLE     Direct Submission
  JOURNAL   Submitted (20-JUL-2018) to the DDBJ/EMBL/GenBank databases.
            Contact:Masahiro Kusumoto
            National Institute of Animal Health; Chuzan 2702, Kagoshima,
            Kagoshima 891-0105, Japan
REFERENCE   2
  AUTHORS   Kusumoto,M., Misumi,W., Ogura,Y., Hayashi,T. and Akiba,M.
  TITLE     Genomic analysis of colistin resistant EHEC isolated from cattle
            in Japan.
  JOURNAL   Unpublished (2018)
COMMENT     Annotated using prokka 1.11 from http://www.vicbioinformatics.com.
            Annotated at DFAST https://dfast.nig.ac.jp/
            
            ##Genome-Assembly-Data-START##
            Assembly Method       :: RS HGAP Assembly v. 3.0
            Genome Coverage       :: 143x
            Sequencing Technology :: PacBio RSII
            ##Genome-Assembly-Data-END##
FEATURES             Qualifiers
     source          /collection_date="2001"
                     /country="Japan"
                     /db_xref="taxon:562"
                     /host="Bos taurus"
                     /isolation_source="feces"
                     /mol_type="genomic DNA"
                     /organism="Escherichia coli"
                     /strain="E2855"
     protein         /gene="arsB"
                     /inference="ab initio prediction:Prodigal:2.6"
                     /inference="similar to AA sequence:INSD:ABB63534.1"
                     /locus_tag="E2855_04449"
                     /transl_table=11
BEGIN
        1 MLLAGAIFVL TIVLVIWQPK GLGIGWSATL GAVLALVTGV VHPGDIPVVW NIVWNATAAF
       61 IAVIIISLLL DESGFFEWAA LHVSRWGNGR GRLLFTWIVL LGAAVAALFA NDGAALILTP
      121 IVIAMLLALG FSKGTTLAFV MAAGFIADTA SLPLIVSNLV NIVSADFFGL GFREYASVMV
      181 PVDIAAIVAT LVMLHLYFRK DIPQNYDMAL LKSPAEAIKD PATFKTGWVV LLLLLVGFFV
      241 LEPLGIPVSA IAAVGALILF VVAKRGHAIN TGKVLRGAPW QIVIFSLGMY LVVYGLRNAG
      301 LTEYLSGVLN VLADNGLWAA TLGTGFLTAF LSSIMNNMPT VLVGALSIDG STASGVIKEA
      361 MVYANVIGCD LGPKITPIGS LATLLWLHVL SQKNMTISWG YYFRTGIIMT LPVLFVTLAA
      421 LALRLSFTL
//