LOCUS       ALR16554.1               376 aa    PRT              BCT 02-SEP-2016
DEFINITION  Vibrio natriegens NBRC 15636 = ATCC 14048 = DSM 759 flagellin
            protein.
ACCESSION   CP009977-2182
PROTEIN_ID  ALR16554.1
SOURCE      Vibrio natriegens NBRC 15636 = ATCC 14048 = DSM 759
  ORGANISM  Vibrio natriegens NBRC 15636 = ATCC 14048 = DSM 759
            Bacteria; Proteobacteria; Gammaproteobacteria; Vibrionales;
            Vibrionaceae; Vibrio.
REFERENCE   1  (bases 1 to 3248023)
  AUTHORS   Lee,H. and Church,G.M.
  TITLE     Vibrio natriegens genome v1.0
  JOURNAL   Unpublished
REFERENCE   2  (bases 1 to 3248023)
  AUTHORS   Lee,H. and Church,G.M.
  TITLE     Direct Submission
  JOURNAL   Submitted (21-NOV-2014) Genetics, Harvard Medical School, 77 Avenue
            Louis Pasteur, NRB 233, Boston, MA 02115, USA
COMMENT     Annotation was added by the NCBI Prokaryotic Genome Annotation
            Pipeline (released 2013). Information about the Pipeline can be
            found here: http://www.ncbi.nlm.nih.gov/genome/annotation_prok/
            
            ##Genome-Assembly-Data-START##
            Assembly Method        :: RS HGAP v. 3
            Assembly Name          :: Vnat1.0
            Genome Representation  :: Full
            Expected Final Version :: Yes
            Genome Coverage        :: 96.48x
            Sequencing Technology  :: PacBio
            ##Genome-Assembly-Data-END##
            
            ##Genome-Annotation-Data-START##
            Annotation Provider          :: NCBI
            Annotation Date              :: 11/24/2014 10:39:19
            Annotation Pipeline          :: NCBI Prokaryotic Genome Annotation
                                            Pipeline
            Annotation Method            :: Best-placed reference protein set;
                                            GeneMarkS+
            Annotation Software revision :: 2.9 (rev. 452286)
            Features Annotated           :: Gene; CDS; rRNA; tRNA; ncRNA;
                                            repeat_region
            Genes                        :: 4,665
            CDS                          :: 4,459
            Pseudo Genes                 :: 42
            rRNAs                        :: 34 (5S, 16S, 23S)
            tRNAs                        :: 129
            ncRNA                        :: 1
            Frameshifted Genes           :: 10
            ##Genome-Annotation-Data-END##
FEATURES             Qualifiers
     source          /organism="Vibrio natriegens NBRC 15636 = ATCC 14048 = DSM
                     759"
                     /mol_type="genomic DNA"
                     /strain="ATCC 14048"
                     /isolation_source="salt marsh mud"
                     /culture_collection="ATCC:14048"
                     /type_material="type strain of Vibrio natriegens"
                     /db_xref="taxon:1219067"
                     /chromosome="1"
                     /country="USA"
                     /collection_date="27-Feb-2012"
     protein         /locus_tag="PN96_11475"
                     /inference="EXISTENCE: similar to AA
                     sequence:RefSeq:WP_020335860.1"
                     /note="structural flagella protein; Vibrio contains
                     multiple flagellin genes usually localized into two
                     regions on the chromosome, flaAC and flaCEDB in V.
                     cholerae, flaFBA and flaCDE in V. parahaemolyticus; FlaA
                     is sigma 54 dependent and essential for motility in V.
                     cholerae but not in V. parahaemolyticus; Derived by
                     automated computational analysis using gene prediction
                     method: Protein Homology."
                     /transl_table=11
BEGIN
        1 MTLSLHNNTA ALATRRHVAD ASEDFNSSIL KLSSGKKINS AKDDAAGLQI SNRLHVQTRG
       61 LDVAAKNVND GVAIVQTAEG SMREISHILQ DMRDQSLQAA NGAYSIADRQ AIQKNVQALK
      121 DELHSIASSA NFAGTNLLDG TYGKKALQVG SNNETILLEL KDMRSSASSM GGKIFVAQEA
      181 KGADWVVGED GHKLSIDFID KSGNDVSLNI EAKIGDDIEE LATYINGQQE FITASVSGSG
      241 ELQMFVGSDI AEDEICFSGC LAKELNFDNG RKSIVENIDV TSTGGAHEAV AVIDSALNYV
      301 DGHQADMGAL HNRFDRMLSN LTNMHENISA SKGNRTDTDF AKETTEMTRA KILQQSSSSM
      361 LAQARVIPNA ALNLLN
//