LOCUS       CP053347               22113 bp    DNA     circular BCT 18-MAY-2020
DEFINITION  Sphingomonas sp. AP4-R1 plasmid unnamed1, complete sequence.
ACCESSION   CP053347
VERSION     CP053347.1
DBLINK      BioProject: PRJNA631068
            BioSample: SAMN14851439
KEYWORDS    .
SOURCE      Sphingomonas sp. AP4-R1
  ORGANISM  Sphingomonas sp. AP4-R1
            Bacteria; Proteobacteria; Alphaproteobacteria; Sphingomonadales;
            Sphingomonadaceae; Sphingomonas.
REFERENCE   1  (bases 1 to 22113)
  AUTHORS   Heo,J., Kim,S.-J., Kim,J.-S., Hong,S.-B. and Kwon,S.-W.
  TITLE     Genome sequencing of strain KACC 21605
  JOURNAL   Unpublished
REFERENCE   2  (bases 1 to 22113)
  AUTHORS   Heo,J., Kim,S.-J., Kim,J.-S., Hong,S.-B. and Kwon,S.-W.
  TITLE     Direct Submission
  JOURNAL   Submitted (08-MAY-2020) Agricultural Mircrobiology Division,
            National Institute of Agricultural Sciences, 166
            Nongsaengmyeong-ro, Iseo-myeon, Wanju-gun, Jeollabuk-do 55365,
            South Korea
COMMENT     The annotation was added by the NCBI Prokaryotic Genome Annotation
            Pipeline (PGAP). Information about PGAP can be found here:
            https://www.ncbi.nlm.nih.gov/genome/annotation_prok/
            This genome has a base modification file available.
            
            ##Genome-Assembly-Data-START##
            Assembly Date          :: APR-2020
            Assembly Method        :: RS HGAP Assembly v. 3.0
            Genome Representation  :: Full
            Expected Final Version :: Yes
            Genome Coverage        :: 99.0x
            Sequencing Technology  :: PacBio RSII
            ##Genome-Assembly-Data-END##
            
            ##Genome-Annotation-Data-START##
            Annotation Provider               :: NCBI
            Annotation Date                   :: 05/11/2020 21:04:38
            Annotation Pipeline               :: NCBI Prokaryotic Genome
                                                 Annotation Pipeline (PGAP)
            Annotation Method                 :: Best-placed reference protein
                                                 set; GeneMarkS-2+
            Annotation Software revision      :: 4.11
            Features Annotated                :: Gene; CDS; rRNA; tRNA; ncRNA;
                                                 repeat_region
            Genes (total)                     :: 4,788
            CDSs (total)                      :: 4,729
            Genes (coding)                    :: 4,613
            CDSs (with protein)               :: 4,613
            Genes (RNA)                       :: 59
            rRNAs                             :: 2, 2, 2 (5S, 16S, 23S)
            complete rRNAs                    :: 2, 2, 2 (5S, 16S, 23S)
            tRNAs                             :: 50
            ncRNAs                            :: 3
            Pseudo Genes (total)              :: 116
            CDSs (without protein)            :: 116
            Pseudo Genes (ambiguous residues) :: 0 of 116
            Pseudo Genes (frameshifted)       :: 56 of 116
            Pseudo Genes (incomplete)         :: 58 of 116
            Pseudo Genes (internal stop)      :: 26 of 116
            Pseudo Genes (multiple problems)  :: 22 of 116
            ##Genome-Annotation-Data-END##
FEATURES             Location/Qualifiers
     source          1..22113
                     /organism="Sphingomonas sp. AP4-R1"
                     /mol_type="genomic DNA"
                     /strain="AP4-R1"
                     /host="Malus prunifolia (crab apple)"
                     /culture_collection="KACC:21605"
                     /db_xref="taxon:2735134"
                     /plasmid="unnamed1"
                     /country="South Korea: Naju-si"
                     /collection_date="23-Oct-2019"
                     /collected_by="Jun Heo, Soon-Wo Kwon"
                     /identified_by="Jun Heo, Soon-Wo Kwon"
     gene            join(21562..22113,1..27)
                     /locus_tag="HL653_23815"
     CDS             join(21562..22113,1..27)
                     /locus_tag="HL653_23815"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_018950967.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="recombinase family protein"
                     /protein_id="QJU60966.1"
                     /translation="MLVGYARVSTRDQNPALQLEALRAVGCDKIFTEKASGAQRDRPE
                     LQAALGYLRAGDALVVWKLDRLARSVRQLVETAELLQTREIGLKVITQAIDTTSPSGR
                     LTFHLLAAIAEFERELTLERTHAGLAQARALGRRGGRKPAMGEPEIRRAKAMLSDPSI
                     TVEEVARQLGVQPSTLYRHIPGGRSSLLEHAA"
     gene            24..1487
                     /locus_tag="HL653_23820"
     CDS             24..1487
                     /locus_tag="HL653_23820"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_011911239.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="N-6 DNA methylase"
                     /protein_id="QJU60942.1"
                     /translation="MTVRLSQKEAGAYYTPNMVVAALVSWAVRRDGDRMLDPSCGDGR
                     FLVEHSNSVGIEQDPVSAHVAIDRAPGALVHEGDFFQWAEATAERFECAAGNPPFIRY
                     QTFKGAVRARALAFCSAHGAMFNGLASSWAPFLVATAALLKPGGRMAFVVPAEIGHAP
                     YASPLIEYLVAHFKRVQIVAVREKLFPDLSEDCWLLYAEGFGGKTDHIAFTVCDRFEW
                     STRPPKQAEKVAVGEWRDSWNRRLRPYLLPAAIRDAYRAFADDVGGHRLSSFASVGIG
                     YVSGDNRFFHLRPSEAQRWKIPASHLHPTVRTGRMLAQRAITPTTVAAWQRADEPVML
                     LRLQRGQELSASVRRYLDSSAGQEARQGYKCRNRDPWYAVPDVQVPDFFMSYMSGRSA
                     SLVQNTAGATCTNTVHSVRVRDRALAAKLLPSWGTPLSQLSCELEGHPLGGGMLKLEP
                     REAGRLLFTPPPLAKKVNMPILEEGISIMQRWRHYGG"
     gene            1477..2391
                     /locus_tag="HL653_23825"
     CDS             1477..2391
                     /locus_tag="HL653_23825"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_018099694.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="QJU60943.1"
                     /translation="MAGEVCRWTSQKDALEAFAGFQGKIESAGQIKPLHWYVACRLVL
                     EGGFDPADITPRPPFRIQTRSGKPPLLHYDESKAGGGERTILGGLKTKNVDVVVTRDG
                     LGPVLAVSCKGVTAALRNLTNRLEETVGECTNLHITYPALVLGYLVVLRANRQVDSVL
                     EDALAEAAEAEAIEEKQPGRALTKNDIAMGEGGEPVALVMRFHNALREMTGRRGIRND
                     VSRYEAIGFGMVEMEPSALGTLLDSYPAPESTLRLERFFETLYLRHDERFVTSAPDLA
                     SKTRRLEWASDSPALALPELDYEPRVAS"
     gene            2388..2876
                     /locus_tag="HL653_23830"
     CDS             2388..2876
                     /locus_tag="HL653_23830"
                     /inference="COORDINATES: ab initio
                     prediction:GeneMarkS-2+"
                     /note="Derived by automated computational analysis using
                     gene prediction method: GeneMarkS-2+."
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="QJU60944.1"
                     /translation="MTPVELILARKTHLARLANAKGAAGESHVIATASEWISRPKGAS
                     LKLLLEELARTGIHIKPSSFDAIAVTESVDFGDPLSIRSVLDQMIFIEIKTANQGRVK
                     AGFGGFFFALTENEISAADQLGSRHQVALFNKVTGELLITDIPSILARSRSTTWQVSV
                     QL"
     gene            complement(2957..4243)
                     /locus_tag="HL653_23835"
     CDS             complement(2957..4243)
                     /locus_tag="HL653_23835"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_004152098.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="arsenic transporter"
                     /protein_id="QJU60945.1"
                     /translation="MIAAILIFLLTITLVIWQPKGLGIGWSAIGGAAIALLAGVVSLH
                     DIPVVWHIVWNATATFVAVIIISLLLDEAGFFEWAALHVARWGKGQGRKLFALIVLLG
                     AAVSSLFANDGAALILTPIVIAMLRALGYGDKATLAFVMAAGFIADTASLPLIVSNLV
                     NIVSADFFNIGFGRYAMVMVPVDLASIAATLAMLMLYFRRDIPTAYDVGQLHHPQQAI
                     KDRATFRAGWVVLVMLLAGFFLLEPLGVPVSAVAAVGAILLLVIAARGHVISTGKVLK
                     GAPWQVVIFSLGMYLVVYGLRNAGLTGQISILLDRFAQGGIWGAAIGTGVLTAVLSSI
                     MNNMPTVLVGALSIDGTHATGVVKEAMIYANVIGCDLGPKITPIGSLATLLWLHVLGN
                     KGIKIQWGYYFKVGVAMTFPILLVTLAALAIRLSTT"
     gene            complement(4320..5075)
                     /gene="arsH"
                     /locus_tag="HL653_23840"
     CDS             complement(4320..5075)
                     /gene="arsH"
                     /locus_tag="HL653_23840"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_019368255.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="arsenical resistance protein ArsH"
                     /protein_id="QJU60946.1"
                     /translation="MPLRALADPTDLPNLDRAYAIERPALGLGAGDPAPRILLLYGSL
                     RERSFSRLCVEEAARLLQFFGAETRIFDPSTLPLPDQIAGDDHDAVHELREHSMWSEG
                     HVWCSPERHGQITGVMKTQIDHLPLSMGGMRPTQGRTLAVMQVSAGSQSFNSVNTLRV
                     LGRWMRMFTIPNQSSVAMAYKEFDDAGRMKPSSYYDRIVDVMEELVRITVLMRPHAAQ
                     LVDRYSERKEAGVPIDPAIDHSAIAIAPQPASA"
     gene            complement(5075..5551)
                     /locus_tag="HL653_23845"
     CDS             complement(5075..5551)
                     /locus_tag="HL653_23845"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_018251258.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="GNAT family N-acetyltransferase"
                     /protein_id="QJU60967.1"
                     /translation="MPAHGSEAPSPTRLRATPIGESDFDGLAFFLAGAGLPTADLKEP
                     GRLFYRVDAGDLIGYAGIEGSGPDRLLRSLVVLPDRRRVGLGRVVLELIEDEAASMGV
                     ERLHLLTTTAARFFRTQGYADAARATAPATIAASAEFTKLCPASAAYLVKYLKDAS"
     gene            complement(5532..5963)
                     /gene="arsC"
                     /locus_tag="HL653_23850"
     CDS             complement(5532..5963)
                     /gene="arsC"
                     /locus_tag="HL653_23850"
                     /EC_number="1.20.4.1"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_020810062.1"
                     /note="This arsenate reductase requires both glutathione
                     and glutaredoxin to convert arsenate to arsenite, after
                     which the efflux transporter formed by ArsA and ArsB can
                     extrude the arsenite from the cell, providing resistance;
                     Derived by automated computational analysis using gene
                     prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="arsenate reductase (glutaredoxin)"
                     /protein_id="QJU60947.1"
                     /translation="MSGPVDIVVYHNPECGTSRNTLGLIRNAGIEPHVVEYLKTPPTR
                     ELLVQLIARAGITPRELLREKGTPYAELGLADTSLSDDALLDAMMAHPILINRPLVVS
                     PLGVKLCRPSEAVLDLLPNAQLGAFAKEDGQLVVNDAGARV"
     gene            complement(5960..6487)
                     /locus_tag="HL653_23855"
     CDS             complement(5960..6487)
                     /locus_tag="HL653_23855"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_002713264.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="arsenate reductase ArsC"
                     /protein_id="QJU60948.1"
                     /translation="MSDKVFNVLFLCTGNSARSILAESALNKRGGNFRAFSAGSHPKG
                     TVNPDAIALLERIGYPTEGLHSKGWEAFSEPDSPVMDFVFTVCDDAAGEVCPIWPGHP
                     MTAHWGIEDPSHVEGNEIERERAFVKALRYLENRIDLFTALPIGKLEERVLATKLKDI
                     GRTEGATVERLEDAR"
     gene            complement(6499..6828)
                     /locus_tag="HL653_23860"
     CDS             complement(6499..6828)
                     /locus_tag="HL653_23860"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_008065098.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="helix-turn-helix transcriptional regulator"
                     /protein_id="QJU60949.1"
                     /translation="MIDDDALASLAALAHPTRLATFRLLVRHEPDGLSTGQLVEAAGL
                     TQSTFSTHLAVLVKAGLVTPEKQGRQMIQRANIDALRALMLFLAKDCCQGRAELCEPL
                     LAELTCC"
     gene            7326..7955
                     /locus_tag="HL653_23865"
     CDS             7326..7955
                     /locus_tag="HL653_23865"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_017503386.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="transcription elongation protein SprT"
                     /protein_id="QJU60950.1"
                     /translation="MIHDNREAWLNAVALGMAPLFEGLGAPLPGRIRVAIGFTSAGRK
                     GKAIGECWDNRRSADGHFEIFIRPDLAHAPDAMPVQIAAILAHELVHAAVGIAAGHGK
                     LFKRVAIGLGLVGPMRATTPGEGFVALAAPILDGVGPLPHARLDTDGQTTAPKKQTTR
                     LLKCECETCGYTARIARKWLELAGAPLCPVPDHGPMRHDPLDDPDEEDV"
     gene            8020..8703
                     /locus_tag="HL653_23870"
     CDS             8020..8703
                     /locus_tag="HL653_23870"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_010189084.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="ParA family protein"
                     /protein_id="QJU60951.1"
                     /translation="MKTISIISQKGGAGKTTLAIHLAAAGVEAGLSTLILDADPQATA
                     SQWSQWRGGSDPEVVDCASPTLLARKVQQAADLGADLVIIDTPPHADIMAREACKLAD
                     LILIPCRPQAFDLSAVETTADLVKAAGKPAFVLFMGGPQRAPATYKDARELIEGSEGV
                     AGMGVPVAPVMLTQRAIYHHSTAQGKAANESEPEGKAAEEVAALWTWIREHVNLSTRK
                     PTRGKRSAA"
     gene            8700..8978
                     /locus_tag="HL653_23875"
     CDS             8700..8978
                     /locus_tag="HL653_23875"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_010189082.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="QJU60952.1"
                     /translation="MSRFGAMKQQRVEKARATEAAPAAEPDPGDGTPSPRAVARQGKK
                     AVSAYFSPEVSRGLNVLAAENGTTLQALLGEAIDLLMRQHGKHPFGER"
     gene            complement(9041..9223)
                     /locus_tag="HL653_23880"
     CDS             complement(9041..9223)
                     /locus_tag="HL653_23880"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_006954994.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="QJU60953.1"
                     /translation="MDRALLSSIILAAPAWARVGLTMRDAQMRERAADALAATIVERL
                     EEPPALPDRNQLCLPI"
     gene            complement(9337..10212)
                     /locus_tag="HL653_23885"
     CDS             complement(9337..10212)
                     /locus_tag="HL653_23885"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_010165325.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="replication initiation protein"
                     /protein_id="QJU60954.1"
                     /translation="MSQTAVADPSIRTIAQKGRGNPFDPANYGEIVKPGELVDIVELT
                     PLTLADRRIYNLLIANAWDRIDEPIIHRIAKTVLKGTHQGNERVESSLLRLMGTIAIV
                     TIRKGGKAFRRRVQLLGPSDESLEKDGFLHYRIPEELIEILRNSEVYARLKTQVMYCF
                     ESKYALCLYEMIERRIGLDYKQNEEFTIEEIRGLLNVPEGKLERFADLNKYCLKVAQD
                     EINKLCPFYVDFKPIKNGRKVERVALYWFPKTSSGKRDAQSLIEQHSVVRRAKLRGLA
                     AELPVLVDFGLAAER"
     gene            complement(10844..12505)
                     /locus_tag="HL653_23890"
     CDS             complement(10844..12505)
                     /locus_tag="HL653_23890"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_019086529.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="type IV secretory system conjugative DNA
                     transfer family protein"
                     /protein_id="QJU60955.1"
                     /translation="MIWVRLTGRAFRNMLRWVARDPLSAVHAILFSPMRVLKHLIGVV
                     VIFLVATLVLSSASTSLLYFAKVRDGSPIGSIVQIGTMLILVGLLFRALVKPMVMRFG
                     FEGGDSDTHGSARFATRDETRALDRTDGLLIGRDLKTKRLMRYAGPAHLLTIAPTRSG
                     KGVGTIIPNLLEYPFGLVCIDPKGENARIAARQRSRFGPVHILDPFGITGVVGAAAYN
                     PLDRIDPQGLDHADDCMTLADALVHDAHNEMSEAHWNEEAKALIAGLLLHIVETEPLA
                     TRTLATLRDRLTLAPAAFEKLLNDMQAQGGLVARAANRHLGKSDREAAGVLSSAQRHT
                     HFLDSPRMTAALGRSDFAFADIKSAPATIFLVLPPDRLDTYARWLRLMIAQALTELAR
                     VPGKAPWPVLFLLDEFAALGHLEPVERAMGLMAGYGIQLWPILQDIHQLRALYGQRAG
                     TFLSNAGVLQIFGVNDQQSAQLVSDLLGQETVVFETVSRAIDAEESGLSFTQHHTARA
                     LLTPDEVRTLKPDRQLLFLAGQRPIIATKLRYYADREFAGRFDQA"
     gene            complement(12507..12920)
                     /locus_tag="HL653_23895"
     CDS             complement(12507..12920)
                     /locus_tag="HL653_23895"
                     /inference="COORDINATES: ab initio
                     prediction:GeneMarkS-2+"
                     /note="Derived by automated computational analysis using
                     gene prediction method: GeneMarkS-2+."
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="QJU60956.1"
                     /translation="MSTDLGEWMMWGHAAASITFNDPVWAAQSYEMDRGERQRNDYDP
                     PLPRHFVDALRERQRRLNGLADRMAAEGRNDVPPESEPDAWACPQVPPFNQGRPVAGG
                     IRWVPAALMAEYRSLYLTPLPTSGDARREVTSGEA"
     gene            complement(12917..13144)
                     /locus_tag="HL653_23900"
     CDS             complement(12917..13144)
                     /locus_tag="HL653_23900"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_017501678.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="conjugal transfer protein TraD"
                     /protein_id="QJU60957.1"
                     /translation="MERRTRTRHLIELGGLVQKAGLVDLADDDRATLYGAMLDLVAKA
                     RSDDAGDLLALWKRRGKRAFDAEAETKEDRV"
     gene            complement(13182..13490)
                     /locus_tag="HL653_23905"
     CDS             complement(13182..13490)
                     /locus_tag="HL653_23905"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_015460622.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="conjugal transfer protein TraD"
                     /protein_id="QJU60958.1"
                     /translation="MRKVRDYDAELKALNDKARALKAQKIQQLGELVAATGADALDTG
                     TLVGGLLHILKEAKAPAVQEAWRSDGAAFFQRRGRKASGSSGSDGQGAGAGRASDAQS
                     "
     gene            13661..16708
                     /gene="traA"
                     /locus_tag="HL653_23910"
     CDS             13661..16708
                     /gene="traA"
                     /locus_tag="HL653_23910"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_020817746.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="Ti-type conjugative transfer relaxase TraA"
                     /protein_id="QJU60959.1"
                     /translation="MAIYHFSAKVISRANGSSAVASAAYRAAERLSDERIGRDHDFSN
                     KAGVVHSEVMLPEGAPAHLADRETLWNAVEAGEKRKDAQLAREVEFSIPREMNQEQGV
                     ALARDFVQEQFVDRGMIADLNVHWDHAEDGSPKPHAHVMLSMREVGPDGFGAKVREWN
                     ATQLLQEWREAWADHVNERLSELDIDARIDHRTLEAQGIDLEPQHKIGPAGMRRLDRG
                     EDAERADDHRRIARENGAKIIAEPGVALDAITRMQATFTTRDLAMFAHRHSDGKEQFD
                     QVMGAVRASPELVALGQDGKGQDRFTSREMIAIEQRLERAGDSLAATDGHFVAAPHVY
                     RALEAAEGRGLSLSAEQRDALGRITERDGLASVVGYAGTGKSAMLGVAREAWEDAGYT
                     VRGAALSGIAAENLEGGSGIASRTIASLEYQWAQGREQLGPRDVLVIDEAGMIGTRQM
                     ERVLSAADQAGAKVVLVGDPEQLQAIEAGAAFRSIAEQHGAVEITAIRRQHEDWQRDA
                     TKALATGRTAEAVQSYEQHGMVQAADTRDGARGELVDQWDSQRIADRDQTRIILTHTN
                     AEVRDLNLAARDRLRASGELGEDVSVSAERGARDFADGDRIMFLKNERGLGVKNGSLG
                     TVERVSPTSMAVRLDDGRDVAFDLKDYAHVDHGYAATIHKSQGVTVDRAHVLATPGMD
                     RHSAYVALSRHRDGVQLHYGRDDFDDQRSLVRTLSRERTKDMAADYGRDPAEGVRAFA
                     DRRGLAGEQWSAKARTGVEISGAEMPAAGVGGADPAAVDPSGTSLRAFEDQKRGVFRP
                     DVAATTGDTAGRKRSMFDGLKLGGSPTPTPAKARNLVSDQGLAGAVERVSRSAVTMME
                     ARAQGRPVLEHQRIALEKAQAALDQIRPQASRDLASVLERNPGLIRDAAQGASGPAIQ
                     AMAHETRVRADPQLRADRFVENWQGIQRQRGQAEGRGDQAGVDRSTKALERMAKGLER
                     DPQMESVLRNRRPELGLQRDMGRELSRDLTQALSRGREQGLGR"
     gene            16719..17426
                     /locus_tag="HL653_23915"
     CDS             16719..17426
                     /locus_tag="HL653_23915"
                     /inference="COORDINATES: similar to AA
                     sequence:RefSeq:WP_008831345.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="QJU60960.1"
                     /translation="MDEDGYRDEDGAGDDPAAAFERLRGEVSLLRLAVGSLATARETI
                     EIPDYEPTLARTERILTVLTEQLEPIVESPMLAMTPPKMANEIVSAALQARREDQRLL
                     TEGRAALDQATRDMRQMVASARTGEEQNRWIFLYGIGGLVVGIVVWAVFAGIVARAMP
                     ASWHWPERMAARTLDTDMWDAGQRLASVANPDGWRGIVAGDAIVRANHDAIEACRKSA
                     AKAKKAVRCAIDVKAGE"
     gene            17429..17785
                     /locus_tag="HL653_23920"
     CDS             17429..17785
                     /locus_tag="HL653_23920"
                     /inference="COORDINATES: ab initio
                     prediction:GeneMarkS-2+"
                     /note="Derived by automated computational analysis using
                     gene prediction method: GeneMarkS-2+."
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="QJU60961.1"
                     /translation="MDAVTDPDGRAIVALLDQAIHAEARTDAPPEAEQRDWLYGGVDP
                     TTYTEPDAHGWMGIVPPSTVGWVPRALVFWHTVLASGGSISREQMRQPAHSLSRWPTI
                     EIAVGDYLTASPWLIA"
     gene            17961..18104
                     /locus_tag="HL653_23925"
     CDS             17961..18104
                     /locus_tag="HL653_23925"
                     /inference="COORDINATES: ab initio
                     prediction:GeneMarkS-2+"
                     /note="Derived by automated computational analysis using
                     gene prediction method: GeneMarkS-2+."
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="QJU60962.1"
                     /translation="MKSLSLPGGGVSGLLIMAGHPAWGAIVATLSIAMPFVADIIRAS
                     KGR"
     gene            18129..18716
                     /locus_tag="HL653_23930"
     CDS             18129..18716
                     /locus_tag="HL653_23930"
                     /inference="COORDINATES: ab initio
                     prediction:GeneMarkS-2+"
                     /note="Derived by automated computational analysis using
                     gene prediction method: GeneMarkS-2+."
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="QJU60963.1"
                     /translation="MGKEPIDTTPASAEVVARVQTISDKKALKRHFSAMFKQGQPHYA
                     DFYDIDAEPWNLWPGMVSDFVEGWEPITFDDGRKPAAIAMALTLSMSAGTDAVGNQGA
                     ALALARREFGDREHVWVAGDHNGPFVKFLVQYRNEEGRPLSPGPSDLRRYRETYAEEL
                     CARDITARATTRGSRGLGFSEGRLALKARRRLSGS"
     gene            complement(18792..19085)
                     /locus_tag="HL653_23935"
     CDS             complement(18792..19085)
                     /locus_tag="HL653_23935"
                     /inference="COORDINATES: ab initio
                     prediction:GeneMarkS-2+"
                     /note="Derived by automated computational analysis using
                     gene prediction method: GeneMarkS-2+."
                     /codon_start=1
                     /transl_table=11
                     /product="hypothetical protein"
                     /protein_id="QJU60964.1"
                     /translation="MHGGLSTSGFECPDICWRARVLVLWVAAEPASEPTRQQETELCA
                     SLLGLAIGFAVIDRDELVEGAANEIRDACRMVQICRWLPSDLHALTVLTSVHD"
     gene            19605..21320
                     /locus_tag="HL653_23940"
     CDS             19605..21320
                     /locus_tag="HL653_23940"
                     /inference="COORDINATES: protein motif:HMM:NF012307.1"
                     /note="Derived by automated computational analysis using
                     gene prediction method: Protein Homology."
                     /codon_start=1
                     /transl_table=11
                     /product="RNA-directed DNA polymerase"
                     /protein_id="QJU60965.1"
                     /translation="MLDDLKSCTSRSGLAVLLGVKPSELSYTLYKIPDAAKYTSFCIS
                     KKSGGTRQIQAPCPPLKWLQGRLLDLLYQCEDDISAASGLKRNLHSGFRRGVNIYENA
                     NAHRGKRFVFNIDIESFFDQYNFGRVRAFFINDRDFALQPAVATTIAQIVCFNNVLPQ
                     GSPTSPHIANLLTQFFDNRMARFLRPRRCGYTRYADDITISTNVREFPADVAIMTPAD
                     PQGWSIAPELAAIFGRANLPPNPSKTRMSAYSSRQTVTGLVVNQRPNVTREYYLHTRA
                     MCDRLFKTGTIQIPDITSSYGKNCPVSDDAEPEADVDPLKVLEGRLSHIHHIREKSDL
                     RNIQEKQDNPTQFWNMLQDFFLFKYFVANSKPLILTEGPSDIFYLRSAIINNTTLLVP
                     ELKKVVSGKPEILPTFFRFNTVAAKVIGLTGGAGNIKRFLYLYHKQEKRFNRSLRHKP
                     VIIIIDNDSGGADVINMVNGIYKTNISLSDPIMAHKITDGLILVKTPHVGSKTHTAIE
                     DLLPASVKAVKLNGKSFSAAKKFDATKHFGKIALGSYVQANASSISFQGFDDFIVAIN
                     GAITM"
BASE COUNT         4435 a         6472 c         7057 g         4149 t
ORIGIN      
        1 agctcgctgc tcgagcacgc ggcatgactg tccgtctctc ccagaaggaa gcaggggcgt
       61 attacacgcc caacatggtc gtggccgccc tggtaagctg ggcggtgcgt agggatgggg
      121 atcggatgct cgatccaagt tgcggcgatg gtcgctttct agtcgaacac tcgaacagtg
      181 ttggcatcga gcaagatcca gtttccgctc acgtcgcaat tgatcgtgcg cctggcgctc
      241 tcgtccacga aggcgacttt ttccagtggg ccgaggcaac cgccgaacgg ttcgagtgtg
      301 ccgctggcaa cccacccttc attcgttatc agaccttcaa aggcgcggtt cgggctcgag
      361 cgctggcttt ttgcagcgct cacggtgcga tgttcaacgg gctcgcgtct tcgtgggccc
      421 ccttcctcgt tgcgacggcg gcgctgctta aaccaggcgg ccgtatggcg ttcgttgtgc
      481 cggccgagat tggacatgcg ccttatgcct cgccgctgat cgagtacctt gtggcccact
      541 ttaagcgggt gcagatcgtc gcggttcgcg aaaagctgtt tccagacctc tccgaagatt
      601 gttggcttct gtatgcggaa ggctttggcg gtaagacgga ccatatcgcg ttcaccgtct
      661 gcgatcggtt cgaatggagc acgcggcccc ctaaacaggc tgaaaaggtg gccgtcggtg
      721 agtggcggga tagctggaac cggcgattgc ggccgtatct gttgcccgcc gcaattcgcg
      781 atgcgtaccg tgcattcgcg gatgatgtgg gcggccatcg actaagcagc ttcgccagcg
      841 tcggtattgg ctacgtgagt ggcgacaaca gattcttcca cctccgtcct tcagaggcgc
      901 agcgttggaa aataccggca tctcatttgc atcctacggt gcgaacaggg cggatgctcg
      961 cccaacgagc cattacgcct actacggttg cagcatggca gagggccgac gagcccgtga
     1021 tgctgcttcg tctccaacgc gggcaggaac tgtcggcatc ggttcgtcgc tatcttgata
     1081 gcagcgccgg ccaagaggcg cgccagggct ataaatgccg taatcgtgat ccatggtacg
     1141 ctgtcccaga cgtgcaggtg ccggatttct ttatgagcta catgtcggga cgcagtgcga
     1201 gcctggttca aaacacggcg ggtgccacct gcacgaacac agtccatagc gttcgtgtcc
     1261 gtgatcgagc gctcgcggcc aaattgctgc cgagctgggg gacgcctttg tcgcagctta
     1321 gctgcgaact cgaaggacac ccgctgggcg gcggcatgtt gaagctagag ccgagagagg
     1381 cgggacgctt gctatttacg ccccctcccc tagccaaaaa ggtgaacatg ccaatccttg
     1441 aagaggggat ctcgatcatg cagcgttggc gccattatgg cgggtgaagt ttgtcgctgg
     1501 actagccaga aagacgcgct ggaggccttc gccggttttc agggaaagat cgagagtgca
     1561 ggccagatta aaccgctaca ttggtatgta gcctgccgcc ttgtcttgga gggtgggttt
     1621 gatccagccg acatcacgcc acgccctcct tttcgcatcc aaacgagatc cggaaagccg
     1681 cctcttctcc actatgatga gagtaaagct ggcggcggcg agcgcactat cttgggtggc
     1741 ctcaagacaa aaaatgtgga cgttgtcgta acccgtgatg ggctcggccc cgtgctggcg
     1801 gtatcctgta agggcgtgac tgcagcgctt cgaaacttga ccaatcggct tgaagagaca
     1861 gttggcgaat gcactaattt acacatcacc tacccggctc ttgtgctcgg ttacctggtt
     1921 gtgttgcgcg ccaatcggca agtcgattcc gttctagagg acgcattggc ggaagcagca
     1981 gaagccgaag caatcgagga aaagcagccc ggccgagcgc tgaccaaaaa cgatattgct
     2041 atgggtgaag gtggcgaacc cgttgcgctg gttatgcggt ttcacaatgc tttgcgggag
     2101 atgaccggcc gacgaggcat tcggaacgat gtcagtcgct atgaagcaat cggctttggt
     2161 atggtcgaga tggagccgag tgctcttggc accttgctcg acagctatcc ggcgccggaa
     2221 agtacgcttc ggctggagcg gttcttcgag acgctctacc tgcgacatga cgagcgtttc
     2281 gttaccagcg caccggacct ggcgagcaag acccgccggc tcgaatgggc atcggattcc
     2341 cctgcgctcg ctcttcctga gctggattac gagccgcgcg tggcgtcgtg acgcctgtcg
     2401 agctgatcct ggccagaaag acgcatctgg ccaggcttgc gaatgcaaaa ggtgcggcgg
     2461 gagagtcgca tgtcattgcc acagcctcag aatggatatc gaggccgaaa ggtgcgtcac
     2521 taaagctact tctagaggag ctggctcgta ctggcattca catcaagcca tctagtttcg
     2581 atgctatcgc agtgactgag agcgtcgatt ttggagaccc gctcagcata cgatcagttc
     2641 tcgaccagat gatcttcatc gagatcaaaa cagccaacca gggccgggtg aaggccggtt
     2701 ttggcgggtt cttttttgcg ctcaccgaaa acgagatatc ggccgctgac cagcttggta
     2761 gccggcatca agtagcgttg ttcaataagg tgacgggaga gctgttgatc acggatatcc
     2821 cgagcatttt agcgcgatcg aggtccacga cgtggcaggt atccgtccag ctctgacgac
     2881 cgccctagca tatatcggtg tgcgtgtcag catgtgaaca tgtccacgtg tgatgagcgc
     2941 gctaatatct gtcggttcat gtggtgctga gccggatcgc cagcgcggcc agggtgacga
     3001 gcagaatcgg gaaggtcatc gccacgccga ccttgaagta atagccccat tggatcttga
     3061 tgcccttgtt gccgaggacg tgcagccaga gcagcgtcgc cagagagccg atcggggtga
     3121 tcttgggtcc gagatcacag ccgatcacat tggcgtagat catcgcttcc ttgacgacgc
     3181 cggtcgcatg ggtgccgtcg atcgagagcg cgccgacaag cacggtcggc atgttgttca
     3241 tgatcgagga aagcacggcg gtcagcacgc cggttccgat cgcagcaccc cagatgccac
     3301 cttgtgcgaa gcgatcgagc aggattgaga tttgcccggt caggcccgca tttcgcaggc
     3361 catagacgac caggtacatg ccgagcgaga agatcacgac ctgccacggc gcgcccttca
     3421 gcaccttgcc ggtgctgatg acgtgaccgc gcgcggcgat caccagcagc aggatcgcgc
     3481 cgacagcggc gaccgcactg accggcacgc ccagcggctc caacaggaag aagcccgcca
     3541 gcagcatcac gagcaccacc cagcccgccc gaaaggtcgc acgatccttg atcgcttgtt
     3601 ggggatggtg gagctggccg acgtcgtagg ccgtggggat gtcgcggcgg aaatagagca
     3661 tcagcatggc gagcgtggcc gcgatcgagg cgagatcgac cgggaccatc accatcgcat
     3721 atcggccgaa gccgatgttg aagaagtcgg ccgacacgat gttgacgaga ttcgagacga
     3781 tcagcggcag gctcgcggtg tcggcgatga agcctgcggc catgacgaag gcgagcgtgg
     3841 ctttgtcgcc atagccgagc gcgcgcagca tcgcgatcac gatcggggtc aggatgagcg
     3901 ctgcgccgtc attagcgaac agtgacgata ccgccgcacc gagcagcacg atcagcgcga
     3961 agagcttgcg gccctggccc ttgccccagc gtgcgacgtg cagcgccgcc cactcgaaaa
     4021 agccggcctc gtcgagcagc aggctgatga tgatgaccgc cacgaacgtg gcggtcgcgt
     4081 tccagacgat gtgccagacg accgggatat catggagcga taccacgccc gccagcaacg
     4141 cgatcgcggc gcccccgatc gcgctccagc caatgccgag ccccttgggt tgccaaataa
     4201 cgagggtgat cgtcagcagg aagatcagga tcgcagcgat catcaggaca tctttctcgg
     4261 ggcctcagat cgaggccgga cggataggag cagccaccag tctgagccgc tggcttgcgt
     4321 cacgcgcttg cgggctgcgg tgctatggcg attgccgaat ggtcgattgc cggatcgatc
     4381 ggcacgccgg cttccttgcg ctccgaatag cgatcgacga gctgggcggc gtggggccgc
     4441 atcaacacgg tgatacggac cagctcctcc atcacatcga cgatgcgatc ataatagctc
     4501 gacggcttca tgcggcccgc atcgtcgaac tccttgtacg ccatcgcgac cgacgactgg
     4561 ttggggatgg tgaacatccg catccagcga ccgaggacgc gcagtgtgtt gacgctgttg
     4621 aacgactgcg atccggctga cacctgcatc accgcgagcg tgcggccttg cgtcggccgc
     4681 atcccaccca tcgacagcgg cagatgatcg atctgtgtct tcatgacgcc ggtgatctgg
     4741 ccgtgccgct ccgggctgca ccagacatga ccctcgctcc acatcgaatg ctcgcgcagc
     4801 tcatgcacgg catcgtgatc gtcgccggcg atttggtcgg gcagcggcaa tgtcgaggga
     4861 tcgaatatcc gcgtctcggc gccgaaaaat tggagcaggc gcgccgcttc ctcgacgcag
     4921 agccgcgaaa aggagcgttc tcgcaaagat ccgtagagca gcaggatgcg gggcgccgga
     4981 tcgcccgcgc caagaccaag agcgggacgc tcgatcgcat aggcgcgatc gaggttcgga
     5041 aggtcggtcg gatcggcaag cgcacgcagg ggcatcagga agcgtctttc aggtatttga
     5101 cgagataggc ggcgctggcc ggacacagct tggtgaactc ggccgaggcc gcgatcgtgg
     5161 ccggcgccgt ggcgcgggcc gcgtcggcat agccctgcgt ccggaagaag cgcgcggcgg
     5221 tcgtggtcag caggtgcaac cgctcgaccc ccatgcttgc agcttcgtcc tcgatcagtt
     5281 cgagcacgac gcggcccaag ccgacacgac ggcgatcggg cagcaccacc agcgagcgaa
     5341 gcagtcggtc cggacccgaa ccttcgatcc cggcatagcc aatgagatcg ccagcatcga
     5401 cgcggtagaa gagccggccc ggctccttca gatcggcggt cggcagtccg gcgccggcca
     5461 ggaagaaggc gagcccatca aagtcggatt cgccgatcgg cgtcgcgcgc agccgcgtcg
     5521 ggctcggcgc ctcagacccg tgcgccggca tcattgacga ccaactggcc gtcctctttg
     5581 gcgaaggcac cgagctgcgc gttgggcagg agatctagca cggcctcgga agggcggcac
     5641 agcttcacgc caagcggcga gacgaccagc gggcggttaa tcaggatcgg atgcgccatc
     5701 atcgcatcaa gcagcgcgtc gtccgacagc gatgtgtcgg cgaggcccaa ttccgcatag
     5761 ggcgtgccct tctcgcgcag cagctcgcgc ggggtgatcc cagcgcgcgc gatcaactgg
     5821 accagcagct cgcgcgtggg cggcgtcttg agatattcga cgacgtgcgg ctcgatgcca
     5881 gcattgcgga tcagcccgag cgtgttgcgg gacgtgccgc attcggggtt gtgatagacg
     5941 acgatatcga cgggaccgct catcgggcgt cctccagacg ctcgacggtc gcgccctcgg
     6001 tgcggccgat gtccttcagc ttggtagcaa gcacacgctc ttcgagctta ccgatcggga
     6061 gcgcggtgaa cagatcaatc cggttttcga gatagcgcag ggccttcacg aaagcgcgct
     6121 cgcgctcgat ctcgttgcct tcgacatgcg agggatcttc gataccccaa tgggccgtca
     6181 tcgggtgtcc gggccaaatc ggacagactt cgcccgctgc gtcgtcgcaa acggtgaaca
     6241 cgaaatccat caccggggag tccggctctg aaaaggcttc ccagcctttg gagtgcagcc
     6301 cctcggtcgg atagccaatc cgctccagga gcgcgatggc atcgggattg accgtgccct
     6361 tggggtggct cccggccgag aaggcgcgga aattaccgcc gcgcttgttg agcgcacttt
     6421 cggcgaggat cgaacgggca gaattgcccg tgcagaggaa caggacattg aacaccttgt
     6481 cggacatggc gggctccatc agcagcaggt gagttcggca agcagcggct cgcaaagttc
     6541 agcacggccc tggcaacagt ctttggcgag gaagagcatg agggcgcgca gcgcgtcgat
     6601 attggcgcgc tggatcatct ggcggccctg cttttcaggc gtgaccagcc ccgccttcac
     6661 cagcaccgcg agatgggtcg agaaggtgct ttgcgtcagc ccggccgcct cgacgagctg
     6721 gcccgtggac aggccatcag gttcatgccg cacaagaagg cggaatgtcg cgagcctggt
     6781 cggatgcgcg agggcggcaa gcgaggcgag agcgtcatca tcgatcatat atcgggaata
     6841 aacgatgcgt tcgataccgt caataaccta tcggatattt ccgttggatt tggttgctcc
     6901 gaagacatgt ccacacgcga acatgtggac atgttggaca gaggtgatcg cctggcgatg
     6961 agcttgtgag cagtggtcgg gcgcgtccta gcggaccacg ctctatcttc gcgttccgct
     7021 ccgacagagc cgcgtggacg cgtctccgcc ccttcggggt gacgatcgtt cgcgcaggcg
     7081 agcgccgctc gcgatgaggc tgccggcaat gccggcaacg atatcttgtc agaggggaaa
     7141 ggggcgctcc gccccctctc cccagcaacg acaatccacc gggccgtggc tcagtcgcta
     7201 gcgctccctg cgcccgcacc accccgatgg attctcgctg cccccctcgc ccccggctgt
     7261 tcgccacgag gcagggccga tggccgaggc catcgccctg acggccgatg cgaaggagaa
     7321 gaacgatgat ccatgataac cgcgaggcgt ggctgaacgc ggtcgcgctg ggcatggcgc
     7381 ccttgttcga ggggttggga gcccccctcc ccggccgcat ccgggtggcg atcggcttca
     7441 ccagcgcagg ccggaaaggc aaggcgatcg gggaatgctg ggataaccgt cgcagcgctg
     7501 acgggcattt cgagatcttt atccggcctg acctcgcgca cgcgcccgat gccatgccgg
     7561 tgcagatcgc cgcgatcctc gcgcatgagc ttgtccatgc cgctgtcggc atcgcggccg
     7621 ggcatgggaa gctgtttaaa cgtgtcgcca tcggcttggg gctcgtcggg ccgatgcgtg
     7681 cgacgacacc cggagagggc ttcgtcgcgc ttgcggcccc gatcctcgat ggcgttggtc
     7741 ccctccccca tgcgcgcctc gatacggatg gacagaccac cgcgcctaag aagcagacca
     7801 ccagactgct caaatgcgaa tgtgaaacct gcggctatac ggctcggatc gcgcgcaaat
     7861 ggctggagct tgccggcgcg ccgctgtgtc ccgtgccaga ccacggaccc atgcgacatg
     7921 atccgctgga cgatccggac gaggaggacg tatagatgcg gacacgtcca cctgtcaggc
     7981 atccaacatg ttcacacgcg aacacgtggg ggagttaaca tgaaaaccat ctcgatcatc
     8041 agccagaagg gcggcgccgg gaagaccacc ctcgccattc acctggccgc agcgggcgtg
     8101 gaggccgggc tttcgacgct aatcctcgac gccgaccccc aggcgaccgc cagccagtgg
     8161 agccagtggc ggggaggatc ggaccccgaa gtcgtggact gcgcctcccc gacccttctt
     8221 gcccgcaagg tgcagcaagc ggccgacctc ggcgcggatc ttgttatcat cgacacacca
     8281 ccgcacgccg acatcatggc gcgcgaggcc tgcaagctcg ccgatctgat tctcatcccg
     8341 tgtcgcccgc aggccttcga tctctcggcc gtcgaaacga cggccgatct ggtcaaggct
     8401 gcaggcaagc cggcgttcgt cctgttcatg ggcggtccgc agcgggcgcc ggcaacctat
     8461 aaggacgctc gcgagctgat cgaggggagt gaaggcgtcg ccggcatggg cgtgccggtc
     8521 gctccggtca tgctcaccca gcgcgcgatc taccatcaca gcacggcgca ggggaaagcc
     8581 gccaacgaga gcgagcccga aggcaaggcg gccgaagagg tcgccgccct ctggacgtgg
     8641 atacgcgaac atgtgaacct gtccacacgt aaaccaacgc gaggcaagcg gagcgcggca
     8701 tgagcagatt cggtgcgatg aagcagcagc gggtagaaaa ggcccgcgct acggaagccg
     8761 ctcctgcggc ggagcctgat cccggcgatg ggacgccatc gccgcgcgcg gtggctcgcc
     8821 agggcaagaa ggcggtgagc gcctatttca gcccggaggt cagccgaggc ctcaacgtgc
     8881 tggcggccga gaacggaacc acgctccagg ctttactagg cgaggcgatc gatctgctga
     8941 tgcgccagca cggcaagcat ccgttcggcg agcgctaata tgtggatgcg tggacgtgtc
     9001 cacacgtcca caagctaaaa taccctgagc ctctgccggg tcagatcggg agacagagct
     9061 ggttccggtc gggcagggca gggggctctt ccaggcgctc gacgatcgtc gctgccaagg
     9121 catcggcggc tcgctcgcgc atttgtgcat cccgcattgt caggccgaca cgagcccagg
     9181 cgggagccgc cagaatgatc gaggagagaa gggcgcgatc catggcagcc aaaagaacat
     9241 aagaagaacg attcggcaag ccatgccggc agggcggtca ggaattttag cggctaaaat
     9301 tctggccgcc tgaaaggtga gttttggggt aggggctcac cgttcggcgg cgaggccgaa
     9361 atccaccaac acgggaagct cggccgccag gccgcgcaac ttggcacgcc gcaccacgct
     9421 gtgctgctcg atcaggcttt gggcgtcacg cttgccgctc gacgttttgg ggaaccagta
     9481 gagggcgacc cgctcaacct tgcggccatt cttgatcggc ttgaagtcga catagaaggg
     9541 gcagagcttg ttgatctcgt cctgagcgac cttcaggcag tatttgttga ggtcagcgaa
     9601 gcgctccagc ttgccctcag gcacgttcag caggccccgt atttcctcga tcgtgaactc
     9661 ttcgttctgt ttgtaatcga gaccgatacg acgctcgatc atctcgtaca ggcagagcgc
     9721 atatttcgac tcgaaacagt acatcacctg cgttttgagc cgggcgtaaa cctcgctgtt
     9781 acgcaggatc tcgatcagct cctccggaat ccggtaatga aggaagccgt ctttttcgag
     9841 gctttcgtca ctcgggccga ggagctggac gcgacggcgg aaggccttgc cgcccttgcg
     9901 gatcgtgacg atcgcgatcg tacccatcaa ccgcagaagc gagctttcca cccgctcatt
     9961 gccctggtgg gtgcccttga ggacggtctt cgcgatccgg tggatgatcg gctcgtcgat
    10021 ccgatcccaa gcgttcgcga tcagaaggtt atagatgcgg cgatcggcga gggtgagggg
    10081 ggtcagctcg acaatatcga ccagttcgcc cggcttgacg atctcgccat aattggcggg
    10141 atcgaacgga tttccgcgcc ctttttgggc aattgtcctg atggacggat cagcaacagc
    10201 ggtctgcgac atggcaccat ccacgggtga gccaccaagt tgggcgggct cacacttagc
    10261 atgaagggtg agctaggcaa tatggacagc tcgtttttca catctagcgc ggagataccc
    10321 caaaactcac cgatgatatg cgggataccc caaagctcac cgcagcccac cccaacactc
    10381 acttttggat accccatccc tcaccgtagg ctaccccaac actcacgcga ctcgtcccca
    10441 aagctcactt ttggagccaa ttttccgcag ttttctgcgg gtttgcgtac ccctgaatct
    10501 tgaacttaga agaattagaa gaatctgaag ggcattggtg agctttgggg tagtcccgaa
    10561 ccctttcacc tgtggataac atcgcctcgc acaccaatgg cgcatcgcgc aacaacaccg
    10621 tcagaaggga atgcggaatc ggccttcggc cgatgcgcta tagtttcgtg ccggctaacg
    10681 ccgtcacaag gcggcctaac ggccgcaggc ttggcgagga aggagtcggg cgaggtcggg
    10741 atcaaattgc cctcgcagcg tcccagggaa ggccgctcag cctcaaacga ggttgcgggc
    10801 ttccctattc ctctatccca tatcggacat gcgacagcgg cgctcaggct tgatcgaacc
    10861 gcccggcaaa ttcgcgatcg gcatagtagc gcagtttagt cgcgatgatc ggccgctgcc
    10921 cggcaaggaa gaggagctgg cggtcgggtt tgagcgtgcg aacctcgtcc ggcgtcagca
    10981 gtgcgcgggc ggtatggtgc tgggtgaagg agaggccgga ctcctccgcg tcgatcgcgc
    11041 ggctcaccgt ctcgaacacg accgtttcct ggccgagcag atccgagacg agctgcgcgc
    11101 tttgttgatc gttcacaccg aagatctgaa ggacgccggc attggacagg aaggtgccgg
    11161 cgcgctggcc gtaaagcgcg cggagctggt ggatgtcctg caaaatcggc caaagctgga
    11221 tgccatagcc ggccatcaat cccatcgcgc gctcgacagg ctcaaggtgt ccgagcgccg
    11281 cgaactcatc gagcaggaat aggaccggcc acggggcctt gcctggtacg cgggccagct
    11341 cggtcaacgc ctgggcgatc atcagacgga gccagcgcgc ataggtgtcg agccgatcgg
    11401 gcggcagcac gaggaagatc gtggcgggcg cagacttgat atcggcgaag gcgaaatcgg
    11461 atcggccaag cgccgccgtc atgcgcgggc tatcgagaaa atgggtatgg cgctgtgccg
    11521 aagacaatac gccggccgcc tcgcgatcgg acttgccgag atgtcggttg gcggcgcgcg
    11581 cgaccaggcc gccttgtgct tgcatgtcgt tgagcagctt ttcgaatgcg gcaggtgcca
    11641 atgtcagccg atcgcgcagc gtggcgagcg tgcgggtcgc cagcggctct gtctcgacaa
    11701 tgtggagcag caggccggcg atcagcgcct tggcctcctc gttccagtgc gcctcgctca
    11761 tctcgttatg ggcatcgtgg accagtgcgt cggcgagcgt catgcaatca tcggcgtggt
    11821 cgagaccctg cgggtcgata cgatcgagcg gattataggc agcggcgccg acgactcccg
    11881 tgatcccgaa gggatcgagg atatggaccg ggccgaagcg ggaccgctgg cgcgcggcga
    11941 tccgcgcgtt ctcgcccttg gggtcgatgc agaccaggcc gaaggggtat tcgagcagat
    12001 tgggaatgat cgtgccgacg cccttgccgc tgcgcgtcgg agcgatcgtc aacagatggg
    12061 cagggccagc atagcgcatg aggcgcttgg tcttaaggtc gcggccgatc agcaggccgt
    12121 cggtgcgatc aagggcgcgg gtttcgtcgc gggtcgcgaa gcgggccgag ccatgcgtgt
    12181 cgctgtctcc gccttcgaag ccaaaacgca tcaccatcgg tttgacgagc gcccgaaata
    12241 gcagaccgac cagaatgagc atcgtgccga tctggacgat gctcccgatg ggcgatccat
    12301 cccggacctt ggcgaagtag aggagggacg tgctcgcgct gctcagcacc agcgttgcca
    12361 ctagaaagat taccaccacg ccgatgagat gcttcagcac ccgcatcggg ctgaacagga
    12421 ttgcgtggac ggcgcttagc ggatctcgtg cgacccatcg gagcatgttg cggaaagcgc
    12481 gtccggtcag cctcacccag atcatgtcag gcctctccgg atgtcacctc gcgacgcgcg
    12541 tcgcccgagg tcgggagggg ggtcaggtag agcgatcgat actccgccat caatgccgct
    12601 ggcacccacc ggatgccacc cgcgacaggc ctgccttgat tgaacggagg gacttgagga
    12661 cacgcccagg cgtcgggttc ggattcaggc ggaacgtcat ttcgcccttc ggccgccatg
    12721 cgatcggcga ggccgtttaa acgacgctga cgctcgcgta acgcgtcgac gaaatggcgg
    12781 ggcaggggtg ggtcgtagtc gttccgctgg cgctcgccgc gatccatctc ataggattgt
    12841 gcggcccaaa ccggatcgtt gaaggtgatg ctggcggctg catggcccca catcatccat
    12901 tcgccgagat cggtactcat accctgtcct ccttggtctc cgcctccgcg tcgaaagcgc
    12961 gtttgccacg tcgcttccaa agcgcgagaa gatccccggc atcatcgctg cgcgccttcg
    13021 ccaccaggtc gagcatcgcg ccgtaaaggg tggcgcgatc gtcatcggcg agatcgacca
    13081 gaccggcttt ctggacgagg ccacccagct cgatcaggtg acgggtgcgc gtgcgacgtt
    13141 ccaccaccca ctccctcgta tcggttcgcc gttgtccgcc ttcagctctg cgcgtcgctt
    13201 gcgcgacccg cgccagcgcc ttgtccgtcg ctgccagatg atcccgaagc cttgcgtccc
    13261 cgtcgttgaa agaaggccgc gccatcggag cgccacgcct cctgcaccgc aggcgcctta
    13321 gcttccttta ggatatgaag gaggccgccc acgagcgtac ccgtatcgag cgcatcggcc
    13381 ccggttgcgg cgaccagctc gccgagttgc tggatcttct gagccttgag cgcgcgagcc
    13441 ttgtcattca gcgctttcag ctccgcatca tagtcgcgga cctttcgcat tgcagtctcc
    13501 cggcaatatc gaagaccgga cgatgccatg cggaatcgat ccgcacaaaa cagcttgtcg
    13561 ggaaattggc acggtcagtc acaacgaacg cgagagagtg agagtgcgcg cttatacgtc
    13621 gtttcgacgt gcactcagaa gaagcaggta agaagctgtc atggcgatct accatttctc
    13681 tgcgaaggtg atcagccgtg cgaacggatc gagcgcggtc gcgtccgcag cctatcgtgc
    13741 tgccgagcgc ctgtcggatg aacggatcgg acgcgaccat gatttttcaa acaaggccgg
    13801 tgtcgttcat tcggaagtga tgctgccgga aggtgcaccc gcgcatctcg ccgatcgcga
    13861 aaccctttgg aatgcagtcg aggcagggga aaagcgtaag gacgcgcagc ttgcccgcga
    13921 ggtagagttt tcgatccccc gcgagatgaa ccaggagcag ggcgtcgcgc ttgcccgcga
    13981 cttcgtacag gagcaattcg tcgatcgcgg gatgatcgcg gatctcaatg tgcattggga
    14041 tcatgcggag gacggaagcc ccaagccgca cgcgcatgtc atgctgtcga tgcgcgaggt
    14101 ggggcctgat gggttcggcg cgaaggtgcg cgagtggaac gcgacccagc ttttgcagga
    14161 gtggcgcgag gcgtgggcag atcacgtcaa cgagcgcctg tccgaactcg atatcgatgc
    14221 gcggatcgac catcgtacct tggaggcgca ggggatcgat ctggagcccc agcacaagat
    14281 cgggccggca ggaatgcggc gtctcgatcg cggcgaggat gccgaacgcg ccgacgatca
    14341 tcggcggatc gcgcgcgaga atggcgcgaa gatcattgcc gagccgggcg tggcgctcga
    14401 tgcgatcacg cggatgcagg caaccttcac gacccgcgat ctggcgatgt ttgcgcatcg
    14461 tcattcggac gggaaggaac agttcgacca ggtgatgggg gcggtgcgcg cgtcgcccga
    14521 gctggtggcg ctggggcaag atgggaaggg gcaggaccgc ttcacgtcgc gcgagatgat
    14581 cgcgatcgag cagcgacttg aacgggcagg ggacagcctc gccgccacgg atggtcactt
    14641 cgttgccgcc ccccatgtgt accgcgctct tgaggcggcc gagggtaggg gactgtccct
    14701 gtcggccgag caacgtgacg cgctcggacg cattaccgag cgcgatgggc tcgcttccgt
    14761 cgtcggctat gccggcaccg gcaagtcggc gatgctcggt gtcgcgcgcg aggcatggga
    14821 ggatgctggc tacaccgtgc gcggtgctgc cctgtcgggg atcgcggccg agaatctgga
    14881 aggcggttca ggtatcgcat cgcggacgat cgctagcctt gaatatcagt gggcgcaggg
    14941 acgtgagcag cttggtccgc gcgatgtgtt ggtgatcgac gaggccggca tgatcggcac
    15001 gcgccagatg gagcgggtgc tgtcggcagc ggaccaagcc ggcgctaagg tggtgctggt
    15061 gggcgatccc gagcagttgc aggcgatcga ggccggcgct gcgttccgat cgatcgctga
    15121 gcagcatggc gccgtcgaga tcaccgccat tcgccggcag cacgaggact ggcagcgcga
    15181 cgcgaccaag gcgctggcga ccgggcgcac ggccgaggcg gtccagtctt acgaacagca
    15241 cggcatggtc caggcggccg acacgcgcga tggcgcgcga ggcgagctgg tggaccaatg
    15301 ggactcgcag cgtatcgccg atcgcgacca gacccggatc atcctcacgc acaccaacgc
    15361 cgaggtgcga gacctcaatc tggccgcgcg cgaccggctg cgcgcgtcgg gcgagctggg
    15421 cgaggatgtc agcgtgtcgg ccgagcgcgg cgcccgtgac ttcgctgacg gcgaccgcat
    15481 catgttcttg aagaacgagc gcggccttgg cgtgaagaac ggatcgctag ggacggtcga
    15541 gcgggtgtcg ccgaccagca tggcggtccg cctcgatgac gggcgcgatg ttgccttcga
    15601 cctgaaggat tatgcccatg tcgatcatgg ctatgccgcc accatccaca aatcgcaggg
    15661 ggtgacggtc gatcgcgcgc atgtgctggc gacgcccggc atggatcgtc attccgccta
    15721 tgtggcgctg tcccggcacc gtgacggcgt gcagctccat tatggccgcg acgatttcga
    15781 cgaccagcgc agccttgtcc gcaccctgtc gcgcgagcgg accaaggaca tggcggcgga
    15841 ctatgggcgc gatccggccg agggcgttcg ggccttcgcc gatcggcgtg gcttggccgg
    15901 cgagcaatgg tccgcgaaag cacgaaccgg cgttgagatt tccggcgcgg agatgccggc
    15961 cgcgggcgtc gggggcgctg atccggccgc ggtcgatccg tctggcacat cgcttcgtgc
    16021 tttcgaggac caaaagcggg gcgtgttccg gcctgatgtc gcggcgacca ctggagacac
    16081 agcgggccgc aagcggagca tgttcgacgg attgaagctc gggggctcac cgacacccac
    16141 ccctgccaag gcgcgaaacc tcgtttcgga ccaaggtttg gccggcgccg tcgagcgcgt
    16201 gtcacgctcg gccgtgacga tgatggaagc gcgcgcacaa ggaaggcccg tccttgagca
    16261 tcagaggatt gcgcttgaga aggcgcaagc cgcgctcgat cagatccgcc cgcaagcatc
    16321 gcgcgacctc gcatccgtcc tcgagcgcaa tccggggctg atccgtgatg cggcgcaggg
    16381 cgcgtccggc ccggcgatcc aggcgatggc gcacgagacg cgcgtgcgtg ccgacccgca
    16441 gttgcgggcc gatcggttcg tggagaattg gcagggcatc cagcgccagc ggggccaggc
    16501 ggaaggacgc ggcgaccaag ccggcgttga tcggtccacc aaggcgctgg agcgcatggc
    16561 aaaagggttg gagcgcgatc cgcagatgga atcggtgctt cgcaaccgcc gaccggaact
    16621 cggcttgcag agggatatgg ggcgcgagtt gagccgggat ctgacccagg cgctcagtcg
    16681 cggtcgcgaa cagggacttg gccgataggg aggcacgtat ggacgaggac gggtatcgcg
    16741 acgaggatgg tgccggtgac gatccggcag cggcgttcga gcggctacgc ggcgaggttt
    16801 ccttgctccg ccttgcggtg ggatcgctgg cgacggcccg cgagacgatc gagatccccg
    16861 actatgagcc gacgctagcg cgtaccgaga ggattttgac cgtcctcacc gagcagttgg
    16921 agcccatcgt cgaaagcccg atgttggcga tgacgccgcc taaaatggcg aacgagatcg
    16981 tgtcggctgc ccttcaagcc cggcgcgagg accagcggct tctcactgaa ggccgcgctg
    17041 cactcgatca ggcgacccgc gacatgcggc agatggtcgc ttccgcgcgc accggcgaag
    17101 agcagaaccg ctggatcttc ctgtacggca taggcggctt agtggtgggg attgtcgtat
    17161 gggcggtatt cgctgggatc gtcgcacggg ctatgccggc gagctggcat tggcccgagc
    17221 ggatggcggc gcgcacgctc gacacggata tgtgggatgc ggggcaacgc ctggcgagcg
    17281 tcgccaatcc ggatgggtgg cgcgggatcg ttgccggtga cgctatcgtg cgcgcgaacc
    17341 atgacgcgat cgaggcgtgc cgcaagtcgg ccgccaaggc caaaaaggcc gtgcgctgcg
    17401 cgatcgatgt gaaggcggga gaatagagat ggatgctgtg accgatccgg acgggcgggc
    17461 gatcgtggcc ttgctcgacc aagctatcca tgccgaggcg cgcaccgatg ctccgcccga
    17521 ggcagaacag cgcgattggc tctatggcgg cgtcgatccc accacctaca ccgagcccga
    17581 cgcgcatggt tggatgggga tcgtgccgcc cagcaccgtg ggatgggtgc cgcgtgcgct
    17641 ggtattctgg cacacggtgc tggcgagcgg aggctccatc agccgcgagc agatgcgcca
    17701 acctgctcat tcgcttagcc gctggccgac gatcgagatt gcggtgggtg actatctcac
    17761 ggcgtcgcct tggctgatag cgtaacgcac gcccaggcgg cgggctcatc tcttgaccct
    17821 gaatcgaatt catggccaaa attcagtccc aggcggtgac ggtcgcttca tcaatttgaa
    17881 gcccggagtc cgtctgtggt taagccaggt gcgaaaatcc gccgtaaacc ctgcttcagc
    17941 aatacggcaa agatgccgct atgaaatcac tgagccttcc tggcggcggc gtgagcggcc
    18001 tgttgataat ggcggggcat ccggcgtggg gcgcgattgt cgcgacctta tcgattgcga
    18061 tgcctttcgt agcggatatc atccgagcat cgaagggccg ttgatgacat tcctaactgg
    18121 acggagcagt gggtaaagaa cctatcgata caacacctgc ttcggcggag gtggtcgcgc
    18181 gggtgcagac catatcggat aagaaggcct tgaagcggca cttctccgcg atgtttaaac
    18241 aaggtcagcc gcactatgcg gatttctacg acatagatgc tgagccatgg aatctctggc
    18301 ccggaatggt ttcagacttc gtagaaggtt gggaaccgat cactttcgac gacgggcgca
    18361 agccagccgc gatagccatg gctcttacgt tgtcaatgtc tgctggcacc gatgctgtcg
    18421 ggaaccaggg tgcagcactt gccttggccc gaagggagtt tggcgatcgc gagcacgtct
    18481 gggtagctgg cgaccataac ggccccttcg tcaaattcct ggtccaatat cggaacgaag
    18541 aaggtaggcc tctctcacca ggtccgtcag atcttcgacg ttaccgggag acatatgccg
    18601 aggagctatg cgcccgggac attacggcgc gggcaacaac gcgcggcagt cggggtctag
    18661 gctttagcga agggcgacta gccctgaaag cgcgccgacg tttgagcggt agctgatcgg
    18721 gcaaatcgcg agcccagagg cttccatagt atatatggcc gaggtaagaa cataggagca
    18781 cagagagggg tttaatcgtg aacggaggtc agtaccgtca aagcgtgcag atcggacgga
    18841 agccagcggc aaatctgcac catgcgacac gcatcgcgga tctcgttggc tgctccctca
    18901 accaattcat cacgatcaat tacagcaaaa ccaatagcaa gcccgaggag gctagcgcac
    18961 agttccgtct cctgctggcg agttggttcg ctcgctggct ccgccgccac ccaaagaaca
    19021 agaacgcgtg ccctccaaca tatgtctggg cattcgaagc cgctggtgga cagaccgccg
    19081 tgcattggct tgtccatatc ccccgaggct taatccgcga gttttggcga atggtgcccg
    19141 tatgggtggc gacaacgacg ggcggcgaga tagatgccaa caccgtcaaa catcgacgga
    19201 tctacaatct cataggtgcc aagcgttatg tgctgaaagg aatggacccg catttcgccc
    19261 gcatgtggca aatcaggccc tcgccgcagg gaacgataac ggggaagcgt agtggcttca
    19321 gccggaatct tggcccggtc gcacgaaagg cgctggcgta taggccgcta cgtcgccaag
    19381 ttggccaatg ggctgaggcc acgaccacat agttccggtg gggttgccaa gtaaggacgt
    19441 gccgacctat gacgtgacta ggaccgtgaa cagaattttc tgctgagttt cttggcagtt
    19501 gagaagtacg cgagcagcgc ttgctgctat gatgcgatca tgatgatatg atgttatgat
    19561 gatcgattga cgatgatatc gcataagagt gttcacggtc caaaatgctc gatgacctta
    19621 aatcctgtac tagtagatca ggtctcgcgg ttttgcttgg tgttaagcca agtgagctgt
    19681 catatactct ttataaaatt cctgatgcgg caaaatatac tagcttttgt ataagcaaga
    19741 agagcggcgg cacgcgccaa attcaagctc cttgtccgcc actaaaatgg cttcaggggc
    19801 gccttctgga tcttctgtat caatgcgaag atgatatcag cgcagcctca gggcttaagc
    19861 gcaatctcca ttccgggttc aggcggggcg tcaatatata cgagaacgca aatgcgcaca
    19921 gaggcaagag gtttgttttt aacatagata tagagagctt cttcgatcag tataattttg
    19981 gccgagttag agcatttttc attaatgatc gagactttgc tctgcagcct gcagtggcaa
    20041 caactatagc tcagatagtc tgttttaata atgttttgcc acaaggcagt cctacgtcgc
    20101 ctcacatagc taaccttctc acgcaattct ttgataaccg catggcgaga tttctacggc
    20161 ctaggcgatg tggatatact cgctatgcag acgacataac tatctcgacc aatgtacgcg
    20221 agtttcctgc tgatgtggcg ataatgacgc cggctgatcc tcaagggtgg tcaatcgctc
    20281 ctgagcttgc agcgatcttt gggcgggcga acctgccgcc taacccgtca aaaacacgga
    20341 tgagtgcgta ttcaagcagg caaaccgtaa cgggccttgt cgtcaatcag cggcctaatg
    20401 taacgcgcga gtattacctg catacgagag cgatgtgcga tcgacttttt aaaacgggaa
    20461 caattcagat tcccgatatt acctcgtcat atggtaaaaa ctgtccggtt tctgatgatg
    20521 cggaaccaga agccgatgta gatccgctaa aggttctcga aggccgccta tcgcacatac
    20581 accacatacg tgagaagagt gatcttagaa atatacagga aaagcaggac aatccgactc
    20641 agttctggaa catgttgcaa gacttcttct tgtttaaata ttttgttgca aattcaaagc
    20701 cgctcatact gaccgagggg ccgtcagata tattttatct acgatctgcc attataaaca
    20761 atacaactct gcttgttcct gaactaaaga aggtcgtgtc gggtaagccc gagatcttac
    20821 caacattctt tcggtttaat acggttgctg caaaggttat cggcctgacg ggaggcgcag
    20881 gaaatattaa gcgtttccta tacttatatc ataaacagga aaagcgattt aacagatcgc
    20941 ttcggcataa gcctgttata ataattatcg acaacgattc aggcggcgcc gacgttatca
    21001 acatggtcaa cggtatatat aaaacaaata tatctttgtc cgatccaatc atggctcata
    21061 agataactga tggcctcata cttgtgaaaa ctcctcatgt cggttcaaag acacatactg
    21121 ccattgaaga tcttcttccg gccagcgtta aggcggtgaa gctaaatgga aaatcattct
    21181 cagcagccaa aaaatttgat gctacgaagc attttggaaa aattgctttg ggcagttatg
    21241 tgcaggctaa tgcatcgtcg attagttttc agggttttga cgatttcatc gtcgctatca
    21301 atggcgcgat caccatgtga gtgatccggt gccgcatgga gcgggttgcc gtcatccgag
    21361 ctgttggcac gccgttttaa gtcgccccta aaccaacact cgtgggcggg tgcttggacg
    21421 ttcccgcaaa cggcggtttg acggagagca ccttagcaga aaaacgtact cctttcgttc
    21481 ttggctattg tctccgaaaa tggtctcttg tatgcctctc cgaaatccgg ccctgtcggc
    21541 atgagttttc ggaggattgc gatgcttgtt ggctatgccc gtgtctcgac ccgagatcag
    21601 aatcctgcat tacagctcga ggcgttgcgg gctgtcggct gcgataagat atttaccgag
    21661 aaggcctcag gagcgcagcg ggatagaccg gagctgcagg cggcgcttgg gtatctgcgg
    21721 gctggcgacg cattggtcgt atggaagctg gaccgcttgg cacgatcggt tcgacagtta
    21781 gtcgaaacgg ccgagctgct acaaactcgc gagattggtc tcaaggtcat aacccaggca
    21841 atcgatacca ccagtcccag cggccgactg acctttcatc ttctcgctgc gattgctgag
    21901 tttgaacgcg agctcaccct cgagcggaca catgcgggcc tcgcccaggc ccgcgcgctt
    21961 ggcaggcgtg gcggtcgtaa gcctgctatg ggtgaacccg agatccggcg agccaaggca
    22021 atgctgtccg atccctcaat cacggttgag gaggtcgctc gccagctggg cgttcagcct
    22081 tctacgctct atcgacacat acctggtggt cgc
//