LOCUS       DS571286               42641 bp    DNA     linear   CON 17-APR-2008
DEFINITION  Entamoeba histolytica HM-1:IMSS scf_1104750516671 genomic scaffold,
            whole genome shotgun sequence.
ACCESSION   DS571286 AAFB02000000
VERSION     DS571286.1
DBLINK      BioProject: PRJNA142
            BioSample: SAMN02953605
KEYWORDS    WGS.
SOURCE      Entamoeba histolytica HM-1:IMSS
  ORGANISM  Entamoeba histolytica HM-1:IMSS
            Eukaryota; Amoebozoa; Evosea; Archamoebae; Mastigamoebida;
            Entamoebidae; Entamoeba.
REFERENCE   1  (bases 1 to 42641)
  AUTHORS   Loftus,B., Anderson,I., Davies,R., Alsmark,U.C., Samuelson,J.,
            Amedeo,P., Roncaglia,P., Berriman,M., Hirt,R.P., Mann,B.J.,
            Nozaki,T., Suh,B., Pop,M., Duchene,M., Ackers,J., Tannich,E.,
            Leippe,M., Hofer,M., Bruchhaus,I., Willhoeft,U., Bhattacharya,A.,
            Chillingworth,T., Churcher,C., Hance,Z., Harris,B., Harris,D.,
            Jagels,K., Moule,S., Mungall,K., Ormond,D., Squares,R.,
            Whitehead,S., Quail,M.A., Rabbinowitsch,E., Norbertczak,H.,
            Price,C., Wang,Z., Guillen,N., Gilchrist,C., Stroup,S.E.,
            Bhattacharya,S., Lohia,A., Foster,P.G., Sicheritz-Ponten,T.,
            Weber,C., Singh,U., Mukherjee,C., El-Sayed,N.M., Petri,W.A. Jr.,
            Clark,C.G., Embley,T.M., Barrell,B., Fraser,C.M. and Hall,N.
  TITLE     The genome of the protist parasite Entamoeba histolytica
  JOURNAL   Nature 433 (7028), 865-868 (2005)
   PUBMED   15729342
REFERENCE   2  (bases 1 to 42641)
  AUTHORS   Lorenzi,H., Amedeo,P., Inman,J., Schobel,S. and Caler,E.
  TITLE     Direct Submission
  JOURNAL   Submitted (01-MAR-2007) The Institute for Genomic Research, 9712
            Medical Center Drive, Rockville, MD 20850, USA
COMMENT     This version of the project, JCVI-ESG2-1.0, represents 8x coverage
            of the genome.
FEATURES             Location/Qualifiers
     source          1..42641
                     /organism="Entamoeba histolytica HM-1:IMSS"
                     /mol_type="genomic DNA"
                     /strain="HM-1:IMSS"
                     /db_xref="taxon:294381"
     repeat_region   complement(1..2261)
                     /rpt_family="LINE1"
     gap             3227..3326
                     /estimated_length=100
     gene            complement(<4994..>6469)
                     /locus_tag="EHI_026200"
                     /old_locus_tag="241.t00004"
                     /db_xref="Pathema:EHI_026200"
     mRNA            complement(<4994..>6469)
                     /locus_tag="EHI_026200"
                     /old_locus_tag="241.t00004"
                     /product="hypothetical protein"
                     /note="transcript EHI_026200A"
                     /db_xref="Pathema:EHI_026200"
     CDS             complement(4994..6469)
                     /locus_tag="EHI_026200"
                     /old_locus_tag="241.t00004"
                     /note="encoded by transcript EHI_026200A"
                     /codon_start=1
                     /product="hypothetical protein"
                     /protein_id="EAL44788.2"
                     /db_xref="Pathema:EHI_026200"
                     /translation="MEKIEDCIVEFIWNYSPVSLVNIGKMKLLKRCKIDIGRQKFDIN
                     SVFSNKQQHLKILRLSNIGNYKEIEEFKEYKNIERVIIEIDDDTKEEYIEQMSKYAVL
                     VSDQWYSQLNKNVIVMMDKKFHLQIKEKPNVETLEFIQQNYLPYKMIIDADYYDGIQT
                     QFKLFDNVMKLTLNVEIDPQEEVDQDDIMQRRMDRINGIERSDDDDFVEETEEQKEER
                     ERLHKLEIERRKHSIILPQHLTSITINDMTPYFHQTLSITLKELTTSNIPIDFIYQLT
                     SLTKINISNTNITQSLKSLEKLIDITFNLCVDECSEFICPHSVECLKLYNCRNWKFQE
                     LSHLKLLDKLMIYDARPNVLSTLQLNEATSVKKLYLNNVITASMPTSLTCLIIGSAGN
                     RAIDMTKYLQLKDVCIENSNQVRVKLPLSIKSLYLYCSSIRIFNKNDIQLKELHLEDC
                     EDINFESFNLNHVTKLSLLPFDEEYLEYLEQFPVLEEKNFN"
     gap             6662..6761
                     /estimated_length=100
     repeat_region   8370..10842
                     /rpt_family="LINE1"
     gene            complement(<11337..>12785)
                     /locus_tag="EHI_026310"
                     /old_locus_tag="201.t00003"
                     /db_xref="Pathema:EHI_026310"
     mRNA            complement(<11337..>12785)
                     /locus_tag="EHI_026310"
                     /old_locus_tag="201.t00003"
                     /product="hypothetical protein"
                     /note="transcript EHI_026310A"
                     /db_xref="Pathema:EHI_026310"
     CDS             complement(11337..12785)
                     /locus_tag="EHI_026310"
                     /old_locus_tag="201.t00003"
                     /note="encoded by transcript EHI_026310A"
                     /codon_start=1
                     /product="hypothetical protein"
                     /protein_id="EAL45353.1"
                     /db_xref="Pathema:EHI_026310"
                     /translation="MLGGFGAFSSNNPSSNNGSQQFNTMGSTGNSIPNMGTNSFGGNG
                     LGTNTMGGNTFGTNPLGGNGLSTNAFGGNTFGTNSLGGNGLSTNTMGGNGLGTNTFGG
                     NGLGTNTFGGNGLGTNMIGGNGLGTNSLGGNGLGTNTMGGNTFGTNSLGGNTFGTNSL
                     GGNGLGTNVMGGNGLGTNMMGGNTFGTNGQGTNTGIGTPTPQDFTKSRFPTESIKNRE
                     SIQIIPESNKIKREKKKQEVTTPTIINETNENKSKLDDVFDLSRKNTTNEQPLFLRRF
                     NQTFNSPYRRNGMVPLIRPSYINNSTQRQSIYSCNPIGTLNPSYNCNINNSIVTSIPG
                     NISRNSILPNTTINNQTSILFNNNQQSVLYGLNQGNNSILSNSPIVQNIKEYAIILSN
                     LTIQDTPLIINVLSQFGVIVNVIEWKNGVKVIFADETVVNYLIDMKKIMIAGKMCYIS
                     DPNESFLLKLFDGQTWKSLFSNLFNFLHSIWN"
     gene            <12998..>13654
                     /locus_tag="EHI_026320"
                     /old_locus_tag="201.t00004"
                     /db_xref="Pathema:EHI_026320"
     mRNA            <12998..>13654
                     /locus_tag="EHI_026320"
                     /old_locus_tag="201.t00004"
                     /product="hypothetical protein, conserved"
                     /note="transcript EHI_026320A"
                     /db_xref="Pathema:EHI_026320"
     CDS             12998..13654
                     /locus_tag="EHI_026320"
                     /old_locus_tag="201.t00004"
                     /note="encoded by transcript EHI_026320A"
                     /codon_start=1
                     /product="hypothetical protein, conserved"
                     /protein_id="EAL45354.1"
                     /db_xref="Pathema:EHI_026320"
                     /translation="MGCDGGVVARRDDLVKDKKKETKKCNTEDRYRYCSLTHKLFKKR
                     VVCDVVGRLYNKDGLLKALINHEMPEELRYIHSKKDFIELNIEWSNGIIVCPLKKVEF
                     SPGHQFVALKCGCVISKLALDEIKSINGNKCPLCETEGLEFIPLNLPLEEMEKQMELH
                     CKLFDQKQNKTKFIQKEENKIALVTQPIANTIADQAKVNVNKQDDDEIYKSLFKSSQN
                     "
     gene            complement(<13965..>15551)
                     /locus_tag="EHI_026330"
                     /old_locus_tag="30.t00050"
                     /db_xref="Pathema:EHI_026330"
     mRNA            complement(<13965..>15551)
                     /locus_tag="EHI_026330"
                     /old_locus_tag="30.t00050"
                     /product="pumilio family RNA-binding protein"
                     /note="transcript EHI_026330A"
                     /db_xref="Pathema:EHI_026330"
     CDS             complement(13965..15551)
                     /locus_tag="EHI_026330"
                     /old_locus_tag="30.t00050"
                     /note="encoded by transcript EHI_026330A;
                     GO_component: GO:0005622 - intracellular;
                     GO_function: GO:0003723 - RNA binding;
                     GO_function: GO:0005096 - GTPase activator activity;
                     GO_process: GO:0008152 - metabolic process;
                     GO_process: GO:0051056 - regulation of small GTPase
                     mediated signal transduction"
                     /codon_start=1
                     /product="pumilio family RNA-binding protein"
                     /protein_id="EAL49999.2"
                     /db_xref="Pathema:EHI_026330"
                     /translation="MTNTSKDIVQQLLFNESRSTSAPPQMDRIGSSGEVISLEDLEKQ
                     AYRAHPEYHQYYFQQKPADPRLPKPLFEENLPKGYESVLKKAFKTTPFNLDKILEGLS
                     GPNLRNELRIENEESYEEEDDDDNSEEDNSEEDNTNESSEEGNSEEDSEEESESSEES
                     SEEEESESYEEDNQMNRYSRYQQQYQPNYQYNGNSYPINFGYIYPINDNVTLDYVSMS
                     KEHNGSRTVQQSIEKGSEDERQKIWRTLQEHVVELSSDLFANYVIQKAIEFIPESRHI
                     VPQKMKGNVLRLTLHMYGCRVVQKAVEYASMKDRRLLFEELRKSLVRCIEDQNGNHVI
                     QKCVEKGDRQMVMDIVNALQGIVLECCKHPYGCRVVQRVIESVDYDCVTELLQVIEPH
                     SLDLTEDQYGNYVVQNVLERGYPNDRHNILQQIKGNIVRLSMGKYSSNVIEKCFKFAT
                     QNERQQILEEIYQNNGILQMMQDQFANYVVQKIIEAIDSSEREKIVELFIKPNLTILK
                     KVTYTKHILNLLETLDDIHL"
     gene            <16004..>16387
                     /locus_tag="EHI_026340"
                     /old_locus_tag="30.t00049"
                     /db_xref="Pathema:EHI_026340"
     mRNA            <16004..>16387
                     /locus_tag="EHI_026340"
                     /old_locus_tag="30.t00049"
                     /product="thioredoxin, putative"
                     /note="transcript EHI_026340A"
                     /db_xref="Pathema:EHI_026340"
     CDS             16004..16387
                     /locus_tag="EHI_026340"
                     /old_locus_tag="30.t00049"
                     /note="encoded by transcript EHI_026340A;
                     GO_function: GO:0003756 - protein disulfide isomerase
                     activity;
                     GO_function: GO:0016209 - antioxidant activity;
                     GO_function: GO:0016491 - oxidoreductase activity"
                     /codon_start=1
                     /product="thioredoxin, putative"
                     /protein_id="EAL49998.1"
                     /db_xref="Pathema:EHI_026340"
                     /translation="MRTFFALLLIALVSANSEGLVSLNPDNFKTYQNSGKTLLVKFFA
                     PWCGHCKRLAPTYEEVAQAFTENEDVIIAEVNCDDYRELCQEHGIRGFPTVLVFNGEE
                     SKKFQEQRTVEELKKFVLENVPAKN"
     gene            <16476..>17954
                     /locus_tag="EHI_026350"
                     /old_locus_tag="30.t00048"
                     /db_xref="Pathema:EHI_026350"
     mRNA            <16476..>17954
                     /locus_tag="EHI_026350"
                     /old_locus_tag="30.t00048"
                     /product="Rho guanine nucleotide exchange factor,
                     putative"
                     /note="transcript EHI_026350A"
                     /db_xref="Pathema:EHI_026350"
     CDS             16476..17954
                     /locus_tag="EHI_026350"
                     /old_locus_tag="30.t00048"
                     /note="encoded by transcript EHI_026350A;
                     Contains PF01363 : FYVE zinc finger PF00621 : RhoGEF
                     domain PF00169 : PH domain;
                     GO_component: GO:0005622 - intracellular;
                     GO_function: GO:0005089 - Rho guanyl-nucleotide exchange
                     factor activity;
                     GO_function: GO:0008270 - zinc ion binding;
                     GO_process: GO:0035023 - regulation of Rho protein signal
                     transduction"
                     /codon_start=1
                     /product="Rho guanine nucleotide exchange factor,
                     putative"
                     /protein_id="EAL49997.1"
                     /db_xref="Pathema:EHI_026350"
                     /translation="METISPQSYPSFPRMHEGKCRVKGCNCNRFEGMTDLPDERCSNC
                     FHSIEAHTLPVELFNNIKCDKPTILTTPREVYRKKIAMELLTTERTYVRMLMTCLRCY
                     ADPLQSCEPPLLPPTLYKSIFLFYRDIVRVNLVFLQSLEDLVEKNQLVSGLSSVFLGT
                     LPYLRVYRMFVGNNSVGLQAVEQAEHMKDVVKLLHHCSKYGYEGETVQPLRSYLILPI
                     QRIPRYNLLLSDFLKHTDRNDPLFEETTALVGSLKSLAKEINDEVKLQDNRRKLLAIK
                     KKFCEGPYHLTLVEAHRYIMREGILFKLSKTKPKKRYFYLFNDILVYGRMQLQLFYPN
                     LYLRLNSVHIEDGLQPNTFNLLSPFKSFTVICSSIEERNTWANDLKSAIQKESDKKFS
                     KNIDTVGFDAPLYQPFNEATLCFICKRKFGIFCFKYHCERCGFVVCDSCSKNRKIVPP
                     NPVPQRICNFCVRSADRNIEVFKGLRKRSKQERARLALALLE"
     gene            <18552..>19628
                     /locus_tag="EHI_026360"
                     /old_locus_tag="30.t00047"
                     /db_xref="Pathema:EHI_026360"
     mRNA            <18552..>19628
                     /locus_tag="EHI_026360"
                     /old_locus_tag="30.t00047"
                     /product="phosphoserine aminotransferase, putative"
                     /note="transcript EHI_026360A"
                     /db_xref="Pathema:EHI_026360"
     CDS             18552..19628
                     /locus_tag="EHI_026360"
                     /old_locus_tag="30.t00047"
                     /note="encoded by transcript EHI_026360A;
                     GO_function: GO:0004648 - phosphoserine transaminase
                     activity;
                     GO_function: GO:0008483 - transaminase activity;
                     GO_process: GO:0008152 - metabolic process"
                     /codon_start=1
                     /product="phosphoserine aminotransferase, putative"
                     /protein_id="EAL49996.1"
                     /db_xref="Pathema:EHI_026360"
                     /translation="MERQNIHNFGAGPAAMAKEVIEATAKAVNNFWEGLSILEISHRS
                     KEWINVMNETKALMKEVMDIPEGYEILFFGGGASLQFLMVAMNLLNKKACYLDTGVWA
                     SKAIKEAENIGEVKIIGTSKDKNYTYIPEYQIPSDYDYFHITTNNTIYGTEIRKDIES
                     PIPLVADMSSDILSKPIDISKYSLIYAGAQKNCGAAGVTIVIIKKEILGKVQRKIPII
                     LDYQVHILNNSMYNTPPVISIFTVNQTLKYIKKIGGLKKIQELNEEKARLLYAEIDRN
                     KIFRGTVRKKDRSIMNVCFVMEEQYKQLENEFSEYALQKGIIGIKGHRSVGGFRASIY
                     NAVTIESVQALIKCMHDFEQLHTH"
     gene            complement(<19718..>21817)
                     /locus_tag="EHI_026370"
                     /old_locus_tag="30.t00046"
                     /db_xref="Pathema:EHI_026370"
     mRNA            complement(<19718..>21817)
                     /locus_tag="EHI_026370"
                     /old_locus_tag="30.t00046"
                     /product="ENTH domain protein, putative"
                     /note="transcript EHI_026370A"
                     /db_xref="Pathema:EHI_026370"
     CDS             complement(19718..21817)
                     /locus_tag="EHI_026370"
                     /old_locus_tag="30.t00046"
                     /note="encoded by transcript EHI_026370A;
                     GO_function: GO:0005543 - phospholipid binding"
                     /codon_start=1
                     /product="ENTH domain protein, putative"
                     /protein_id="EAL49995.1"
                     /db_xref="Pathema:EHI_026370"
                     /translation="MQFVDYKVKLATRKACNTSNCPPKPKHIRTIVVKSFSGGVPSFY
                     SELTKWILSFNPLQQYKSLVTLHRVLRDGSSQLLGGYLDAFLPTINRLVNTPQQLNAY
                     YAFQQIIKHYAKYIQIRFVFHQKHRIFTGSLLVPHELPEEYYSDQKTLSVLSYMMDLM
                     DYLLVIPLPIIQNYIGDNCKMDCTIPLILDSYSLVKDITFFLTNLAHIEQNQSVFTFL
                     YDRFTKTYSKLNQLYSAAKNNGYIVSLIEVPNLPPLPTFNVNDEERKLYLKKHPHSIT
                     KNNHLQKTFLHQNNNNTKEILELGNHFSQQLSKLFDLLIPPQLSSEDPESKLETMASC
                     LMQELQNPSNLDDIKIHIWKTLIGTKYLLQQRNLDYVDANNNGEKVINELYDLQSIAD
                     KIKVSFQMNEGYEELQKYIEEFVSILSSSSANTSETTPTNQDNDLVLFDYIGDSSHDK
                     VIQTSQDDFIDEQSFNSFIPPNLQNQENSSNEEEDFSIVLNQINDQINKIEDVRDALK
                     NCNTNGNETIKRFGDSTQGLIDFIQIAGECEKERIREGKEKNNQTYSNNEVWSEGLLS
                     CAKKIVEWAQYISSALMNGEPDERILAGLKQFKSHCSQLLTAARVSMEDQSPLLQRLE
                     KSLCSLMSQIQKIIQNILSREQEQRQEIKEQNKTQDNGIESKKELMESQVRVLQLQKE
                     LEKAQNHLYSLRKEEYN"
     gene            <22021..>26211
                     /locus_tag="EHI_026380"
                     /old_locus_tag="30.t00045"
                     /db_xref="Pathema:EHI_026380"
     mRNA            <22021..>26211
                     /locus_tag="EHI_026380"
                     /old_locus_tag="30.t00045"
                     /product="Sec7 domain protein"
                     /note="transcript EHI_026380A"
                     /db_xref="Pathema:EHI_026380"
     CDS             22021..26211
                     /locus_tag="EHI_026380"
                     /old_locus_tag="30.t00045"
                     /note="encoded by transcript EHI_026380A;
                     GO_component: GO:0005622 - intracellular;
                     GO_function: GO:0005086 - ARF guanyl-nucleotide exchange
                     factor activity;
                     GO_process: GO:0032012 - regulation of ARF protein signal
                     transduction"
                     /codon_start=1
                     /product="Sec7 domain protein"
                     /protein_id="EAL49994.1"
                     /db_xref="Pathema:EHI_026380"
                     /translation="MSQKNTPSPLPDPSSKLSLLVETLESIHYRSKDDIVYQASKVFL
                     ESTSSLEDPLLVLSPLNQNLFVQLLDAIFKSKDRNKLLSIFVPLITPDLMTSETLSLV
                     CSSMLSILPFSSTGKDSLLPIVLTSFTNLSRCRLHDEVYSLLISSLFDLHVILLPNAP
                     EAQRVKDLIQTFIDVSPQTPMYSNGVPPVVTLLTTSAKYSTDDWCLPDAVHVKSDNKY
                     MTSVNFSSRIRSDIEKHREEKMKFVKTLSNENQKYFNSRAHAHAVKSILLIFTIADHH
                     ILQQYDDWKKPLIDCLIANGFTTEPQKYIPTLKIFIEVMSSPTLHVKGLSVIFERLYL
                     FILNSSLSTPQQKQLTLEMLVSLTEKQECIISMFQLYDCSIAAPNVIRSLVKTLSDVV
                     YGKIKSMEKFVSKQFDTDNRMRALKCILNIIDNISTIQINYSPLPSTIEQRMERKVLL
                     ENGFPLFANNPKDGVEYFISNKFCENSSRSIADFLLSTQGLDKRRVTEYISNLGNDGN
                     DALNNLIKEIDFSGERFDDALQRMFWMFCAPREVQLVDNIIERFSVRYAECNAALNMT
                     PEQIYLLATSVMCVALDTKTKRITFKEFSEMLGNAGNIDIKGLFQRATSGSFALAECL
                     TGIGPNTVNDLEVKERVLRTLSGIDANMIRIYQTKEEGKLENSIDVIKAFIKSTLISC
                     TDICRYLFFNEETGDFVENSLRGMQKLIHITAYCGMAECDDLTSDISLWTMLLSPEEM
                     SPKHVLAIRYIINICKEEGPLLKNAWLSCLKVISHLDNLGLMPKPYGDVSEIKVMPKP
                     QHPIYYPEYLGIFTFVNNDLRVANKKFDQKTLTTLKQLLQKHLSVINDIFIKEAVAPN
                     ENFLCFLNSLKTVIMTEINTLSPQYFLFNILIQILLMIVGREQNVINQALIIACDIYV
                     KAGLHPHHILAKQAVKALGLLQSKFPQNDIILNSLMIVMADSAVPPVRDAIIETIESI
                     LDDYKPSQKMNWKAIINILNLAAVDSSPNVIIRGFSSFRLLTIKTFDDETQYLITKGL
                     QLYSKKCSNEKMARDLVALANSYLQEKKQLTEVMYIWGGIIGSKYVECAVEAMKYLLI
                     QLENNNSEMTWNVVYTQIVPLVYSNIEKKDKEWITTVGMTFALNLSSFIANKKVPIRY
                     IEVVLMICHMFCCSPLQFGISVSGLLVQDIVEVVSHHDNCYDGFKLIMELVHSHIAAV
                     VLKKVNLRVKTPKGNKEMIGVIKCSTCNKEFSSHLSFLCPYCKEHYYCSLECQKKKET
                     KHLPQPIINHYETFQPTDNKTLLTCDLKIFIVLKEMVHDIASHEKSDEMLQSLQSVID
                     EYSSVYSDIEKTTYMECFGLAVDAAVDCFVSLAIESSQFTMINLLFKMTDKIISIVCD
                     KLLQEHTTIVCFISFFFN"
     gene            complement(<26429..>27844)
                     /locus_tag="EHI_026390"
                     /old_locus_tag="30.t00044"
                     /db_xref="Pathema:EHI_026390"
     mRNA            complement(<26429..>27844)
                     /locus_tag="EHI_026390"
                     /old_locus_tag="30.t00044"
                     /product="cation transporter, putative"
                     /note="transcript EHI_026390A"
                     /db_xref="Pathema:EHI_026390"
     CDS             complement(26429..27844)
                     /locus_tag="EHI_026390"
                     /old_locus_tag="30.t00044"
                     /note="encoded by transcript EHI_026390A;
                     weak similarity to: TIGR01297: cation diffusion
                     facilitator family transporter;
                     GO_component: GO:0016020 - membrane;
                     GO_function: GO:0008324 - cation transmembrane transporter
                     activity;
                     GO_process: GO:0006812 - cation transport"
                     /codon_start=1
                     /product="cation transporter, putative"
                     /protein_id="EAL49993.2"
                     /db_xref="Pathema:EHI_026390"
                     /translation="MVHPSTSLATLLPISSPTVLILHIILHIFSLSWWSIIPLICIPF
                     QYVLRKKQTIPLSQSLALLPLCVIVYFLPVKVVNGYIPQILSIIISFLVHIPLSHDPQ
                     YRHVSIVITCIISNFLRGTSLLPILVIIPLWYISLPTNNDMQLFSIGGSSGMMRINIP
                     LKVLFTRGLQQTIGHPKSRKLFYYFLINLAFMFVEVAYGWWSGSLGLISDGFHMLFDC
                     VALAMGLVATVIARWAPDRLFTYGYGRSETLSGFVNALFLVYIAFFVLLESIHRLIHP
                     SDIKVDALLMVSFLGLLVNIIGVFAFRDTDEDIEISNCNCPIHLNQPKKKKAKDNNME
                     GIFLHVLSDTLGSVGVIISSYLVEYFGWVISDPICSLCLSAMIFCSVLPLLKNSASML
                     LQSVPKGYDDDLIKSKLNQIAGVKDVIKLNLWEFSESCLVATTVISIFPEVDSTTIRS
                     AVITALKHEDFNDITVELVVQ"
     gene            complement(<28210..>29700)
                     /locus_tag="EHI_026400"
                     /old_locus_tag="30.t00043"
                     /db_xref="Pathema:EHI_026400"
     mRNA            complement(<28210..>29700)
                     /locus_tag="EHI_026400"
                     /old_locus_tag="30.t00043"
                     /product="hypothetical protein"
                     /note="transcript EHI_026400A"
                     /db_xref="Pathema:EHI_026400"
     CDS             complement(28210..29700)
                     /locus_tag="EHI_026400"
                     /old_locus_tag="30.t00043"
                     /note="encoded by transcript EHI_026400A"
                     /codon_start=1
                     /product="hypothetical protein"
                     /protein_id="EAL49992.1"
                     /db_xref="Pathema:EHI_026400"
                     /translation="MKKGQNKCVMEVQINYLKNVPSDDGDFLLKWSFSNMKGVIENLK
                     CSNRTITGTENDIIEVLCNEVKLYGTKITKQNLKFMLIQNITSQKKKKEINFGTGFID
                     LSPFTTIRIKREISIKIKAEKSDFSFECHLTIWNKDTLTDITYANNSDEKKVKMVGFK
                     QIESEEEEENIIPKKIDNSLEIPRTLEDMVNDIDEETDEQLMVVTYPPSTGPIDLQEI
                     FDSLKNMKGDFDSIDNFIELLKKWWSDNDAHIELNIIPISMEDWIDCVWLIKTLETFK
                     VIKFGFEEENNIESQCKLQIEKALKDTKKRLTKLVQERVEGMLKNLILSTAFDSTKSN
                     FEEGIATAYVRFISSVYESVCKISSTYANSFIRQLFHFSIYSIFEGIVDSHNVDGSKG
                     FQLNYFGVCIQNEMDQVTVLRKYREEFIPIIEVSRLLTMPLDVDLMKLKEEVFPTVKY
                     NLLLKILQEFKPGNSNPNPIPKSVFKFLSKHLEQEPIPSKYDLIEN"
     gene            <29965..30390
                     /locus_tag="EHI_026410"
                     /old_locus_tag="30.t00042"
                     /db_xref="Pathema:EHI_026410"
     mRNA            join(<29965..30267,30320..30390)
                     /locus_tag="EHI_026410"
                     /old_locus_tag="30.t00042"
                     /product="40S ribosomal protein S20, putative"
                     /note="transcript EHI_026410A"
                     /db_xref="Pathema:EHI_026410"
     CDS             join(29965..30267,30320..30373)
                     /locus_tag="EHI_026410"
                     /old_locus_tag="30.t00042"
                     /note="encoded by transcript EHI_026410A;
                     GO_component: GO:0005622 - intracellular;
                     GO_component: GO:0005840 - ribosome;
                     GO_function: GO:0003735 - structural constituent of
                     ribosome;
                     GO_process: GO:0006412 - translation"
                     /codon_start=1
                     /product="40S ribosomal protein S20, putative"
                     /protein_id="EAL49991.1"
                     /db_xref="Pathema:EHI_026410"
                     /translation="MANIKKDIKAPVTPKVYKNITITITSTKVKAVESLCAEVKENGK
                     KKGVQVKGPVRIPTKTLRITTRKTPCGEGSKTWDHYQMRIYKRVLSMKTTPETVKEIT
                     SLKVEPGVELEVAMFD"
     gene            <30559..>31206
                     /locus_tag="EHI_026420"
                     /old_locus_tag="30.t00041"
                     /db_xref="Pathema:EHI_026420"
     mRNA            join(<30559..30837,30898..>31206)
                     /locus_tag="EHI_026420"
                     /old_locus_tag="30.t00041"
                     /product="Rab family GTPase"
                     /note="transcript EHI_026420A"
                     /db_xref="Pathema:EHI_026420"
     CDS             join(30559..30837,30898..31206)
                     /locus_tag="EHI_026420"
                     /old_locus_tag="30.t00041"
                     /note="encoded by transcript EHI_026420A;
                     GO_component: GO:0005622 - intracellular;
                     GO_function: GO:0004767 - sphingomyelin phosphodiesterase
                     activity;
                     GO_function: GO:0005525 - GTP binding;
                     GO_process: GO:0007264 - small GTPase mediated signal
                     transduction"
                     /codon_start=1
                     /product="Rab family GTPase"
                     /protein_id="EAL49990.1"
                     /db_xref="Pathema:EHI_026420"
                     /translation="MSEGNTYQFKIVLLGDSSVGKSSIVLRVCKDEYKEFQENTIGAA
                     FLTKTLIVDGETIKFEIWDTAGQERYHSLTPMYYRGSNAALVVYDITSDSSFIQAKKW
                     IDELRGSGNEAIIFLVGNKCDLDNSRVITKEEAEGYARSLSIDYIETSAKANINVNEL
                     FDQIARKLPRNEKGLIDPDEVVISNNKNENKKGCC"
     gene            complement(<31392..>31967)
                     /locus_tag="EHI_026430"
                     /old_locus_tag="30.t00040"
                     /db_xref="Pathema:EHI_026430"
     mRNA            complement(join(<31392..31528,31577..31850,31902..>31967))
                     /locus_tag="EHI_026430"
                     /old_locus_tag="30.t00040"
                     /product="hypothetical protein"
                     /note="transcript EHI_026430A"
                     /db_xref="Pathema:EHI_026430"
     CDS             complement(join(31392..31528,31577..31850,31902..31967))
                     /locus_tag="EHI_026430"
                     /old_locus_tag="30.t00040"
                     /note="encoded by transcript EHI_026430A"
                     /codon_start=1
                     /product="hypothetical protein"
                     /protein_id="EAL49989.2"
                     /db_xref="Pathema:EHI_026430"
                     /translation="MSATSVKKLCRDLGIKRWPHRKLQRIEGEIKKIDESMKDPSKTS
                     FERNQYHERYLELIQLKQQVYDDPNIPLSNPPKKKYYCKSTPNPKPFHQIKFQLNGKT
                     IPISCSAPLSSIVFGPDYLGVIISQQPNITPPDCPIPEAESYEISCLPSEDPLQQS"
     gene            <32437..>33390
                     /locus_tag="EHI_026440"
                     /old_locus_tag="30.t00039"
                     /db_xref="Pathema:EHI_026440"
     mRNA            join(<32437..32625,32860..>33390)
                     /locus_tag="EHI_026440"
                     /old_locus_tag="30.t00039"
                     /product="RNA recognition motif domain containing protein"
                     /note="transcript EHI_026440A"
                     /db_xref="Pathema:EHI_026440"
     CDS             join(32437..32625,32860..33390)
                     /locus_tag="EHI_026440"
                     /old_locus_tag="30.t00039"
                     /note="encoded by transcript EHI_026440A;
                     GO_function: GO:0003676 - nucleic acid binding"
                     /codon_start=1
                     /product="RNA recognition motif domain containing protein"
                     /protein_id="EAL49988.1"
                     /db_xref="Pathema:EHI_026440"
                     /translation="MERRRYGNRSFSNSRRYRNNDQRTNGDSMPPRRTKNDKEVSAPQ
                     YVKVRVTNLGPKVTEEDINKLCSMNKVEPLKVFLKSQQDGNNVATVLFKTEEDANKII
                     NAYKNVEFDGKLMNFEIISTKSQQGYHNDRRRRFHDGRNRQRQFGGMRRGFRNSLIDN
                     VTREIIRRERMYEQSLYGNRGRFDGRRGLNHIGRRHMNHNNRRNDNRIKRNTNERRQP
                     RMSYEKRLENMNSKLEAYMKS"
     gene            <34332..>35717
                     /locus_tag="EHI_026450"
                     /old_locus_tag="30.t00038"
                     /db_xref="Pathema:EHI_026450"
     mRNA            <34332..>35717
                     /locus_tag="EHI_026450"
                     /old_locus_tag="30.t00038"
                     /product="hypothetical protein"
                     /note="transcript EHI_026450A"
                     /db_xref="Pathema:EHI_026450"
     CDS             34332..35717
                     /locus_tag="EHI_026450"
                     /old_locus_tag="30.t00038"
                     /note="encoded by transcript EHI_026450A"
                     /codon_start=1
                     /product="hypothetical protein"
                     /protein_id="EAL49987.1"
                     /db_xref="Pathema:EHI_026450"
                     /translation="MDRCDHGPNVRCLKCMARDAQKAAELKKKDLNKTAQNPSNSTKL
                     SSSSSQQGEKVYTVGGGVKKNASTHFSSGVYRLGDGGPIKPATQTAKGKPVKWLCNHP
                     PGQKCSNCLCPKGAANVKRQCNHPPTMKCPNCIAPEEVKPNQPQQPRIYFPATCPNHG
                     PHGCCTLCLAKWDYEKVRIQKQEAVCKLCRMNFMETDNFQRYVFQRSFYVNRIGILYG
                     TFKQDRVQVEAIYEPPQVINEEGDFEMKQEQTLLQVQQMAVELGLERVGIIFSHARRE
                     EILTSREIISAAQRQLDWDKRCVTVVVTPNETGSESKVECYQASEQLMELVKKAIVQP
                     SQPKNNEINLKESVYLSQKEIMTVDPIVFVCNVPIRAFKAKTMFLSSKYPIENRPQED
                     VTLLQFKKYFESVKTLPIYQQISDFHLLVFCLDYGVFSSLHSVKECIVNKIEKHDIKE
                     DIKQWLEMPLD"
     gene            complement(<35805..>36386)
                     /locus_tag="EHI_026460"
                     /old_locus_tag="30.t00037"
                     /db_xref="Pathema:EHI_026460"
     mRNA            complement(<35805..>36386)
                     /locus_tag="EHI_026460"
                     /old_locus_tag="30.t00037"
                     /product="hypothetical protein"
                     /note="transcript EHI_026460A"
                     /db_xref="Pathema:EHI_026460"
     CDS             complement(35805..36386)
                     /locus_tag="EHI_026460"
                     /old_locus_tag="30.t00037"
                     /note="encoded by transcript EHI_026460A"
                     /codon_start=1
                     /product="hypothetical protein"
                     /protein_id="EAL49986.1"
                     /db_xref="Pathema:EHI_026460"
                     /translation="MQNKEIERLYLLIEYIQYPIKVVCSKEYVERKKKEHIEFLQNYT
                     LKVNEPWFKEITELPWYNNHKLLNQVTSLIKQGKLSPICEMVESDDDNEICFSCLCQP
                     KNNVIGLNWIHCSQATSNHLICTPCLLNTLSSNGFKISLNNLTCECQICKKVSPLICH
                     EPSDETILKDVPQEELQTKIVYGRRGKELNSNL"
     gene            complement(<38456..>39583)
                     /locus_tag="EHI_026470"
                     /old_locus_tag="30.t00036"
                     /db_xref="Pathema:EHI_026470"
     mRNA            complement(<38456..>39583)
                     /locus_tag="EHI_026470"
                     /old_locus_tag="30.t00036"
                     /product="hypothetical protein"
                     /note="transcript EHI_026470A"
                     /db_xref="Pathema:EHI_026470"
     CDS             complement(38456..39583)
                     /locus_tag="EHI_026470"
                     /old_locus_tag="30.t00036"
                     /note="encoded by transcript EHI_026470A;
                     Weak similarity to: PF00018: SH3 domain"
                     /codon_start=1
                     /product="hypothetical protein"
                     /protein_id="EAL49985.2"
                     /db_xref="Pathema:EHI_026470"
                     /translation="MSSISRSFFTIKSVLGVNKKTIDNEYETMKKKLSDMSNEFQKVI
                     TYVEELPKTVSNISGNHLNILNSLHLCVQISEGEEAKMEQISDTISIFQKMERDAARY
                     QGLMNELATPLRAYGQQFKELLGRCKVAEKRKEDMEFYNERLMEITKKPVNRQKGLAD
                     AQTDFTYAKEKYEWLKQELIEDTNKLCKDFQGVVLPVVRALMVNFTEVMNGMNGIWEE
                     VPKKVENLPSNGINLEYVIKAPGDSMEKETNVQQRRIQLYNSPMINQTIMSQPYIQQQ
                     PTFNQPPQNPMPNPYIPPQQTYQVPYGNSTQQPTPISQQPNTNNNNMCRANYDYSAQE
                     TNELTIKAGDVIKILSKEGDWWIGELNGQTGQFPSNYVTLL"
     gene            complement(<40545..>41324)
                     /locus_tag="EHI_026480"
                     /old_locus_tag="10.t00015"
                     /db_xref="Pathema:EHI_026480"
     mRNA            complement(<40545..>41324)
                     /locus_tag="EHI_026480"
                     /old_locus_tag="10.t00015"
                     /product="(2r)-phospho-3-sulfolactate synthase, putative"
                     /note="transcript EHI_026480A"
                     /db_xref="Pathema:EHI_026480"
     CDS             complement(40545..41324)
                     /locus_tag="EHI_026480"
                     /old_locus_tag="10.t00015"
                     /note="encoded by transcript EHI_026480A;
                     GO_process: GO:0019295 - coenzyme M biosynthetic process"
                     /codon_start=1
                     /product="(2r)-phospho-3-sulfolactate synthase, putative"
                     /protein_id="EAL51236.1"
                     /db_xref="Pathema:EHI_026480"
                     /translation="MTEMMKMIDFLPPRTVKPRNKGYTMVMDKGLGNHATEDLCMTAA
                     PYIDFLKLGFGTLIFTGGLREKLAIYKKYGVEMYVGGTFLEAFIARNKMADFHKIMKE
                     FGIKMVEVSDGSYEMGQKRKLEIIKECTEHGYFVISEVGNKCKNREYTREEWITSMKA
                     ELAAGSKVVIVEARESGTTGIYNKDGSVNKEMVDYLISEVDPSKIMWEAPLKSQQAWL
                     ISTFGINVNLGNIAPADIVALEALRNGLRGDTFIQVLEGRY"
     gene            <41988..>42530
                     /locus_tag="EHI_026490"
                     /db_xref="Pathema:EHI_026490"
     mRNA            <41988..>42530
                     /locus_tag="EHI_026490"
                     /product="hypothetical protein"
                     /note="transcript EHI_026490A"
                     /db_xref="Pathema:EHI_026490"
     CDS             41988..42530
                     /locus_tag="EHI_026490"
                     /note="encoded by transcript EHI_026490A"
                     /codon_start=1
                     /product="hypothetical protein"
                     /protein_id="EDS89347.1"
                     /db_xref="Pathema:EHI_026490"
                     /translation="MRKTIPVVIWVLILLIENCVAAVITDFNSIEKQPRKFKGKIFAI
                     IESDEDMNIAIEHKDRIDQVIGKGFSAESFPSGSPKIEGEWVYKKNFTHNIGHIMFGN
                     FASIVNWTFEMTEAVIETINKYGLDGVCMEDLENVYFITGRSTRDVRLILRRLGIELH
                     KIQKQVFAIIPVCLINTLRI"
CONTIG      join(AAFB02001038.1:1..3226,gap(100),AAFB02001013.1:1..3335,
            gap(100),AAFB02000145.1:1..35880)
//