LOCUS DS571286 42641 bp DNA linear CON 17-APR-2008
DEFINITION Entamoeba histolytica HM-1:IMSS scf_1104750516671 genomic scaffold,
whole genome shotgun sequence.
ACCESSION DS571286 AAFB02000000
VERSION DS571286.1
DBLINK BioProject: PRJNA142
BioSample: SAMN02953605
KEYWORDS WGS.
SOURCE Entamoeba histolytica HM-1:IMSS
ORGANISM Entamoeba histolytica HM-1:IMSS
Eukaryota; Amoebozoa; Evosea; Archamoebae; Mastigamoebida;
Entamoebidae; Entamoeba.
REFERENCE 1 (bases 1 to 42641)
AUTHORS Loftus,B., Anderson,I., Davies,R., Alsmark,U.C., Samuelson,J.,
Amedeo,P., Roncaglia,P., Berriman,M., Hirt,R.P., Mann,B.J.,
Nozaki,T., Suh,B., Pop,M., Duchene,M., Ackers,J., Tannich,E.,
Leippe,M., Hofer,M., Bruchhaus,I., Willhoeft,U., Bhattacharya,A.,
Chillingworth,T., Churcher,C., Hance,Z., Harris,B., Harris,D.,
Jagels,K., Moule,S., Mungall,K., Ormond,D., Squares,R.,
Whitehead,S., Quail,M.A., Rabbinowitsch,E., Norbertczak,H.,
Price,C., Wang,Z., Guillen,N., Gilchrist,C., Stroup,S.E.,
Bhattacharya,S., Lohia,A., Foster,P.G., Sicheritz-Ponten,T.,
Weber,C., Singh,U., Mukherjee,C., El-Sayed,N.M., Petri,W.A. Jr.,
Clark,C.G., Embley,T.M., Barrell,B., Fraser,C.M. and Hall,N.
TITLE The genome of the protist parasite Entamoeba histolytica
JOURNAL Nature 433 (7028), 865-868 (2005)
PUBMED 15729342
REFERENCE 2 (bases 1 to 42641)
AUTHORS Lorenzi,H., Amedeo,P., Inman,J., Schobel,S. and Caler,E.
TITLE Direct Submission
JOURNAL Submitted (01-MAR-2007) The Institute for Genomic Research, 9712
Medical Center Drive, Rockville, MD 20850, USA
COMMENT This version of the project, JCVI-ESG2-1.0, represents 8x coverage
of the genome.
FEATURES Location/Qualifiers
source 1..42641
/organism="Entamoeba histolytica HM-1:IMSS"
/mol_type="genomic DNA"
/strain="HM-1:IMSS"
/db_xref="taxon:294381"
repeat_region complement(1..2261)
/rpt_family="LINE1"
gap 3227..3326
/estimated_length=100
gene complement(<4994..>6469)
/locus_tag="EHI_026200"
/old_locus_tag="241.t00004"
/db_xref="Pathema:EHI_026200"
mRNA complement(<4994..>6469)
/locus_tag="EHI_026200"
/old_locus_tag="241.t00004"
/product="hypothetical protein"
/note="transcript EHI_026200A"
/db_xref="Pathema:EHI_026200"
CDS complement(4994..6469)
/locus_tag="EHI_026200"
/old_locus_tag="241.t00004"
/note="encoded by transcript EHI_026200A"
/codon_start=1
/product="hypothetical protein"
/protein_id="EAL44788.2"
/db_xref="Pathema:EHI_026200"
/translation="MEKIEDCIVEFIWNYSPVSLVNIGKMKLLKRCKIDIGRQKFDIN
SVFSNKQQHLKILRLSNIGNYKEIEEFKEYKNIERVIIEIDDDTKEEYIEQMSKYAVL
VSDQWYSQLNKNVIVMMDKKFHLQIKEKPNVETLEFIQQNYLPYKMIIDADYYDGIQT
QFKLFDNVMKLTLNVEIDPQEEVDQDDIMQRRMDRINGIERSDDDDFVEETEEQKEER
ERLHKLEIERRKHSIILPQHLTSITINDMTPYFHQTLSITLKELTTSNIPIDFIYQLT
SLTKINISNTNITQSLKSLEKLIDITFNLCVDECSEFICPHSVECLKLYNCRNWKFQE
LSHLKLLDKLMIYDARPNVLSTLQLNEATSVKKLYLNNVITASMPTSLTCLIIGSAGN
RAIDMTKYLQLKDVCIENSNQVRVKLPLSIKSLYLYCSSIRIFNKNDIQLKELHLEDC
EDINFESFNLNHVTKLSLLPFDEEYLEYLEQFPVLEEKNFN"
gap 6662..6761
/estimated_length=100
repeat_region 8370..10842
/rpt_family="LINE1"
gene complement(<11337..>12785)
/locus_tag="EHI_026310"
/old_locus_tag="201.t00003"
/db_xref="Pathema:EHI_026310"
mRNA complement(<11337..>12785)
/locus_tag="EHI_026310"
/old_locus_tag="201.t00003"
/product="hypothetical protein"
/note="transcript EHI_026310A"
/db_xref="Pathema:EHI_026310"
CDS complement(11337..12785)
/locus_tag="EHI_026310"
/old_locus_tag="201.t00003"
/note="encoded by transcript EHI_026310A"
/codon_start=1
/product="hypothetical protein"
/protein_id="EAL45353.1"
/db_xref="Pathema:EHI_026310"
/translation="MLGGFGAFSSNNPSSNNGSQQFNTMGSTGNSIPNMGTNSFGGNG
LGTNTMGGNTFGTNPLGGNGLSTNAFGGNTFGTNSLGGNGLSTNTMGGNGLGTNTFGG
NGLGTNTFGGNGLGTNMIGGNGLGTNSLGGNGLGTNTMGGNTFGTNSLGGNTFGTNSL
GGNGLGTNVMGGNGLGTNMMGGNTFGTNGQGTNTGIGTPTPQDFTKSRFPTESIKNRE
SIQIIPESNKIKREKKKQEVTTPTIINETNENKSKLDDVFDLSRKNTTNEQPLFLRRF
NQTFNSPYRRNGMVPLIRPSYINNSTQRQSIYSCNPIGTLNPSYNCNINNSIVTSIPG
NISRNSILPNTTINNQTSILFNNNQQSVLYGLNQGNNSILSNSPIVQNIKEYAIILSN
LTIQDTPLIINVLSQFGVIVNVIEWKNGVKVIFADETVVNYLIDMKKIMIAGKMCYIS
DPNESFLLKLFDGQTWKSLFSNLFNFLHSIWN"
gene <12998..>13654
/locus_tag="EHI_026320"
/old_locus_tag="201.t00004"
/db_xref="Pathema:EHI_026320"
mRNA <12998..>13654
/locus_tag="EHI_026320"
/old_locus_tag="201.t00004"
/product="hypothetical protein, conserved"
/note="transcript EHI_026320A"
/db_xref="Pathema:EHI_026320"
CDS 12998..13654
/locus_tag="EHI_026320"
/old_locus_tag="201.t00004"
/note="encoded by transcript EHI_026320A"
/codon_start=1
/product="hypothetical protein, conserved"
/protein_id="EAL45354.1"
/db_xref="Pathema:EHI_026320"
/translation="MGCDGGVVARRDDLVKDKKKETKKCNTEDRYRYCSLTHKLFKKR
VVCDVVGRLYNKDGLLKALINHEMPEELRYIHSKKDFIELNIEWSNGIIVCPLKKVEF
SPGHQFVALKCGCVISKLALDEIKSINGNKCPLCETEGLEFIPLNLPLEEMEKQMELH
CKLFDQKQNKTKFIQKEENKIALVTQPIANTIADQAKVNVNKQDDDEIYKSLFKSSQN
"
gene complement(<13965..>15551)
/locus_tag="EHI_026330"
/old_locus_tag="30.t00050"
/db_xref="Pathema:EHI_026330"
mRNA complement(<13965..>15551)
/locus_tag="EHI_026330"
/old_locus_tag="30.t00050"
/product="pumilio family RNA-binding protein"
/note="transcript EHI_026330A"
/db_xref="Pathema:EHI_026330"
CDS complement(13965..15551)
/locus_tag="EHI_026330"
/old_locus_tag="30.t00050"
/note="encoded by transcript EHI_026330A;
GO_component: GO:0005622 - intracellular;
GO_function: GO:0003723 - RNA binding;
GO_function: GO:0005096 - GTPase activator activity;
GO_process: GO:0008152 - metabolic process;
GO_process: GO:0051056 - regulation of small GTPase
mediated signal transduction"
/codon_start=1
/product="pumilio family RNA-binding protein"
/protein_id="EAL49999.2"
/db_xref="Pathema:EHI_026330"
/translation="MTNTSKDIVQQLLFNESRSTSAPPQMDRIGSSGEVISLEDLEKQ
AYRAHPEYHQYYFQQKPADPRLPKPLFEENLPKGYESVLKKAFKTTPFNLDKILEGLS
GPNLRNELRIENEESYEEEDDDDNSEEDNSEEDNTNESSEEGNSEEDSEEESESSEES
SEEEESESYEEDNQMNRYSRYQQQYQPNYQYNGNSYPINFGYIYPINDNVTLDYVSMS
KEHNGSRTVQQSIEKGSEDERQKIWRTLQEHVVELSSDLFANYVIQKAIEFIPESRHI
VPQKMKGNVLRLTLHMYGCRVVQKAVEYASMKDRRLLFEELRKSLVRCIEDQNGNHVI
QKCVEKGDRQMVMDIVNALQGIVLECCKHPYGCRVVQRVIESVDYDCVTELLQVIEPH
SLDLTEDQYGNYVVQNVLERGYPNDRHNILQQIKGNIVRLSMGKYSSNVIEKCFKFAT
QNERQQILEEIYQNNGILQMMQDQFANYVVQKIIEAIDSSEREKIVELFIKPNLTILK
KVTYTKHILNLLETLDDIHL"
gene <16004..>16387
/locus_tag="EHI_026340"
/old_locus_tag="30.t00049"
/db_xref="Pathema:EHI_026340"
mRNA <16004..>16387
/locus_tag="EHI_026340"
/old_locus_tag="30.t00049"
/product="thioredoxin, putative"
/note="transcript EHI_026340A"
/db_xref="Pathema:EHI_026340"
CDS 16004..16387
/locus_tag="EHI_026340"
/old_locus_tag="30.t00049"
/note="encoded by transcript EHI_026340A;
GO_function: GO:0003756 - protein disulfide isomerase
activity;
GO_function: GO:0016209 - antioxidant activity;
GO_function: GO:0016491 - oxidoreductase activity"
/codon_start=1
/product="thioredoxin, putative"
/protein_id="EAL49998.1"
/db_xref="Pathema:EHI_026340"
/translation="MRTFFALLLIALVSANSEGLVSLNPDNFKTYQNSGKTLLVKFFA
PWCGHCKRLAPTYEEVAQAFTENEDVIIAEVNCDDYRELCQEHGIRGFPTVLVFNGEE
SKKFQEQRTVEELKKFVLENVPAKN"
gene <16476..>17954
/locus_tag="EHI_026350"
/old_locus_tag="30.t00048"
/db_xref="Pathema:EHI_026350"
mRNA <16476..>17954
/locus_tag="EHI_026350"
/old_locus_tag="30.t00048"
/product="Rho guanine nucleotide exchange factor,
putative"
/note="transcript EHI_026350A"
/db_xref="Pathema:EHI_026350"
CDS 16476..17954
/locus_tag="EHI_026350"
/old_locus_tag="30.t00048"
/note="encoded by transcript EHI_026350A;
Contains PF01363 : FYVE zinc finger PF00621 : RhoGEF
domain PF00169 : PH domain;
GO_component: GO:0005622 - intracellular;
GO_function: GO:0005089 - Rho guanyl-nucleotide exchange
factor activity;
GO_function: GO:0008270 - zinc ion binding;
GO_process: GO:0035023 - regulation of Rho protein signal
transduction"
/codon_start=1
/product="Rho guanine nucleotide exchange factor,
putative"
/protein_id="EAL49997.1"
/db_xref="Pathema:EHI_026350"
/translation="METISPQSYPSFPRMHEGKCRVKGCNCNRFEGMTDLPDERCSNC
FHSIEAHTLPVELFNNIKCDKPTILTTPREVYRKKIAMELLTTERTYVRMLMTCLRCY
ADPLQSCEPPLLPPTLYKSIFLFYRDIVRVNLVFLQSLEDLVEKNQLVSGLSSVFLGT
LPYLRVYRMFVGNNSVGLQAVEQAEHMKDVVKLLHHCSKYGYEGETVQPLRSYLILPI
QRIPRYNLLLSDFLKHTDRNDPLFEETTALVGSLKSLAKEINDEVKLQDNRRKLLAIK
KKFCEGPYHLTLVEAHRYIMREGILFKLSKTKPKKRYFYLFNDILVYGRMQLQLFYPN
LYLRLNSVHIEDGLQPNTFNLLSPFKSFTVICSSIEERNTWANDLKSAIQKESDKKFS
KNIDTVGFDAPLYQPFNEATLCFICKRKFGIFCFKYHCERCGFVVCDSCSKNRKIVPP
NPVPQRICNFCVRSADRNIEVFKGLRKRSKQERARLALALLE"
gene <18552..>19628
/locus_tag="EHI_026360"
/old_locus_tag="30.t00047"
/db_xref="Pathema:EHI_026360"
mRNA <18552..>19628
/locus_tag="EHI_026360"
/old_locus_tag="30.t00047"
/product="phosphoserine aminotransferase, putative"
/note="transcript EHI_026360A"
/db_xref="Pathema:EHI_026360"
CDS 18552..19628
/locus_tag="EHI_026360"
/old_locus_tag="30.t00047"
/note="encoded by transcript EHI_026360A;
GO_function: GO:0004648 - phosphoserine transaminase
activity;
GO_function: GO:0008483 - transaminase activity;
GO_process: GO:0008152 - metabolic process"
/codon_start=1
/product="phosphoserine aminotransferase, putative"
/protein_id="EAL49996.1"
/db_xref="Pathema:EHI_026360"
/translation="MERQNIHNFGAGPAAMAKEVIEATAKAVNNFWEGLSILEISHRS
KEWINVMNETKALMKEVMDIPEGYEILFFGGGASLQFLMVAMNLLNKKACYLDTGVWA
SKAIKEAENIGEVKIIGTSKDKNYTYIPEYQIPSDYDYFHITTNNTIYGTEIRKDIES
PIPLVADMSSDILSKPIDISKYSLIYAGAQKNCGAAGVTIVIIKKEILGKVQRKIPII
LDYQVHILNNSMYNTPPVISIFTVNQTLKYIKKIGGLKKIQELNEEKARLLYAEIDRN
KIFRGTVRKKDRSIMNVCFVMEEQYKQLENEFSEYALQKGIIGIKGHRSVGGFRASIY
NAVTIESVQALIKCMHDFEQLHTH"
gene complement(<19718..>21817)
/locus_tag="EHI_026370"
/old_locus_tag="30.t00046"
/db_xref="Pathema:EHI_026370"
mRNA complement(<19718..>21817)
/locus_tag="EHI_026370"
/old_locus_tag="30.t00046"
/product="ENTH domain protein, putative"
/note="transcript EHI_026370A"
/db_xref="Pathema:EHI_026370"
CDS complement(19718..21817)
/locus_tag="EHI_026370"
/old_locus_tag="30.t00046"
/note="encoded by transcript EHI_026370A;
GO_function: GO:0005543 - phospholipid binding"
/codon_start=1
/product="ENTH domain protein, putative"
/protein_id="EAL49995.1"
/db_xref="Pathema:EHI_026370"
/translation="MQFVDYKVKLATRKACNTSNCPPKPKHIRTIVVKSFSGGVPSFY
SELTKWILSFNPLQQYKSLVTLHRVLRDGSSQLLGGYLDAFLPTINRLVNTPQQLNAY
YAFQQIIKHYAKYIQIRFVFHQKHRIFTGSLLVPHELPEEYYSDQKTLSVLSYMMDLM
DYLLVIPLPIIQNYIGDNCKMDCTIPLILDSYSLVKDITFFLTNLAHIEQNQSVFTFL
YDRFTKTYSKLNQLYSAAKNNGYIVSLIEVPNLPPLPTFNVNDEERKLYLKKHPHSIT
KNNHLQKTFLHQNNNNTKEILELGNHFSQQLSKLFDLLIPPQLSSEDPESKLETMASC
LMQELQNPSNLDDIKIHIWKTLIGTKYLLQQRNLDYVDANNNGEKVINELYDLQSIAD
KIKVSFQMNEGYEELQKYIEEFVSILSSSSANTSETTPTNQDNDLVLFDYIGDSSHDK
VIQTSQDDFIDEQSFNSFIPPNLQNQENSSNEEEDFSIVLNQINDQINKIEDVRDALK
NCNTNGNETIKRFGDSTQGLIDFIQIAGECEKERIREGKEKNNQTYSNNEVWSEGLLS
CAKKIVEWAQYISSALMNGEPDERILAGLKQFKSHCSQLLTAARVSMEDQSPLLQRLE
KSLCSLMSQIQKIIQNILSREQEQRQEIKEQNKTQDNGIESKKELMESQVRVLQLQKE
LEKAQNHLYSLRKEEYN"
gene <22021..>26211
/locus_tag="EHI_026380"
/old_locus_tag="30.t00045"
/db_xref="Pathema:EHI_026380"
mRNA <22021..>26211
/locus_tag="EHI_026380"
/old_locus_tag="30.t00045"
/product="Sec7 domain protein"
/note="transcript EHI_026380A"
/db_xref="Pathema:EHI_026380"
CDS 22021..26211
/locus_tag="EHI_026380"
/old_locus_tag="30.t00045"
/note="encoded by transcript EHI_026380A;
GO_component: GO:0005622 - intracellular;
GO_function: GO:0005086 - ARF guanyl-nucleotide exchange
factor activity;
GO_process: GO:0032012 - regulation of ARF protein signal
transduction"
/codon_start=1
/product="Sec7 domain protein"
/protein_id="EAL49994.1"
/db_xref="Pathema:EHI_026380"
/translation="MSQKNTPSPLPDPSSKLSLLVETLESIHYRSKDDIVYQASKVFL
ESTSSLEDPLLVLSPLNQNLFVQLLDAIFKSKDRNKLLSIFVPLITPDLMTSETLSLV
CSSMLSILPFSSTGKDSLLPIVLTSFTNLSRCRLHDEVYSLLISSLFDLHVILLPNAP
EAQRVKDLIQTFIDVSPQTPMYSNGVPPVVTLLTTSAKYSTDDWCLPDAVHVKSDNKY
MTSVNFSSRIRSDIEKHREEKMKFVKTLSNENQKYFNSRAHAHAVKSILLIFTIADHH
ILQQYDDWKKPLIDCLIANGFTTEPQKYIPTLKIFIEVMSSPTLHVKGLSVIFERLYL
FILNSSLSTPQQKQLTLEMLVSLTEKQECIISMFQLYDCSIAAPNVIRSLVKTLSDVV
YGKIKSMEKFVSKQFDTDNRMRALKCILNIIDNISTIQINYSPLPSTIEQRMERKVLL
ENGFPLFANNPKDGVEYFISNKFCENSSRSIADFLLSTQGLDKRRVTEYISNLGNDGN
DALNNLIKEIDFSGERFDDALQRMFWMFCAPREVQLVDNIIERFSVRYAECNAALNMT
PEQIYLLATSVMCVALDTKTKRITFKEFSEMLGNAGNIDIKGLFQRATSGSFALAECL
TGIGPNTVNDLEVKERVLRTLSGIDANMIRIYQTKEEGKLENSIDVIKAFIKSTLISC
TDICRYLFFNEETGDFVENSLRGMQKLIHITAYCGMAECDDLTSDISLWTMLLSPEEM
SPKHVLAIRYIINICKEEGPLLKNAWLSCLKVISHLDNLGLMPKPYGDVSEIKVMPKP
QHPIYYPEYLGIFTFVNNDLRVANKKFDQKTLTTLKQLLQKHLSVINDIFIKEAVAPN
ENFLCFLNSLKTVIMTEINTLSPQYFLFNILIQILLMIVGREQNVINQALIIACDIYV
KAGLHPHHILAKQAVKALGLLQSKFPQNDIILNSLMIVMADSAVPPVRDAIIETIESI
LDDYKPSQKMNWKAIINILNLAAVDSSPNVIIRGFSSFRLLTIKTFDDETQYLITKGL
QLYSKKCSNEKMARDLVALANSYLQEKKQLTEVMYIWGGIIGSKYVECAVEAMKYLLI
QLENNNSEMTWNVVYTQIVPLVYSNIEKKDKEWITTVGMTFALNLSSFIANKKVPIRY
IEVVLMICHMFCCSPLQFGISVSGLLVQDIVEVVSHHDNCYDGFKLIMELVHSHIAAV
VLKKVNLRVKTPKGNKEMIGVIKCSTCNKEFSSHLSFLCPYCKEHYYCSLECQKKKET
KHLPQPIINHYETFQPTDNKTLLTCDLKIFIVLKEMVHDIASHEKSDEMLQSLQSVID
EYSSVYSDIEKTTYMECFGLAVDAAVDCFVSLAIESSQFTMINLLFKMTDKIISIVCD
KLLQEHTTIVCFISFFFN"
gene complement(<26429..>27844)
/locus_tag="EHI_026390"
/old_locus_tag="30.t00044"
/db_xref="Pathema:EHI_026390"
mRNA complement(<26429..>27844)
/locus_tag="EHI_026390"
/old_locus_tag="30.t00044"
/product="cation transporter, putative"
/note="transcript EHI_026390A"
/db_xref="Pathema:EHI_026390"
CDS complement(26429..27844)
/locus_tag="EHI_026390"
/old_locus_tag="30.t00044"
/note="encoded by transcript EHI_026390A;
weak similarity to: TIGR01297: cation diffusion
facilitator family transporter;
GO_component: GO:0016020 - membrane;
GO_function: GO:0008324 - cation transmembrane transporter
activity;
GO_process: GO:0006812 - cation transport"
/codon_start=1
/product="cation transporter, putative"
/protein_id="EAL49993.2"
/db_xref="Pathema:EHI_026390"
/translation="MVHPSTSLATLLPISSPTVLILHIILHIFSLSWWSIIPLICIPF
QYVLRKKQTIPLSQSLALLPLCVIVYFLPVKVVNGYIPQILSIIISFLVHIPLSHDPQ
YRHVSIVITCIISNFLRGTSLLPILVIIPLWYISLPTNNDMQLFSIGGSSGMMRINIP
LKVLFTRGLQQTIGHPKSRKLFYYFLINLAFMFVEVAYGWWSGSLGLISDGFHMLFDC
VALAMGLVATVIARWAPDRLFTYGYGRSETLSGFVNALFLVYIAFFVLLESIHRLIHP
SDIKVDALLMVSFLGLLVNIIGVFAFRDTDEDIEISNCNCPIHLNQPKKKKAKDNNME
GIFLHVLSDTLGSVGVIISSYLVEYFGWVISDPICSLCLSAMIFCSVLPLLKNSASML
LQSVPKGYDDDLIKSKLNQIAGVKDVIKLNLWEFSESCLVATTVISIFPEVDSTTIRS
AVITALKHEDFNDITVELVVQ"
gene complement(<28210..>29700)
/locus_tag="EHI_026400"
/old_locus_tag="30.t00043"
/db_xref="Pathema:EHI_026400"
mRNA complement(<28210..>29700)
/locus_tag="EHI_026400"
/old_locus_tag="30.t00043"
/product="hypothetical protein"
/note="transcript EHI_026400A"
/db_xref="Pathema:EHI_026400"
CDS complement(28210..29700)
/locus_tag="EHI_026400"
/old_locus_tag="30.t00043"
/note="encoded by transcript EHI_026400A"
/codon_start=1
/product="hypothetical protein"
/protein_id="EAL49992.1"
/db_xref="Pathema:EHI_026400"
/translation="MKKGQNKCVMEVQINYLKNVPSDDGDFLLKWSFSNMKGVIENLK
CSNRTITGTENDIIEVLCNEVKLYGTKITKQNLKFMLIQNITSQKKKKEINFGTGFID
LSPFTTIRIKREISIKIKAEKSDFSFECHLTIWNKDTLTDITYANNSDEKKVKMVGFK
QIESEEEEENIIPKKIDNSLEIPRTLEDMVNDIDEETDEQLMVVTYPPSTGPIDLQEI
FDSLKNMKGDFDSIDNFIELLKKWWSDNDAHIELNIIPISMEDWIDCVWLIKTLETFK
VIKFGFEEENNIESQCKLQIEKALKDTKKRLTKLVQERVEGMLKNLILSTAFDSTKSN
FEEGIATAYVRFISSVYESVCKISSTYANSFIRQLFHFSIYSIFEGIVDSHNVDGSKG
FQLNYFGVCIQNEMDQVTVLRKYREEFIPIIEVSRLLTMPLDVDLMKLKEEVFPTVKY
NLLLKILQEFKPGNSNPNPIPKSVFKFLSKHLEQEPIPSKYDLIEN"
gene <29965..30390
/locus_tag="EHI_026410"
/old_locus_tag="30.t00042"
/db_xref="Pathema:EHI_026410"
mRNA join(<29965..30267,30320..30390)
/locus_tag="EHI_026410"
/old_locus_tag="30.t00042"
/product="40S ribosomal protein S20, putative"
/note="transcript EHI_026410A"
/db_xref="Pathema:EHI_026410"
CDS join(29965..30267,30320..30373)
/locus_tag="EHI_026410"
/old_locus_tag="30.t00042"
/note="encoded by transcript EHI_026410A;
GO_component: GO:0005622 - intracellular;
GO_component: GO:0005840 - ribosome;
GO_function: GO:0003735 - structural constituent of
ribosome;
GO_process: GO:0006412 - translation"
/codon_start=1
/product="40S ribosomal protein S20, putative"
/protein_id="EAL49991.1"
/db_xref="Pathema:EHI_026410"
/translation="MANIKKDIKAPVTPKVYKNITITITSTKVKAVESLCAEVKENGK
KKGVQVKGPVRIPTKTLRITTRKTPCGEGSKTWDHYQMRIYKRVLSMKTTPETVKEIT
SLKVEPGVELEVAMFD"
gene <30559..>31206
/locus_tag="EHI_026420"
/old_locus_tag="30.t00041"
/db_xref="Pathema:EHI_026420"
mRNA join(<30559..30837,30898..>31206)
/locus_tag="EHI_026420"
/old_locus_tag="30.t00041"
/product="Rab family GTPase"
/note="transcript EHI_026420A"
/db_xref="Pathema:EHI_026420"
CDS join(30559..30837,30898..31206)
/locus_tag="EHI_026420"
/old_locus_tag="30.t00041"
/note="encoded by transcript EHI_026420A;
GO_component: GO:0005622 - intracellular;
GO_function: GO:0004767 - sphingomyelin phosphodiesterase
activity;
GO_function: GO:0005525 - GTP binding;
GO_process: GO:0007264 - small GTPase mediated signal
transduction"
/codon_start=1
/product="Rab family GTPase"
/protein_id="EAL49990.1"
/db_xref="Pathema:EHI_026420"
/translation="MSEGNTYQFKIVLLGDSSVGKSSIVLRVCKDEYKEFQENTIGAA
FLTKTLIVDGETIKFEIWDTAGQERYHSLTPMYYRGSNAALVVYDITSDSSFIQAKKW
IDELRGSGNEAIIFLVGNKCDLDNSRVITKEEAEGYARSLSIDYIETSAKANINVNEL
FDQIARKLPRNEKGLIDPDEVVISNNKNENKKGCC"
gene complement(<31392..>31967)
/locus_tag="EHI_026430"
/old_locus_tag="30.t00040"
/db_xref="Pathema:EHI_026430"
mRNA complement(join(<31392..31528,31577..31850,31902..>31967))
/locus_tag="EHI_026430"
/old_locus_tag="30.t00040"
/product="hypothetical protein"
/note="transcript EHI_026430A"
/db_xref="Pathema:EHI_026430"
CDS complement(join(31392..31528,31577..31850,31902..31967))
/locus_tag="EHI_026430"
/old_locus_tag="30.t00040"
/note="encoded by transcript EHI_026430A"
/codon_start=1
/product="hypothetical protein"
/protein_id="EAL49989.2"
/db_xref="Pathema:EHI_026430"
/translation="MSATSVKKLCRDLGIKRWPHRKLQRIEGEIKKIDESMKDPSKTS
FERNQYHERYLELIQLKQQVYDDPNIPLSNPPKKKYYCKSTPNPKPFHQIKFQLNGKT
IPISCSAPLSSIVFGPDYLGVIISQQPNITPPDCPIPEAESYEISCLPSEDPLQQS"
gene <32437..>33390
/locus_tag="EHI_026440"
/old_locus_tag="30.t00039"
/db_xref="Pathema:EHI_026440"
mRNA join(<32437..32625,32860..>33390)
/locus_tag="EHI_026440"
/old_locus_tag="30.t00039"
/product="RNA recognition motif domain containing protein"
/note="transcript EHI_026440A"
/db_xref="Pathema:EHI_026440"
CDS join(32437..32625,32860..33390)
/locus_tag="EHI_026440"
/old_locus_tag="30.t00039"
/note="encoded by transcript EHI_026440A;
GO_function: GO:0003676 - nucleic acid binding"
/codon_start=1
/product="RNA recognition motif domain containing protein"
/protein_id="EAL49988.1"
/db_xref="Pathema:EHI_026440"
/translation="MERRRYGNRSFSNSRRYRNNDQRTNGDSMPPRRTKNDKEVSAPQ
YVKVRVTNLGPKVTEEDINKLCSMNKVEPLKVFLKSQQDGNNVATVLFKTEEDANKII
NAYKNVEFDGKLMNFEIISTKSQQGYHNDRRRRFHDGRNRQRQFGGMRRGFRNSLIDN
VTREIIRRERMYEQSLYGNRGRFDGRRGLNHIGRRHMNHNNRRNDNRIKRNTNERRQP
RMSYEKRLENMNSKLEAYMKS"
gene <34332..>35717
/locus_tag="EHI_026450"
/old_locus_tag="30.t00038"
/db_xref="Pathema:EHI_026450"
mRNA <34332..>35717
/locus_tag="EHI_026450"
/old_locus_tag="30.t00038"
/product="hypothetical protein"
/note="transcript EHI_026450A"
/db_xref="Pathema:EHI_026450"
CDS 34332..35717
/locus_tag="EHI_026450"
/old_locus_tag="30.t00038"
/note="encoded by transcript EHI_026450A"
/codon_start=1
/product="hypothetical protein"
/protein_id="EAL49987.1"
/db_xref="Pathema:EHI_026450"
/translation="MDRCDHGPNVRCLKCMARDAQKAAELKKKDLNKTAQNPSNSTKL
SSSSSQQGEKVYTVGGGVKKNASTHFSSGVYRLGDGGPIKPATQTAKGKPVKWLCNHP
PGQKCSNCLCPKGAANVKRQCNHPPTMKCPNCIAPEEVKPNQPQQPRIYFPATCPNHG
PHGCCTLCLAKWDYEKVRIQKQEAVCKLCRMNFMETDNFQRYVFQRSFYVNRIGILYG
TFKQDRVQVEAIYEPPQVINEEGDFEMKQEQTLLQVQQMAVELGLERVGIIFSHARRE
EILTSREIISAAQRQLDWDKRCVTVVVTPNETGSESKVECYQASEQLMELVKKAIVQP
SQPKNNEINLKESVYLSQKEIMTVDPIVFVCNVPIRAFKAKTMFLSSKYPIENRPQED
VTLLQFKKYFESVKTLPIYQQISDFHLLVFCLDYGVFSSLHSVKECIVNKIEKHDIKE
DIKQWLEMPLD"
gene complement(<35805..>36386)
/locus_tag="EHI_026460"
/old_locus_tag="30.t00037"
/db_xref="Pathema:EHI_026460"
mRNA complement(<35805..>36386)
/locus_tag="EHI_026460"
/old_locus_tag="30.t00037"
/product="hypothetical protein"
/note="transcript EHI_026460A"
/db_xref="Pathema:EHI_026460"
CDS complement(35805..36386)
/locus_tag="EHI_026460"
/old_locus_tag="30.t00037"
/note="encoded by transcript EHI_026460A"
/codon_start=1
/product="hypothetical protein"
/protein_id="EAL49986.1"
/db_xref="Pathema:EHI_026460"
/translation="MQNKEIERLYLLIEYIQYPIKVVCSKEYVERKKKEHIEFLQNYT
LKVNEPWFKEITELPWYNNHKLLNQVTSLIKQGKLSPICEMVESDDDNEICFSCLCQP
KNNVIGLNWIHCSQATSNHLICTPCLLNTLSSNGFKISLNNLTCECQICKKVSPLICH
EPSDETILKDVPQEELQTKIVYGRRGKELNSNL"
gene complement(<38456..>39583)
/locus_tag="EHI_026470"
/old_locus_tag="30.t00036"
/db_xref="Pathema:EHI_026470"
mRNA complement(<38456..>39583)
/locus_tag="EHI_026470"
/old_locus_tag="30.t00036"
/product="hypothetical protein"
/note="transcript EHI_026470A"
/db_xref="Pathema:EHI_026470"
CDS complement(38456..39583)
/locus_tag="EHI_026470"
/old_locus_tag="30.t00036"
/note="encoded by transcript EHI_026470A;
Weak similarity to: PF00018: SH3 domain"
/codon_start=1
/product="hypothetical protein"
/protein_id="EAL49985.2"
/db_xref="Pathema:EHI_026470"
/translation="MSSISRSFFTIKSVLGVNKKTIDNEYETMKKKLSDMSNEFQKVI
TYVEELPKTVSNISGNHLNILNSLHLCVQISEGEEAKMEQISDTISIFQKMERDAARY
QGLMNELATPLRAYGQQFKELLGRCKVAEKRKEDMEFYNERLMEITKKPVNRQKGLAD
AQTDFTYAKEKYEWLKQELIEDTNKLCKDFQGVVLPVVRALMVNFTEVMNGMNGIWEE
VPKKVENLPSNGINLEYVIKAPGDSMEKETNVQQRRIQLYNSPMINQTIMSQPYIQQQ
PTFNQPPQNPMPNPYIPPQQTYQVPYGNSTQQPTPISQQPNTNNNNMCRANYDYSAQE
TNELTIKAGDVIKILSKEGDWWIGELNGQTGQFPSNYVTLL"
gene complement(<40545..>41324)
/locus_tag="EHI_026480"
/old_locus_tag="10.t00015"
/db_xref="Pathema:EHI_026480"
mRNA complement(<40545..>41324)
/locus_tag="EHI_026480"
/old_locus_tag="10.t00015"
/product="(2r)-phospho-3-sulfolactate synthase, putative"
/note="transcript EHI_026480A"
/db_xref="Pathema:EHI_026480"
CDS complement(40545..41324)
/locus_tag="EHI_026480"
/old_locus_tag="10.t00015"
/note="encoded by transcript EHI_026480A;
GO_process: GO:0019295 - coenzyme M biosynthetic process"
/codon_start=1
/product="(2r)-phospho-3-sulfolactate synthase, putative"
/protein_id="EAL51236.1"
/db_xref="Pathema:EHI_026480"
/translation="MTEMMKMIDFLPPRTVKPRNKGYTMVMDKGLGNHATEDLCMTAA
PYIDFLKLGFGTLIFTGGLREKLAIYKKYGVEMYVGGTFLEAFIARNKMADFHKIMKE
FGIKMVEVSDGSYEMGQKRKLEIIKECTEHGYFVISEVGNKCKNREYTREEWITSMKA
ELAAGSKVVIVEARESGTTGIYNKDGSVNKEMVDYLISEVDPSKIMWEAPLKSQQAWL
ISTFGINVNLGNIAPADIVALEALRNGLRGDTFIQVLEGRY"
gene <41988..>42530
/locus_tag="EHI_026490"
/db_xref="Pathema:EHI_026490"
mRNA <41988..>42530
/locus_tag="EHI_026490"
/product="hypothetical protein"
/note="transcript EHI_026490A"
/db_xref="Pathema:EHI_026490"
CDS 41988..42530
/locus_tag="EHI_026490"
/note="encoded by transcript EHI_026490A"
/codon_start=1
/product="hypothetical protein"
/protein_id="EDS89347.1"
/db_xref="Pathema:EHI_026490"
/translation="MRKTIPVVIWVLILLIENCVAAVITDFNSIEKQPRKFKGKIFAI
IESDEDMNIAIEHKDRIDQVIGKGFSAESFPSGSPKIEGEWVYKKNFTHNIGHIMFGN
FASIVNWTFEMTEAVIETINKYGLDGVCMEDLENVYFITGRSTRDVRLILRRLGIELH
KIQKQVFAIIPVCLINTLRI"
CONTIG join(AAFB02001038.1:1..3226,gap(100),AAFB02001013.1:1..3335,
gap(100),AAFB02000145.1:1..35880)
//