LOCUS DS114150 29326 bp DNA linear CON 15-DEC-2022 DEFINITION Trichomonas vaginalis G3 strain G3; ATCC PRA-98 unplaced genomic scaffold 1047229021876, whole genome shotgun sequence. ACCESSION DS114150 AAHC03000000 VERSION DS114150.1 DBLINK BioProject: PRJNA16084 BioSample: SAMN02953626 KEYWORDS WGS. SOURCE Trichomonas vaginalis G3 ORGANISM Trichomonas vaginalis G3 Eukaryota; Metamonada; Parabasalia; Trichomonadida; Trichomonadidae; Trichomonas. REFERENCE 1 (bases 1 to 29326) AUTHORS Carlton,J.M., Hirt,R.P., Silva,J.C., Delcher,A.L., Schatz,M., Zhao,Q., Wortman,J.R., Bidwell,S.L., Alsmark,U.C., Besteiro,S., Sicheritz-Ponten,T., Noel,C.J., Dacks,J.B., Foster,P.G., Simillion,C., Van de Peer,Y., Miranda-Saavedra,D., Barton,G.J., Westrop,G.D., Muller,S., Dessi,D., Fiori,P.L., Ren,Q., Paulsen,I., Zhang,H., Bastida-Corcuera,F.D., Simoes-Barbosa,A., Brown,M.T., Hayes,R.D., Mukherjee,M., Okumura,C.Y., Schneider,R., Smith,A.J., Vanacova,S., Villalvazo,M., Haas,B.J., Pertea,M., Feldblyum,T.V., Utterback,T.R., Shu,C.L., Osoegawa,K., de Jong,P.J., Hrdy,I., Horvathova,L., Zubacova,Z., Dolezal,P., Malik,S.B., Logsdon,J.M. Jr., Henze,K., Gupta,A., Wang,C.C., Dunne,R.L., Upcroft,J.A., Upcroft,P., White,O., Salzberg,S.L., Tang,P., Chiu,C.H., Lee,Y.S., Embley,T.M., Coombs,G.H., Mottram,J.C., Tachezy,J., Fraser-Liggett,C.M. and Johnson,P.J. TITLE Draft genome sequence of the sexually transmitted pathogen Trichomonas vaginalis JOURNAL Science 315 (5809), 207-212 (2007) PUBMED 17218520 REFERENCE 2 (bases 1 to 29326) AUTHORS Carlton,J., Miller,J., Delcher,A.L., Schatz,M., Schobel,S. and Fraser,C.M. TITLE Direct Submission JOURNAL Submitted (23-MAY-2005) The Institute for Genomic Research, 9712 Medical Center Drive, Rockville, MD 20850, USA FEATURES Location/Qualifiers source 1..29326 /organism="Trichomonas vaginalis G3" /mol_type="genomic DNA" /submitter_seqid="1047229021876" /strain="G3; ATCC PRA-98" /db_xref="ATCC:PRA-98" /db_xref="taxon:412133" /chromosome="Unknown" gene complement(<89..>1591) /locus_tag="TVAG_124310" mRNA complement(<89..>1591) /locus_tag="TVAG_124310" /product="hypothetical protein" /note="transcript TVAG_124310A" CDS complement(89..1591) /locus_tag="TVAG_124310" /note="encoded by transcript TVAG_124310A; Identical to: GlimmerHMM gene prediction Covered by: TigrScan gene prediction" /codon_start=1 /product="hypothetical protein" /protein_id="EAX89951.1" /translation="MHIDAPCELKERLSYIDAMKAVIDNECHAGCPYQLKKNPNLGET KLKFRCSADKCEACISFLKDDEEYILTEYNGTHNHNQIKDETKKYHTLSQCYRRVLIN FIKQGGDPKMAQIECDKKLDLDDPLNRPSFLNASSDQMKTIQEKGNKKIKGIQKYDDN QFKSTQLFKGIKEQESPKDLIYFDVDNYNKPKKLIFYYASFKFLDIIKIVKEHFIDAT HSLLEFKMLFYMISAKFPNTHAFPIFQFVVYPNTSENIAFCLKAFFNWAKVKPKYFMS DCAQEIENAIINSFPEVILHWCAVHVMRAFRKNLKDYAFESSDKLILDTKMNYLAYGR NGKKEWIEPTFKKILEIAEKFPEFSKYIQNQWISNQERWTAAERDENLALTNNISESI NKKIKYYYFGGTIFMRFDRFVMKLIDFIVPSFYYRISQDIRLRDKIPNPLPSEKKPKK STIRLDTEKCIMLTDKIKSLIVNSSANLNTLQLGLDDLLDKVVKAAKVQK" gene <2373..>4913 /locus_tag="TVAG_124320" mRNA <2373..>4913 /locus_tag="TVAG_124320" /product="hypothetical protein" /note="transcript TVAG_124320A" CDS 2373..4913 /locus_tag="TVAG_124320" /note="encoded by transcript TVAG_124320A; Identical to: TigrScan, GlimmerHMM gene predictions" /codon_start=1 /product="hypothetical protein" /protein_id="EAX89952.1" /translation="MADGNDPSLVTTASLKGRETPIEGVQTKRASKVLIETPSMPFET ESYKFRQTATKSQQQTSPSRRAPQTSSGKRIKEGLYSVKMKNSTWTHTDPDVPDHYAS RKEILEVLNNFESAVKSLTGVDDTKTASAMQNITDLLLEQLACMLRAECREQELIVEK SRESYAEVFLLLRKEINKSHDEMDKLKNHNVQLEAELTKVIDTSSERVNEIQFDCERQ LKAKDDEMEQRKQEYDLSMKRFLEQKSQLEEHVKALHRVFLDFQSDSVYITLEDLKQK LANTEKKLRYKETEIQKLNDKIDKHKKQILDLQAQKTNLDQANGELRRKLQNALASKG RLERQIEIQQFGEEEDGEKKGKRNLSVDSTPYISVLQKLNQIYDKISDILQRSNVNVP SQQQYTDDIDKVLLSGNPALMIQAVEKRVIDVLQTTENLDSVDIHADNDFIYDSIQNP RFLQYVAPHIDVPLPNTQSSDYNPFQIMRQIFQAKYLQDEWMKRTGGQVQRFPEFIVS FFTRNDESLFVALTNAARLWRCISDEKYSEMKLFKSFALEEYTCDELTFFLRCRYLLL GLPGIDSQAPKKIMVDISEIKNMMNSVVGQYSHVAQSVIEKAEKQANNENRIDYAEFM IIFLEFYERERRKRRNAVRLMFQSKQYMQGNIKIDFENFCALVKSLGYQGDSQTVFEL YREATMVSKGDLNLESLLTAMDSMGFHFYSIEAPITLLHNTPVTELKRSDLFKRWIRF GRWFEGFLKPLGTFDTWLHAELKQAVKRVDNIFKTNSPVPVMFNEYRKLLDYFQFMLD MLAEGSKNPMTPEKSNRELLLMENLVDLLVTHVVTECDKDYIFEELTS" assembly_gap 5102..5201 /estimated_length=unknown /gap_type="within scaffold" /linkage_evidence="paired-ends" gene complement(<11644..>12309) /locus_tag="TVAG_124330" mRNA complement(<11644..>12309) /locus_tag="TVAG_124330" /product="hypothetical protein" /note="transcript TVAG_124330A" CDS complement(11644..12309) /locus_tag="TVAG_124330" /note="encoded by transcript TVAG_124330A; Identical to: TigrScan, GlimmerHMM gene predictions" /codon_start=1 /product="hypothetical protein" /protein_id="EAX89953.1" /translation="MTLHMIDIFSQIRAKDIKLFTELHKKILNEFSCLIKPKNEKLAT LLYYKCFNFEIFKPEIEEEEIVNLYSTESPLYYIAWDKVDDLKSKFPNLDINWEINEI TPLNCSIKYGSELCFNYLKNLGAKYTDNSEKYAVQGGNKNIFMEMIEDGKSFDNMIDT ALDYHNYEIANYLKSNFGQTPDSIAESMYFGNYDVASYLLSNGEDINKIYSFLLFIFI IVL" gene <12976..>13155 /locus_tag="TVAG_124340" mRNA <12976..>13155 /locus_tag="TVAG_124340" /product="hypothetical protein" /note="transcript TVAG_124340A" CDS 12976..13155 /locus_tag="TVAG_124340" /note="encoded by transcript TVAG_124340A; Identical to: TigrScan, GlimmerHMM gene predictions" /codon_start=1 /product="hypothetical protein" /protein_id="EAX89954.1" /translation="MSDIYQAITEDNVEQMQACISGGVDINKPGANGLTPLMFAVQEG KEKCLGALIKAKADV" gene <13273..>15090 /locus_tag="TVAG_124350" mRNA <13273..>15090 /locus_tag="TVAG_124350" /product="hypothetical protein" /note="transcript TVAG_124350A" CDS 13273..15090 /locus_tag="TVAG_124350" /note="encoded by transcript TVAG_124350A; Identical to: TigrScan, GlimmerHMM gene predictions" /codon_start=1 /product="hypothetical protein" /protein_id="EAX89955.1" /translation="MTPLHHAAKNNRKKTCELLIRSKATVNMPDAEGNTPFLTALIAG SSDAVASFIKADATDLTVQNKKQQTPAHFLAAMGNIAILKSLAKKGLNWNAQDDQGRT PVELCADSGNAQCFEFLLTKLGGDPSVTNAAGESLAHIISAKGHAPLLGILKASGGNV DSEDANGCHPIQQAAASNSVAVIEALIKLMAQVNCTDAKGDTPIHYAANNGAVEAMEC LVNSGADINSKNKAGESALHIAVKKGDCKMINALSDKNVDVSLRDNNGNTALHLAIPL HNTEVINTLIGISVPPNSQNNDNMTALHLAATLGDVELVQNLIKAGADVDMKNNDGET PLELASACGDVPVVKALIEARADVNSKDGQGMTPLHKAVQKNQVEVIKCLKEANANIN AKTGDGETPLIIATKMKNVDLIMMLIDMGCDVNIGDINGTTPLHYACKLDLTKPALQL IEKGSDIMAKGEGNNTPLHFASLNMNKQLVEVLIKKGANAREMNSEGRTPLQGIRLTF AKFMKQLMGEDKGDKKEDIKIDVSEVLNQSGEKLETQTELKDTFCLLCRRRAATAALL PCGHLCICDACQHERLATLKQCPICKKDVYGACAIFCEN" gene <15513..>16880 /locus_tag="TVAG_124360" mRNA <15513..>16880 /locus_tag="TVAG_124360" /product="hypothetical protein" /note="transcript TVAG_124360A" CDS 15513..16880 /locus_tag="TVAG_124360" /note="encoded by transcript TVAG_124360A; Identical to: TigrScan, GlimmerHMM gene predictions" /codon_start=1 /product="hypothetical protein" /protein_id="EAX89956.1" /translation="MNSTVFIDSYEPVLEQLHKMSLEEEMNQEHAVYLVKILNRCLKR NPEADFPHNIFKQDDLVLLLDFCLNEKYIDTDFHKALYRTIYNVIMENPRYNRSSFIP LLIDRFDHFCKLFDSIPPNSSNMITKIGIFNLMSSLMHENSESFAHVYEKFNLDMAYE LFQNFPCFCSYLYNLVKNPSIEYDAMPQIVSSIINHAISIIPKISISSKEDTMKRDRT ISKDLRKMNDCLLALNSCTRFPEIFFEVFQGIDIYDKYINNIMQYKDAFSNVIKLSKS ILQIKSDFDYEISIYGIVFMISYILEQLYNLYKWVNIAEDGIYLLTLLSERKIYNKQI DSICNQMILNKLLQDSIEIGCQQQYLQLLCNLAKDDINYTMVTDESSLKIAINFLGDD NPVFALEFILMRVQKSVSQNNFEDSLDVLDVSEKESIIELVESEDEKISILAQNLSDL IASYA" gene <18298..>19245 /locus_tag="TVAG_124370" mRNA <18298..>19245 /locus_tag="TVAG_124370" /product="ankyrin repeat protein, putative" /note="transcript TVAG_124370A" CDS 18298..19245 /locus_tag="TVAG_124370" /note="encoded by transcript TVAG_124370A; Identical to: GlimmerHMM gene prediction Covered by: TigrScan gene prediction" /codon_start=1 /product="ankyrin repeat protein, putative" /protein_id="EAX89957.1" /translation="MKNAIISHNIDFVCFLMNEYQLKIDFVLCIMFDNIQAFFVYLDQ TREISVCFVNLPYFRLKSLVNYFMQHGIDINTVVLSDTALINSIKVESLDLLEYLVLN GANINTGYKSSHSPIHIAAGRGNEEIVRFLISLGAKIKNNKKITPPLLVAAGKNKIKN AKILISNGADINVKDSADRNVLYLSLENSNEEMTKYFISCGADIHAKDFYGNTTLHYA AKNNLTNTIIYLISQGLNINEKNLEGKTALHYAAMGNSKDAVELLISLDANIHIKDND KKPAIHYVKINKYKEIIRILRSHKNDHYGLRHLSLCNIV" gene <19538..>21385 /locus_tag="TVAG_124380" mRNA <19538..>21385 /locus_tag="TVAG_124380" /product="ankyrin repeat protein, putative" /note="transcript TVAG_124380A" CDS 19538..21385 /locus_tag="TVAG_124380" /note="encoded by transcript TVAG_124380A; Identical to: GlimmerHMM gene prediction Covered by: TigrScan gene prediction" /codon_start=1 /product="ankyrin repeat protein, putative" /protein_id="EAX89958.1" /translation="MNKIQHNELIDLSKDYCNTFCALYRLNTQDEAEIDKIYKQIKIK LIDTKMFLPSQILEVICNVAKLNNRYMKSYWELFRKTAENYKIQQIFSSTYNQSKYKT YESYLKERYIKYFIWDEIYFEKEEKTNDKNKNINYSLDIHESNPICRSLVLDDLGSFI FYTEQDGFDKYQRVKSNFYPYSLLGYSLLELCCYYGAIRCFKFLRTKFNSEITEKCLQ FSFLSGVPDIMNECLKFQRPYKECMECAIISHNIDFVSFLMNEYHLKIDLEDCCRYHN LQVYLMYLDITKDINNCFVLSPSFHFPELCKYLISHGANVNAIGHSSKTHLCYSAVNS SRETVDYITTYGVNFVRDYNYEWFAIMDAAWNNSAEIAEILISHGARIDSHGINEKTA CHIAIERNSIETIKVFVAHKDLINDSTLHLALIYDKEEIAKFLILNGININTHDNNGK TPLHIVADGNKTEMAELLISHGANINLTDKNDETALHYALKYDRKEMTELLISHGVNI DAKDKDGKTALHIAAERNNKEIAEFLISHGANLEETDNEGKSALDYAIRYDRKEIEKL LISYGANINAQVINGESAAITNRTNNEGKTFSQYYHNFINYTFSNCIII" gene complement(<21573..>22634) /locus_tag="TVAG_124390" mRNA complement(<21573..>22634) /locus_tag="TVAG_124390" /product="hypothetical protein" /note="transcript TVAG_124390A" CDS complement(21573..22634) /locus_tag="TVAG_124390" /note="encoded by transcript TVAG_124390A; Identical to: TigrScan, GlimmerHMM gene predictions" /codon_start=1 /product="hypothetical protein" /protein_id="EAX89959.1" /translation="MQYIKAKELLNETLQLEQYPSMYRQIPDRSCNPKFYDAQIQFWS KFLIDWSKRYNVVSFHATKLEETLMWNDIYPPLAPTLKTLLKSKIIQKSSKFVIKRSL LSSIIASMRCEDPSDYENIEYNFYQNFEQISRTVRDNIMKNVRPSYDLVISDEELIEK FNITSISHLSNVLEKNRYASRLPDGGFLFSSDIITTPPQNQISLFLALKKSIYQMKKK IKSIDDMISTAQDNKYFETARKLQQIKSNAEELLKNGEKANNILQKGFSHETILNQTE NSVNSLQKFLISSIDQLMKEVEVESRDPPENFGHQKEENEETQKFENDASDPHPNEAH NVGNDDFDLGFMPTRSVYK" gene <22903..>24999 /locus_tag="TVAG_124400" mRNA <22903..>24999 /locus_tag="TVAG_124400" /product="hypothetical protein" /note="transcript TVAG_124400A" CDS 22903..24999 /locus_tag="TVAG_124400" /note="encoded by transcript TVAG_124400A; Identical to: TigrScan, GlimmerHMM gene predictions" /codon_start=1 /product="hypothetical protein" /protein_id="EAX89960.1" /translation="MGGALSSSDAIPAFLRTLLSGACPPAHPIWASFNITSFNTSEMT KEDILLLQEVRDKRPDNFAELVRCITDAFTREIKLAENEIQNDSMYLDFSMYSDMICL LLSISGLPQKISPWFKAPTLYLKQSLPLHQVLLAEFRLLNMTDSIFNCYSDELQANIT FVKTLLFVQQAEAFTYPVKSDPSQYLLSFDIFPAKAFLPVLFEFIPKAILTTRSEPIL KYVRALITASILPIYCCNTWKTALSCVEQNIIHRAFEPLLTLTDNIYPTGLPGRVLAC SDQLISLLYTVILRFPTFLKFIDTNKLAQKYIEVLLLLFRYKMDNGSITFIHSIILLI ISHLTSDFHSLLTLNDPFVETLQIKEQRPHRGTYADLIIEIITFPLIKDFKSAFPLAP LVTAIIQNLSSTTAHLSFFNANRIYEILRLFFKSKAAEHPESKLPIARLLNSIYQFIR FQTLGKKSILLYGIVHRVIIDSLAASALPEWRKPAEKIKKLLDAADEPLKSKEKNADA VLQNAMAPILIEFADSPVPQTSFTMGAEVETIWYDWSRILLWRVFPDEAEFYHLNFLT FKSPGNEKAIPNPVPEESLSTEPAPTESFATGIINQAEQQKKNEIEEKEESEPEVQQY KAIEQTPVQQSSAQSIIEATKPAISKIRNPKLQIKEVSEPDQLQAPVKHAKTLEELDN PFGSDDEDELAKFLED" gene complement(25200..>25685) /locus_tag="TVAG_124410" mRNA complement(25200..>25685) /locus_tag="TVAG_124410" /product="hypothetical protein" /note="transcript TVAG_124410A" CDS complement(25407..25685) /locus_tag="TVAG_124410" /note="encoded by transcript TVAG_124410A; Identical to: TigrScan, GlimmerHMM gene predictions" /codon_start=1 /product="hypothetical protein" /protein_id="EAX89961.1" /translation="MARRTKKVGICGKYGVRYGASLRKTIKKIEISQRKKYPCAFCGK DSVKRNAVGIWTCTKCGKAVAGGAYTPTTPAALTARAAYKRIREAQAK" gene <25964..>26866 /locus_tag="TVAG_124420" mRNA <25964..>26866 /locus_tag="TVAG_124420" /product="hypothetical protein" /note="transcript TVAG_124420A" CDS 25964..26866 /locus_tag="TVAG_124420" /note="encoded by transcript TVAG_124420A; Identical to: TigrScan, GlimmerHMM gene predictions" /codon_start=1 /product="hypothetical protein" /protein_id="EAX89962.1" /translation="MSSSEQTKNEVGCDFNDIKPIEIFEYPSQASKHIWNLNSNNILQ TSSQIIEFIKSNKIPIQMTLYLIDIFSQIREKDIKLFTELYEKILNEFSCLIKPENEK LAMLLYYKCFNFENFESEMKEEKILNLYPTESPLYYIAWDKVDDLKSKFPNLDINEKI NEITPLDCSIKYGSELCFNYLKNLGAKYTEYSEMYAVQGGNTNIFMEMIEDGKSFDNM INTALDYHNYEIANYLKSNFGQTPDSIAESMYFGNYDVASYLLSNGEDINKIYILFIF TFFIVLFNSLSFCIYHYFVKFSQY" repeat_region 28789..28813 /rpt_type=tandem /rpt_unit_seq="a" /satellite="microsatellite" CONTIG join(AAHC03004810.1:1..5101,gap(unk100),AAHC03001156.1:1..24125) //