LOCUS       WKY05663.1              5208 aa    PRT              INV 31-JUL-2023
DEFINITION  Nippostrongylus brasiliensis hypothetical protein.
ACCESSION   CP130735-2487
PROTEIN_ID  WKY05663.1
SOURCE      Nippostrongylus brasiliensis
  ORGANISM  Nippostrongylus brasiliensis
            Eukaryota; Metazoa; Ecdysozoa; Nematoda; Chromadorea; Rhabditida;
            Rhabditina; Rhabditomorpha; Strongyloidea; Heligmosomidae;
            Nippostrongylus.
REFERENCE   1  (bases 1 to 50441521)
  AUTHORS   Schwarz,E.M., Baniya,A., Rodriguez,I.M., Lu,D., Bobardt,S.D.,
            Anesko,K., Baker,L., Gouil,Q., Ritchie,M.E., Jex,A.R., Nair,M.G.
            and Dillman,A.R.
  TITLE     A Nippostrongylus brasiliensis chromosomal reference genome and its
            transcriptomics
  JOURNAL   Unpublished
REFERENCE   2  (bases 1 to 50441521)
  AUTHORS   Schwarz,E.M., Baniya,A., Rodriguez,I.M., Lu,D., Bobardt,S.D.,
            Anesko,K., Baker,L., Gouil,Q., Ritchie,M.E., Jex,A.R., Nair,M.G.
            and Dillman,A.R.
  TITLE     Direct Submission
  JOURNAL   Submitted (16-JUL-2023) Molecular Biology and Genetics, Cornell
            University, Biotechnology Bldg., 526 Campus Road, Ithaca, NY 14853,
            USA
COMMENT     ##Genome-Assembly-Data-START##
            Assembly Date          :: 03-JUN-2022
            Assembly Method        :: raven v. 1.7.0; sourmash v. MAR-2022;
                                      racon v. 1.4.20; POLCA (in MaSuRCA) v.
                                      4.0.8; 3d-dna v. 180419
            Assembly Name          :: Nippo_1.0
            Genome Representation  :: Full
            Expected Final Version :: Yes
            Genome Coverage        :: 76.0x
            Sequencing Technology  :: Oxford Nanopore PromethION; Illumina
                                      HiSeq; Omni-C
            ##Genome-Assembly-Data-END##
FEATURES             Qualifiers
     source          /organism="Nippostrongylus brasiliensis"
                     /mol_type="genomic DNA"
                     /strain="MIMR"
                     /db_xref="taxon:27835"
                     /chromosome="IV"
                     /sex="pooled male and female"
                     /tissue_type="Whole animal"
                     /dev_stage="Adults"
                     /geo_loc_name="USA: Laboratory of Meera Nair, UC Riverside
                     School of Medicine, Riverside, CA"
                     /collection_date="2021/2022"
     protein         /locus_tag="Q1695_006118"
                     /note="NIPPO_CHRIV.G9958.T3"
     intron_pos      47:0 (1/76)
     intron_pos      105:1 (2/76)
     intron_pos      136:0 (3/76)
     intron_pos      210:0 (4/76)
     intron_pos      283:0 (5/76)
     intron_pos      430:0 (6/76)
     intron_pos      503:0 (7/76)
     intron_pos      576:0 (8/76)
     intron_pos      649:0 (9/76)
     intron_pos      722:0 (10/76)
     intron_pos      795:0 (11/76)
     intron_pos      868:0 (12/76)
     intron_pos      941:0 (13/76)
     intron_pos      957:0 (14/76)
     intron_pos      1001:0 (15/76)
     intron_pos      1074:0 (16/76)
     intron_pos      1147:0 (17/76)
     intron_pos      1220:0 (18/76)
     intron_pos      1293:0 (19/76)
     intron_pos      1366:0 (20/76)
     intron_pos      1439:0 (21/76)
     intron_pos      1487:0 (22/76)
     intron_pos      1560:0 (23/76)
     intron_pos      1635:0 (24/76)
     intron_pos      1710:0 (25/76)
     intron_pos      1783:0 (26/76)
     intron_pos      1856:0 (27/76)
     intron_pos      1929:0 (28/76)
     intron_pos      2002:0 (29/76)
     intron_pos      2075:0 (30/76)
     intron_pos      2148:0 (31/76)
     intron_pos      2221:0 (32/76)
     intron_pos      2294:0 (33/76)
     intron_pos      2367:0 (34/76)
     intron_pos      2444:0 (35/76)
     intron_pos      2516:0 (36/76)
     intron_pos      2592:0 (37/76)
     intron_pos      2697:0 (38/76)
     intron_pos      2753:0 (39/76)
     intron_pos      2812:0 (40/76)
     intron_pos      2888:0 (41/76)
     intron_pos      2960:0 (42/76)
     intron_pos      3032:0 (43/76)
     intron_pos      3104:0 (44/76)
     intron_pos      3176:0 (45/76)
     intron_pos      3248:0 (46/76)
     intron_pos      3320:0 (47/76)
     intron_pos      3392:0 (48/76)
     intron_pos      3464:0 (49/76)
     intron_pos      3536:0 (50/76)
     intron_pos      3608:0 (51/76)
     intron_pos      3680:0 (52/76)
     intron_pos      3752:0 (53/76)
     intron_pos      3824:0 (54/76)
     intron_pos      3896:0 (55/76)
     intron_pos      3968:0 (56/76)
     intron_pos      4040:0 (57/76)
     intron_pos      4103:0 (58/76)
     intron_pos      4166:0 (59/76)
     intron_pos      4277:0 (60/76)
     intron_pos      4343:0 (61/76)
     intron_pos      4469:0 (62/76)
     intron_pos      4595:0 (63/76)
     intron_pos      4649:0 (64/76)
     intron_pos      4776:0 (65/76)
     intron_pos      4830:0 (66/76)
     intron_pos      4875:0 (67/76)
     intron_pos      4936:2 (68/76)
     intron_pos      4987:0 (69/76)
     intron_pos      5019:0 (70/76)
     intron_pos      5043:1 (71/76)
     intron_pos      5063:1 (72/76)
     intron_pos      5093:0 (73/76)
     intron_pos      5121:2 (74/76)
     intron_pos      5158:2 (75/76)
     intron_pos      5180:0 (76/76)
BEGIN
        1 MAKRDRLQET TIPQQEAVVE IVDSKREVKR KTDTDRVTTT DSLIEQDIVK RTEVRNNQMK
       61 ERITWTTRER IVETTDELVA NAPGPRRSGQ SLTWMGKRQE VNDKGLSSAP SRSDTPLTSK
      121 GNSQTTPDPN TLTGEKANSK HQDEKVHGQM KVPEAANERE RSFKGKEEKD ITRVDLPSRV
      181 HQASNRDSDK PLARNASQTI SEPNSLLDQS ASRRHKDAKV ERKKAVPRKV AESERRAKGE
      241 RIALSQYDLP SGLKSASNTD FDGPLERDIS GTNSEPNSLH EQGESRRHED AKGPKQKEGP
      301 RKAPDRDRRT KGERITRAQY DLPPGLQSAS NTEFDSPLAK DISETNSEPN SLLEQVAVFQ
      361 QALLKRIFHG TSPHNGNIKE IQRAKGTRTT RKQIDLPPGL KNQPNTDRDE PFARDILRVN
      421 SEPNSLHEQS SSRNHKDAKV ERKKEVPRKV AESERSAKVE RITRTQYDLP PGLNNASSTD
      481 IDGAFARDIS RTDTEPNSLR EQSVGRKHKD AKVERKKEVP RKVAESERSA KVERITRTQY
      541 DLPPGLNNAS STDIDGPFAR DISRTDTEPN SLREQSVGRK HKDAKVERKK EVPRKVAESE
      601 RSAKVERITR TQYDLPPGLN NASSTDIDGP FARDISRTDT EPNSLREQSV DRRHRDAKVE
      661 RKKEVPRKVS ESERSAKVER ITRTQYDLPP GLNNASSTDI DGPFARDISR TDTEPNSLRE
      721 QSAGRRRRDA KVERKKEVPR KVSESERSAK VERITRTQYD LPTGLNNASK VETDGPVAGD
      781 TSRANTEPNS LREQSVGRKH KDAKVERKKE VPRKVAESER SAKVERITRT QYDLPPGLNN
      841 ASSTDIDGPF ARDISRTDTE PNSLREQSVG GKHKVAKVER KKEVTRKVAK SERNAKVERI
      901 TKTQYDLPPG LNNASSTDFD GPVAGDTSRA NTEPNSLREQ SVGGKHKVAK VERKKEVERI
      961 TKTQYDLPPG LNNASSTDFD GPVAGDTSRA NTEPNSLREQ SVGGKHKVAK VERKKEVTRK
     1021 VAKSERSAKV GRITKTQYDL PPGLNNASST DFDGPVAGDT SRANTEPNSL REQSVGGKHK
     1081 VAKVERKKEV TRKVAKSERN AKVERITRTQ YDLPPGLNNA SSTDIDGPFA RDISRTDTEP
     1141 NSLREQSVGR KHKDAKVERK KEVPRKVSER ERSAKVERIT KTQHDLPPGL NNASRTDIDG
     1201 QFARDISRTD TEPNSLREQS VGRKHKDAKV ESKKEVPRKV SESERSAKVE RITRTQYDLP
     1261 PGLNNASSTD IDGPFARDIS RTDTEPNSLR EQSAGRRRRD AKVERKKEVP RKVSESERSA
     1321 KVERITRTQY DLPPGLNNAS NVETDGPVAG DTSRANTEPN SLREQSVGRK HKDAKVERKK
     1381 EVPRKVSERE RSAKVERITK TQHDLPPGLN NASSTDIDGP FARDISRTDT EPNSLREQGI
     1441 GRRKMKSAQH NLTSRKTSNA SNTGFEITLP KDTSTVDPEP NTLINQSVKR RHEKRSKPVE
     1501 LQKESDSESV DKKRKTKAFT NVLYGLPYGL ICVSNWAIER TLERDNSGTR SEPNSLIGQS
     1561 VGRRLKNGKD RKHQNQPRKA QENEGISKGK RTTTAFTNSQ HDLPFGMKNT PERLHEKLLA
     1621 RDTSLSEPNS LLNQNVDQGH MDKKDRKQKK KNRKALKIVK AAKEKRTTKV FMNVQHDLPS
     1681 GLKNTSERDF KKSWDASETL SEPNSLANQS VSRKRDSEKR PEEVHREEPE SKRSAKERRT
     1741 SKAFLNVQHD LPSGLKNASE RDFRKSMDVS ETLCEPNYLA NQSVSRKRDS EKGPEEVHRE
     1801 EPESKRSAKE RRTSKAFLNV QHDLPSGLKN ASERDFRKSM DVSETLSEPN YLANQSVSRK
     1861 RDSEKRPEEV HREEPESKRS AKERRTSKAF LNVQHDLPFG LKNASERDFR KSMDVSETLS
     1921 EPNYLANQSV SRKRDSEKRP EEVHMEEPES KRSAKERHTS KAFLNVQHDL PFGLKNASER
     1981 DFRKSMDVSE TLSEPNYLAN QSVSRKRDSE KGPEEVHREE PESKRSAKER RTSKAFLNVQ
     2041 HDLPSGLKNA SERDFRKSMD VSETLSESNY LANQSVSRKR DSEKRPEEVH REEPESKRSA
     2101 KERRTSKAFL NVQHDLPFGL KNASERDFRK SMDVSETLSE PNYLANQSVS RKRDSEKRPE
     2161 EVHREEPESK RSAKERRTSK AFLNVQHDLP FGLKNASERD FRKSMDVSET LSEPNYLANQ
     2221 SVSRKRDSEK RPEEVHREEP ESRRSAKERR TSKAFLNVQH DLPFGLKNAS ERDFRKSMDV
     2281 SETLSEPNYL ANQSVSRKRD SEKRPEEVHR EEPESKRSAK ERRTSKAFLN AQHDLPSGLK
     2341 NASERDFKKS MDASETLSEP NYLDNQSTSK RPKTEHGEMQ QNVSREARES GRIAKGKPSP
     2401 KVFMNLQHDL PPGLNNASKK DFERPFAKES SEKLPETNSL RCQSLSRRHK DEKGRKQQEL
     2461 LEIASISHRK ADEMNTMKPF ENAQHDLPRG LVDASKTEFK CVSGENPEPN YLTPQAFSAE
     2521 HNKWKDETQK TVLPENKGRT TEKHSAMALT NVQHDLHHAP TLSSVPSTKS KMTLQEDRVE
     2581 KLPDPSNIMD KSVCLKPEKA KEEPCKELNS VSTAKEKCVS TVCRSSRDEH AWVGQRFEEG
     2641 KREVATKAEP KSVAENGTAA PPQDTDLKTA MNVLVETETA KADTDRVTTT DSLIENKMVK
     2701 TTEVIGNQTR ERITWTIRKR IVERTDEWKR EPGTPGPRKS GQSITWKGKR KEKLLNKEEL
     2761 AKSSAEKKLS DVPSNLKRNL LFEPPPNMDF GTPLPNDSSA ASSQPNSSIV QSVSSTHEHV
     2821 RGPIQKEKPG QRPDNVDVSG KRTKSVLTNV LYGLPIGLKK ATNWVMERPL AKGSSRTESE
     2881 PNSLLSQSVS RRHKDAEVLI QKEKPRNMPE SEGAREKKTT ETFMSVQHDL PSGLEDACRR
     2941 VFENQPSGTN SEPNCLLGQS VSGGHKDAEI PIQKEEPRRV PENEDEKEIA TTKTLMSIQH
     3001 DLPSGLEDAC RRVSENQPSG TNSEPNYLLG QSVTRRHKDA EIPIQKEEPR HVPESEDAKE
     3061 KPTTRTLMSI QHDLPIGLEN ASKRVFENQP SGTSSEPNSL LGQSISRRHK DAEVSIEKEE
     3121 PRIVPESEDA KKKPTSKAFM SVQHDLPIGL ENASKRVFEN QPSGTSSEPN SLLGQTVSRR
     3181 HKDAEIPIQK EEPRVVHERE DAKKKPTSKA FMSVQHDLPI GLENASKRVF ENQPSGTSSE
     3241 PNSLLGQTVS RRHKDAEIPI QKEEPRDVHE REGVKEKPTK KTFMSVQHDL PSGLENASKR
     3301 VFENQPSGTS SEPNSLLGQT VSRRHKDAEI PIQKEEPRDV HEREDAKKKP TSKAFMSVQH
     3361 DLPIGLENAS KRVFENQPSG TSSEPNSLLG QTVSRRHKDA EIPIQKEEPR DVHEREGVKE
     3421 KPTKKTFMSV QHDLPSGLEN ASRRIFENQS SGTIFEPNSL LGQSISRRHK DAEVSIEKEE
     3481 PRIVPESEDA KKKPTSKAFM SVQHDLPIGL ENASKRVFEN QPSGTSSEPN SLLGQSISRR
     3541 HKDAEVSIEK EEPRIVPERE GVKEKPTTKT FMNVQHDLPI GLENASKRVF ENQPSGTSSE
     3601 PNSLLGQSIS RRHKDAEVSI EKEEPRIVPE REGVKEKPTT KTFMNVQHDL PSGLENASRR
     3661 IFENQSSGTI FEPNSLLGQS ISRRHKDAEI PIQKEEPRIV PEREGVKEKP TTKTFMNVQH
     3721 DLPSGLENAS RRIFENQSSG TNSEPNSLLG QSISRRHKDA EVSIEKEEPR IVPEREGVKE
     3781 KPTTKTFMNV QHDLPIGLEN ASKRVFENQP SGTSSEPNSL LGQTVSRRHK DAEIPIQKEE
     3841 PRDVHEREDA KKKPTSKAFM SVQHDLPIGL ENASKRVFEN QPSGTSSEPN SLLGQSISRR
     3901 HKGAEVSIEK EEPRIVPESE GVKEKPTKKT FMSVQHDLPS GLENASRRIF ENQSSGTISE
     3961 PNSLLGQSIS RRHKDAEVSI EKEEPRIVPE REGVKEKPTT KTFMNVQHDL PIGLENASKR
     4021 VFENQPSGTS SEPNSLLGQS ISRRYKDAEV PIEKEESKEK PTTKTFMNVQ HDLPIGLENA
     4081 SRRVFENRSS GTNSEPNSLL GQSMSRRHKD AEVSIEKEEP KEKPTTKTFM NVQHDLPFGM
     4141 ENASKRVFEN QSTGANSEPN SLFGQNVTPQ RLAHDNSDRS QRGKIVPLLL LPLYVKHGLR
     4201 RTAEPAESEG SVVHGEHKCE QDIDPERGRE RRRTDDKRET LKRKQYNLPS GFASTSRCCK
     4261 KSTSGRHSDP NSLTKQSVNG KKDVVNNHLE KREKSTLIGN KQLKERPKQT DLPTGIAGRH
     4321 NGTEYRDRPS ECNSLTEQIN NRRPDKKRDE GTLQYKDRRK EHKKRKRPSV TCCRKRRAMK
     4381 RAQREGQDLS RKEKFKETGG RRKNKKERHR SPRRAKDRSS RGTNDRYVPM SNAPSEQPDQ
     4441 PPRTASASRR SEPLSAKTPD EPNSLLEQNL DNEGDVAAPQ RDEEPHMEHT KKNGPSLSCC
     4501 CKRRATRRIA IRAGKEGKDI DTREGRGAMN RPPKSDDSSR REPSDKSRQK SKSSKNEEQN
     4561 LPPGIASASR RGYKEALSRK GSKTPSEPNS LLEQKLHINP ELAAIPHKEK RLKKHKEHKK
     4621 NGRLSLSCCC RRRRARRAAI RAGKETQESL DKQPEEKRRN KQRRKRRTSL SCCRRRRGTK
     4681 RAAMRAGKEK EPRKEKLGRS NGHKDSIKVI NRASKSASIS RKEPSNKSKQ KSKPPKSAQQ
     4741 DLPSEIASAS RRSSKESLSR KSSKTPPEPN SLLKQSLDKQ PENKRRSKHK KRRRPSLSCC
     4801 RRRRGTKRAG VRAGKEKLGR SIGATGSRGT PKSHRSVQQD LPPGIASASR RNSKEPLSRK
     4861 SSKTPPEPNS LSKQSLDEQR EKDHRSKHER KRRPSLSCCR RRRGMKRAAM RAGKEKQVVP
     4921 NEERLGRSSR RKRSRRGVPR HTPKSPSSVQ QDLPPGIASA SRRSSKELLS RKSPTTPFDP
     4981 NSLLKQNLDR QPEVATVPHD KRKNMRRPSL SCCRKKRAPE FQPHRKADRS KDGEIPSTAI
     5041 DIDSSIRPRR RRTEGSSEEA RGDRQKYSGE LVKDKDEQYH VTKPPSDDAA FEPSIGRGSE
     5101 LVPLEDSIDP QYPAQRIVIT SFVRNGCHIK RWLYEDSYPI GGVRPAIADL VCSGPRDMRC
     5161 RCGRRSVCDR SCVEDFSAKR HSTYHNYDSE RIRGELQRLD AIVKNLDD
//