{"id":"https://openalex.org/W4394895538","doi":"https://doi.org/10.1109/kst61284.2024.10499674","title":"Hybrid Information Retrieval with Masked and Permuted Language Modeling (MPNet) and BM25L for Indonesian Drug Data Retrieval","display_name":"Hybrid Information Retrieval with Masked and Permuted Language Modeling (MPNet) and BM25L for Indonesian Drug Data Retrieval","publication_year":2024,"publication_date":"2024-02-28","ids":{"openalex":"https://openalex.org/W4394895538","doi":"https://doi.org/10.1109/kst61284.2024.10499674"},"language":"en","primary_location":{"id":"doi:10.1109/kst61284.2024.10499674","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/kst61284.2024.10499674","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 16th International Conference on Knowledge and Smart Technology (KST)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5063210975","display_name":"Maryamah Maryamah","orcid":"https://orcid.org/0000-0001-9540-4427"},"institutions":[{"id":"https://openalex.org/I205133468","display_name":"Airlangga University","ror":"https://ror.org/04ctejd88","country_code":"ID","type":"education","lineage":["https://openalex.org/I205133468"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Maryamah Maryamah","raw_affiliation_strings":["Universitas Airlangga,Data Science Technology Faculty of Advanced Technology and Multidisipline,Surabaya,Indonesia","Data Science Technology Faculty of Advanced Technology and Multidisipline, Universitas Airlangga, Surabaya, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universitas Airlangga,Data Science Technology Faculty of Advanced Technology and Multidisipline,Surabaya,Indonesia","institution_ids":["https://openalex.org/I205133468"]},{"raw_affiliation_string":"Data Science Technology Faculty of Advanced Technology and Multidisipline, Universitas Airlangga, Surabaya, Indonesia","institution_ids":["https://openalex.org/I205133468"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095747478","display_name":"Geraldus Wilsen","orcid":null},"institutions":[{"id":"https://openalex.org/I205133468","display_name":"Airlangga University","ror":"https://ror.org/04ctejd88","country_code":"ID","type":"education","lineage":["https://openalex.org/I205133468"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Geraldus Wilsen","raw_affiliation_strings":["Universitas Airlangga,Data Science Technology Faculty of Advanced Technology and Multidisipline,Surabaya,Indonesia","Data Science Technology Faculty of Advanced Technology and Multidisipline, Universitas Airlangga, Surabaya, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universitas Airlangga,Data Science Technology Faculty of Advanced Technology and Multidisipline,Surabaya,Indonesia","institution_ids":["https://openalex.org/I205133468"]},{"raw_affiliation_string":"Data Science Technology Faculty of Advanced Technology and Multidisipline, Universitas Airlangga, Surabaya, Indonesia","institution_ids":["https://openalex.org/I205133468"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095747479","display_name":"Christeigen Theodore Suhalim","orcid":null},"institutions":[{"id":"https://openalex.org/I205133468","display_name":"Airlangga University","ror":"https://ror.org/04ctejd88","country_code":"ID","type":"education","lineage":["https://openalex.org/I205133468"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Christeigen Theodore Suhalim","raw_affiliation_strings":["Universitas Airlangga,Data Science Technology Faculty of Advanced Technology and Multidisipline,Surabaya,Indonesia","Data Science Technology Faculty of Advanced Technology and Multidisipline, Universitas Airlangga, Surabaya, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universitas Airlangga,Data Science Technology Faculty of Advanced Technology and Multidisipline,Surabaya,Indonesia","institution_ids":["https://openalex.org/I205133468"]},{"raw_affiliation_string":"Data Science Technology Faculty of Advanced Technology and Multidisipline, Universitas Airlangga, Surabaya, Indonesia","institution_ids":["https://openalex.org/I205133468"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5095747480","display_name":"Rafik Septiana","orcid":null},"institutions":[{"id":"https://openalex.org/I205133468","display_name":"Airlangga University","ror":"https://ror.org/04ctejd88","country_code":"ID","type":"education","lineage":["https://openalex.org/I205133468"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Rafik Septiana","raw_affiliation_strings":["Universitas Airlangga,Data Science Technology Faculty of Advanced Technology and Multidisipline,Surabaya,Indonesia","Data Science Technology Faculty of Advanced Technology and Multidisipline, Universitas Airlangga, Surabaya, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universitas Airlangga,Data Science Technology Faculty of Advanced Technology and Multidisipline,Surabaya,Indonesia","institution_ids":["https://openalex.org/I205133468"]},{"raw_affiliation_string":"Data Science Technology Faculty of Advanced Technology and Multidisipline, Universitas Airlangga, Surabaya, Indonesia","institution_ids":["https://openalex.org/I205133468"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042525390","display_name":"Aziz Fajar","orcid":"https://orcid.org/0000-0002-1393-3470"},"institutions":[{"id":"https://openalex.org/I205133468","display_name":"Airlangga University","ror":"https://ror.org/04ctejd88","country_code":"ID","type":"education","lineage":["https://openalex.org/I205133468"]}],"countries":["ID"],"is_corresponding":false,"raw_author_name":"Aziz Fajar","raw_affiliation_strings":["Universitas Airlangga,Data Science Technology Faculty of Advanced Technology and Multidisipline,Surabaya,Indonesia","Data Science Technology Faculty of Advanced Technology and Multidisipline, Universitas Airlangga, Surabaya, Indonesia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Universitas Airlangga,Data Science Technology Faculty of Advanced Technology and Multidisipline,Surabaya,Indonesia","institution_ids":["https://openalex.org/I205133468"]},{"raw_affiliation_string":"Data Science Technology Faculty of Advanced Technology and Multidisipline, Universitas Airlangga, Surabaya, Indonesia","institution_ids":["https://openalex.org/I205133468"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017573135","display_name":"Mahmud Iwan Solihin","orcid":"https://orcid.org/0000-0002-5293-7466"},"institutions":[{"id":"https://openalex.org/I55285296","display_name":"UCSI University","ror":"https://ror.org/019787q29","country_code":"MY","type":"education","lineage":["https://openalex.org/I55285296"]}],"countries":["MY"],"is_corresponding":false,"raw_author_name":"Mahmud Iwan Solihin","raw_affiliation_strings":["Technology and Built Environment, UCSI University,Mechanical Engineering Faculty of Engineering,Kuala Lumpur,Malaysia","Mechanical Engineering Faculty of Engineering, Technology and Built Environment, UCSI University, Kuala Lumpur, Malaysia"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Technology and Built Environment, UCSI University,Mechanical Engineering Faculty of Engineering,Kuala Lumpur,Malaysia","institution_ids":["https://openalex.org/I55285296"]},{"raw_affiliation_string":"Mechanical Engineering Faculty of Engineering, Technology and Built Environment, UCSI University, Kuala Lumpur, Malaysia","institution_ids":["https://openalex.org/I55285296"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3055,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.60598845,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"19","issue":null,"first_page":"242","last_page":"247"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9930999875068665,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11710","display_name":"Biomedical Text Mining and Ontologies","score":0.9922999739646912,"subfield":{"id":"https://openalex.org/subfields/1312","display_name":"Molecular Biology"},"field":{"id":"https://openalex.org/fields/13","display_name":"Biochemistry, Genetics and Molecular Biology"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7791603803634644},{"id":"https://openalex.org/keywords/indonesian","display_name":"Indonesian","score":0.60648113489151},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.5921629667282104},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.5071957111358643},{"id":"https://openalex.org/keywords/data-retrieval","display_name":"Data retrieval","score":0.5055034160614014},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.401854008436203},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.07350274920463562}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7791603803634644},{"id":"https://openalex.org/C2779207338","wikidata":"https://www.wikidata.org/wiki/Q9240","display_name":"Indonesian","level":2,"score":0.60648113489151},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.5921629667282104},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.5071957111358643},{"id":"https://openalex.org/C551230270","wikidata":"https://www.wikidata.org/wiki/Q4368942","display_name":"Data retrieval","level":2,"score":0.5055034160614014},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.401854008436203},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.07350274920463562},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/kst61284.2024.10499674","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/kst61284.2024.10499674","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 16th International Conference on Knowledge and Smart Technology (KST)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5099999904632568}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1786079047","https://openalex.org/W2087696423","https://openalex.org/W2131744502","https://openalex.org/W2148972377","https://openalex.org/W2170245882","https://openalex.org/W2517736607","https://openalex.org/W2536015822","https://openalex.org/W2536723159","https://openalex.org/W2539671052","https://openalex.org/W2578432654","https://openalex.org/W2610935556","https://openalex.org/W2896457183","https://openalex.org/W3016473712","https://openalex.org/W3158608480","https://openalex.org/W3175526344","https://openalex.org/W3197008538","https://openalex.org/W3198073108","https://openalex.org/W4294991509","https://openalex.org/W4300427681","https://openalex.org/W4301466821","https://openalex.org/W4321435313","https://openalex.org/W4361989158","https://openalex.org/W4389921502"],"related_works":["https://openalex.org/W3204019825","https://openalex.org/W166528628","https://openalex.org/W2349208793","https://openalex.org/W3071741001","https://openalex.org/W2239628679","https://openalex.org/W226599711","https://openalex.org/W2377391927","https://openalex.org/W1588529408","https://openalex.org/W2163096760","https://openalex.org/W1566389542"],"abstract_inverted_index":{"Lexical":[0],"or":[1],"statistical":[2],"information":[3,89],"retrieval":[4,90,126,141,161],"confronts":[5],"challenges":[6],"such":[7,178],"as":[8,110,120,179],"the":[9,16,51,72,104,125,133,139,157,220],"semantic":[10,52,60,94,108,118,136,158,189,224],"gap":[11,53],"and":[12,34,46,95,159,183,196,225],"vocabulary":[13],"mismatch.":[14],"In":[15,83,98],"context":[17],"of":[18,38,74,124,135,222],"medical":[19,39,55],"data,":[20],"these":[21,64],"difficulties":[22],"are":[23,163],"compounded":[24],"by":[25,116],"users'":[26],"diverse":[27],"backgrounds,":[28],"resulting":[29,228],"in":[30,32,54,71,138,229,233],"disparities":[31],"perspective":[33],"vocabulary.":[35],"The":[36,152,172],"intricacies":[37],"language,":[40],"including":[41,191],"spelling":[42],"variations,":[43],"frequent":[44],"acronyms,":[45],"ambiguous":[47],"concepts,":[48],"further":[49],"amplify":[50],"texts.":[56],"However,":[57],"adopting":[58],"a":[59,68,75,87,121],"approach":[61,114],"can":[62],"address":[63],"issues,":[65],"albeit":[66],"introducing":[67],"new":[69],"challenge":[70],"form":[73],"soft":[76],"matching":[77],"nature":[78],"leading":[79],"to":[80,100,131,166,203],"lower":[81],"recall.":[82],"response,":[84],"we":[85],"propose":[86],"hybrid":[88,209],"method":[91,174],"that":[92],"combines":[93],"lexical":[96,160,176,226],"approaches.":[97],"contrast":[99],"recent":[101],"experiments":[102],"with":[103,188],"emphasis":[105],"on":[106,147,219],"utilizing":[107],"methods":[109,177],"re-ranker,":[111],"our":[112],"current":[113],"diverges":[115],"incorporating":[117],"techniques":[119],"fundamental":[122],"part":[123],"model.":[127],"This":[128,214],"shift":[129],"aims":[130],"explore":[132],"efficacy":[134],"methodologies":[137],"initial":[140],"stage":[142],"rather":[143],"than":[144,207],"exclusively":[145],"relying":[146],"them":[148],"for":[149],"post-retrieval":[150],"refinement.":[151],"results":[153],"obtained":[154],"from":[155],"both":[156,223],"approaches":[162],"subsequently":[164],"subjected":[165],"reranking":[167],"through":[168],"Reciprocal":[169],"Rank":[170],"Fusion.":[171],"proposed":[173],"outperforms":[175],"BM25L,":[180],"Jaccard":[181],"Similarity,":[182],"Query":[184],"Likelihood":[185],"Model,":[186],"along":[187],"methods,":[190,227],"doc2vec,":[192],"multilingual":[193],"BERT,":[194],"IndoBERT,":[195],"MiniLM.":[197],"It":[198],"has":[199,216],"additionally":[200],"been":[201],"demonstrated":[202],"be":[204],"more":[205],"effective":[206],"other":[208],"models,":[210],"PLM-based":[211],"dense":[212],"retrieval.":[213],"technique":[215],"successfully":[217],"capitalized":[218],"strengths":[221],"enhanced":[230],"overall":[231],"performance":[232],"retrieving":[234],"relevant":[235],"documents.":[236]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
