{"id":"https://openalex.org/W4416078567","doi":"https://doi.org/10.1145/3746252.3760824","title":"TwinBandit Prompt Optimizer: Adaptive Prompt Optimization via Synergistic Dual MAB-Guided Feedback","display_name":"TwinBandit Prompt Optimizer: Adaptive Prompt Optimization via Synergistic Dual MAB-Guided Feedback","publication_year":2025,"publication_date":"2025-11-10","ids":{"openalex":"https://openalex.org/W4416078567","doi":"https://doi.org/10.1145/3746252.3760824"},"language":null,"primary_location":{"id":"doi:10.1145/3746252.3760824","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746252.3760824","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5112714877","display_name":"Young-Joon Park","orcid":"https://orcid.org/0009-0000-2177-0563"},"institutions":[{"id":"https://openalex.org/I28927889","display_name":"IQVIA (United Kingdom)","ror":"https://ror.org/040g76k92","country_code":"GB","type":"company","lineage":["https://openalex.org/I28927889","https://openalex.org/I4210108991"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Young-Joon Park","raw_affiliation_strings":["Agilesoda, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0000-2177-0563","affiliations":[{"raw_affiliation_string":"Agilesoda, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I28927889"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5091841817","display_name":"Seong-Ryeong Lee","orcid":"https://orcid.org/0009-0009-0594-3052"},"institutions":[{"id":"https://openalex.org/I28927889","display_name":"IQVIA (United Kingdom)","ror":"https://ror.org/040g76k92","country_code":"GB","type":"company","lineage":["https://openalex.org/I28927889","https://openalex.org/I4210108991"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Seong-Ryeong Lee","raw_affiliation_strings":["Agilesoda, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0009-0594-3052","affiliations":[{"raw_affiliation_string":"Agilesoda, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I28927889"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025543654","display_name":"Anh-Dung Vo","orcid":"https://orcid.org/0000-0002-4363-2177"},"institutions":[{"id":"https://openalex.org/I28927889","display_name":"IQVIA (United Kingdom)","ror":"https://ror.org/040g76k92","country_code":"GB","type":"company","lineage":["https://openalex.org/I28927889","https://openalex.org/I4210108991"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Anh-Dung Vo","raw_affiliation_strings":["Agilesoda, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0000-0002-4363-2177","affiliations":[{"raw_affiliation_string":"Agilesoda, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I28927889"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112524412","display_name":"Min Jung","orcid":"https://orcid.org/0009-0004-7610-8090"},"institutions":[{"id":"https://openalex.org/I28927889","display_name":"IQVIA (United Kingdom)","ror":"https://ror.org/040g76k92","country_code":"GB","type":"company","lineage":["https://openalex.org/I28927889","https://openalex.org/I4210108991"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Minsung Jung","raw_affiliation_strings":["Agilesoda, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0004-7610-8090","affiliations":[{"raw_affiliation_string":"Agilesoda, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I28927889"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5113755242","display_name":"Daewoo Choi","orcid":"https://orcid.org/0009-0004-4540-3564"},"institutions":[{"id":"https://openalex.org/I83436808","display_name":"Hankuk University of Foreign Studies","ror":"https://ror.org/051q2m369","country_code":"KR","type":"education","lineage":["https://openalex.org/I83436808"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Daewoo Choi","raw_affiliation_strings":["Hankuk University of Foreign Studies, Seoul, Republic of Korea"],"raw_orcid":"https://orcid.org/0009-0004-4540-3564","affiliations":[{"raw_affiliation_string":"Hankuk University of Foreign Studies, Seoul, Republic of Korea","institution_ids":["https://openalex.org/I83436808"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5112714877"],"corresponding_institution_ids":["https://openalex.org/I28927889"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17359865,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"5115","last_page":"5119"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.4717000126838684,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12535","display_name":"Machine Learning and Data Classification","score":0.4717000126838684,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.09449999779462814,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.044199999421834946,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.5945000052452087},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.5654000043869019},{"id":"https://openalex.org/keywords/dual","display_name":"Dual (grammatical number)","score":0.4307999908924103},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.4189000129699707},{"id":"https://openalex.org/keywords/selection","display_name":"Selection (genetic algorithm)","score":0.4020000100135803},{"id":"https://openalex.org/keywords/adaptation","display_name":"Adaptation (eye)","score":0.39469999074935913},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.3646000027656555},{"id":"https://openalex.org/keywords/probabilistic-logic","display_name":"Probabilistic logic","score":0.3481999933719635}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7027999758720398},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.5945000052452087},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.5654000043869019},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.4307999908924103},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.4189000129699707},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4171999990940094},{"id":"https://openalex.org/C81917197","wikidata":"https://www.wikidata.org/wiki/Q628760","display_name":"Selection (genetic algorithm)","level":2,"score":0.4020000100135803},{"id":"https://openalex.org/C139807058","wikidata":"https://www.wikidata.org/wiki/Q352374","display_name":"Adaptation (eye)","level":2,"score":0.39469999074935913},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.3646000027656555},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.35910001397132874},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.3481999933719635},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.3244999945163727},{"id":"https://openalex.org/C167393769","wikidata":"https://www.wikidata.org/wiki/Q4680768","display_name":"Adaptive strategies","level":2,"score":0.3010999858379364},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.2985999882221222},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.29670000076293945},{"id":"https://openalex.org/C165464430","wikidata":"https://www.wikidata.org/wiki/Q1570441","display_name":"Parameterized complexity","level":2,"score":0.2937999963760376},{"id":"https://openalex.org/C149672232","wikidata":"https://www.wikidata.org/wiki/Q337048","display_name":"Adaptive optimization","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C61326573","wikidata":"https://www.wikidata.org/wiki/Q1496376","display_name":"Gaussian process","level":3,"score":0.26339998841285706},{"id":"https://openalex.org/C52970973","wikidata":"https://www.wikidata.org/wiki/Q2497134","display_name":"Adaptive system","level":2,"score":0.2590000033378601},{"id":"https://openalex.org/C2780735816","wikidata":"https://www.wikidata.org/wiki/Q28324931","display_name":"Incremental learning","level":2,"score":0.25859999656677246}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746252.3760824","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746252.3760824","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":4,"referenced_works":["https://openalex.org/W3038620866","https://openalex.org/W4234228486","https://openalex.org/W4385573003","https://openalex.org/W4416035346"],"related_works":[],"abstract_inverted_index":{"A":[0,91],"common":[1,193],"deficiency":[2],"in":[3,17],"Automatic":[4],"Prompt":[5,36],"Engineering":[6],"(APE)":[7],"is":[8,207],"the":[9,20,66,99,104,138,176],"failure":[10,15],"to":[11,56,82,120,137,163],"strategically":[12,146,190],"employ":[13],"specific":[14],"feedback":[16,74],"concert":[18],"with":[19,124],"adaptive":[21,52,186],"and":[22,86,97,117,148,185,195],"coordinated":[23],"selection":[24],"of":[25,107,152],"diverse":[26],"generation":[27,199],"strategies.":[28],"To":[29],"address":[30,129],"this":[31,135],"deficiency,":[32],"we":[33],"introduce":[34],"TwinBandit":[35],"Optimizer":[37],"(TBPO),":[38],"an":[39,72],"APE":[40,165,187],"framework":[41],"that":[42,127,157],"employs":[43],"a":[44,143,150,169,182,202],"synergistic":[45],"dual":[46],"Multi-Armed":[47],"Bandit":[48],"(MAB)":[49],"mechanism":[50],"for":[51,77,201],"prompt":[53,84],"generation,":[54],"applicable":[55],"black-box":[57],"Large":[58],"Language":[59],"Models":[60],"(LLMs).":[61],"The":[62],"first":[63],"MAB":[64,93],"identifies":[65],"most":[67],"challenging":[68,131],"training":[69],"instances,":[70],"informing":[71],"LLM-driven":[73],"pipeline":[75],"responsible":[76],"generating":[78,147],"(1)":[79],"parameterized":[80],"changes":[81,101],"guide":[83],"evolution":[85],"(2)":[87],"n-shot":[88,118],"example":[89],"configurations.":[90],"second":[92],"then":[94,112],"adaptively":[95],"selects":[96],"ranks":[98],"proposed":[100],"based":[102],"on":[103,175],"empirical":[105],"performance":[106,161],"previously":[108],"generated":[109],"prompts.":[110,154],"TBPO":[111,141,158],"combines":[113],"these":[114,130],"ranked":[115],"modifications":[116],"configurations":[119],"generate":[121],"child":[122],"prompts":[123],"targeted":[125,184],"enhancements":[126],"specifically":[128],"instances.":[132],"Iteratively":[133],"applying":[134],"process":[136],"best-performing":[139],"prompts,":[140],"forms":[142],"closed-loop":[144],"cycle,":[145],"exploring":[149],"tree":[151],"enhanced":[153],"Benchmarking":[155],"shows":[156],"achieves":[159],"stronger":[160],"compared":[162],"state-of-the-art":[164],"baselines,":[166],"highlighted":[167],"by":[168,189],"3.87%":[170],"higher":[171],"exact":[172],"match":[173],"rate":[174],"GPQA-Diamond":[177],"dataset.":[178,204],"Our":[179],"approach":[180],"offers":[181],"more":[183],"method":[188],"learning":[191],"from":[192],"failures":[194],"leveraging":[196],"empirically":[197],"validated":[198],"strategies":[200],"given":[203],"More":[205],"information":[206],"available":[208],"at":[209],"https://github.com/yjpark-pub/tbpo_release.":[210]},"counts_by_year":[],"updated_date":"2025-11-28T09:49:17.034403","created_date":"2025-11-10T00:00:00"}
