{"id":"https://openalex.org/W4403582536","doi":"https://doi.org/10.1145/3627673.3680040","title":"Sequential Optimum Test with Multi-armed Bandits for Online Experimentation","display_name":"Sequential Optimum Test with Multi-armed Bandits for Online Experimentation","publication_year":2024,"publication_date":"2024-10-20","ids":{"openalex":"https://openalex.org/W4403582536","doi":"https://doi.org/10.1145/3627673.3680040"},"language":"en","primary_location":{"id":"doi:10.1145/3627673.3680040","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3627673.3680040","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5091538328","display_name":"Fang Kong","orcid":"https://orcid.org/0000-0002-8148-8911"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Fang Kong","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-8148-8911","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Penglei Zhao","orcid":"https://orcid.org/0009-0004-6840-5343"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Penglei Zhao","raw_affiliation_strings":["Tencent Inc., Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0004-6840-5343","affiliations":[{"raw_affiliation_string":"Tencent Inc., Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102573146","display_name":"Shichao Han","orcid":null},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shichao Han","raw_affiliation_strings":["Tencent Inc., Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0005-1217-3966","affiliations":[{"raw_affiliation_string":"Tencent Inc., Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5026783600","display_name":"Yong Qi Wang","orcid":"https://orcid.org/0009-0009-4464-352X"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Wang","raw_affiliation_strings":["Tencent Inc., Shenzhen, China"],"raw_orcid":"https://orcid.org/0009-0009-4464-352X","affiliations":[{"raw_affiliation_string":"Tencent Inc., Shenzhen, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5066355409","display_name":"Shuai Li","orcid":"https://orcid.org/0000-0002-3935-0708"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuai Li","raw_affiliation_strings":["Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0002-3935-0708","affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5091538328"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.21897137,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4645","last_page":"4652"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10848","display_name":"Advanced Multi-Objective Optimization Algorithms","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12814","display_name":"Gaussian Processes and Bayesian Inference","score":0.9560999870300293,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7336277961730957},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.7331398129463196},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38629308342933655}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7336277961730957},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.7331398129463196},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38629308342933655},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3627673.3680040","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3627673.3680040","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 33rd ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":18,"referenced_works":["https://openalex.org/W1504908594","https://openalex.org/W1556779599","https://openalex.org/W1861050369","https://openalex.org/W2017919516","https://openalex.org/W2147967768","https://openalex.org/W2590512785","https://openalex.org/W2604738573","https://openalex.org/W2744538883","https://openalex.org/W2963366444","https://openalex.org/W3003196782","https://openalex.org/W3008801451","https://openalex.org/W3166445665","https://openalex.org/W3166853481","https://openalex.org/W3190343448","https://openalex.org/W4290943465","https://openalex.org/W4381785738","https://openalex.org/W6707756096","https://openalex.org/W6795501815"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"In":[0,111],"large-scale":[1],"online":[2],"experimentation":[3],"platforms,":[4],"experimenters":[5],"aim":[6],"to":[7,77,118,125,141,192,195,268],"discover":[8],"the":[9,38,48,53,61,69,79,96,106,114,120,132,145,148,171,198,210,213,218,221,227,231,243,251,270],"best":[10],"treatment":[11],"(arm)":[12],"among":[13],"multiple":[14],"candidates.":[15],"Traditional":[16],"A/B":[17,72,181,214],"testing":[18,64,73,80,182,215,219],"and":[19,74,90,105,180,230,246,261],"multi-armed":[20],"bandits":[21],"(MAB)":[22],"algorithms":[23,76,176,233],"are":[24,266],"two":[25,104],"popular":[26],"designs.":[27],"The":[28,237],"former":[29],"usually":[30,101],"achieves":[31],"a":[32,44,127,154],"higher":[33],"power":[34,81],"but":[35,59],"may":[36],"hurt":[37],"customers'":[39,54],"satisfaction":[40],"when":[41],"always":[42],"recommending":[43],"poor":[45],"arm,":[46],"while":[47,82],"latter":[49],"aims":[50],"at":[51],"improving":[52],"experience":[55],"(collecting":[56],"more":[57,84,155],"rewards)":[58],"faces":[60],"loss":[62],"of":[63,71,98,134,173,212,250,256,272],"power.":[65],"Recently,":[66],"[26]":[67],"combine":[68],"advantage":[70,211],"MAB":[75,175,232],"maximize":[78],"maintaining":[83],"rewards":[85,179],"for":[86],"experiments":[87,257],"with":[88,131,165,206,276],"two-arm":[89],"Bernoulli":[91],"rewards.":[92,236],"However,":[93],"in":[94,177,183,216,225,234],"practice,":[95],"number":[97],"arms":[99],"is":[100],"larger":[102],"than":[103],"reward":[107,167],"type":[108],"also":[109],"varies.":[110],"multi-arm":[112],"experiments,":[113],"required":[115],"sample":[116,228],"size":[117],"find":[119],"optimal":[121],"arm":[122,135],"blows":[123],"up":[124],"guarantee":[126],"false":[128],"discovery":[129],"rate":[130],"increase":[133],"numbers,":[136],"bringing":[137],"high":[138],"opportunity":[139],"costs":[140],"experimenters.":[142],"To":[143],"save":[144],"cost":[146],"during":[147],"long":[149],"experimental":[150],"process,":[151],"we":[152,186],"propose":[153,187],"efficient":[156],"sequential":[157,222],"test":[158,223],"framework":[159,194],"named":[160],"Soptima":[161,207],"that":[162],"can":[163],"work":[164],"general":[166],"types.":[168],"Inspired":[169],"by":[170],"design":[172],"traditional":[174],"chasing":[178],"maximizing":[184,217],"power,":[185,220],"an":[188],"Elimination-type":[189],"strategy":[190,204],"adapted":[191],"this":[193],"dynamically":[196],"adjust":[197],"traffic":[199],"split":[200],"on":[201,242],"arms.":[202],"This":[203],"cooperating":[205],"simultaneously":[208],"maintains":[209],"methods":[224],"saving":[226],"size,":[229],"collecting":[235],"theoretical":[238],"analysis":[239],"gives":[240],"guarantees":[241],"Type-I,":[244],"Type-II,":[245],"optimality":[247],"error":[248],"rates":[249],"proposed":[252],"approach.":[253],"A":[254],"series":[255],"from":[258],"both":[259],"simulation":[260],"industrial":[262],"historical":[263],"data":[264],"sets":[265],"conducted":[267],"verify":[269],"superiority":[271],"our":[273],"approach":[274],"compared":[275],"available":[277],"baselines.":[278]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
