{"id":"https://openalex.org/W4224685053","doi":"https://doi.org/10.1145/3477495.3531991","title":"Human Preferences as Dueling Bandits","display_name":"Human Preferences as Dueling Bandits","publication_year":2022,"publication_date":"2022-07-06","ids":{"openalex":"https://openalex.org/W4224685053","doi":"https://doi.org/10.1145/3477495.3531991"},"language":"en","primary_location":{"id":"doi:10.1145/3477495.3531991","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3477495.3531991","pdf_url":null,"source":{"id":"https://openalex.org/S4363608773","display_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2204.10362","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101018904","display_name":"Xinyi Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":true,"raw_author_name":"Xinyi Yan","raw_affiliation_strings":["University of Waterloo, Waterloo, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079520606","display_name":"Chengxi Luo","orcid":"https://orcid.org/0009-0000-3733-1717"},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Chengxi Luo","raw_affiliation_strings":["University of Waterloo, Waterloo, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5112750759","display_name":"Charles L. A. Clarke","orcid":null},"institutions":[{"id":"https://openalex.org/I151746483","display_name":"University of Waterloo","ror":"https://ror.org/01aff2v68","country_code":"CA","type":"education","lineage":["https://openalex.org/I151746483"]}],"countries":["CA"],"is_corresponding":false,"raw_author_name":"Charles L. A. Clarke","raw_affiliation_strings":["University of Waterloo, Waterloo, ON, Canada"],"affiliations":[{"raw_affiliation_string":"University of Waterloo, Waterloo, ON, Canada","institution_ids":["https://openalex.org/I151746483"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5055132321","display_name":"Nick Craswell","orcid":"https://orcid.org/0000-0002-9351-8137"},"institutions":[{"id":"https://openalex.org/I4210108985","display_name":"Bellevue Hospital Center","ror":"https://ror.org/01ky34z31","country_code":"US","type":"healthcare","lineage":["https://openalex.org/I1283621791","https://openalex.org/I4210086933","https://openalex.org/I4210108985"]},{"id":"https://openalex.org/I1290206253","display_name":"Microsoft (United States)","ror":"https://ror.org/00d0nc645","country_code":"US","type":"company","lineage":["https://openalex.org/I1290206253"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Nick Craswell","raw_affiliation_strings":["Microsoft, Bellevue, WA, USA"],"affiliations":[{"raw_affiliation_string":"Microsoft, Bellevue, WA, USA","institution_ids":["https://openalex.org/I1290206253","https://openalex.org/I4210108985"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5028019543","display_name":"Ellen M. Voorhees","orcid":"https://orcid.org/0000-0002-5658-2308"},"institutions":[{"id":"https://openalex.org/I1321296531","display_name":"National Institute of Standards and Technology","ror":"https://ror.org/05xpvk416","country_code":"US","type":"funder","lineage":["https://openalex.org/I1321296531","https://openalex.org/I1343035065"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ellen M. Voorhees","raw_affiliation_strings":["National Institute of Standards and Technology, Gaithersburg, MD, USA"],"affiliations":[{"raw_affiliation_string":"National Institute of Standards and Technology, Gaithersburg, MD, USA","institution_ids":["https://openalex.org/I1321296531"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5052940596","display_name":"Pablo Castells","orcid":"https://orcid.org/0000-0003-0668-6317"},"institutions":[{"id":"https://openalex.org/I63634437","display_name":"Universidad Aut\u00f3noma de Madrid","ror":"https://ror.org/01cby8j38","country_code":"ES","type":"education","lineage":["https://openalex.org/I63634437"]}],"countries":["ES"],"is_corresponding":false,"raw_author_name":"Pablo Castells","raw_affiliation_strings":["Universidad Aut\u00f3noma de Madrid, Madrid, Spain"],"affiliations":[{"raw_affiliation_string":"Universidad Aut\u00f3noma de Madrid, Madrid, Spain","institution_ids":["https://openalex.org/I63634437"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101018904"],"corresponding_institution_ids":["https://openalex.org/I151746483"],"apc_list":null,"apc_paid":null,"fwci":1.5487,"has_fulltext":true,"cited_by_count":7,"citation_normalized_percentile":{"value":0.82486772,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"567","last_page":"577"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12072","display_name":"Machine Learning and Algorithms","score":0.9976999759674072,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.74537193775177},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.7342147827148438},{"id":"https://openalex.org/keywords/preference","display_name":"Preference","score":0.7077709436416626},{"id":"https://openalex.org/keywords/preference-learning","display_name":"Preference learning","score":0.5940690636634827},{"id":"https://openalex.org/keywords/relevance","display_name":"Relevance (law)","score":0.589965283870697},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5177128314971924},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.5041760206222534},{"id":"https://openalex.org/keywords/test","display_name":"Test (biology)","score":0.48079195618629456},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.4555072784423828},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.10569587349891663}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.74537193775177},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.7342147827148438},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.7077709436416626},{"id":"https://openalex.org/C181204326","wikidata":"https://www.wikidata.org/wiki/Q7239820","display_name":"Preference learning","level":3,"score":0.5940690636634827},{"id":"https://openalex.org/C158154518","wikidata":"https://www.wikidata.org/wiki/Q7310970","display_name":"Relevance (law)","level":2,"score":0.589965283870697},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5177128314971924},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.5041760206222534},{"id":"https://openalex.org/C2777267654","wikidata":"https://www.wikidata.org/wiki/Q3519023","display_name":"Test (biology)","level":2,"score":0.48079195618629456},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.4555072784423828},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.10569587349891663},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C151730666","wikidata":"https://www.wikidata.org/wiki/Q7205","display_name":"Paleontology","level":1,"score":0.0}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1145/3477495.3531991","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3477495.3531991","pdf_url":null,"source":{"id":"https://openalex.org/S4363608773","display_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 45th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2204.10362","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.10362","pdf_url":"https://arxiv.org/pdf/2204.10362","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:repositorio.uam.es:10486/711205","is_oa":true,"landing_page_url":"http://hdl.handle.net/10486/711205","pdf_url":"https://repositorio.uam.es/bitstream/10486/711205/1/human_yan_SIGIR_2022.pdf","source":{"id":"https://openalex.org/S4306400963","display_name":"Biblos-e Archivo (Universidad Aut\u00f3noma de Madrid)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I63634437","host_organization_name":"Universidad Aut\u00f3noma de Madrid","host_organization_lineage":["https://openalex.org/I63634437"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"conferenceObject"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2204.10362","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2204.10362","pdf_url":"https://arxiv.org/pdf/2204.10362","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[{"score":0.49000000953674316,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":39,"referenced_works":["https://openalex.org/W1989344419","https://openalex.org/W2004918107","https://openalex.org/W2009948657","https://openalex.org/W2015236210","https://openalex.org/W2031459112","https://openalex.org/W2043457403","https://openalex.org/W2072615624","https://openalex.org/W2081242122","https://openalex.org/W2109244020","https://openalex.org/W2126559945","https://openalex.org/W2127131211","https://openalex.org/W2155961949","https://openalex.org/W2159048649","https://openalex.org/W2343707533","https://openalex.org/W2500119194","https://openalex.org/W2569307494","https://openalex.org/W2587627907","https://openalex.org/W2614730337","https://openalex.org/W2751647711","https://openalex.org/W2798782484","https://openalex.org/W2799108077","https://openalex.org/W2883737864","https://openalex.org/W2903058329","https://openalex.org/W2911563201","https://openalex.org/W2946248329","https://openalex.org/W3034858659","https://openalex.org/W3035278698","https://openalex.org/W3048156405","https://openalex.org/W3085534303","https://openalex.org/W3151947762","https://openalex.org/W3152534132","https://openalex.org/W3152624702","https://openalex.org/W3159852056","https://openalex.org/W3175111331","https://openalex.org/W3188970555","https://openalex.org/W3196754070","https://openalex.org/W3201860539","https://openalex.org/W4224316921","https://openalex.org/W4289743144"],"related_works":["https://openalex.org/W4205262062","https://openalex.org/W2002629668","https://openalex.org/W181477314","https://openalex.org/W1515481220","https://openalex.org/W2060303324","https://openalex.org/W4206238124","https://openalex.org/W4324116389","https://openalex.org/W2161073979","https://openalex.org/W3126212998","https://openalex.org/W2516425091"],"abstract_inverted_index":{"The":[0],"dramatic":[1],"improvements":[2],"in":[3,26],"core":[4],"information":[5],"retrieval":[6],"tasks":[7],"engendered":[8],"by":[9,105,208,218],"neural":[10],"rankers":[11,104],"create":[12],"a":[13,66,82,125,147],"need":[14],"for":[15,98,135,149,160,191,245,267,292],"novel":[16],"evaluation":[17,138,151,288],"methods.":[18],"If":[19,87],"every":[20],"ranker":[21,137],"returns":[22],"highly":[23],"relevant":[24],"items":[25,63,70,97,111,123,175],"the":[27,74,78,94,118,158,186,204,258,273,284],"top":[28],"ranks,":[29],"it":[30,183],"becomes":[31],"difficult":[32],"to":[33,40,55,81,92,108,180,230,252,272],"recognize":[34],"meaningful":[35],"differences":[36],"between":[37],"them":[38],"and":[39,72,182,289,295],"build":[41],"reusable":[42],"test":[43,228,283],"collections.":[44],"Several":[45],"recent":[46],"papers":[47,131],"explore":[48,132],"pairwise":[49],"preference":[50,90,154,165,220,265],"judgments":[51,91,189,266],"as":[52,112,114,124,146],"an":[53,200],"alternative":[54],"traditional":[56],"graded":[57],"relevance":[58],"assessments.":[59],"Rather":[60],"than":[61],"viewing":[62],"one":[64,75,241],"at":[65],"time,":[67],"assessors":[68],"view":[69],"side-by-side":[71],"indicate":[73],"that":[76,214],"provides":[77],"better":[79],"response":[80],"query,":[83,100],"allowing":[84],"fine-grained":[85],"distinctions.":[86],"we":[88,101,222,261],"employ":[89],"identify":[93],"probably":[95],"best":[96,122],"each":[99,196],"can":[102],"measure":[103],"their":[106,234],"ability":[107],"place":[109],"these":[110,239],"high":[113],"possible.":[115],"We":[116,156,282],"frame":[117],"problem":[119],"of":[120,188,286],"finding":[121],"dueling":[126,133],"bandits":[127,134],"problem.":[128],"While":[129],"many":[130],"online":[136],"via":[139,152],"interleaving,":[140],"they":[141],"have":[142],"not":[143,216],"been":[144],"considered":[145],"framework":[148],"offline":[150],"human":[153,164,219],"judgments.":[155],"review":[157],"literature":[159],"possible":[161],"solutions.":[162],"For":[163],"judgments,":[166,221],"any":[167,192],"usable":[168],"algorithm":[169,242],"must":[170,184],"tolerate":[171],"ties,":[172],"since":[173,195],"two":[174],"may":[176],"appear":[177],"nearly":[178],"equal":[179],"assessors,":[181],"minimize":[185],"number":[187],"required":[190],"specific":[193],"pair,":[194],"such":[197],"comparison":[198],"requires":[199],"independent":[201],"assessor.":[202],"Since":[203],"theoretical":[205,294],"guarantees":[206],"provided":[207],"most":[209],"algorithms":[210,225],"depend":[211],"on":[212,226,238],"assumptions":[213],"are":[215],"satisfied":[217],"simulate":[223],"selected":[224],"representative":[227],"cases":[229],"provide":[231],"insight":[232],"into":[233],"practical":[235,296],"utility.":[236],"Based":[237],"simulations,":[240],"stands":[243],"out":[244],"its":[246,255,280],"potential.":[247],"Our":[248],"simulations":[249],"suggest":[250,290],"modifications":[251],"further":[253,293],"improve":[254],"performance.":[256],"Using":[257],"modified":[259],"algorithm,":[260],"collect":[262],"over":[263],"10,000":[264],"pools":[268],"derived":[269],"from":[270],"submissions":[271],"TREC":[274],"2021":[275],"Deep":[276],"Learning":[277],"Track,":[278],"confirming":[279],"suitability.":[281],"idea":[285],"best-item":[287],"ideas":[291],"progress.":[297]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":2}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
