{"id":"https://openalex.org/W4384625752","doi":"https://doi.org/10.1145/3539618.3591865","title":"How Well do Offline Metrics Predict Online Performance of Product Ranking Models?","display_name":"How Well do Offline Metrics Predict Online Performance of Product Ranking Models?","publication_year":2023,"publication_date":"2023-07-18","ids":{"openalex":"https://openalex.org/W4384625752","doi":"https://doi.org/10.1145/3539618.3591865"},"language":"en","primary_location":{"id":"doi:10.1145/3539618.3591865","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3539618.3591865","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 46th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3539618.3591865","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100351306","display_name":"Xiaojie Wang","orcid":"https://orcid.org/0000-0003-2565-5831"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiaojie Wang","raw_affiliation_strings":["Amazon.com, Palo Alto, CA, USA"],"raw_orcid":"https://orcid.org/0000-0003-2565-5831","affiliations":[{"raw_affiliation_string":"Amazon.com, Palo Alto, CA, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069584457","display_name":"Ruoyuan Gao","orcid":"https://orcid.org/0000-0002-8784-4171"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ruoyuan Gao","raw_affiliation_strings":["Amazon.com, Palo Alto, CA, USA"],"raw_orcid":"https://orcid.org/0000-0002-8784-4171","affiliations":[{"raw_affiliation_string":"Amazon.com, Palo Alto, CA, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101446981","display_name":"Anoop Jain","orcid":"https://orcid.org/0009-0002-5542-6191"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anoop Jain","raw_affiliation_strings":["Amazon.com, Palo Alto, CA, USA"],"raw_orcid":"https://orcid.org/0009-0002-5542-6191","affiliations":[{"raw_affiliation_string":"Amazon.com, Palo Alto, CA, USA","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079016988","display_name":"Graham Edge","orcid":"https://orcid.org/0009-0009-9730-808X"},"institutions":[{"id":"https://openalex.org/I1311688040","display_name":"Amazon (United States)","ror":"https://ror.org/04mv4n011","country_code":"US","type":"company","lineage":["https://openalex.org/I1311688040"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Graham Edge","raw_affiliation_strings":["Amazon.com, Seattle, WA, USA"],"raw_orcid":"https://orcid.org/0009-0009-9730-808X","affiliations":[{"raw_affiliation_string":"Amazon.com, Seattle, WA, USA","institution_ids":["https://openalex.org/I1311688040"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5062448275","display_name":"Sachin Ahuja","orcid":"https://orcid.org/0009-0000-2156-0128"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sachin Ahuja","raw_affiliation_strings":["Amazon.com, Palo Alto, CA, USA"],"raw_orcid":"https://orcid.org/0009-0000-2156-0128","affiliations":[{"raw_affiliation_string":"Amazon.com, Palo Alto, CA, USA","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.5881,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.91389074,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"3415","last_page":"3420"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/discriminative-model","display_name":"Discriminative model","score":0.8445419073104858},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.7968287467956543},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.7502789497375488},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7303448915481567},{"id":"https://openalex.org/keywords/learning-to-rank","display_name":"Learning to rank","score":0.6608126759529114},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.6008392572402954},{"id":"https://openalex.org/keywords/rank","display_name":"Rank (graph theory)","score":0.5799601674079895},{"id":"https://openalex.org/keywords/online-and-offline","display_name":"Online and offline","score":0.5544984936714172},{"id":"https://openalex.org/keywords/data-mining","display_name":"Data mining","score":0.543624997138977},{"id":"https://openalex.org/keywords/search-engine","display_name":"Search engine","score":0.42797213792800903},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4218946397304535},{"id":"https://openalex.org/keywords/predictive-power","display_name":"Predictive power","score":0.4157862961292267},{"id":"https://openalex.org/keywords/product","display_name":"Product (mathematics)","score":0.41047540307044983},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.34963878989219666},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.14396575093269348},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.1175224781036377}],"concepts":[{"id":"https://openalex.org/C97931131","wikidata":"https://www.wikidata.org/wiki/Q5282087","display_name":"Discriminative model","level":2,"score":0.8445419073104858},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.7968287467956543},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.7502789497375488},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7303448915481567},{"id":"https://openalex.org/C86037889","wikidata":"https://www.wikidata.org/wiki/Q4330127","display_name":"Learning to rank","level":3,"score":0.6608126759529114},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.6008392572402954},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.5799601674079895},{"id":"https://openalex.org/C2780102126","wikidata":"https://www.wikidata.org/wiki/Q10928179","display_name":"Online and offline","level":2,"score":0.5544984936714172},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.543624997138977},{"id":"https://openalex.org/C97854310","wikidata":"https://www.wikidata.org/wiki/Q19541","display_name":"Search engine","level":2,"score":0.42797213792800903},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4218946397304535},{"id":"https://openalex.org/C2778136018","wikidata":"https://www.wikidata.org/wiki/Q10350689","display_name":"Predictive power","level":2,"score":0.4157862961292267},{"id":"https://openalex.org/C90673727","wikidata":"https://www.wikidata.org/wiki/Q901718","display_name":"Product (mathematics)","level":2,"score":0.41047540307044983},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.34963878989219666},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.14396575093269348},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.1175224781036377},{"id":"https://openalex.org/C114614502","wikidata":"https://www.wikidata.org/wiki/Q76592","display_name":"Combinatorics","level":1,"score":0.0},{"id":"https://openalex.org/C111472728","wikidata":"https://www.wikidata.org/wiki/Q9471","display_name":"Epistemology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3539618.3591865","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3539618.3591865","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 46th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3539618.3591865","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3539618.3591865","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 46th International ACM SIGIR Conference on Research and Development in Information Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/10","display_name":"Reduced inequalities","score":0.7400000095367432}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":44,"referenced_works":["https://openalex.org/W1966835268","https://openalex.org/W1968927634","https://openalex.org/W1982530130","https://openalex.org/W1985514943","https://openalex.org/W1988619666","https://openalex.org/W2006811637","https://openalex.org/W2017292914","https://openalex.org/W2020018978","https://openalex.org/W2027382829","https://openalex.org/W2047221353","https://openalex.org/W2058896506","https://openalex.org/W2059120814","https://openalex.org/W2094790959","https://openalex.org/W2106404250","https://openalex.org/W2116008435","https://openalex.org/W2130076000","https://openalex.org/W2169783907","https://openalex.org/W2336343120","https://openalex.org/W2338216121","https://openalex.org/W2604525406","https://openalex.org/W2624553223","https://openalex.org/W2737403195","https://openalex.org/W2741497758","https://openalex.org/W2744538883","https://openalex.org/W2769473018","https://openalex.org/W2797400361","https://openalex.org/W2798283910","https://openalex.org/W2808234013","https://openalex.org/W2808599418","https://openalex.org/W2911802745","https://openalex.org/W2946387282","https://openalex.org/W2955792106","https://openalex.org/W3010870049","https://openalex.org/W3080913646","https://openalex.org/W3105712174","https://openalex.org/W3144984979","https://openalex.org/W3153682915","https://openalex.org/W3201357833","https://openalex.org/W4212900074","https://openalex.org/W4220802549","https://openalex.org/W4284713556","https://openalex.org/W4292419518","https://openalex.org/W4302322961","https://openalex.org/W4306317018"],"related_works":["https://openalex.org/W2965546495","https://openalex.org/W4389116644","https://openalex.org/W2153315159","https://openalex.org/W3103844505","https://openalex.org/W259157601","https://openalex.org/W4205463238","https://openalex.org/W2761785940","https://openalex.org/W2110523656","https://openalex.org/W1482209366","https://openalex.org/W4379381520"],"abstract_inverted_index":{"Online":[0],"evaluation":[1,24,38],"techniques":[2],"are":[3,43,194],"widely":[4],"adopted":[5],"by":[6],"industrial":[7],"search":[8,86,109,199],"engines":[9],"to":[10,36,39,45,62,80,120,187],"determine":[11],"which":[12,69,178,208],"ranking":[13,70,182,200],"models":[14,71,183],"perform":[15,72],"better":[16,73,185],"under":[17,103],"a":[18,28,58,104,210],"certain":[19],"business":[20,105,131],"metric.":[21,132],"However,":[22],"online":[23,48,75,155,173],"can":[25],"only":[26],"evaluate":[27,121],"small":[29],"number":[30],"of":[31,98,126,140,180,189],"rankers":[32,41],"and":[33,147,156,164],"people":[34],"resort":[35],"offline":[37,52,66,122,136,151,157,162],"select":[40],"that":[42],"likely":[44],"yield":[46],"good":[47],"performance.":[49],"To":[50],"use":[51,116],"metrics":[53,67,123,137,163,169,193],"for":[54],"effective":[55],"model":[56],"selection,":[57],"major":[59],"challenge":[60,83],"is":[61,184],"understand":[63],"how":[64],"well":[65,171],"predict":[68],"in":[74,84,95,107,124,138],"experiments.":[76],"This":[77],"paper":[78],"aims":[79],"address":[81],"this":[82,89],"product":[85],"ranking.":[87],"Towards":[88],"end,":[90],"we":[91,115,134,159],"collect":[92],"gold":[93,118],"data":[94,119],"the":[96,112,130],"form":[97],"preferences":[99],"over":[100,213],"ranker":[101],"pairs":[102],"metric":[106],"e-commerce":[108],"engine.":[110],"For":[111],"first":[113],"time,":[114],"such":[117],"terms":[125,139],"directional":[127],"agreement":[128],"with":[129,172],"Furthermore,":[133],"analyze":[135],"discriminative":[141,196,211],"power":[142,212],"through":[143],"paired":[144],"sample":[145],"t-test":[146],"rank":[148],"correlations":[149],"among":[150],"metrics.":[152],"Through":[153],"extensive":[154],"experiments,":[158],"studied":[160],"36":[161],"observed":[165],"that:":[166],"(1)":[167],"Offline":[168,192],"align":[170],"metrics:":[174],"they":[175],"agree":[176],"on":[177,197],"one":[179],"two":[181],"up":[186],"97%":[188],"times;":[190],"(2)":[191],"highly":[195],"large-scale":[198],"data,":[201],"especially":[202],"NDCG":[203],"(Normalized":[204],"Discounted":[205],"Cumulative":[206],"Gain)":[207],"has":[209],"99%.":[214]},"counts_by_year":[{"year":2025,"cited_by_count":2},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
