{"id":"https://openalex.org/W7140199844","doi":"https://doi.org/10.48550/arxiv.2603.21485","title":"Off-Policy Evaluation for Ranking Policies under Deterministic Logging Policies","display_name":"Off-Policy Evaluation for Ranking Policies under Deterministic Logging Policies","publication_year":2026,"publication_date":"2026-03-23","ids":{"openalex":"https://openalex.org/W7140199844","doi":"https://doi.org/10.48550/arxiv.2603.21485"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.21485","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21485","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.21485","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Tanaka, Koichi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tanaka, Koichi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Kawamura, Kazuki","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kawamura, Kazuki","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Muroi, Takanori","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Muroi, Takanori","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Narita, Yusuke","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Narita, Yusuke","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Sasamoto, Yuki","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sasamoto, Yuki","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Tateno, Kei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tateno, Kei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Udagawa, Takuma","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Udagawa, Takuma","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Du, Wei-Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Du, Wei-Wei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Saito, Yuta","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saito, Yuta","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10991","display_name":"Game Theory and Voting Systems","score":0.7577000260353088,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10991","display_name":"Game Theory and Voting Systems","score":0.7577000260353088,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.06499999761581421,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.041099999099969864,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/logging","display_name":"Logging","score":0.7896999716758728},{"id":"https://openalex.org/keywords/ranking","display_name":"Ranking (information retrieval)","score":0.7623999714851379},{"id":"https://openalex.org/keywords/estimator","display_name":"Estimator","score":0.6847000122070312},{"id":"https://openalex.org/keywords/variance","display_name":"Variance (accounting)","score":0.6172000169754028},{"id":"https://openalex.org/keywords/range","display_name":"Range (aeronautics)","score":0.414900004863739},{"id":"https://openalex.org/keywords/propensity-score-matching","display_name":"Propensity score matching","score":0.29510000348091125}],"concepts":[{"id":"https://openalex.org/C125620115","wikidata":"https://www.wikidata.org/wiki/Q845249","display_name":"Logging","level":2,"score":0.7896999716758728},{"id":"https://openalex.org/C189430467","wikidata":"https://www.wikidata.org/wiki/Q7293293","display_name":"Ranking (information retrieval)","level":2,"score":0.7623999714851379},{"id":"https://openalex.org/C185429906","wikidata":"https://www.wikidata.org/wiki/Q1130160","display_name":"Estimator","level":2,"score":0.6847000122070312},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.680899977684021},{"id":"https://openalex.org/C196083921","wikidata":"https://www.wikidata.org/wiki/Q7915758","display_name":"Variance (accounting)","level":2,"score":0.6172000169754028},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.414900004863739},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.37229999899864197},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.31610000133514404},{"id":"https://openalex.org/C17923572","wikidata":"https://www.wikidata.org/wiki/Q7250160","display_name":"Propensity score matching","level":2,"score":0.29510000348091125},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.2897000014781952},{"id":"https://openalex.org/C207467116","wikidata":"https://www.wikidata.org/wiki/Q4385666","display_name":"Inverse","level":2,"score":0.28949999809265137},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.28529998660087585},{"id":"https://openalex.org/C160920958","wikidata":"https://www.wikidata.org/wiki/Q7662746","display_name":"Synthetic data","level":2,"score":0.2840999960899353},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.2800000011920929},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.26330000162124634}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.21485","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21485","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.21485","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.21485","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Off-Policy":[0],"Evaluation":[1],"(OPE)":[2],"is":[3,15,68],"an":[4],"important":[5],"practical":[6],"problem":[7],"in":[8],"algorithmic":[9],"ranking":[10,24],"systems,":[11],"where":[12,127],"the":[13,18,41,51,65,84,101,104,138,144],"goal":[14],"to":[16,55,91,162],"estimate":[17],"expected":[19],"performance":[20],"of":[21,87,103,116,137,143,168],"a":[22,33,113,166],"new":[23,114],"policy":[25,54,67],"using":[26],"only":[27],"offline":[28],"logged":[29],"data":[30,52],"collected":[31],"under":[32,123],"different,":[34],"logging":[35,66,105,125,174],"policy.":[36],"Existing":[37],"estimators,":[38,49,77],"such":[39],"as":[40,112],"ranking-wise":[42],"and":[43,59,140,147,151],"position-wise":[44],"inverse":[45],"propensity":[46],"score":[47],"(IPS)":[48],"require":[50],"collection":[53],"be":[56],"sufficiently":[57],"stochastic":[58],"suffer":[60],"from":[61],"severe":[62],"bias":[63,139,160],"when":[64],"fully":[69],"deterministic.":[70],"In":[71],"this":[72,93],"paper,":[73],"we":[74],"propose":[75],"novel":[76],"Click-based":[78],"Inverse":[79],"Propensity":[80],"Score":[81],"(CIPS),":[82],"exploiting":[83],"intrinsic":[85],"stochasticity":[86,102],"user":[88],"click":[89,110],"behavior":[90],"address":[92],"challenge.":[94],"Unlike":[95],"existing":[96,128],"methods":[97,129],"that":[98,154],"rely":[99],"on":[100],"policy,":[106],"our":[107,155],"approach":[108],"uses":[109],"probability":[111],"form":[115],"importance":[117],"weighting,":[118],"enabling":[119],"low-bias":[120],"OPE":[121],"even":[122],"deterministic":[124,173],"policies":[126],"incur":[130],"substantial":[131],"bias.":[132],"We":[133],"provide":[134],"theoretical":[135],"analyses":[136],"variance":[141],"properties":[142],"proposed":[145],"estimators":[146,156],"show,":[148],"through":[149],"synthetic":[150],"real-world":[152],"experiments,":[153],"achieve":[157],"significantly":[158],"lower":[159],"compared":[161],"strong":[163],"baselines,":[164],"for":[165],"range":[167],"experimental":[169],"settings":[170],"with":[171],"completely":[172],"policies.":[175]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-25T00:00:00"}
