{"id":"https://openalex.org/W3088936686","doi":"https://doi.org/10.1145/3383313.3412252","title":"Keeping Dataset Biases out of the Simulation","display_name":"Keeping Dataset Biases out of the Simulation","publication_year":2020,"publication_date":"2020-09-19","ids":{"openalex":"https://openalex.org/W3088936686","doi":"https://doi.org/10.1145/3383313.3412252","mag":"3088936686"},"language":"en","primary_location":{"id":"doi:10.1145/3383313.3412252","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3383313.3412252","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Fourteenth ACM Conference on Recommender Systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://pure.uva.nl/ws/files/54624795/3383313.3412252.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5069858475","display_name":"Jin Huang","orcid":"https://orcid.org/0000-0003-2285-5248"},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":true,"raw_author_name":"Jin Huang","raw_affiliation_strings":["University of Amsterdam Amsterdam, The Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam Amsterdam, The Netherlands","institution_ids":["https://openalex.org/I887064364"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002072527","display_name":"Harrie Oosterhuis","orcid":"https://orcid.org/0000-0002-0458-9233"},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Harrie Oosterhuis","raw_affiliation_strings":["University of Amsterdam Amsterdam, The Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam Amsterdam, The Netherlands","institution_ids":["https://openalex.org/I887064364"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031439294","display_name":"Maarten de Rijke","orcid":"https://orcid.org/0000-0002-1086-0202"},"institutions":[{"id":"https://openalex.org/I4210112722","display_name":"Ahold Delhaize (Netherlands)","ror":"https://ror.org/01v6p2g18","country_code":"NL","type":"company","lineage":["https://openalex.org/I4210112722"]},{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Maarten de Rijke","raw_affiliation_strings":["University of Amsterdam &amp; Ahold Delhaize Amsterdam, The Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam &amp; Ahold Delhaize Amsterdam, The Netherlands","institution_ids":["https://openalex.org/I4210112722","https://openalex.org/I887064364"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5057277609","display_name":"Herke van Hoof","orcid":"https://orcid.org/0000-0002-1583-3692"},"institutions":[{"id":"https://openalex.org/I887064364","display_name":"University of Amsterdam","ror":"https://ror.org/04dkp9463","country_code":"NL","type":"education","lineage":["https://openalex.org/I887064364"]}],"countries":["NL"],"is_corresponding":false,"raw_author_name":"Herke van Hoof","raw_affiliation_strings":["University of Amsterdam Amsterdam, The Netherlands"],"affiliations":[{"raw_affiliation_string":"University of Amsterdam Amsterdam, The Netherlands","institution_ids":["https://openalex.org/I887064364"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5069858475"],"corresponding_institution_ids":["https://openalex.org/I887064364"],"apc_list":null,"apc_paid":null,"fwci":8.1714,"has_fulltext":true,"cited_by_count":62,"citation_normalized_percentile":{"value":0.97669358,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"190","last_page":"199"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9984999895095825,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9958000183105469,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/debiasing","display_name":"Debiasing","score":0.9833216667175293},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8555370569229126},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.6891950964927673},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.46435025334358215},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3794774115085602},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3129178285598755}],"concepts":[{"id":"https://openalex.org/C2779458634","wikidata":"https://www.wikidata.org/wiki/Q24963715","display_name":"Debiasing","level":2,"score":0.9833216667175293},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8555370569229126},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.6891950964927673},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.46435025334358215},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3794774115085602},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3129178285598755},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0}],"mesh":[],"locations_count":4,"locations":[{"id":"doi:10.1145/3383313.3412252","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3383313.3412252","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Fourteenth ACM Conference on Recommender Systems","raw_type":"proceedings-article"},{"id":"pmh:oai:dare.uva.nl:publications/c902af09-f699-4e40-86b2-f317eed290d4","is_oa":true,"landing_page_url":"https://handle.uba.uva.nl/personal/pure/en/publications/keeping-dataset-biases-out-of-the-simulation(c902af09-f699-4e40-86b2-f317eed290d4).html","pdf_url":"https://pure.uva.nl/ws/files/54624795/3383313.3412252.pdf","source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Huang, J, Oosterhuis, H, de Rijke, M & van Hoof, H 2020, Keeping Dataset Biases out of the Simulation : A Debiased Simulator for Reinforcement Learning based Recommender Systems. in RECSYS 2020 : 14th ACM Conference on Recommender Systems : Virtual Event, Brazil, September 22-26, 2020. New York, NY, pp. 190\u2013199, 14th ACM Conference on Recommender Systems, Brazil, 22/09/20. https://doi.org/10.1145/3383313.3412252","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:dare.uva.nl:openaire_cris_publications/c902af09-f699-4e40-86b2-f317eed290d4","is_oa":true,"landing_page_url":"https://hdl.handle.net/11245.1/c902af09-f699-4e40-86b2-f317eed290d4","pdf_url":null,"source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Huang , J , Oosterhuis , H , de Rijke , M &amp; van Hoof , H 2020 , Keeping Dataset Biases out of the Simulation : A Debiased Simulator for Reinforcement Learning based Recommender Systems . in RECSYS 2020 : 14th ACM Conference on Recommender Systems : Virtual Event, Brazil, September 22-26, 2020 . New York, NY , pp. 190\u2013199 , 14th ACM Conference on Recommender Systems , Brazil , 22/09/20 . https://doi.org/10.1145/3383313.3412252","raw_type":"contributionToPeriodical"},{"id":"pmh:uvapub:oai:dare.uva.nl:publications/c902af09-f699-4e40-86b2-f317eed290d4","is_oa":true,"landing_page_url":"https://dare.uva.nl/personal/pure/en/publications/keeping-dataset-biases-out-of-the-simulation(c902af09-f699-4e40-86b2-f317eed290d4).html","pdf_url":null,"source":{"id":"https://openalex.org/S4306401843","display_name":"Data Archiving and Networked Services (DANS)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1322597698","host_organization_name":"Royal Netherlands Academy of Arts and Sciences","host_organization_lineage":["https://openalex.org/I1322597698"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"RECSYS 2020: 14th ACM Conference on Recommender Systems : Virtual Event, Brazil, September 22-26, 2020","raw_type":"info:eu-repo/semantics/conferencepaper"}],"best_oa_location":{"id":"pmh:oai:dare.uva.nl:publications/c902af09-f699-4e40-86b2-f317eed290d4","is_oa":true,"landing_page_url":"https://handle.uba.uva.nl/personal/pure/en/publications/keeping-dataset-biases-out-of-the-simulation(c902af09-f699-4e40-86b2-f317eed290d4).html","pdf_url":"https://pure.uva.nl/ws/files/54624795/3383313.3412252.pdf","source":{"id":"https://openalex.org/S4306400088","display_name":"UvA-DARE (University of Amsterdam)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I887064364","host_organization_name":"University of Amsterdam","host_organization_lineage":["https://openalex.org/I887064364"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Huang, J, Oosterhuis, H, de Rijke, M & van Hoof, H 2020, Keeping Dataset Biases out of the Simulation : A Debiased Simulator for Reinforcement Learning based Recommender Systems. in RECSYS 2020 : 14th ACM Conference on Recommender Systems : Virtual Event, Brazil, September 22-26, 2020. New York, NY, pp. 190\u2013199, 14th ACM Conference on Recommender Systems, Brazil, 22/09/20. https://doi.org/10.1145/3383313.3412252","raw_type":"info:eu-repo/semantics/publishedVersion"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2586376837","display_name":null,"funder_award_id":"612.001.551","funder_id":"https://openalex.org/F4320321800","funder_display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek"},{"id":"https://openalex.org/G629491556","display_name":null,"funder_award_id":"(NWO)","funder_id":"https://openalex.org/F4320321800","funder_display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek"}],"funders":[{"id":"https://openalex.org/F4320321800","display_name":"Nederlandse Organisatie voor Wetenschappelijk Onderzoek","ror":"https://ror.org/04jsz6e67"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W3088936686.pdf","grobid_xml":"https://content.openalex.org/works/W3088936686.grobid-xml"},"referenced_works_count":36,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1992665562","https://openalex.org/W2005415325","https://openalex.org/W2020631728","https://openalex.org/W2045745608","https://openalex.org/W2046974451","https://openalex.org/W2105256943","https://openalex.org/W2112420033","https://openalex.org/W2507134384","https://openalex.org/W2774321216","https://openalex.org/W2784068709","https://openalex.org/W2787933113","https://openalex.org/W2788295351","https://openalex.org/W2799048248","https://openalex.org/W2799544270","https://openalex.org/W2809162153","https://openalex.org/W2902572901","https://openalex.org/W2905101140","https://openalex.org/W2955774983","https://openalex.org/W2963561234","https://openalex.org/W2963619374","https://openalex.org/W2963654596","https://openalex.org/W2963842088","https://openalex.org/W2972561734","https://openalex.org/W2972905192","https://openalex.org/W2985671795","https://openalex.org/W3007094061","https://openalex.org/W3011985620","https://openalex.org/W3035734059","https://openalex.org/W3099420497","https://openalex.org/W3102778384","https://openalex.org/W3102862020","https://openalex.org/W3102899483","https://openalex.org/W3103141630","https://openalex.org/W3150893739","https://openalex.org/W4214854509"],"related_works":["https://openalex.org/W4386875279","https://openalex.org/W4362554880","https://openalex.org/W4281684980","https://openalex.org/W2171721708","https://openalex.org/W3214527415","https://openalex.org/W4287887864","https://openalex.org/W1495104519","https://openalex.org/W4390963114","https://openalex.org/W4225584739","https://openalex.org/W2199432031"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1],"for":[2,128,159,187,212,223],"recommendation":[3],"(RL4Rec)":[4],"methods":[5,195],"are":[6,81],"increasingly":[7],"receiving":[8],"attention":[9],"as":[10,49,209],"an":[11,86],"effective":[12],"way":[13],"to":[14,29,40,114,140,199,227],"improve":[15],"long-term":[16],"user":[17,33,53,61,78,101,142],"engagement.":[18],"However,":[19],"applying":[20],"RL4Rec":[21,151],"online":[22],"comes":[23],"with":[24,168,188],"risks:":[25],"exploration":[26],"may":[27],"lead":[28],"periods":[30],"of":[31,89,148,165],"detrimental":[32],"experience.":[34],"Moreover,":[35],"few":[36],"researchers":[37],"have":[38,45],"access":[39],"real-world":[41],"recommender":[42],"systems.":[43],"Simulations":[44],"been":[46],"put":[47],"forward":[48],"a":[50,112,119,155],"solution":[51,113],"where":[52],"feedback":[54],"is":[55,138],"simulated":[56],"based":[57],"on":[58,150],"logged":[59,100,134,178],"historical":[60],"data,":[62,102],"thus":[63],"enabling":[64],"optimization":[65,228],"and":[66,80,103,215,229],"evaluation":[67,157,216],"without":[68],"being":[69],"run":[70],"online.":[71],"While":[72,192],"simulators":[73,160],"do":[74],"not":[75],"risk":[76],"the":[77,95,108,123,129,133,146,163,169,175,182,210,218],"experience":[79],"widely":[82],"accessible,":[83],"we":[84,117,153,202],"identify":[85],"important":[87],"limitation":[88],"existing":[90],"simulation":[91,124],"methods.":[92],"They":[93],"ignore":[94],"interaction":[96,224],"biases":[97,106,130,176,225],"present":[98,131],"in":[99,122,132],"consequently,":[104],"these":[105],"affect":[107],"resulting":[109,183],"simulation.":[110],"As":[111],"this":[115],"issue,":[116],"introduce":[118],"debiasing":[120,190,194],"step":[121],"pipeline,":[125],"which":[126],"corrects":[127],"data":[135,179],"before":[136],"it":[137],"used":[139],"simulate":[141],"behavior.":[143],"To":[144],"evaluate":[145],"effects":[147],"bias":[149],"simulations,":[152],"propose":[154],"novel":[156],"approach":[158],"that":[161,174,221],"considers":[162],"performance":[164],"policies":[166],"optimized":[167],"simulator.":[170],"Our":[171],"results":[172],"reveal":[173],"from":[177],"negatively":[180],"impact":[181],"policies,":[184],"unless":[185],"corrected":[186],"our":[189,193,204],"method.":[191],"can":[196],"be":[197],"applied":[198],"any":[200],"simulator,":[201],"make":[203],"complete":[205],"pipeline":[206],"publicly":[207],"available":[208],"Simulator":[211],"OFfline":[213],"leArning":[214],"(SOFA):":[217],"first":[219],"simulator":[220],"accounts":[222],"prior":[226],"evaluation.":[230]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":14},{"year":2022,"cited_by_count":13},{"year":2021,"cited_by_count":16},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2020-10-01T00:00:00"}
