{"id":"https://openalex.org/W4385567603","doi":"https://doi.org/10.1145/3580305.3599473","title":"PrefRec: Recommender Systems with Human Preferences for Reinforcing Long-term User Engagement","display_name":"PrefRec: Recommender Systems with Human Preferences for Reinforcing Long-term User Engagement","publication_year":2023,"publication_date":"2023-08-04","ids":{"openalex":"https://openalex.org/W4385567603","doi":"https://doi.org/10.1145/3580305.3599473"},"language":"en","primary_location":{"id":"doi:10.1145/3580305.3599473","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3580305.3599473","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3580305.3599473","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3580305.3599473","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088881854","display_name":"Wanqi Xue","orcid":"https://orcid.org/0000-0003-3490-1088"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":true,"raw_author_name":"Wanqi Xue","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016589992","display_name":"Qingpeng Cai","orcid":"https://orcid.org/0000-0001-6451-9299"},"institutions":[{"id":"https://openalex.org/I4401726859","display_name":"Kuaishou (China)","ror":"https://ror.org/0258as409","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726859"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qingpeng Cai","raw_affiliation_strings":["Kuaishou Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Kuaishou Technology, Beijing, China","institution_ids":["https://openalex.org/I4401726859"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054607440","display_name":"Zhenghai Xue","orcid":"https://orcid.org/0000-0002-9340-0366"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Zhenghai Xue","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004036450","display_name":"Shuo Sun","orcid":"https://orcid.org/0000-0001-7153-1878"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Shuo Sun","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100600807","display_name":"Shuchang Liu","orcid":"https://orcid.org/0000-0002-1440-911X"},"institutions":[{"id":"https://openalex.org/I4401726859","display_name":"Kuaishou (China)","ror":"https://ror.org/0258as409","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726859"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuchang Liu","raw_affiliation_strings":["Kuaishou Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Kuaishou Technology, Beijing, China","institution_ids":["https://openalex.org/I4401726859"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086177569","display_name":"Dong Zheng","orcid":"https://orcid.org/0000-0003-0424-9658"},"institutions":[{"id":"https://openalex.org/I4401726859","display_name":"Kuaishou (China)","ror":"https://ror.org/0258as409","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726859"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dong Zheng","raw_affiliation_strings":["Kuaishou Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Kuaishou Technology, Beijing, China","institution_ids":["https://openalex.org/I4401726859"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001339397","display_name":"Peng Jiang","orcid":"https://orcid.org/0000-0002-9266-0780"},"institutions":[{"id":"https://openalex.org/I4401726859","display_name":"Kuaishou (China)","ror":"https://ror.org/0258as409","country_code":null,"type":"company","lineage":["https://openalex.org/I4401726859"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Peng Jiang","raw_affiliation_strings":["Kuaishou Technology, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Kuaishou Technology, Beijing, China","institution_ids":["https://openalex.org/I4401726859"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062939922","display_name":"Kun Gai","orcid":"https://orcid.org/0000-0002-3636-3618"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kun Gai","raw_affiliation_strings":["Unaffiliated, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Unaffiliated, Beijing, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017743551","display_name":"Bo An","orcid":"https://orcid.org/0000-0002-7064-7438"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Bo An","raw_affiliation_strings":["Nanyang Technological University, Singapore, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Singapore, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5088881854"],"corresponding_institution_ids":["https://openalex.org/I172675005"],"apc_list":null,"apc_paid":null,"fwci":9.5896,"has_fulltext":true,"cited_by_count":21,"citation_normalized_percentile":{"value":0.98017543,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2874","last_page":"2884"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9959999918937683,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.9087636470794678},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8354032039642334},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7394163608551025},{"id":"https://openalex.org/keywords/crowdsourcing","display_name":"Crowdsourcing","score":0.7115935683250427},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.6184033155441284},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.5743280649185181},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5686134696006775},{"id":"https://openalex.org/keywords/user-engagement","display_name":"User engagement","score":0.558491587638855},{"id":"https://openalex.org/keywords/preference","display_name":"Preference","score":0.546820878982544},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.5392360687255859},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.5305020809173584},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46782487630844116},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.45303213596343994},{"id":"https://openalex.org/keywords/preference-learning","display_name":"Preference learning","score":0.4176377058029175},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.155155211687088}],"concepts":[{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.9087636470794678},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8354032039642334},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7394163608551025},{"id":"https://openalex.org/C62230096","wikidata":"https://www.wikidata.org/wiki/Q275969","display_name":"Crowdsourcing","level":2,"score":0.7115935683250427},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.6184033155441284},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.5743280649185181},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5686134696006775},{"id":"https://openalex.org/C2984870255","wikidata":"https://www.wikidata.org/wiki/Q5196451","display_name":"User engagement","level":2,"score":0.558491587638855},{"id":"https://openalex.org/C2781249084","wikidata":"https://www.wikidata.org/wiki/Q908656","display_name":"Preference","level":2,"score":0.546820878982544},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.5392360687255859},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.5305020809173584},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46782487630844116},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.45303213596343994},{"id":"https://openalex.org/C181204326","wikidata":"https://www.wikidata.org/wiki/Q7239820","display_name":"Preference learning","level":3,"score":0.4176377058029175},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.155155211687088},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C21547014","wikidata":"https://www.wikidata.org/wiki/Q1423657","display_name":"Operations management","level":1,"score":0.0},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3580305.3599473","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3580305.3599473","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3580305.3599473","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3580305.3599473","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3580305.3599473","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3580305.3599473","source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 29th ACM SIGKDD Conference on Knowledge Discovery and Data Mining","raw_type":"proceedings-article"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"},{"id":"https://openalex.org/F4320320709","display_name":"National Research Foundation Singapore","ror":"https://ror.org/03cpyc314"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4385567603.pdf","grobid_xml":"https://content.openalex.org/works/W4385567603.grobid-xml"},"referenced_works_count":28,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W2111094216","https://openalex.org/W2138108551","https://openalex.org/W2763110165","https://openalex.org/W2767807341","https://openalex.org/W2784068709","https://openalex.org/W2809162153","https://openalex.org/W2914933231","https://openalex.org/W2948345531","https://openalex.org/W2963654596","https://openalex.org/W2963842088","https://openalex.org/W2965744319","https://openalex.org/W2984100107","https://openalex.org/W2998145016","https://openalex.org/W3012950066","https://openalex.org/W3035084859","https://openalex.org/W3080585915","https://openalex.org/W3099420497","https://openalex.org/W3100480425","https://openalex.org/W3116249021","https://openalex.org/W3200556911","https://openalex.org/W3210967257","https://openalex.org/W4241996101","https://openalex.org/W4290827187","https://openalex.org/W4290927958","https://openalex.org/W4290944246","https://openalex.org/W4367047389","https://openalex.org/W4367310822"],"related_works":["https://openalex.org/W3032998312","https://openalex.org/W1503094549","https://openalex.org/W4384486036","https://openalex.org/W135177976","https://openalex.org/W2337920774","https://openalex.org/W4318823662","https://openalex.org/W2886410948","https://openalex.org/W2025875869","https://openalex.org/W3207526114","https://openalex.org/W1524294987"],"abstract_inverted_index":{"Current":[0],"advances":[1],"in":[2,9,36,60,148,167,233],"recommender":[3,93,105],"systems":[4,94,106],"have":[5,32],"been":[6],"remarkably":[7],"successful":[8],"optimizing":[10,56,149],"immediate":[11],"engagement.":[12],"However,":[13],"long-term":[14,40,57,78,150,218],"user":[15,58,79,219],"engagement,":[16],"a":[17,37,52,90,164,215],"more":[18],"desirable":[19],"performance":[20],"metric,":[21],"remains":[22],"difficult":[23],"to":[24,77,107,161,177,181,207],"improve.":[25],"Meanwhile,":[26],"recent":[27],"reinforcement":[28],"learning":[29,179],"(RL)":[30],"algorithms":[31],"shown":[33],"their":[34],"effectiveness":[35],"variety":[38,216],"of":[39,66,146,217],"goal":[41],"optimization":[42,191,221],"tasks.":[43,222,236],"For":[44],"this":[45],"reason,":[46],"RL":[47,67,104,147],"is":[48,81,174],"widely":[49],"considered":[50],"as":[51,128,130],"promising":[53],"framework":[54],"for":[55,193],"engagement":[59,80,220],"recommendation.":[61],"Though":[62],"promising,":[63],"the":[64,86,144,159,183,209,235],"application":[65],"heavily":[68],"relies":[69],"on":[70,214],"well-designed":[71],"rewards,":[72],"but":[73],"designing":[74],"rewards":[75],"related":[76],"quite":[82],"difficult.":[83],"To":[84],"mitigate":[85],"problem,":[87],"we":[88,140,187],"propose":[89],"novel":[91],"paradigm,":[92],"with":[95],"human":[96],"preferences":[97,110,121,160],"(or":[98],"Preference-based":[99],"Recommender":[100],"systems),":[101],"which":[102,195],"allows":[103],"learn":[108],"from":[109],"about":[111],"users'":[112],"historical":[113],"behaviors":[114],"rather":[115],"than":[116],"explicitly":[117],"defined":[118],"rewards.":[119],"Such":[120],"are":[122],"easily":[123],"accessible":[124],"through":[125],"techniques":[126],"such":[127],"crowdsourcing,":[129],"they":[131],"do":[132],"not":[133],"require":[134],"any":[135],"expert":[136],"knowledge.":[137],"With":[138],"PrefRec,":[139,194],"can":[141],"fully":[142],"exploit":[143],"advantages":[145],"goals,":[151],"while":[152],"avoiding":[153],"complex":[154],"reward":[155,165,172,204],"engineering.":[156],"PrefRec":[157,227],"uses":[158,196],"automatically":[162],"train":[163,182],"function":[166,173],"an":[168,189,197],"end-to-end":[169],"manner.":[170],"The":[171,223],"then":[175],"used":[176],"generate":[178],"signals":[180],"recommendation":[184],"policy.":[185],"Furthermore,":[186],"design":[188],"effective":[190],"method":[192],"additional":[198],"value":[199],"function,":[200],"expectile":[201],"regression":[202],"and":[203],"model":[205],"pre-training":[206],"improve":[208],"performance.":[210],"We":[211],"conduct":[212],"experiments":[213],"results":[224],"show":[225],"that":[226],"significantly":[228],"outperforms":[229],"previous":[230],"state-of-the-art":[231],"methods":[232],"all":[234]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":6},{"year":2023,"cited_by_count":2}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
