{"id":"https://openalex.org/W3012886296","doi":"https://doi.org/10.1145/3366423.3380294","title":"RLPer: A Reinforcement Learning Model for Personalized Search","display_name":"RLPer: A Reinforcement Learning Model for Personalized Search","publication_year":2020,"publication_date":"2020-04-20","ids":{"openalex":"https://openalex.org/W3012886296","doi":"https://doi.org/10.1145/3366423.3380294","mag":"3012886296"},"language":"en","primary_location":{"id":"doi:10.1145/3366423.3380294","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380294","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3366423.3380294","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5084847804","display_name":"Jing Yao","orcid":"https://orcid.org/0000-0002-0527-6095"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jing Yao","raw_affiliation_strings":["School of Information Renmin University of China"],"affiliations":[{"raw_affiliation_string":"School of Information Renmin University of China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5010558184","display_name":"Zhicheng Dou","orcid":"https://orcid.org/0000-0002-9781-948X"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhicheng Dou","raw_affiliation_strings":["Gaoling School of Artificial Intelligence Renmin University of China"],"affiliations":[{"raw_affiliation_string":"Gaoling School of Artificial Intelligence Renmin University of China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020766468","display_name":"Jun Xu","orcid":"https://orcid.org/0000-0001-7170-111X"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jun Xu","raw_affiliation_strings":["Gaoling School of Artificial Intelligence Renmin University of China"],"affiliations":[{"raw_affiliation_string":"Gaoling School of Artificial Intelligence Renmin University of China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025631695","display_name":"Ji-Rong Wen","orcid":"https://orcid.org/0000-0002-9777-9676"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ji-Rong Wen","raw_affiliation_strings":["Beijing Key Laboratory of Big Data Management and Analysis Methods and Key Laboratory of Data Engineering and Knowledge Engineering, MOE"],"affiliations":[{"raw_affiliation_string":"Beijing Key Laboratory of Big Data Management and Analysis Methods and Key Laboratory of Data Engineering and Knowledge Engineering, MOE","institution_ids":[]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5084847804"],"corresponding_institution_ids":["https://openalex.org/I78988378"],"apc_list":null,"apc_paid":null,"fwci":6.6661,"has_fulltext":false,"cited_by_count":35,"citation_normalized_percentile":{"value":0.96843157,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"2298","last_page":"2308"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10286","display_name":"Information Retrieval and Search Behavior","score":0.9940000176429749,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9883000254631042,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.864790141582489},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.747626543045044},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4598653316497803},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.40663301944732666}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.864790141582489},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.747626543045044},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4598653316497803},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40663301944732666}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3366423.3380294","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380294","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3366423.3380294","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3366423.3380294","pdf_url":null,"source":null,"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of The Web Conference 2020","raw_type":"proceedings-article"},"sustainable_development_goals":[{"score":0.7400000095367432,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1546897512","https://openalex.org/W1975409939","https://openalex.org/W1979809564","https://openalex.org/W1980617223","https://openalex.org/W1982858363","https://openalex.org/W2023599408","https://openalex.org/W2105059961","https://openalex.org/W2108279663","https://openalex.org/W2109677301","https://openalex.org/W2118286847","https://openalex.org/W2119717200","https://openalex.org/W2120724560","https://openalex.org/W2121863487","https://openalex.org/W2122654842","https://openalex.org/W2125682643","https://openalex.org/W2127799072","https://openalex.org/W2132314908","https://openalex.org/W2135500808","https://openalex.org/W2138108551","https://openalex.org/W2139873966","https://openalex.org/W2143331230","https://openalex.org/W2145413874","https://openalex.org/W2151049666","https://openalex.org/W2152314154","https://openalex.org/W2155482025","https://openalex.org/W2168717408","https://openalex.org/W2171392812","https://openalex.org/W2171806843","https://openalex.org/W2250539671","https://openalex.org/W2257117461","https://openalex.org/W2564434159","https://openalex.org/W2739916191","https://openalex.org/W2740384884","https://openalex.org/W2786171444","https://openalex.org/W2788295351","https://openalex.org/W2799544270","https://openalex.org/W2889658777","https://openalex.org/W2897050313","https://openalex.org/W2955887579","https://openalex.org/W2962770891","https://openalex.org/W2962957031","https://openalex.org/W2963403868","https://openalex.org/W2963561234","https://openalex.org/W3102778384","https://openalex.org/W3102899483","https://openalex.org/W4214717370","https://openalex.org/W4252076394"],"related_works":["https://openalex.org/W2961085424","https://openalex.org/W4306674287","https://openalex.org/W3046775127","https://openalex.org/W4394896187","https://openalex.org/W3170094116","https://openalex.org/W4386462264","https://openalex.org/W3107602296","https://openalex.org/W4364306694","https://openalex.org/W4312192474","https://openalex.org/W4283697347"],"abstract_inverted_index":{"Personalized":[0],"search":[1,16,44,80,82,90,97,113,151,163,211,223],"improves":[2],"generic":[3],"ranking":[4,56,124,173,185],"models":[5,40],"by":[6],"taking":[7],"user":[8,51,100,168,197],"interests":[9,101],"into":[10],"consideration":[11],"and":[12,26,53,92,121,150],"returning":[13],"more":[14,108],"accurate":[15],"results":[17,205],"to":[18,139,142,169,187],"individual":[19],"users.":[20],"In":[21,127,160],"recent":[22],"years,":[23],"machine":[24],"learning":[25,28,134],"deep":[27],"techniques":[29],"have":[30,65],"been":[31,66],"successfully":[32],"applied":[33],"in":[34],"personalized":[35,112,184,222],"search.":[36],"Most":[37],"existing":[38],"personalization":[39,136],"simply":[41],"regard":[42],"the":[43,60,75,79,89,93,96,99,117,144,148,162,167,171,189,196,201,207],"history":[45],"as":[46,140],"a":[47,84,111,132,154,182],"static":[48],"set":[49],"of":[50,78,86],"behaviours":[52],"learn":[54],"fixed":[55],"strategies":[57],"based":[58,135],"on":[59,195,206],"recorded":[61],"data.":[62],"Though":[63],"improvements":[64],"observed,":[67],"it":[68],"is":[69,83],"obvious":[70],"that":[71,214],"these":[72],"methods":[73],"ignore":[74],"dynamic":[76],"nature":[77],"process:":[81],"sequence":[85],"interactions":[87,146],"between":[88,147],"engine":[91,152,164],"user.":[94],"During":[95],"process,":[98],"may":[102],"dynamically":[103],"change.":[104],"It":[105],"would":[106],"be":[107],"helpful":[109],"if":[110],"model":[114,174,217],"could":[115],"track":[116,143],"whole":[118],"interaction":[119],"process":[120],"update":[122,170],"its":[123],"strategy":[125],"continuously.":[126],"this":[128],"paper,":[129],"we":[130,180],"propose":[131],"reinforcement":[133],"model,":[137],"referred":[138],"RLPer,":[141,161],"sequential":[145],"users":[149],"with":[153,166,176],"hierarchical":[155],"Markov":[156],"Decision":[157],"Process":[158],"(MDP).":[159],"interacts":[165],"underlying":[172],"continuously":[175],"real-time":[177],"feedback.":[178],"And":[179],"design":[181],"feedback-aware":[183],"component":[186],"catch":[188],"user\u2019s":[190],"feedback":[191],"which":[192],"has":[193],"impacts":[194],"interest":[198],"profile":[199],"for":[200],"next":[202],"query.":[203],"Experimental":[204],"publicly":[208],"available":[209],"AOL":[210],"log":[212],"verify":[213],"our":[215],"proposed":[216],"can":[218],"significantly":[219],"outperform":[220],"state-of-the-art":[221],"models.":[224]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":8},{"year":2021,"cited_by_count":9},{"year":2020,"cited_by_count":1}],"updated_date":"2026-03-12T08:34:05.389933","created_date":"2025-10-10T00:00:00"}
