{"id":"https://openalex.org/W4416017570","doi":"https://doi.org/10.1145/3746252.3761384","title":"Autonomous Reasoning-Retrieval for Large Language Model Based Recommendation","display_name":"Autonomous Reasoning-Retrieval for Large Language Model Based Recommendation","publication_year":2025,"publication_date":"2025-11-08","ids":{"openalex":"https://openalex.org/W4416017570","doi":"https://doi.org/10.1145/3746252.3761384"},"language":null,"primary_location":{"id":"doi:10.1145/3746252.3761384","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746252.3761384","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5036939414","display_name":"Bowen Zheng","orcid":"https://orcid.org/0009-0002-3010-7899"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Bowen Zheng","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0002-3010-7899","affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100367735","display_name":"Xiaolei Wang","orcid":"https://orcid.org/0000-0003-3685-3606"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]},{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaolei Wang","raw_affiliation_strings":["Beijing Institute of Technology, Beijing, China","Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-3685-3606","affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]},{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042577552","display_name":"Enze Liu","orcid":"https://orcid.org/0009-0007-8344-4780"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Enze Liu","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0007-8344-4780","affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Xi Wang","orcid":"https://orcid.org/0009-0005-1272-5273"},"institutions":[{"id":"https://openalex.org/I125839683","display_name":"Beijing Institute of Technology","ror":"https://ror.org/01skt4w74","country_code":"CN","type":"education","lineage":["https://openalex.org/I125839683","https://openalex.org/I890469752"]},{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xi Wang","raw_affiliation_strings":["Beijing Institute of Technology, Beijing, China","Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0005-1272-5273","affiliations":[{"raw_affiliation_string":"Beijing Institute of Technology, Beijing, China","institution_ids":["https://openalex.org/I125839683"]},{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101796004","display_name":"Hongyu Lu","orcid":"https://orcid.org/0000-0002-0247-2496"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongyu Lu","raw_affiliation_strings":["WeChat, Tencent, Guangzhou, China"],"raw_orcid":"https://orcid.org/0000-0002-0247-2496","affiliations":[{"raw_affiliation_string":"WeChat, Tencent, Guangzhou, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108579011","display_name":"Yu Chen","orcid":"https://orcid.org/0009-0002-0726-2727"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yu Chen","raw_affiliation_strings":["WeChat, Tencent, Beijing, China"],"raw_orcid":"https://orcid.org/0009-0002-0726-2727","affiliations":[{"raw_affiliation_string":"WeChat, Tencent, Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5037145565","display_name":"Wayne Xin Zhao","orcid":"https://orcid.org/0000-0002-8333-6196"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wayne Xin Zhao","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-8333-6196","affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5025631695","display_name":"Ji-Rong Wen","orcid":"https://orcid.org/0000-0002-9777-9676"},"institutions":[{"id":"https://openalex.org/I78988378","display_name":"Renmin University of China","ror":"https://ror.org/041pakw92","country_code":"CN","type":"education","lineage":["https://openalex.org/I78988378"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ji-Rong Wen","raw_affiliation_strings":["Renmin University of China, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-9777-9676","affiliations":[{"raw_affiliation_string":"Renmin University of China, Beijing, China","institution_ids":["https://openalex.org/I78988378"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5036939414"],"corresponding_institution_ids":["https://openalex.org/I78988378"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.45538662,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"4423","last_page":"4433"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.6779999732971191,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.6779999732971191,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10664","display_name":"Sentiment Analysis and Opinion Mining","score":0.032499998807907104,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.03150000050663948,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.6729000210762024},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.670799970626831},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.5794000029563904},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.4921000003814697},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4875999987125397},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.4250999987125397},{"id":"https://openalex.org/keywords/rss","display_name":"RSS","score":0.4169999957084656}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.70660001039505},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.6729000210762024},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.670799970626831},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.618399977684021},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.5794000029563904},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.4921000003814697},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4875999987125397},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.4250999987125397},{"id":"https://openalex.org/C2385561","wikidata":"https://www.wikidata.org/wiki/Q45432","display_name":"RSS","level":2,"score":0.4169999957084656},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.414000004529953},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.41269999742507935},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.3962000012397766},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.383899986743927},{"id":"https://openalex.org/C164226766","wikidata":"https://www.wikidata.org/wiki/Q7293202","display_name":"Rank (graph theory)","level":2,"score":0.35100001096725464},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.3433000147342682},{"id":"https://openalex.org/C2776230583","wikidata":"https://www.wikidata.org/wiki/Q1322198","display_name":"Spoken language","level":2,"score":0.3043999969959259},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.2842000126838684},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.2646999955177307},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.26100000739097595}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3746252.3761384","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3746252.3761384","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 34th ACM International Conference on Information and Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1065675187","display_name":null,"funder_award_id":"92470205 and 62222215","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":52,"referenced_works":["https://openalex.org/W2171279286","https://openalex.org/W2219888463","https://openalex.org/W2469952266","https://openalex.org/W2783272285","https://openalex.org/W2899457523","https://openalex.org/W2964926209","https://openalex.org/W2966483207","https://openalex.org/W2984100107","https://openalex.org/W3065542300","https://openalex.org/W4220974940","https://openalex.org/W4252076394","https://openalex.org/W4296591867","https://openalex.org/W4310418667","https://openalex.org/W4362515116","https://openalex.org/W4367047145","https://openalex.org/W4376312036","https://openalex.org/W4376312626","https://openalex.org/W4384828614","https://openalex.org/W4386728933","https://openalex.org/W4387157010","https://openalex.org/W4388481614","https://openalex.org/W4389470008","https://openalex.org/W4391286723","https://openalex.org/W4391620956","https://openalex.org/W4391631327","https://openalex.org/W4392576636","https://openalex.org/W4393063676","https://openalex.org/W4398191691","https://openalex.org/W4399317481","https://openalex.org/W4400531953","https://openalex.org/W4400909953","https://openalex.org/W4401834466","https://openalex.org/W4403220611","https://openalex.org/W4403577838","https://openalex.org/W4403767139","https://openalex.org/W4404317680","https://openalex.org/W4405655184","https://openalex.org/W4405766390","https://openalex.org/W4406167410","https://openalex.org/W4406774573","https://openalex.org/W4406779522","https://openalex.org/W4407814501","https://openalex.org/W4409049124","https://openalex.org/W4416031380","https://openalex.org/W6891928986","https://openalex.org/W6910528035","https://openalex.org/W6910529769","https://openalex.org/W6947866383","https://openalex.org/W6948305707","https://openalex.org/W6948310395","https://openalex.org/W6948368532","https://openalex.org/W6948405870"],"related_works":[],"abstract_inverted_index":{"Recently,":[0],"large":[1],"language":[2],"models":[3,20],"(LLMs)":[4],"have":[5],"been":[6],"introduced":[7],"into":[8],"recommender":[9,229],"systems":[10],"(RSs)":[11],"as":[12],"recommendation":[13,19,128,180],"backbones":[14],"or":[15],"to":[16,27,96,108,154,174,193],"enhance":[17],"traditional":[18,216],"(TRMs).":[21],"However,":[22],"existing":[23,218],"LLM-based":[24,66,219],"RSs":[25],"fail":[26],"fully":[28],"leverage":[29],"the":[30,54,105,110,176],"complementary":[31],"strengths":[32],"of":[33,53],"LLMs":[34,75,87,103,152,192],"(e.g.,":[35,43],"world":[36],"knowledge":[37,45],"and":[38,41,46,76,92,120,136,171,179,217],"reasoning":[39],"capabilities)":[40],"TRMs":[42,77,95],"recommendation-specific":[44],"computational":[47],"efficiency),":[48],"resulting":[49],"in":[50,124,228],"shallow":[51],"exploration":[52,227],"item":[55,80],"space.":[56],"To":[57],"address":[58],"this":[59],"limitation,":[60],"we":[61,145,161],"propose":[62,162],"DeepRec,":[63],"a":[64,137,147,163,222],"novel":[65,122],"RS":[67],"approach":[68],"that":[69,167,211],"facilitates":[70],"autonomous":[71],"multi-turn":[72,101],"interactions":[73,196],"between":[74],"for":[78,118,203,225],"deep":[79,226],"space":[81],"exploration.":[82],"In":[83],"each":[84],"interaction":[85,177],"turn,":[86],"reason":[88],"over":[89],"user":[90],"preferences":[91],"collaborate":[93],"with":[94,150,197],"retrieve":[97],"candidate":[98],"items.":[99],"After":[100],"interaction,":[102],"rank":[104],"aggregated":[106],"candidates":[107],"generate":[109],"final":[111],"recommendations.":[112],"We":[113],"utilize":[114],"reinforcement":[115],"learning":[116],"(RL)":[117],"optimization":[119],"introduce":[121],"contributions":[123],"three":[125],"key":[126],"aspects:":[127],"model":[129],"based":[130],"data":[131,143],"rollout,":[132,144],"recommendation-oriented":[133,201],"hierarchical":[134,164],"rewards,":[135],"two-stage":[138,187],"RL":[139,184,188,202],"training":[140],"strategy.":[141],"For":[142,158,183],"design":[146],"preference-aware":[148],"TRM,":[149],"which":[151],"interact":[153],"construct":[155],"trajectory":[156],"data.":[157],"reward":[159,165],"design,":[160],"function":[166],"comprises":[168],"both":[169,215],"process-level":[170],"outcome-level":[172],"rewards":[173],"optimize":[175],"process":[178],"quality,":[181],"respectively.":[182],"training,":[185],"our":[186],"strategy":[189],"first":[190],"guides":[191],"learn":[194],"effective":[195],"TRMs,":[198],"followed":[199],"by":[200],"performance":[204],"enhancement.":[205],"Experiments":[206],"on":[207],"public":[208],"datasets":[209],"show":[210],"DeepRec":[212],"substantially":[213],"outperforms":[214],"baselines,":[220],"establishing":[221],"new":[223],"paradigm":[224],"systems.":[230]},"counts_by_year":[],"updated_date":"2025-11-08T23:25:12.792448","created_date":"2025-11-08T00:00:00"}
