{"id":"https://openalex.org/W2963619374","doi":"https://doi.org/10.1609/aaai.v33i01.33013312","title":"Large-Scale Interactive Recommendation with Tree-Structured Policy Gradient","display_name":"Large-Scale Interactive Recommendation with Tree-Structured Policy Gradient","publication_year":2019,"publication_date":"2019-07-17","ids":{"openalex":"https://openalex.org/W2963619374","doi":"https://doi.org/10.1609/aaai.v33i01.33013312","mag":"2963619374"},"language":"en","primary_location":{"id":"doi:10.1609/aaai.v33i01.33013312","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33013312","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4204/4082","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4204/4082","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045308982","display_name":"Haokun Chen","orcid":"https://orcid.org/0000-0002-5485-2984"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Haokun Chen","raw_affiliation_strings":["Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012370987","display_name":"Xinyi Dai","orcid":"https://orcid.org/0000-0002-3351-5401"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinyi Dai","raw_affiliation_strings":["Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087929301","display_name":"Han Cai","orcid":"https://orcid.org/0000-0002-4906-1192"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Han Cai","raw_affiliation_strings":["Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090720315","display_name":"Weinan Zhang","orcid":"https://orcid.org/0000-0002-0127-2425"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Weinan Zhang","raw_affiliation_strings":["Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101935089","display_name":"Xuejian Wang","orcid":"https://orcid.org/0000-0002-8655-2062"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuejian Wang","raw_affiliation_strings":["Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054330014","display_name":"Ruiming Tang","orcid":"https://orcid.org/0000-0002-9224-2431"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ruiming Tang","raw_affiliation_strings":["Huawei"],"affiliations":[{"raw_affiliation_string":"Huawei","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101668018","display_name":"Yuzhou Zhang","orcid":"https://orcid.org/0000-0001-8515-3388"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yuzhou Zhang","raw_affiliation_strings":["Huawei"],"affiliations":[{"raw_affiliation_string":"Huawei","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001571390","display_name":"Yong Yu","orcid":"https://orcid.org/0000-0003-0281-8271"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yong Yu","raw_affiliation_strings":["Shanghai Jiao Tong University"],"affiliations":[{"raw_affiliation_string":"Shanghai Jiao Tong University","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5045308982"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":28.6809,"has_fulltext":true,"cited_by_count":131,"citation_normalized_percentile":{"value":0.99589372,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"33","issue":"01","first_page":"3312","last_page":"3320"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9894999861717224,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8227670192718506},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7447032928466797},{"id":"https://openalex.org/keywords/tree","display_name":"Tree (set theory)","score":0.6718987226486206},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.6089958548545837},{"id":"https://openalex.org/keywords/action","display_name":"Action (physics)","score":0.5717336535453796},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.546241819858551},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48288726806640625},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4557061791419983},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.4427903890609741},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4309063255786896},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.416853666305542},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.09045624732971191}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8227670192718506},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7447032928466797},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.6718987226486206},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.6089958548545837},{"id":"https://openalex.org/C2780791683","wikidata":"https://www.wikidata.org/wiki/Q846785","display_name":"Action (physics)","level":2,"score":0.5717336535453796},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.546241819858551},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48288726806640625},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4557061791419983},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.4427903890609741},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4309063255786896},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.416853666305542},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.09045624732971191},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1609/aaai.v33i01.33013312","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33013312","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4204/4082","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1609/aaai.v33i01.33013312","is_oa":true,"landing_page_url":"https://doi.org/10.1609/aaai.v33i01.33013312","pdf_url":"https://ojs.aaai.org/index.php/AAAI/article/download/4204/4082","source":{"id":"https://openalex.org/S4210191458","display_name":"Proceedings of the AAAI Conference on Artificial Intelligence","issn_l":"2159-5399","issn":["2159-5399","2374-3468"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/P4310320058","host_organization_name":"Association for the Advancement of Artificial Intelligence","host_organization_lineage":["https://openalex.org/P4310320058"],"host_organization_lineage_names":["Association for the Advancement of Artificial Intelligence"],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the AAAI Conference on Artificial Intelligence","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G129499350","display_name":null,"funder_award_id":"61632017","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2702356746","display_name":null,"funder_award_id":"61702","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3256823474","display_name":null,"funder_award_id":"61702327","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4433206528","display_name":null,"funder_award_id":"61772333","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8605162970","display_name":null,"funder_award_id":"61632017, 61702327, 61772333","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2963619374.pdf","grobid_xml":"https://content.openalex.org/works/W2963619374.grobid-xml"},"referenced_works_count":32,"referenced_works":["https://openalex.org/W91851626","https://openalex.org/W1959608418","https://openalex.org/W2054141820","https://openalex.org/W2091780923","https://openalex.org/W2108738385","https://openalex.org/W2112420033","https://openalex.org/W2119717200","https://openalex.org/W2126552603","https://openalex.org/W2127480961","https://openalex.org/W2145339207","https://openalex.org/W2155027007","https://openalex.org/W2182342230","https://openalex.org/W2215378786","https://openalex.org/W2257979135","https://openalex.org/W2358698356","https://openalex.org/W2470873417","https://openalex.org/W2532022121","https://openalex.org/W2604822632","https://openalex.org/W2741274947","https://openalex.org/W2751185861","https://openalex.org/W2769883686","https://openalex.org/W2788125442","https://openalex.org/W2788295351","https://openalex.org/W2790532312","https://openalex.org/W2799544270","https://openalex.org/W2963864421","https://openalex.org/W3105140685","https://openalex.org/W4214717370","https://openalex.org/W4230563027","https://openalex.org/W6673543734","https://openalex.org/W6676077707","https://openalex.org/W6728105236"],"related_works":["https://openalex.org/W4390273403","https://openalex.org/W4386781444","https://openalex.org/W3092950680","https://openalex.org/W4246980185","https://openalex.org/W2150182025","https://openalex.org/W3197542405","https://openalex.org/W2418190244","https://openalex.org/W4238861846","https://openalex.org/W3125580266","https://openalex.org/W44246808"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,17],"(RL)":[2],"has":[3],"recently":[4],"been":[5],"introduced":[6],"to":[7,34,46,64,148],"interactive":[8],"recommender":[9],"systems":[10],"(IRS)":[11],"because":[12],"of":[13,16,32,38,92,152],"its":[14],"nature":[15],"from":[18,82,145],"dynamic":[19],"interactions":[20],"and":[21,55,96,105,109,135,173],"planning":[22],"for":[23],"long-run":[24],"performance.":[25],"As":[26],"IRS":[27],"is":[28,130,139],"always":[29],"with":[30,66],"thousands":[31,37],"items":[33,134],"recommend":[35],"(i.e.,":[36],"actions),":[39],"most":[40],"existing":[41,60],"RL-based":[42],"methods,":[43],"however,":[44],"fail":[45],"handle":[47],"such":[48,103],"a":[49,117,125,143,149],"large":[50,68],"discrete":[51,69,99],"action":[52,70,88],"space":[53,71],"problem":[54,72],"thus":[56],"become":[57],"inefficient.":[58],"The":[59],"work":[61],"that":[62,166],"tries":[63],"deal":[65],"the":[67,75,83,86,93,97,133,146,153],"by":[73],"utilizing":[74],"deep":[76],"deterministic":[77],"policy":[78],"gradient":[79],"framework":[80],"suffers":[81],"inconsistency":[84,104],"between":[85],"continuous":[87],"representation":[89],"(the":[90],"output":[91],"actor":[94],"network)":[95],"real":[98],"action.":[100],"To":[101],"avoid":[102],"achieve":[106],"high":[107],"efficiency":[108,175],"recommendation":[110,171],"effectiveness,":[111],"in":[112],"this":[113],"paper,":[114],"we":[115],"propose":[116],"Tree-structured":[118],"Policy":[119],"Gradient":[120],"Recommendation":[121],"(TPGR)":[122],"framework,":[123],"where":[124],"balanced":[126],"hierarchical":[127],"clustering":[128],"tree":[129],"built":[131],"over":[132,177],"picking":[136],"an":[137],"item":[138],"formulated":[140],"as":[141],"seeking":[142],"path":[144],"root":[147],"certain":[150],"leaf":[151],"tree.":[154],"Extensive":[155],"experiments":[156],"on":[157,161],"carefully-designed":[158],"environments":[159],"based":[160],"two":[162],"real-world":[163],"datasets":[164],"demonstrate":[165],"our":[167],"model":[168],"provides":[169],"superior":[170],"performance":[172],"significant":[174],"improvement":[176],"state-of-the-art":[178],"methods.":[179]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":10},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":31},{"year":2022,"cited_by_count":25},{"year":2021,"cited_by_count":26},{"year":2020,"cited_by_count":22},{"year":2019,"cited_by_count":3}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
