{"id":"https://openalex.org/W4318147827","doi":"https://doi.org/10.1109/bigdata55660.2022.10020921","title":"Collaborative Filtering Guided Deep Reinforcement Learning for Sequential Recommendations","display_name":"Collaborative Filtering Guided Deep Reinforcement Learning for Sequential Recommendations","publication_year":2022,"publication_date":"2022-12-17","ids":{"openalex":"https://openalex.org/W4318147827","doi":"https://doi.org/10.1109/bigdata55660.2022.10020921"},"language":"en","primary_location":{"id":"doi:10.1109/bigdata55660.2022.10020921","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/bigdata55660.2022.10020921","pdf_url":null,"source":{"id":"https://openalex.org/S4363607709","display_name":"2022 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5030591692","display_name":"Vahid Azizi","orcid":"https://orcid.org/0000-0002-5640-8799"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Vahid Azizi","raw_affiliation_strings":["Adobe Inc,San Jose,USA","Adobe Inc, San Jose, USA"],"affiliations":[{"raw_affiliation_string":"Adobe Inc,San Jose,USA","institution_ids":["https://openalex.org/I1306409833"]},{"raw_affiliation_string":"Adobe Inc, San Jose, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003506066","display_name":"Saayan Mitra","orcid":"https://orcid.org/0000-0002-4048-2142"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Saayan Mitra","raw_affiliation_strings":["Adobe Research,San Jose,USA","Adobe Research, San Jose, USA"],"affiliations":[{"raw_affiliation_string":"Adobe Research,San Jose,USA","institution_ids":["https://openalex.org/I1306409833"]},{"raw_affiliation_string":"Adobe Research, San Jose, USA","institution_ids":["https://openalex.org/I1306409833"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100441911","display_name":"Xiang Chen","orcid":"https://orcid.org/0000-0002-1180-3891"},"institutions":[{"id":"https://openalex.org/I1306409833","display_name":"Adobe Systems (United States)","ror":"https://ror.org/059tvcg64","country_code":"US","type":"company","lineage":["https://openalex.org/I1306409833"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Xiang Chen","raw_affiliation_strings":["Adobe Research,San Jose,USA","Adobe Research, San Jose, USA"],"affiliations":[{"raw_affiliation_string":"Adobe Research,San Jose,USA","institution_ids":["https://openalex.org/I1306409833"]},{"raw_affiliation_string":"Adobe Research, San Jose, USA","institution_ids":["https://openalex.org/I1306409833"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5030591692"],"corresponding_institution_ids":["https://openalex.org/I1306409833"],"apc_list":null,"apc_paid":null,"fwci":0.1457,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.462442,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9509000182151794,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8248914480209351},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8108276128768921},{"id":"https://openalex.org/keywords/intuition","display_name":"Intuition","score":0.7170174717903137},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.6823517084121704},{"id":"https://openalex.org/keywords/collaborative-filtering","display_name":"Collaborative filtering","score":0.6516212224960327},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5272437930107117},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4725513160228729},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.43068766593933105},{"id":"https://openalex.org/keywords/term","display_name":"Term (time)","score":0.42102867364883423},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.09736159443855286},{"id":"https://openalex.org/keywords/cognitive-science","display_name":"Cognitive science","score":0.07531484961509705}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8248914480209351},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8108276128768921},{"id":"https://openalex.org/C132010649","wikidata":"https://www.wikidata.org/wiki/Q189222","display_name":"Intuition","level":2,"score":0.7170174717903137},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.6823517084121704},{"id":"https://openalex.org/C21569690","wikidata":"https://www.wikidata.org/wiki/Q94702","display_name":"Collaborative filtering","level":3,"score":0.6516212224960327},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5272437930107117},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4725513160228729},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.43068766593933105},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.42102867364883423},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.09736159443855286},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.07531484961509705},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/bigdata55660.2022.10020921","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/bigdata55660.2022.10020921","pdf_url":null,"source":{"id":"https://openalex.org/S4363607709","display_name":"2022 IEEE International Conference on Big Data (Big Data)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 IEEE International Conference on Big Data (Big Data)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6899999976158142,"id":"https://metadata.un.org/sdg/16","display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1191599655","https://openalex.org/W1487320471","https://openalex.org/W1788292133","https://openalex.org/W1924770834","https://openalex.org/W2024320089","https://openalex.org/W2026784708","https://openalex.org/W2027731328","https://openalex.org/W2042281163","https://openalex.org/W2054141820","https://openalex.org/W2071133755","https://openalex.org/W2100235918","https://openalex.org/W2107878631","https://openalex.org/W2116261113","https://openalex.org/W2117311203","https://openalex.org/W2127480961","https://openalex.org/W2138108551","https://openalex.org/W2295739661","https://openalex.org/W2475334473","https://openalex.org/W2509235963","https://openalex.org/W2532022121","https://openalex.org/W2604662567","https://openalex.org/W2606642831","https://openalex.org/W2787933113","https://openalex.org/W2787938642","https://openalex.org/W2788295351","https://openalex.org/W2793768763","https://openalex.org/W2799544270","https://openalex.org/W2898273872","https://openalex.org/W2963149042","https://openalex.org/W2964108915","https://openalex.org/W3035170973","https://openalex.org/W3100789280","https://openalex.org/W3102778384","https://openalex.org/W3102899483","https://openalex.org/W3104030692","https://openalex.org/W4214717370","https://openalex.org/W4288083766","https://openalex.org/W4297971002","https://openalex.org/W6627932998","https://openalex.org/W6629353124","https://openalex.org/W6630221451","https://openalex.org/W6640212811","https://openalex.org/W6685670348","https://openalex.org/W6737073507","https://openalex.org/W6748839928","https://openalex.org/W6755373136","https://openalex.org/W6917172014"],"related_works":["https://openalex.org/W1484355083","https://openalex.org/W2772628444","https://openalex.org/W4220714703","https://openalex.org/W2735929803","https://openalex.org/W2170391450","https://openalex.org/W2098758514","https://openalex.org/W3008845055","https://openalex.org/W2041004656","https://openalex.org/W4376854386","https://openalex.org/W1966742602"],"abstract_inverted_index":{"Earlier":[0],"recommendation":[1,36,82,136,152],"techniques,":[2],"such":[3],"as":[4,84,118,120],"Collaborative":[5],"Filtering":[6],"(CF),":[7],"assume":[8,57],"the":[9,21,46,67,74,77,140,146,151,165,170,180,227],"users\u2019":[10,40,93,113,161,206,213],"preferences":[11,41,214],"do":[12,64],"not":[13,65],"change":[14],"over":[15,42],"time":[16,43],"and":[17,44,63,100,163,186,208,222],"strive":[18],"to":[19,33,96,104,138,158,160,192,211],"maximize":[20,45,164],"immediate":[22],"reward.":[23,48,167],"In":[24,109],"recent":[25],"studies,":[26],"Reinforcement":[27,133],"Learning":[28,134],"(RL)":[29],"has":[30],"been":[31],"used":[32,103],"make":[34],"interactive":[35],"systems":[37],"that":[38,58,172],"capture":[39],"long-term":[47,166],"However,":[49],"these":[50],"methods":[51,89],"have":[52],"two":[53,223],"limitations.":[54],"First,":[55],"they":[56],"items":[59,80,183],"are":[60],"independently":[61],"distributed":[62],"consider":[66],"relations":[68,78,181],"between":[69,79,182],"items.":[70],"This":[71],"assumption":[72],"ignores":[73],"power":[75],"of":[76,197,229],"for":[81,124],"systems,":[83],"demonstrated":[85],"by":[86,169],"CF.":[87],"RL-based":[88],"rely":[90],"primarily":[91],"on":[92,204],"positive":[94,122,207],"feedback":[95,115,123,210],"understand":[97,212],"their":[98,106,121,126],"preferences,":[99],"sampling":[101],"is":[102,116],"incorporate":[105],"negative":[107,114,198,209],"feedback.":[108],"a":[110,130,154],"practical":[111],"setting,":[112],"just":[117],"crucial":[119],"understanding":[125],"preferences.":[127],"We":[128,143],"present":[129],"novel":[131],"Deep":[132],"(DRL)":[135],"framework":[137,191,202],"address":[139],"limitations":[141],"above.":[142],"specifically":[144],"utilize":[145],"actor-critic":[147],"paradigm,":[148],"which":[149],"considers":[150],"problem":[153],"sequential":[155],"decision-making":[156],"process":[157],"adapt":[159],"behaviors":[162],"Motivated":[168],"intuition":[171],"similar":[173,176],"users":[174],"like":[175],"items,":[177],"we":[178],"extract":[179],"using":[184],"CF":[185],"integrate":[187],"it":[188],"into":[189],"our":[190,200,220,230],"boost":[193],"overall":[194],"performance.":[195],"Instead":[196],"sampling,":[199],"proposed":[201,231],"relies":[203],"all":[205],"more":[215],"accurately.":[216],"Extensive":[217],"experiments":[218],"with":[219],"dataset":[221],"public":[224],"datasets":[225],"demonstrate":[226],"effectiveness":[228],"framework.":[232]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2025-12-24T23:09:58.560324","created_date":"2025-10-10T00:00:00"}
