{"id":"https://openalex.org/W2788295351","doi":"https://doi.org/10.1145/3219819.3219886","title":"Recommendations with Negative Feedback via Pairwise Deep Reinforcement Learning","display_name":"Recommendations with Negative Feedback via Pairwise Deep Reinforcement Learning","publication_year":2018,"publication_date":"2018-07-19","ids":{"openalex":"https://openalex.org/W2788295351","doi":"https://doi.org/10.1145/3219819.3219886","mag":"2788295351"},"language":"en","primary_location":{"id":"doi:10.1145/3219819.3219886","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3219819.3219886","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3219819.3219886","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery &amp; Data Mining","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://dl.acm.org/doi/pdf/10.1145/3219819.3219886","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100645854","display_name":"Xiangyu Zhao","orcid":"https://orcid.org/0000-0003-2926-4416"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Xiangyu Zhao","raw_affiliation_strings":["Michigan State University, East Lansing, MI, USA"],"affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing, MI, USA","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100425225","display_name":"Liang Zhang","orcid":"https://orcid.org/0000-0002-5805-7099"},"institutions":[{"id":"https://openalex.org/I4210103986","display_name":"Jingdong (China)","ror":"https://ror.org/01dkjkq64","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210103986"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Liang Zhang","raw_affiliation_strings":["JD.com, Beijing, China"],"affiliations":[{"raw_affiliation_string":"JD.com, Beijing, China","institution_ids":["https://openalex.org/I4210103986"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008043408","display_name":"Zhuoye Ding","orcid":"https://orcid.org/0000-0001-7430-5980"},"institutions":[{"id":"https://openalex.org/I4210103986","display_name":"Jingdong (China)","ror":"https://ror.org/01dkjkq64","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210103986"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhuoye Ding","raw_affiliation_strings":["JD.com, Beijing, China"],"affiliations":[{"raw_affiliation_string":"JD.com, Beijing, China","institution_ids":["https://openalex.org/I4210103986"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103251082","display_name":"Long Xia","orcid":"https://orcid.org/0000-0003-2580-6206"},"institutions":[{"id":"https://openalex.org/I4210103986","display_name":"Jingdong (China)","ror":"https://ror.org/01dkjkq64","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210103986"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Long Xia","raw_affiliation_strings":["JD.com, Beijing, China"],"affiliations":[{"raw_affiliation_string":"JD.com, Beijing, China","institution_ids":["https://openalex.org/I4210103986"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5040639891","display_name":"Jiliang Tang","orcid":"https://orcid.org/0000-0001-7125-3898"},"institutions":[{"id":"https://openalex.org/I87216513","display_name":"Michigan State University","ror":"https://ror.org/05hs6h993","country_code":"US","type":"education","lineage":["https://openalex.org/I87216513"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Jiliang Tang","raw_affiliation_strings":["Michigan State University, East Lansing, MI, USA"],"affiliations":[{"raw_affiliation_string":"Michigan State University, East Lansing, MI, USA","institution_ids":["https://openalex.org/I87216513"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5054482111","display_name":"Dawei Yin","orcid":"https://orcid.org/0000-0002-8846-2001"},"institutions":[{"id":"https://openalex.org/I4210103986","display_name":"Jingdong (China)","ror":"https://ror.org/01dkjkq64","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210103986"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dawei Yin","raw_affiliation_strings":["JD.com, Beijing, China"],"affiliations":[{"raw_affiliation_string":"JD.com, Beijing, China","institution_ids":["https://openalex.org/I4210103986"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5100645854"],"corresponding_institution_ids":["https://openalex.org/I87216513"],"apc_list":null,"apc_paid":null,"fwci":67.4311,"has_fulltext":true,"cited_by_count":386,"citation_normalized_percentile":{"value":0.9988429,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"1040","last_page":"1048"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9965999722480774,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T13274","display_name":"Expert finding and Q&A systems","score":0.9617000222206116,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.9282389879226685},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8345745801925659},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7569793462753296},{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.7510658502578735},{"id":"https://openalex.org/keywords/information-overload","display_name":"Information overload","score":0.7296454310417175},{"id":"https://openalex.org/keywords/pairwise-comparison","display_name":"Pairwise comparison","score":0.6913919448852539},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.6525102257728577},{"id":"https://openalex.org/keywords/negative-feedback","display_name":"Negative feedback","score":0.4737587571144104},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4673844575881958},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.45486775040626526},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4439196288585663},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.4358013868331909},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4195908308029175},{"id":"https://openalex.org/keywords/collaborative-filtering","display_name":"Collaborative filtering","score":0.41312795877456665},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.18443679809570312},{"id":"https://openalex.org/keywords/database","display_name":"Database","score":0.08108049631118774}],"concepts":[{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.9282389879226685},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8345745801925659},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7569793462753296},{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.7510658502578735},{"id":"https://openalex.org/C186625053","wikidata":"https://www.wikidata.org/wiki/Q1130191","display_name":"Information overload","level":2,"score":0.7296454310417175},{"id":"https://openalex.org/C184898388","wikidata":"https://www.wikidata.org/wiki/Q1435712","display_name":"Pairwise comparison","level":2,"score":0.6913919448852539},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.6525102257728577},{"id":"https://openalex.org/C93586867","wikidata":"https://www.wikidata.org/wiki/Q62527","display_name":"Negative feedback","level":3,"score":0.4737587571144104},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4673844575881958},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.45486775040626526},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4439196288585663},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.4358013868331909},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4195908308029175},{"id":"https://openalex.org/C21569690","wikidata":"https://www.wikidata.org/wiki/Q94702","display_name":"Collaborative filtering","level":3,"score":0.41312795877456665},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.18443679809570312},{"id":"https://openalex.org/C77088390","wikidata":"https://www.wikidata.org/wiki/Q8513","display_name":"Database","level":1,"score":0.08108049631118774},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1145/3219819.3219886","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3219819.3219886","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3219819.3219886","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery &amp; Data Mining","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:1802.06501","is_oa":true,"landing_page_url":"http://arxiv.org/abs/1802.06501","pdf_url":"https://arxiv.org/pdf/1802.06501","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"}],"best_oa_location":{"id":"doi:10.1145/3219819.3219886","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3219819.3219886","pdf_url":"https://dl.acm.org/doi/pdf/10.1145/3219819.3219886","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 24th ACM SIGKDD International Conference on Knowledge Discovery &amp; Data Mining","raw_type":"proceedings-article"},"sustainable_development_goals":[{"display_name":"Partnerships for the goals","score":0.4000000059604645,"id":"https://metadata.un.org/sdg/17"}],"awards":[{"id":"https://openalex.org/G2673388003","display_name":null,"funder_award_id":"IIS-1714741 and IIS-1715940","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5495925939","display_name":"III: Small: Unsupervised Feature Selection in the Era of Big Data","funder_award_id":"1714741","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G5921281487","display_name":null,"funder_award_id":"number","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7110045","display_name":null,"funder_award_id":"IIS-1714741","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7773032749","display_name":"III: Small: Collaborative Research: A General Feature Learning Framework for Dynamic Attributed Networks","funder_award_id":"1715940","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G848032724","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G8783789473","display_name":null,"funder_award_id":"IIS-1715940","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":true,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2788295351.pdf","grobid_xml":"https://content.openalex.org/works/W2788295351.grobid-xml"},"referenced_works_count":44,"referenced_works":["https://openalex.org/W91039700","https://openalex.org/W190893902","https://openalex.org/W281665770","https://openalex.org/W1486317198","https://openalex.org/W1512919909","https://openalex.org/W1595483645","https://openalex.org/W1601974704","https://openalex.org/W1757796397","https://openalex.org/W2024320089","https://openalex.org/W2026784708","https://openalex.org/W2048226872","https://openalex.org/W2069870183","https://openalex.org/W2101984404","https://openalex.org/W2110325612","https://openalex.org/W2117911558","https://openalex.org/W2125031621","https://openalex.org/W2127480961","https://openalex.org/W2135263912","https://openalex.org/W2137063737","https://openalex.org/W2138108551","https://openalex.org/W2159094788","https://openalex.org/W2169783907","https://openalex.org/W2189395077","https://openalex.org/W2262817822","https://openalex.org/W2295739661","https://openalex.org/W2341171179","https://openalex.org/W2341865734","https://openalex.org/W2422675628","https://openalex.org/W2605794033","https://openalex.org/W2767807341","https://openalex.org/W2781763969","https://openalex.org/W2799231033","https://openalex.org/W2799544270","https://openalex.org/W2908054697","https://openalex.org/W2950332743","https://openalex.org/W2953132212","https://openalex.org/W2953334758","https://openalex.org/W3023151133","https://openalex.org/W3122507327","https://openalex.org/W4232449914","https://openalex.org/W4245108548","https://openalex.org/W4298857966","https://openalex.org/W4299286960","https://openalex.org/W4323654227"],"related_works":["https://openalex.org/W1547737580","https://openalex.org/W2002205901","https://openalex.org/W2098758514","https://openalex.org/W2798828231","https://openalex.org/W2186523884","https://openalex.org/W4376849821","https://openalex.org/W2066036313","https://openalex.org/W2548120918","https://openalex.org/W2159151314","https://openalex.org/W2144867296"],"abstract_inverted_index":{"Recommender":[0],"systems":[1,26],"play":[2],"a":[3,32,39,47,72,76,157],"crucial":[4],"role":[5],"in":[6,201],"mitigating":[7],"the":[8,28,52,60,66,89,124,164,180,183,193],"problem":[9],"of":[10,23,54,99,115,126,134,182,195],"information":[11],"overload":[12],"by":[13,149],"suggesting":[14],"users'":[15,103],"personalized":[16],"items":[17,95,101],"or":[18],"services.":[19],"The":[20,171],"vast":[21],"majority":[22],"traditional":[24],"recommender":[25,49,73,167],"consider":[27],"recommendation":[29],"procedure":[30],"as":[31,75],"static":[33],"process":[34],"and":[35,71,81,96,110,112,198],"make":[36],"recommendations":[37],"following":[38],"fixed":[40],"strategy.":[41],"In":[42,152],"this":[43,153],"paper,":[44,154],"we":[45,155],"propose":[46],"novel":[48,158],"system":[50,74,168],"with":[51,62],"capability":[53],"continuously":[55],"improving":[56],"its":[57],"strategies":[58,91],"during":[59],"interactions":[61,68],"users.":[63],"We":[64],"model":[65],"sequential":[67],"between":[69],"users":[70],"Markov":[77],"Decision":[78],"Process":[79],"(MDP)":[80],"leverage":[82],"Reinforcement":[83],"Learning":[84],"(RL)":[85],"to":[86,120,160,191],"automatically":[87],"learn":[88],"optimal":[90],"via":[92],"recommending":[93],"trial-and-error":[94],"receiving":[97],"reinforcements":[98],"these":[100],"from":[102],"feedback.":[104],"Users'":[105],"feedback":[106,116,128,145,200],"can":[107],"be":[108,147],"positive":[109,135,144,197],"negative":[111,127,150,199],"both":[113,196],"types":[114],"have":[117,188],"great":[118],"potentials":[119],"boost":[121],"recommendations.":[122,202],"However,":[123],"number":[125],"is":[129,141],"much":[130],"larger":[131],"than":[132],"that":[133],"one;":[136],"thus":[137],"incorporating":[138],"them":[139,162],"simultaneously":[140],"challenging":[142],"since":[143],"could":[146],"buried":[148],"one.":[151],"develop":[156],"approach":[159],"incorporate":[161],"into":[163],"proposed":[165,184],"deep":[166],"(DEERS)":[169],"framework.":[170,185],"experimental":[172],"results":[173],"based":[174],"on":[175],"real-world":[176],"e-commerce":[177],"data":[178],"demonstrate":[179],"effectiveness":[181],"Further":[186],"experiments":[187],"been":[189],"conducted":[190],"understand":[192],"importance":[194]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":46},{"year":2024,"cited_by_count":48},{"year":2023,"cited_by_count":59},{"year":2022,"cited_by_count":62},{"year":2021,"cited_by_count":71},{"year":2020,"cited_by_count":52},{"year":2019,"cited_by_count":37},{"year":2018,"cited_by_count":4},{"year":2017,"cited_by_count":2}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
