{"id":"https://openalex.org/W3209481761","doi":"https://doi.org/10.1145/3459637.3481917","title":"Explore, Filter and Distill","display_name":"Explore, Filter and Distill","publication_year":2021,"publication_date":"2021-10-26","ids":{"openalex":"https://openalex.org/W3209481761","doi":"https://doi.org/10.1145/3459637.3481917","mag":"3209481761"},"language":"en","primary_location":{"id":"doi:10.1145/3459637.3481917","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3459637.3481917","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101577090","display_name":"Ruobing Xie","orcid":"https://orcid.org/0000-0003-3170-5647"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ruobing Xie","raw_affiliation_strings":["WeChat, Tencent, Beijing, China"],"affiliations":[{"raw_affiliation_string":"WeChat, Tencent, Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101432489","display_name":"Shaoliang Zhang","orcid":"https://orcid.org/0000-0002-3079-3377"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaoliang Zhang","raw_affiliation_strings":["WeChat, Tencent, Beijing, China"],"affiliations":[{"raw_affiliation_string":"WeChat, Tencent, Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100431163","display_name":"Rui Wang","orcid":"https://orcid.org/0000-0001-9048-2979"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Rui Wang","raw_affiliation_strings":["WeChat, Tencent, Beijing, China"],"affiliations":[{"raw_affiliation_string":"WeChat, Tencent, Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102973664","display_name":"Feng Xia","orcid":"https://orcid.org/0000-0001-5279-9908"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Xia","raw_affiliation_strings":["WeChat, Tencent, Beijing, China"],"affiliations":[{"raw_affiliation_string":"WeChat, Tencent, Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5023086553","display_name":"Leyu Lin","orcid":"https://orcid.org/0000-0001-5471-500X"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Leyu Lin","raw_affiliation_strings":["WeChat, Tencent, Beijing, China"],"affiliations":[{"raw_affiliation_string":"WeChat, Tencent, Beijing, China","institution_ids":["https://openalex.org/I2250653659"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101577090"],"corresponding_institution_ids":["https://openalex.org/I2250653659"],"apc_list":null,"apc_paid":null,"fwci":0.8262,"has_fulltext":false,"cited_by_count":8,"citation_normalized_percentile":{"value":0.7950531,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"4243","last_page":"4252"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.998199999332428,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9818000197410583,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7995824813842773},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7333821058273315},{"id":"https://openalex.org/keywords/divergence","display_name":"Divergence (linguistics)","score":0.6100351810455322},{"id":"https://openalex.org/keywords/filter","display_name":"Filter (signal processing)","score":0.5606746077537537},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.512024462223053},{"id":"https://openalex.org/keywords/recommender-system","display_name":"Recommender system","score":0.4879016578197479},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4832116365432739},{"id":"https://openalex.org/keywords/space","display_name":"Space (punctuation)","score":0.45946595072746277},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.3606678247451782},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.31612429022789}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7995824813842773},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7333821058273315},{"id":"https://openalex.org/C207390915","wikidata":"https://www.wikidata.org/wiki/Q1230525","display_name":"Divergence (linguistics)","level":2,"score":0.6100351810455322},{"id":"https://openalex.org/C106131492","wikidata":"https://www.wikidata.org/wiki/Q3072260","display_name":"Filter (signal processing)","level":2,"score":0.5606746077537537},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.512024462223053},{"id":"https://openalex.org/C557471498","wikidata":"https://www.wikidata.org/wiki/Q554950","display_name":"Recommender system","level":2,"score":0.4879016578197479},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4832116365432739},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.45946595072746277},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3606678247451782},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31612429022789},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.0},{"id":"https://openalex.org/C178790620","wikidata":"https://www.wikidata.org/wiki/Q11351","display_name":"Organic chemistry","level":1,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3459637.3481917","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3459637.3481917","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 30th ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","score":0.6600000262260437,"id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":31,"referenced_works":["https://openalex.org/W2295739661","https://openalex.org/W2475334473","https://openalex.org/W2512971201","https://openalex.org/W2604662567","https://openalex.org/W2723293840","https://openalex.org/W2739879705","https://openalex.org/W2747909401","https://openalex.org/W2787933113","https://openalex.org/W2799544270","https://openalex.org/W2808847742","https://openalex.org/W2897405591","https://openalex.org/W2898085636","https://openalex.org/W2903574258","https://openalex.org/W2904340070","https://openalex.org/W2963323306","https://openalex.org/W2963842088","https://openalex.org/W2964052347","https://openalex.org/W2984100107","https://openalex.org/W2997130580","https://openalex.org/W3034345128","https://openalex.org/W3034457371","https://openalex.org/W3035084859","https://openalex.org/W3035313290","https://openalex.org/W3035404611","https://openalex.org/W3088966581","https://openalex.org/W3093502611","https://openalex.org/W3101704389","https://openalex.org/W3102899483","https://openalex.org/W3110945790","https://openalex.org/W3153675609","https://openalex.org/W3170587616"],"related_works":["https://openalex.org/W4390273403","https://openalex.org/W4386781444","https://openalex.org/W3092950680","https://openalex.org/W4246980185","https://openalex.org/W2150182025","https://openalex.org/W4317039510","https://openalex.org/W3197542405","https://openalex.org/W2418190244","https://openalex.org/W4238861846","https://openalex.org/W3125580266"],"abstract_inverted_index":{"Reinforcement":[0],"learning":[1,96],"(RL)":[2],"has":[3,188],"been":[4,189],"verified":[5],"in":[6,37,109,182,209],"real-world":[7],"list-wise":[8,110,151],"recommendation.":[9,111],"However,":[10,39],"RL-based":[11,40],"recommendation":[12,99,185],"suffers":[13],"from":[14,79,131],"huge":[15],"memory":[16],"and":[17,72,107,117,134,146,155,179],"computation":[18],"costs":[19],"due":[20,52],"to":[21,53,83,103,161],"its":[22],"large-scale":[23],"models.":[24,66],"Knowledge":[25],"distillation":[26,142],"(KD)":[27],"is":[28],"an":[29,115],"effective":[30],"approach":[31],"for":[32,98,169,195],"model":[33],"compression":[34],"widely":[35],"used":[36],"practice.":[38],"models":[41],"strongly":[42],"rely":[43],"on":[44,47,176,191],"sufficient":[45],"explorations":[46],"the":[48,54,60,68,75,121,127,165],"enormous":[49],"user-item":[50],"space":[51],"data":[55],"sparsity":[56],"issue,":[57],"which":[58,101,123,159],"multiplies":[59],"challenges":[61],"of":[62,202],"KD":[63],"with":[64,149],"RL":[65],"What":[67],"teacher":[69,128],"should":[70,77,129,167],"teach":[71,130],"how":[73,163],"much":[74,164],"student":[76,166],"learn":[78,168],"each":[80,170],"lesson":[81],"need":[82],"be":[84],"carefully":[85],"designed.":[86],"In":[87],"this":[88],"work,":[89],"we":[90,113],"propose":[91,114],"a":[92,140,150,156,183],"novel":[93],"Distilled":[94],"reinforcement":[95],"framework":[97],"(DRL-Rec),":[100],"aims":[102,160],"improve":[104],"both":[105,132,144,177],"effectiveness":[106],"efficiency":[108],"Specifically,":[112],"Exploring":[116],"filtering":[118],"module":[119],"before":[120],"distillation,":[122],"decides":[124],"what":[125],"lessons":[126],"teachers'":[133],"students'":[135],"aspects.":[136],"We":[137,172],"also":[138],"conduct":[139],"Confidence-guided":[141],"at":[143],"output":[145],"intermediate":[147],"levels":[148],"KL":[152],"divergence":[153],"loss":[154],"Hint":[157],"loss,":[158],"understand":[162],"lesson.":[171],"achieve":[173],"significant":[174],"improvements":[175],"offline":[178],"online":[180],"evaluations":[181],"well-known":[184],"system.":[186],"DRL-Rec":[187],"deployed":[190],"WeChat":[192],"Top":[193],"Stories":[194],"more":[196],"than":[197],"six":[198],"months,":[199],"affecting":[200],"millions":[201],"users.":[203],"The":[204],"source":[205],"codes":[206],"are":[207],"released":[208],"https://github.com/modriczhang/DRL-Rec.":[210]},"counts_by_year":[{"year":2025,"cited_by_count":5},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
