{"id":"https://openalex.org/W4306317659","doi":"https://doi.org/10.1145/3511808.3557611","title":"Hybrid Transfer in Deep Reinforcement Learning for Ads Allocation","display_name":"Hybrid Transfer in Deep Reinforcement Learning for Ads Allocation","publication_year":2022,"publication_date":"2022-10-16","ids":{"openalex":"https://openalex.org/W4306317659","doi":"https://doi.org/10.1145/3511808.3557611"},"language":"en","primary_location":{"id":"doi:10.1145/3511808.3557611","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3511808.3557611","pdf_url":null,"source":{"id":"https://openalex.org/S4363608762","display_name":"Proceedings of the 31st ACM International Conference on Information &amp; Knowledge Management","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100443565","display_name":"Ze Wang","orcid":"https://orcid.org/0009-0004-6220-4938"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Ze Wang","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5036945708","display_name":"Guogang Liao","orcid":"https://orcid.org/0009-0002-6530-7102"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guogang Liao","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064189829","display_name":"Xiaowen Shi","orcid":"https://orcid.org/0000-0001-6532-4522"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaowen Shi","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027645208","display_name":"Xiaoxu Wu","orcid":"https://orcid.org/0000-0003-0598-4697"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoxu Wu","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5080460228","display_name":"Chuheng Zhang","orcid":null},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chuheng Zhang","raw_affiliation_strings":["Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103324082","display_name":"Bingqi Zhu","orcid":"https://orcid.org/0009-0006-9127-2029"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bingqi Zhu","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109602541","display_name":"Yongkang Wang","orcid":"https://orcid.org/0000-0003-0192-3539"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yongkang Wang","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100673283","display_name":"Xingxing Wang","orcid":"https://orcid.org/0000-0003-4437-5229"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingxing Wang","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100391416","display_name":"Dong Wang","orcid":"https://orcid.org/0000-0001-6928-8725"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dong Wang","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5100443565"],"corresponding_institution_ids":["https://openalex.org/I4210087373"],"apc_list":null,"apc_paid":null,"fwci":2.7057,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.91554054,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"4560","last_page":"4564"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11161","display_name":"Consumer Market Behavior and Pricing","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1406","display_name":"Marketing"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11161","display_name":"Consumer Market Behavior and Pricing","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1406","display_name":"Marketing"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10203","display_name":"Recommender Systems and Techniques","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11942","display_name":"Transportation and Mobility Innovations","score":0.9797999858856201,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7584754228591919},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7234310507774353},{"id":"https://openalex.org/keywords/transfer-of-learning","display_name":"Transfer of learning","score":0.6611092686653137},{"id":"https://openalex.org/keywords/revenue","display_name":"Revenue","score":0.6492533683776855},{"id":"https://openalex.org/keywords/similarity","display_name":"Similarity (geometry)","score":0.6389707922935486},{"id":"https://openalex.org/keywords/notice","display_name":"Notice","score":0.5961098670959473},{"id":"https://openalex.org/keywords/transfer","display_name":"Transfer (computing)","score":0.5069646835327148},{"id":"https://openalex.org/keywords/data-transmission","display_name":"Data transmission","score":0.4342370629310608},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.27315497398376465},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.1873631775379181},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.0721038281917572}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7584754228591919},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7234310507774353},{"id":"https://openalex.org/C150899416","wikidata":"https://www.wikidata.org/wiki/Q1820378","display_name":"Transfer of learning","level":2,"score":0.6611092686653137},{"id":"https://openalex.org/C195487862","wikidata":"https://www.wikidata.org/wiki/Q850210","display_name":"Revenue","level":2,"score":0.6492533683776855},{"id":"https://openalex.org/C103278499","wikidata":"https://www.wikidata.org/wiki/Q254465","display_name":"Similarity (geometry)","level":3,"score":0.6389707922935486},{"id":"https://openalex.org/C2779913896","wikidata":"https://www.wikidata.org/wiki/Q7063001","display_name":"Notice","level":2,"score":0.5961098670959473},{"id":"https://openalex.org/C2776175482","wikidata":"https://www.wikidata.org/wiki/Q1195816","display_name":"Transfer (computing)","level":2,"score":0.5069646835327148},{"id":"https://openalex.org/C557945733","wikidata":"https://www.wikidata.org/wiki/Q389772","display_name":"Data transmission","level":2,"score":0.4342370629310608},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.27315497398376465},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.1873631775379181},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.0721038281917572},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.0},{"id":"https://openalex.org/C121955636","wikidata":"https://www.wikidata.org/wiki/Q4116214","display_name":"Accounting","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3511808.3557611","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3511808.3557611","pdf_url":null,"source":{"id":"https://openalex.org/S4363608762","display_name":"Proceedings of the 31st ACM International Conference on Information &amp; Knowledge Management","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 31st ACM International Conference on Information &amp; Knowledge Management","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W102349725","https://openalex.org/W2056716515","https://openalex.org/W2765302304","https://openalex.org/W2797234205","https://openalex.org/W2799173935","https://openalex.org/W2965163470","https://openalex.org/W3007094061","https://openalex.org/W3080386552","https://openalex.org/W3094577760","https://openalex.org/W3103141630","https://openalex.org/W3110995086","https://openalex.org/W3157410348","https://openalex.org/W3167957332","https://openalex.org/W3173331009","https://openalex.org/W3200113042","https://openalex.org/W4247154108"],"related_works":["https://openalex.org/W10042887","https://openalex.org/W1897440242","https://openalex.org/W2218233845","https://openalex.org/W2370550542","https://openalex.org/W2232108453","https://openalex.org/W2370124876","https://openalex.org/W2049188538","https://openalex.org/W2391359489","https://openalex.org/W2998706884","https://openalex.org/W2390100812"],"abstract_inverted_index":{"Ads":[0,79],"allocation,":[1],"which":[2,60,82],"involves":[3],"allocating":[4],"ads":[5],"and":[6,37,47,126,133,142,162],"organic":[7],"items":[8],"to":[9,67,93,104,129,138],"limited":[10],"slots":[11],"in":[12],"feed":[13],"with":[14],"the":[15,65,106,152,164,167],"purpose":[16],"of":[17,108],"maximizing":[18],"platform":[19,149],"revenue,":[20],"has":[21,57],"become":[22],"a":[23,119],"research":[24],"hotspot.":[25],"Notice":[26],"that,":[27],"platforms":[28,36],"(e.g.,":[29],"e-commerce":[30],"platforms,":[31,33],"video":[32],"food":[34,147],"delivery":[35,148],"so":[38],"on)":[39],"usually":[40],"have":[41,50],"multiple":[42],"entrances":[43,49,56],"for":[44,64,78,102,110,159,166],"different":[45,111],"categories":[46],"some":[48],"few":[51],"visits.":[52],"Data":[53],"from":[54,90,135],"these":[55],"low":[58],"coverage,":[59],"makes":[61],"it":[62],"difficult":[63],"agent":[66],"learn.":[68],"To":[69],"address":[70],"this":[71,115],"challenge,":[72],"we":[73,97,117],"propose":[74],"Similarity-based":[75],"Hybrid":[76],"Transfer":[77],"Allocation":[80],"(SHTAA),":[81],"effectively":[83],"transfers":[84],"samples":[85,132],"as":[86,88],"well":[87],"knowledge":[89,134],"data-rich":[91],"entrance":[92,137,161],"data-poor":[94,160],"entrance.":[95],"Specifically,":[96],"define":[98],"an":[99],"uncertainty-aware":[100],"similarity":[101,107],"MDP":[103,109],"estimate":[105],"entrances.":[112],"Based":[113],"on":[114,145],"similarity,":[116],"design":[118],"hybrid":[120],"transfer":[121,125,131],"method,":[122],"including":[123],"instance":[124],"strategy":[127],"transfer,":[128],"efficiently":[130],"one":[136],"another.":[139],"Both":[140],"offline":[141],"online":[143],"experiments":[144],"Meituan":[146],"demonstrate":[150],"that":[151],"proposed":[153],"method":[154],"could":[155],"achieve":[156],"better":[157],"performance":[158],"increase":[163],"revenue":[165],"platform.":[168]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
