{"id":"https://openalex.org/W4405838341","doi":"https://doi.org/10.1109/tkde.2024.3523472","title":"Hierarchical Multi-Agent Meta-Reinforcement Learning for Cross-Channel Bidding","display_name":"Hierarchical Multi-Agent Meta-Reinforcement Learning for Cross-Channel Bidding","publication_year":2024,"publication_date":"2024-12-27","ids":{"openalex":"https://openalex.org/W4405838341","doi":"https://doi.org/10.1109/tkde.2024.3523472"},"language":"en","primary_location":{"id":"doi:10.1109/tkde.2024.3523472","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tkde.2024.3523472","pdf_url":null,"source":{"id":"https://openalex.org/S30698027","display_name":"IEEE Transactions on Knowledge and Data Engineering","issn_l":"1041-4347","issn":["1041-4347","1558-2191","2326-3865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Knowledge and Data Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102751081","display_name":"Shenghong He","orcid":null},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shenghong He","raw_affiliation_strings":["School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074681163","display_name":"Chao Yu","orcid":"https://orcid.org/0000-0002-4371-3663"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chao Yu","raw_affiliation_strings":["School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100659445","display_name":"Qian Lin","orcid":"https://orcid.org/0009-0000-7034-7331"},"institutions":[{"id":"https://openalex.org/I157773358","display_name":"Sun Yat-sen University","ror":"https://ror.org/0064kty71","country_code":"CN","type":"education","lineage":["https://openalex.org/I157773358"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qian Lin","raw_affiliation_strings":["School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Sun Yat-sen University, Guangzhou, China","institution_ids":["https://openalex.org/I157773358"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044454826","display_name":"Shangqin Mao","orcid":"https://orcid.org/0000-0002-3247-0483"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shangqin Mao","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Bo Tang","orcid":"https://orcid.org/0000-0001-7129-0250"},"institutions":[{"id":"https://openalex.org/I126520041","display_name":"University of Science and Technology of China","ror":"https://ror.org/04c4dkn09","country_code":"CN","type":"education","lineage":["https://openalex.org/I126520041","https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Tang","raw_affiliation_strings":["School of Artificial Intelligence and Data Science, University of Science and Technology of China, Hefei, China","School of Artificial Intelligence and Data Science, University of Science and Technology of China, Hefei 340101, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence and Data Science, University of Science and Technology of China, Hefei, China","institution_ids":["https://openalex.org/I126520041"]},{"raw_affiliation_string":"School of Artificial Intelligence and Data Science, University of Science and Technology of China, Hefei 340101, China","institution_ids":["https://openalex.org/I126520041"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5041270262","display_name":"Qianlong Xie","orcid":"https://orcid.org/0000-0001-8289-6039"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qianlong Xie","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100673283","display_name":"Xingxing Wang","orcid":"https://orcid.org/0000-0003-4437-5229"},"institutions":[{"id":"https://openalex.org/I4210087373","display_name":"Meizu (China)","ror":"https://ror.org/0067g4302","country_code":"CN","type":"company","lineage":["https://openalex.org/I4210087373"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingxing Wang","raw_affiliation_strings":["Meituan, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Meituan, Beijing, China","institution_ids":["https://openalex.org/I4210087373"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5102751081"],"corresponding_institution_ids":["https://openalex.org/I157773358"],"apc_list":null,"apc_paid":null,"fwci":0.3422,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.67842041,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"37","issue":"3","first_page":"1241","last_page":"1254"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12782","display_name":"Assembly Line Balancing Optimization","score":0.9294000267982483,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12782","display_name":"Assembly Line Balancing Optimization","score":0.9294000267982483,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10551","display_name":"Scheduling and Optimization Algorithms","score":0.9099000096321106,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8251897096633911},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7922142744064331},{"id":"https://openalex.org/keywords/bidding","display_name":"Bidding","score":0.7092108726501465},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.444386750459671},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.41419339179992676},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.382161945104599},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.21115556359291077},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.09081059694290161},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.08670386672019958}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8251897096633911},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7922142744064331},{"id":"https://openalex.org/C9233905","wikidata":"https://www.wikidata.org/wiki/Q3276328","display_name":"Bidding","level":2,"score":0.7092108726501465},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.444386750459671},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.41419339179992676},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.382161945104599},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.21115556359291077},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.09081059694290161},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.08670386672019958},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tkde.2024.3523472","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tkde.2024.3523472","pdf_url":null,"source":{"id":"https://openalex.org/S30698027","display_name":"IEEE Transactions on Knowledge and Data Engineering","issn_l":"1041-4347","issn":["1041-4347","1558-2191","2326-3865"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Knowledge and Data Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1901648776","display_name":null,"funder_award_id":"62076259","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":58,"referenced_works":["https://openalex.org/W1845972764","https://openalex.org/W2010440649","https://openalex.org/W2021375049","https://openalex.org/W2039842578","https://openalex.org/W2088640816","https://openalex.org/W2088956500","https://openalex.org/W2132083787","https://openalex.org/W2140246545","https://openalex.org/W2149822245","https://openalex.org/W2562337727","https://openalex.org/W2788125442","https://openalex.org/W2788376840","https://openalex.org/W2947557559","https://openalex.org/W2951002685","https://openalex.org/W2978455699","https://openalex.org/W2988150581","https://openalex.org/W3166393923","https://openalex.org/W3167256053","https://openalex.org/W3175318851","https://openalex.org/W3185083385","https://openalex.org/W3190794503","https://openalex.org/W4282813721","https://openalex.org/W4306632355","https://openalex.org/W4307724961","https://openalex.org/W4319828019","https://openalex.org/W4323022392","https://openalex.org/W4379382506","https://openalex.org/W4380302195","https://openalex.org/W4383199651","https://openalex.org/W4389723380","https://openalex.org/W4393147227","https://openalex.org/W4393160024","https://openalex.org/W6683161245","https://openalex.org/W6738796088","https://openalex.org/W6748317118","https://openalex.org/W6748576644","https://openalex.org/W6748839928","https://openalex.org/W6757469721","https://openalex.org/W6763704811","https://openalex.org/W6765775151","https://openalex.org/W6768602481","https://openalex.org/W6769269530","https://openalex.org/W6771270455","https://openalex.org/W6771428195","https://openalex.org/W6779265984","https://openalex.org/W6779823529","https://openalex.org/W6780159193","https://openalex.org/W6785193213","https://openalex.org/W6796589144","https://openalex.org/W6796880758","https://openalex.org/W6802659552","https://openalex.org/W6802704075","https://openalex.org/W6804100093","https://openalex.org/W6838356327","https://openalex.org/W6838838702","https://openalex.org/W6841549819","https://openalex.org/W6855271737","https://openalex.org/W6858243023"],"related_works":["https://openalex.org/W2355561715","https://openalex.org/W2355326491","https://openalex.org/W2389286292","https://openalex.org/W2360751371","https://openalex.org/W2387920521","https://openalex.org/W2389754756","https://openalex.org/W2382224273","https://openalex.org/W2373538886","https://openalex.org/W2360290312","https://openalex.org/W2369836678"],"abstract_inverted_index":{"Real-time":[0],"bidding":[1,14,37,61,83,174],"(RTB)":[2],"plays":[3],"a":[4,67,75,92,117,137,164,181],"pivotal":[5],"role":[6],"in":[7,129],"online":[8],"advertising":[9,18],"ecosystems.":[10],"Advertisers":[11],"employ":[12],"strategic":[13],"to":[15,22,56,97,105,122,143],"optimize":[16],"their":[17,106],"impact":[19],"while":[20,112],"adhering":[21],"various":[23],"financial":[24],"constraints,":[25,41],"such":[26],"as":[27],"the":[28,47,53,88,102,113,124,145,150,154,171],"return-on-investment":[29],"(ROI)":[30],"and":[31,109,136],"cost-per-click":[32],"(CPC).":[33],"Primarily":[34],"focusing":[35],"on":[36,153,163],"with":[38,66],"fixed":[39],"budget":[40,49],"traditional":[42],"approaches":[43],"cannot":[44],"effectively":[45],"manage":[46],"dynamic":[48],"allocation":[50],"problem":[51,125],"where":[52],"goal":[54],"is":[55],"achieve":[57],"global":[58],"optimization":[59],"of":[60,126,149],"performance":[62],"across":[63],"multiple":[64],"channels":[65,103],"shared":[68,155],"budget.":[69],"In":[70,85],"this":[71,86],"paper,":[72],"we":[73],"propose":[74],"hierarchical":[76],"multi-agent":[77],"reinforcement":[78],"learning":[79,131,141],"framework":[80],"for":[81],"multi-channel":[82],"optimization.":[84],"framework,":[87],"top-level":[89],"strategy":[90,115],"applies":[91],"CPC":[93],"constrained":[94],"diffusion":[95],"model":[96],"dynamically":[98],"allocate":[99],"budgets":[100],"among":[101,157],"according":[104],"distinct":[107],"features":[108],"complex":[110],"interdependencies,":[111],"bottom-level":[114],"adopts":[116],"state-action":[118],"decoupled":[119],"actor-critic":[120],"method":[121,142,179],"address":[123],"extrapolation":[127],"errors":[128],"offline":[130],"caused":[132],"by":[133],"out-of-distribution":[134],"actions":[135],"context-based":[138],"meta-channel":[139],"knowledge":[140,156],"improve":[144],"state":[146],"representation":[147],"capability":[148],"policy":[151],"based":[152],"different":[158],"channels.":[159],"Comprehensive":[160],"experiments":[161],"conducted":[162],"large":[165],"scale":[166],"real-world":[167],"industrial":[168],"dataset":[169],"from":[170],"Meituan":[172],"ad":[173],"platform":[175],"demonstrate":[176],"that":[177],"our":[178],"achieves":[180],"state-of-the-art":[182],"performance.":[183]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
