{"id":"https://openalex.org/W7110871246","doi":"https://doi.org/10.1109/tase.2025.3641970","title":"Shapley Meets DCOP: A Unified Structural Credit Assignment for Multiagent Planning and Multiagent Reinforcement Learning","display_name":"Shapley Meets DCOP: A Unified Structural Credit Assignment for Multiagent Planning and Multiagent Reinforcement Learning","publication_year":2025,"publication_date":"2025-12-09","ids":{"openalex":"https://openalex.org/W7110871246","doi":"https://doi.org/10.1109/tase.2025.3641970"},"language":null,"primary_location":{"id":"doi:10.1109/tase.2025.3641970","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3641970","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Wanyuan Wang","orcid":"https://orcid.org/0000-0002-9080-4971"},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wanyuan Wang","raw_affiliation_strings":["School of Computer Science and Engineering, Southeast University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Qian Che","orcid":"https://orcid.org/0000-0001-6089-7970"},"institutions":[{"id":"https://openalex.org/I4210157581","display_name":"Jiangsu Police Officer College","ror":"https://ror.org/04k1m2t10","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210157581"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qian Che","raw_affiliation_strings":["Jiangsu Police College, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Jiangsu Police College, Nanjing, China","institution_ids":["https://openalex.org/I4210157581"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Chunyu Liu","orcid":null},"institutions":[{"id":"https://openalex.org/I76569877","display_name":"Southeast University","ror":"https://ror.org/04ct4d772","country_code":"CN","type":"education","lineage":["https://openalex.org/I76569877"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunyu Liu","raw_affiliation_strings":["School of Computer Science and Engineering, Southeast University, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Southeast University, Nanjing, China","institution_ids":["https://openalex.org/I76569877"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Youzhi Zhang","orcid":"https://orcid.org/0000-0002-2984-734X"},"institutions":[{"id":"https://openalex.org/I4210121405","display_name":"Centre for Artificial Intelligence and Robotics","ror":"https://ror.org/01xnbq218","country_code":"IN","type":"facility","lineage":["https://openalex.org/I1340206300","https://openalex.org/I4210121405","https://openalex.org/I4210150591"]}],"countries":["IN"],"is_corresponding":false,"raw_author_name":"Youzhi Zhang","raw_affiliation_strings":["Centre for Artificial Intelligence and Robotics (CAIR), Hong Kong Institute of Science and Innovation, New Territories, Hong Kong"],"affiliations":[{"raw_affiliation_string":"Centre for Artificial Intelligence and Robotics (CAIR), Hong Kong Institute of Science and Innovation, New Territories, Hong Kong","institution_ids":["https://openalex.org/I4210121405"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jiuchuan Jiang","orcid":"https://orcid.org/0000-0002-8249-1725"},"institutions":[{"id":"https://openalex.org/I137056471","display_name":"Nanjing University of Finance and Economics","ror":"https://ror.org/031y8am81","country_code":"CN","type":"education","lineage":["https://openalex.org/I137056471"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiuchuan Jiang","raw_affiliation_strings":["Nanjing University of Finance and Economics, Nanjing, China"],"affiliations":[{"raw_affiliation_string":"Nanjing University of Finance and Economics, Nanjing, China","institution_ids":["https://openalex.org/I137056471"]}]},{"author_position":"last","author":{"id":null,"display_name":"Bo An","orcid":"https://orcid.org/0000-0002-7064-7438"},"institutions":[{"id":"https://openalex.org/I172675005","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302","country_code":"SG","type":"education","lineage":["https://openalex.org/I172675005"]}],"countries":["SG"],"is_corresponding":false,"raw_author_name":"Bo An","raw_affiliation_strings":["Nanyang Technological University, Jurong West, Singapore"],"affiliations":[{"raw_affiliation_string":"Nanyang Technological University, Jurong West, Singapore","institution_ids":["https://openalex.org/I172675005"]}]}],"institutions":[],"countries_distinct_count":3,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I76569877"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.62150649,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"23","issue":null,"first_page":"3967","last_page":"3983"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.678600013256073,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.678600013256073,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.07199999690055847,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10848","display_name":"Advanced Multi-Objective Optimization Algorithms","score":0.04800000041723251,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6647999882698059},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.48919999599456787},{"id":"https://openalex.org/keywords/monte-carlo-tree-search","display_name":"Monte Carlo tree search","score":0.48030000925064087},{"id":"https://openalex.org/keywords/shapley-value","display_name":"Shapley value","score":0.45890000462532043},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.44200000166893005},{"id":"https://openalex.org/keywords/quality","display_name":"Quality (philosophy)","score":0.41179999709129333},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.39160001277923584}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7450000047683716},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6647999882698059},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.48919999599456787},{"id":"https://openalex.org/C46149586","wikidata":"https://www.wikidata.org/wiki/Q11785332","display_name":"Monte Carlo tree search","level":3,"score":0.48030000925064087},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.47450000047683716},{"id":"https://openalex.org/C199022921","wikidata":"https://www.wikidata.org/wiki/Q240046","display_name":"Shapley value","level":3,"score":0.45890000462532043},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.44200000166893005},{"id":"https://openalex.org/C2779530757","wikidata":"https://www.wikidata.org/wiki/Q1207505","display_name":"Quality (philosophy)","level":2,"score":0.41179999709129333},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.39160001277923584},{"id":"https://openalex.org/C113174947","wikidata":"https://www.wikidata.org/wiki/Q2859736","display_name":"Tree (set theory)","level":2,"score":0.34540000557899475},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3422999978065491},{"id":"https://openalex.org/C2776291640","wikidata":"https://www.wikidata.org/wiki/Q2912517","display_name":"Value (mathematics)","level":2,"score":0.3377000093460083},{"id":"https://openalex.org/C72169020","wikidata":"https://www.wikidata.org/wiki/Q194404","display_name":"Monotonic function","level":2,"score":0.335099995136261},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.31450000405311584},{"id":"https://openalex.org/C164752517","wikidata":"https://www.wikidata.org/wiki/Q5570875","display_name":"Global optimization","level":2,"score":0.3043999969959259},{"id":"https://openalex.org/C50644808","wikidata":"https://www.wikidata.org/wiki/Q192776","display_name":"Artificial neural network","level":2,"score":0.29600000381469727},{"id":"https://openalex.org/C5894958","wikidata":"https://www.wikidata.org/wiki/Q2297769","display_name":"Software agent","level":2,"score":0.2651999890804291},{"id":"https://openalex.org/C18555067","wikidata":"https://www.wikidata.org/wiki/Q8375051","display_name":"Joint (building)","level":2,"score":0.2563000023365021}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tase.2025.3641970","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tase.2025.3641970","pdf_url":null,"source":{"id":"https://openalex.org/S34881539","display_name":"IEEE Transactions on Automation Science and Engineering","issn_l":"1545-5955","issn":["1545-5955","1558-3783"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Automation Science and Engineering","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W329015778","https://openalex.org/W1625390266","https://openalex.org/W1969302761","https://openalex.org/W1977031068","https://openalex.org/W2007894170","https://openalex.org/W2088956500","https://openalex.org/W2110116921","https://openalex.org/W2126316555","https://openalex.org/W2128862550","https://openalex.org/W2166533447","https://openalex.org/W2170400507","https://openalex.org/W2287429606","https://openalex.org/W2404646363","https://openalex.org/W2436401953","https://openalex.org/W2617547828","https://openalex.org/W2791580684","https://openalex.org/W2807741983","https://openalex.org/W2944424375","https://openalex.org/W2945991855","https://openalex.org/W2946478166","https://openalex.org/W2964749398","https://openalex.org/W2965647577","https://openalex.org/W2972122474","https://openalex.org/W2983178256","https://openalex.org/W2998299793","https://openalex.org/W3011232183","https://openalex.org/W3082358791","https://openalex.org/W3127463339","https://openalex.org/W3136998346","https://openalex.org/W3167061096","https://openalex.org/W3173782550","https://openalex.org/W3177401124","https://openalex.org/W3205875899","https://openalex.org/W4283021706","https://openalex.org/W4285007555","https://openalex.org/W4382202835","https://openalex.org/W4382239488","https://openalex.org/W4390968395","https://openalex.org/W4391640441","https://openalex.org/W4392007398","https://openalex.org/W4393032631","https://openalex.org/W4394564139","https://openalex.org/W4396891890","https://openalex.org/W4401607723","https://openalex.org/W4411336711","https://openalex.org/W7124169210","https://openalex.org/W7124239827","https://openalex.org/W7124263057","https://openalex.org/W7124317877"],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,29,45,75,100,117,122,127,158,164,168,174,190,209],"construction":[2],"of":[3,9,31,78,126,167,225],"intelligent":[4],"agents,":[5],"coordinating":[6],"a":[7,84,112,135,147],"collection":[8],"agents":[10],"to":[11,34,38,67,82,94],"optimize":[12,189],"long-term":[13],"cumulative":[14],"global":[15,27,35,169,192],"reward":[16,108],"is":[17,42,81,178],"becoming":[18],"increasingly":[19],"important.":[20],"To":[21],"align":[22],"individual":[23,32],"agent":[24,183],"actions":[25,33],"with":[26],"rewards,":[28],"contribution":[30,77],"rewards":[36,187],"needs":[37],"be":[39,92],"determined,":[40],"which":[41,59],"known":[43],"as":[44],"structural":[46],"credit":[47],"assignment":[48],"(SCA).":[49],"Conventional":[50],"SCA":[51,88],"mechanisms":[52],"are":[53],"primarily":[54],"based":[55,130],"on":[56,131],"neural":[57],"networks,":[58],"lack":[60],"theoretical":[61],"foundations":[62],"and":[63,97,106,124,146,172,213,220,228],"preclude":[64],"their":[65],"application":[66],"model-based":[68,143],"MAP":[69,96,144],"tasks.":[70,153],"Leveraging":[71],"cooperative":[72],"game":[73],"theory,":[74],"main":[76],"this":[79],"study":[80],"propose":[83,111],"novel":[85,113],"Shapley":[86,118],"value-based":[87],"(SV-SCA)":[89],"that":[90,157,173,181,208],"can":[91,162],"generalized":[93],"both":[95],"MARL.":[98],"Combining":[99],"distributed":[101],"constraint":[102],"optimization":[103],"(DCOP)":[104],"model":[105],"its":[107,185],"structure,":[109],"we":[110,133,195],"algorithm":[114],"for":[115,142,150],"computing":[116],"value":[119,166],"while":[120],"ensuring":[121],"efficiency":[123],"fairness":[125],"SV-SCA.":[128],"Particularly,":[129],"SV-SCA,":[132],"design":[134],"coordinated":[136,160,176,211,214],"Monte":[137],"Carlo":[138],"tree":[139],"search":[140],"(MCTS)":[141],"tasks":[145],"fully-decentralized":[148],"method":[149],"model-free":[151],"MARL":[152,177,215,221],"Theoretical":[154],"analyses":[155],"show":[156],"proposed":[159,175,210],"MCTS":[161,212,219],"guarantee":[163],"expected":[165],"joint":[170],"action,":[171],"monotonic":[179],"such":[180],"each":[182],"optimizes":[184],"own":[186],"also":[188],"system\u2019s":[191],"reward.":[193],"Finally,":[194],"conduct":[196],"extensive":[197],"experiments":[198],"in":[199,223],"typical":[200],"sequential":[201],"multiagent":[202,218],"coordination":[203],"domains.":[204],"Our":[205],"results":[206],"demonstrate":[207],"outperform":[216],"existing":[217],"baselines":[222],"terms":[224],"solution":[226],"quality":[227],"scalability.":[229]},"counts_by_year":[],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-12-10T00:00:00"}
