{"id":"https://openalex.org/W4392904010","doi":"https://doi.org/10.1109/icassp48485.2024.10447913","title":"MaDE: Multi-Scale Decision Enhancement for Multi-Agent Reinforcement Learning","display_name":"MaDE: Multi-Scale Decision Enhancement for Multi-Agent Reinforcement Learning","publication_year":2024,"publication_date":"2024-03-18","ids":{"openalex":"https://openalex.org/W4392904010","doi":"https://doi.org/10.1109/icassp48485.2024.10447913"},"language":"en","primary_location":{"id":"doi:10.1109/icassp48485.2024.10447913","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icassp48485.2024.10447913","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5076546255","display_name":"Jingqing Ruan","orcid":"https://orcid.org/0000-0002-4857-9053"},"institutions":[{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]},{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jingqing Ruan","raw_affiliation_strings":["Chinese Academy of Sciences,Institute of Automation","School of Future Technology, University of Chinese Academy of Sciences","Institute of Automation, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Institute of Automation","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Future Technology, University of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5009498788","display_name":"Runpeng Xie","orcid":null},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Runpeng Xie","raw_affiliation_strings":["Chinese Academy of Sciences,Institute of Automation","Institute of Automation, Chinese Academy of Sciences","School of Artificial Intelligence, University of Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Institute of Automation","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012772278","display_name":"Xuantang Xiong","orcid":"https://orcid.org/0000-0001-8824-1324"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuantang Xiong","raw_affiliation_strings":["Chinese Academy of Sciences,Institute of Automation","School of Artificial Intelligence, University of Chinese Academy of Sciences","Institute of Automation, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Institute of Automation","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004363895","display_name":"Shuang Xu","orcid":"https://orcid.org/0000-0003-3576-6914"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuang Xu","raw_affiliation_strings":["Chinese Academy of Sciences,Institute of Automation","Institute of Automation, Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Institute of Automation","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5108642431","display_name":"Bo Xu","orcid":"https://orcid.org/0000-0002-1111-1529"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"funder","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Xu","raw_affiliation_strings":["Chinese Academy of Sciences,Institute of Automation","School of Artificial Intelligence, University of Chinese Academy of Sciences","Institute of Automation, Chinese Academy of Sciences","School of Future Technology, University of Chinese Academy of Sciences"],"affiliations":[{"raw_affiliation_string":"Chinese Academy of Sciences,Institute of Automation","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Artificial Intelligence, University of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]},{"raw_affiliation_string":"Institute of Automation, Chinese Academy of Sciences","institution_ids":["https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Future Technology, University of Chinese Academy of Sciences","institution_ids":["https://openalex.org/I4210165038"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5076546255"],"corresponding_institution_ids":["https://openalex.org/I19820366","https://openalex.org/I4210165038"],"apc_list":null,"apc_paid":null,"fwci":0.3407,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.61344454,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9973000288009644,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.9830999970436096,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7734050750732422},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7439643144607544},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4971955120563507},{"id":"https://openalex.org/keywords/flexibility","display_name":"Flexibility (engineering)","score":0.4762037992477417},{"id":"https://openalex.org/keywords/bottleneck","display_name":"Bottleneck","score":0.47607558965682983},{"id":"https://openalex.org/keywords/situation-awareness","display_name":"Situation awareness","score":0.4525446593761444},{"id":"https://openalex.org/keywords/automatic-summarization","display_name":"Automatic summarization","score":0.4524690806865692},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4412495195865631},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.4239214360713959},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.4143518805503845},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.40359944105148315},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.35734695196151733},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.14336469769477844}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7734050750732422},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7439643144607544},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4971955120563507},{"id":"https://openalex.org/C2780598303","wikidata":"https://www.wikidata.org/wiki/Q65921492","display_name":"Flexibility (engineering)","level":2,"score":0.4762037992477417},{"id":"https://openalex.org/C2780513914","wikidata":"https://www.wikidata.org/wiki/Q18210350","display_name":"Bottleneck","level":2,"score":0.47607558965682983},{"id":"https://openalex.org/C145804949","wikidata":"https://www.wikidata.org/wiki/Q478123","display_name":"Situation awareness","level":2,"score":0.4525446593761444},{"id":"https://openalex.org/C170858558","wikidata":"https://www.wikidata.org/wiki/Q1394144","display_name":"Automatic summarization","level":2,"score":0.4524690806865692},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4412495195865631},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.4239214360713959},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.4143518805503845},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.40359944105148315},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.35734695196151733},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.14336469769477844},{"id":"https://openalex.org/C111919701","wikidata":"https://www.wikidata.org/wiki/Q9135","display_name":"Operating system","level":1,"score":0.0},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.0},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icassp48485.2024.10447913","is_oa":false,"landing_page_url":"http://dx.doi.org/10.1109/icassp48485.2024.10447913","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"ICASSP 2024 - 2024 IEEE International Conference on Acoustics, Speech and Signal Processing (ICASSP)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.6299999952316284,"id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G8294312625","display_name":null,"funder_award_id":"XDA27030300","funder_id":"https://openalex.org/F4320321133","funder_display_name":"Chinese Academy of Sciences"}],"funders":[{"id":"https://openalex.org/F4320321133","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":54,"referenced_works":["https://openalex.org/W6043852","https://openalex.org/W41554520","https://openalex.org/W1597623052","https://openalex.org/W1967890032","https://openalex.org/W1976195538","https://openalex.org/W1995688924","https://openalex.org/W2012812921","https://openalex.org/W2049975267","https://openalex.org/W2088252378","https://openalex.org/W2138779671","https://openalex.org/W2143842650","https://openalex.org/W2397240726","https://openalex.org/W2405468764","https://openalex.org/W2626637010","https://openalex.org/W2736601468","https://openalex.org/W2963762747","https://openalex.org/W3034971464","https://openalex.org/W3089778445","https://openalex.org/W3125947392","https://openalex.org/W3208334305","https://openalex.org/W3211445425","https://openalex.org/W4221149741","https://openalex.org/W4224932507","https://openalex.org/W4225134865","https://openalex.org/W4229001981","https://openalex.org/W4281686999","https://openalex.org/W4285042965","https://openalex.org/W4285605187","https://openalex.org/W4286748781","https://openalex.org/W4293518929","https://openalex.org/W4387171239","https://openalex.org/W4387185165","https://openalex.org/W4388891134","https://openalex.org/W4389072228","https://openalex.org/W6600255050","https://openalex.org/W6635868183","https://openalex.org/W6712173889","https://openalex.org/W6713484144","https://openalex.org/W6739516088","https://openalex.org/W6741002519","https://openalex.org/W6766805167","https://openalex.org/W6775529125","https://openalex.org/W6779827379","https://openalex.org/W6783196708","https://openalex.org/W6802965437","https://openalex.org/W6804171592","https://openalex.org/W6810298798","https://openalex.org/W6810313676","https://openalex.org/W6810677780","https://openalex.org/W6838635778","https://openalex.org/W6839595714","https://openalex.org/W6840380725","https://openalex.org/W6858611676","https://openalex.org/W6858677385"],"related_works":["https://openalex.org/W2366403280","https://openalex.org/W1495108544","https://openalex.org/W2091301346","https://openalex.org/W3148229873","https://openalex.org/W4389760904","https://openalex.org/W2150160875","https://openalex.org/W4242223894","https://openalex.org/W4306886878","https://openalex.org/W2973759123","https://openalex.org/W1517524280"],"abstract_inverted_index":{"In":[0],"the":[1,8,81,98,112,119,137,141],"domain":[2],"of":[3,36,144],"multi-agent":[4,133],"reinforcement":[5],"learning":[6],"(MARL),":[7],"limited":[9],"information":[10],"availability,":[11],"complex":[12],"agent":[13,60],"interactions,":[14],"and":[15,77,153],"individual":[16,115],"capabilities":[17],"among":[18],"agents":[19,116,147],"often":[20],"pose":[21],"a":[22,44,54,84,89],"bottleneck":[23],"for":[24,58],"effective":[25],"decision-making.":[26],"Previous":[27],"studies":[28],"frequently":[29],"fall":[30],"short":[31],"due":[32],"to":[33,66,93,107,139,148],"insufficient":[34],"consideration":[35],"these":[37],"multi-dimensional":[38],"challenges.":[39],"Thus,":[40],"this":[41],"paper":[42],"introduces":[43],"novel":[45],"methodology,":[46],"termed":[47],"Multi-scale":[48],"Decision":[49],"Enhancement":[50],"(MaDE),":[51],"anchored":[52],"by":[53],"dual-wise":[55],"bisimulation":[56],"framework":[57,64],"pre-training":[59],"encoders.":[61],"The":[62],"MaDE":[63,127],"aims":[65],"facilitate":[67],"decision-making":[68,121],"across":[69],"three":[70],"pivotal":[71],"dimensions:":[72],"macroscale":[73],"awareness,":[74],"mesoscale":[75],"coordination,":[76],"microscale":[78],"insight.":[79],"At":[80,97,111],"macro":[82],"level,":[83,100,114],"pretrained":[85],"global":[86],"encoder":[87],"captures":[88],"situational":[90],"awareness":[91],"map":[92],"guide":[94],"overall":[95],"strategies.":[96],"meso":[99],"specialized":[101],"local":[102],"encoders":[103],"generate":[104],"cluster-based":[105],"representations":[106],"promote":[108],"inter-agent":[109],"cooperation.":[110],"micro":[113],"focus":[117],"on":[118],"accurate":[120],"process.":[122],"Empirical":[123],"evaluations":[124],"validate":[125],"that":[126],"outperforms":[128],"state-of-the-art":[129],"methods":[130],"in":[131],"various":[132],"environments,":[134],"which":[135],"shows":[136],"potential":[138],"tackle":[140],"intricate":[142],"challenges":[143],"MARL,":[145],"enabling":[146],"make":[149],"more":[150],"informed,":[151],"coordinated,":[152],"adaptive":[154],"decisions.":[155],"Code":[156],"is":[157],"available":[158],"at":[159],"https://github.com/paper2023/MaDE.":[160]},"counts_by_year":[{"year":2024,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
