{"id":"https://openalex.org/W4401414481","doi":"https://doi.org/10.1109/icra57147.2024.10611573","title":"MAexp: A Generic Platform for RL-based Multi-Agent Exploration","display_name":"MAexp: A Generic Platform for RL-based Multi-Agent Exploration","publication_year":2024,"publication_date":"2024-05-13","ids":{"openalex":"https://openalex.org/W4401414481","doi":"https://doi.org/10.1109/icra57147.2024.10611573"},"language":"en","primary_location":{"id":"doi:10.1109/icra57147.2024.10611573","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra57147.2024.10611573","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109585715","display_name":"Shaohao Zhu","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaohao Zhu","raw_affiliation_strings":["Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5113325534","display_name":"Jiacheng Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiacheng Zhou","raw_affiliation_strings":["Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101770129","display_name":"Anjun Chen","orcid":"https://orcid.org/0000-0003-4209-8301"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Anjun Chen","raw_affiliation_strings":["Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043006828","display_name":"Mingming Bai","orcid":null},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mingming Bai","raw_affiliation_strings":["Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100726041","display_name":"Jiming Chen","orcid":"https://orcid.org/0000-0003-3155-3145"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiming Chen","raw_affiliation_strings":["Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027","institution_ids":["https://openalex.org/I76130692"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101511490","display_name":"Jinming Xu","orcid":"https://orcid.org/0009-0001-4316-9661"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinming Xu","raw_affiliation_strings":["Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Zhejiang University,College of Control Science and Engineering,Hangzhou,China,310027","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.0899,"has_fulltext":false,"cited_by_count":5,"citation_normalized_percentile":{"value":0.78365279,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"5155","last_page":"5161"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9983000159263611,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10906","display_name":"AI-based Problem Solving and Planning","score":0.9932000041007996,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6585974097251892}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6585974097251892}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra57147.2024.10611573","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra57147.2024.10611573","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2024 IEEE International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W1933691875","https://openalex.org/W2134877736","https://openalex.org/W2296693980","https://openalex.org/W2736601468","https://openalex.org/W2919289962","https://openalex.org/W2920854821","https://openalex.org/W2944778709","https://openalex.org/W2973525135","https://openalex.org/W2996134258","https://openalex.org/W3099689767","https://openalex.org/W3134938521","https://openalex.org/W3163926178","https://openalex.org/W3176265013","https://openalex.org/W3178888730","https://openalex.org/W3202938653","https://openalex.org/W3207022667","https://openalex.org/W4210356871","https://openalex.org/W4214484978","https://openalex.org/W4226300900","https://openalex.org/W4286748781","https://openalex.org/W4287112297","https://openalex.org/W4288594419","https://openalex.org/W4299802797","https://openalex.org/W4312863572","https://openalex.org/W4324119280","https://openalex.org/W4382050679","https://openalex.org/W4383108727","https://openalex.org/W4383109302","https://openalex.org/W4389473504","https://openalex.org/W6638018090","https://openalex.org/W6692846177","https://openalex.org/W6738796088","https://openalex.org/W6795908048","https://openalex.org/W6797065961","https://openalex.org/W6810220931","https://openalex.org/W6840380725"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052","https://openalex.org/W2382290278","https://openalex.org/W4395014643"],"abstract_inverted_index":{"The":[0],"sim-to-real":[1],"gap":[2],"poses":[3],"a":[4,51,59,85,104],"significant":[5],"challenge":[6],"in":[7,24,31,152],"RL-based":[8],"multi-agent":[9,55],"exploration":[10,56,77],"due":[11],"to":[12,74,80,126],"scene":[13],"quantization":[14],"and":[15,26,66,84,103,116],"action":[16],"discretization.":[17],"Existing":[18],"platforms":[19],"suffer":[20],"from":[21],"the":[22,27,128,146],"inefficiency":[23],"sampling":[25,86],"lack":[28],"of":[29,62,114,120,149],"diversity":[30],"Multi-Agent":[32,100],"Reinforcement":[33],"Learning":[34],"(MARL)":[35],"algorithms":[36,65,135],"across":[37,136],"different":[38,153],"scenarios,":[39,78],"restraining":[40],"their":[41],"widespread":[42],"applications.":[43],"To":[44],"fill":[45],"these":[46],"gaps,":[47],"we":[48,70],"propose":[49],"MAexp,":[50],"generic":[52],"platform":[53],"for":[54,139],"that":[57],"integrates":[58],"broad":[60],"range":[61],"state-of-the-art":[63],"MARL":[64,134],"representative":[67],"scenarios.":[68,154],"Moreover,":[69],"employ":[71],"point":[72],"clouds":[73],"represent":[75],"our":[76],"leading":[79],"high-fidelity":[81],"environment":[82],"mapping":[83],"speed":[87],"approximately":[88],"40":[89],"times":[90],"faster":[91],"than":[92],"existing":[93],"platforms.":[94],"Furthermore,":[95],"equipped":[96],"with":[97,111,141],"an":[98],"attention-based":[99],"Target":[101],"Generator":[102],"Single-Agent":[105],"Motion":[106],"Planner,":[107],"MAexp":[108],"can":[109],"work":[110],"arbitrary":[112],"numbers":[113],"agents":[115],"accommodate":[117],"various":[118],"types":[119],"robots.":[121],"Extensive":[122],"experiments":[123],"are":[124],"conducted":[125],"establish":[127],"first":[129],"benchmark":[130],"featuring":[131],"several":[132],"high-performance":[133],"typical":[137],"scenarios":[138],"robots":[140],"continuous":[142],"actions,":[143],"which":[144],"highlights":[145],"distinct":[147],"strengths":[148],"each":[150],"algorithm":[151]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4}],"updated_date":"2026-06-13T07:54:00.901334","created_date":"2025-10-10T00:00:00"}
