{"id":"https://openalex.org/W3129616587","doi":"https://doi.org/10.1109/iros45743.2020.9340876","title":"MAPPER: Multi-Agent Path Planning with Evolutionary Reinforcement Learning in Mixed Dynamic Environments","display_name":"MAPPER: Multi-Agent Path Planning with Evolutionary Reinforcement Learning in Mixed Dynamic Environments","publication_year":2020,"publication_date":"2020-10-24","ids":{"openalex":"https://openalex.org/W3129616587","doi":"https://doi.org/10.1109/iros45743.2020.9340876","mag":"3129616587"},"language":"en","primary_location":{"id":"doi:10.1109/iros45743.2020.9340876","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros45743.2020.9340876","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5037613999","display_name":"Zuxin Liu","orcid":"https://orcid.org/0000-0001-7412-5074"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Zuxin Liu","raw_affiliation_strings":["Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050306497","display_name":"Baiming Chen","orcid":"https://orcid.org/0000-0002-3782-0251"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Baiming Chen","raw_affiliation_strings":["School of Vehicle and Mobility, Tsinghua University, China"],"affiliations":[{"raw_affiliation_string":"School of Vehicle and Mobility, Tsinghua University, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022257357","display_name":"Hongyi Zhou","orcid":"https://orcid.org/0000-0001-5074-5180"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hongyi Zhou","raw_affiliation_strings":["Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053373568","display_name":"Guru Koushik","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Guru Koushik","raw_affiliation_strings":["Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075246991","display_name":"Martial Hebert","orcid":"https://orcid.org/0000-0003-4566-5930"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Martial Hebert","raw_affiliation_strings":["The Robotics Institute, Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"The Robotics Institute, Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037644321","display_name":"Ding Zhao","orcid":"https://orcid.org/0000-0002-9400-8446"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ding Zhao","raw_affiliation_strings":["Carnegie Mellon University, USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University, USA","institution_ids":["https://openalex.org/I74973139"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5037613999"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":4.0238,"has_fulltext":false,"cited_by_count":111,"citation_normalized_percentile":{"value":0.951357,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"11748","last_page":"11754"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9986000061035156,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10191","display_name":"Robotics and Sensor-Based Localization","score":0.9944000244140625,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8897324800491333},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7252197265625},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.6572843194007874},{"id":"https://openalex.org/keywords/planner","display_name":"Planner","score":0.6435565948486328},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.46758389472961426},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.42264658212661743},{"id":"https://openalex.org/keywords/time-horizon","display_name":"Time horizon","score":0.41698652505874634},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.40593230724334717},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.1945227086544037}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8897324800491333},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7252197265625},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.6572843194007874},{"id":"https://openalex.org/C2776999362","wikidata":"https://www.wikidata.org/wiki/Q2349274","display_name":"Planner","level":2,"score":0.6435565948486328},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46758389472961426},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.42264658212661743},{"id":"https://openalex.org/C28761237","wikidata":"https://www.wikidata.org/wiki/Q7805321","display_name":"Time horizon","level":2,"score":0.41698652505874634},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.40593230724334717},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.1945227086544037},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/iros45743.2020.9340876","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iros45743.2020.9340876","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2020 IEEE/RSJ International Conference on Intelligent Robots and Systems (IROS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.6499999761581421,"display_name":"Sustainable cities and communities","id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320306185","display_name":"Richard King Mellon Foundation","ror":"https://ror.org/03qevzg44"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":41,"referenced_works":["https://openalex.org/W192919555","https://openalex.org/W206679605","https://openalex.org/W1757796397","https://openalex.org/W1965760189","https://openalex.org/W1989407213","https://openalex.org/W2082585576","https://openalex.org/W2089527927","https://openalex.org/W2097639646","https://openalex.org/W2113256452","https://openalex.org/W2130422193","https://openalex.org/W2136207702","https://openalex.org/W2142943472","https://openalex.org/W2524241275","https://openalex.org/W2565402511","https://openalex.org/W2604216058","https://openalex.org/W2744921630","https://openalex.org/W2884634491","https://openalex.org/W2892258706","https://openalex.org/W2914296650","https://openalex.org/W2963407617","https://openalex.org/W2963428623","https://openalex.org/W2963809389","https://openalex.org/W2963821308","https://openalex.org/W2964043796","https://openalex.org/W2964319688","https://openalex.org/W2967177252","https://openalex.org/W2968430550","https://openalex.org/W2970720334","https://openalex.org/W3023169168","https://openalex.org/W3099533866","https://openalex.org/W3103635569","https://openalex.org/W4288331462","https://openalex.org/W4298857966","https://openalex.org/W4299802797","https://openalex.org/W6637967152","https://openalex.org/W6692846177","https://openalex.org/W6738796088","https://openalex.org/W6742667875","https://openalex.org/W6753596642","https://openalex.org/W6758754608","https://openalex.org/W6764173040"],"related_works":["https://openalex.org/W1904098742","https://openalex.org/W3158921809","https://openalex.org/W1980828932","https://openalex.org/W2161428574","https://openalex.org/W1972453571","https://openalex.org/W2077416514","https://openalex.org/W2618632915","https://openalex.org/W2150982344","https://openalex.org/W4292862729","https://openalex.org/W2170661558"],"abstract_inverted_index":{"Multi-agent":[0],"navigation":[1,67],"in":[2,44,84,111,127],"dynamic":[3,46,105,116,129,180],"environments":[4,130],"is":[5,161],"of":[6,16,76,97,103,178],"great":[7],"industrial":[8],"value":[9],"when":[10,172],"deploying":[11],"a":[12,24,77,125,175],"large":[13,85,153,176],"scale":[14],"fleet":[15],"robot":[17],"to":[18,37,152,163,174],"real-world":[19],"applications.":[20],"This":[21],"paper":[22],"proposes":[23],"decentralized":[25],"partially":[26],"observable":[27],"multi-agent":[28,90,136],"path":[29],"planning":[30,42,91],"with":[31,58,119,183],"evolutionary":[32,144],"reinforcement":[33],"learning":[34],"(MAPPER)":[35],"method":[36],"learn":[38],"an":[39,120,143],"effective":[40],"local":[41],"policy":[43,126],"mixed":[45,128],"environments.":[47,86,156],"Reinforcement":[48],"learning-based":[49,191],"methods":[50],"usually":[51],"suffer":[52],"performance":[53,83,171],"degradation":[54],"on":[55],"long-horizon":[56],"tasks":[57],"goal-conditioned":[59],"sparse":[60],"rewards,":[61],"so":[62],"we":[63,141],"decompose":[64],"the":[65,74,98,189],"long-range":[66],"task":[68],"into":[69],"many":[70],"easier":[71],"sub-tasks":[72],"under":[73],"guidance":[75],"global":[78],"planner,":[79],"which":[80,107],"increases":[81],"agents'":[82],"Moreover,":[87],"most":[88],"existing":[89],"approaches":[92],"assume":[93],"either":[94],"perfect":[95],"information":[96],"surrounding":[99],"environment":[100],"or":[101],"homogeneity":[102,132],"nearby":[104],"agents,":[106],"may":[108],"not":[109],"hold":[110],"practice.":[112],"Our":[113],"approach":[114,146],"models":[115],"obstacles'":[117],"behavior":[118],"image-based":[121],"representation":[122],"and":[123,139,154,168,188],"trains":[124],"without":[131],"assumption.":[133],"To":[134],"ensure":[135],"training":[137,145],"stability":[138],"performance,":[140],"propose":[142],"that":[147,159],"can":[148],"be":[149],"easily":[150],"scaled":[151],"complex":[155],"Experiments":[157],"show":[158],"MAPPER":[160],"able":[162],"achieve":[164],"higher":[165],"success":[166],"rates":[167],"more":[169],"stable":[170],"exposed":[173],"number":[177],"non-cooperative":[179],"obstacles":[181],"compared":[182],"traditional":[184],"reaction-based":[185],"planner":[186],"LRA*":[187],"state-of-the-art":[190],"method.":[192]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":39},{"year":2024,"cited_by_count":29},{"year":2023,"cited_by_count":18},{"year":2022,"cited_by_count":12},{"year":2021,"cited_by_count":10},{"year":2020,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
