{"id":"https://openalex.org/W4285102423","doi":"https://doi.org/10.1109/icra46639.2022.9812259","title":"Safe multi-agent motion planning via filtered reinforcement learning","display_name":"Safe multi-agent motion planning via filtered reinforcement learning","publication_year":2022,"publication_date":"2022-05-23","ids":{"openalex":"https://openalex.org/W4285102423","doi":"https://doi.org/10.1109/icra46639.2022.9812259"},"language":"en","primary_location":{"id":"doi:10.1109/icra46639.2022.9812259","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra46639.2022.9812259","pdf_url":null,"source":{"id":"https://openalex.org/S4363607759","display_name":"2022 International Conference on Robotics and Automation (ICRA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5050718717","display_name":"Abraham P. Vinod","orcid":"https://orcid.org/0000-0002-7955-9629"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Abraham P. Vinod","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories,Cambridge,MA,USA,02139"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories,Cambridge,MA,USA,02139","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032150510","display_name":"Sleiman Safaoui","orcid":"https://orcid.org/0000-0003-2408-4555"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Sleiman Safaoui","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories,Cambridge,MA,USA,02139"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories,Cambridge,MA,USA,02139","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074220429","display_name":"Ankush Chakrabarty","orcid":"https://orcid.org/0000-0001-9637-854X"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ankush Chakrabarty","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories,Cambridge,MA,USA,02139"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories,Cambridge,MA,USA,02139","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071606836","display_name":"Rien Quirynen","orcid":"https://orcid.org/0000-0003-4330-2896"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Rien Quirynen","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories,Cambridge,MA,USA,02139"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories,Cambridge,MA,USA,02139","institution_ids":["https://openalex.org/I4210159266"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106232991","display_name":"Yoshikawa Nobuyuki","orcid":"https://orcid.org/0009-0001-8488-9913"},"institutions":[{"id":"https://openalex.org/I4210133125","display_name":"Mitsubishi Electric (Japan)","ror":"https://ror.org/033y26782","country_code":"JP","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125"]}],"countries":["JP"],"is_corresponding":false,"raw_author_name":"Nobuyuki Yoshikawa","raw_affiliation_strings":["Mitsubishi Electric Corporation,Japan","Mitsubishi Electric Corporation, Japan"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Corporation,Japan","institution_ids":["https://openalex.org/I4210133125"]},{"raw_affiliation_string":"Mitsubishi Electric Corporation, Japan","institution_ids":["https://openalex.org/I4210133125"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5004144091","display_name":"Stefano Di Cairano","orcid":"https://orcid.org/0000-0002-2363-2807"},"institutions":[{"id":"https://openalex.org/I4210159266","display_name":"Mitsubishi Electric (United States)","ror":"https://ror.org/053jnhe44","country_code":"US","type":"company","lineage":["https://openalex.org/I1306287861","https://openalex.org/I4210133125","https://openalex.org/I4210159266"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Stefano Di Cairano","raw_affiliation_strings":["Mitsubishi Electric Research Laboratories,Cambridge,MA,USA,02139"],"affiliations":[{"raw_affiliation_string":"Mitsubishi Electric Research Laboratories,Cambridge,MA,USA,02139","institution_ids":["https://openalex.org/I4210159266"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5050718717"],"corresponding_institution_ids":["https://openalex.org/I4210159266"],"apc_list":null,"apc_paid":null,"fwci":1.5591,"has_fulltext":false,"cited_by_count":16,"citation_normalized_percentile":{"value":0.84943978,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"7270","last_page":"7276"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9819999933242798,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9772999882698059,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.9222546219825745},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.7350865602493286},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.705008327960968},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.6318975687026978},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.5650591850280762},{"id":"https://openalex.org/keywords/planner","display_name":"Planner","score":0.5418298244476318},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.4670732319355011},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.4458956718444824},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.430203914642334},{"id":"https://openalex.org/keywords/trajectory","display_name":"Trajectory","score":0.42738670110702515},{"id":"https://openalex.org/keywords/collision","display_name":"Collision","score":0.36075514554977417},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.10655131936073303},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.09554210305213928}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.9222546219825745},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.7350865602493286},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.705008327960968},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.6318975687026978},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.5650591850280762},{"id":"https://openalex.org/C2776999362","wikidata":"https://www.wikidata.org/wiki/Q2349274","display_name":"Planner","level":2,"score":0.5418298244476318},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.4670732319355011},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4458956718444824},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.430203914642334},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.42738670110702515},{"id":"https://openalex.org/C121704057","wikidata":"https://www.wikidata.org/wiki/Q352070","display_name":"Collision","level":2,"score":0.36075514554977417},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.10655131936073303},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.09554210305213928},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.0},{"id":"https://openalex.org/C1276947","wikidata":"https://www.wikidata.org/wiki/Q333","display_name":"Astronomy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra46639.2022.9812259","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra46639.2022.9812259","pdf_url":null,"source":{"id":"https://openalex.org/S4363607759","display_name":"2022 International Conference on Robotics and Automation (ICRA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.5,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1968159474","https://openalex.org/W1990311592","https://openalex.org/W2024298935","https://openalex.org/W2062731992","https://openalex.org/W2095233962","https://openalex.org/W2107292630","https://openalex.org/W2201474395","https://openalex.org/W2573311857","https://openalex.org/W2736601468","https://openalex.org/W2769646558","https://openalex.org/W2886854944","https://openalex.org/W2946469828","https://openalex.org/W2976344064","https://openalex.org/W2991046523","https://openalex.org/W3008967682","https://openalex.org/W3101798601","https://openalex.org/W3119686839","https://openalex.org/W3120459386","https://openalex.org/W3123490258","https://openalex.org/W3126305458","https://openalex.org/W4205898582","https://openalex.org/W4250589301","https://openalex.org/W4250913065","https://openalex.org/W4297825594","https://openalex.org/W4299802797","https://openalex.org/W6644363009","https://openalex.org/W6696497002","https://openalex.org/W6738796088","https://openalex.org/W6741002519","https://openalex.org/W6765473059"],"related_works":["https://openalex.org/W804484174","https://openalex.org/W1568779110","https://openalex.org/W4244698559","https://openalex.org/W4246538999","https://openalex.org/W2002361198","https://openalex.org/W1819938260","https://openalex.org/W2340892746","https://openalex.org/W3005999311","https://openalex.org/W3042530408","https://openalex.org/W4381746183"],"abstract_inverted_index":{"We":[0,23],"study":[1],"the":[2,46,50,82,95,103,106],"problem":[3],"of":[4,49,105],"safe":[5,26],"multi-agent":[6,13,59],"motion":[7,16,60],"planning":[8],"in":[9,94],"cluttered":[10],"environments.":[11],"Existing":[12],"reinforcement":[14,27,33],"learning-based":[15],"planners":[17],"only":[18],"provide":[19],"approximate":[20],"safety":[21,48,69],"enforcement.":[22],"propose":[24],"a":[25,39,55],"learning":[28,34],"algorithm":[29],"that":[30,44,62],"leverages":[31],"single-agent":[32],"for":[35],"target":[36],"regulation":[37],"and":[38,67,78,84,90,99],"subsequent":[40],"convex":[41],"optimization-based":[42],"filtering":[43],"ensures":[45],"collective":[47],"system.":[51],"Our":[52,73],"approach":[53,74],"yields":[54],"safe,":[56],"real-time":[57],"implementable":[58],"planner":[61],"is":[63],"simpler":[64],"to":[65],"train":[66],"enforces":[68],"as":[70],"hard":[71],"constraints.":[72],"can":[75],"handle":[76],"state":[77],"control":[79],"constraints":[80],"on":[81],"agents,":[83],"enforce":[85],"collision":[86],"avoidance":[87],"among":[88],"themselves":[89],"with":[91],"static":[92],"obstacles":[93],"environment.":[96],"Numerical":[97],"simulations":[98],"hardware":[100],"experiments":[101],"show":[102],"efficacy":[104],"approach.":[107]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":4},{"year":2024,"cited_by_count":7},{"year":2023,"cited_by_count":4}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
