{"id":"https://openalex.org/W4285102394","doi":"https://doi.org/10.1109/icra46639.2022.9812341","title":"Enhancing Deep Reinforcement Learning Approaches for Multi-Robot Navigation via Single-Robot Evolutionary Policy Search","display_name":"Enhancing Deep Reinforcement Learning Approaches for Multi-Robot Navigation via Single-Robot Evolutionary Policy Search","publication_year":2022,"publication_date":"2022-05-23","ids":{"openalex":"https://openalex.org/W4285102394","doi":"https://doi.org/10.1109/icra46639.2022.9812341"},"language":"en","primary_location":{"id":"doi:10.1109/icra46639.2022.9812341","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra46639.2022.9812341","pdf_url":null,"source":{"id":"https://openalex.org/S4363607759","display_name":"2022 International Conference on Robotics and Automation (ICRA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5058298540","display_name":"Enrico Marchesini","orcid":"https://orcid.org/0000-0003-1858-7279"},"institutions":[{"id":"https://openalex.org/I119439378","display_name":"University of Verona","ror":"https://ror.org/039bp8j42","country_code":"IT","type":"education","lineage":["https://openalex.org/I119439378"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Enrico Marchesini","raw_affiliation_strings":["University of Verona,Department of Computer Science,Verona,Italy,37135"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Verona,Department of Computer Science,Verona,Italy,37135","institution_ids":["https://openalex.org/I119439378"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045922629","display_name":"Alessandro Farinelli","orcid":"https://orcid.org/0000-0002-2592-5814"},"institutions":[{"id":"https://openalex.org/I119439378","display_name":"University of Verona","ror":"https://ror.org/039bp8j42","country_code":"IT","type":"education","lineage":["https://openalex.org/I119439378"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Alessandro Farinelli","raw_affiliation_strings":["University of Verona,Department of Computer Science,Verona,Italy,37135"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Verona,Department of Computer Science,Verona,Italy,37135","institution_ids":["https://openalex.org/I119439378"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":1.8687,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.87649086,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":98,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"5525","last_page":"5531"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998999834060669,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12288","display_name":"Optimization and Search Problems","score":0.9958999752998352,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8760736584663391},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6414348483085632},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6231921315193176},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.5523970723152161},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5512529015541077},{"id":"https://openalex.org/keywords/evolutionary-robotics","display_name":"Evolutionary robotics","score":0.5006086826324463},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.4386861026287079}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8760736584663391},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6414348483085632},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6231921315193176},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.5523970723152161},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5512529015541077},{"id":"https://openalex.org/C199505168","wikidata":"https://www.wikidata.org/wiki/Q3267529","display_name":"Evolutionary robotics","level":3,"score":0.5006086826324463},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.4386861026287079}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icra46639.2022.9812341","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icra46639.2022.9812341","pdf_url":null,"source":{"id":"https://openalex.org/S4363607759","display_name":"2022 International Conference on Robotics and Automation (ICRA)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"conference"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2022 International Conference on Robotics and Automation (ICRA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Partnerships for the goals","score":0.4099999964237213,"id":"https://metadata.un.org/sdg/17"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":46,"referenced_works":["https://openalex.org/W1518858799","https://openalex.org/W1542670833","https://openalex.org/W2215378786","https://openalex.org/W2602275733","https://openalex.org/W2617547828","https://openalex.org/W2626637010","https://openalex.org/W2747213132","https://openalex.org/W2761873684","https://openalex.org/W2769883686","https://openalex.org/W2894662639","https://openalex.org/W2949963774","https://openalex.org/W2951799221","https://openalex.org/W2951799422","https://openalex.org/W2962975462","https://openalex.org/W2963019567","https://openalex.org/W3002855444","https://openalex.org/W3037430760","https://openalex.org/W3088310808","https://openalex.org/W3089695338","https://openalex.org/W3091760204","https://openalex.org/W3116714419","https://openalex.org/W3120345700","https://openalex.org/W3120778962","https://openalex.org/W3128707967","https://openalex.org/W3185656037","https://openalex.org/W4283793632","https://openalex.org/W4287755265","https://openalex.org/W4288091739","https://openalex.org/W4295252942","https://openalex.org/W4295598622","https://openalex.org/W4299802797","https://openalex.org/W6685444567","https://openalex.org/W6735650757","https://openalex.org/W6738796088","https://openalex.org/W6739516088","https://openalex.org/W6743629521","https://openalex.org/W6749304979","https://openalex.org/W6755459763","https://openalex.org/W6755903938","https://openalex.org/W6762491519","https://openalex.org/W6767327128","https://openalex.org/W6779884726","https://openalex.org/W6784152626","https://openalex.org/W6787843961","https://openalex.org/W6788085919","https://openalex.org/W6798969013"],"related_works":["https://openalex.org/W2122871747","https://openalex.org/W3114279067","https://openalex.org/W2930863966","https://openalex.org/W2126211886","https://openalex.org/W3153786280","https://openalex.org/W3127551068","https://openalex.org/W4220829754","https://openalex.org/W2165180011","https://openalex.org/W3165944253","https://openalex.org/W4381586542"],"abstract_inverted_index":{"Recent":[0],"Multi-Agent":[1],"Deep":[2],"Reinforcement":[3],"Learning":[4],"approaches":[5],"factorize":[6],"a":[7,47,98],"global":[8],"action-value":[9],"to":[10,27,34,62,85,135,146,159],"address":[11],"non-stationarity":[12],"and":[13,37,138],"favor":[14],"cooperation.":[15],"These":[16],"methods,":[17],"however,":[18],"hinder":[19],"exploration":[20,36],"by":[21,45,109],"introducing":[22],"constraints":[23],"(e.g.,":[24],"additive":[25],"value-decomposition)":[26],"guarantee":[28],"the":[29,55,59,64,72,80,90,110,119,129,150,157,160,164],"factorization.":[30],"Our":[31],"goal":[32],"is":[33,103],"enhance":[35],"improve":[38,116],"sample":[39,139],"efficiency":[40],"of":[41,82,89,153,166],"multi-robot":[42,111,130,161],"mapless":[43],"navigation":[44,106,154],"incorporating":[46],"periodical":[48],"Evolutionary":[49,83],"Policy":[50],"Search":[51],"(EPS).":[52],"In":[53],"detail,":[54],"multi-agent":[56],"training":[57],"\u201cspecializes\u201d":[58],"robots'":[60],"policies":[61,112],"learn":[63],"collision":[65],"avoidance":[66],"skills":[67,155],"that":[68,104],"are":[69],"mandatory":[70],"for":[71],"task.":[73],"Concurrently,":[74],"in":[75,93,118,142],"this":[76],"work":[77],"we":[78],"propose":[79],"use":[81],"Algorithms":[84],"explore":[86],"different":[87],"regions":[88],"policy":[91,123],"space":[92],"an":[94],"environment":[95],"with":[96,144],"only":[97],"single":[99],"robot.":[100],"The":[101],"idea":[102],"core":[105],"skills,":[107],"originated":[108],"using":[113,132],"mutation":[114],"operators,":[115],"faster":[117],"single-robot":[120],"EPS.":[121],"Hence,":[122],"parameters":[124],"can":[125],"be":[126],"injected":[127],"into":[128],"setting":[131],"crossovers,":[133],"leading":[134],"improved":[136],"performance":[137,165],"efficiency.":[140],"Experiments":[141],"tasks":[143],"up":[145],"12":[147],"robots":[148],"confirm":[149],"beneficial":[151],"transfer":[152],"from":[156],"EPS":[158],"setting,":[162],"improving":[163],"prior":[167],"methods.":[168]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":5},{"year":2023,"cited_by_count":7}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
