{"id":"https://openalex.org/W3134776497","doi":"https://doi.org/10.1109/tccn.2021.3063170","title":"Distributed Reinforcement Learning for Flexible and Efficient UAV Swarm Control","display_name":"Distributed Reinforcement Learning for Flexible and Efficient UAV Swarm Control","publication_year":2021,"publication_date":"2021-03-02","ids":{"openalex":"https://openalex.org/W3134776497","doi":"https://doi.org/10.1109/tccn.2021.3063170","mag":"3134776497"},"language":"en","primary_location":{"id":"doi:10.1109/tccn.2021.3063170","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tccn.2021.3063170","pdf_url":null,"source":{"id":"https://openalex.org/S2484188435","display_name":"IEEE Transactions on Cognitive Communications and Networking","issn_l":"2332-7731","issn":["2332-7731","2372-2045"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cognitive Communications and Networking","raw_type":"journal-article"},"type":"article","indexed_in":["arxiv","crossref"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2103.04666","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Federico Venturini","orcid":"https://orcid.org/0000-0001-6623-7359"},"institutions":[{"id":"https://openalex.org/I138689650","display_name":"University of Padua","ror":"https://ror.org/00240q980","country_code":"IT","type":"education","lineage":["https://openalex.org/I138689650"]}],"countries":["IT"],"is_corresponding":true,"raw_author_name":"Federico Venturini","raw_affiliation_strings":["University of Padova, Padua, Italy"],"affiliations":[{"raw_affiliation_string":"University of Padova, Padua, Italy","institution_ids":["https://openalex.org/I138689650"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Federico Mason","orcid":"https://orcid.org/0000-0001-5681-1695"},"institutions":[{"id":"https://openalex.org/I138689650","display_name":"University of Padua","ror":"https://ror.org/00240q980","country_code":"IT","type":"education","lineage":["https://openalex.org/I138689650"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Federico Mason","raw_affiliation_strings":["University of Padova, Padua, Italy"],"affiliations":[{"raw_affiliation_string":"University of Padova, Padua, Italy","institution_ids":["https://openalex.org/I138689650"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Francesco Pase","orcid":"https://orcid.org/0000-0003-0116-8852"},"institutions":[{"id":"https://openalex.org/I138689650","display_name":"University of Padua","ror":"https://ror.org/00240q980","country_code":"IT","type":"education","lineage":["https://openalex.org/I138689650"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Francesco Pase","raw_affiliation_strings":["University of Padova, Padua, Italy"],"affiliations":[{"raw_affiliation_string":"University of Padova, Padua, Italy","institution_ids":["https://openalex.org/I138689650"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Federico Chiariotti","orcid":"https://orcid.org/0000-0002-7915-7275"},"institutions":[{"id":"https://openalex.org/I891191580","display_name":"Aalborg University","ror":"https://ror.org/04m5j1k67","country_code":"DK","type":"education","lineage":["https://openalex.org/I891191580"]}],"countries":["DK"],"is_corresponding":false,"raw_author_name":"Federico Chiariotti","raw_affiliation_strings":["Aalborg University, Aalborg, Denmark"],"affiliations":[{"raw_affiliation_string":"Aalborg University, Aalborg, Denmark","institution_ids":["https://openalex.org/I891191580"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Alberto Testolin","orcid":"https://orcid.org/0000-0001-7062-4861"},"institutions":[{"id":"https://openalex.org/I138689650","display_name":"University of Padua","ror":"https://ror.org/00240q980","country_code":"IT","type":"education","lineage":["https://openalex.org/I138689650"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Alberto Testolin","raw_affiliation_strings":["University of Padova, Padua, Italy"],"affiliations":[{"raw_affiliation_string":"University of Padova, Padua, Italy","institution_ids":["https://openalex.org/I138689650"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Andrea Zanella","orcid":"https://orcid.org/0000-0003-3671-5190"},"institutions":[{"id":"https://openalex.org/I138689650","display_name":"University of Padua","ror":"https://ror.org/00240q980","country_code":"IT","type":"education","lineage":["https://openalex.org/I138689650"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Andrea Zanella","raw_affiliation_strings":["University of Padova, Padua, Italy"],"affiliations":[{"raw_affiliation_string":"University of Padova, Padua, Italy","institution_ids":["https://openalex.org/I138689650"]}]},{"author_position":"last","author":{"id":null,"display_name":"Michele Zorzi","orcid":"https://orcid.org/0000-0003-2870-4678"},"institutions":[{"id":"https://openalex.org/I138689650","display_name":"University of Padua","ror":"https://ror.org/00240q980","country_code":"IT","type":"education","lineage":["https://openalex.org/I138689650"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Michele Zorzi","raw_affiliation_strings":["University of Padova, Padua, Italy"],"affiliations":[{"raw_affiliation_string":"University of Padova, Padua, Italy","institution_ids":["https://openalex.org/I138689650"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I138689650"],"apc_list":null,"apc_paid":null,"fwci":32.8418,"has_fulltext":true,"cited_by_count":56,"citation_normalized_percentile":{"value":0.9941304,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"7","issue":"3","first_page":"955","last_page":"969"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.9083999991416931,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.9083999991416931,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.03620000183582306,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.02800000086426735,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.8424000144004822},{"id":"https://openalex.org/keywords/swarm-behaviour","display_name":"Swarm behaviour","score":0.7114999890327454},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6794999837875366},{"id":"https://openalex.org/keywords/information-exchange","display_name":"Information exchange","score":0.5135999917984009},{"id":"https://openalex.org/keywords/channel","display_name":"Channel (broadcasting)","score":0.49869999289512634},{"id":"https://openalex.org/keywords/reduction","display_name":"Reduction (mathematics)","score":0.4487999975681305},{"id":"https://openalex.org/keywords/wireless","display_name":"Wireless","score":0.38359999656677246}],"concepts":[{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.8424000144004822},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8331000208854675},{"id":"https://openalex.org/C181335050","wikidata":"https://www.wikidata.org/wiki/Q14915018","display_name":"Swarm behaviour","level":2,"score":0.7114999890327454},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6794999837875366},{"id":"https://openalex.org/C189693848","wikidata":"https://www.wikidata.org/wiki/Q6031064","display_name":"Information exchange","level":2,"score":0.5135999917984009},{"id":"https://openalex.org/C127162648","wikidata":"https://www.wikidata.org/wiki/Q16858953","display_name":"Channel (broadcasting)","level":2,"score":0.49869999289512634},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.46209999918937683},{"id":"https://openalex.org/C111335779","wikidata":"https://www.wikidata.org/wiki/Q3454686","display_name":"Reduction (mathematics)","level":2,"score":0.4487999975681305},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.4002000093460083},{"id":"https://openalex.org/C555944384","wikidata":"https://www.wikidata.org/wiki/Q249","display_name":"Wireless","level":2,"score":0.38359999656677246},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.34540000557899475},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3427000045776367},{"id":"https://openalex.org/C24590314","wikidata":"https://www.wikidata.org/wiki/Q336038","display_name":"Wireless sensor network","level":2,"score":0.3208000063896179},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2948000133037567},{"id":"https://openalex.org/C130120984","wikidata":"https://www.wikidata.org/wiki/Q2835898","display_name":"Distributed algorithm","level":2,"score":0.28049999475479126},{"id":"https://openalex.org/C2778820799","wikidata":"https://www.wikidata.org/wiki/Q3454688","display_name":"Cost reduction","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.2612999975681305},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.25519999861717224}],"mesh":[],"locations_count":6,"locations":[{"id":"doi:10.1109/tccn.2021.3063170","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tccn.2021.3063170","pdf_url":null,"source":{"id":"https://openalex.org/S2484188435","display_name":"IEEE Transactions on Cognitive Communications and Networking","issn_l":"2332-7731","issn":["2332-7731","2372-2045"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cognitive Communications and Networking","raw_type":"journal-article"},{"id":"pmh:oai:arXiv.org:2103.04666","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.04666","pdf_url":"https://arxiv.org/pdf/2103.04666","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"pmh:oai:pure.atira.dk:openaire/5bdf1921-f97f-47ed-9217-9693828506ee","is_oa":true,"landing_page_url":"https://vbn.aau.dk/da/publications/5bdf1921-f97f-47ed-9217-9693828506ee","pdf_url":"https://vbn.aau.dk/ws/files/475874659/Distributed_Reinforcement_Learning_for_Flexible_and_Efficient_UAV_Swarm_Control.pdf","source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by-sa","license_id":"https://openalex.org/licenses/cc-by-sa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Venturini, F, Mason, F, Pase, F, Chiariotti, F, Testolin, A, Zanella, A & Zorzi, M 2021, 'Distributed Reinforcement Learning for Flexible and Efficient UAV Swarm Control', IEEE Transactions on Cognitive Communications and Networking, vol. 7, no. 3, pp. 955-969. https://doi.org/10.1109/TCCN.2021.3063170","raw_type":"info:eu-repo/semantics/publishedVersion"},{"id":"pmh:oai:pure.atira.dk:publications/5bdf1921-f97f-47ed-9217-9693828506ee","is_oa":true,"landing_page_url":"http://www.scopus.com/inward/record.url?scp=85102309125&partnerID=8YFLogxK","pdf_url":null,"source":{"id":"https://openalex.org/S4306401731","display_name":"VBN Forskningsportal (Aalborg Universitet)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I891191580","host_organization_name":"Aalborg University","host_organization_lineage":["https://openalex.org/I891191580"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Venturini , F , Mason , F , Pase , F , Chiariotti , F , Testolin , A , Zanella , A &amp; Zorzi , M 2021 , ' Distributed Reinforcement Learning for Flexible and Efficient UAV Swarm Control ' , IEEE Transactions on Cognitive Communications and Networking , vol. 7 , no. 3 , pp. 955-969 . https://doi.org/10.1109/TCCN.2021.3063170","raw_type":"article"},{"id":"pmh:oai:www.research.unipd.it:11577/3389431","is_oa":false,"landing_page_url":"http://hdl.handle.net/11577/3389431","pdf_url":null,"source":{"id":"https://openalex.org/S4377196283","display_name":"Research Padua  Archive (University of Padua)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I138689650","host_organization_name":"University of Padua","host_organization_lineage":["https://openalex.org/I138689650"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"","raw_type":"info:eu-repo/semantics/article"},{"id":"pmh:oai:www.research.unipd.it:11577/3494625","is_oa":false,"landing_page_url":"https://hdl.handle.net/11577/3494625","pdf_url":null,"source":{"id":"https://openalex.org/S4377196283","display_name":"Research Padua  Archive (University of Padua)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I138689650","host_organization_name":"University of Padua","host_organization_lineage":["https://openalex.org/I138689650"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2103.04666","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2103.04666","pdf_url":"https://arxiv.org/pdf/2103.04666","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G1486038497","display_name":null,"funder_award_id":"Law 232/2016","funder_id":"https://openalex.org/F4320321873","funder_display_name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca"},{"id":"https://openalex.org/G23227818","display_name":null,"funder_award_id":"\"Departments of Excellence\" (Law 232/2016)","funder_id":"https://openalex.org/F4320321873","funder_display_name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca"},{"id":"https://openalex.org/G5329322851","display_name":null,"funder_award_id":"232/2016","funder_id":"https://openalex.org/F4320317295","funder_display_name":"Dipartimenti di Eccellenza"},{"id":"https://openalex.org/G538436047","display_name":null,"funder_award_id":"Networks","funder_id":"https://openalex.org/F4320321873","funder_display_name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca"},{"id":"https://openalex.org/G5417130124","display_name":null,"funder_award_id":"232/2016","funder_id":"https://openalex.org/F4320321873","funder_display_name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca"},{"id":"https://openalex.org/G7452299184","display_name":null,"funder_award_id":"W911NF","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"},{"id":"https://openalex.org/G8254916772","display_name":null,"funder_award_id":"Law 232/2016","funder_id":"https://openalex.org/F4320317295","funder_display_name":"Dipartimenti di Eccellenza"},{"id":"https://openalex.org/G8998121839","display_name":null,"funder_award_id":"911NF","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"},{"id":"https://openalex.org/G965573633","display_name":null,"funder_award_id":"W911NF1910","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"},{"id":"https://openalex.org/G987767699","display_name":null,"funder_award_id":"W911NF1910232","funder_id":"https://openalex.org/F4320338281","funder_display_name":"Army Research Office"}],"funders":[{"id":"https://openalex.org/F4320317295","display_name":"Dipartimenti di Eccellenza","ror":null},{"id":"https://openalex.org/F4320321873","display_name":"Ministero dell\u2019Istruzione, dell\u2019Universit\u00e0 e della Ricerca","ror":"https://ror.org/0166hxq48"},{"id":"https://openalex.org/F4320338281","display_name":"Army Research Office","ror":"https://ror.org/05epdh915"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W1932847118","https://openalex.org/W2145339207","https://openalex.org/W2155968351","https://openalex.org/W2497473826","https://openalex.org/W2522615148","https://openalex.org/W2747213132","https://openalex.org/W2775495931","https://openalex.org/W2886401384","https://openalex.org/W2886509985","https://openalex.org/W2887784286","https://openalex.org/W2893813411","https://openalex.org/W2896720518","https://openalex.org/W2958874452","https://openalex.org/W2962854114","https://openalex.org/W2963287938","https://openalex.org/W2963569053","https://openalex.org/W2964536243","https://openalex.org/W2969525674","https://openalex.org/W2981038142","https://openalex.org/W2982599276","https://openalex.org/W2986600625","https://openalex.org/W3010191728","https://openalex.org/W3033782504","https://openalex.org/W3036252686","https://openalex.org/W4213147678","https://openalex.org/W4214717370","https://openalex.org/W6635209275","https://openalex.org/W6637934594","https://openalex.org/W6712181171","https://openalex.org/W6712951187"],"related_works":[],"abstract_inverted_index":{"Over":[0],"the":[1,5,26,30,38,82,85,103,110],"past":[2],"few":[3],"years,":[4],"use":[6],"of":[7,9,33,132],"swarms":[8,74],"Unmanned":[10],"Aerial":[11],"Vehicles":[12],"(UAVs)":[13],"in":[14,37,47,95,141],"monitoring":[15],"and":[16,29,51,100,124,134],"remote":[17],"area":[18],"surveillance":[19],"applications":[20],"has":[21],"become":[22],"widespread":[23],"thanks":[24],"to":[25,41,49,72,87,97,120,148,166],"price":[27],"reduction":[28],"increased":[31],"capabilities":[32],"drones.":[34],"The":[35,77],"drones":[36],"swarm":[39],"need":[40],"cooperatively":[42],"explore":[43],"an":[44],"unknown":[45],"area,":[46],"order":[48,96],"identify":[50],"monitor":[52],"interesting":[53],"targets,":[54],"while":[55],"minimizing":[56],"their":[57],"movements.":[58],"In":[59],"this":[60],"work,":[61],"we":[62],"propose":[63],"a":[64,92,142,149,167],"distributed":[65],"Reinforcement":[66],"Learning":[67],"(RL)":[68],"approach":[69,161],"that":[70,109,125,159],"scales":[71],"larger":[73],"without":[75],"modifications.":[76],"proposed":[78,111],"framework":[79],"relies":[80],"on":[81],"possibility":[83],"for":[84],"UAVs":[86],"exchange":[88],"some":[89],"information":[90],"through":[91],"communication":[93,121],"channel,":[94],"achieve":[98],"context-awareness":[99],"implicitly":[101],"coordinate":[102],"swarm\u2019s":[104],"actions.":[105],"Our":[106],"experiments":[107],"show":[108,158],"method":[112],"can":[113,126,146],"yield":[114],"effective":[115],"strategies,":[116],"which":[117],"are":[118,139],"robust":[119],"channel":[122],"impairments,":[123],"easily":[127],"deal":[128],"with":[129,152],"non-uniform":[130],"distributions":[131],"targets":[133],"obstacles.":[135],"Moreover,":[136],"when":[137],"agents":[138],"trained":[140],"specific":[143],"scenario,":[144],"they":[145],"adapt":[147],"new":[150],"one":[151],"minimal":[153],"additional":[154],"training.":[155],"We":[156],"also":[157],"our":[160],"achieves":[162],"better":[163],"performance":[164],"compared":[165],"computationally":[168],"intensive":[169],"look-ahead":[170],"heuristic.":[171]},"counts_by_year":[{"year":2025,"cited_by_count":26},{"year":2024,"cited_by_count":15},{"year":2023,"cited_by_count":11},{"year":2022,"cited_by_count":2},{"year":2021,"cited_by_count":2}],"updated_date":"2026-04-12T07:58:50.170612","created_date":"2021-03-15T00:00:00"}
