{"id":"https://openalex.org/W4417291964","doi":"https://doi.org/10.48550/arxiv.2512.09682","title":"Dynamic one-time delivery of critical data by small and sparse UAV swarms: a model problem for MARL scaling studies","display_name":"Dynamic one-time delivery of critical data by small and sparse UAV swarms: a model problem for MARL scaling studies","publication_year":2025,"publication_date":"2025-12-10","ids":{"openalex":"https://openalex.org/W4417291964","doi":"https://doi.org/10.48550/arxiv.2512.09682"},"language":null,"primary_location":{"id":"pmh:oai:arXiv.org:2512.09682","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2512.09682","pdf_url":"https://arxiv.org/pdf/2512.09682","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2512.09682","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052102547","display_name":"Mikael Persson","orcid":"https://orcid.org/0000-0002-1335-2377"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Persson, Mika","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120790166","display_name":"Jonas Lidman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lidman, Jonas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120790167","display_name":"Jacob Ljungberg","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ljungberg, Jacob","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120790168","display_name":"Samuel Sandelius","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sandelius, Samuel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5040822148","display_name":"Adam Andersson","orcid":"https://orcid.org/0000-0002-8342-4997"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Andersson, Adam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5052102547"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.40389999747276306,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.40389999747276306,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.2689000070095062,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.11110000312328339,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.6410999894142151},{"id":"https://openalex.org/keywords/scaling","display_name":"Scaling","score":0.6317999958992004},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6189000010490417},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5382999777793884},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.4449999928474426},{"id":"https://openalex.org/keywords/dynamic-scaling","display_name":"Dynamic scaling","score":0.4018999934196472},{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.39320001006126404},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.3921000063419342}],"concepts":[{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.6410999894142151},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.6317999958992004},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6189000010490417},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6061000227928162},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5382999777793884},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.4449999928474426},{"id":"https://openalex.org/C2780500908","wikidata":"https://www.wikidata.org/wiki/Q28405357","display_name":"Dynamic scaling","level":3,"score":0.4018999934196472},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.39320001006126404},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3921000063419342},{"id":"https://openalex.org/C2778156585","wikidata":"https://www.wikidata.org/wiki/Q174053","display_name":"Relay","level":3,"score":0.3725999891757965},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.35670000314712524},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3416000008583069},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.33399999141693115},{"id":"https://openalex.org/C112758219","wikidata":"https://www.wikidata.org/wiki/Q16038819","display_name":"Duration (music)","level":2,"score":0.32089999318122864},{"id":"https://openalex.org/C37404715","wikidata":"https://www.wikidata.org/wiki/Q380679","display_name":"Dynamic programming","level":2,"score":0.3192000091075897},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3192000091075897},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.30649998784065247},{"id":"https://openalex.org/C205875254","wikidata":"https://www.wikidata.org/wiki/Q17156857","display_name":"Decentralised system","level":3,"score":0.29170000553131104},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2890999913215637},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.27709999680519104},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.2709999978542328},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.26969999074935913},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.2549999952316284}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2512.09682","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2512.09682","pdf_url":"https://arxiv.org/pdf/2512.09682","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2512.09682","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2512.09682","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2512.09682","is_oa":true,"landing_page_url":"https://arxiv.org/abs/2512.09682","pdf_url":"https://arxiv.org/pdf/2512.09682","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4417291964.pdf","grobid_xml":"https://content.openalex.org/works/W4417291964.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"This":[0],"work":[1],"studies":[2],"the":[3,70,83],"application":[4],"of":[5,13,32,76,85],"Multi-Agent":[6],"Reinforcement":[7],"Learning":[8],"(MARL)":[9],"to":[10,17,23],"decentralized":[11],"control":[12],"unmanned":[14],"aerial":[15],"vehicles":[16],"relay":[18],"a":[19,24,30,73],"critical":[20],"data":[21],"package":[22],"known":[25],"position.":[26],"For":[27],"this":[28],"purpose,":[29],"family":[31],"deterministic":[33],"games":[34],"is":[35,46],"introduced,":[36],"designed":[37],"for":[38,72],"MARL":[39,65],"scaling":[40],"studies.":[41],"A":[42],"robust":[43],"baseline":[44,71],"policy":[45],"proposed":[47],"which":[48],"restricts":[49],"agent":[50],"motion":[51],"and":[52,90],"applies":[53],"Dijkstra's":[54],"shortest":[55],"path":[56],"algorithm.":[57],"Computational":[58],"experiment":[59],"results":[60],"show":[61],"that":[62],"two":[63],"off-the-shelf":[64],"algorithms":[66],"perform":[67],"competitively":[68],"with":[69],"small":[74],"number":[75,84],"agents,":[77],"but":[78],"face":[79],"scalability":[80],"issues":[81],"as":[82],"agents":[86],"increases.":[87],"Source":[88],"code":[89],"animations":[91],"are":[92],"available":[93],"online":[94],"at":[95],"https://github.com/mikapersson/Information-Relaying.":[96]},"counts_by_year":[],"updated_date":"2026-05-12T06:07:45.972803","created_date":"2025-12-12T00:00:00"}
