{"id":"https://openalex.org/W4410453429","doi":"https://doi.org/10.1007/s10458-025-09707-7","title":"Entropy based blending of policies for multi-agent coexistence","display_name":"Entropy based blending of policies for multi-agent coexistence","publication_year":2025,"publication_date":"2025-05-16","ids":{"openalex":"https://openalex.org/W4410453429","doi":"https://doi.org/10.1007/s10458-025-09707-7"},"language":"en","primary_location":{"id":"doi:10.1007/s10458-025-09707-7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10458-025-09707-7","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10458-025-09707-7.pdf","source":{"id":"https://openalex.org/S5405189","display_name":"Autonomous Agents and Multi-Agent Systems","issn_l":"1387-2532","issn":["1387-2532","1573-7454"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Autonomous Agents and Multi-Agent Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"hybrid","oa_url":"https://link.springer.com/content/pdf/10.1007/s10458-025-09707-7.pdf","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5088711780","display_name":"David Rother","orcid":null},"institutions":[{"id":"https://openalex.org/I4210112253","display_name":"Honda (Germany)","ror":"https://ror.org/022c1xk47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1283473643","https://openalex.org/I4210112253"]},{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":true,"raw_author_name":"David Rother","raw_affiliation_strings":["Honda Research Institute EU, Offenbach, Germany","Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Honda Research Institute EU, Offenbach, Germany","institution_ids":["https://openalex.org/I4210112253"]},{"raw_affiliation_string":"Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102741270","display_name":"Franziska Herbert","orcid":"https://orcid.org/0000-0003-4191-9366"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Franziska Herbert","raw_affiliation_strings":["Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5117576283","display_name":"Fabian Kalter","orcid":null},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Fabian Kalter","raw_affiliation_strings":["Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5063353075","display_name":"Dorothea Koert","orcid":"https://orcid.org/0000-0002-3571-6848"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Dorothea Koert","raw_affiliation_strings":["Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017983137","display_name":"Joni Pajarinen","orcid":"https://orcid.org/0000-0003-4469-8191"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]},{"id":"https://openalex.org/I9927081","display_name":"Aalto University","ror":"https://ror.org/020hwjq30","country_code":"FI","type":"education","lineage":["https://openalex.org/I9927081"]}],"countries":["DE","FI"],"is_corresponding":false,"raw_author_name":"Joni Pajarinen","raw_affiliation_strings":["Aalto University, Espoo, Finland","Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Aalto University, Espoo, Finland","institution_ids":["https://openalex.org/I9927081"]},{"raw_affiliation_string":"Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051054354","display_name":"Jan Peters","orcid":"https://orcid.org/0000-0002-0195-5357"},"institutions":[{"id":"https://openalex.org/I31512782","display_name":"Technical University of Darmstadt","ror":"https://ror.org/05n911h24","country_code":"DE","type":"education","lineage":["https://openalex.org/I31512782"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Jan Peters","raw_affiliation_strings":["Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany"],"affiliations":[{"raw_affiliation_string":"Intelligent Autonomos Systems (IAS), TU Darmstadt, Darmstadt, Germany","institution_ids":["https://openalex.org/I31512782"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5007402183","display_name":"Thomas H. Weisswange","orcid":"https://orcid.org/0000-0003-2119-6965"},"institutions":[{"id":"https://openalex.org/I4210112253","display_name":"Honda (Germany)","ror":"https://ror.org/022c1xk47","country_code":"DE","type":"company","lineage":["https://openalex.org/I1283473643","https://openalex.org/I4210112253"]}],"countries":["DE"],"is_corresponding":false,"raw_author_name":"Thomas H. Weisswange","raw_affiliation_strings":["Honda Research Institute Europe GmbH, Offenbach, Germany"],"affiliations":[{"raw_affiliation_string":"Honda Research Institute Europe GmbH, Offenbach, Germany","institution_ids":["https://openalex.org/I4210112253"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5088711780"],"corresponding_institution_ids":["https://openalex.org/I31512782","https://openalex.org/I4210112253"],"apc_list":{"value":2390,"currency":"EUR","value_usd":2990},"apc_paid":{"value":2390,"currency":"EUR","value_usd":2990},"fwci":2.3431,"has_fulltext":true,"cited_by_count":1,"citation_normalized_percentile":{"value":0.8905427,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"39","issue":"1","first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.9962999820709229,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.9858999848365784,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/entropy","display_name":"Entropy (arrow of time)","score":0.4505411684513092},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4161769151687622},{"id":"https://openalex.org/keywords/statistical-physics","display_name":"Statistical physics","score":0.3477923274040222},{"id":"https://openalex.org/keywords/biological-system","display_name":"Biological system","score":0.3269680142402649},{"id":"https://openalex.org/keywords/thermodynamics","display_name":"Thermodynamics","score":0.21052652597427368},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.10945636034011841},{"id":"https://openalex.org/keywords/biology","display_name":"Biology","score":0.07452651858329773}],"concepts":[{"id":"https://openalex.org/C106301342","wikidata":"https://www.wikidata.org/wiki/Q4117933","display_name":"Entropy (arrow of time)","level":2,"score":0.4505411684513092},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4161769151687622},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.3477923274040222},{"id":"https://openalex.org/C186060115","wikidata":"https://www.wikidata.org/wiki/Q30336093","display_name":"Biological system","level":1,"score":0.3269680142402649},{"id":"https://openalex.org/C97355855","wikidata":"https://www.wikidata.org/wiki/Q11473","display_name":"Thermodynamics","level":1,"score":0.21052652597427368},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.10945636034011841},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.07452651858329773}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1007/s10458-025-09707-7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10458-025-09707-7","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10458-025-09707-7.pdf","source":{"id":"https://openalex.org/S5405189","display_name":"Autonomous Agents and Multi-Agent Systems","issn_l":"1387-2532","issn":["1387-2532","1573-7454"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Autonomous Agents and Multi-Agent Systems","raw_type":"journal-article"},{"id":"pmh:oai:aaltodoc.aalto.fi:123456789/135831","is_oa":true,"landing_page_url":"http://www.scopus.com/inward/record.url?scp=105005398921&partnerID=8YFLogxK","pdf_url":null,"source":{"id":"https://openalex.org/S4306401663","display_name":"Aaltodoc (Aalto University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I9927081","host_organization_name":"Aalto University","host_organization_lineage":["https://openalex.org/I9927081"],"host_organization_lineage_names":[],"type":"repository"},"license":"other-oa","license_id":"https://openalex.org/licenses/other-oa","version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"publishedVersion"},{"id":"pmh:oai:tubiblio.ulb.tu-darmstadt.de:156484","is_oa":false,"landing_page_url":"http://tubiblio.ulb.tu-darmstadt.de/view/person/Rother=3ADavid=3A=3A.html>","pdf_url":null,"source":{"id":"https://openalex.org/S4377196390","display_name":"TUbilio (Technical University of Darmstadt)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I31512782","host_organization_name":"Technische Universit\u00e4t Darmstadt","host_organization_lineage":["https://openalex.org/I31512782"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":null,"raw_type":"NonPeerReviewed"}],"best_oa_location":{"id":"doi:10.1007/s10458-025-09707-7","is_oa":true,"landing_page_url":"https://doi.org/10.1007/s10458-025-09707-7","pdf_url":"https://link.springer.com/content/pdf/10.1007/s10458-025-09707-7.pdf","source":{"id":"https://openalex.org/S5405189","display_name":"Autonomous Agents and Multi-Agent Systems","issn_l":"1387-2532","issn":["1387-2532","1573-7454"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319900","host_organization_name":"Springer Science+Business Media","host_organization_lineage":["https://openalex.org/P4310319900","https://openalex.org/P4310319965"],"host_organization_lineage_names":["Springer Science+Business Media","Springer Nature"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Autonomous Agents and Multi-Agent Systems","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8647972370","display_name":null,"funder_award_id":"01IS20045","funder_id":"https://openalex.org/F4320321114","funder_display_name":"Bundesministerium f\u00fcr Bildung und Forschung"}],"funders":[{"id":"https://openalex.org/F4320321108","display_name":"Academy of Finland","ror":"https://ror.org/05k73zm37"},{"id":"https://openalex.org/F4320321114","display_name":"Bundesministerium f\u00fcr Bildung und Forschung","ror":"https://ror.org/04pz7b180"},{"id":"https://openalex.org/F4320323384","display_name":"Technische Universit\u00e4t Darmstadt","ror":"https://ror.org/05n911h24"}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4410453429.pdf","grobid_xml":"https://content.openalex.org/works/W4410453429.grobid-xml"},"referenced_works_count":72,"referenced_works":["https://openalex.org/W337580137","https://openalex.org/W1535554606","https://openalex.org/W1568062101","https://openalex.org/W1596507639","https://openalex.org/W1605268984","https://openalex.org/W2026003182","https://openalex.org/W2053410861","https://openalex.org/W2078844124","https://openalex.org/W2081034428","https://openalex.org/W2097714468","https://openalex.org/W2105925198","https://openalex.org/W2113423686","https://openalex.org/W2116064496","https://openalex.org/W2142583797","https://openalex.org/W2143398066","https://openalex.org/W2149551746","https://openalex.org/W2162104245","https://openalex.org/W2167150807","https://openalex.org/W2215257094","https://openalex.org/W2293816024","https://openalex.org/W2339027962","https://openalex.org/W2535584654","https://openalex.org/W2571600439","https://openalex.org/W2591951582","https://openalex.org/W2594103415","https://openalex.org/W2604704722","https://openalex.org/W2604873668","https://openalex.org/W2621226867","https://openalex.org/W2623431351","https://openalex.org/W2626637010","https://openalex.org/W2794643322","https://openalex.org/W2796238456","https://openalex.org/W2891963971","https://openalex.org/W2907855292","https://openalex.org/W2949693231","https://openalex.org/W2963366811","https://openalex.org/W2963403593","https://openalex.org/W2968526727","https://openalex.org/W2989824617","https://openalex.org/W2990138404","https://openalex.org/W3006009210","https://openalex.org/W3022553186","https://openalex.org/W3031172930","https://openalex.org/W3087935424","https://openalex.org/W3090814332","https://openalex.org/W3094349299","https://openalex.org/W3098074911","https://openalex.org/W3148143011","https://openalex.org/W3167419264","https://openalex.org/W3170070145","https://openalex.org/W3170717711","https://openalex.org/W3177102170","https://openalex.org/W3188746815","https://openalex.org/W3194443001","https://openalex.org/W3204828078","https://openalex.org/W3212905267","https://openalex.org/W4205559380","https://openalex.org/W4211240529","https://openalex.org/W4250731795","https://openalex.org/W4284960570","https://openalex.org/W4298181618","https://openalex.org/W4312867245","https://openalex.org/W4383108656","https://openalex.org/W4387185250","https://openalex.org/W4387520149","https://openalex.org/W4388623195","https://openalex.org/W6631190155","https://openalex.org/W6741883356","https://openalex.org/W6748203849","https://openalex.org/W6847672028","https://openalex.org/W6903351479","https://openalex.org/W7046269321"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W2180033908"],"abstract_inverted_index":{"Abstract":[0],"Research":[1],"on":[2,16],"multi-agent":[3],"interaction":[4,125],"involving":[5],"humans":[6],"is":[7,186],"still":[8],"in":[9,32,35,73,198],"its":[10],"infancy.":[11],"Most":[12],"approaches":[13,77],"have":[14],"focused":[15],"environments":[17,34,205],"with":[18,54,160,180],"collaborative":[19],"human":[20],"behavior":[21,106],"or":[22,56,87],"a":[23,61,120,141,171],"small,":[24],"defined":[25],"set":[26],"of":[27,40,45,157,163],"situations.":[28],"When":[29],"deploying":[30],"robots":[31,102],"human-inhabited":[33],"the":[36,38,43,79,134,155,161,181,217],"future,":[37],"diversity":[39],"interactions":[41,179],"surpasses":[42],"capabilities":[44],"pre-trained":[46],"collaboration":[47,208],"models.":[48],"\u201dCoexistence\u201d":[49],"environments,":[50],"characterized":[51],"by":[52],"agents":[53,151,159,164],"varying":[55],"partially":[57],"aligned":[58],"objectives,":[59],"present":[60],"unique":[62],"challenge":[63],"for":[64,145,177],"robotic":[65],"collaboration.":[66],"Traditional":[67],"reinforcement":[68],"learning":[69,130,214],"methods":[70],"fall":[71],"short":[72],"these":[74],"settings.":[75],"These":[76],"lack":[78],"flexibility":[80],"to":[81,83,219],"adapt":[82],"changing":[84],"agent":[85,201],"counts":[86],"task":[88,146,183,199],"requirements":[89],"without":[90,109],"undergoing":[91],"retraining.":[92],"Moreover,":[93],"existing":[94],"models":[95],"do":[96],"not":[97],"adequately":[98],"support":[99,189],"scenarios":[100],"where":[101],"should":[103],"exhibit":[104],"helpful":[105],"toward":[107],"others":[108],"compromising":[110],"their":[111],"primary":[112],"goals.":[113],"To":[114,168,188],"tackle":[115],"this":[116,169],"issue,":[117],"we":[118,192],"introduce":[119],"novel":[121],"framework":[122,196],"that":[123,194],"decomposes":[124],"and":[126,132,152,165,200,206],"task-solving":[127],"into":[128],"separate":[129],"problems":[131],"blends":[133],"resulting":[135],"policies":[136],"at":[137],"inference":[138,143],"time":[139],"using":[140],"goal":[142],"model":[144],"estimation.":[147],"We":[148],"create":[149],"impact-aware":[150],"linearly":[153],"scale":[154],"cost":[156],"training":[158],"number":[162],"available":[166],"tasks.":[167],"end,":[170],"weighting":[172],"function":[173],"blending":[174],"action":[175,184],"distributions":[176],"individual":[178],"original":[182],"distribution":[185],"proposed.":[187],"our":[190,195],"claims":[191],"demonstrate":[193],"scales":[197],"count":[202],"across":[203],"several":[204],"considers":[207],"opportunities":[209],"when":[210],"present.":[211],"The":[212],"new":[213],"paradigm":[215],"opens":[216],"path":[218],"more":[220],"complex":[221],"multi-robot,":[222],"multi-human":[223],"interactions.":[224]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2026-04-10T15:06:20.359241","created_date":"2025-10-10T00:00:00"}
