{"id":"https://openalex.org/W7125785686","doi":"https://doi.org/10.48550/arxiv.2601.18419","title":"Emergent Cooperation in Quantum Multi-Agent Reinforcement Learning Using Communication","display_name":"Emergent Cooperation in Quantum Multi-Agent Reinforcement Learning Using Communication","publication_year":2026,"publication_date":"2026-01-26","ids":{"openalex":"https://openalex.org/W7125785686","doi":"https://doi.org/10.48550/arxiv.2601.18419"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2601.18419","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.18419","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2601.18419","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5123883786","display_name":"Michael K\u00f6lle","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"K\u00f6lle, Michael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123919415","display_name":"Christian Reff","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Reff, Christian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5027573088","display_name":"Leo S\u00fcnkel","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"S\u00fcnkel, Leo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5123970327","display_name":"Julian Hager","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hager, Julian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075906510","display_name":"Gerhard Stenzel","orcid":"https://orcid.org/0009-0009-0280-4911"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Stenzel, Gerhard","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5123947722","display_name":"Claudia Linnhoff-Popien","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Linnhoff-Popien, Claudia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5123883786"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11252","display_name":"Evolutionary Game Theory and Cooperation","score":0.6754999756813049,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11252","display_name":"Evolutionary Game Theory and Cooperation","score":0.6754999756813049,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10646","display_name":"Experimental Behavioral Economics Studies","score":0.06360000371932983,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11031","display_name":"Game Theory and Applications","score":0.02669999934732914,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8438000082969666},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5579000115394592},{"id":"https://openalex.org/keywords/incentive","display_name":"Incentive","score":0.45829999446868896},{"id":"https://openalex.org/keywords/quantum","display_name":"Quantum","score":0.4050000011920929},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4027999937534332},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.39969998598098755},{"id":"https://openalex.org/keywords/game-theory","display_name":"Game theory","score":0.3411000072956085}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8438000082969666},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6299999952316284},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5579000115394592},{"id":"https://openalex.org/C29122968","wikidata":"https://www.wikidata.org/wiki/Q1414816","display_name":"Incentive","level":2,"score":0.45829999446868896},{"id":"https://openalex.org/C84114770","wikidata":"https://www.wikidata.org/wiki/Q46344","display_name":"Quantum","level":2,"score":0.4050000011920929},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4027999937534332},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.39969998598098755},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3634999990463257},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.3411000072956085},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.32179999351501465},{"id":"https://openalex.org/C189693848","wikidata":"https://www.wikidata.org/wiki/Q6031064","display_name":"Information exchange","level":2,"score":0.32019999623298645},{"id":"https://openalex.org/C169903001","wikidata":"https://www.wikidata.org/wiki/Q3264987","display_name":"Reciprocity (cultural anthropology)","level":2,"score":0.3028999865055084},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.29409998655319214},{"id":"https://openalex.org/C140479938","wikidata":"https://www.wikidata.org/wiki/Q5254619","display_name":"Iterated function","level":2,"score":0.2881999909877777},{"id":"https://openalex.org/C79416737","wikidata":"https://www.wikidata.org/wiki/Q2305519","display_name":"Social learning","level":2,"score":0.2827000021934509},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.27549999952316284},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.26600000262260437}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2601.18419","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.18419","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2601.18419","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2601.18419","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.44449275732040405,"display_name":"Partnerships for the goals","id":"https://metadata.un.org/sdg/17"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Emergent":[0],"cooperation":[1,121,136],"in":[2,12,88,137],"classical":[3,21],"Multi-Agent":[4,38,139],"Reinforcement":[5,39,140],"Learning":[6,40,82],"has":[7],"gained":[8],"significant":[9],"attention,":[10],"particularly":[11,43],"the":[13,57,74,91],"context":[14],"of":[15,101],"Sequential":[16],"Social":[17],"Dilemmas":[18],"(SSDs).":[19],"While":[20],"reinforcement":[22],"learning":[23],"approaches":[24,52,87,108],"have":[25],"demonstrated":[26],"capability":[27],"for":[28,133],"emergent":[29,135],"cooperation,":[30],"research":[31],"on":[32],"extending":[33],"these":[34,86],"methods":[35],"to":[36,53],"Quantum":[37,138],"remains":[41],"limited,":[42],"through":[44],"communication.":[45],"In":[46],"this":[47],"paper,":[48],"we":[49],"apply":[50],"communication":[51,128],"quantum":[54],"Q-Learning":[55],"agents:":[56],"Mutual":[58],"Acknowledgment":[59,70],"Token":[60,71],"Exchange":[61,72],"(MATE)":[62],"protocol,":[63],"its":[64],"extension":[65],"Mutually":[66],"Endorsed":[67],"Distributed":[68],"Incentive":[69],"(MEDIATE),":[73],"peer":[75],"rewarding":[76],"mechanism":[77,132],"Gifting,":[78],"and":[79,98,117],"Reinforced":[80],"Inter-Agent":[81],"(RIAL).":[83],"We":[84],"evaluate":[85],"three":[89],"SSDs:":[90],"Iterated":[92,95,99],"Prisoner's":[93],"Dilemma,":[94],"Stag":[96],"Hunt,":[97],"Game":[100],"Chicken.":[102],"Our":[103],"experimental":[104],"results":[105],"show":[106],"that":[107,127],"using":[109],"MATE":[110],"with":[111],"temporal-difference":[112],"measure":[113],"(MATE\\textsubscript{TD}),":[114],"AutoMATE,":[115],"MEDIATE-I,":[116],"MEDIATE-S":[118],"achieved":[119],"high":[120],"levels":[122],"across":[123],"all":[124],"dilemmas,":[125],"demonstrating":[126],"is":[129],"a":[130],"viable":[131],"fostering":[134],"Learning.":[141]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2026-01-28T00:00:00"}
