{"id":"https://openalex.org/W2087322096","doi":"https://doi.org/10.1145/1160633.1160770","title":"Learning to cooperate in multi-agent social dilemmas","display_name":"Learning to cooperate in multi-agent social dilemmas","publication_year":2006,"publication_date":"2006-05-08","ids":{"openalex":"https://openalex.org/W2087322096","doi":"https://doi.org/10.1145/1160633.1160770","mag":"2087322096"},"language":"en","primary_location":{"id":"doi:10.1145/1160633.1160770","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1160633.1160770","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the fifth international joint conference on Autonomous agents and multiagent systems","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5064277708","display_name":"Enrique Mu\u00f1oz de Cote","orcid":"https://orcid.org/0000-0002-3249-096X"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Enrique Munoz de Cote","raw_affiliation_strings":["Politecnico di Milano, piazza Leonardo da Vinci, Milan, Italy","Politecnico di Milano - Piazza Leonardo da Vinci, Milan, Italy#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Politecnico di Milano, piazza Leonardo da Vinci, Milan, Italy","institution_ids":["https://openalex.org/I93860229"]},{"raw_affiliation_string":"Politecnico di Milano - Piazza Leonardo da Vinci, Milan, Italy#TAB#","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5014791481","display_name":"Alessandro Lazaric","orcid":"https://orcid.org/0000-0002-8970-413X"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Alessandro Lazaric","raw_affiliation_strings":["Politecnico di Milano, piazza Leonardo da Vinci, Milan, Italy","Politecnico di Milano - Piazza Leonardo da Vinci, Milan, Italy#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Politecnico di Milano, piazza Leonardo da Vinci, Milan, Italy","institution_ids":["https://openalex.org/I93860229"]},{"raw_affiliation_string":"Politecnico di Milano - Piazza Leonardo da Vinci, Milan, Italy#TAB#","institution_ids":["https://openalex.org/I93860229"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5017130830","display_name":"Marcello Restelli","orcid":"https://orcid.org/0000-0002-6322-1076"},"institutions":[{"id":"https://openalex.org/I93860229","display_name":"Politecnico di Milano","ror":"https://ror.org/01nffqt88","country_code":"IT","type":"education","lineage":["https://openalex.org/I93860229"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Marcello Restelli","raw_affiliation_strings":["Politecnico di Milano, piazza Leonardo da Vinci, Milan, Italy","Politecnico di Milano - Piazza Leonardo da Vinci, Milan, Italy#TAB#"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Politecnico di Milano, piazza Leonardo da Vinci, Milan, Italy","institution_ids":["https://openalex.org/I93860229"]},{"raw_affiliation_string":"Politecnico di Milano - Piazza Leonardo da Vinci, Milan, Italy#TAB#","institution_ids":["https://openalex.org/I93860229"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":2.1315,"has_fulltext":false,"cited_by_count":51,"citation_normalized_percentile":{"value":0.91195956,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"783","last_page":"785"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11252","display_name":"Evolutionary Game Theory and Cooperation","score":0.9800999760627747,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11252","display_name":"Evolutionary Game Theory and Cooperation","score":0.9800999760627747,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11031","display_name":"Game Theory and Applications","score":0.9787999987602234,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9757999777793884,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7950248718261719},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6747352480888367},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.5542956590652466},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.5352051854133606},{"id":"https://openalex.org/keywords/social-dilemma","display_name":"Social dilemma","score":0.5025560855865479},{"id":"https://openalex.org/keywords/pareto-principle","display_name":"Pareto principle","score":0.492903470993042},{"id":"https://openalex.org/keywords/social-learning","display_name":"Social learning","score":0.4672624468803406},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.38070523738861084},{"id":"https://openalex.org/keywords/distributed-computing","display_name":"Distributed computing","score":0.32926011085510254},{"id":"https://openalex.org/keywords/knowledge-management","display_name":"Knowledge management","score":0.3030989170074463},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.20247462391853333},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.17733830213546753},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.09084093570709229},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.07722154259681702}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7950248718261719},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6747352480888367},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.5542956590652466},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.5352051854133606},{"id":"https://openalex.org/C187206662","wikidata":"https://www.wikidata.org/wiki/Q55607920","display_name":"Social dilemma","level":2,"score":0.5025560855865479},{"id":"https://openalex.org/C137635306","wikidata":"https://www.wikidata.org/wiki/Q182667","display_name":"Pareto principle","level":2,"score":0.492903470993042},{"id":"https://openalex.org/C79416737","wikidata":"https://www.wikidata.org/wiki/Q2305519","display_name":"Social learning","level":2,"score":0.4672624468803406},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38070523738861084},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.32926011085510254},{"id":"https://openalex.org/C56739046","wikidata":"https://www.wikidata.org/wiki/Q192060","display_name":"Knowledge management","level":1,"score":0.3030989170074463},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.20247462391853333},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.17733830213546753},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.09084093570709229},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.07722154259681702},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/1160633.1160770","is_oa":false,"landing_page_url":"https://doi.org/10.1145/1160633.1160770","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the fifth international joint conference on Autonomous agents and multiagent systems","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/17","display_name":"Partnerships for the goals","score":0.44999998807907104}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":16,"referenced_works":["https://openalex.org/W28155157","https://openalex.org/W1513468570","https://openalex.org/W1519783625","https://openalex.org/W1542941925","https://openalex.org/W1641379095","https://openalex.org/W1656616331","https://openalex.org/W2053616263","https://openalex.org/W2104602264","https://openalex.org/W2120327309","https://openalex.org/W2124951424","https://openalex.org/W2132979098","https://openalex.org/W2133096155","https://openalex.org/W2142839172","https://openalex.org/W2164637474","https://openalex.org/W3091511613","https://openalex.org/W6680008307"],"related_works":["https://openalex.org/W4362501864","https://openalex.org/W4306904969","https://openalex.org/W4380318855","https://openalex.org/W2138720691","https://openalex.org/W2031695474","https://openalex.org/W2586732548","https://openalex.org/W2950219151","https://openalex.org/W2946123577","https://openalex.org/W3212652405","https://openalex.org/W2803797390"],"abstract_inverted_index":{"In":[0],"many":[1],"Multi-Agent":[2],"Systems":[3],"(MAS),":[4],"self-interested":[5],"agents":[6,29],"need":[7],"to":[8,12,25],"cooperate":[9],"in":[10,17],"order":[11],"maximize":[13],"their":[14],"own":[15],"utilities":[16],"time.":[18],"The":[19],"goal":[20],"of":[21,41,57],"this":[22],"work":[23],"is":[24],"improve":[26],"cooperation":[27],"among":[28],"that":[30,53],"use":[31],"best-response":[32],"Reinforcement":[33],"Learning":[34],"(RL)":[35],"algorithms":[36],"(Q-Learning),":[37],"by":[38],"the":[39,55],"introduction":[40],"two":[42],"new":[43],"principles":[44],"(Change":[45],"or":[46],"Learn":[47],"Fast":[48],"and":[49,51],"Change":[50],"Keep)":[52],"foster":[54],"reaching":[56],"Pareto":[58],"efficient":[59],"stable":[60],"outcomes.":[61]},"counts_by_year":[{"year":2025,"cited_by_count":3},{"year":2024,"cited_by_count":3},{"year":2023,"cited_by_count":6},{"year":2022,"cited_by_count":1},{"year":2021,"cited_by_count":4},{"year":2020,"cited_by_count":6},{"year":2019,"cited_by_count":4},{"year":2018,"cited_by_count":6},{"year":2017,"cited_by_count":7},{"year":2016,"cited_by_count":3},{"year":2012,"cited_by_count":2}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
