{"id":"https://openalex.org/W2137377401","doi":"https://doi.org/10.1177/1059712312449547","title":"Rewards for pairs of Q-learning agents conducive to turn-taking in medium-access games","display_name":"Rewards for pairs of Q-learning agents conducive to turn-taking in medium-access games","publication_year":2012,"publication_date":"2012-06-25","ids":{"openalex":"https://openalex.org/W2137377401","doi":"https://doi.org/10.1177/1059712312449547","mag":"2137377401"},"language":"en","primary_location":{"id":"doi:10.1177/1059712312449547","is_oa":false,"landing_page_url":"https://doi.org/10.1177/1059712312449547","pdf_url":null,"source":{"id":"https://openalex.org/S183337005","display_name":"Adaptive Behavior","issn_l":"1059-7123","issn":["1059-7123","1741-2633"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Adaptive Behavior","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004476114","display_name":"Peter A Raffensperger","orcid":null},"institutions":[{"id":"https://openalex.org/I185492890","display_name":"University of Canterbury","ror":"https://ror.org/03y7q9t39","country_code":"NZ","type":"education","lineage":["https://openalex.org/I185492890"]}],"countries":["NZ"],"is_corresponding":false,"raw_author_name":"Peter A Raffensperger","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Canterbury, New Zealand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Canterbury, New Zealand","institution_ids":["https://openalex.org/I185492890"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049612660","display_name":"Philip J. Bones","orcid":"https://orcid.org/0000-0003-1611-7601"},"institutions":[{"id":"https://openalex.org/I185492890","display_name":"University of Canterbury","ror":"https://ror.org/03y7q9t39","country_code":"NZ","type":"education","lineage":["https://openalex.org/I185492890"]}],"countries":["NZ"],"is_corresponding":false,"raw_author_name":"Philip J Bones","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Canterbury, New Zealand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Canterbury, New Zealand","institution_ids":["https://openalex.org/I185492890"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000362900","display_name":"Allan McInnes","orcid":null},"institutions":[{"id":"https://openalex.org/I185492890","display_name":"University of Canterbury","ror":"https://ror.org/03y7q9t39","country_code":"NZ","type":"education","lineage":["https://openalex.org/I185492890"]}],"countries":["NZ"],"is_corresponding":false,"raw_author_name":"Allan I McInnes","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Canterbury, New Zealand"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Canterbury, New Zealand","institution_ids":["https://openalex.org/I185492890"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5044805750","display_name":"Russell Y. Webb","orcid":null},"institutions":[{"id":"https://openalex.org/I4210153776","display_name":"Apple (United States)","ror":"https://ror.org/059hsda18","country_code":"US","type":"company","lineage":["https://openalex.org/I4210153776"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Russell Y Webb","raw_affiliation_strings":["Apple Computer Inc., Cupertino, California, USA"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Apple Computer Inc., Cupertino, California, USA","institution_ids":["https://openalex.org/I4210153776"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.974,"has_fulltext":false,"cited_by_count":4,"citation_normalized_percentile":{"value":0.86062483,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":94},"biblio":{"volume":"20","issue":"4","first_page":"304","last_page":"318"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11252","display_name":"Evolutionary Game Theory and Cooperation","score":0.984499990940094,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11252","display_name":"Evolutionary Game Theory and Cooperation","score":0.984499990940094,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.9799000024795532,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12090","display_name":"Language and cultural evolution","score":0.9725000262260437,"subfield":{"id":"https://openalex.org/subfields/3316","display_name":"Cultural Studies"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7082706689834595},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.6728065609931946},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6495280265808105},{"id":"https://openalex.org/keywords/nash-equilibrium","display_name":"Nash equilibrium","score":0.598166823387146},{"id":"https://openalex.org/keywords/turn-taking","display_name":"Turn-taking","score":0.5424308776855469},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4917450249195099},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.4895552098751068},{"id":"https://openalex.org/keywords/stateful-firewall","display_name":"Stateful firewall","score":0.4426383972167969},{"id":"https://openalex.org/keywords/variety","display_name":"Variety (cybernetics)","score":0.42247626185417175},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.30043846368789673},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.2929065227508545},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.2043118178844452},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.17202073335647583},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.1660899519920349},{"id":"https://openalex.org/keywords/communication","display_name":"Communication","score":0.10414671897888184},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.0813373327255249},{"id":"https://openalex.org/keywords/conversation","display_name":"Conversation","score":0.07945334911346436}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7082706689834595},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.6728065609931946},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6495280265808105},{"id":"https://openalex.org/C46814582","wikidata":"https://www.wikidata.org/wiki/Q23389","display_name":"Nash equilibrium","level":2,"score":0.598166823387146},{"id":"https://openalex.org/C2776352735","wikidata":"https://www.wikidata.org/wiki/Q2313343","display_name":"Turn-taking","level":3,"score":0.5424308776855469},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4917450249195099},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.4895552098751068},{"id":"https://openalex.org/C22927095","wikidata":"https://www.wikidata.org/wiki/Q1784206","display_name":"Stateful firewall","level":3,"score":0.4426383972167969},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.42247626185417175},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.30043846368789673},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2929065227508545},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2043118178844452},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.17202073335647583},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.1660899519920349},{"id":"https://openalex.org/C46312422","wikidata":"https://www.wikidata.org/wiki/Q11024","display_name":"Communication","level":1,"score":0.10414671897888184},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0813373327255249},{"id":"https://openalex.org/C2777200299","wikidata":"https://www.wikidata.org/wiki/Q52943","display_name":"Conversation","level":2,"score":0.07945334911346436},{"id":"https://openalex.org/C158379750","wikidata":"https://www.wikidata.org/wiki/Q214111","display_name":"Network packet","level":2,"score":0.0},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1177/1059712312449547","is_oa":false,"landing_page_url":"https://doi.org/10.1177/1059712312449547","pdf_url":null,"source":{"id":"https://openalex.org/S183337005","display_name":"Adaptive Behavior","issn_l":"1059-7123","issn":["1059-7123","1741-2633"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320017","host_organization_name":"SAGE Publishing","host_organization_lineage":["https://openalex.org/P4310320017"],"host_organization_lineage_names":["SAGE Publishing"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Adaptive Behavior","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W304415408","https://openalex.org/W1484517649","https://openalex.org/W1515851193","https://openalex.org/W1523025179","https://openalex.org/W1589640982","https://openalex.org/W1963523946","https://openalex.org/W1967048917","https://openalex.org/W1967580276","https://openalex.org/W1970093479","https://openalex.org/W1998677696","https://openalex.org/W2003688174","https://openalex.org/W2013523787","https://openalex.org/W2034587361","https://openalex.org/W2049401150","https://openalex.org/W2060565531","https://openalex.org/W2067050450","https://openalex.org/W2072514121","https://openalex.org/W2077930544","https://openalex.org/W2080213916","https://openalex.org/W2081230844","https://openalex.org/W2083662736","https://openalex.org/W2099618002","https://openalex.org/W2103821767","https://openalex.org/W2109049179","https://openalex.org/W2118549177","https://openalex.org/W2119567691","https://openalex.org/W2120327309","https://openalex.org/W2120846115","https://openalex.org/W2123238705","https://openalex.org/W2136350462","https://openalex.org/W2136656867","https://openalex.org/W2137595467","https://openalex.org/W2145365096","https://openalex.org/W2150666905","https://openalex.org/W2150758132","https://openalex.org/W2153190547","https://openalex.org/W2153348040","https://openalex.org/W2158698691","https://openalex.org/W2162634167","https://openalex.org/W2163052928","https://openalex.org/W2164637474","https://openalex.org/W2226396244","https://openalex.org/W2266755976","https://openalex.org/W2334782222","https://openalex.org/W2774933427","https://openalex.org/W2914656440","https://openalex.org/W2990138404","https://openalex.org/W3011120880","https://openalex.org/W3125885476","https://openalex.org/W4248634141","https://openalex.org/W4301630257"],"related_works":["https://openalex.org/W2583381754","https://openalex.org/W2144255176","https://openalex.org/W2222333653","https://openalex.org/W2286614685","https://openalex.org/W109977192","https://openalex.org/W1970797462","https://openalex.org/W2566747981","https://openalex.org/W4312120139","https://openalex.org/W2342453732","https://openalex.org/W2809541058"],"abstract_inverted_index":{"We":[0,53,90,124,153],"describe":[1],"a":[2,13],"class":[3],"of":[4,28,35,72,98,103,122,137,148],"stateful":[5],"games,":[6],"which":[7,55],"we":[8,109,167,186],"call":[9],"\u2018medium-access":[10],"games\u2019,":[11],"as":[12,31],"model":[14],"for":[15,86,94,101,113,119,135,175,196],"human":[16],"and":[17,20,64,108],"machine":[18],"communication":[19],"demonstrate":[21],"how":[22,66,126],"to":[23,40,67,80,116,127,131,145,172,189,193],"use":[24,110,128,190],"the":[25,49,69,82,120,146],"Nash":[26,70],"equilibria":[27,71],"those":[29],"games":[30,63,74,107],"played":[32],"by":[33,75],"pairs":[34,102,136],"agents":[36,46,115,139],"with":[37],"stationary":[38,88,114],"policies":[39,57],"predict":[41],"turn-taking":[42,59,149,165,178,183],"behaviour":[43,60],"in":[44,61,150],"Q-learning":[45,138],"based":[47],"on":[48,155,181],"agents\u2019":[50,83],"reward":[51,99,133],"function.":[52],"identify":[54],"fixed":[56],"exhibit":[58],"medium-access":[62,106,151],"show":[65],"compute":[68],"such":[73],"using":[76],"Markov":[77],"chain":[78],"methods":[79],"calculate":[81],"expected":[84],"rewards":[85,195],"different":[87],"policies.":[89],"present":[91],"simulation":[92],"results":[93,171],"an":[95],"extensive":[96],"range":[97],"functions":[100,134],"Q-learners":[104],"playing":[105],"our":[111,129,170,182,191],"analysis":[112],"develop":[117],"predictors":[118,130],"emergence":[121,147],"turn-taking.":[123,200],"explain":[125],"design":[132],"that":[140,161],"are":[141],"conducive":[142],"(or":[143],"prohibitive)":[144],"games.":[152],"focus":[154],"designing":[156],"multi-agent":[157],"reinforcement":[158],"learning":[159],"systems":[160],"deliberately":[162],"produce":[163],"coordinated":[164],"but":[166],"also":[168],"intend":[169],"be":[173],"useful":[174],"analysing":[176],"emergent":[177],"behaviour.":[179],"Based":[180],"related":[184],"results,":[185],"suggest":[187],"ways":[188],"methodology":[192],"designs":[194],"quantifiable":[197],"behaviours":[198],"besides":[199]},"counts_by_year":[{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
