{"id":"https://openalex.org/W1996232327","doi":"https://doi.org/10.1109/allerton.2012.6483342","title":"Mean field equilibria of multi armed bandit games","display_name":"Mean field equilibria of multi armed bandit games","publication_year":2012,"publication_date":"2012-10-01","ids":{"openalex":"https://openalex.org/W1996232327","doi":"https://doi.org/10.1109/allerton.2012.6483342","mag":"1996232327"},"language":"en","primary_location":{"id":"doi:10.1109/allerton.2012.6483342","is_oa":false,"landing_page_url":"https://doi.org/10.1109/allerton.2012.6483342","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2012 50th Annual Allerton Conference on Communication, Control, and Computing (Allerton)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5109106688","display_name":"Ramki Gummadi","orcid":null},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Ramki Gummadi","raw_affiliation_strings":["Management Science and Engineering, Stanford University, USA","Management Science and Engineering, Stanford University"],"affiliations":[{"raw_affiliation_string":"Management Science and Engineering, Stanford University, USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Management Science and Engineering, Stanford University","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042177635","display_name":"Ramesh Johari","orcid":"https://orcid.org/0000-0002-3960-0770"},"institutions":[{"id":"https://openalex.org/I97018004","display_name":"Stanford University","ror":"https://ror.org/00f54p054","country_code":"US","type":"education","lineage":["https://openalex.org/I97018004"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Ramesh Johari","raw_affiliation_strings":["Management Science and Engineering, Stanford University, USA","Management Science and Engineering, Stanford University"],"affiliations":[{"raw_affiliation_string":"Management Science and Engineering, Stanford University, USA","institution_ids":["https://openalex.org/I97018004"]},{"raw_affiliation_string":"Management Science and Engineering, Stanford University","institution_ids":["https://openalex.org/I97018004"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101868923","display_name":"Jia Yuan Yu","orcid":"https://orcid.org/0000-0002-6674-6150"},"institutions":[{"id":"https://openalex.org/I4210145784","display_name":"IBM Research - Ireland","ror":"https://ror.org/04jnxr720","country_code":"IE","type":"facility","lineage":["https://openalex.org/I1341412227","https://openalex.org/I4210114115","https://openalex.org/I4210145784"]}],"countries":["IE"],"is_corresponding":false,"raw_author_name":"Jia Yuan Yu","raw_affiliation_strings":["IBM Research, Dublin, Ireland"],"affiliations":[{"raw_affiliation_string":"IBM Research, Dublin, Ireland","institution_ids":["https://openalex.org/I4210145784"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5109106688"],"corresponding_institution_ids":["https://openalex.org/I97018004"],"apc_list":null,"apc_paid":null,"fwci":0.3999,"has_fulltext":false,"cited_by_count":10,"citation_normalized_percentile":{"value":0.6573913,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1110","last_page":"1110"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T12101","display_name":"Advanced Bandit Algorithms Research","score":0.9907000064849854,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10646","display_name":"Experimental Behavioral Economics Studies","score":0.9746000170707703,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11031","display_name":"Game Theory and Applications","score":0.9581999778747559,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/regret","display_name":"Regret","score":0.7965384721755981},{"id":"https://openalex.org/keywords/uniqueness","display_name":"Uniqueness","score":0.6463867425918579},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5691537857055664},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.5443018674850464},{"id":"https://openalex.org/keywords/mathematical-economics","display_name":"Mathematical economics","score":0.527388334274292},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.4838196635246277},{"id":"https://openalex.org/keywords/fictitious-play","display_name":"Fictitious play","score":0.4795669913291931},{"id":"https://openalex.org/keywords/population","display_name":"Population","score":0.47073376178741455},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.44748836755752563},{"id":"https://openalex.org/keywords/multi-armed-bandit","display_name":"Multi-armed bandit","score":0.43279391527175903},{"id":"https://openalex.org/keywords/nash-equilibrium","display_name":"Nash equilibrium","score":0.382531076669693},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.2871513366699219},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.1866147518157959},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.16262054443359375},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.06894999742507935}],"concepts":[{"id":"https://openalex.org/C50817715","wikidata":"https://www.wikidata.org/wiki/Q79895177","display_name":"Regret","level":2,"score":0.7965384721755981},{"id":"https://openalex.org/C2777021972","wikidata":"https://www.wikidata.org/wiki/Q22976830","display_name":"Uniqueness","level":2,"score":0.6463867425918579},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5691537857055664},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5443018674850464},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.527388334274292},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.4838196635246277},{"id":"https://openalex.org/C145071142","wikidata":"https://www.wikidata.org/wiki/Q1411116","display_name":"Fictitious play","level":3,"score":0.4795669913291931},{"id":"https://openalex.org/C2908647359","wikidata":"https://www.wikidata.org/wiki/Q2625603","display_name":"Population","level":2,"score":0.47073376178741455},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.44748836755752563},{"id":"https://openalex.org/C123197309","wikidata":"https://www.wikidata.org/wiki/Q2882343","display_name":"Multi-armed bandit","level":3,"score":0.43279391527175903},{"id":"https://openalex.org/C46814582","wikidata":"https://www.wikidata.org/wiki/Q23389","display_name":"Nash equilibrium","level":2,"score":0.382531076669693},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.2871513366699219},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.1866147518157959},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.16262054443359375},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.06894999742507935},{"id":"https://openalex.org/C50522688","wikidata":"https://www.wikidata.org/wiki/Q189833","display_name":"Economic growth","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C149923435","wikidata":"https://www.wikidata.org/wiki/Q37732","display_name":"Demography","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/allerton.2012.6483342","is_oa":false,"landing_page_url":"https://doi.org/10.1109/allerton.2012.6483342","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2012 50th Annual Allerton Conference on Communication, Control, and Computing (Allerton)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.6000000238418579,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4289341771","https://openalex.org/W4214835929","https://openalex.org/W2958076322","https://openalex.org/W4226086326","https://openalex.org/W3191284239","https://openalex.org/W2996787464","https://openalex.org/W2964268945","https://openalex.org/W3119014777","https://openalex.org/W3174419385","https://openalex.org/W3172572974"],"abstract_inverted_index":{"Much":[0],"of":[1,61,88,95,114,155,190,291,317,328,338,362,372,379,388,413,429,460],"the":[2,27,41,50,59,68,112,117,121,129,141,145,161,182,200,244,249,267,271,281,289,292,296,318,339,345,370,377,380,386,389,402,405,414,430,436,451,458,470,475],"classical":[3,183],"work":[4],"on":[5,11,35,243,450],"algorithms":[6],"for":[7,157,173,181,192,208,211,230,324],"multi-armed":[8],"bandits":[9],"focuses":[10],"rewards":[12,28,246],"that":[13,75,135,167,196,225,247,254,269,280,288,307,358,368,420,435,457],"are":[14,150,332],"stationary":[15,126,137],"over":[16,127],"time.":[17],"By":[18,396],"contrast,":[19],"we":[20,66,76,163,165,198,222,353,366,399],"study":[21,92],"multiarmed":[22,79],"bandit":[23,80],"(MAB)":[24,81],"games,":[25,90],"where":[26,404],"obtained":[29],"by":[30,98,144],"an":[31,110,231,355],"agent":[32,282,382],"also":[33],"depend":[34],"how":[36],"many":[37],"other":[38],"agents":[39,45,115,168,202,214,373,437],"choose":[40],"same":[42,346],"arm.":[43,476],"When":[44],"interact":[46],"in":[47,308,322],"this":[48,136,175,193,204,264,310],"way,":[49],"overall":[51],"system":[52,101,383],"can":[53,223],"no":[54],"longer":[55],"be":[56,177],"analyzed":[57],"through":[58],"eyes":[60],"a":[62,72,78,85,93,99,132,170,178,216,240,325,411,439,442,454],"single":[63],"agent;":[64],"rather,":[65],"view":[67],"agents'":[69,260],"interactions":[70],"as":[71,104,151,220,410],"dynamic":[73],"game,":[74],"call":[77],"game.":[82,233],"We":[83,187,238,302,418],"introduce":[84],"general":[86],"model":[87,162],"MAB":[89,158,185,209,232],"and":[91,236,253,287],"notion":[94],"equilibrium":[96,130],"inspired":[97],"large":[100],"approximation":[102,356],"known":[103],"mean":[105,390],"field":[106,391],"equilibrium.":[107],"In":[108,160,364],"such":[109],"equilibrium,":[111],"proportion":[113],"playing":[116],"various":[118],"arms,":[119],"called":[120],"population":[122,272,283,297,415],"profile,":[123],"is":[124,227,251,284,299,424],"assumed":[125],"time;":[128],"requires":[131,279],"consistency":[133],"check":[134],"profile":[138,273,298,416],"arises":[139],"from":[140,256],"policies":[142],"chosen":[143],"agents.":[146],"Our":[147],"main":[148],"results":[149],"follows.":[152],"(1)":[153],"Existence":[154],"MFE":[156,191,250,265],"games.":[159],"consider,":[164],"assume":[166],"play":[169],"fixed":[171],"policy;":[172],"example,":[174,212],"may":[176],"regret-optimal":[179],"policy":[180,201,218,440,452],"(stationary)":[184],"setting.":[186],"establish":[188,351,367,419],"existence":[189],"model.":[194,392],"Note":[195],"though":[197],"fix":[199],"use,":[203],"approach":[205],"seems":[206,312],"sensible":[207],"games;":[210],"if":[213,369],"use":[215,361],"regret-minimizing":[217],"(such":[219],"UCB),":[221],"show":[224,354],"it":[226],"approximately":[228],"optimal":[229],"(2)":[234],"Uniqueness":[235],"convergence.":[237],"identify":[239],"contraction":[241,277,340,347],"condition":[242,278,348,449],"arm":[245,446,464],"ensures":[248],"unique,":[252],"starting":[255],"any":[257,462],"initial":[258],"state,":[259],"will":[261],"converge":[262,335,384],"to":[263,295,313,334,350,385,401,426,445],"(in":[266],"sense":[268],"eventually":[270],"becomes":[274],"constant).":[275],"The":[276],"sufficiently":[285],"mixing":[286],"sensitivity":[290,444],"reward":[293,406,471],"function":[294,407,412],"low":[300],"enough.":[301],"demonstrate":[303],"via":[304],"numerical":[305],"experiments":[306],"fact":[309],"result":[311,357],"hold":[314],"well":[315],"outside":[316],"regime":[319],"studied":[320],"analytically:":[321],"fact,":[323],"wide":[326],"range":[327],"parameter":[329],"choices,":[330],"dynamics":[331,378,387],"observed":[333],"despite":[336],"violation":[337],"condition.":[341],"(3)":[342],"Approximation.":[343],"Under":[344],"used":[349],"uniqueness,":[352],"justifies":[359],"our":[360],"MFE.":[363],"particular,":[365],"number":[371],"grows":[374],"large,":[375],"then":[376],"finite":[381],"(4)":[393],"Congestion":[394],"externalities.":[395],"congestion":[397,422],"externalities,":[398],"refer":[400],"case":[403],"strictly":[408,467],"decreases":[409],"component.":[417],"having":[421],"externalities":[423],"sufficient":[425],"guarantee":[427],"uniqueness":[428],"Mean":[431],"Field":[432],"Equilibrium,":[433],"provided":[434],"adopt":[438],"satisfies":[441],"positive":[443],"rewards.":[447],"This":[448],"formalizes":[453],"natural":[455],"expectation":[456],"probability":[459,472],"choosing":[461],"given":[463],"should":[465],"increase":[466],"monotone":[468],"with":[469,474],"associated":[473]},"counts_by_year":[{"year":2021,"cited_by_count":3},{"year":2019,"cited_by_count":1},{"year":2018,"cited_by_count":1},{"year":2017,"cited_by_count":3},{"year":2016,"cited_by_count":1},{"year":2013,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
