{"id":"https://openalex.org/W3192510920","doi":"https://doi.org/10.1109/tetci.2022.3166555","title":"Decision Making in Monopoly Using a Hybrid Deep Reinforcement Learning Approach","display_name":"Decision Making in Monopoly Using a Hybrid Deep Reinforcement Learning Approach","publication_year":2022,"publication_date":"2022-05-16","ids":{"openalex":"https://openalex.org/W3192510920","doi":"https://doi.org/10.1109/tetci.2022.3166555","mag":"3192510920"},"language":"en","primary_location":{"id":"doi:10.1109/tetci.2022.3166555","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tetci.2022.3166555","pdf_url":null,"source":{"id":"https://openalex.org/S4210210251","display_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","issn_l":"2471-285X","issn":["2471-285X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5049482803","display_name":"Trevor Bonjour","orcid":"https://orcid.org/0000-0001-5050-0220"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Trevor Bonjour","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5024270752","display_name":"Marina Haliem","orcid":"https://orcid.org/0000-0002-9782-6591"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Marina Haliem","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049998976","display_name":"Aala Oqab Alsalem","orcid":"https://orcid.org/0000-0003-1560-0116"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Aala Alsalem","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021059425","display_name":"Shilpa Thomas","orcid":"https://orcid.org/0000-0003-1498-8614"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Shilpa Thomas","raw_affiliation_strings":["University of Southern California, Los Angeles, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100402301","display_name":"Hongyu Li","orcid":"https://orcid.org/0000-0002-5951-1230"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Hongyu Li","raw_affiliation_strings":["University of Southern California, Los Angeles, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064822688","display_name":"Vaneet Aggarwal","orcid":"https://orcid.org/0000-0001-9131-4723"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Vaneet Aggarwal","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074197492","display_name":"Mayank Kejriwal","orcid":"https://orcid.org/0000-0001-5988-8305"},"institutions":[{"id":"https://openalex.org/I1174212","display_name":"University of Southern California","ror":"https://ror.org/03taz7m60","country_code":"US","type":"education","lineage":["https://openalex.org/I1174212"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mayank Kejriwal","raw_affiliation_strings":["University of Southern California, Los Angeles, CA, USA"],"affiliations":[{"raw_affiliation_string":"University of Southern California, Los Angeles, CA, USA","institution_ids":["https://openalex.org/I1174212"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5077320731","display_name":"Bharat Bhargava","orcid":"https://orcid.org/0000-0003-3803-8672"},"institutions":[{"id":"https://openalex.org/I219193219","display_name":"Purdue University West Lafayette","ror":"https://ror.org/02dqehb95","country_code":"US","type":"education","lineage":["https://openalex.org/I219193219"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Bharat Bhargava","raw_affiliation_strings":["Purdue University, West Lafayette, IN, USA"],"affiliations":[{"raw_affiliation_string":"Purdue University, West Lafayette, IN, USA","institution_ids":["https://openalex.org/I219193219"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":8,"corresponding_author_ids":["https://openalex.org/A5049482803"],"corresponding_institution_ids":["https://openalex.org/I219193219"],"apc_list":null,"apc_paid":null,"fwci":2.6199,"has_fulltext":false,"cited_by_count":21,"citation_normalized_percentile":{"value":0.90839712,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"6","issue":"6","first_page":"1335","last_page":"1344"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11674","display_name":"Sports Analytics and Performance","score":0.987500011920929,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.9868000149726868,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8658502101898193},{"id":"https://openalex.org/keywords/monopoly","display_name":"Monopoly","score":0.7807005047798157},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6407434344291687},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6096650958061218},{"id":"https://openalex.org/keywords/luck","display_name":"Luck","score":0.5462609529495239},{"id":"https://openalex.org/keywords/function","display_name":"Function (biology)","score":0.43803995847702026},{"id":"https://openalex.org/keywords/adversary","display_name":"Adversary","score":0.43034467101097107},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.34978365898132324},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.2803307771682739},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.27915483713150024},{"id":"https://openalex.org/keywords/computer-security","display_name":"Computer security","score":0.12867552042007446}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8658502101898193},{"id":"https://openalex.org/C2781127519","wikidata":"https://www.wikidata.org/wiki/Q43637","display_name":"Monopoly","level":2,"score":0.7807005047798157},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6407434344291687},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6096650958061218},{"id":"https://openalex.org/C61783943","wikidata":"https://www.wikidata.org/wiki/Q1970348","display_name":"Luck","level":2,"score":0.5462609529495239},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.43803995847702026},{"id":"https://openalex.org/C41065033","wikidata":"https://www.wikidata.org/wiki/Q2825412","display_name":"Adversary","level":2,"score":0.43034467101097107},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.34978365898132324},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.2803307771682739},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.27915483713150024},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.12867552042007446},{"id":"https://openalex.org/C78458016","wikidata":"https://www.wikidata.org/wiki/Q840400","display_name":"Evolutionary biology","level":1,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C27206212","wikidata":"https://www.wikidata.org/wiki/Q34178","display_name":"Theology","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tetci.2022.3166555","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tetci.2022.3166555","pdf_url":null,"source":{"id":"https://openalex.org/S4210210251","display_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","issn_l":"2471-285X","issn":["2471-285X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.8100000023841858,"id":"https://metadata.un.org/sdg/16"}],"awards":[{"id":"https://openalex.org/G5600146052","display_name":null,"funder_award_id":"W911NF2020003","funder_id":"https://openalex.org/F4320338294","funder_display_name":"Air Force Research Laboratory"}],"funders":[{"id":"https://openalex.org/F4320332180","display_name":"Defense Advanced Research Projects Agency","ror":"https://ror.org/02caytj08"},{"id":"https://openalex.org/F4320338294","display_name":"Air Force Research Laboratory","ror":"https://ror.org/02e2egq70"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":59,"referenced_works":["https://openalex.org/W41554520","https://openalex.org/W1646707810","https://openalex.org/W1658008008","https://openalex.org/W1771410628","https://openalex.org/W2115211925","https://openalex.org/W2116339921","https://openalex.org/W2119717200","https://openalex.org/W2121863487","https://openalex.org/W2139418546","https://openalex.org/W2141559645","https://openalex.org/W2145339207","https://openalex.org/W2155968351","https://openalex.org/W2173248099","https://openalex.org/W2173564293","https://openalex.org/W2201581102","https://openalex.org/W2257979135","https://openalex.org/W2324555000","https://openalex.org/W2574978968","https://openalex.org/W2736601468","https://openalex.org/W2746553466","https://openalex.org/W2761873684","https://openalex.org/W2787938642","https://openalex.org/W2789794870","https://openalex.org/W2951799221","https://openalex.org/W2960876848","https://openalex.org/W2963477884","https://openalex.org/W2963864421","https://openalex.org/W2963890729","https://openalex.org/W2963923407","https://openalex.org/W2964043796","https://openalex.org/W2964121744","https://openalex.org/W2964291307","https://openalex.org/W2970104882","https://openalex.org/W2970130737","https://openalex.org/W2972302081","https://openalex.org/W2977843878","https://openalex.org/W2979501303","https://openalex.org/W2981260474","https://openalex.org/W2982316857","https://openalex.org/W2996100761","https://openalex.org/W3037429136","https://openalex.org/W3089580269","https://openalex.org/W3097499542","https://openalex.org/W3100789280","https://openalex.org/W3118881636","https://openalex.org/W3122029173","https://openalex.org/W4256160650","https://openalex.org/W6636881020","https://openalex.org/W6638018090","https://openalex.org/W6677067356","https://openalex.org/W6677193802","https://openalex.org/W6684921986","https://openalex.org/W6685444567","https://openalex.org/W6687681856","https://openalex.org/W6692846177","https://openalex.org/W6741002519","https://openalex.org/W6748839928","https://openalex.org/W6767224800","https://openalex.org/W6767474370"],"related_works":["https://openalex.org/W2492583102","https://openalex.org/W1591252263","https://openalex.org/W2247420603","https://openalex.org/W2467763060","https://openalex.org/W2082016267","https://openalex.org/W2497388629","https://openalex.org/W2479431988","https://openalex.org/W2369927851","https://openalex.org/W4323306857","https://openalex.org/W3194405162"],"abstract_inverted_index":{"Learning":[0],"to":[1,28,110,188],"adapt":[2],"and":[3,11,46,61,70,177,183],"make":[4,29],"real-time":[5],"informed":[6],"decisions":[7,31],"in":[8,36,124,205],"a":[9,15,20,125,146,160,222],"dynamic":[10],"complex":[12,157],"environment":[13],"is":[14,19,106],"challenging":[16],"problem.":[17],"Monopoly":[18,37,69,91],"popular":[21],"strategic":[22],"board":[23],"game":[24],"that":[25,80,128,149,196],"requires":[26],"players":[27,98],"multiple":[30,101],"during":[32],"the":[33,59,65,112,131,134,139,185,206,219],"game.":[34],"Decision-making":[35],"involves":[38],"many":[39],"real-world":[40],"elements":[41],"such":[42],"as":[43],"strategizing,":[44],"luck,":[45],"modeling":[47],"of":[48,68,115,133,142,208,225],"opponent\u2019s":[49],"policies.":[50],"In":[51,96],"this":[52],"paper,":[53],"we":[54,78,144],"present":[55],"novel":[56],"representations":[57],"for":[58,64,90],"state":[60],"action":[62],"space":[63],"full":[66],"version":[67],"define":[71],"an":[72],"improved":[73],"reward":[74],"function.":[75],"Using":[76],"these,":[77],"show":[79,195],"our":[81,189,197],"deep":[82,151,179],"reinforcement":[83,152],"learning":[84,135,153,170],"agent":[85,217],"can":[86,99],"learn":[87],"winning":[88],"strategies":[89],"against":[92,211,227],"different":[93],"fixed-policy":[94,161,212,228],"agents.":[95,213,229],"Monopoly,":[97],"take":[100],"actions":[102,117],"even":[103],"if":[104],"it":[105],"not":[107],"their.":[108],"turn":[109],"roll":[111],"dice.":[113],"Some":[114],"these":[116],"occur":[118],"more":[119],"frequently":[120],"than":[121],"others,":[122],"resulting":[123],"skewed":[126],"distribution":[127,141],"adversely":[129],"affects":[130],"performance":[132],"agent.":[136],"To":[137],"tackle":[138],"non-uniform":[140],"actions,":[143],"propose":[145],"hybrid":[147,191,198,215],"approach":[148,162,187],"combines":[150],"(for":[154,163],"frequent":[155],"but":[156,165],"decisions)":[158],"with":[159,221],"infrequent":[164],"straightforward":[166],"decisions).":[167],"We":[168],"develop":[169],"agents":[171,199,202],"using":[172],"proximal":[173],"policy":[174],"optimization":[175],"(PPO)":[176],"double":[178],"Q-learning":[180],"(DDQN)":[181],"algorithms":[182],"compare":[184],"standard":[186,201],"proposed":[190],"approach.":[192],"Experimental":[193],"results":[194],"outperform":[200],"by":[203],"20%":[204],"number":[207],"games":[209],"won":[210],"The":[214],"PPO":[216],"performs":[218],"best":[220],"win":[223],"rate":[224],"91%":[226]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":9},{"year":2023,"cited_by_count":4},{"year":2021,"cited_by_count":1}],"updated_date":"2026-03-28T08:17:26.163206","created_date":"2025-10-10T00:00:00"}
