{"id":"https://openalex.org/W4415280676","doi":"https://doi.org/10.48550/arxiv.2510.08607","title":"GRPO-GCC: Enhancing Cooperation in Spatial Public Goods Games via Group Relative Policy Optimization with Global Cooperation Constraint","display_name":"GRPO-GCC: Enhancing Cooperation in Spatial Public Goods Games via Group Relative Policy Optimization with Global Cooperation Constraint","publication_year":2025,"publication_date":"2025-10-07","ids":{"openalex":"https://openalex.org/W4415280676","doi":"https://doi.org/10.48550/arxiv.2510.08607"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2510.08607","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.08607","pdf_url":"https://arxiv.org/pdf/2510.08607","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2510.08607","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052641051","display_name":"Zhaoqilin Yang","orcid":"https://orcid.org/0000-0002-3676-4761"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Yang, Zhaoqilin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5023878331","display_name":"Chanchan Li","orcid":"https://orcid.org/0000-0002-2395-0928"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Chanchan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100618135","display_name":"Tianqi Liu","orcid":"https://orcid.org/0000-0002-0224-045X"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Tianqi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101600551","display_name":"Hongxin Zhao","orcid":"https://orcid.org/0000-0001-6753-8698"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Hongxin","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5052363813","display_name":"Youliang Tian","orcid":"https://orcid.org/0000-0002-5974-1570"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tian, Youliang","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5052641051"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11031","display_name":"Game Theory and Applications","score":0.8977000117301941,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11031","display_name":"Game Theory and Applications","score":0.8977000117301941,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11182","display_name":"Auction Theory and Applications","score":0.8180000185966492,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12137","display_name":"Economic theories and models","score":0.7713000178337097,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/incentive","display_name":"Incentive","score":0.7746000289916992},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7171000242233276},{"id":"https://openalex.org/keywords/public-good","display_name":"Public good","score":0.6413999795913696},{"id":"https://openalex.org/keywords/constraint","display_name":"Constraint (computer-aided design)","score":0.6288999915122986},{"id":"https://openalex.org/keywords/public-goods-game","display_name":"Public goods game","score":0.5778999924659729},{"id":"https://openalex.org/keywords/baseline","display_name":"Baseline (sea)","score":0.5550000071525574},{"id":"https://openalex.org/keywords/work","display_name":"Work (physics)","score":0.39640000462532043},{"id":"https://openalex.org/keywords/simple","display_name":"Simple (philosophy)","score":0.37130001187324524}],"concepts":[{"id":"https://openalex.org/C29122968","wikidata":"https://www.wikidata.org/wiki/Q1414816","display_name":"Incentive","level":2,"score":0.7746000289916992},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7171000242233276},{"id":"https://openalex.org/C162222271","wikidata":"https://www.wikidata.org/wiki/Q92779871","display_name":"Public good","level":2,"score":0.6413999795913696},{"id":"https://openalex.org/C2776036281","wikidata":"https://www.wikidata.org/wiki/Q48769818","display_name":"Constraint (computer-aided design)","level":2,"score":0.6288999915122986},{"id":"https://openalex.org/C72273685","wikidata":"https://www.wikidata.org/wiki/Q1673101","display_name":"Public goods game","level":3,"score":0.5778999924659729},{"id":"https://openalex.org/C12725497","wikidata":"https://www.wikidata.org/wiki/Q810247","display_name":"Baseline (sea)","level":2,"score":0.5550000071525574},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.48579999804496765},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.47099998593330383},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.428600013256073},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.39640000462532043},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.37130001187324524},{"id":"https://openalex.org/C2781311116","wikidata":"https://www.wikidata.org/wiki/Q83306","display_name":"Group (periodic table)","level":2,"score":0.36800000071525574},{"id":"https://openalex.org/C206103860","wikidata":"https://www.wikidata.org/wiki/Q5570906","display_name":"Global strategy","level":2,"score":0.3278999924659729},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.3176000118255615},{"id":"https://openalex.org/C153517567","wikidata":"https://www.wikidata.org/wiki/Q26090","display_name":"Mechanism design","level":2,"score":0.31130000948905945},{"id":"https://openalex.org/C109986646","wikidata":"https://www.wikidata.org/wiki/Q546113","display_name":"Public policy","level":2,"score":0.30880001187324524},{"id":"https://openalex.org/C136197465","wikidata":"https://www.wikidata.org/wiki/Q1729295","display_name":"Variety (cybernetics)","level":2,"score":0.29980000853538513},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.29339998960494995},{"id":"https://openalex.org/C123650614","wikidata":"https://www.wikidata.org/wiki/Q282491","display_name":"Strategic dominance","level":2,"score":0.2849000096321106},{"id":"https://openalex.org/C61797465","wikidata":"https://www.wikidata.org/wiki/Q1188986","display_name":"Term (time)","level":2,"score":0.2840000092983246},{"id":"https://openalex.org/C20701700","wikidata":"https://www.wikidata.org/wiki/Q388791","display_name":"Group decision-making","level":2,"score":0.2766000032424927}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2510.08607","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.08607","pdf_url":"https://arxiv.org/pdf/2510.08607","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2510.08607","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2510.08607","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2510.08607","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2510.08607","pdf_url":"https://arxiv.org/pdf/2510.08607","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Inspired":[0],"by":[1,95],"the":[2,12,26],"principle":[3],"of":[4],"self-regulating":[5],"cooperation":[6,55,62,120],"in":[7,151],"collective":[8,77],"institutions,":[9],"we":[10],"propose":[11],"Group":[13],"Relative":[14],"Policy":[15],"Optimization":[16],"with":[17,52,75],"Global":[18],"Cooperation":[19],"Constraint":[20],"(GRPO-GCC)":[21],"framework.":[22],"This":[23,69],"work":[24],"is":[25],"first":[27],"to":[28],"introduce":[29],"GRPO":[30],"into":[31,82],"spatial":[32],"public":[33],"goods":[34],"games,":[35],"establishing":[36],"a":[37,53,100,105,115,131,144],"new":[38,145],"deep":[39],"reinforcement":[40,149],"learning":[41,150],"baseline":[42],"for":[43,147],"structured":[44],"populations.":[45],"GRPO-GCC":[46,128],"integrates":[47],"group":[48],"relative":[49],"policy":[50,123],"optimization":[51],"global":[54,106,134],"constraint":[56],"that":[57,109],"strengthens":[58],"incentives":[59,138],"at":[60,67],"intermediate":[61],"levels":[63],"while":[64],"weakening":[65],"them":[66],"extremes.":[68],"mechanism":[70],"aligns":[71],"local":[72],"decision":[73],"making":[74],"sustainable":[76],"outcomes":[78],"and":[79,104,125,142],"prevents":[80],"collapse":[81],"either":[83],"universal":[84],"defection":[85],"or":[86],"unconditional":[87],"cooperation.":[88],"The":[89],"framework":[90],"advances":[91],"beyond":[92],"existing":[93],"approaches":[94],"combining":[96],"group-normalized":[97],"advantage":[98],"estimation,":[99],"reference-anchored":[101],"KL":[102],"penalty,":[103],"incentive":[107],"term":[108],"dynamically":[110],"adjusts":[111],"cooperative":[112],"payoffs.":[113],"As":[114],"result,":[116],"it":[117],"achieves":[118],"accelerated":[119],"onset,":[121],"stabilized":[122],"adaptation,":[124],"long-term":[126],"sustainability.":[127],"demonstrates":[129],"how":[130],"simple":[132],"yet":[133],"signal":[135],"can":[136],"reshape":[137],"toward":[139],"resilient":[140],"cooperation,":[141],"provides":[143],"paradigm":[146],"multi-agent":[148],"socio-technical":[152],"systems.":[153]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-17T00:00:00"}
