{"id":"https://openalex.org/W7160866698","doi":"https://doi.org/10.48550/arxiv.2605.07240","title":"Rethinking Priority Scheduling for Sequential Multi-Agent Decision Making in Stackelberg Games","display_name":"Rethinking Priority Scheduling for Sequential Multi-Agent Decision Making in Stackelberg Games","publication_year":2026,"publication_date":"2026-05-08","ids":{"openalex":"https://openalex.org/W7160866698","doi":"https://doi.org/10.48550/arxiv.2605.07240"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.07240","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.07240","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.07240","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135865804","display_name":"Xiangyu Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xiangyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135831331","display_name":"Liang Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Liang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135880859","display_name":"Bo Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Bo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135878497","display_name":"Ziqi Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Ziqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.8228999972343445,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.8228999972343445,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13553","display_name":"Age of Information Optimization","score":0.06669999659061432,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.012199999764561653,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/stackelberg-competition","display_name":"Stackelberg competition","score":0.8704000115394592},{"id":"https://openalex.org/keywords/markov-decision-process","display_name":"Markov decision process","score":0.598800003528595},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.47450000047683716},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.4368000030517578},{"id":"https://openalex.org/keywords/repeated-game","display_name":"Repeated game","score":0.42750000953674316},{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.4260999858379364},{"id":"https://openalex.org/keywords/markov-chain","display_name":"Markov chain","score":0.41269999742507935},{"id":"https://openalex.org/keywords/stochastic-game","display_name":"Stochastic game","score":0.4018000066280365},{"id":"https://openalex.org/keywords/coordination-game","display_name":"Coordination game","score":0.40139999985694885},{"id":"https://openalex.org/keywords/upper-and-lower-bounds","display_name":"Upper and lower bounds","score":0.3889000117778778}],"concepts":[{"id":"https://openalex.org/C199510392","wikidata":"https://www.wikidata.org/wiki/Q1184602","display_name":"Stackelberg competition","level":2,"score":0.8704000115394592},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6735000014305115},{"id":"https://openalex.org/C106189395","wikidata":"https://www.wikidata.org/wiki/Q176789","display_name":"Markov decision process","level":3,"score":0.598800003528595},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.5976999998092651},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.47450000047683716},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.4368000030517578},{"id":"https://openalex.org/C202556891","wikidata":"https://www.wikidata.org/wiki/Q1584646","display_name":"Repeated game","level":3,"score":0.42750000953674316},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.4260999858379364},{"id":"https://openalex.org/C98763669","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov chain","level":2,"score":0.41269999742507935},{"id":"https://openalex.org/C22171661","wikidata":"https://www.wikidata.org/wiki/Q1074380","display_name":"Stochastic game","level":2,"score":0.4018000066280365},{"id":"https://openalex.org/C107257861","wikidata":"https://www.wikidata.org/wiki/Q656316","display_name":"Coordination game","level":2,"score":0.40139999985694885},{"id":"https://openalex.org/C77553402","wikidata":"https://www.wikidata.org/wiki/Q13222579","display_name":"Upper and lower bounds","level":2,"score":0.3889000117778778},{"id":"https://openalex.org/C177142836","wikidata":"https://www.wikidata.org/wiki/Q44455","display_name":"Game theory","level":2,"score":0.38119998574256897},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.35370001196861267},{"id":"https://openalex.org/C150325174","wikidata":"https://www.wikidata.org/wiki/Q4335500","display_name":"Optimal decision","level":3,"score":0.34940001368522644},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.3449000120162964},{"id":"https://openalex.org/C17098449","wikidata":"https://www.wikidata.org/wiki/Q176814","display_name":"Partially observable Markov decision process","level":4,"score":0.3425000011920929},{"id":"https://openalex.org/C2984634286","wikidata":"https://www.wikidata.org/wiki/Q1331926","display_name":"Decision process","level":2,"score":0.3375000059604645},{"id":"https://openalex.org/C115988155","wikidata":"https://www.wikidata.org/wiki/Q3262192","display_name":"Decision problem","level":2,"score":0.33320000767707825},{"id":"https://openalex.org/C47175762","wikidata":"https://www.wikidata.org/wiki/Q13422573","display_name":"Non-cooperative game","level":3,"score":0.32350000739097595},{"id":"https://openalex.org/C46814582","wikidata":"https://www.wikidata.org/wiki/Q23389","display_name":"Nash equilibrium","level":2,"score":0.31310001015663147},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.31189998984336853},{"id":"https://openalex.org/C28901747","wikidata":"https://www.wikidata.org/wiki/Q177571","display_name":"Decision theory","level":2,"score":0.2969000041484833},{"id":"https://openalex.org/C32407928","wikidata":"https://www.wikidata.org/wiki/Q2733833","display_name":"Best response","level":3,"score":0.2953999936580658},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2946000099182129},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.28439998626708984},{"id":"https://openalex.org/C94766913","wikidata":"https://www.wikidata.org/wiki/Q1530271","display_name":"Equilibrium point","level":3,"score":0.2840000092983246},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2831000089645386},{"id":"https://openalex.org/C155930848","wikidata":"https://www.wikidata.org/wiki/Q1069099","display_name":"Normal-form game","level":4,"score":0.2728999853134155},{"id":"https://openalex.org/C55416958","wikidata":"https://www.wikidata.org/wiki/Q6206757","display_name":"Job shop scheduling","level":3,"score":0.26919999718666077},{"id":"https://openalex.org/C95940807","wikidata":"https://www.wikidata.org/wiki/Q12237274","display_name":"Simultaneous game","level":4,"score":0.26030001044273376},{"id":"https://openalex.org/C50318809","wikidata":"https://www.wikidata.org/wiki/Q2145081","display_name":"Replicator equation","level":3,"score":0.25760000944137573}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.07240","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.07240","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.07240","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.07240","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16","score":0.8067240118980408}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Current":[0],"research":[1],"applying":[2],"N-level":[3,47,197],"Stackelberg":[4,48,198],"Game":[5,131],"to":[6,61,134,181],"multi-agent":[7,170],"systems":[8],"often":[9],"uses":[10],"the":[11,19,24,27,33,38,46,52,68,84,94,99,107,115,120,127,135,156,160,187,192],"default":[12],"decision":[13,96,109,194],"order":[14,28,53,110,195],"of":[15,29,37,111,159,190],"agents":[16,30,56,112,123],"provided":[17],"by":[18],"environment.":[20],"However,":[21],"this":[22,80],"raises":[23],"question:":[25],"does":[26],"necessarily":[31],"affect":[32],"final":[34],"equilibrium":[35,69],"point":[36,70],"game?":[39],"To":[40,138],"address":[41],"this,":[42],"we":[43,82,144],"formally":[44],"analyze":[45],"Game,":[49],"where":[50],"changing":[51,182],"in":[54,126,196],"which":[55,90],"make":[57],"decisions":[58],"typically":[59],"leads":[60],"an":[62,102],"overdetermined":[63],"system.":[64],"As":[65],"a":[66,146],"result,":[67],"shifts":[71],"unless":[72],"special":[73],"structural":[74],"conditions":[75],"are":[76],"satisfied.":[77],"Based":[78],"on":[79,114,165],"analysis,":[81],"propose":[83],"Hierarchical":[85],"Priority":[86],"Adjustment":[87],"(HPA)":[88],"method,":[89],"adjusts":[91],"and":[92,178],"selects":[93,106],"agents'":[95,193],"order.":[97,137],"At":[98,119],"upper":[100,103,161],"level,":[101,122],"policy":[104],"dynamically":[105],"optimal":[108],"based":[113],"current":[116],"game":[117],"state.":[118],"lower":[121],"execute":[124],"strategies":[125],"Spatio-Temporal":[128],"Sequential":[129],"Markov":[130],"(STMG)":[132],"according":[133],"selected":[136],"coordinate":[139],"learning":[140],"across":[141],"time":[142],"scales,":[143],"employ":[145],"slow-fast":[147],"update":[148],"scheme":[149],"with":[150],"shared":[151],"intrinsic":[152],"rewards":[153],"derived":[154],"from":[155],"advantage":[157],"function":[158],"policy.":[162],"Experimental":[163],"results":[164,185],"high-precision":[166],"control":[167],"tasks,":[168],"including":[169],"MuJoCo,":[171],"show":[172],"that":[173],"HPA":[174],"outperforms":[175],"benchmark":[176],"algorithms":[177],"robustly":[179],"adapts":[180],"environments.":[183],"These":[184],"highlight":[186],"crucial":[188],"role":[189],"optimizing":[191],"Game.":[199]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-12T00:00:00"}
