{"id":"https://openalex.org/W7160448228","doi":"https://doi.org/10.48550/arxiv.2605.03142","title":"MARS-DA: A Hierarchical Reinforcement Learning Framework for Risk-Aware Multi-Agent Bidding in Power Grids","display_name":"MARS-DA: A Hierarchical Reinforcement Learning Framework for Risk-Aware Multi-Agent Bidding in Power Grids","publication_year":2026,"publication_date":"2026-05-04","ids":{"openalex":"https://openalex.org/W7160448228","doi":"https://doi.org/10.48550/arxiv.2605.03142"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.03142","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.03142","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.03142","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135530695","display_name":"Jiayi Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Jiayi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135456010","display_name":"Xuan Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5100744283","display_name":"Guiling Wang","orcid":"https://orcid.org/0000-0003-1880-4763"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Guiling","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10424","display_name":"Electric Power System Optimization","score":0.6025999784469604,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10424","display_name":"Electric Power System Optimization","score":0.6025999784469604,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.27619999647140503,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11052","display_name":"Energy Load and Power Forecasting","score":0.03999999910593033,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/bidding","display_name":"Bidding","score":0.7639999985694885},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6931999921798706},{"id":"https://openalex.org/keywords/profit-maximization","display_name":"Profit maximization","score":0.6467999815940857},{"id":"https://openalex.org/keywords/testbed","display_name":"Testbed","score":0.5648999810218811},{"id":"https://openalex.org/keywords/electricity-market","display_name":"Electricity market","score":0.5275999903678894},{"id":"https://openalex.org/keywords/electricity","display_name":"Electricity","score":0.5015000104904175},{"id":"https://openalex.org/keywords/overfitting","display_name":"Overfitting","score":0.4648999869823456},{"id":"https://openalex.org/keywords/profit","display_name":"Profit (economics)","score":0.43849998712539673},{"id":"https://openalex.org/keywords/volatility","display_name":"Volatility (finance)","score":0.4156999886035919}],"concepts":[{"id":"https://openalex.org/C9233905","wikidata":"https://www.wikidata.org/wiki/Q3276328","display_name":"Bidding","level":2,"score":0.7639999985694885},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6931999921798706},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6575999855995178},{"id":"https://openalex.org/C2777780509","wikidata":"https://www.wikidata.org/wiki/Q1377422","display_name":"Profit maximization","level":3,"score":0.6467999815940857},{"id":"https://openalex.org/C31395832","wikidata":"https://www.wikidata.org/wiki/Q1318674","display_name":"Testbed","level":2,"score":0.5648999810218811},{"id":"https://openalex.org/C146733006","wikidata":"https://www.wikidata.org/wiki/Q676081","display_name":"Electricity market","level":3,"score":0.5275999903678894},{"id":"https://openalex.org/C206658404","wikidata":"https://www.wikidata.org/wiki/Q12725","display_name":"Electricity","level":2,"score":0.5015000104904175},{"id":"https://openalex.org/C22019652","wikidata":"https://www.wikidata.org/wiki/Q331309","display_name":"Overfitting","level":3,"score":0.4648999869823456},{"id":"https://openalex.org/C181622380","wikidata":"https://www.wikidata.org/wiki/Q26911","display_name":"Profit (economics)","level":2,"score":0.43849998712539673},{"id":"https://openalex.org/C91602232","wikidata":"https://www.wikidata.org/wiki/Q756115","display_name":"Volatility (finance)","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.40549999475479126},{"id":"https://openalex.org/C2776330181","wikidata":"https://www.wikidata.org/wiki/Q18358244","display_name":"Maximization","level":2,"score":0.3878999948501587},{"id":"https://openalex.org/C160623529","wikidata":"https://www.wikidata.org/wiki/Q273088","display_name":"Arbitrage","level":2,"score":0.38670000433921814},{"id":"https://openalex.org/C137631369","wikidata":"https://www.wikidata.org/wiki/Q7617831","display_name":"Stochastic programming","level":2,"score":0.35830000042915344},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.35339999198913574},{"id":"https://openalex.org/C177606310","wikidata":"https://www.wikidata.org/wiki/Q5674297","display_name":"Adaptability","level":2,"score":0.3294000029563904},{"id":"https://openalex.org/C32896092","wikidata":"https://www.wikidata.org/wiki/Q189447","display_name":"Risk management","level":2,"score":0.3237000107765198},{"id":"https://openalex.org/C188573790","wikidata":"https://www.wikidata.org/wiki/Q12705","display_name":"Renewable energy","level":2,"score":0.3154999911785126},{"id":"https://openalex.org/C7668479","wikidata":"https://www.wikidata.org/wiki/Q7882446","display_name":"Unbundling","level":2,"score":0.3118000030517578},{"id":"https://openalex.org/C2989491980","wikidata":"https://www.wikidata.org/wiki/Q676081","display_name":"Power market","level":4,"score":0.29739999771118164},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.29490000009536743},{"id":"https://openalex.org/C14981831","wikidata":"https://www.wikidata.org/wiki/Q1713661","display_name":"Market clearing","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C2779438525","wikidata":"https://www.wikidata.org/wiki/Q5255048","display_name":"Demand response","level":3,"score":0.27970001101493835},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.27390000224113464},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.2667999863624573},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.26080000400543213},{"id":"https://openalex.org/C5496284","wikidata":"https://www.wikidata.org/wiki/Q5420856","display_name":"Expected shortfall","level":3,"score":0.259799987077713},{"id":"https://openalex.org/C16520705","wikidata":"https://www.wikidata.org/wiki/Q601799","display_name":"Cournot competition","level":2,"score":0.2574999928474426},{"id":"https://openalex.org/C2985793214","wikidata":"https://www.wikidata.org/wiki/Q3274096","display_name":"Utility maximization","level":2,"score":0.2556000053882599},{"id":"https://openalex.org/C98965940","wikidata":"https://www.wikidata.org/wiki/Q877496","display_name":"Transaction cost","level":2,"score":0.25279998779296875},{"id":"https://openalex.org/C10558101","wikidata":"https://www.wikidata.org/wiki/Q689855","display_name":"Smart grid","level":2,"score":0.2524000108242035}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.03142","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.03142","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.03142","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.03142","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy","score":0.691230297088623}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"The":[0],"increasing":[1],"penetration":[2],"of":[3,144,188],"renewable":[4],"energy":[5],"has":[6],"introduced":[7],"substantial":[8],"volatility":[9],"into":[10],"wholesale":[11],"electricity":[12,78],"markets,":[13],"complicating":[14],"the":[15,47,87,90,94,142],"optimal":[16],"bidding":[17],"strategies":[18],"for":[19,46,76,106,117,128,154],"power":[20],"producers.":[21],"Traditional":[22],"Reinforcement":[23],"Learning":[24],"(RL)":[25],"approaches":[26],"often":[27],"struggle":[28],"to":[29,38,44,139,178],"balance":[30],"profit":[31,132],"maximization":[32],"with":[33],"risk":[34,129],"management,":[35],"frequently":[36],"overfitting":[37],"specific":[39],"market":[40,79,190],"conditions":[41],"or":[42],"failing":[43],"account":[45],"stochastic":[48],"spread":[49],"between":[50,96],"Day-Ahead":[51,118],"(DA)":[52],"and":[53,70,99,108,131,158],"Real-Time":[54],"(RT)":[55],"settlements.":[56],"To":[57],"address":[58],"these":[59],"challenges,":[60],"this":[61],"paper":[62],"makes":[63],"two":[64,145],"primary":[65],"contributions.":[66],"First,":[67],"we":[68,112],"introduce":[69],"open-source":[71],"a":[72,103,120,136,149,159],"high-fidelity":[73],"gymnasium":[74],"environment":[75,91],"two-settlement":[77],"bidding.":[80],"Grounded":[81],"in":[82],"extensive":[83],"empirical":[84],"data":[85],"from":[86],"PJM":[88],"Interconnection,":[89],"explicitly":[92],"models":[93],"interplay":[95],"DA":[97,156],"commitments":[98],"RT":[100,165],"deviations,":[101],"providing":[102],"standardized":[104],"testbed":[105],"general":[107],"risk-sensitive":[109],"agents.":[110],"Second,":[111],"propose":[113],"MARS-DA":[114,134,172],"(Multi-Agent":[115],"Regime-Switching":[116],"markets),":[119],"novel":[121],"hierarchical":[122],"framework":[123],"that":[124,152,162,171],"orchestrates":[125],"distinct":[126],"sub-policies":[127],"management":[130],"seeking.":[133],"utilizes":[135],"top-level":[137],"Meta-Controller":[138],"dynamically":[140],"blend":[141],"actions":[143],"specialized":[146],"base":[147],"agents:":[148],"\"Safe":[150],"Agent\"":[151,161],"optimizes":[153],"reliable":[155],"allocation":[157],"\"Speculator":[160],"targets":[163],"volatile":[164],"arbitrage":[166],"opportunities.":[167],"Extensive":[168],"experiments":[169],"demonstrate":[170],"achieves":[173],"superior":[174],"risk-adjusted":[175],"returns":[176],"compared":[177],"state-of-the-art":[179],"baselines":[180],"while":[181],"maintaining":[182],"robust":[183],"regime":[184],"alignment":[185],"during":[186],"periods":[187],"extreme":[189],"volatility.":[191]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-07T00:00:00"}
