{"id":"https://openalex.org/W2808261958","doi":"https://doi.org/10.24963/ijcai.2018/79","title":"Recurrent Deep Multiagent Q-Learning for Autonomous Brokers in Smart Grid","display_name":"Recurrent Deep Multiagent Q-Learning for Autonomous Brokers in Smart Grid","publication_year":2018,"publication_date":"2018-07-01","ids":{"openalex":"https://openalex.org/W2808261958","doi":"https://doi.org/10.24963/ijcai.2018/79","mag":"2808261958"},"language":"en","primary_location":{"id":"doi:10.24963/ijcai.2018/79","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2018/79","pdf_url":"https://www.ijcai.org/proceedings/2018/0079.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-Seventh International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.ijcai.org/proceedings/2018/0079.pdf","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5090073634","display_name":"Yaodong Yang","orcid":"https://orcid.org/0000-0001-8132-5613"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yaodong Yang","raw_affiliation_strings":["School of Computer Software, Tianjin University"],"affiliations":[{"raw_affiliation_string":"School of Computer Software, Tianjin University","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047509839","display_name":"Jianye Hao","orcid":"https://orcid.org/0000-0002-0422-8235"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jianye Hao","raw_affiliation_strings":["School of Computer Software, Tianjin University"],"affiliations":[{"raw_affiliation_string":"School of Computer Software, Tianjin University","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5079378336","display_name":"Mingyang Sun","orcid":"https://orcid.org/0000-0002-5790-5025"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Mingyang Sun","raw_affiliation_strings":["Imperial College London"],"affiliations":[{"raw_affiliation_string":"Imperial College London","institution_ids":["https://openalex.org/I47508984"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100707447","display_name":"Zan Wang","orcid":"https://orcid.org/0000-0001-6173-8170"},"institutions":[{"id":"https://openalex.org/I162868743","display_name":"Tianjin University","ror":"https://ror.org/012tb2g32","country_code":"CN","type":"education","lineage":["https://openalex.org/I162868743"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zan Wang","raw_affiliation_strings":["School of Computer Software, Tianjin University"],"affiliations":[{"raw_affiliation_string":"School of Computer Software, Tianjin University","institution_ids":["https://openalex.org/I162868743"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022008180","display_name":"Changjie Fan","orcid":"https://orcid.org/0000-0001-5420-0516"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Changjie Fan","raw_affiliation_strings":["NetEase, Inc"],"affiliations":[{"raw_affiliation_string":"NetEase, Inc","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5014643856","display_name":"Goran \u0160trbac","orcid":"https://orcid.org/0000-0001-7421-3947"},"institutions":[{"id":"https://openalex.org/I47508984","display_name":"Imperial College London","ror":"https://ror.org/041kmwe10","country_code":"GB","type":"education","lineage":["https://openalex.org/I47508984"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Goran Strbac","raw_affiliation_strings":["Imperial College London"],"affiliations":[{"raw_affiliation_string":"Imperial College London","institution_ids":["https://openalex.org/I47508984"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5090073634"],"corresponding_institution_ids":["https://openalex.org/I162868743"],"apc_list":null,"apc_paid":null,"fwci":2.8787,"has_fulltext":false,"cited_by_count":34,"citation_normalized_percentile":{"value":0.91399955,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"569","last_page":"575"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":1.0,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10917","display_name":"Smart Grid Security and Resilience","score":0.9966999888420105,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11052","display_name":"Energy Load and Power Forecasting","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7318751215934753},{"id":"https://openalex.org/keywords/smart-grid","display_name":"Smart grid","score":0.702947199344635},{"id":"https://openalex.org/keywords/profit","display_name":"Profit (economics)","score":0.6253628134727478},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6227641105651855},{"id":"https://openalex.org/keywords/grid","display_name":"Grid","score":0.5560106635093689},{"id":"https://openalex.org/keywords/cluster-analysis","display_name":"Cluster analysis","score":0.4989607334136963},{"id":"https://openalex.org/keywords/electricity","display_name":"Electricity","score":0.4954327344894409},{"id":"https://openalex.org/keywords/order","display_name":"Order (exchange)","score":0.46576666831970215},{"id":"https://openalex.org/keywords/multi-agent-system","display_name":"Multi-agent system","score":0.4578060805797577},{"id":"https://openalex.org/keywords/dynamic-pricing","display_name":"Dynamic pricing","score":0.4352337718009949},{"id":"https://openalex.org/keywords/demand-response","display_name":"Demand response","score":0.43182051181793213},{"id":"https://openalex.org/keywords/industrial-organization","display_name":"Industrial organization","score":0.3812702000141144},{"id":"https://openalex.org/keywords/operations-research","display_name":"Operations research","score":0.3552815020084381},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.31605273485183716},{"id":"https://openalex.org/keywords/business","display_name":"Business","score":0.3014451861381531},{"id":"https://openalex.org/keywords/microeconomics","display_name":"Microeconomics","score":0.25085991621017456},{"id":"https://openalex.org/keywords/marketing","display_name":"Marketing","score":0.20747819542884827},{"id":"https://openalex.org/keywords/economics","display_name":"Economics","score":0.1173953115940094},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08678212761878967}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7318751215934753},{"id":"https://openalex.org/C10558101","wikidata":"https://www.wikidata.org/wiki/Q689855","display_name":"Smart grid","level":2,"score":0.702947199344635},{"id":"https://openalex.org/C181622380","wikidata":"https://www.wikidata.org/wiki/Q26911","display_name":"Profit (economics)","level":2,"score":0.6253628134727478},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6227641105651855},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.5560106635093689},{"id":"https://openalex.org/C73555534","wikidata":"https://www.wikidata.org/wiki/Q622825","display_name":"Cluster analysis","level":2,"score":0.4989607334136963},{"id":"https://openalex.org/C206658404","wikidata":"https://www.wikidata.org/wiki/Q12725","display_name":"Electricity","level":2,"score":0.4954327344894409},{"id":"https://openalex.org/C182306322","wikidata":"https://www.wikidata.org/wiki/Q1779371","display_name":"Order (exchange)","level":2,"score":0.46576666831970215},{"id":"https://openalex.org/C41550386","wikidata":"https://www.wikidata.org/wiki/Q529909","display_name":"Multi-agent system","level":2,"score":0.4578060805797577},{"id":"https://openalex.org/C2779391423","wikidata":"https://www.wikidata.org/wiki/Q17009728","display_name":"Dynamic pricing","level":2,"score":0.4352337718009949},{"id":"https://openalex.org/C2779438525","wikidata":"https://www.wikidata.org/wiki/Q5255048","display_name":"Demand response","level":3,"score":0.43182051181793213},{"id":"https://openalex.org/C40700","wikidata":"https://www.wikidata.org/wiki/Q1411783","display_name":"Industrial organization","level":1,"score":0.3812702000141144},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.3552815020084381},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.31605273485183716},{"id":"https://openalex.org/C144133560","wikidata":"https://www.wikidata.org/wiki/Q4830453","display_name":"Business","level":0,"score":0.3014451861381531},{"id":"https://openalex.org/C175444787","wikidata":"https://www.wikidata.org/wiki/Q39072","display_name":"Microeconomics","level":1,"score":0.25085991621017456},{"id":"https://openalex.org/C162853370","wikidata":"https://www.wikidata.org/wiki/Q39809","display_name":"Marketing","level":1,"score":0.20747819542884827},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.1173953115940094},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08678212761878967},{"id":"https://openalex.org/C10138342","wikidata":"https://www.wikidata.org/wiki/Q43015","display_name":"Finance","level":1,"score":0.0},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.24963/ijcai.2018/79","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2018/79","pdf_url":"https://www.ijcai.org/proceedings/2018/0079.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-Seventh International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.24963/ijcai.2018/79","is_oa":true,"landing_page_url":"https://doi.org/10.24963/ijcai.2018/79","pdf_url":"https://www.ijcai.org/proceedings/2018/0079.pdf","source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the Twenty-Seventh International Joint Conference on Artificial Intelligence","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/7","score":0.5,"display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G1063510118","display_name":null,"funder_award_id":"6170236","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1121271761","display_name":null,"funder_award_id":"Program","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1231421488","display_name":null,"funder_award_id":"under","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G1428435317","display_name":null,"funder_award_id":"Grant No.:","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2087396116","display_name":null,"funder_award_id":"China","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G2702356746","display_name":null,"funder_award_id":"61702","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G3317480652","display_name":null,"funder_award_id":"Science","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5854786607","display_name":null,"funder_award_id":"Tianjin","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5939423041","display_name":null,"funder_award_id":"Technology","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5994120800","display_name":null,"funder_award_id":"Natural","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7726157001","display_name":null,"funder_award_id":"Grant No.","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320326190","display_name":"Tianjin Science and Technology Committee","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W2808261958.pdf","grobid_xml":"https://content.openalex.org/works/W2808261958.grobid-xml"},"referenced_works_count":24,"referenced_works":["https://openalex.org/W33597319","https://openalex.org/W46933459","https://openalex.org/W139860952","https://openalex.org/W1545757366","https://openalex.org/W1948566616","https://openalex.org/W1980358463","https://openalex.org/W2008668719","https://openalex.org/W2034059032","https://openalex.org/W2091921805","https://openalex.org/W2121863487","https://openalex.org/W2122763142","https://openalex.org/W2144823724","https://openalex.org/W2145339207","https://openalex.org/W2156049817","https://openalex.org/W2364298186","https://openalex.org/W2396385459","https://openalex.org/W2467523955","https://openalex.org/W2523841471","https://openalex.org/W2560037007","https://openalex.org/W2575705757","https://openalex.org/W2580995980","https://openalex.org/W2589616230","https://openalex.org/W2787564712","https://openalex.org/W2963440040"],"related_works":["https://openalex.org/W1589973774","https://openalex.org/W2353074559","https://openalex.org/W2171108821","https://openalex.org/W2023642087","https://openalex.org/W2074513827","https://openalex.org/W2402141875","https://openalex.org/W3125701662","https://openalex.org/W1498762745","https://openalex.org/W2946986200","https://openalex.org/W2057315382"],"abstract_inverted_index":{"The":[0,97],"broker":[1,28],"mechanism":[2],"is":[3,29],"widely":[4],"applied":[5],"to":[6,11,17,51,88],"serve":[7],"for":[8,64,93],"interested":[9],"parties":[10],"derive":[12],"long-term":[13],"policies":[14],"in":[15,23,66],"order":[16],"reduce":[18],"costs":[19],"or":[20],"gain":[21],"profits":[22],"smart":[24],"grid.":[25],"However,":[26],"a":[27,32],"faced":[30],"with":[31,47],"number":[33],"of":[34,103,112],"challenging":[35],"problems":[36],"such":[37],"as":[38],"balancing":[39],"demand":[40],"and":[41,45,78,108],"supply":[42],"from":[43],"customers":[44],"competing":[46],"other":[48],"coexisting":[49],"brokers":[50,65],"maximize":[52],"its":[53],"profit.":[54],"In":[55],"this":[56],"paper,":[57],"we":[58],"develop":[59],"an":[60],"effective":[61],"pricing":[62,106],"strategy":[63,107],"local":[67],"electricity":[68,85],"retail":[69,91],"market":[70,92],"based":[71],"on":[72],"recurrent":[73],"deep":[74],"multiagent":[75],"reinforcement":[76],"learning":[77],"sequential":[79],"clustering.":[80],"We":[81],"use":[82],"real":[83],"household":[84],"consumption":[86],"data":[87],"simulate":[89],"the":[90,100,104,110],"evaluating":[94],"our":[95,113],"strategy.":[96],"experiments":[98],"demonstrate":[99],"superior":[101],"performance":[102],"proposed":[105],"highlight":[109],"effectiveness":[111],"reward":[114],"shaping":[115],"mechanism.":[116]},"counts_by_year":[{"year":2025,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2022,"cited_by_count":9},{"year":2021,"cited_by_count":5},{"year":2020,"cited_by_count":5},{"year":2019,"cited_by_count":8},{"year":2018,"cited_by_count":4}],"updated_date":"2026-04-14T08:04:32.555800","created_date":"2025-10-10T00:00:00"}
