{"id":"https://openalex.org/W4399568695","doi":"https://doi.org/10.1109/tcyb.2024.3403680","title":"Policy Iteration <i>Q</i>-Learning for Linear It\u00f4 Stochastic Systems With Markovian Jumps and its Application to Power Systems","display_name":"Policy Iteration <i>Q</i>-Learning for Linear It\u00f4 Stochastic Systems With Markovian Jumps and its Application to Power Systems","publication_year":2024,"publication_date":"2024-06-12","ids":{"openalex":"https://openalex.org/W4399568695","doi":"https://doi.org/10.1109/tcyb.2024.3403680","pmid":"https://pubmed.ncbi.nlm.nih.gov/38865225"},"language":"en","primary_location":{"id":"doi:10.1109/tcyb.2024.3403680","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2024.3403680","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5010477724","display_name":"Zhongyang Ming","orcid":"https://orcid.org/0009-0001-1002-6840"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhongyang Ming","raw_affiliation_strings":["School of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100625792","display_name":"Huaguang Zhang","orcid":"https://orcid.org/0000-0002-2375-9824"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huaguang Zhang","raw_affiliation_strings":["School of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100613148","display_name":"Yingchun Wang","orcid":"https://orcid.org/0000-0003-4968-8398"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yingchun Wang","raw_affiliation_strings":["School of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China"],"affiliations":[{"raw_affiliation_string":"School of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101958099","display_name":"Jing Dai","orcid":"https://orcid.org/0000-0002-3273-8881"},"institutions":[{"id":"https://openalex.org/I4210095546","display_name":"Tsinghua Sichuan Energy Internet Research Institute","ror":"https://ror.org/00pkx4k51","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210095546"]},{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jing Dai","raw_affiliation_strings":["Energy Internet Innovation Research Institute, Tsinghua University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Energy Internet Innovation Research Institute, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I4210095546","https://openalex.org/I99065089"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5010477724"],"corresponding_institution_ids":["https://openalex.org/I9224756"],"apc_list":null,"apc_paid":null,"fwci":2.3374,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.88662795,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"54","issue":"12","first_page":"7804","last_page":"7813"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9837999939918518,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10603","display_name":"Smart Grid Energy Management","score":0.9837999939918518,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10917","display_name":"Smart Grid Security and Resilience","score":0.9628000259399414,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.548719048500061},{"id":"https://openalex.org/keywords/power","display_name":"Power (physics)","score":0.528488278388977},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4349576532840729},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4190079867839813},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.3974703550338745},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3782576620578766},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.33694928884506226},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.16907107830047607},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.11861449480056763},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.11570081114768982}],"concepts":[{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.548719048500061},{"id":"https://openalex.org/C163258240","wikidata":"https://www.wikidata.org/wiki/Q25342","display_name":"Power (physics)","level":2,"score":0.528488278388977},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4349576532840729},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4190079867839813},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.3974703550338745},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3782576620578766},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.33694928884506226},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.16907107830047607},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.11861449480056763},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.11570081114768982},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.0},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcyb.2024.3403680","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcyb.2024.3403680","pdf_url":null,"source":{"id":"https://openalex.org/S4210191041","display_name":"IEEE Transactions on Cybernetics","issn_l":"2168-2267","issn":["2168-2267","2168-2275"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Cybernetics","raw_type":"journal-article"},{"id":"pmid:38865225","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/38865225","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on cybernetics","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2034784894","display_name":null,"funder_award_id":"U23B20118","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G451589156","display_name":null,"funder_award_id":"2018YFA0702200","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"},{"id":"https://openalex.org/G6212556491","display_name":null,"funder_award_id":"62173080","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G837822842","display_name":null,"funder_award_id":"XLYC1801005","funder_id":"https://openalex.org/F4320329895","funder_display_name":"Liaoning Revitalization Talents Program"},{"id":"https://openalex.org/G8585005597","display_name":null,"funder_award_id":"N2304005","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320329895","display_name":"Liaoning Revitalization Talents Program","ror":null},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":36,"referenced_works":["https://openalex.org/W394334121","https://openalex.org/W2020047580","https://openalex.org/W2024303516","https://openalex.org/W2078790707","https://openalex.org/W2139416664","https://openalex.org/W2189990206","https://openalex.org/W2331243380","https://openalex.org/W2564717627","https://openalex.org/W2796251577","https://openalex.org/W2917322258","https://openalex.org/W2982838649","https://openalex.org/W2993531987","https://openalex.org/W3008282592","https://openalex.org/W3031391912","https://openalex.org/W3034456914","https://openalex.org/W3127008750","https://openalex.org/W3134387361","https://openalex.org/W3138923910","https://openalex.org/W3181437685","https://openalex.org/W3182680309","https://openalex.org/W3195322794","https://openalex.org/W3195458200","https://openalex.org/W3197988808","https://openalex.org/W3200909074","https://openalex.org/W3206104399","https://openalex.org/W4280607589","https://openalex.org/W4285293172","https://openalex.org/W4285505818","https://openalex.org/W4301392153","https://openalex.org/W4320712923","https://openalex.org/W4379805448","https://openalex.org/W4384789633","https://openalex.org/W4388076083","https://openalex.org/W4389987972","https://openalex.org/W4392939427","https://openalex.org/W4393184596"],"related_works":["https://openalex.org/W1982160337","https://openalex.org/W1971380437","https://openalex.org/W1983548084","https://openalex.org/W2141691317","https://openalex.org/W2110846987","https://openalex.org/W2160609742","https://openalex.org/W2979526210","https://openalex.org/W1997414638","https://openalex.org/W2031091109","https://openalex.org/W2049254832"],"abstract_inverted_index":{"This":[0,69],"article":[1,70],"addresses":[2],"the":[3,40,51,54,59,62,72,83,87,110,125,129,134,145],"solution":[4],"of":[5,53,61,124,133],"continuous-time":[6],"linear":[7],"It\u00f4":[8,99],"stochastic":[9,100],"systems":[10,101],"with":[11,102],"Markovian":[12,103],"jumps":[13],"using":[14],"an":[15],"online":[16,94],"policy":[17],"iteration":[18],"(PI)":[19],"approach":[20],"grounded":[21],"in":[22,86],"-learning.":[23],"Initially,":[24],"a":[25,92,120,140],"model-dependent":[26],"offline":[27,55,88],"algorithm,":[28,89],"structured":[29],"according":[30],"to":[31,38,75,81],"traditional":[32],"optimal":[33],"control":[34,64],"strategies,":[35],"is":[36],"designed":[37],"solve":[39],"algebraic":[41],"Riccati":[42],"equation":[43],"(ARE).":[44],"Employing":[45],"Lyapunov":[46],"theory,":[47],"we":[48,90],"rigorously":[49],"derive":[50],"convergence":[52],"PI":[56],"algorithm":[57,96,108],"and":[58,115,131],"admissibility":[60],"iterative":[63],"law":[65],"through":[66,139],"mathematical":[67],"analysis.":[68],"represents":[71],"first":[73],"attempt":[74],"tackle":[76],"these":[77],"technical":[78],"challenges.":[79],"Subsequently,":[80],"address":[82],"limitations":[84],"inherent":[85],"introduce":[91],"novel":[93],"-learning":[95,107],"tailored":[97],"for":[98,112],"jumps.":[104],"The":[105],"proposed":[106,135],"obviates":[109],"need":[111],"transition":[113],"probabilities":[114],"system":[116],"matrices.":[117],"We":[118],"provide":[119],"thorough":[121],"stability":[122],"analysis":[123],"closed-loop":[126],"system.":[127],"Finally,":[128],"effectiveness":[130],"applicability":[132],"algorithms":[136],"are":[137],"demonstrated":[138],"simulation":[141],"example,":[142],"underpinned":[143],"by":[144],"theorems":[146],"established":[147],"herein.":[148]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":6},{"year":2024,"cited_by_count":3}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
