{"id":"https://openalex.org/W4403059015","doi":"https://doi.org/10.1109/tai.2024.3471729","title":"Optimal Control of Stochastic Markovian Jump Systems With Wiener and Poisson Noises: Two Reinforcement Learning Approaches","display_name":"Optimal Control of Stochastic Markovian Jump Systems With Wiener and Poisson Noises: Two Reinforcement Learning Approaches","publication_year":2024,"publication_date":"2024-10-02","ids":{"openalex":"https://openalex.org/W4403059015","doi":"https://doi.org/10.1109/tai.2024.3471729"},"language":"en","primary_location":{"id":"doi:10.1109/tai.2024.3471729","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2024.3471729","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004980004","display_name":"Zhiguo Yan","orcid":"https://orcid.org/0000-0001-7375-0724"},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]},{"id":"https://openalex.org/I4210142748","display_name":"Shandong Academy of Sciences","ror":"https://ror.org/04y8d6y55","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhiguo Yan","raw_affiliation_strings":["School of Information and Automation, Qilu University of Technology (Shandong Academy of Sciences), Jinan, China","School of Information and Automation, Qilu University of Technology(Shandong Academy of Sciences), Jinan, China"],"affiliations":[{"raw_affiliation_string":"School of Information and Automation, Qilu University of Technology (Shandong Academy of Sciences), Jinan, China","institution_ids":["https://openalex.org/I4210142748","https://openalex.org/I152269853"]},{"raw_affiliation_string":"School of Information and Automation, Qilu University of Technology(Shandong Academy of Sciences), Jinan, China","institution_ids":["https://openalex.org/I4210142748","https://openalex.org/I152269853"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043788859","display_name":"Tingkun Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]},{"id":"https://openalex.org/I4210142748","display_name":"Shandong Academy of Sciences","ror":"https://ror.org/04y8d6y55","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tingkun Sun","raw_affiliation_strings":["School of Mathematics and Statistics, Qilu University of Technology (Shandong Academy of Sciences), Jinan, China","School of Mathematics and Statistics, Qilu University of Technology(Shandong Academy of Sciences), Jinan, China"],"affiliations":[{"raw_affiliation_string":"School of Mathematics and Statistics, Qilu University of Technology (Shandong Academy of Sciences), Jinan, China","institution_ids":["https://openalex.org/I152269853","https://openalex.org/I4210142748"]},{"raw_affiliation_string":"School of Mathematics and Statistics, Qilu University of Technology(Shandong Academy of Sciences), Jinan, China","institution_ids":["https://openalex.org/I152269853","https://openalex.org/I4210142748"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5103173858","display_name":"Guolin Hu","orcid":null},"institutions":[{"id":"https://openalex.org/I152269853","display_name":"Qilu University of Technology","ror":"https://ror.org/04hyzq608","country_code":"CN","type":"education","lineage":["https://openalex.org/I152269853"]},{"id":"https://openalex.org/I4210142748","display_name":"Shandong Academy of Sciences","ror":"https://ror.org/04y8d6y55","country_code":"CN","type":"education","lineage":["https://openalex.org/I4210142748"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guolin Hu","raw_affiliation_strings":["School of Information and Automation, Qilu University of Technology (Shandong Academy of Sciences), Jinan, China","School of Information and Automation, Qilu University of Technology(Shandong Academy of Sciences), Jinan, China"],"affiliations":[{"raw_affiliation_string":"School of Information and Automation, Qilu University of Technology (Shandong Academy of Sciences), Jinan, China","institution_ids":["https://openalex.org/I4210142748","https://openalex.org/I152269853"]},{"raw_affiliation_string":"School of Information and Automation, Qilu University of Technology(Shandong Academy of Sciences), Jinan, China","institution_ids":["https://openalex.org/I4210142748","https://openalex.org/I152269853"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5004980004"],"corresponding_institution_ids":["https://openalex.org/I152269853","https://openalex.org/I4210142748"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.20012428,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"5","issue":"12","first_page":"6591","last_page":"6600"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.7839999794960022,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.7839999794960022,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11347","display_name":"Neural Networks Stability and Synchronization","score":0.7533000111579895,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.7405999898910522,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7046246528625488},{"id":"https://openalex.org/keywords/jump","display_name":"Jump","score":0.6934678554534912},{"id":"https://openalex.org/keywords/markov-process","display_name":"Markov process","score":0.6091718077659607},{"id":"https://openalex.org/keywords/poisson-distribution","display_name":"Poisson distribution","score":0.5972078442573547},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.49734213948249817},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.485185444355011},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4450567662715912},{"id":"https://openalex.org/keywords/statistical-physics","display_name":"Statistical physics","score":0.4141656160354614},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.4134133458137512},{"id":"https://openalex.org/keywords/applied-mathematics","display_name":"Applied mathematics","score":0.39939409494400024},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.3614541292190552},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.18636274337768555},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.15443959832191467},{"id":"https://openalex.org/keywords/statistics","display_name":"Statistics","score":0.12735408544540405}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7046246528625488},{"id":"https://openalex.org/C2780695682","wikidata":"https://www.wikidata.org/wiki/Q4005959","display_name":"Jump","level":2,"score":0.6934678554534912},{"id":"https://openalex.org/C159886148","wikidata":"https://www.wikidata.org/wiki/Q176645","display_name":"Markov process","level":2,"score":0.6091718077659607},{"id":"https://openalex.org/C100906024","wikidata":"https://www.wikidata.org/wiki/Q205692","display_name":"Poisson distribution","level":2,"score":0.5972078442573547},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.49734213948249817},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.485185444355011},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4450567662715912},{"id":"https://openalex.org/C121864883","wikidata":"https://www.wikidata.org/wiki/Q677916","display_name":"Statistical physics","level":1,"score":0.4141656160354614},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.4134133458137512},{"id":"https://openalex.org/C28826006","wikidata":"https://www.wikidata.org/wiki/Q33521","display_name":"Applied mathematics","level":1,"score":0.39939409494400024},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.3614541292190552},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.18636274337768555},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.15443959832191467},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.12735408544540405},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tai.2024.3471729","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tai.2024.3471729","pdf_url":null,"source":{"id":"https://openalex.org/S4210169448","display_name":"IEEE Transactions on Artificial Intelligence","issn_l":"2691-4581","issn":["2691-4581"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Artificial Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8216974108","display_name":null,"funder_award_id":"62373204","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":33,"referenced_works":["https://openalex.org/W1970928532","https://openalex.org/W1984948634","https://openalex.org/W2024303516","https://openalex.org/W2062805416","https://openalex.org/W2069904367","https://openalex.org/W2093837911","https://openalex.org/W2126394835","https://openalex.org/W2132778652","https://openalex.org/W2148439597","https://openalex.org/W2343245314","https://openalex.org/W2346408824","https://openalex.org/W2594267261","https://openalex.org/W2602458259","https://openalex.org/W2887259460","https://openalex.org/W2927299624","https://openalex.org/W2972275995","https://openalex.org/W2984421996","https://openalex.org/W3049000493","https://openalex.org/W3108003339","https://openalex.org/W3114506529","https://openalex.org/W3163723204","https://openalex.org/W3172934943","https://openalex.org/W3184481401","https://openalex.org/W3200997590","https://openalex.org/W3210955860","https://openalex.org/W4214895024","https://openalex.org/W4223502737","https://openalex.org/W4281777641","https://openalex.org/W4312655313","https://openalex.org/W4362603939","https://openalex.org/W4387682369","https://openalex.org/W4390018125","https://openalex.org/W4390204102"],"related_works":["https://openalex.org/W4306904969","https://openalex.org/W2138720691","https://openalex.org/W4362501864","https://openalex.org/W4380318855","https://openalex.org/W2031695474","https://openalex.org/W2379968129","https://openalex.org/W2089289553","https://openalex.org/W2950380473","https://openalex.org/W2048674388","https://openalex.org/W2320258968"],"abstract_inverted_index":{"This":[0,76],"article":[1],"investigates":[2],"the":[3,39,53,58,72,85,96,114,119],"infinite":[4],"horizon":[5],"optimal":[6,40,73,86],"control":[7,74],"problem":[8],"for":[9],"stochastic":[10,44],"Markovian":[11],"jump":[12,104],"systems":[13],"with":[14],"Wiener":[15],"and":[16,33,55,60,88,116],"Poisson":[17,103],"noises.":[18],"First,":[19],"a":[20,64],"new":[21],"policy":[22,65],"iteration":[23,66],"algorithm":[24,67,77,97],"is":[25,68,89,110],"designed":[26],"by":[27,100],"using":[28],"integral":[29],"reinforcement":[30],"learning":[31],"approach":[32],"subsystems":[34],"transformation":[35,54],"technique,":[36],"which":[37],"obtains":[38],"solution":[41],"without":[42],"solving":[43],"coupled":[45],"algebraic":[46],"Riccati":[47],"equation":[48],"(SCARE)":[49],"directly.":[50],"Second,":[51],"through":[52],"substitution":[56],"of":[57,118],"SCARE":[59],"feedback":[61],"gain":[62],"matrix,":[63],"devised":[69],"to":[70,83,112],"determine":[71],"strategy.":[75],"leverages":[78],"only":[79],"state":[80],"trajectory":[81],"information":[82],"obtain":[84],"solution,":[87],"updated":[90],"in":[91,102],"an":[92,107],"unfixed":[93],"form.":[94],"Additionally,":[95],"remains":[98],"unaffected":[99],"variations":[101],"intensity.":[105],"Finally,":[106],"numerical":[108],"example":[109],"given":[111],"verify":[113],"effectiveness":[115],"convergence":[117],"proposed":[120],"algorithms.":[121]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
