{"id":"https://openalex.org/W2919774326","doi":"https://doi.org/10.1109/tnnls.2019.2897814","title":"Data-Driven Robust Control of Discrete-Time Uncertain Linear Systems via Off-Policy Reinforcement Learning","display_name":"Data-Driven Robust Control of Discrete-Time Uncertain Linear Systems via Off-Policy Reinforcement Learning","publication_year":2019,"publication_date":"2019-03-01","ids":{"openalex":"https://openalex.org/W2919774326","doi":"https://doi.org/10.1109/tnnls.2019.2897814","mag":"2919774326","pmid":"https://pubmed.ncbi.nlm.nih.gov/30843810"},"language":"en","primary_location":{"id":"doi:10.1109/tnnls.2019.2897814","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2019.2897814","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053342436","display_name":"Yongliang Yang","orcid":"https://orcid.org/0000-0002-3144-8604"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yongliang Yang","raw_affiliation_strings":["Key Laboratory of Knowledge Automation for Industrial Process, Ministry of Education, Beijing, China","School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-3144-8604","affiliations":[{"raw_affiliation_string":"Key Laboratory of Knowledge Automation for Industrial Process, Ministry of Education, Beijing, China","institution_ids":[]},{"raw_affiliation_string":"School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067621571","display_name":"Zhishan Guo","orcid":"https://orcid.org/0000-0002-5967-1058"},"institutions":[{"id":"https://openalex.org/I106165777","display_name":"University of Central Florida","ror":"https://ror.org/036nfer12","country_code":"US","type":"education","lineage":["https://openalex.org/I106165777"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Zhishan Guo","raw_affiliation_strings":["Department of Electrical and Computer Engineering, University of Central Florida, Orlando, USA"],"raw_orcid":"https://orcid.org/0000-0002-5967-1058","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, University of Central Florida, Orlando, USA","institution_ids":["https://openalex.org/I106165777"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081254155","display_name":"Haoyi Xiong","orcid":"https://orcid.org/0000-0002-5451-3253"},"institutions":[{"id":"https://openalex.org/I4210129579","display_name":"National Engineering Laboratory of Deep Learning Technology and Application","ror":"https://ror.org/03z8p5796","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210129579"]},{"id":"https://openalex.org/I98301712","display_name":"Baidu (China)","ror":"https://ror.org/03vs3wt56","country_code":"CN","type":"company","lineage":["https://openalex.org/I98301712"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoyi Xiong","raw_affiliation_strings":["Big Data Laboratory, Baidu Research, Beijing, China","National Engineering Laboratory for Deep Learning Technology and Applications, Baidu Inc., Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Big Data Laboratory, Baidu Research, Beijing, China","institution_ids":["https://openalex.org/I98301712"]},{"raw_affiliation_string":"National Engineering Laboratory for Deep Learning Technology and Applications, Baidu Inc., Beijing, China","institution_ids":["https://openalex.org/I4210129579","https://openalex.org/I98301712"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5073089333","display_name":"Da\u2010Wei Ding","orcid":"https://orcid.org/0000-0003-1201-7785"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Da-Wei Ding","raw_affiliation_strings":["Key Laboratory of Knowledge Automation for Industrial Process, Ministry of Education, Beijing, China","School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-1201-7785","affiliations":[{"raw_affiliation_string":"Key Laboratory of Knowledge Automation for Industrial Process, Ministry of Education, Beijing, China","institution_ids":[]},{"raw_affiliation_string":"School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101512101","display_name":"Yixin Yin","orcid":"https://orcid.org/0000-0001-6056-8878"},"institutions":[{"id":"https://openalex.org/I92403157","display_name":"University of Science and Technology Beijing","ror":"https://ror.org/02egmk993","country_code":"CN","type":"education","lineage":["https://openalex.org/I92403157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yixin Yin","raw_affiliation_strings":["Key Laboratory of Knowledge Automation for Industrial Process, Ministry of Education, Beijing, China","School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-6056-8878","affiliations":[{"raw_affiliation_string":"Key Laboratory of Knowledge Automation for Industrial Process, Ministry of Education, Beijing, China","institution_ids":[]},{"raw_affiliation_string":"School of Automation and Electrical Engineering, University of Science and Technology Beijing, Beijing, China","institution_ids":["https://openalex.org/I92403157"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5038037619","display_name":"Donald C. Wunsch","orcid":"https://orcid.org/0000-0002-9726-9051"},"institutions":[{"id":"https://openalex.org/I20382870","display_name":"Missouri University of Science and Technology","ror":"https://ror.org/00scwqd12","country_code":"US","type":"education","lineage":["https://openalex.org/I20382870"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Donald C. Wunsch","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Missouri University of Science and Technology, Rolla, USA"],"raw_orcid":"https://orcid.org/0000-0002-9726-9051","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Missouri University of Science and Technology, Rolla, USA","institution_ids":["https://openalex.org/I20382870"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5053342436"],"corresponding_institution_ids":["https://openalex.org/I92403157"],"apc_list":null,"apc_paid":null,"fwci":10.9982,"has_fulltext":false,"cited_by_count":92,"citation_normalized_percentile":{"value":0.98733616,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":100},"biblio":{"volume":"30","issue":"12","first_page":"3735","last_page":"3747"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10675","display_name":"Mechanical Circulatory Support Devices","score":0.9800999760627747,"subfield":{"id":"https://openalex.org/subfields/2204","display_name":"Biomedical Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9697999954223633,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/algebraic-riccati-equation","display_name":"Algebraic Riccati equation","score":0.8052472472190857},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7945769429206848},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.7914259433746338},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.6682253479957581},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5948280096054077},{"id":"https://openalex.org/keywords/riccati-equation","display_name":"Riccati equation","score":0.5758505463600159},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.5419588088989258},{"id":"https://openalex.org/keywords/robust-control","display_name":"Robust control","score":0.5310032367706299},{"id":"https://openalex.org/keywords/discrete-time-and-continuous-time","display_name":"Discrete time and continuous time","score":0.5191649198532104},{"id":"https://openalex.org/keywords/mathematical-optimization","display_name":"Mathematical optimization","score":0.4999873638153076},{"id":"https://openalex.org/keywords/optimal-control","display_name":"Optimal control","score":0.49187779426574707},{"id":"https://openalex.org/keywords/algebraic-number","display_name":"Algebraic number","score":0.44304734468460083},{"id":"https://openalex.org/keywords/controller","display_name":"Controller (irrigation)","score":0.43983781337738037},{"id":"https://openalex.org/keywords/noise","display_name":"Noise (video)","score":0.41322994232177734},{"id":"https://openalex.org/keywords/control-system","display_name":"Control system","score":0.31495994329452515},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.31395912170410156},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.30608993768692017},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.12124267220497131},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.11309531331062317}],"concepts":[{"id":"https://openalex.org/C13847129","wikidata":"https://www.wikidata.org/wiki/Q4723989","display_name":"Algebraic Riccati equation","level":4,"score":0.8052472472190857},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7945769429206848},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.7914259433746338},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.6682253479957581},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5948280096054077},{"id":"https://openalex.org/C45473103","wikidata":"https://www.wikidata.org/wiki/Q851503","display_name":"Riccati equation","level":3,"score":0.5758505463600159},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.5419588088989258},{"id":"https://openalex.org/C31531917","wikidata":"https://www.wikidata.org/wiki/Q915157","display_name":"Robust control","level":3,"score":0.5310032367706299},{"id":"https://openalex.org/C55689738","wikidata":"https://www.wikidata.org/wiki/Q15963867","display_name":"Discrete time and continuous time","level":2,"score":0.5191649198532104},{"id":"https://openalex.org/C126255220","wikidata":"https://www.wikidata.org/wiki/Q141495","display_name":"Mathematical optimization","level":1,"score":0.4999873638153076},{"id":"https://openalex.org/C91575142","wikidata":"https://www.wikidata.org/wiki/Q1971426","display_name":"Optimal control","level":2,"score":0.49187779426574707},{"id":"https://openalex.org/C9376300","wikidata":"https://www.wikidata.org/wiki/Q168817","display_name":"Algebraic number","level":2,"score":0.44304734468460083},{"id":"https://openalex.org/C203479927","wikidata":"https://www.wikidata.org/wiki/Q5165939","display_name":"Controller (irrigation)","level":2,"score":0.43983781337738037},{"id":"https://openalex.org/C99498987","wikidata":"https://www.wikidata.org/wiki/Q2210247","display_name":"Noise (video)","level":3,"score":0.41322994232177734},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.31495994329452515},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.31395912170410156},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.30608993768692017},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.12124267220497131},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.11309531331062317},{"id":"https://openalex.org/C86803240","wikidata":"https://www.wikidata.org/wiki/Q420","display_name":"Biology","level":0,"score":0.0},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0},{"id":"https://openalex.org/C134306372","wikidata":"https://www.wikidata.org/wiki/Q7754","display_name":"Mathematical analysis","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C6557445","wikidata":"https://www.wikidata.org/wiki/Q173113","display_name":"Agronomy","level":1,"score":0.0},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0},{"id":"https://openalex.org/C78045399","wikidata":"https://www.wikidata.org/wiki/Q11214","display_name":"Differential equation","level":2,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tnnls.2019.2897814","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tnnls.2019.2897814","pdf_url":null,"source":{"id":"https://openalex.org/S4210175523","display_name":"IEEE Transactions on Neural Networks and Learning Systems","issn_l":"2162-237X","issn":["2162-237X","2162-2388"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Neural Networks and Learning Systems","raw_type":"journal-article"},{"id":"pmid:30843810","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/30843810","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on neural networks and learning systems","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2423437851","display_name":null,"funder_award_id":"FRF-BD-17-002A","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G3094653860","display_name":null,"funder_award_id":"W911NF-18-2-0260","funder_id":"https://openalex.org/F4320338295","funder_display_name":"Army Research Laboratory"},{"id":"https://openalex.org/G5205608926","display_name":null,"funder_award_id":"FRF-TP-18-031A1","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G5523829882","display_name":null,"funder_award_id":"2018M641197","funder_id":"https://openalex.org/F4320321543","funder_display_name":"China Postdoctoral Science Foundation"},{"id":"https://openalex.org/G6311521850","display_name":null,"funder_award_id":"CNS-1850851","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"},{"id":"https://openalex.org/G7934771358","display_name":null,"funder_award_id":"61333002","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8473603101","display_name":null,"funder_award_id":"61473032","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8505461575","display_name":null,"funder_award_id":"61873028","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321543","display_name":"China Postdoctoral Science Foundation","ror":"https://ror.org/0426zh255"},{"id":"https://openalex.org/F4320333675","display_name":"Intelligent Systems Center","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null},{"id":"https://openalex.org/F4320338295","display_name":"Army Research Laboratory","ror":"https://ror.org/011hc8f90"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":45,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W648594167","https://openalex.org/W968045710","https://openalex.org/W1498502445","https://openalex.org/W1566309885","https://openalex.org/W1588998206","https://openalex.org/W1601081659","https://openalex.org/W1601803999","https://openalex.org/W1614417283","https://openalex.org/W1968315580","https://openalex.org/W1977671496","https://openalex.org/W1983523797","https://openalex.org/W2010152647","https://openalex.org/W2012451615","https://openalex.org/W2030033366","https://openalex.org/W2042106612","https://openalex.org/W2048687352","https://openalex.org/W2060605484","https://openalex.org/W2104843094","https://openalex.org/W2121863487","https://openalex.org/W2124829859","https://openalex.org/W2136064843","https://openalex.org/W2137002893","https://openalex.org/W2148439597","https://openalex.org/W2430619152","https://openalex.org/W2461613850","https://openalex.org/W2484646121","https://openalex.org/W2487144912","https://openalex.org/W2501776475","https://openalex.org/W2519144068","https://openalex.org/W2552936679","https://openalex.org/W2579592432","https://openalex.org/W2580629550","https://openalex.org/W2585299106","https://openalex.org/W2610857016","https://openalex.org/W2742195311","https://openalex.org/W2772589676","https://openalex.org/W2789789879","https://openalex.org/W2793914020","https://openalex.org/W2798534591","https://openalex.org/W2809302593","https://openalex.org/W3213472335","https://openalex.org/W4214717370","https://openalex.org/W4229706427","https://openalex.org/W6804409665"],"related_works":["https://openalex.org/W2005019312","https://openalex.org/W2105459831","https://openalex.org/W1546579375","https://openalex.org/W1563296412","https://openalex.org/W2127238600","https://openalex.org/W2096105566","https://openalex.org/W2114791549","https://openalex.org/W16457797","https://openalex.org/W2792258377","https://openalex.org/W1987193149"],"abstract_inverted_index":{"This":[0],"paper":[1],"presents":[2],"a":[3,63,113],"model-free":[4,64],"solution":[5,65],"to":[6,28,66,76,103,119],"the":[7,30,47,53,58,67,78,83,90,101,107,121,124],"robust":[8,31],"stabilization":[9],"problem":[10,79],"of":[11,85,123],"discrete-time":[12],"linear":[13],"dynamical":[14],"systems":[15],"with":[16],"bounded":[17],"and":[18,94,106],"mismatched":[19],"uncertainty.":[20],"An":[21],"optimal":[22,48],"controller":[23,49],"design":[24],"method":[25],"is":[26,44,74,116],"derived":[27],"solve":[29,77],"control":[32],"problem,":[33],"which":[34],"results":[35],"in":[36,80],"solving":[37,52],"an":[38],"algebraic":[39],"Riccati":[40],"equation":[41],"(ARE).":[42],"It":[43],"shown":[45],"that":[46],"obtained":[50],"by":[51],"ARE":[54],"can":[55],"robustly":[56],"stabilize":[57],"uncertain":[59],"system.":[60],"To":[61],"develop":[62],"translated":[68],"ARE,":[69],"off-policy":[70,95,126],"reinforcement":[71],"learning":[72],"(RL)":[73],"employed":[75],"hand":[81],"without":[82],"requirement":[84],"system":[86,110],"dynamics.":[87,111],"In":[88],"addition,":[89],"comparisons":[91],"between":[92],"on-":[93],"RL":[96,127],"methods":[97],"are":[98],"presented":[99,125],"regarding":[100],"robustness":[102],"probing":[104],"noise":[105],"dependence":[108],"on":[109],"Finally,":[112],"simulation":[114],"example":[115],"carried":[117],"out":[118],"validate":[120],"efficacy":[122],"approach.":[128]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":13},{"year":2024,"cited_by_count":13},{"year":2023,"cited_by_count":10},{"year":2022,"cited_by_count":12},{"year":2021,"cited_by_count":16},{"year":2020,"cited_by_count":15},{"year":2019,"cited_by_count":12}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
