{"id":"https://openalex.org/W4412164404","doi":"https://doi.org/10.1109/tsmc.2025.3580988","title":"Optimal Time-Varying <i>Q</i> -Learning Algorithm for Affine Nonlinear Systems With Coupled Players","display_name":"Optimal Time-Varying <i>Q</i> -Learning Algorithm for Affine Nonlinear Systems With Coupled Players","publication_year":2025,"publication_date":"2025-07-09","ids":{"openalex":"https://openalex.org/W4412164404","doi":"https://doi.org/10.1109/tsmc.2025.3580988"},"language":"en","primary_location":{"id":"doi:10.1109/tsmc.2025.3580988","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2025.3580988","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100625792","display_name":"Huaguang Zhang","orcid":"https://orcid.org/0000-0002-2375-9824"},"institutions":[{"id":"https://openalex.org/I4391767858","display_name":"State Key Laboratory of Synthetical Automation for Process Industries","ror":"https://ror.org/0380ng272","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767858","https://openalex.org/I9224756"]},{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huaguang Zhang","raw_affiliation_strings":["State Key Laboratory of Synthetical Automation for Process Industries and the School of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China","College of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China"],"raw_orcid":"https://orcid.org/0000-0002-2375-9824","affiliations":[{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries and the School of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China","institution_ids":["https://openalex.org/I9224756","https://openalex.org/I4391767858"]},{"raw_affiliation_string":"College of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090191942","display_name":"Shuhang Yu","orcid":"https://orcid.org/0000-0001-9928-8232"},"institutions":[{"id":"https://openalex.org/I4391767858","display_name":"State Key Laboratory of Synthetical Automation for Process Industries","ror":"https://ror.org/0380ng272","country_code":null,"type":"facility","lineage":["https://openalex.org/I4391767858","https://openalex.org/I9224756"]},{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shuhang Yu","raw_affiliation_strings":["College of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China","State Key Laboratory of Synthetical Automation for Process Industries and the School of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China"],"raw_orcid":"https://orcid.org/0000-0001-9928-8232","affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China","institution_ids":["https://openalex.org/I9224756"]},{"raw_affiliation_string":"State Key Laboratory of Synthetical Automation for Process Industries and the School of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China","institution_ids":["https://openalex.org/I9224756","https://openalex.org/I4391767858"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002903770","display_name":"Jiayue Sun","orcid":"https://orcid.org/0000-0002-7774-2606"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiayue Sun","raw_affiliation_strings":["College of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China"],"raw_orcid":"https://orcid.org/0000-0002-7774-2606","affiliations":[{"raw_affiliation_string":"College of Information Science and Engineering, Northeastern University, Shenyang, Liaoning, China","institution_ids":["https://openalex.org/I9224756"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100331912","display_name":"Mei Li","orcid":"https://orcid.org/0000-0002-5814-6091"},"institutions":[{"id":"https://openalex.org/I9224756","display_name":"Northeastern University","ror":"https://ror.org/03awzbc87","country_code":"CN","type":"education","lineage":["https://openalex.org/I9224756"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Mei Li","raw_affiliation_strings":["School of Computer Science and Engineering, Northeastern University, Shenyang, Liaoning, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Computer Science and Engineering, Northeastern University, Shenyang, Liaoning, China","institution_ids":["https://openalex.org/I9224756"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.9042,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.75503995,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":95,"max":98},"biblio":{"volume":"55","issue":"10","first_page":"7037","last_page":"7047"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9807999730110168,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11749","display_name":"Iterative Learning Control Systems","score":0.9807999730110168,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9661999940872192,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13717","display_name":"Advanced Algorithms and Applications","score":0.9661999940872192,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/nonlinear-system","display_name":"Nonlinear system","score":0.6344190239906311},{"id":"https://openalex.org/keywords/affine-transformation","display_name":"Affine transformation","score":0.5305714011192322},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.5081257820129395},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.48421430587768555},{"id":"https://openalex.org/keywords/q-learning","display_name":"Q-learning","score":0.4130017161369324},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.32969895005226135},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.3125462234020233},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.24879825115203857},{"id":"https://openalex.org/keywords/physics","display_name":"Physics","score":0.18059712648391724},{"id":"https://openalex.org/keywords/geometry","display_name":"Geometry","score":0.104328453540802},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.07879775762557983},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.07038140296936035}],"concepts":[{"id":"https://openalex.org/C158622935","wikidata":"https://www.wikidata.org/wiki/Q660848","display_name":"Nonlinear system","level":2,"score":0.6344190239906311},{"id":"https://openalex.org/C92757383","wikidata":"https://www.wikidata.org/wiki/Q382497","display_name":"Affine transformation","level":2,"score":0.5305714011192322},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.5081257820129395},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.48421430587768555},{"id":"https://openalex.org/C188116033","wikidata":"https://www.wikidata.org/wiki/Q2664563","display_name":"Q-learning","level":3,"score":0.4130017161369324},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.32969895005226135},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.3125462234020233},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.24879825115203857},{"id":"https://openalex.org/C121332964","wikidata":"https://www.wikidata.org/wiki/Q413","display_name":"Physics","level":0,"score":0.18059712648391724},{"id":"https://openalex.org/C2524010","wikidata":"https://www.wikidata.org/wiki/Q8087","display_name":"Geometry","level":1,"score":0.104328453540802},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.07879775762557983},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.07038140296936035},{"id":"https://openalex.org/C62520636","wikidata":"https://www.wikidata.org/wiki/Q944","display_name":"Quantum mechanics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tsmc.2025.3580988","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tsmc.2025.3580988","pdf_url":null,"source":{"id":"https://openalex.org/S4210209078","display_name":"IEEE Transactions on Systems Man and Cybernetics Systems","issn_l":"2168-2216","issn":["2168-2216","2168-2232"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Systems, Man, and Cybernetics: Systems","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2034784894","display_name":null,"funder_award_id":"U23B20118","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6225353205","display_name":null,"funder_award_id":"N2404029","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G796113218","display_name":null,"funder_award_id":"62403116","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":35,"referenced_works":["https://openalex.org/W1968315580","https://openalex.org/W1972809999","https://openalex.org/W1997603681","https://openalex.org/W2013895638","https://openalex.org/W2015381356","https://openalex.org/W2100276679","https://openalex.org/W2108383324","https://openalex.org/W2137092694","https://openalex.org/W2147556634","https://openalex.org/W2344109271","https://openalex.org/W2564717627","https://openalex.org/W2606378794","https://openalex.org/W2779486833","https://openalex.org/W2917721237","https://openalex.org/W2998579696","https://openalex.org/W3084233102","https://openalex.org/W3096135216","https://openalex.org/W3117938601","https://openalex.org/W3182680309","https://openalex.org/W3195322794","https://openalex.org/W3204358175","https://openalex.org/W3206104399","https://openalex.org/W4200574011","https://openalex.org/W4205561196","https://openalex.org/W4224211769","https://openalex.org/W4225661228","https://openalex.org/W4285505818","https://openalex.org/W4290717511","https://openalex.org/W4312714074","https://openalex.org/W4319990437","https://openalex.org/W4320712923","https://openalex.org/W4321609042","https://openalex.org/W4322731391","https://openalex.org/W4327522695","https://openalex.org/W4382658113"],"related_works":["https://openalex.org/W2051487156","https://openalex.org/W2073681303","https://openalex.org/W4409439182","https://openalex.org/W2053286651","https://openalex.org/W2038416447","https://openalex.org/W2181743346","https://openalex.org/W2187401768","https://openalex.org/W2181413294","https://openalex.org/W1982160337","https://openalex.org/W2364151838"],"abstract_inverted_index":{"To":[0],"address":[1],"the":[2,50,84,88,109,113,137,140,147,164,167],"finite-horizon":[3],"coupled":[4,127],"two-player":[5],"mixed":[6,114],"<italic":[7,29,98,115],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[8,10,12,14,30,99,116,118,120,122],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">H</i><sub":[9,13,117,121],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">2</sub>/<italic":[11,119],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">\u221e</sub>":[15,123],"control":[16,124,149,170],"challenge":[17,59],"within":[18],"a":[19,27,57,70,95,157],"continuous-time":[20],"affine":[21,143],"nonlinear":[22,67,144],"system,":[23],"this":[24],"research":[25],"introduces":[26],"distinctive":[28],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Q</i>-function":[31,100],"and":[32,66,82],"presents":[33],"an":[34],"innovative":[35],"adaptive":[36],"dynamic":[37],"programming":[38],"(ADP)":[39],"method":[40],"that":[41],"operates":[42],"autonomously":[43],"of":[44,87,90,139,166],"system-specific":[45],"information.":[46],"Initially,":[47],"we":[48],"formulate":[49],"time-varying":[51],"Hamilton\u2013Jacobi\u2013Isaacs":[52],"(HJI)":[53],"equations,":[54],"which":[55],"pose":[56],"significant":[58],"for":[60],"resolution":[61],"due":[62],"to":[63,103,135,162],"their":[64],"time-dependent":[65],"nature.":[68],"Subsequently,":[69],"novel":[71,96],"offline":[72],"policy":[73],"iteration":[74],"(PI)":[75],"algorithm":[76],"is":[77,101,133,160],"introduced,":[78],"highlighting":[79],"its":[80],"convergence":[81],"reinforcing":[83],"substantive":[85],"proof":[86],"existence":[89],"Nash":[91],"equilibrium":[92],"points.":[93],"Moreover,":[94],"action-dependent":[97],"established":[102],"facilitate":[104],"entirely":[105],"model-free":[106],"learning,":[107],"representing":[108],"initial":[110],"foray":[111],"into":[112],"problem":[125],"involving":[126],"players.":[128],"The":[129],"Lyapunov":[130],"direct":[131],"approach":[132],"employed":[134],"ensure":[136],"stability":[138],"closed-loop":[141],"uncertain":[142],"system":[145],"under":[146],"ADP-based":[148,169],"scheme,":[150],"guaranteeing":[151],"uniform":[152],"ultimate":[153],"boundedness":[154],"(UUB).":[155],"Finally,":[156],"numerical":[158],"simulation":[159],"conducted":[161],"validate":[163],"effectiveness":[165],"aforementioned":[168],"approach.":[171]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-07-10T00:00:00"}
