{"id":"https://openalex.org/W4402435285","doi":"https://doi.org/10.1109/tiv.2024.3458894","title":"Reinforcement Learning Control for a Class of Discrete-Time Non-Strict Feedback Multi-Agent Systems and Application to Multi-Marine Vehicles","display_name":"Reinforcement Learning Control for a Class of Discrete-Time Non-Strict Feedback Multi-Agent Systems and Application to Multi-Marine Vehicles","publication_year":2024,"publication_date":"2024-09-11","ids":{"openalex":"https://openalex.org/W4402435285","doi":"https://doi.org/10.1109/tiv.2024.3458894"},"language":"en","primary_location":{"id":"doi:10.1109/tiv.2024.3458894","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3458894","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5035160808","display_name":"Weiwei Bai","orcid":"https://orcid.org/0000-0002-1374-2228"},"institutions":[{"id":"https://openalex.org/I43313876","display_name":"Dalian Maritime University","ror":"https://ror.org/002b7nr53","country_code":"CN","type":"education","lineage":["https://openalex.org/I43313876"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Weiwei Bai","raw_affiliation_strings":["Navigation College, Dalian Maritime University, Dalian, China"],"affiliations":[{"raw_affiliation_string":"Navigation College, Dalian Maritime University, Dalian, China","institution_ids":["https://openalex.org/I43313876"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061331291","display_name":"Dewang Chen","orcid":"https://orcid.org/0000-0002-8660-9700"},"institutions":[{"id":"https://openalex.org/I83791580","display_name":"Fujian University of Technology","ror":"https://ror.org/03c8fdb16","country_code":"CN","type":"education","lineage":["https://openalex.org/I83791580"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dewang Chen","raw_affiliation_strings":["School of Transportation, Fujian University of Technology, Fuzhou, China"],"affiliations":[{"raw_affiliation_string":"School of Transportation, Fujian University of Technology, Fuzhou, China","institution_ids":["https://openalex.org/I83791580"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5074387543","display_name":"Bo Zhao","orcid":"https://orcid.org/0000-0002-7684-7342"},"institutions":[{"id":"https://openalex.org/I25254941","display_name":"Beijing Normal University","ror":"https://ror.org/022k4wk35","country_code":"CN","type":"education","lineage":["https://openalex.org/I25254941"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bo Zhao","raw_affiliation_strings":["School of Systems Science, Beijing Normal University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Systems Science, Beijing Normal University, Beijing, China","institution_ids":["https://openalex.org/I25254941"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5107125628","display_name":"Andrea D Ariano","orcid":null},"institutions":[{"id":"https://openalex.org/I119003972","display_name":"Roma Tre University","ror":"https://ror.org/05vf0dg29","country_code":"IT","type":"education","lineage":["https://openalex.org/I119003972"]}],"countries":["IT"],"is_corresponding":false,"raw_author_name":"Andrea D'Ariano","raw_affiliation_strings":["Department of Civil, Computer Science and Aeronautical Technologies Engineering, Roma Tre University, Rome, Italy"],"affiliations":[{"raw_affiliation_string":"Department of Civil, Computer Science and Aeronautical Technologies Engineering, Roma Tre University, Rome, Italy","institution_ids":["https://openalex.org/I119003972"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5035160808"],"corresponding_institution_ids":["https://openalex.org/I43313876"],"apc_list":null,"apc_paid":null,"fwci":7.3606,"has_fulltext":false,"cited_by_count":20,"citation_normalized_percentile":{"value":0.9771197,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":90,"max":100},"biblio":{"volume":"10","issue":"5","first_page":"3613","last_page":"3625"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.963699996471405,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.963699996471405,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10040","display_name":"Adaptive Control of Nonlinear Systems","score":0.942300021648407,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7517189979553223},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.7082817554473877},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5508324503898621},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.5501238107681274},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.4291917383670807},{"id":"https://openalex.org/keywords/discrete-time-and-continuous-time","display_name":"Discrete time and continuous time","score":0.42606717348098755},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3486185073852539},{"id":"https://openalex.org/keywords/mathematics","display_name":"Mathematics","score":0.1641324758529663},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.11643502116203308},{"id":"https://openalex.org/keywords/social-psychology","display_name":"Social psychology","score":0.07036253809928894}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7517189979553223},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.7082817554473877},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5508324503898621},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.5501238107681274},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.4291917383670807},{"id":"https://openalex.org/C55689738","wikidata":"https://www.wikidata.org/wiki/Q15963867","display_name":"Discrete time and continuous time","level":2,"score":0.42606717348098755},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3486185073852539},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.1641324758529663},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.11643502116203308},{"id":"https://openalex.org/C77805123","wikidata":"https://www.wikidata.org/wiki/Q161272","display_name":"Social psychology","level":1,"score":0.07036253809928894},{"id":"https://openalex.org/C105795698","wikidata":"https://www.wikidata.org/wiki/Q12483","display_name":"Statistics","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tiv.2024.3458894","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tiv.2024.3458894","pdf_url":null,"source":{"id":"https://openalex.org/S4210199657","display_name":"IEEE Transactions on Intelligent Vehicles","issn_l":"2379-8858","issn":["2379-8858","2379-8904"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Intelligent Vehicles","raw_type":"journal-article"},{"id":"pmh:oai:iris.uniroma3.it:11590/526182","is_oa":false,"landing_page_url":"https://hdl.handle.net/11590/526182","pdf_url":null,"source":{"id":"https://openalex.org/S4377196120","display_name":"Iris (Roma Tre University)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I119003972","host_organization_name":"Roma Tre University","host_organization_lineage":["https://openalex.org/I119003972"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"info:eu-repo/semantics/article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/14","score":0.550000011920929,"display_name":"Life below water"}],"awards":[{"id":"https://openalex.org/G3406314644","display_name":null,"funder_award_id":"52271360","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5075166346","display_name":null,"funder_award_id":"61903092","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6927519788","display_name":null,"funder_award_id":"61973330","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8317918283","display_name":null,"funder_award_id":"61976055","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":49,"referenced_works":["https://openalex.org/W1559261542","https://openalex.org/W1991360560","https://openalex.org/W1991535489","https://openalex.org/W2012812921","https://openalex.org/W2035625658","https://openalex.org/W2077195478","https://openalex.org/W2089684487","https://openalex.org/W2103759346","https://openalex.org/W2111366290","https://openalex.org/W2117945258","https://openalex.org/W2135574445","https://openalex.org/W2139542706","https://openalex.org/W2142923542","https://openalex.org/W2162601317","https://openalex.org/W2165501837","https://openalex.org/W2166000057","https://openalex.org/W2166132612","https://openalex.org/W2171018355","https://openalex.org/W2320262435","https://openalex.org/W2338588725","https://openalex.org/W2344237528","https://openalex.org/W2590302930","https://openalex.org/W2603406422","https://openalex.org/W2624600449","https://openalex.org/W2740962288","https://openalex.org/W2780814805","https://openalex.org/W2807555830","https://openalex.org/W2884733963","https://openalex.org/W2954033048","https://openalex.org/W2967622731","https://openalex.org/W2973026380","https://openalex.org/W3003040443","https://openalex.org/W3044422455","https://openalex.org/W3114263192","https://openalex.org/W3174645049","https://openalex.org/W3179972165","https://openalex.org/W3209777177","https://openalex.org/W3213092112","https://openalex.org/W3213705378","https://openalex.org/W4214756064","https://openalex.org/W4247617015","https://openalex.org/W4312700658","https://openalex.org/W4366818928","https://openalex.org/W4367595705","https://openalex.org/W4379531887","https://openalex.org/W4386608660","https://openalex.org/W4388505269","https://openalex.org/W4389382592","https://openalex.org/W4395961216"],"related_works":["https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W1977959518","https://openalex.org/W2038908348","https://openalex.org/W2107890255","https://openalex.org/W2106552856","https://openalex.org/W2145821588","https://openalex.org/W2086122291","https://openalex.org/W1987513656"],"abstract_inverted_index":{"A":[0],"novel":[1,38],"control":[2],"design":[3,72],"problem":[4,48,66],"for":[5,31,96],"a":[6,37],"class":[7],"of":[8,34,83,99,147,157],"non-strict":[9,140],"feedback":[10,141],"multi-agent":[11],"systems":[12],"(MAS)":[13],"in":[14,51,68,122,138],"discrete-time":[15,35],"form":[16,142],"is":[17,61,73,94,108,129],"studied":[18],"based":[19],"on":[20],"reinforcement":[21],"learning":[22],"(RL)":[23],"and":[24,79,110],"applied":[25,130],"to":[26,115,131,143],"multi-marine":[27],"vehicles":[28],"(MMV).":[29],"Firstly,":[30],"this":[32,127,158],"kind":[33],"MAS,":[36],"system":[39],"transformation,":[40],"which":[41,134],"can":[42,135],"not":[43],"only":[44],"solve":[45],"the":[46,52,58,64,69,77,81,88,97,101,105,123,132,139,145,148,155],"noncausal":[47],"that":[49],"exists":[50],"backstepping":[53],"method":[54],"but":[55],"also":[56],"reduce":[57],"computational":[59],"complexity,":[60],"proposed.":[62],"Secondly,":[63],"algebraic-loop":[65],"inherent":[67],"conventional":[70],"controller":[71],"solved":[74],"by":[75],"compensating":[76],"dynamics":[78],"using":[80],"property":[82],"neural":[84],"network":[85],"(NN).":[86],"Thirdly,":[87],"multi-gradient":[89],"recursive":[90],"(MGR)":[91],"RL":[92],"scheme":[93,128],"developed":[95],"sake":[98],"designing":[100],"optimal":[102],"controller.":[103,150],"Finally,":[104],"stability":[106],"analysis":[107],"presented,":[109],"all":[111],"signals":[112],"are":[113],"ensured":[114],"be":[116,136],"semi-global":[117],"uniformly":[118],"ultimately":[119],"bounded":[120],"(SGUUB)":[121],"Lyapunov's":[124],"sense.":[125],"Besides,":[126],"MMV":[133,152],"described":[137],"extend":[144],"application":[146],"designed":[149],"The":[151],"simulation":[153],"demonstrates":[154],"validation":[156],"scheme.":[159]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":15},{"year":2024,"cited_by_count":1}],"updated_date":"2026-03-20T23:20:44.827607","created_date":"2025-10-10T00:00:00"}
