{"id":"https://openalex.org/W4393241388","doi":"https://doi.org/10.1109/tcst.2024.3377876","title":"Path-Following Control of Unmanned Underwater Vehicle Based on an Improved TD3 Deep Reinforcement Learning","display_name":"Path-Following Control of Unmanned Underwater Vehicle Based on an Improved TD3 Deep Reinforcement Learning","publication_year":2024,"publication_date":"2024-03-27","ids":{"openalex":"https://openalex.org/W4393241388","doi":"https://doi.org/10.1109/tcst.2024.3377876"},"language":"en","primary_location":{"id":"doi:10.1109/tcst.2024.3377876","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcst.2024.3377876","pdf_url":null,"source":{"id":"https://openalex.org/S133363738","display_name":"IEEE Transactions on Control Systems Technology","issn_l":"1063-6536","issn":["1063-6536","1558-0865","2374-0159"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Control Systems Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102636415","display_name":"Yexin Fan","orcid":null},"institutions":[{"id":"https://openalex.org/I39555362","display_name":"University of Warwick","ror":"https://ror.org/01a77tt86","country_code":"GB","type":"education","lineage":["https://openalex.org/I39555362"]}],"countries":["GB"],"is_corresponding":true,"raw_author_name":"Yexin Fan","raw_affiliation_strings":["Intelligent Control and Smart Energy (ICSE) Research Group, School of Engineering, University of Warwick, Coventry, U.K","School of Engineering, Intelligent Control and Smart Energy (ICSE) Research Group, University of Warwick, Coventry, U.K"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Intelligent Control and Smart Energy (ICSE) Research Group, School of Engineering, University of Warwick, Coventry, U.K","institution_ids":["https://openalex.org/I39555362"]},{"raw_affiliation_string":"School of Engineering, Intelligent Control and Smart Energy (ICSE) Research Group, University of Warwick, Coventry, U.K","institution_ids":["https://openalex.org/I39555362"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018165929","display_name":"Hongyang Dong","orcid":"https://orcid.org/0000-0003-4302-5323"},"institutions":[{"id":"https://openalex.org/I39555362","display_name":"University of Warwick","ror":"https://ror.org/01a77tt86","country_code":"GB","type":"education","lineage":["https://openalex.org/I39555362"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Hongyang Dong","raw_affiliation_strings":["Intelligent Control and Smart Energy (ICSE) Research Group, School of Engineering, University of Warwick, Coventry, U.K","School of Engineering, Intelligent Control and Smart Energy (ICSE) Research Group, University of Warwick, Coventry, U.K"],"raw_orcid":"https://orcid.org/0000-0003-4302-5323","affiliations":[{"raw_affiliation_string":"Intelligent Control and Smart Energy (ICSE) Research Group, School of Engineering, University of Warwick, Coventry, U.K","institution_ids":["https://openalex.org/I39555362"]},{"raw_affiliation_string":"School of Engineering, Intelligent Control and Smart Energy (ICSE) Research Group, University of Warwick, Coventry, U.K","institution_ids":["https://openalex.org/I39555362"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5000635250","display_name":"Xiaowei Zhao","orcid":"https://orcid.org/0000-0002-1182-4502"},"institutions":[{"id":"https://openalex.org/I39555362","display_name":"University of Warwick","ror":"https://ror.org/01a77tt86","country_code":"GB","type":"education","lineage":["https://openalex.org/I39555362"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Xiaowei Zhao","raw_affiliation_strings":["Intelligent Control and Smart Energy (ICSE) Research Group, School of Engineering, University of Warwick, Coventry, U.K","School of Engineering, Intelligent Control and Smart Energy (ICSE) Research Group, University of Warwick, Coventry, U.K"],"raw_orcid":"https://orcid.org/0000-0002-1182-4502","affiliations":[{"raw_affiliation_string":"Intelligent Control and Smart Energy (ICSE) Research Group, School of Engineering, University of Warwick, Coventry, U.K","institution_ids":["https://openalex.org/I39555362"]},{"raw_affiliation_string":"School of Engineering, Intelligent Control and Smart Energy (ICSE) Research Group, University of Warwick, Coventry, U.K","institution_ids":["https://openalex.org/I39555362"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5006072539","display_name":"Petr Denissenko","orcid":"https://orcid.org/0000-0002-9631-5810"},"institutions":[{"id":"https://openalex.org/I39555362","display_name":"University of Warwick","ror":"https://ror.org/01a77tt86","country_code":"GB","type":"education","lineage":["https://openalex.org/I39555362"]}],"countries":["GB"],"is_corresponding":false,"raw_author_name":"Petr Denissenko","raw_affiliation_strings":["School of Engineering, University of Warwick, Coventry, U.K"],"raw_orcid":"https://orcid.org/0000-0002-9631-5810","affiliations":[{"raw_affiliation_string":"School of Engineering, University of Warwick, Coventry, U.K","institution_ids":["https://openalex.org/I39555362"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5102636415"],"corresponding_institution_ids":["https://openalex.org/I39555362"],"apc_list":null,"apc_paid":null,"fwci":17.3686,"has_fulltext":false,"cited_by_count":56,"citation_normalized_percentile":{"value":0.99724093,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"32","issue":"5","first_page":"1904","last_page":"1919"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11192","display_name":"Underwater Vehicles and Communication Systems","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11192","display_name":"Underwater Vehicles and Communication Systems","score":0.9955999851226807,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10040","display_name":"Adaptive Control of Nonlinear Systems","score":0.9613999724388123,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10249","display_name":"Distributed Control Multi-Agent Systems","score":0.9232000112533569,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7008568048477173},{"id":"https://openalex.org/keywords/remotely-operated-underwater-vehicle","display_name":"Remotely operated underwater vehicle","score":0.5745019912719727},{"id":"https://openalex.org/keywords/underwater","display_name":"Underwater","score":0.5542867183685303},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5017039775848389},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.48414474725723267},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.46664857864379883},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.4445532262325287},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.3621748685836792},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.3292127251625061},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.2842693328857422},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.26001572608947754},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.14861884713172913},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.08805814385414124}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7008568048477173},{"id":"https://openalex.org/C145424490","wikidata":"https://www.wikidata.org/wiki/Q618465","display_name":"Remotely operated underwater vehicle","level":4,"score":0.5745019912719727},{"id":"https://openalex.org/C98083399","wikidata":"https://www.wikidata.org/wiki/Q3246517","display_name":"Underwater","level":2,"score":0.5542867183685303},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5017039775848389},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.48414474725723267},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.46664857864379883},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.4445532262325287},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.3621748685836792},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3292127251625061},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.2842693328857422},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.26001572608947754},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.14861884713172913},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.08805814385414124},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.0},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tcst.2024.3377876","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcst.2024.3377876","pdf_url":null,"source":{"id":"https://openalex.org/S133363738","display_name":"IEEE Transactions on Control Systems Technology","issn_l":"1063-6536","issn":["1063-6536","1558-0865","2374-0159"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Control Systems Technology","raw_type":"journal-article"},{"id":"pmh:oai:wrap.warwick.ac.uk:187403","is_oa":false,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4306400665","display_name":"Warwick Research Archive Portal (University of Warwick)","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I39555362","host_organization_name":"University of Warwick","host_organization_lineage":["https://openalex.org/I39555362"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"acceptedVersion","is_accepted":true,"is_published":false,"raw_source_name":"","raw_type":"Journal Article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4584818719","display_name":null,"funder_award_id":"EP/Y016297/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"},{"id":"https://openalex.org/G8910033785","display_name":"Supergen ORE Impact Hub 2023","funder_award_id":"EP/Y016297/1","funder_id":"https://openalex.org/F4320334627","funder_display_name":"Engineering and Physical Sciences Research Council"}],"funders":[{"id":"https://openalex.org/F4320334627","display_name":"Engineering and Physical Sciences Research Council","ror":"https://ror.org/0439y7842"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":47,"referenced_works":["https://openalex.org/W1845894706","https://openalex.org/W1945616565","https://openalex.org/W1979483959","https://openalex.org/W2021082829","https://openalex.org/W2126058202","https://openalex.org/W2145287296","https://openalex.org/W2192028265","https://openalex.org/W2201581102","https://openalex.org/W2512056218","https://openalex.org/W2774922731","https://openalex.org/W2792969186","https://openalex.org/W2808470116","https://openalex.org/W2908854797","https://openalex.org/W2963542245","https://openalex.org/W2963729305","https://openalex.org/W2963917788","https://openalex.org/W2966233982","https://openalex.org/W2972571107","https://openalex.org/W2973588514","https://openalex.org/W2978951642","https://openalex.org/W2999762404","https://openalex.org/W3006536688","https://openalex.org/W3013722072","https://openalex.org/W3023077548","https://openalex.org/W3034598088","https://openalex.org/W3046096360","https://openalex.org/W3102621632","https://openalex.org/W3135682060","https://openalex.org/W3164385739","https://openalex.org/W3206503085","https://openalex.org/W3207244163","https://openalex.org/W3207657697","https://openalex.org/W4206032480","https://openalex.org/W4206068387","https://openalex.org/W4206789995","https://openalex.org/W4220808849","https://openalex.org/W4280598493","https://openalex.org/W4282927171","https://openalex.org/W4289303873","https://openalex.org/W4289549727","https://openalex.org/W4297024676","https://openalex.org/W4312713104","https://openalex.org/W6640425456","https://openalex.org/W6687681856","https://openalex.org/W6748839928","https://openalex.org/W6771730547","https://openalex.org/W6797024940"],"related_works":["https://openalex.org/W2071768959","https://openalex.org/W4319442894","https://openalex.org/W2290286193","https://openalex.org/W2921408402","https://openalex.org/W2920061524","https://openalex.org/W4310083477","https://openalex.org/W2328553770","https://openalex.org/W4372267671","https://openalex.org/W2079693677","https://openalex.org/W4312756471"],"abstract_inverted_index":{"This":[0,19,105],"work":[1],"proposes":[2],"an":[3],"innovative":[4],"path-following":[5],"control":[6,86,95,139,178],"method,":[7],"anchored":[8],"in":[9,170,189],"deep":[10,55,181],"reinforcement":[11],"learning":[12,33,157],"(DRL),":[13],"for":[14],"unmanned":[15],"underwater":[16],"vehicles":[17],"(UUVs).":[18],"approach":[20],"is":[21,48,128,149],"driven":[22],"by":[23,68],"several":[24],"new":[25],"designs,":[26],"all":[27,204],"of":[28,65,135],"which":[29,130],"aim":[30],"to":[31,83,108,137,151,196,216],"enhance":[32],"efficiency":[34],"and":[35,37,50,74,114,155,186,202,211],"effectiveness":[36],"achieve":[38],"high-performance":[39],"UUV":[40,81,190],"control.":[41],"Specifically,":[42],"a":[43,70,123,132,142],"novel":[44],"experience":[45],"replay":[46],"strategy":[47],"designed":[49,150],"integrated":[51],"within":[52,93],"the":[53,63,80,138,218],"twin-delayed":[54],"deterministic":[56,182],"policy":[57,183],"gradient":[58,184],"algorithm":[59],"(TD3).":[60],"It":[61],"distinguishes":[62],"significance":[64],"stored":[66],"transitions":[67],"making":[69],"trade-off":[71],"between":[72],"rewards":[73,169],"temporal-difference":[75],"(TD)":[76],"errors,":[77],"thus":[78],"enabling":[79],"agent":[82],"explore":[84],"optimal":[85],"policies":[87],"more":[88],"efficiently.":[89],"Another":[90],"major":[91],"challenge":[92],"this":[94,121],"problem":[96],"arises":[97],"from":[98],"action":[99],"oscillations":[100],"associated":[101],"with":[102,175],"DRL":[103],"policies.":[104],"issue":[106],"leads":[107],"excessive":[109],"system":[110],"wear":[111],"on":[112],"actuators":[113],"makes":[115],"real-time":[116],"application":[117],"difficult.":[118],"To":[119],"mitigate":[120],"challenge,":[122],"newly":[124],"improved":[125],"regularization":[126],"method":[127,166],"proposed,":[129],"provides":[131],"moderate":[133],"level":[134],"smoothness":[136],"policy.":[140],"Furthermore,":[141],"dynamic":[143],"reward":[144],"function":[145],"featuring":[146],"adaptive":[147],"constraints":[148],"avoid":[152],"unproductive":[153],"exploration":[154],"expedite":[156],"convergence":[158],"speed":[159],"further.":[160],"Simulation":[161,210],"results":[162],"show":[163],"that":[164],"our":[165],"garners":[167],"higher":[168],"fewer":[171],"training":[172],"episodes":[173],"compared":[174],"mainstream":[176],"DRL-based":[177],"approaches":[179],"(e.g.,":[180],"(DDPG)":[185],"vanilla":[187],"TD3)":[188],"applications.":[191],"Moreover,":[192],"it":[193],"can":[194],"adapt":[195],"varying":[197],"path":[198],"configurations":[199],"amid":[200],"uncertainties":[201],"disturbances,":[203],"while":[205],"ensuring":[206],"high":[207],"tracking":[208],"accuracy.":[209],"experimental":[212],"studies":[213],"are":[214],"conducted":[215],"verify":[217],"effectiveness.":[219]},"counts_by_year":[{"year":2026,"cited_by_count":10},{"year":2025,"cited_by_count":39},{"year":2024,"cited_by_count":7}],"updated_date":"2026-05-15T08:27:34.491423","created_date":"2025-10-10T00:00:00"}
