{"id":"https://openalex.org/W2138366160","doi":"https://doi.org/10.1109/robio.2009.5420445","title":"Application of Reinforcement Learning to autonomous heading control for bionic underwater robots","display_name":"Application of Reinforcement Learning to autonomous heading control for bionic underwater robots","publication_year":2009,"publication_date":"2009-12-01","ids":{"openalex":"https://openalex.org/W2138366160","doi":"https://doi.org/10.1109/robio.2009.5420445","mag":"2138366160"},"language":"en","primary_location":{"id":"doi:10.1109/robio.2009.5420445","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio.2009.5420445","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100829512","display_name":"Longxin Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Longxin Lin","raw_affiliation_strings":["National University of Defense Technology, Changsha, China","National University of Defense, Technology, ChangSha, China#TAB#"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"National University of Defense, Technology, ChangSha, China#TAB#","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5032618881","display_name":"Haibin Xie","orcid":"https://orcid.org/0000-0002-6650-9155"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haibin Xie","raw_affiliation_strings":["National University of Defense Technology, Changsha, China","National University of Defense, Technology, ChangSha, China#TAB#"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"National University of Defense, Technology, ChangSha, China#TAB#","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5056012647","display_name":"Lincheng Shen","orcid":null},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lincheng Shen","raw_affiliation_strings":["National University of Defense Technology, Changsha, China","National University of Defense, Technology, ChangSha, China#TAB#"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Changsha, China","institution_ids":["https://openalex.org/I170215575"]},{"raw_affiliation_string":"National University of Defense, Technology, ChangSha, China#TAB#","institution_ids":["https://openalex.org/I170215575"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5100829512"],"corresponding_institution_ids":["https://openalex.org/I170215575"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":7,"citation_normalized_percentile":{"value":0.1161294,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":89,"max":99},"biblio":{"volume":"55","issue":null,"first_page":"2486","last_page":"2490"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11170","display_name":"Biomimetic flight and propulsion mechanisms","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11170","display_name":"Biomimetic flight and propulsion mechanisms","score":0.9980999827384949,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11192","display_name":"Underwater Vehicles and Communication Systems","score":0.9970999956130981,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.9962000250816345,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/heading","display_name":"Heading (navigation)","score":0.8075894117355347},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.7938863635063171},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.784957230091095},{"id":"https://openalex.org/keywords/underwater","display_name":"Underwater","score":0.7466700673103333},{"id":"https://openalex.org/keywords/robot-control","display_name":"Robot control","score":0.492497056722641},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.48600515723228455},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4679621160030365},{"id":"https://openalex.org/keywords/robot-learning","display_name":"Robot learning","score":0.46065306663513184},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.45957040786743164},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.45122095942497253},{"id":"https://openalex.org/keywords/control-engineering","display_name":"Control engineering","score":0.4275432825088501},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.40757471323013306},{"id":"https://openalex.org/keywords/simulation","display_name":"Simulation","score":0.3252320885658264},{"id":"https://openalex.org/keywords/aerospace-engineering","display_name":"Aerospace engineering","score":0.07674077153205872}],"concepts":[{"id":"https://openalex.org/C2776937971","wikidata":"https://www.wikidata.org/wiki/Q4384217","display_name":"Heading (navigation)","level":2,"score":0.8075894117355347},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.7938863635063171},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.784957230091095},{"id":"https://openalex.org/C98083399","wikidata":"https://www.wikidata.org/wiki/Q3246517","display_name":"Underwater","level":2,"score":0.7466700673103333},{"id":"https://openalex.org/C65401140","wikidata":"https://www.wikidata.org/wiki/Q7353385","display_name":"Robot control","level":4,"score":0.492497056722641},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48600515723228455},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4679621160030365},{"id":"https://openalex.org/C188888258","wikidata":"https://www.wikidata.org/wiki/Q7353390","display_name":"Robot learning","level":4,"score":0.46065306663513184},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.45957040786743164},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.45122095942497253},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.4275432825088501},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.40757471323013306},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.3252320885658264},{"id":"https://openalex.org/C146978453","wikidata":"https://www.wikidata.org/wiki/Q3798668","display_name":"Aerospace engineering","level":1,"score":0.07674077153205872},{"id":"https://openalex.org/C127313418","wikidata":"https://www.wikidata.org/wiki/Q1069","display_name":"Geology","level":0,"score":0.0},{"id":"https://openalex.org/C111368507","wikidata":"https://www.wikidata.org/wiki/Q43518","display_name":"Oceanography","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/robio.2009.5420445","is_oa":false,"landing_page_url":"https://doi.org/10.1109/robio.2009.5420445","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2009 IEEE International Conference on Robotics and Biomimetics (ROBIO)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/14","score":0.6600000262260437,"display_name":"Life below water"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320320766","display_name":"Nanyang Technological University","ror":"https://ror.org/02e7b5302"},{"id":"https://openalex.org/F4320322684","display_name":"Hubei University of Automotive Technology","ror":"https://ror.org/039m95m06"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":11,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1972789031","https://openalex.org/W2029230226","https://openalex.org/W2062859931","https://openalex.org/W2086389099","https://openalex.org/W2101190173","https://openalex.org/W2114882146","https://openalex.org/W2117289015","https://openalex.org/W2125353490","https://openalex.org/W2162836633","https://openalex.org/W3209380510"],"related_works":["https://openalex.org/W2930863966","https://openalex.org/W2126211886","https://openalex.org/W3153786280","https://openalex.org/W3127551068","https://openalex.org/W2165180011","https://openalex.org/W3165944253","https://openalex.org/W4220829754","https://openalex.org/W2351343564","https://openalex.org/W2170052867","https://openalex.org/W2171010636"],"abstract_inverted_index":{"The":[0,101],"bionic":[1,23,94,143],"underwater":[2,16,24,95,144],"robot":[3,76,96,145],"propelled":[4],"by":[5,60],"undulating":[6,45,99],"fins":[7],"is":[8],"an":[9],"interesting":[10],"field":[11],"in":[12,137],"current":[13],"research":[14],"on":[15],"robots.":[17],"With":[18,127],"the":[19,51,63,71,81,86,110,115,128,131,142],"prosperous":[20],"development":[21],"of":[22,39,41,44,93,133,141],"robots,":[25],"its":[26,57],"control":[27,58,89,123,140],"problem":[28],"remains":[29],"big":[30],"challenging":[31],"for":[32,90],"strong":[33],"nonlinearity,":[34],"uncertainty":[35],"environments,":[36],"and":[37,65,112,120],"lack":[38],"understanding":[40],"dynamic":[42],"characteristics":[43],"fins.":[46,100],"As":[47],"a":[48,67,91],"model-free":[49],"method,":[50],"Q-learning":[52],"based":[53],"reinforcement":[54,134],"learning":[55,135],"achieves":[56],"motivation":[59],"interacting":[61],"with":[62,97],"environment":[64],"maximizing":[66],"reward,":[68],"so":[69],"suits":[70],"complicated":[72],"applications":[73],"such":[74],"as":[75],"control.":[77],"This":[78],"paper":[79],"introduced":[80],"online":[82],"Q_learning":[83],"algorithm":[84,102,136],"to":[85,105],"autonomous":[87,138],"heading":[88,139],"kind":[92],"two":[98],"doesn't":[103],"need":[104],"know":[106],"any":[107],"knowledge":[108],"about":[109],"robot,":[111],"can":[113],"learn":[114],"internal":[116],"mapping":[117],"between":[118],"states":[119],"actions":[121],"that":[122],"behaviors":[124],"must":[125],"contain.":[126],"simulation":[129],"experiments,":[130],"validity":[132],"was":[146],"validated.":[147]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2024,"cited_by_count":1},{"year":2023,"cited_by_count":1},{"year":2020,"cited_by_count":1},{"year":2019,"cited_by_count":2},{"year":2014,"cited_by_count":1}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
