{"id":"https://openalex.org/W4399430147","doi":"https://doi.org/10.3390/rs16122072","title":"A Soft Actor-Critic Deep Reinforcement-Learning-Based Robot Navigation Method Using LiDAR","display_name":"A Soft Actor-Critic Deep Reinforcement-Learning-Based Robot Navigation Method Using LiDAR","publication_year":2024,"publication_date":"2024-06-07","ids":{"openalex":"https://openalex.org/W4399430147","doi":"https://doi.org/10.3390/rs16122072"},"language":"en","primary_location":{"id":"doi:10.3390/rs16122072","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs16122072","pdf_url":"https://www.mdpi.com/2072-4292/16/12/2072/pdf?version=1717768303","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","doaj"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://www.mdpi.com/2072-4292/16/12/2072/pdf?version=1717768303","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100601303","display_name":"Yanjie Liu","orcid":"https://orcid.org/0000-0002-7274-4979"},"institutions":[{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]},{"id":"https://openalex.org/I4391767639","display_name":"State Key Laboratory of Robotics and Systems","ror":"https://ror.org/015m77g16","country_code":null,"type":"facility","lineage":["https://openalex.org/I204983213","https://openalex.org/I4391767639"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanjie Liu","raw_affiliation_strings":["State Key Laboratory of Robotics and Systems (HIT), Department of Mechatronics Engineering, Harbin Institute of Technology, Harbin 150001, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and Systems (HIT), Department of Mechatronics Engineering, Harbin Institute of Technology, Harbin 150001, China","institution_ids":["https://openalex.org/I204983213","https://openalex.org/I4391767639"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101940143","display_name":"Chao Wang","orcid":"https://orcid.org/0000-0002-0343-3982"},"institutions":[{"id":"https://openalex.org/I4391767639","display_name":"State Key Laboratory of Robotics and Systems","ror":"https://ror.org/015m77g16","country_code":null,"type":"facility","lineage":["https://openalex.org/I204983213","https://openalex.org/I4391767639"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Chao Wang","raw_affiliation_strings":["State Key Laboratory of Robotics and Systems (HIT), Department of Mechatronics Engineering, Harbin Institute of Technology, Harbin 150001, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and Systems (HIT), Department of Mechatronics Engineering, Harbin Institute of Technology, Harbin 150001, China","institution_ids":["https://openalex.org/I204983213","https://openalex.org/I4391767639"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5008282144","display_name":"Changsen Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I4391767639","display_name":"State Key Laboratory of Robotics and Systems","ror":"https://ror.org/015m77g16","country_code":null,"type":"facility","lineage":["https://openalex.org/I204983213","https://openalex.org/I4391767639"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Changsen Zhao","raw_affiliation_strings":["State Key Laboratory of Robotics and Systems (HIT), Department of Mechatronics Engineering, Harbin Institute of Technology, Harbin 150001, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and Systems (HIT), Department of Mechatronics Engineering, Harbin Institute of Technology, Harbin 150001, China","institution_ids":["https://openalex.org/I204983213","https://openalex.org/I4391767639"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100341990","display_name":"Wu H","orcid":"https://orcid.org/0009-0008-8295-0400"},"institutions":[{"id":"https://openalex.org/I4391767639","display_name":"State Key Laboratory of Robotics and Systems","ror":"https://ror.org/015m77g16","country_code":null,"type":"facility","lineage":["https://openalex.org/I204983213","https://openalex.org/I4391767639"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Heng Wu","raw_affiliation_strings":["State Key Laboratory of Robotics and Systems (HIT), Department of Mechatronics Engineering, Harbin Institute of Technology, Harbin 150001, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and Systems (HIT), Department of Mechatronics Engineering, Harbin Institute of Technology, Harbin 150001, China","institution_ids":["https://openalex.org/I204983213","https://openalex.org/I4391767639"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5086405236","display_name":"Yanlong Wei","orcid":null},"institutions":[{"id":"https://openalex.org/I4391767639","display_name":"State Key Laboratory of Robotics and Systems","ror":"https://ror.org/015m77g16","country_code":null,"type":"facility","lineage":["https://openalex.org/I204983213","https://openalex.org/I4391767639"]},{"id":"https://openalex.org/I204983213","display_name":"Harbin Institute of Technology","ror":"https://ror.org/01yqg2h08","country_code":"CN","type":"education","lineage":["https://openalex.org/I204983213"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yanlong Wei","raw_affiliation_strings":["State Key Laboratory of Robotics and Systems (HIT), Department of Mechatronics Engineering, Harbin Institute of Technology, Harbin 150001, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Robotics and Systems (HIT), Department of Mechatronics Engineering, Harbin Institute of Technology, Harbin 150001, China","institution_ids":["https://openalex.org/I204983213","https://openalex.org/I4391767639"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101940143"],"corresponding_institution_ids":["https://openalex.org/I204983213","https://openalex.org/I4391767639"],"apc_list":{"value":2500,"currency":"CHF","value_usd":2707},"apc_paid":{"value":2500,"currency":"CHF","value_usd":2707},"fwci":5.1814,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.95940066,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":94,"max":100},"biblio":{"volume":"16","issue":"12","first_page":"2072","last_page":"2072"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9988999962806702,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9965000152587891,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9918000102043152,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8490530252456665},{"id":"https://openalex.org/keywords/obstacle-avoidance","display_name":"Obstacle avoidance","score":0.8225687146186829},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7877858281135559},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6647883653640747},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.5375252962112427},{"id":"https://openalex.org/keywords/obstacle","display_name":"Obstacle","score":0.516042947769165},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.41789793968200684},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.4116251468658447},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.33852607011795044},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.3111571669578552}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8490530252456665},{"id":"https://openalex.org/C6683253","wikidata":"https://www.wikidata.org/wiki/Q7075535","display_name":"Obstacle avoidance","level":4,"score":0.8225687146186829},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7877858281135559},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6647883653640747},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.5375252962112427},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.516042947769165},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.41789793968200684},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.4116251468658447},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33852607011795044},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.3111571669578552},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.0},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.3390/rs16122072","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs16122072","pdf_url":"https://www.mdpi.com/2072-4292/16/12/2072/pdf?version=1717768303","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},{"id":"pmh:oai:doaj.org/article:43c039fde36b4839bb489f676c30175d","is_oa":true,"landing_page_url":"https://doaj.org/article/43c039fde36b4839bb489f676c30175d","pdf_url":null,"source":{"id":"https://openalex.org/S112646816","display_name":"SHILAP Revista de lepidopterolog\u00eda","issn_l":"0300-5267","issn":["0300-5267","2340-4078"],"is_oa":true,"is_in_doaj":true,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":"Remote Sensing, Vol 16, Iss 12, p 2072 (2024)","raw_type":"article"}],"best_oa_location":{"id":"doi:10.3390/rs16122072","is_oa":true,"landing_page_url":"https://doi.org/10.3390/rs16122072","pdf_url":"https://www.mdpi.com/2072-4292/16/12/2072/pdf?version=1717768303","source":{"id":"https://openalex.org/S43295729","display_name":"Remote Sensing","issn_l":"2072-4292","issn":["2072-4292"],"is_oa":true,"is_in_doaj":true,"is_core":true,"host_organization":"https://openalex.org/P4310310987","host_organization_name":"Multidisciplinary Digital Publishing Institute","host_organization_lineage":["https://openalex.org/P4310310987"],"host_organization_lineage_names":["Multidisciplinary Digital Publishing Institute"],"type":"journal"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Remote Sensing","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4399430147.pdf"},"referenced_works_count":21,"referenced_works":["https://openalex.org/W192919555","https://openalex.org/W1665214252","https://openalex.org/W1994955764","https://openalex.org/W2124175081","https://openalex.org/W2173564293","https://openalex.org/W2562788852","https://openalex.org/W2594103415","https://openalex.org/W2746553466","https://openalex.org/W3041244724","https://openalex.org/W3163878499","https://openalex.org/W3176452384","https://openalex.org/W3205400264","https://openalex.org/W4240813273","https://openalex.org/W4316038501","https://openalex.org/W4385655053","https://openalex.org/W4387170679","https://openalex.org/W4388379734","https://openalex.org/W4391853549","https://openalex.org/W4392514157","https://openalex.org/W4393979731","https://openalex.org/W6684205842"],"related_works":["https://openalex.org/W2930076404","https://openalex.org/W4253519380","https://openalex.org/W2071957557","https://openalex.org/W2596413128","https://openalex.org/W4391249562","https://openalex.org/W2356867392","https://openalex.org/W2782776446","https://openalex.org/W3043170174","https://openalex.org/W2155948905","https://openalex.org/W2906946336"],"abstract_inverted_index":{"When":[0],"there":[1],"are":[2],"dynamic":[3,148],"obstacles":[4],"in":[5,140,147],"the":[6,48,55,82,88,108,112,123,127,135,179,183],"environment,":[7],"it":[8,63,155],"is":[9,156],"difficult":[10],"for":[11,87],"traditional":[12],"path-generation":[13,44],"algorithms":[14],"to":[15,46,50,80,106,133,172],"achieve":[16],"desired":[17],"obstacle-avoidance":[18,145,180],"results.":[19],"To":[20],"solve":[21],"this":[22],"problem,":[23],"we":[24,40,68,98,115],"propose":[25],"a":[26,42,65,141,163],"robot":[27,49,56,184],"navigation":[28,131,168],"control":[29,47],"method":[30,105,161],"based":[31,76],"on":[32,77],"SAC":[33,70,128],"(Soft":[34],"Actor-Critic)":[35],"Deep":[36,129],"Reinforcement":[37],"Learning.":[38],"Firstly,":[39],"use":[41,99],"fast":[43],"algorithm":[45],"generate":[51],"expert":[52,78,96],"trajectories":[53,79],"when":[54,62],"encounters":[57],"danger":[58],"as":[59,61],"well":[60],"approaches":[64],"target,":[66],"and":[67,95,144,152,167],"combine":[69],"reinforcement":[71],"learning":[72,75,109],"with":[73],"imitation":[74],"improve":[81,107,134],"safety":[83],"of":[84,92,111,126,182],"training.":[85],"Then,":[86],"hybrid":[89],"data":[90,94],"consisting":[91],"agent":[93],"data,":[97],"an":[100],"improved":[101],"prioritized":[102],"experience":[103],"replay":[104],"efficiency":[110,166],"policies.":[113],"Finally,":[114],"introduce":[116],"RNN":[117],"(Recurrent":[118],"Neural":[119],"Network)":[120],"units":[121],"into":[122],"network":[124],"structure":[125],"Reinforcement-Learning":[130],"policy":[132],"agent\u2019s":[136],"transfer":[137],"inference":[138],"ability":[139,146],"new":[142],"environment":[143],"environments.":[149],"Through":[150],"simulation":[151],"practical":[153],"experiments,":[154],"fully":[157],"verified":[158],"that":[159],"our":[160],"has":[162],"higher":[164],"training":[165],"success":[169],"rate":[170],"compared":[171],"state-of-the-art":[173],"reinforcement-learning":[174],"algorithms,":[175],"which":[176],"further":[177],"enhances":[178],"capability":[181],"system.":[185]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":8},{"year":2024,"cited_by_count":2}],"updated_date":"2026-04-02T15:55:50.835912","created_date":"2025-10-10T00:00:00"}
