{"id":"https://openalex.org/W2954957659","doi":"https://doi.org/10.1109/icnsc.2019.8743192","title":"Reinforcement Learning for Robots Path Planning with Rule-based Shallow-trial","display_name":"Reinforcement Learning for Robots Path Planning with Rule-based Shallow-trial","publication_year":2019,"publication_date":"2019-05-01","ids":{"openalex":"https://openalex.org/W2954957659","doi":"https://doi.org/10.1109/icnsc.2019.8743192","mag":"2954957659"},"language":"en","primary_location":{"id":"doi:10.1109/icnsc.2019.8743192","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icnsc.2019.8743192","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE 16th International Conference on Networking, Sensing and Control (ICNSC)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5031185739","display_name":"Kaiqiang Tang","orcid":"https://orcid.org/0000-0002-7456-0962"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kaiqiang Tang","raw_affiliation_strings":["Department of Control and Systems Engineenng, School of Management and Engineering, Nanjing University, Nanjing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Control and Systems Engineenng, School of Management and Engineering, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5025551679","display_name":"Huiqiao Fu","orcid":"https://orcid.org/0000-0001-9403-2449"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Huiqiao Fu","raw_affiliation_strings":["Department of Control and Systems Engineerin, School of Management and Engineering, Nanjing University, Mianyang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Control and Systems Engineerin, School of Management and Engineering, Nanjing University, Mianyang, China","institution_ids":["https://openalex.org/I881766915"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100650436","display_name":"Hao Jiang","orcid":"https://orcid.org/0000-0002-8901-0760"},"institutions":[{"id":"https://openalex.org/I1297991670","display_name":"Southwest University of Science and Technology","ror":"https://ror.org/04d996474","country_code":"CN","type":"education","lineage":["https://openalex.org/I1297991670"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hao Jiang","raw_affiliation_strings":["Southwest University of Science and Technology, Mianyang, Sichuan, CN"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Southwest University of Science and Technology, Mianyang, Sichuan, CN","institution_ids":["https://openalex.org/I1297991670"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5047792053","display_name":"Canghai Liu","orcid":"https://orcid.org/0009-0004-4890-1825"},"institutions":[{"id":"https://openalex.org/I1297991670","display_name":"Southwest University of Science and Technology","ror":"https://ror.org/04d996474","country_code":"CN","type":"education","lineage":["https://openalex.org/I1297991670"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Canghai Liu","raw_affiliation_strings":["School of Manufacturing Science and Engineenng, Key Laboratory of Testing Technology for Manufacturing Process of Ministry of Education, Southwest University of Science and Technology, Mianyang, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Manufacturing Science and Engineenng, Key Laboratory of Testing Technology for Manufacturing Process of Ministry of Education, Southwest University of Science and Technology, Mianyang, China","institution_ids":["https://openalex.org/I1297991670"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5060857183","display_name":"Lan Wang","orcid":"https://orcid.org/0000-0003-3852-1875"},"institutions":[{"id":"https://openalex.org/I881766915","display_name":"Nanjing University","ror":"https://ror.org/01rxvg760","country_code":"CN","type":"education","lineage":["https://openalex.org/I881766915"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Lan Wang","raw_affiliation_strings":["Department of Control and Systems Engineenng, Nanjing University, Nanjing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Department of Control and Systems Engineenng, Nanjing University, Nanjing, China","institution_ids":["https://openalex.org/I881766915"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.3051,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.60026454,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":95},"biblio":{"volume":"29","issue":null,"first_page":"340","last_page":"345"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.9994999766349792,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10653","display_name":"Robot Manipulation and Learning","score":0.9983999729156494,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8828663229942322},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6398604512214661},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.6349490284919739},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.6051896810531616},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5438836216926575},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.518618106842041},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.4552823305130005},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.41873079538345337},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.3532392978668213},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.2056712806224823},{"id":"https://openalex.org/keywords/computer-network","display_name":"Computer network","score":0.08941179513931274},{"id":"https://openalex.org/keywords/structural-engineering","display_name":"Structural engineering","score":0.05859294533729553}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8828663229942322},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6398604512214661},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.6349490284919739},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.6051896810531616},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5438836216926575},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.518618106842041},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.4552823305130005},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.41873079538345337},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.3532392978668213},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.2056712806224823},{"id":"https://openalex.org/C31258907","wikidata":"https://www.wikidata.org/wiki/Q1301371","display_name":"Computer network","level":1,"score":0.08941179513931274},{"id":"https://openalex.org/C66938386","wikidata":"https://www.wikidata.org/wiki/Q633538","display_name":"Structural engineering","level":1,"score":0.05859294533729553}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/icnsc.2019.8743192","is_oa":false,"landing_page_url":"https://doi.org/10.1109/icnsc.2019.8743192","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2019 IEEE 16th International Conference on Networking, Sensing and Control (ICNSC)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.4300000071525574,"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":23,"referenced_works":["https://openalex.org/W1638373997","https://openalex.org/W1752367861","https://openalex.org/W1977655452","https://openalex.org/W2033439284","https://openalex.org/W2056325504","https://openalex.org/W2117211893","https://openalex.org/W2210721416","https://openalex.org/W2259258048","https://openalex.org/W2343296810","https://openalex.org/W2345195955","https://openalex.org/W2401657790","https://openalex.org/W2413992829","https://openalex.org/W2525939318","https://openalex.org/W2571212026","https://openalex.org/W2592373391","https://openalex.org/W2773076209","https://openalex.org/W2789543555","https://openalex.org/W2793798239","https://openalex.org/W2824479732","https://openalex.org/W2952063594","https://openalex.org/W2963781688","https://openalex.org/W6636948731","https://openalex.org/W6731886670"],"related_works":["https://openalex.org/W1904098742","https://openalex.org/W3158921809","https://openalex.org/W2161428574","https://openalex.org/W2077416514","https://openalex.org/W2618632915","https://openalex.org/W2359600231","https://openalex.org/W4292862729","https://openalex.org/W2380019117","https://openalex.org/W2150982344","https://openalex.org/W2157678966"],"abstract_inverted_index":{"A":[0],"key":[1],"skill":[2],"for":[3,24],"mobile":[4,25],"robots":[5],"is":[6,18,79],"the":[7,52,88,103,109],"ability":[8],"to":[9,47,83,108],"navigate":[10],"efficiently":[11,50],"through":[12],"their":[13,66],"environment,":[14],"and":[15,35,94,114],"reinforcement":[16,106],"learning":[17,49,111,116],"widely":[19],"used":[20],"in":[21,56],"path":[22,72],"planning":[23],"robots.":[26],"However,":[27],"this":[28],"algorithm":[29],"has":[30,75],"a":[31,36],"slow":[32],"convergence":[33],"speed":[34],"large":[37],"number":[38],"of":[39,54,80,91,112],"iterations.":[40],"There":[41],"are":[42],"few":[43],"studies":[44],"on":[45,65],"how":[46],"improve":[48,115],"from":[51],"perspective":[53],"acquisition":[55],"rule-based":[57,104],"shallow-trial":[58,99,105],"strategy.":[59],"In":[60],"biological":[61],"world,":[62],"animals":[63],"depend":[64],"own":[67],"empirical":[68],"knowledge":[69,90],"when":[70],"making":[71],"planing.":[73],"Humanity":[74],"transcendental":[76,89],"knowledge,":[77],"which":[78],"great":[81],"help":[82],"peoples":[84],"navigation.":[85],"We":[86],"take":[87],"human":[92],"behavior,":[93],"express":[95],"it":[96],"acts":[97],"as":[98],"rules,":[100],"then":[101],"apply":[102],"learning(RSRL)":[107],"navigation":[110],"robot":[113],"efficiently.":[117]},"counts_by_year":[{"year":2021,"cited_by_count":2},{"year":2019,"cited_by_count":1}],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
