{"id":"https://openalex.org/W4416677242","doi":"https://doi.org/10.1109/sbr/wre66973.2025.11249623","title":"Reinforcement Learning-Based Path Following for Robots: A Survey of Reward Functions","display_name":"Reinforcement Learning-Based Path Following for Robots: A Survey of Reward Functions","publication_year":2025,"publication_date":"2025-10-13","ids":{"openalex":"https://openalex.org/W4416677242","doi":"https://doi.org/10.1109/sbr/wre66973.2025.11249623"},"language":null,"primary_location":{"id":"doi:10.1109/sbr/wre66973.2025.11249623","is_oa":false,"landing_page_url":"https://doi.org/10.1109/sbr/wre66973.2025.11249623","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Brazilian Symposium on Robotics (SBR) and 2025 Workshop on Robotics in Education (WRE)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5045992220","display_name":"Jardel D. S. Dyonisio","orcid":"https://orcid.org/0009-0003-7722-7203"},"institutions":[{"id":"https://openalex.org/I126460647","display_name":"Universidade Federal do Rio Grande","ror":"https://ror.org/05hpfkn88","country_code":"BR","type":"education","lineage":["https://openalex.org/I126460647"]},{"id":"https://openalex.org/I94328231","display_name":"University of Rio Grande and Rio Grande Community College","ror":"https://ror.org/02sghbs34","country_code":"US","type":"education","lineage":["https://openalex.org/I94328231"]}],"countries":["BR","US"],"is_corresponding":false,"raw_author_name":"Jardel dos Santos Dyonisio","raw_affiliation_strings":["Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil"],"raw_orcid":"https://orcid.org/0009-0003-7722-7203","affiliations":[{"raw_affiliation_string":"Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil","institution_ids":["https://openalex.org/I126460647","https://openalex.org/I94328231"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5004365999","display_name":"Stephanie L. Bri\u00e3o","orcid":"https://orcid.org/0000-0001-9345-2038"},"institutions":[{"id":"https://openalex.org/I126460647","display_name":"Universidade Federal do Rio Grande","ror":"https://ror.org/05hpfkn88","country_code":"BR","type":"education","lineage":["https://openalex.org/I126460647"]},{"id":"https://openalex.org/I94328231","display_name":"University of Rio Grande and Rio Grande Community College","ror":"https://ror.org/02sghbs34","country_code":"US","type":"education","lineage":["https://openalex.org/I94328231"]}],"countries":["BR","US"],"is_corresponding":false,"raw_author_name":"Stephanie Loi Bri\u00e3o","raw_affiliation_strings":["Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil"],"raw_orcid":"https://orcid.org/0000-0001-9345-2038","affiliations":[{"raw_affiliation_string":"Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil","institution_ids":["https://openalex.org/I126460647","https://openalex.org/I94328231"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020192402","display_name":"Kristofer S. Kappel","orcid":"https://orcid.org/0000-0002-9124-8540"},"institutions":[{"id":"https://openalex.org/I126460647","display_name":"Universidade Federal do Rio Grande","ror":"https://ror.org/05hpfkn88","country_code":"BR","type":"education","lineage":["https://openalex.org/I126460647"]},{"id":"https://openalex.org/I94328231","display_name":"University of Rio Grande and Rio Grande Community College","ror":"https://ror.org/02sghbs34","country_code":"US","type":"education","lineage":["https://openalex.org/I94328231"]}],"countries":["BR","US"],"is_corresponding":false,"raw_author_name":"Kristofer Stift Kappel","raw_affiliation_strings":["Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil"],"raw_orcid":"https://orcid.org/0000-0002-9124-8540","affiliations":[{"raw_affiliation_string":"Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil","institution_ids":["https://openalex.org/I126460647","https://openalex.org/I94328231"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017613080","display_name":"Rodrigo da Silva Guerra","orcid":"https://orcid.org/0000-0003-4011-0901"},"institutions":[{"id":"https://openalex.org/I126460647","display_name":"Universidade Federal do Rio Grande","ror":"https://ror.org/05hpfkn88","country_code":"BR","type":"education","lineage":["https://openalex.org/I126460647"]},{"id":"https://openalex.org/I94328231","display_name":"University of Rio Grande and Rio Grande Community College","ror":"https://ror.org/02sghbs34","country_code":"US","type":"education","lineage":["https://openalex.org/I94328231"]}],"countries":["BR","US"],"is_corresponding":false,"raw_author_name":"Rodrigo Silva Guerra","raw_affiliation_strings":["Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil"],"raw_orcid":"https://orcid.org/0000-0003-4011-0901","affiliations":[{"raw_affiliation_string":"Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil","institution_ids":["https://openalex.org/I126460647","https://openalex.org/I94328231"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022136971","display_name":"Emanuel da Silva Diaz Estrada","orcid":"https://orcid.org/0000-0003-4088-5002"},"institutions":[{"id":"https://openalex.org/I126460647","display_name":"Universidade Federal do Rio Grande","ror":"https://ror.org/05hpfkn88","country_code":"BR","type":"education","lineage":["https://openalex.org/I126460647"]},{"id":"https://openalex.org/I94328231","display_name":"University of Rio Grande and Rio Grande Community College","ror":"https://ror.org/02sghbs34","country_code":"US","type":"education","lineage":["https://openalex.org/I94328231"]}],"countries":["BR","US"],"is_corresponding":false,"raw_author_name":"Emanuel da Silva Diaz Estrada","raw_affiliation_strings":["Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil"],"raw_orcid":"https://orcid.org/0000-0003-4088-5002","affiliations":[{"raw_affiliation_string":"Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil","institution_ids":["https://openalex.org/I126460647","https://openalex.org/I94328231"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037041582","display_name":"Paulo Drews","orcid":"https://orcid.org/0000-0002-7519-0502"},"institutions":[{"id":"https://openalex.org/I126460647","display_name":"Universidade Federal do Rio Grande","ror":"https://ror.org/05hpfkn88","country_code":"BR","type":"education","lineage":["https://openalex.org/I126460647"]},{"id":"https://openalex.org/I94328231","display_name":"University of Rio Grande and Rio Grande Community College","ror":"https://ror.org/02sghbs34","country_code":"US","type":"education","lineage":["https://openalex.org/I94328231"]}],"countries":["BR","US"],"is_corresponding":false,"raw_author_name":"Paulo Lilles Jorge Drews","raw_affiliation_strings":["Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil"],"raw_orcid":"https://orcid.org/0000-0002-7519-0502","affiliations":[{"raw_affiliation_string":"Centro de Ciencias Computacionais, Universidade Federal de Rio Grande,Rio Grande,Brazil","institution_ids":["https://openalex.org/I126460647","https://openalex.org/I94328231"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.17316584,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"158","last_page":"163"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.522599995136261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.522599995136261,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.17870000004768372,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.049300000071525574,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.8374999761581421},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.6008999943733215},{"id":"https://openalex.org/keywords/reinforcement","display_name":"Reinforcement","score":0.5254999995231628},{"id":"https://openalex.org/keywords/reward-system","display_name":"Reward system","score":0.5189999938011169},{"id":"https://openalex.org/keywords/domain","display_name":"Domain (mathematical analysis)","score":0.45489999651908875},{"id":"https://openalex.org/keywords/mobile-robot","display_name":"Mobile robot","score":0.4544999897480011}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.8374999761581421},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.6008999943733215},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5931000113487244},{"id":"https://openalex.org/C67203356","wikidata":"https://www.wikidata.org/wiki/Q1321905","display_name":"Reinforcement","level":2,"score":0.5254999995231628},{"id":"https://openalex.org/C143661069","wikidata":"https://www.wikidata.org/wiki/Q670713","display_name":"Reward system","level":2,"score":0.5189999938011169},{"id":"https://openalex.org/C36503486","wikidata":"https://www.wikidata.org/wiki/Q11235244","display_name":"Domain (mathematical analysis)","level":2,"score":0.45489999651908875},{"id":"https://openalex.org/C19966478","wikidata":"https://www.wikidata.org/wiki/Q4810574","display_name":"Mobile robot","level":3,"score":0.4544999897480011},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3953999876976013},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.3935999870300293},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.34529998898506165},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3443000018596649},{"id":"https://openalex.org/C196340769","wikidata":"https://www.wikidata.org/wiki/Q7698910","display_name":"Temporal difference learning","level":3,"score":0.2865999937057495}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/sbr/wre66973.2025.11249623","is_oa":false,"landing_page_url":"https://doi.org/10.1109/sbr/wre66973.2025.11249623","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 Brazilian Symposium on Robotics (SBR) and 2025 Workshop on Robotics in Education (WRE)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":30,"referenced_works":["https://openalex.org/W2007866599","https://openalex.org/W2198041288","https://openalex.org/W2515466314","https://openalex.org/W2754000639","https://openalex.org/W2897767831","https://openalex.org/W2908536213","https://openalex.org/W2963917788","https://openalex.org/W3008195728","https://openalex.org/W3008232782","https://openalex.org/W3023077548","https://openalex.org/W3046474649","https://openalex.org/W3047772261","https://openalex.org/W3094546435","https://openalex.org/W3119264617","https://openalex.org/W3127561923","https://openalex.org/W3152878473","https://openalex.org/W4210643767","https://openalex.org/W4313496152","https://openalex.org/W4389276149","https://openalex.org/W4389332619","https://openalex.org/W4390755345","https://openalex.org/W4390933158","https://openalex.org/W4392266853","https://openalex.org/W4400648754","https://openalex.org/W4405180451","https://openalex.org/W4406459482","https://openalex.org/W4407524863","https://openalex.org/W4409262116","https://openalex.org/W4410229622","https://openalex.org/W4411233466"],"related_works":[],"abstract_inverted_index":{"Reward":[0],"functions":[1,24,41,68],"define":[2],"an":[3],"agent's":[4],"behavior":[5],"in":[6,59,102],"reinforcement":[7,99],"learning":[8,100],"by":[9],"determining":[10],"actions":[11],"based":[12],"on":[13,43],"the":[14,18,26,31,66,94],"feedback":[15,57],"received.":[16],"In":[17],"domain":[19],"of":[20,39,65],"path":[21],"following,":[22],"reward":[23,40,67,80,95],"guide":[25],"agent":[27],"toward":[28],"successfully":[29],"following":[30],"desired":[32],"path.":[33],"This":[34],"paper":[35],"presents":[36],"a":[37],"survey":[38],"focused":[42],"path-following":[44],"tasks":[45],"for":[46,78],"mobile":[47,84],"robots.":[48],"The":[49],"characteristics,":[50],"strategies,":[51],"and":[52,75,83],"challenges":[53],"associated":[54],"with":[55],"creating":[56],"mechanisms":[58],"various":[60],"domains":[61],"are":[62,73,86],"highlighted.":[63],"Components":[64],"that":[69,97],"can":[70],"be":[71],"controlled":[72],"explored":[74],"discussed.":[76],"Furthermore,":[77],"each":[79],"function,":[81],"scenarios":[82],"robots":[85],"indicated.":[87],"Thus,":[88],"this":[89],"study":[90],"provides":[91],"insights":[92],"into":[93],"components":[96],"influence":[98],"systems":[101],"robotic":[103],"navigation.":[104]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-11-25T00:00:00"}
