{"id":"https://openalex.org/W7154476485","doi":"https://doi.org/10.1109/upinlbs68186.2025.11468417","title":"Reinforcement-Fine-Tuned LLM Navigation Decision-Making System: A Dynamic Obstacle Avoidance Method Based on the Time-Decay Reward Mechanism","display_name":"Reinforcement-Fine-Tuned LLM Navigation Decision-Making System: A Dynamic Obstacle Avoidance Method Based on the Time-Decay Reward Mechanism","publication_year":2025,"publication_date":"2025-12-17","ids":{"openalex":"https://openalex.org/W7154476485","doi":"https://doi.org/10.1109/upinlbs68186.2025.11468417"},"language":null,"primary_location":{"id":"doi:10.1109/upinlbs68186.2025.11468417","is_oa":false,"landing_page_url":"https://doi.org/10.1109/upinlbs68186.2025.11468417","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Ubiquitous Positioning, Indoor Navigation and Location-Based Services Conference (UPINLBS)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5133682327","display_name":"Yukang Lou","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210118728","display_name":"State Key Laboratory of Information Engineering in Surveying Mapping and Remote Sensing","ror":"https://ror.org/02bpap860","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210118728"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yukang Lou","raw_affiliation_strings":["Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China","institution_ids":["https://openalex.org/I4210118728","https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132620177","display_name":"Z G Cao","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210118728","display_name":"State Key Laboratory of Information Engineering in Surveying Mapping and Remote Sensing","ror":"https://ror.org/02bpap860","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210118728"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhen Cao","raw_affiliation_strings":["Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China","institution_ids":["https://openalex.org/I4210118728","https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100427179","display_name":"Haoyu Wang","orcid":"https://orcid.org/0000-0002-2124-3453"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210118728","display_name":"State Key Laboratory of Information Engineering in Surveying Mapping and Remote Sensing","ror":"https://ror.org/02bpap860","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210118728"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoyu Wang","raw_affiliation_strings":["Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China","institution_ids":["https://openalex.org/I4210118728","https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133700857","display_name":"Zilong Xiao","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210118728","display_name":"State Key Laboratory of Information Engineering in Surveying Mapping and Remote Sensing","ror":"https://ror.org/02bpap860","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210118728"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zilong Xiao","raw_affiliation_strings":["Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China","institution_ids":["https://openalex.org/I4210118728","https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100710578","display_name":"Hongjuan Zhang","orcid":"https://orcid.org/0000-0002-2545-8451"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210118728","display_name":"State Key Laboratory of Information Engineering in Surveying Mapping and Remote Sensing","ror":"https://ror.org/02bpap860","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210118728"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongjuan Zhang","raw_affiliation_strings":["Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China","institution_ids":["https://openalex.org/I4210118728","https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133674026","display_name":"Zhen Dong","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210118728","display_name":"State Key Laboratory of Information Engineering in Surveying Mapping and Remote Sensing","ror":"https://ror.org/02bpap860","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210118728"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhen Dong","raw_affiliation_strings":["Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China","institution_ids":["https://openalex.org/I4210118728","https://openalex.org/I37461747"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5133633336","display_name":"Bijun Li","orcid":null},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]},{"id":"https://openalex.org/I4210118728","display_name":"State Key Laboratory of Information Engineering in Surveying Mapping and Remote Sensing","ror":"https://ror.org/02bpap860","country_code":"CN","type":"facility","lineage":["https://openalex.org/I4210118728"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bijun Li","raw_affiliation_strings":["Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China"],"affiliations":[{"raw_affiliation_string":"Wuhan University,State Key Laboratory of Information Engineering in Surveying, Mapping and Remote Sensing,Wuhan,China","institution_ids":["https://openalex.org/I4210118728","https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5133682327"],"corresponding_institution_ids":["https://openalex.org/I37461747","https://openalex.org/I4210118728"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.74332038,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.3481000065803528,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.3481000065803528,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11622","display_name":"Maritime Navigation and Safety","score":0.10199999809265137,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11082","display_name":"Spacecraft Dynamics and Control","score":0.09220000356435776,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/obstacle-avoidance","display_name":"Obstacle avoidance","score":0.6388000249862671},{"id":"https://openalex.org/keywords/mechanism","display_name":"Mechanism (biology)","score":0.48539999127388},{"id":"https://openalex.org/keywords/control-theory","display_name":"Control theory (sociology)","score":0.4334000051021576},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.36239999532699585},{"id":"https://openalex.org/keywords/control","display_name":"Control (management)","score":0.3303999900817871},{"id":"https://openalex.org/keywords/control-system","display_name":"Control system","score":0.28769999742507935}],"concepts":[{"id":"https://openalex.org/C6683253","wikidata":"https://www.wikidata.org/wiki/Q7075535","display_name":"Obstacle avoidance","level":4,"score":0.6388000249862671},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6122000217437744},{"id":"https://openalex.org/C89611455","wikidata":"https://www.wikidata.org/wiki/Q6804646","display_name":"Mechanism (biology)","level":2,"score":0.48539999127388},{"id":"https://openalex.org/C47446073","wikidata":"https://www.wikidata.org/wiki/Q5165890","display_name":"Control theory (sociology)","level":3,"score":0.4334000051021576},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3736000061035156},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.36239999532699585},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.3589000105857849},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.3303999900817871},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.28769999742507935},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.28600001335144043},{"id":"https://openalex.org/C2776650193","wikidata":"https://www.wikidata.org/wiki/Q264661","display_name":"Obstacle","level":2,"score":0.2816999852657318},{"id":"https://openalex.org/C13662910","wikidata":"https://www.wikidata.org/wiki/Q193139","display_name":"Trajectory","level":2,"score":0.2815999984741211},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.27970001101493835},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.27390000224113464},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.26840001344680786},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.26159998774528503}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/upinlbs68186.2025.11468417","is_oa":false,"landing_page_url":"https://doi.org/10.1109/upinlbs68186.2025.11468417","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 International Ubiquitous Positioning, Indoor Navigation and Location-Based Services Conference (UPINLBS)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2057407891","display_name":null,"funder_award_id":"42571522","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6287202219","display_name":null,"funder_award_id":"2023YFB3907102","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,12,22,81,99,108,113,120,139,154],"development":[2],"of":[3,14,26,101,157],"large":[4,17],"models,":[5,146],"there":[6],"is":[7,40,116],"an":[8,93,173],"urgent":[9],"demand":[10],"for":[11,84],"advancement":[13],"technologies":[15],"integrating":[16],"models":[18,31],"with":[19,142],"navigation.":[20],"Addressing":[21],"decision":[23,30,132,167],"bias":[24],"issue":[25],"current":[27],"LLM-based":[28],"navigation":[29,68,131],"in":[32,138,153,166,179],"indoor":[33],"dynamic":[34,130,158,181],"scenarios":[35],"where":[36],"long-term":[37],"path":[38,90],"optimization":[39],"prioritized":[41],"over":[42],"short-term":[43,102],"risk":[44,103],"avoidance,":[45],"this":[46],"paper":[47],"proposes":[48],"a":[49,62,74,149,162],"LLM":[50,122],"Reinforcement":[51],"Fine-Tuning":[52],"Model":[53],"based":[54,106],"on":[55,107],"time-decay":[56,75],"reward":[57,76,82],"Mechanism":[58],"(TDR-LLM-RFT).":[59],"TDR-LLM-RFT":[60,147],"constructs":[61],"\u201cperception-decision-feedback\u201d":[63],"closed-loop":[64],"system,":[65],"takes":[66],"multimodal":[67],"data":[69],"as":[70],"input":[71],"and":[72,88,161],"designs":[73],"function.":[77],"It":[78],"dynamically":[79],"allocates":[80],"weights":[83],"\u201cimmediate":[85],"obstacle":[86,159],"avoidance\u201d":[87],"\u201clong-term":[89],"planning\u201d":[91],"through":[92],"exponential":[94],"decay":[95],"coefficient,":[96],"thereby":[97],"prioritizing":[98],"triggering":[100],"responses.":[104],"Meanwhile,":[105],"VLN-R1":[109],"reinforcement":[110],"fine-tuning":[111],"paradigm,":[112],"PPO":[114],"algorithm":[115],"used":[117],"to":[118,127,129],"fine-tune":[119],"base":[121],"(Llama3":[123],"7B),":[124],"enabling":[125],"it":[126,170],"adapt":[128],"logic.":[133],"Experimental":[134],"results":[135],"show":[136],"that":[137],"dataset,":[140],"compared":[141],"traditional":[143],"discrete":[144],"RL":[145],"achieves":[148],"5.7":[150],"%":[151,164,175],"increase":[152],"success":[155],"rate":[156,178],"avoidance":[160],"6.2":[163],"reduction":[165],"delay.":[168],"Moreover,":[169],"still":[171],"maintains":[172],"84.3":[174],"semantic":[176],"satisfaction":[177],"high":[180],"density":[182],"scenarios.":[183]},"counts_by_year":[],"updated_date":"2026-04-17T05:58:53.018234","created_date":"2026-04-16T00:00:00"}
