{"id":"https://openalex.org/W4415974592","doi":"https://doi.org/10.1016/j.procs.2025.09.189","title":"Dynamic Reward-Based Deep Reinforcement Learning Algorithm for UAV Path Planning in Large-Scale Environments","display_name":"Dynamic Reward-Based Deep Reinforcement Learning Algorithm for UAV Path Planning in Large-Scale Environments","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4415974592","doi":"https://doi.org/10.1016/j.procs.2025.09.189"},"language":"en","primary_location":{"id":"doi:10.1016/j.procs.2025.09.189","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2025.09.189","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"diamond","oa_url":"https://doi.org/10.1016/j.procs.2025.09.189","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5053628100","display_name":"Raja Jarray","orcid":"https://orcid.org/0000-0002-3759-1436"},"institutions":[{"id":"https://openalex.org/I63596082","display_name":"Tunis El Manar University","ror":"https://ror.org/029cgt552","country_code":"TN","type":"education","lineage":["https://openalex.org/I63596082"]},{"id":"https://openalex.org/I4210131288","display_name":"National Engineering School of Tunis","ror":"https://ror.org/03b1zjt31","country_code":"TN","type":"education","lineage":["https://openalex.org/I4210131288","https://openalex.org/I63596082"]},{"id":"https://openalex.org/I68916915","display_name":"University of Gab\u00e8s","ror":"https://ror.org/022efad20","country_code":"TN","type":"education","lineage":["https://openalex.org/I68916915"]}],"countries":["TN"],"is_corresponding":true,"raw_author_name":"Raja Jarray","raw_affiliation_strings":["High Institute of Industrial Systems of Gab\u00e8s, University of Gab\u00e8s, 6072 Gab\u00e8s, Tunisia","Research Laboratory in Automatic Control (LARA), National Engineering School of Tunis (ENIT), University of Tunis El Manar, 1002 Tunis, Tunisia"],"affiliations":[{"raw_affiliation_string":"High Institute of Industrial Systems of Gab\u00e8s, University of Gab\u00e8s, 6072 Gab\u00e8s, Tunisia","institution_ids":["https://openalex.org/I68916915"]},{"raw_affiliation_string":"Research Laboratory in Automatic Control (LARA), National Engineering School of Tunis (ENIT), University of Tunis El Manar, 1002 Tunis, Tunisia","institution_ids":["https://openalex.org/I4210131288","https://openalex.org/I63596082"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5106530055","display_name":"Imen Zaghbani","orcid":null},"institutions":[{"id":"https://openalex.org/I4210131288","display_name":"National Engineering School of Tunis","ror":"https://ror.org/03b1zjt31","country_code":"TN","type":"education","lineage":["https://openalex.org/I4210131288","https://openalex.org/I63596082"]},{"id":"https://openalex.org/I63596082","display_name":"Tunis El Manar University","ror":"https://ror.org/029cgt552","country_code":"TN","type":"education","lineage":["https://openalex.org/I63596082"]},{"id":"https://openalex.org/I68916915","display_name":"University of Gab\u00e8s","ror":"https://ror.org/022efad20","country_code":"TN","type":"education","lineage":["https://openalex.org/I68916915"]}],"countries":["TN"],"is_corresponding":false,"raw_author_name":"Imen Zaghbani","raw_affiliation_strings":["National Engineering School of Gab\u00e8s, University of Gab\u00e8s, 6029 Gab\u00e8s, Tunisia","Research Laboratory in Automatic Control (LARA), National Engineering School of Tunis (ENIT), University of Tunis El Manar, 1002 Tunis, Tunisia"],"affiliations":[{"raw_affiliation_string":"National Engineering School of Gab\u00e8s, University of Gab\u00e8s, 6029 Gab\u00e8s, Tunisia","institution_ids":["https://openalex.org/I68916915"]},{"raw_affiliation_string":"Research Laboratory in Automatic Control (LARA), National Engineering School of Tunis (ENIT), University of Tunis El Manar, 1002 Tunis, Tunisia","institution_ids":["https://openalex.org/I4210131288","https://openalex.org/I63596082"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5037036654","display_name":"Soufiene Bouall\u00e8gue","orcid":"https://orcid.org/0000-0003-3172-6333"},"institutions":[{"id":"https://openalex.org/I4210131288","display_name":"National Engineering School of Tunis","ror":"https://ror.org/03b1zjt31","country_code":"TN","type":"education","lineage":["https://openalex.org/I4210131288","https://openalex.org/I63596082"]},{"id":"https://openalex.org/I63596082","display_name":"Tunis El Manar University","ror":"https://ror.org/029cgt552","country_code":"TN","type":"education","lineage":["https://openalex.org/I63596082"]},{"id":"https://openalex.org/I68916915","display_name":"University of Gab\u00e8s","ror":"https://ror.org/022efad20","country_code":"TN","type":"education","lineage":["https://openalex.org/I68916915"]}],"countries":["TN"],"is_corresponding":false,"raw_author_name":"Soufiene Bouall\u00e8gue","raw_affiliation_strings":["High Institute of Industrial Systems of Gab\u00e8s, University of Gab\u00e8s, 6072 Gab\u00e8s, Tunisia","Research Laboratory in Automatic Control (LARA), National Engineering School of Tunis (ENIT), University of Tunis El Manar, 1002 Tunis, Tunisia"],"affiliations":[{"raw_affiliation_string":"High Institute of Industrial Systems of Gab\u00e8s, University of Gab\u00e8s, 6072 Gab\u00e8s, Tunisia","institution_ids":["https://openalex.org/I68916915"]},{"raw_affiliation_string":"Research Laboratory in Automatic Control (LARA), National Engineering School of Tunis (ENIT), University of Tunis El Manar, 1002 Tunis, Tunisia","institution_ids":["https://openalex.org/I4210131288","https://openalex.org/I63596082"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5053628100"],"corresponding_institution_ids":["https://openalex.org/I4210131288","https://openalex.org/I63596082","https://openalex.org/I68916915"],"apc_list":null,"apc_paid":null,"fwci":1.3634,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.86509431,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":"270","issue":null,"first_page":"692","last_page":"702"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9007999897003174,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.9007999897003174,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.02319999970495701,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10462","display_name":"Reinforcement Learning in Robotics","score":0.00930000003427267,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.824400007724762},{"id":"https://openalex.org/keywords/motion-planning","display_name":"Motion planning","score":0.7215999960899353},{"id":"https://openalex.org/keywords/convergence","display_name":"Convergence (economics)","score":0.6212999820709229},{"id":"https://openalex.org/keywords/stability","display_name":"Stability (learning theory)","score":0.5508000254631042},{"id":"https://openalex.org/keywords/path","display_name":"Path (computing)","score":0.5393000245094299},{"id":"https://openalex.org/keywords/drone","display_name":"Drone","score":0.4943999946117401},{"id":"https://openalex.org/keywords/grid-reference","display_name":"Grid reference","score":0.4693000018596649},{"id":"https://openalex.org/keywords/position","display_name":"Position (finance)","score":0.4424000084400177}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8604000210762024},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.824400007724762},{"id":"https://openalex.org/C81074085","wikidata":"https://www.wikidata.org/wiki/Q366872","display_name":"Motion planning","level":3,"score":0.7215999960899353},{"id":"https://openalex.org/C2777303404","wikidata":"https://www.wikidata.org/wiki/Q759757","display_name":"Convergence (economics)","level":2,"score":0.6212999820709229},{"id":"https://openalex.org/C112972136","wikidata":"https://www.wikidata.org/wiki/Q7595718","display_name":"Stability (learning theory)","level":2,"score":0.5508000254631042},{"id":"https://openalex.org/C2777735758","wikidata":"https://www.wikidata.org/wiki/Q817765","display_name":"Path (computing)","level":2,"score":0.5393000245094299},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.4943999946117401},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4878000020980835},{"id":"https://openalex.org/C156172958","wikidata":"https://www.wikidata.org/wiki/Q3438407","display_name":"Grid reference","level":4,"score":0.4693000018596649},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.4542999863624573},{"id":"https://openalex.org/C198082294","wikidata":"https://www.wikidata.org/wiki/Q3399648","display_name":"Position (finance)","level":2,"score":0.4424000084400177},{"id":"https://openalex.org/C187691185","wikidata":"https://www.wikidata.org/wiki/Q2020720","display_name":"Grid","level":2,"score":0.42989999055862427},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.41679999232292175},{"id":"https://openalex.org/C197947376","wikidata":"https://www.wikidata.org/wiki/Q5155608","display_name":"Comparability","level":2,"score":0.4120999872684479},{"id":"https://openalex.org/C14036430","wikidata":"https://www.wikidata.org/wiki/Q3736076","display_name":"Function (biology)","level":2,"score":0.40230000019073486},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.39100000262260437},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.34529998898506165},{"id":"https://openalex.org/C14646407","wikidata":"https://www.wikidata.org/wiki/Q1430750","display_name":"Bellman equation","level":2,"score":0.34200000762939453},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.3416000008583069},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.29109999537467957},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.26429998874664307},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.2574999928474426},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.25049999356269836}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1016/j.procs.2025.09.189","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2025.09.189","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1016/j.procs.2025.09.189","is_oa":true,"landing_page_url":"https://doi.org/10.1016/j.procs.2025.09.189","pdf_url":null,"source":{"id":"https://openalex.org/S120348307","display_name":"Procedia Computer Science","issn_l":"1877-0509","issn":["1877-0509"],"is_oa":true,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320990","host_organization_name":"Elsevier BV","host_organization_lineage":["https://openalex.org/P4310320990"],"host_organization_lineage_names":["Elsevier BV"],"type":"journal"},"license":"cc-by-nc-nd","license_id":"https://openalex.org/licenses/cc-by-nc-nd","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Procedia Computer Science","raw_type":"journal-article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":25,"referenced_works":["https://openalex.org/W32403112","https://openalex.org/W1601081659","https://openalex.org/W1977655452","https://openalex.org/W2061438946","https://openalex.org/W2169245194","https://openalex.org/W2181005557","https://openalex.org/W2573831046","https://openalex.org/W2738900493","https://openalex.org/W2899746873","https://openalex.org/W2964884740","https://openalex.org/W2978276956","https://openalex.org/W3111564136","https://openalex.org/W3206647606","https://openalex.org/W4200512239","https://openalex.org/W4214504571","https://openalex.org/W4248885725","https://openalex.org/W4283696902","https://openalex.org/W4285541102","https://openalex.org/W4319985867","https://openalex.org/W4362637420","https://openalex.org/W4389779734","https://openalex.org/W4401610808","https://openalex.org/W4406705755","https://openalex.org/W4407315436","https://openalex.org/W4408170367"],"related_works":[],"abstract_inverted_index":{"Path":[0],"planning":[1,21,158],"for":[2,22,29,98,155],"Unmanned":[3],"Aerial":[4],"Vehicles":[5],"(UAV)":[6],"is":[7,60,77,129],"a":[8,30,55,80,93,124],"vital":[9],"component":[10],"of":[11,82,110,118,150,159],"navigation":[12,38],"in":[13,36,161],"robotics.":[14],"The":[15],"reinforcement":[16,45],"Q-learning":[17],"algorithm":[18,114],"enhances":[19,105],"path":[20,157],"drones":[23],"but":[24],"suffers":[25],"from":[26],"the":[27,66,74,99,106,111,133,136,148,151],"need":[28],"large":[31],"Q-value":[32],"table":[33],"and":[34,62,108,140,145],"challenges":[35],"complex":[37,162],"situations.":[39],"By":[40],"integrating":[41],"deep":[42],"learning":[43],"with":[44],"one,":[46],"these":[47],"shortcomings":[48],"can":[49],"be":[50],"addressed.":[51],"In":[52,71],"this":[53,72],"paper,":[54],"Deep":[56],"Q-Network":[57],"(DQN)":[58],"model":[59],"developed":[61],"trained":[63],"to":[64,88],"estimate":[65],"drone\u2019s":[67,137],"state-action":[68],"value":[69],"function.":[70],"work,":[73],"flight":[75],"space":[76],"represented":[78],"by":[79,115],"grid":[81],"cells,":[83],"which":[84],"are":[85],"then":[86],"encoded":[87],"convert":[89],"environmental":[90],"information":[91],"into":[92],"new":[94,125],"input":[95],"format":[96],"suitable":[97],"DQN":[100,113],"model.":[101],"Normalizing":[102],"state":[103],"inputs":[104],"stability":[107],"convergence":[109],"proposed":[112,152],"ensuring":[116],"comparability":[117],"features":[119],"across":[120],"different":[121],"scales.":[122],"Besides,":[123],"dynamic":[126],"reward":[127],"function":[128],"established":[130],"based":[131],"on":[132],"distance":[134],"between":[135],"current":[138],"position":[139],"its":[141],"destination.":[142],"Simulation":[143],"results":[144],"discussion":[146],"illustrate":[147],"effectiveness":[149],"DQN-based":[153],"approach":[154],"collision-free":[156],"UAV":[160],"environments.":[163]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-03-15T09:29:46.208133","created_date":"2025-11-06T00:00:00"}
