{"id":"https://openalex.org/W4415744131","doi":"https://doi.org/10.1109/qrs-c65679.2025.00042","title":"Reinforcement Learning Based UAV Control Algorithm and Safety Performance Analysis","display_name":"Reinforcement Learning Based UAV Control Algorithm and Safety Performance Analysis","publication_year":2025,"publication_date":"2025-07-16","ids":{"openalex":"https://openalex.org/W4415744131","doi":"https://doi.org/10.1109/qrs-c65679.2025.00042"},"language":null,"primary_location":{"id":"doi:10.1109/qrs-c65679.2025.00042","is_oa":false,"landing_page_url":"https://doi.org/10.1109/qrs-c65679.2025.00042","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 25th International Conference on Software Quality, Reliability, and Security Companion (QRS-C)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113964686","display_name":"Siwei Yan","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Siwei Yan","raw_affiliation_strings":["Beihang University, Beijing,Beijing,China"],"affiliations":[{"raw_affiliation_string":"Beihang University, Beijing,Beijing,China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":1,"corresponding_author_ids":["https://openalex.org/A5113964686"],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.34256585,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"278","last_page":"286"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.2921000123023987,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10586","display_name":"Robotic Path Planning Algorithms","score":0.2921000123023987,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12794","display_name":"Adaptive Dynamic Programming Control","score":0.14890000224113464,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11489","display_name":"Air Traffic Management and Optimization","score":0.07500000298023224,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.7867000102996826},{"id":"https://openalex.org/keywords/obstacle-avoidance","display_name":"Obstacle avoidance","score":0.715499997138977},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.4350000023841858},{"id":"https://openalex.org/keywords/learning-classifier-system","display_name":"Learning classifier system","score":0.3885999917984009},{"id":"https://openalex.org/keywords/safer","display_name":"SAFER","score":0.29829999804496765},{"id":"https://openalex.org/keywords/collision-avoidance","display_name":"Collision avoidance","score":0.2847999930381775},{"id":"https://openalex.org/keywords/control-system","display_name":"Control system","score":0.28110000491142273}],"concepts":[{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.7867000102996826},{"id":"https://openalex.org/C6683253","wikidata":"https://www.wikidata.org/wiki/Q7075535","display_name":"Obstacle avoidance","level":4,"score":0.715499997138977},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.585099995136261},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.4350000023841858},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4291999936103821},{"id":"https://openalex.org/C199190896","wikidata":"https://www.wikidata.org/wiki/Q3509276","display_name":"Learning classifier system","level":3,"score":0.3885999917984009},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.328000009059906},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.3034000098705292},{"id":"https://openalex.org/C2776654903","wikidata":"https://www.wikidata.org/wiki/Q2601463","display_name":"SAFER","level":2,"score":0.29829999804496765},{"id":"https://openalex.org/C2780864053","wikidata":"https://www.wikidata.org/wiki/Q5147495","display_name":"Collision avoidance","level":3,"score":0.2847999930381775},{"id":"https://openalex.org/C44154836","wikidata":"https://www.wikidata.org/wiki/Q45045","display_name":"Simulation","level":1,"score":0.28220000863075256},{"id":"https://openalex.org/C17500928","wikidata":"https://www.wikidata.org/wiki/Q959968","display_name":"Control system","level":2,"score":0.28110000491142273},{"id":"https://openalex.org/C2777943292","wikidata":"https://www.wikidata.org/wiki/Q3319996","display_name":"Flight test","level":2,"score":0.27869999408721924},{"id":"https://openalex.org/C41376638","wikidata":"https://www.wikidata.org/wiki/Q214932","display_name":"Flight simulator","level":2,"score":0.2757999897003174},{"id":"https://openalex.org/C59519942","wikidata":"https://www.wikidata.org/wiki/Q650665","display_name":"Drone","level":2,"score":0.27129998803138733},{"id":"https://openalex.org/C2775924081","wikidata":"https://www.wikidata.org/wiki/Q55608371","display_name":"Control (management)","level":2,"score":0.2619999945163727},{"id":"https://openalex.org/C2776053266","wikidata":"https://www.wikidata.org/wiki/Q5037194","display_name":"CarSim","level":3,"score":0.2619999945163727},{"id":"https://openalex.org/C207609745","wikidata":"https://www.wikidata.org/wiki/Q4944086","display_name":"Bootstrapping (finance)","level":2,"score":0.25270000100135803},{"id":"https://openalex.org/C127757376","wikidata":"https://www.wikidata.org/wiki/Q2056514","display_name":"Active safety","level":2,"score":0.251800000667572},{"id":"https://openalex.org/C133731056","wikidata":"https://www.wikidata.org/wiki/Q4917288","display_name":"Control engineering","level":1,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/qrs-c65679.2025.00042","is_oa":false,"landing_page_url":"https://doi.org/10.1109/qrs-c65679.2025.00042","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 25th International Conference on Software Quality, Reliability, and Security Companion (QRS-C)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":14,"referenced_works":["https://openalex.org/W2159379766","https://openalex.org/W2288616283","https://openalex.org/W2782014475","https://openalex.org/W3046474649","https://openalex.org/W3126403556","https://openalex.org/W3131850807","https://openalex.org/W3204026096","https://openalex.org/W4200438872","https://openalex.org/W4229040499","https://openalex.org/W4293370597","https://openalex.org/W4297339084","https://openalex.org/W4312875263","https://openalex.org/W4328137129","https://openalex.org/W4405786494"],"related_works":[],"abstract_inverted_index":{"With":[0],"the":[1,7,35,70,83,87,107,111,123,139,162,165,184,190,199,204,216,247,257,260,264,268,275],"rapid":[2],"development":[3],"of":[4,11,37,64,73,86,101,113,126,141,156,203,219,230,250,259,267],"UAV":[5,38],"technology,":[6],"safety":[8,54,71,84,200,217,265],"performance":[9,72,85,218,266],"analysis":[10],"flight":[12,23,60,74],"control":[13,24,39,75,159],"algorithms":[14,25,51,76,88,116,270],"has":[15],"become":[16],"a":[17,99,131],"hot":[18],"research":[19,109],"topic.":[20],"In":[21,188],"particular,":[22],"based":[26,77,273],"on":[27,78,274],"reinforcement":[28,49,79,114,133,157,205],"learning":[29,50,115,134,158,163,206],"have":[30,129],"been":[31],"widely":[32],"used":[33,148],"in":[34,56,106],"field":[36],"due":[40],"to":[41,68,121,181,196,214,254],"their":[42],"excellent":[43],"decision-making":[44],"ability":[45],"and":[46,58,81,97,117,143,152,171,178,201,223,240,262],"adaptivity.":[47],"However,":[48],"may":[52],"face":[53],"challenges":[55],"complex":[57],"dynamic":[59],"environments.":[61],"The":[62],"purpose":[63],"this":[65],"paper":[66,208],"is":[67,147,167,194,271],"analyze":[69,215],"learning,":[80],"evaluate":[82],"under":[89],"different":[90],"interference":[91],"conditions":[92],"by":[93,174],"constructing":[94],"simulation":[95,119,135],"environments":[96,252],"conducting":[98],"series":[100],"experimental":[102,276],"tests,":[103],"as":[104],"described":[105],"following":[108],"work:1.Through":[110],"interaction":[112],"Airsim":[118,142],"environment":[120],"realize":[122],"autonomous":[124],"navigation":[125],"UAVs,":[127],"we":[128],"constructed":[130],"vehicle":[132],"test":[136,155,212,251,256],"platform":[137],"with":[138],"help":[140],"Unreal4":[144],"engine,":[145],"which":[146],"for":[149,246],"obstacle":[150,221],"avoidance":[151,222],"automatic":[153,224],"path-finding":[154],"algorithms.2.To":[160],"optimize":[161],"process,":[164],"task":[166],"divided":[168],"into":[169],"bootstrapping":[170,185],"exploration":[172],"phases":[173],"combining":[175],"stochastic":[176],"annealing":[177],"jump-starting":[179],"strategies":[180],"gradually":[182],"reduce":[183],"time":[186],"domain.":[187],"addition,":[189],"Lyapunov":[191],"function":[192,242],"constraint":[193],"designed":[195],"further":[197,255],"ensure":[198],"robustness":[202,258],"process.3.This":[207],"puts":[209],"forward":[210],"nine":[211],"indexes":[213],"aircraft":[220],"pathfinding":[225],"tests.":[226],"And":[227],"four":[228],"kinds":[229],"external":[231],"disturbances,":[232],"namely,":[233],"ground":[234],"effect,":[235,237],"downwash":[236],"wind":[238],"interference,":[239,243],"reward":[241],"are":[244],"introduced":[245],"two":[248],"types":[249],"respectively":[253],"algorithms,":[261],"finally":[263],"three":[269],"analyzed":[272],"data.":[277]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-31T00:00:00"}
