{"id":"https://openalex.org/W7123346774","doi":"https://doi.org/10.1109/dsa66321.2025.00042","title":"Challenges, Progress, and Future Directions of Visual Tracking in UAVs","display_name":"Challenges, Progress, and Future Directions of Visual Tracking in UAVs","publication_year":2025,"publication_date":"2025-11-24","ids":{"openalex":"https://openalex.org/W7123346774","doi":"https://doi.org/10.1109/dsa66321.2025.00042"},"language":null,"primary_location":{"id":"doi:10.1109/dsa66321.2025.00042","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsa66321.2025.00042","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 12th International Conference on Dependable Systems and Their Applications (DSA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5122865205","display_name":"Li Mai","orcid":null},"institutions":[{"id":"https://openalex.org/I118987531","display_name":"Anhui Jianzhu University","ror":"https://ror.org/0108wjw08","country_code":"CN","type":"education","lineage":["https://openalex.org/I118987531"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Li Mai","raw_affiliation_strings":["Anhui Mingsheng Hengzhuo Technology Co., Ltd.,Power Grid Digitalization Division,Hefei,Anhui,China"],"affiliations":[{"raw_affiliation_string":"Anhui Mingsheng Hengzhuo Technology Co., Ltd.,Power Grid Digitalization Division,Hefei,Anhui,China","institution_ids":["https://openalex.org/I118987531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122862929","display_name":"Chen Dai","orcid":null},"institutions":[{"id":"https://openalex.org/I118987531","display_name":"Anhui Jianzhu University","ror":"https://ror.org/0108wjw08","country_code":"CN","type":"education","lineage":["https://openalex.org/I118987531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chen Dai","raw_affiliation_strings":["Anhui Mingsheng Hengzhuo Technology Co., Ltd.,System Integration Division,Hefei,Anhui,China"],"affiliations":[{"raw_affiliation_string":"Anhui Mingsheng Hengzhuo Technology Co., Ltd.,System Integration Division,Hefei,Anhui,China","institution_ids":["https://openalex.org/I118987531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122849871","display_name":"Hongji Ma","orcid":null},"institutions":[{"id":"https://openalex.org/I118987531","display_name":"Anhui Jianzhu University","ror":"https://ror.org/0108wjw08","country_code":"CN","type":"education","lineage":["https://openalex.org/I118987531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongji Ma","raw_affiliation_strings":["Anhui Mingsheng Hengzhuo Technology Co., Ltd.,System Integration Division,Hefei,Anhui,China"],"affiliations":[{"raw_affiliation_string":"Anhui Mingsheng Hengzhuo Technology Co., Ltd.,System Integration Division,Hefei,Anhui,China","institution_ids":["https://openalex.org/I118987531"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5122856939","display_name":"Xin Lin","orcid":null},"institutions":[{"id":"https://openalex.org/I118987531","display_name":"Anhui Jianzhu University","ror":"https://ror.org/0108wjw08","country_code":"CN","type":"education","lineage":["https://openalex.org/I118987531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Lin","raw_affiliation_strings":["Anhui Mingsheng Hengzhuo Technology Co., Ltd.,Power Grid Digitalization Division,Hefei,Anhui,China"],"affiliations":[{"raw_affiliation_string":"Anhui Mingsheng Hengzhuo Technology Co., Ltd.,Power Grid Digitalization Division,Hefei,Anhui,China","institution_ids":["https://openalex.org/I118987531"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040759252","display_name":"Shiwei Guo","orcid":"https://orcid.org/0000-0002-0683-4044"},"institutions":[{"id":"https://openalex.org/I118987531","display_name":"Anhui Jianzhu University","ror":"https://ror.org/0108wjw08","country_code":"CN","type":"education","lineage":["https://openalex.org/I118987531"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shiwei Guo","raw_affiliation_strings":["Anhui Mingsheng Hengzhuo Technology Co., Ltd.,Power Grid Digitalization Division,Hefei,Anhui,China"],"affiliations":[{"raw_affiliation_string":"Anhui Mingsheng Hengzhuo Technology Co., Ltd.,Power Grid Digitalization Division,Hefei,Anhui,China","institution_ids":["https://openalex.org/I118987531"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5122865205"],"corresponding_institution_ids":["https://openalex.org/I118987531"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.69746826,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"295","last_page":"303"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.6559000015258789,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.6559000015258789,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11133","display_name":"UAV Applications and Optimization","score":0.24570000171661377,"subfield":{"id":"https://openalex.org/subfields/2202","display_name":"Aerospace Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.015699999406933784,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5037000179290771},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.484499990940094},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.47760000824928284},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.4708999991416931},{"id":"https://openalex.org/keywords/eye-tracking","display_name":"Eye tracking","score":0.44510000944137573},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.429500013589859},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.4138000011444092},{"id":"https://openalex.org/keywords/feature-extraction","display_name":"Feature extraction","score":0.41040000319480896},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.399399995803833}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7218999862670898},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7092000246047974},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6787999868392944},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5037000179290771},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.484499990940094},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.47760000824928284},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.4708999991416931},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.44510000944137573},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.429500013589859},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.4138000011444092},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.41040000319480896},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.399399995803833},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.38749998807907104},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.37869998812675476},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.364300012588501},{"id":"https://openalex.org/C2780023022","wikidata":"https://www.wikidata.org/wiki/Q1338171","display_name":"Compensation (psychology)","level":2,"score":0.3361000120639801},{"id":"https://openalex.org/C94124525","wikidata":"https://www.wikidata.org/wiki/Q912550","display_name":"Categorization","level":2,"score":0.3287999927997589},{"id":"https://openalex.org/C204323151","wikidata":"https://www.wikidata.org/wiki/Q905424","display_name":"Range (aeronautics)","level":2,"score":0.3264999985694885},{"id":"https://openalex.org/C154586513","wikidata":"https://www.wikidata.org/wiki/Q4420972","display_name":"Tracking system","level":3,"score":0.31779998540878296},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.30079999566078186},{"id":"https://openalex.org/C5339829","wikidata":"https://www.wikidata.org/wiki/Q1425977","display_name":"Machine vision","level":2,"score":0.2718999981880188},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.26829999685287476},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.26759999990463257},{"id":"https://openalex.org/C87833898","wikidata":"https://www.wikidata.org/wiki/Q1060280","display_name":"Advanced driver assistance systems","level":2,"score":0.26339998841285706}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/dsa66321.2025.00042","is_oa":false,"landing_page_url":"https://doi.org/10.1109/dsa66321.2025.00042","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 12th International Conference on Dependable Systems and Their Applications (DSA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Zero hunger","id":"https://metadata.un.org/sdg/2","score":0.77448570728302}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Unmanned":[0],"Aerial":[1],"Vehicles":[2],"(UAVs)":[3],"have":[4],"emerged":[5],"as":[6,194],"versatile":[7],"and":[8,22,28,49,61,73,82,91,133,178,184,196],"indispensable":[9],"tools":[10],"in":[11,68,122],"a":[12,116],"wide":[13],"range":[14],"of":[15,38,52,96,119,170],"intelligent":[16],"vision":[17,155],"applications,":[18],"including":[19,167],"surveillance,":[20],"search":[21],"rescue,":[23],"environmental":[24],"monitoring,":[25],"precision":[26],"agriculture,":[27],"traffic":[29],"analysis.":[30],"Central":[31],"to":[32,46,138],"these":[33],"applications":[34],"is":[35],"the":[36,92,120,135,147,168],"task":[37],"Visual":[39],"Object":[40],"Tracking":[41],"(VOT),":[42],"which":[43,198],"enables":[44],"UAVs":[45],"continuously":[47],"localize":[48],"follow":[50],"objects":[51],"interest":[53],"across":[54],"frames,":[55],"thereby":[56],"supporting":[57],"higher-level":[58],"perception,":[59],"navigation,":[60],"decision-making":[62],"functions.":[63],"Despite":[64],"its":[65],"significance,":[66],"VOT":[67],"UAV-captured":[69],"imagery":[70],"presents":[71],"unique":[72],"formidable":[74],"challenges":[75,136],"arising":[76],"from":[77],"drastic":[78],"scale":[79],"variations,":[80],"rapid":[81],"irregular":[83],"camera":[84],"motion,":[85],"frequent":[86],"object":[87],"occlusions,":[88],"illumination":[89],"changes,":[90],"limited":[93],"computational":[94],"resources":[95],"onboard":[97],"platforms.":[98],"These":[99],"factors":[100],"collectively":[101],"make":[102],"UAV-based":[103],"tracking":[104,111,124],"fundamentally":[105],"more":[106,158],"complex":[107],"than":[108],"conventional":[109],"ground-based":[110],"tasks.":[112],"The":[113],"paper":[114],"provides":[115],"comprehensive":[117],"survey":[118],"state-of-the-art":[121],"visual":[123],"specifically":[125],"tailored":[126],"for":[127,180],"UAV":[128],"scenarios.":[129],"We":[130,163],"systematically":[131],"categorize":[132],"analyze":[134],"inherent":[137],"this":[139],"domain,":[140],"followed":[141],"by":[142],"an":[143],"in-depth":[144],"discussion":[145],"on":[146],"recent":[148],"progress":[149],"achieved":[150],"through":[151],"both":[152],"traditional":[153],"computer":[154],"methods":[156,179],"and,":[157],"significantly,":[159],"deep":[160],"learning-based":[161],"approaches.":[162],"explore":[164],"key":[165],"advancements,":[166],"development":[169],"specialized":[171],"correlation":[172],"filters,":[173],"robust":[174],"feature":[175],"extraction":[176],"networks,":[177],"integrating":[181],"motion":[182],"compensation":[183],"spatial-temporal":[185],"information.":[186],"Furthermore,":[187],"we":[188],"summarize":[189],"important":[190],"benchmark":[191],"datasets,":[192],"such":[193],"VisDrone":[195],"UAV123,":[197],"facilitate":[199],"rigorous":[200],"evaluation.":[201]},"counts_by_year":[],"updated_date":"2026-02-23T20:09:44.859080","created_date":"2026-01-14T00:00:00"}
