{"id":"https://openalex.org/W4410779755","doi":"https://doi.org/10.1109/cacml64929.2025.11010979","title":"Real-time Multi-Object Tracking Algorithm for UAV Based on Deep Learning","display_name":"Real-time Multi-Object Tracking Algorithm for UAV Based on Deep Learning","publication_year":2025,"publication_date":"2025-03-28","ids":{"openalex":"https://openalex.org/W4410779755","doi":"https://doi.org/10.1109/cacml64929.2025.11010979"},"language":"en","primary_location":{"id":"doi:10.1109/cacml64929.2025.11010979","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cacml64929.2025.11010979","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 4th Asia Conference on Algorithms, Computing and Machine Learning (CACML)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5028580598","display_name":"Zhongmin Zhang","orcid":"https://orcid.org/0000-0002-6761-6120"},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Zhongmin Zhang","raw_affiliation_strings":["Harbin Engineering University,College of Information and Communication Engineering,Harbin,China"],"affiliations":[{"raw_affiliation_string":"Harbin Engineering University,College of Information and Communication Engineering,Harbin,China","institution_ids":["https://openalex.org/I151727225"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5113291251","display_name":"Cong Ye","orcid":null},"institutions":[{"id":"https://openalex.org/I151727225","display_name":"Harbin Engineering University","ror":"https://ror.org/03x80pn82","country_code":"CN","type":"education","lineage":["https://openalex.org/I151727225"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Cong Ye","raw_affiliation_strings":["Harbin Engineering University,College of Information and Communication Engineering,Harbin,China"],"affiliations":[{"raw_affiliation_string":"Harbin Engineering University,College of Information and Communication Engineering,Harbin,China","institution_ids":["https://openalex.org/I151727225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":2,"corresponding_author_ids":["https://openalex.org/A5028580598"],"corresponding_institution_ids":["https://openalex.org/I151727225"],"apc_list":null,"apc_paid":null,"fwci":3.7968,"has_fulltext":false,"cited_by_count":3,"citation_normalized_percentile":{"value":0.9318111,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":97},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"9"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13717","display_name":"Advanced Algorithms and Applications","score":0.973800003528595,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13717","display_name":"Advanced Algorithms and Applications","score":0.973800003528595,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14225","display_name":"Advanced Sensor and Control Systems","score":0.9478999972343445,"subfield":{"id":"https://openalex.org/subfields/2207","display_name":"Control and Systems Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14257","display_name":"Advanced Measurement and Detection Methods","score":0.9320999979972839,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7807225584983826},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.704451858997345},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6116819381713867},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.5732424259185791},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5459675788879395},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.5346575975418091},{"id":"https://openalex.org/keywords/deep-learning","display_name":"Deep learning","score":0.4604331851005554},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.42484909296035767},{"id":"https://openalex.org/keywords/algorithm","display_name":"Algorithm","score":0.3457282483577728},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.23330900073051453}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7807225584983826},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.704451858997345},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6116819381713867},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.5732424259185791},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5459675788879395},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.5346575975418091},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.4604331851005554},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.42484909296035767},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.3457282483577728},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.23330900073051453},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cacml64929.2025.11010979","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cacml64929.2025.11010979","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 4th Asia Conference on Algorithms, Computing and Machine Learning (CACML)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":28,"referenced_works":["https://openalex.org/W2124781496","https://openalex.org/W2531409750","https://openalex.org/W2908055158","https://openalex.org/W2968269224","https://openalex.org/W3034971973","https://openalex.org/W3086436251","https://openalex.org/W3214821014","https://openalex.org/W4286904999","https://openalex.org/W4292388164","https://openalex.org/W4312906297","https://openalex.org/W4319866011","https://openalex.org/W4379799985","https://openalex.org/W4380758563","https://openalex.org/W4386076204","https://openalex.org/W4387264720","https://openalex.org/W4390498922","https://openalex.org/W4391070391","https://openalex.org/W4392231788","https://openalex.org/W4400777596","https://openalex.org/W4402050781","https://openalex.org/W4402124727","https://openalex.org/W4402626522","https://openalex.org/W4402804479","https://openalex.org/W4408250502","https://openalex.org/W6839744764","https://openalex.org/W6843239693","https://openalex.org/W6848712460","https://openalex.org/W6868582632"],"related_works":["https://openalex.org/W2949096641","https://openalex.org/W2970686063","https://openalex.org/W4320729701","https://openalex.org/W4254103348","https://openalex.org/W3210378990","https://openalex.org/W3034745255","https://openalex.org/W4285271403","https://openalex.org/W2542007731","https://openalex.org/W4292830139","https://openalex.org/W2968379562"],"abstract_inverted_index":{"Unmanned":[0],"Aerial":[1],"Vehicles":[2],"(UAVs)":[3],"with":[4,36,177,208,229],"multi-target":[5,52],"tracking":[6,53,193,202,234],"technology":[7],"are":[8],"of":[9,19,39,45,60,159,192,204,214],"significant":[10],"importance":[11],"in":[12,184,227],"various":[13],"key":[14],"areas,":[15],"including":[16],"the":[17,37,58,72,80,88,92,109,115,123,145,157,165,170,174,205,230,241],"management":[18],"modern":[20],"urban":[21],"life":[22],"and":[23,41,181,187,198,211,216,219,221,223,239],"military":[24],"strategic":[25],"deployment.":[26],"This":[27],"paper":[28,64,143],"proposes":[29],"an":[30,42,96,150],"advanced":[31],"Multi-Object":[32],"Tracking":[33],"(MOT)":[34],"method":[35,154,243],"combination":[38],"TStsm-yolov10":[40],"improved":[43,97,171],"version":[44],"ByteTrack,":[46],"which":[47],"is":[48,136],"well-suited":[49],"to":[50,70,78,107,155],"real-time":[51,252],"tasks":[54],"for":[55,83,99],"UAVs.":[56],"In":[57,91,190],"realm":[59],"object":[61,133],"detection,":[62],"this":[63,142],"introduces":[65],"a":[66,178],"tiny":[67],"detection":[68,75,81,134,160,175],"head":[69],"replace":[71],"existing":[73],"large":[74],"head,":[76],"aiming":[77],"enhance":[79],"capabilities":[82],"small":[84,132],"objects":[85],"while":[86],"constraining":[87],"parameter":[89],"count.":[90],"neck":[93],"section,":[94],"utilizing":[95],"TFPN":[98],"feature":[100,111],"fusion":[101],"across":[102],"three":[103],"distinct":[104],"scales":[105],"aims":[106],"improve":[108],"overall":[110],"representation":[112],"capability.":[113],"Additionally,":[114],"SCSA":[116],"attention":[117],"mechanism":[118],"has":[119],"been":[120],"integrated":[121],"into":[122],"C2f":[124],"module,":[125],"designated":[126],"as":[127,237],"C2f-SCSA.":[128],"The":[129],"newly":[130],"designed":[131],"model":[135],"named":[137],"TStsm-yolov10.":[138],"For":[139],"UAVs":[140],"tracking,":[141],"enhances":[144],"Kalman":[146],"filter":[147],"by":[148],"incorporating":[149],"adaptive":[151],"noise":[152],"estimation":[153],"alleviate":[156],"impact":[158],"results.":[161],"Experiments":[162],"conducted":[163],"on":[164,196],"VisDrone2019":[166],"dataset":[167],"demonstrate":[168],"that":[169],"methodology":[172],"improves":[173],"performance,":[176,194],"5.7%,":[179],"5.6%,":[180],"6.9%":[182],"improvement":[183],"precision,":[185],"recall,":[186],"mAP50,":[188],"respectively.":[189,225],"terms":[191],"experiments":[195],"VisDrone2019-MOT-test":[197],"VisDrone2019-MOT-train":[199],"demonstrated":[200],"excellent":[201,247],"performance":[203,248],"proposed":[206,242],"method,":[207],"HOTA,":[209],"MOTA":[210],"IDF1":[212],"improvements":[213],"4.083%":[215],"4.013%,":[217],"3.205%":[218],"5.001%,":[220],"5.221%":[222],"5.988%,":[224],"Furthermore,":[226],"comparison":[228],"current":[231],"popular":[232],"two-stage":[233],"algorithms":[235],"such":[236],"StrongSort":[238],"OCSort,":[240],"not":[244],"only":[245],"demonstrates":[246],"but":[249],"also":[250],"ensures":[251],"performance.":[253]},"counts_by_year":[{"year":2025,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
