{"id":"https://openalex.org/W4414054579","doi":"https://doi.org/10.1109/hsi66212.2025.11142427","title":"A Real-Time Object Detection and Tracking Framework Based on RT-DETR and DeepSORT","display_name":"A Real-Time Object Detection and Tracking Framework Based on RT-DETR and DeepSORT","publication_year":2025,"publication_date":"2025-07-16","ids":{"openalex":"https://openalex.org/W4414054579","doi":"https://doi.org/10.1109/hsi66212.2025.11142427"},"language":"en","primary_location":{"id":"doi:10.1109/hsi66212.2025.11142427","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hsi66212.2025.11142427","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 17th International Conference on Human System Interaction (HSI)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5102910988","display_name":"Dung Nguyen","orcid":"https://orcid.org/0009-0000-4510-7504"},"institutions":[{"id":"https://openalex.org/I4210095101","display_name":"Hue University","ror":"https://ror.org/00qaa6j11","country_code":"VN","type":"education","lineage":["https://openalex.org/I4210095101"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Dung Nguyen","raw_affiliation_strings":["University of Sciences, Hue University,Hue City,Vietnam"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"University of Sciences, Hue University,Hue City,Vietnam","institution_ids":["https://openalex.org/I4210095101"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011476665","display_name":"Van-Dung Hoang","orcid":"https://orcid.org/0000-0001-7554-1707"},"institutions":[{"id":"https://openalex.org/I4210148201","display_name":"Ho Chi Minh City University of Technology and Engineering","ror":"https://ror.org/05hzn5427","country_code":"VN","type":"education","lineage":["https://openalex.org/I4210148201"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Van-Dung Hoang","raw_affiliation_strings":["HCMC University of Technology and Education,Ho Chi Minh City,Vietnam"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"HCMC University of Technology and Education,Ho Chi Minh City,Vietnam","institution_ids":["https://openalex.org/I4210148201"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5105938018","display_name":"Van-Tuong-Lan Le","orcid":"https://orcid.org/0000-0002-0538-8425"},"institutions":[{"id":"https://openalex.org/I4210095101","display_name":"Hue University","ror":"https://ror.org/00qaa6j11","country_code":"VN","type":"education","lineage":["https://openalex.org/I4210095101"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Van-Tuong-Lan Le","raw_affiliation_strings":["Hue University,Department of Academic and Students&#x0027; Affairs,Hue City,Vietnam"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Hue University,Department of Academic and Students&#x0027; Affairs,Hue City,Vietnam","institution_ids":["https://openalex.org/I4210095101"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5001532275","display_name":"Tri-Cong Pham","orcid":"https://orcid.org/0000-0002-5507-6454"},"institutions":[{"id":"https://openalex.org/I182526193","display_name":"Thuyloi University","ror":"https://ror.org/04afshy24","country_code":"VN","type":"education","lineage":["https://openalex.org/I182526193"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Tri-Cong Pham","raw_affiliation_strings":["Thuy Loi University,Hanoi,Vietnam"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Thuy Loi University,Hanoi,Vietnam","institution_ids":["https://openalex.org/I182526193"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101795562","display_name":"Quang-Khai Tran","orcid":"https://orcid.org/0000-0002-9796-2964"},"institutions":[{"id":"https://openalex.org/I4210148201","display_name":"Ho Chi Minh City University of Technology and Engineering","ror":"https://ror.org/05hzn5427","country_code":"VN","type":"education","lineage":["https://openalex.org/I4210148201"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Quang-Khai Tran","raw_affiliation_strings":["HCMC University of Technology and Education,Ho Chi Minh City,Vietnam"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"HCMC University of Technology and Education,Ho Chi Minh City,Vietnam","institution_ids":["https://openalex.org/I4210148201"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026818330","display_name":"Chi-Mai Luong","orcid":null},"institutions":[{"id":"https://openalex.org/I70349855","display_name":"Vietnam Academy of Science and Technology","ror":"https://ror.org/02wsd5p50","country_code":"VN","type":"government","lineage":["https://openalex.org/I70349855"]}],"countries":["VN"],"is_corresponding":false,"raw_author_name":"Chi-Mai Luong","raw_affiliation_strings":["Institute of Information Technology, Vietnam Academy of Science and Technology,Hanoi,Vietnam"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Information Technology, Vietnam Academy of Science and Technology,Hanoi,Vietnam","institution_ids":["https://openalex.org/I70349855"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.26569115,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"6"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9354000091552734,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},"topics":[{"id":"https://openalex.org/T12702","display_name":"Brain Tumor Detection and Classification","score":0.9354000091552734,"subfield":{"id":"https://openalex.org/subfields/2808","display_name":"Neurology"},"field":{"id":"https://openalex.org/fields/28","display_name":"Neuroscience"},"domain":{"id":"https://openalex.org/domains/1","display_name":"Life Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9075000286102295,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.7038999795913696},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.6226999759674072},{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5848000049591064},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.5515999794006348},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.5418000221252441},{"id":"https://openalex.org/keywords/consistency","display_name":"Consistency (knowledge bases)","score":0.5181999802589417}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7283999919891357},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7163000106811523},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.7038999795913696},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6657000184059143},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.6226999759674072},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5848000049591064},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.5515999794006348},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.5418000221252441},{"id":"https://openalex.org/C2776436953","wikidata":"https://www.wikidata.org/wiki/Q5163215","display_name":"Consistency (knowledge bases)","level":2,"score":0.5181999802589417},{"id":"https://openalex.org/C154586513","wikidata":"https://www.wikidata.org/wiki/Q4420972","display_name":"Tracking system","level":3,"score":0.35740000009536743},{"id":"https://openalex.org/C2778355321","wikidata":"https://www.wikidata.org/wiki/Q17079427","display_name":"Identity (music)","level":2,"score":0.34779998660087585},{"id":"https://openalex.org/C71681937","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object-class detection","level":5,"score":0.3269999921321869},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.2935999929904938},{"id":"https://openalex.org/C182521987","wikidata":"https://www.wikidata.org/wiki/Q2493877","display_name":"Viola\u2013Jones object detection framework","level":5,"score":0.2892000079154968},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.2858999967575073}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hsi66212.2025.11142427","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hsi66212.2025.11142427","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 17th International Conference on Human System Interaction (HSI)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G4585115989","display_name":null,"funder_award_id":"102.05-2021.04","funder_id":"https://openalex.org/F4320309617","funder_display_name":"National Foundation for Science and Technology Development"}],"funders":[{"id":"https://openalex.org/F4320309617","display_name":"National Foundation for Science and Technology Development","ror":"https://ror.org/04rw64z44"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":22,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1786529921","https://openalex.org/W1861492603","https://openalex.org/W2112796928","https://openalex.org/W2161969291","https://openalex.org/W2164598857","https://openalex.org/W2193145675","https://openalex.org/W2194775991","https://openalex.org/W2252355370","https://openalex.org/W2570343428","https://openalex.org/W2603203130","https://openalex.org/W2963037989","https://openalex.org/W3084173793","https://openalex.org/W3096609285","https://openalex.org/W3159481202","https://openalex.org/W3165924482","https://openalex.org/W4214886591","https://openalex.org/W4286904999","https://openalex.org/W4386076325","https://openalex.org/W4400656560","https://openalex.org/W4402754006","https://openalex.org/W4403295672"],"related_works":["https://openalex.org/W4285271403","https://openalex.org/W2542007731","https://openalex.org/W4292830139","https://openalex.org/W2968379562","https://openalex.org/W4319309705","https://openalex.org/W2091015105","https://openalex.org/W4388689193","https://openalex.org/W2110899030","https://openalex.org/W29633852","https://openalex.org/W2985362983"],"abstract_inverted_index":{"Object":[0],"detection":[1,25,89],"and":[2,18,45,90,115,131,143,185],"tracking":[3,51,113,165],"are":[4,148,167],"two":[5],"critical":[6],"tasks":[7],"in":[8,13,23,55,112,124,164],"computer":[9],"vision,":[10],"widely":[11,98],"applied":[12],"security":[14],"surveillance,":[15],"autonomous":[16,186],"vehicles,":[17],"behavioral":[19],"analysis.":[20],"Strong":[21],"performance":[22,121],"object":[24,88,129],"has":[26],"been":[27],"demonstrated":[28],"by":[29,150],"recent":[30],"Transformer-based":[31],"models,":[32],"such":[33,127,181],"as":[34,128,182],"RT-DETR":[35,74],"(Real-Time":[36],"Detection":[37],"Transformer),":[38],"due":[39],"to":[40,61,85,104],"their":[41],"global":[42],"context":[43],"modeling":[44],"high":[46],"accuracy.":[47],"However,":[48],"an":[49,71,134],"inherent":[50],"mechanism":[52],"is":[53,77,102,122,172],"lacking":[54],"RT-DETR,":[56],"which":[57],"requires":[58],"additional":[59],"components":[60],"maintain":[62],"identity":[63],"consistency":[64],"across":[65],"frames.":[66],"To":[67],"address":[68],"this":[69],"limitation,":[70],"integration":[72],"of":[73,82,108,137,141,146],"with":[75,95],"DeepSORT":[76],"proposed,":[78],"leveraging":[79],"the":[80,106,109,153,175],"strengths":[81],"both":[83],"models":[84],"enhance":[86],"real-time":[87,100,170],"tracking.":[91],"A":[92],"comparative":[93],"evaluation":[94],"YOLOv8,":[96],"a":[97,139,144],"used":[99],"detector,":[101],"conducted":[103],"highlight":[105],"advantages":[107],"proposed":[110,176],"approach":[111,177],"accuracy":[114,166],"robustness.":[116],"Experiments":[117],"show":[118],"that":[119,161],"effective":[120],"achieved":[123],"challenging":[125],"scenarios":[126],"occlusion":[130],"intersection.":[132],"Specifically,":[133],"IDF1":[135],"score":[136],"60.0%,":[138],"MOTA":[140],"42.4%,":[142],"MOTP":[145],"43.3%":[147],"obtained":[149],"RTl+DeepSORT":[151],"on":[152],"MOT17-02-DPM":[154],"dataset,":[155],"outperforming":[156],"YOLOv8x+DeepSORT.":[157],"These":[158],"results":[159],"indicate":[160],"significant":[162],"improvements":[163],"attained":[168],"while":[169],"efficiency":[171],"maintained,":[173],"making":[174],"well-suited":[178],"for":[179],"applications":[180],"intelligent":[183],"surveillance":[184],"navigation.":[187]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2025-10-10T00:00:00"}
