{"id":"https://openalex.org/W4417001709","doi":"https://doi.org/10.1109/tii.2025.3631698","title":"FastTrackTr: Real-Time Multiobject Tracking With Transformers for Real World","display_name":"FastTrackTr: Real-Time Multiobject Tracking With Transformers for Real World","publication_year":2025,"publication_date":"2025-12-04","ids":{"openalex":"https://openalex.org/W4417001709","doi":"https://doi.org/10.1109/tii.2025.3631698"},"language":null,"primary_location":{"id":"doi:10.1109/tii.2025.3631698","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tii.2025.3631698","pdf_url":null,"source":{"id":"https://openalex.org/S184777250","display_name":"IEEE Transactions on Industrial Informatics","issn_l":"1551-3203","issn":["1551-3203","1941-0050"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Industrial Informatics","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101367497","display_name":"Pan Liao","orcid":"https://orcid.org/0009-0008-9734-2918"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Pan Liao","raw_affiliation_strings":["School of Automation, Northwestern Polytechnical University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5062038689","display_name":"Feng Yang","orcid":"https://orcid.org/0000-0001-6991-1628"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Feng Yang","raw_affiliation_strings":["School of Automation, Northwestern Polytechnical University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101577317","display_name":"Di Wu","orcid":"https://orcid.org/0000-0003-1664-5893"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Di Wu","raw_affiliation_strings":["School of Automation, Northwestern Polytechnical University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5086637913","display_name":"Jinwen Yu","orcid":"https://orcid.org/0009-0001-6366-7836"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinwen Yu","raw_affiliation_strings":["School of Automation, Northwestern Polytechnical University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101493609","display_name":"Xingxin Li","orcid":"https://orcid.org/0000-0002-6776-7367"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xingxin Li","raw_affiliation_strings":["China North Vehicle Research Institute, Beijing, China"],"affiliations":[{"raw_affiliation_string":"China North Vehicle Research Institute, Beijing, China","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101954574","display_name":"Dingwen Zhang","orcid":"https://orcid.org/0000-0001-8369-8886"},"institutions":[{"id":"https://openalex.org/I17145004","display_name":"Northwestern Polytechnical University","ror":"https://ror.org/01y0j0j86","country_code":"CN","type":"education","lineage":["https://openalex.org/I17145004"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Dingwen Zhang","raw_affiliation_strings":["School of Automation, Northwestern Polytechnical University, Xi&#x2019;an, China"],"affiliations":[{"raw_affiliation_string":"School of Automation, Northwestern Polytechnical University, Xi&#x2019;an, China","institution_ids":["https://openalex.org/I17145004"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5101367497"],"corresponding_institution_ids":["https://openalex.org/I17145004"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.42049759,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"22","issue":"3","first_page":"1817","last_page":"1827"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9455000162124634,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9455000162124634,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.009499999694526196,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.009399999864399433,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/rendering","display_name":"Rendering (computer graphics)","score":0.6085000038146973},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.578499972820282},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.527400016784668},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5133000016212463},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.4977000057697296},{"id":"https://openalex.org/keywords/encode","display_name":"ENCODE","score":0.4643000066280365},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.3982999920845032},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.3752000033855438},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.36410000920295715}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8184000253677368},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.6085000038146973},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.578499972820282},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.527400016784668},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5133000016212463},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.4977000057697296},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49729999899864197},{"id":"https://openalex.org/C66746571","wikidata":"https://www.wikidata.org/wiki/Q1134833","display_name":"ENCODE","level":3,"score":0.4643000066280365},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.42100000381469727},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.3982999920845032},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.3752000033855438},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.36410000920295715},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.3531999886035919},{"id":"https://openalex.org/C154586513","wikidata":"https://www.wikidata.org/wiki/Q4420972","display_name":"Tracking system","level":3,"score":0.34299999475479126},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.3402000069618225},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3328999876976013},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.32170000672340393},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.31529998779296875},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.31290000677108765},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.304500013589859},{"id":"https://openalex.org/C3261483","wikidata":"https://www.wikidata.org/wiki/Q119565","display_name":"Frame rate","level":2,"score":0.3043000102043152},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.2985000014305115},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.2944999933242798},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.28760001063346863},{"id":"https://openalex.org/C64876066","wikidata":"https://www.wikidata.org/wiki/Q5141226","display_name":"Cognitive neuroscience of visual object recognition","level":3,"score":0.2809999883174896},{"id":"https://openalex.org/C126042441","wikidata":"https://www.wikidata.org/wiki/Q1324888","display_name":"Frame (networking)","level":2,"score":0.2754000127315521},{"id":"https://openalex.org/C108882727","wikidata":"https://www.wikidata.org/wiki/Q2991685","display_name":"Solid modeling","level":2,"score":0.2637999951839447},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.258899986743927}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tii.2025.3631698","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tii.2025.3631698","pdf_url":null,"source":{"id":"https://openalex.org/S184777250","display_name":"IEEE Transactions on Industrial Informatics","issn_l":"1551-3203","issn":["1551-3203","1941-0050"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Industrial Informatics","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Transformer-based":[0,13,212],"multiobject":[1],"tracking":[2,50,150,173,196],"(MOT)":[3],"methods":[4],"have":[5],"attracted":[6],"significant":[7],"attention":[8],"from":[9,17,59,136],"researchers.":[10],"However,":[11],"these":[12,137],"models":[14],"often":[15],"suffer":[16],"suboptimal":[18],"inference":[19],"speeds":[20],"due":[21],"to":[22,33,233],"their":[23],"architectural":[24],"complexities":[25],"or":[26,110],"other":[27,210],"inherent":[28],"issues,":[29],"rendering":[30],"them":[31],"difficult":[32],"deploy":[34],"in":[35],"practical":[36,245],"industrial":[37],"applications.":[38,246],"To":[39],"address":[40],"this":[41],"challenge,":[42],"we":[43,71],"revisited":[44],"the":[45,144,206,222],"classic":[46],"joint":[47],"detection":[48],"and":[49,53,75,115,120,125],"(JDT)":[51],"paradigm":[52],"analyzed":[54],"existing":[55],"models.":[56],"Drawing":[57],"inspiration":[58],"Detection":[60],"Transformer\u2019s":[61],"(DETR)":[62],"object":[63,68],"queries,":[64],"which":[65],"naturally":[66],"encode":[67],"appearance":[69],"features,":[70],"constructed":[72],"a":[73,97,112,126],"fast":[74],"novel":[76],"JDT-type":[77],"MOT":[78],"framework":[79,91],"named":[80],"FastTrackTr":[81],"by":[82],"implementing":[83],"an":[84,179,184],"efficient":[85],"interframe":[86],"information":[87,105],"transfer":[88],"mechanism.":[89],"This":[90],"integrates":[92],"three":[93],"key":[94],"technological":[95],"innovations:":[96],"cross-decoder":[98],"mechanism":[99],"that":[100,130,168],"implicitly":[101],"incorporates":[102],"historical":[103,113,122],"trajectory":[104],"without":[106],"requiring":[107],"additional":[108],"queries":[109,147],"decoders,":[111],"encoder":[114],"decoder":[116],"pair":[117],"for":[118,149,244],"refining":[119],"utilizing":[121],"feature":[123],"representations,":[124],"deterministic":[127],"fixed-shape":[128],"architecture":[129],"enables":[131],"seamless":[132],"TensorRT":[133],"acceleration.":[134],"Benefiting":[135],"designs,":[138],"our":[139,169],"approach":[140],"not":[141],"only":[142],"reduces":[143],"number":[145],"of":[146,187],"required":[148],"but":[151],"also":[152],"avoids":[153],"introducing":[154],"excessive":[155],"network":[156],"structures,":[157],"ensuring":[158],"model":[159],"simplicity":[160],"while":[161,174],"maintaining":[162,175],"high":[163],"accuracy.":[164,177],"Experimental":[165],"results":[166],"show":[167],"method":[170],"achieves":[171,231],"real-time":[172,242],"state-of-the-art":[176],"On":[178],"NVIDIA":[180,223],"RTX":[181],"4090":[182],"with":[183],"image":[185],"size":[186],"1333":[188],"\u00d7":[189,238],"800,":[190],"it":[191,215],"reaches":[192],"62.4":[193],"higher":[194],"order":[195],"accuracy":[197],"(HOTA)":[198],"at":[199],"86.6":[200],"frames":[201],"per":[202],"second":[203],"(FPS)":[204],"on":[205,217,236],"DanceTrack":[207],"dataset,":[208],"outperforming":[209],"advanced":[211],"methods.":[213],"Furthermore,":[214],"excels":[216],"edge":[218],"devices,":[219],"such":[220],"as":[221],"Jetson":[224],"AGX":[225],"Orin,":[226],"where":[227],"its":[228],"lightweight":[229],"variant":[230],"up":[232],"59.2":[234],"FPS":[235],"640":[237,239],"images,":[240],"meeting":[241],"requirements":[243]},"counts_by_year":[],"updated_date":"2026-03-06T06:45:51.903784","created_date":"2025-12-04T00:00:00"}
