{"id":"https://openalex.org/W4362501010","doi":"https://doi.org/10.1109/tcsvt.2023.3263884","title":"STDFormer: Spatial-Temporal Motion Transformer for Multiple Object Tracking","display_name":"STDFormer: Spatial-Temporal Motion Transformer for Multiple Object Tracking","publication_year":2023,"publication_date":"2023-04-03","ids":{"openalex":"https://openalex.org/W4362501010","doi":"https://doi.org/10.1109/tcsvt.2023.3263884"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2023.3263884","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3263884","pdf_url":"https://ieeexplore.ieee.org/ielx7/76/4358651/10091152.pdf","source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"bronze","oa_url":"https://ieeexplore.ieee.org/ielx7/76/4358651/10091152.pdf","any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5017033250","display_name":"Mengjie Hu","orcid":"https://orcid.org/0000-0001-7712-3322"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Mengjie Hu","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-7712-3322","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068069124","display_name":"Xiaotong Zhu","orcid":"https://orcid.org/0000-0002-8485-2598"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaotong Zhu","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-8485-2598","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100383995","display_name":"Haotian Wang","orcid":"https://orcid.org/0000-0002-0816-6211"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haotian Wang","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054854116","display_name":"Shixiang Cao","orcid":"https://orcid.org/0000-0001-8816-7304"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shixiang Cao","raw_affiliation_strings":["Beijing Institute of Space Mechanics and Electricity, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0001-8816-7304","affiliations":[{"raw_affiliation_string":"Beijing Institute of Space Mechanics and Electricity, Beijing, China","institution_ids":[]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5013806533","display_name":"Chun Liu","orcid":"https://orcid.org/0000-0002-2834-9461"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chun Liu","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0002-2834-9461","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5045391965","display_name":"Qing Song","orcid":"https://orcid.org/0000-0003-4616-2200"},"institutions":[{"id":"https://openalex.org/I139759216","display_name":"Beijing University of Posts and Telecommunications","ror":"https://ror.org/04w9fbh59","country_code":"CN","type":"education","lineage":["https://openalex.org/I139759216"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qing Song","raw_affiliation_strings":["School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4616-2200","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beijing University of Posts and Telecommunications, Beijing, China","institution_ids":["https://openalex.org/I139759216"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5017033250"],"corresponding_institution_ids":["https://openalex.org/I139759216"],"apc_list":null,"apc_paid":null,"fwci":6.2406,"has_fulltext":true,"cited_by_count":53,"citation_normalized_percentile":{"value":0.97572499,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":98,"max":100},"biblio":{"volume":"33","issue":"11","first_page":"6571","last_page":"6594"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.996999979019165,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11448","display_name":"Face recognition and analysis","score":0.9934999942779541,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7583034038543701},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6964436173439026},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.6175135374069214},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.5792623162269592},{"id":"https://openalex.org/keywords/motion-estimation","display_name":"Motion estimation","score":0.5144665241241455},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.46246641874313354},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.4195820093154907},{"id":"https://openalex.org/keywords/embedding","display_name":"Embedding","score":0.41512274742126465},{"id":"https://openalex.org/keywords/match-moving","display_name":"Match moving","score":0.410357266664505},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.3737180233001709},{"id":"https://openalex.org/keywords/motion","display_name":"Motion (physics)","score":0.31113898754119873},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.22420817613601685}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7583034038543701},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6964436173439026},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6175135374069214},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.5792623162269592},{"id":"https://openalex.org/C10161872","wikidata":"https://www.wikidata.org/wiki/Q557891","display_name":"Motion estimation","level":2,"score":0.5144665241241455},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.46246641874313354},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.4195820093154907},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.41512274742126465},{"id":"https://openalex.org/C95020103","wikidata":"https://www.wikidata.org/wiki/Q1813492","display_name":"Match moving","level":3,"score":0.410357266664505},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.3737180233001709},{"id":"https://openalex.org/C104114177","wikidata":"https://www.wikidata.org/wiki/Q79782","display_name":"Motion (physics)","level":2,"score":0.31113898754119873},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.22420817613601685},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2023.3263884","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3263884","pdf_url":"https://ieeexplore.ieee.org/ielx7/76/4358651/10091152.pdf","source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":{"id":"doi:10.1109/tcsvt.2023.3263884","is_oa":true,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3263884","pdf_url":"https://ieeexplore.ieee.org/ielx7/76/4358651/10091152.pdf","source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.6200000047683716,"display_name":"Peace, Justice and strong institutions"}],"awards":[{"id":"https://openalex.org/G2627180095","display_name":null,"funder_award_id":"2022YFC3302200","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null}],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4362501010.pdf","grobid_xml":"https://content.openalex.org/works/W4362501010.grobid-xml"},"referenced_works_count":113,"referenced_works":["https://openalex.org/W639708223","https://openalex.org/W1536680647","https://openalex.org/W2016135469","https://openalex.org/W2020934227","https://openalex.org/W2113926057","https://openalex.org/W2119539043","https://openalex.org/W2124781496","https://openalex.org/W2252355370","https://openalex.org/W2291627510","https://openalex.org/W2511791013","https://openalex.org/W2525726571","https://openalex.org/W2570343428","https://openalex.org/W2579024533","https://openalex.org/W2603203130","https://openalex.org/W2605035112","https://openalex.org/W2618529757","https://openalex.org/W2766984662","https://openalex.org/W2786464815","https://openalex.org/W2889935068","https://openalex.org/W2891254924","https://openalex.org/W2894642126","https://openalex.org/W2900871370","https://openalex.org/W2903855329","https://openalex.org/W2908510526","https://openalex.org/W2920942303","https://openalex.org/W2951585248","https://openalex.org/W2962766617","https://openalex.org/W2963063317","https://openalex.org/W2963263347","https://openalex.org/W2963351448","https://openalex.org/W2963677766","https://openalex.org/W2964019074","https://openalex.org/W2981393651","https://openalex.org/W3005680577","https://openalex.org/W3006651016","https://openalex.org/W3012922853","https://openalex.org/W3018207438","https://openalex.org/W3027919498","https://openalex.org/W3035524453","https://openalex.org/W3035578948","https://openalex.org/W3035727180","https://openalex.org/W3084173793","https://openalex.org/W3086436251","https://openalex.org/W3094000868","https://openalex.org/W3095753995","https://openalex.org/W3096609285","https://openalex.org/W3099887740","https://openalex.org/W3104218139","https://openalex.org/W3104778224","https://openalex.org/W3106763294","https://openalex.org/W3108316907","https://openalex.org/W3115390238","https://openalex.org/W3115517346","https://openalex.org/W3119686997","https://openalex.org/W3126235906","https://openalex.org/W3130778992","https://openalex.org/W3149485574","https://openalex.org/W3165926952","https://openalex.org/W3166285241","https://openalex.org/W3167949052","https://openalex.org/W3171485246","https://openalex.org/W3174101598","https://openalex.org/W3174690341","https://openalex.org/W3179985441","https://openalex.org/W3184439416","https://openalex.org/W3185016686","https://openalex.org/W3195775608","https://openalex.org/W3197804339","https://openalex.org/W3205100603","https://openalex.org/W3207452968","https://openalex.org/W4205537101","https://openalex.org/W4226078731","https://openalex.org/W4283748233","https://openalex.org/W4285357233","https://openalex.org/W4286904999","https://openalex.org/W4304479854","https://openalex.org/W4307415560","https://openalex.org/W4310467366","https://openalex.org/W4312473433","https://openalex.org/W4312689495","https://openalex.org/W4312906297","https://openalex.org/W4313072323","https://openalex.org/W4313117614","https://openalex.org/W4319299988","https://openalex.org/W4319866011","https://openalex.org/W4385245566","https://openalex.org/W4386076204","https://openalex.org/W6620707391","https://openalex.org/W6678664622","https://openalex.org/W6696672603","https://openalex.org/W6726497184","https://openalex.org/W6736160952","https://openalex.org/W6739901393","https://openalex.org/W6748176785","https://openalex.org/W6757817989","https://openalex.org/W6760212410","https://openalex.org/W6774314701","https://openalex.org/W6775253321","https://openalex.org/W6778485988","https://openalex.org/W6780383567","https://openalex.org/W6788023325","https://openalex.org/W6795368335","https://openalex.org/W6798838024","https://openalex.org/W6799133303","https://openalex.org/W6801013943","https://openalex.org/W6802459829","https://openalex.org/W6803363630","https://openalex.org/W6809649412","https://openalex.org/W6810826495","https://openalex.org/W6810827814","https://openalex.org/W6839744764","https://openalex.org/W6840663683","https://openalex.org/W6846111883"],"related_works":["https://openalex.org/W2965594636","https://openalex.org/W2164674712","https://openalex.org/W2154918876","https://openalex.org/W3034182891","https://openalex.org/W2130582613","https://openalex.org/W4253668313","https://openalex.org/W2338820443","https://openalex.org/W2164117788","https://openalex.org/W2359434423","https://openalex.org/W2101683776"],"abstract_inverted_index":{"Mainstream":[0],"multi-object":[1],"tracking":[2,73],"methods":[3,265],"exploit":[4,93],"appearance":[5,18,25,49],"information":[6,9,29,103,109],"and/or":[7],"motion":[8,28,42,55,69,106,122,136,166],"to":[10,38,57,66,83,100,117,133,138,145,159,181,282],"achieve":[11],"interframe":[12],"association.":[13,89],"However,":[14],"dealing":[15],"with":[16,74,196,212],"similar":[17,243],"and":[19,35,51,70,107,113,141,172,202,224,230,262,275],"occlusion":[20,245],"is":[21,30,36,81,325],"a":[22,53,178,219,267],"challenge":[23],"for":[24,87,190,270],"information,":[26],"while":[27],"limited":[31],"by":[32],"linear":[33],"assumptions":[34],"prone":[37],"failure":[39],"in":[40,104,110,187,239,278,288,319],"nonlinear":[41,247],"patterns.":[43],"In":[44,151,280],"this":[45],"work,":[46],"we":[47,91,125,176,294],"disregard":[48],"clues":[50],"propose":[52],"pure":[54],"tracker":[56],"address":[58],"the":[59,94,119,147,161,165,169,173,183,205,215,234,250,253,257,271,284],"above":[60,184],"issues.":[61],"It":[62],"dexterously":[63],"utilizes":[64],"Transformer":[65,99,274],"estimate":[67],"complex":[68],"achieves":[71,225,305],"high-performance":[72],"low":[75],"computing":[76],"resources.":[77],"Furthermore,":[78],"contrastive":[79,127,263,276],"learning":[80,128,277],"introduced":[82],"optimize":[84],"feature":[85],"representation":[86],"robust":[88],"Specifically,":[90],"first":[92],"long-range":[95],"modeling":[96],"capability":[97],"of":[98,121,168,207,236,256,273,286],"mine":[101],"intention":[102],"temporal":[105],"decision":[108],"spatial":[111],"interaction":[112],"introduce":[114,126,142],"prior":[115],"detection":[116,174],"constrain":[118],"range":[120],"estimation.":[123],"Then,":[124],"as":[129],"an":[130],"auxiliary":[131],"task":[132],"extract":[134],"reliable":[135],"features":[137,167],"compute":[139],"affinity":[140,148],"bidirectional":[143],"matching":[144],"improve":[146],"computation":[149],"distribution.":[150],"addition,":[152,281],"given":[153],"that":[154,303,312],"both":[155],"tasks":[156,186],"are":[157],"dedicated":[158],"narrowing":[160],"embedding":[162],"distance":[163],"between":[164],"tracked":[170],"object":[171,317],"features,":[175],"design":[177],"joint-motion-and-association":[179],"framework":[180,189],"unify":[182],"two":[185],"one":[188],"optimization.":[191],"The":[192,300,323],"experimental":[193],"results":[194,301],"achieved":[195],"three":[197],"benchmark":[198],"datasets,":[199],"MOT17,":[200],"MOT20":[201],"DanceTrack,":[203],"verify":[204,283],"effectiveness":[206],"our":[208,237],"proposed":[209,216,258],"method.":[210],"Compared":[211],"state-of-the-art":[213,221,306],"methods,":[214],"STDFormer":[217,287,297,304],"sets":[218],"new":[220,268],"on":[222,228,298,308],"DanceTrack":[223],"competitive":[226],"performance":[227,307],"MOT17":[229],"MOT20.":[231],"This":[232],"demonstrates":[233],"advantage":[235],"method":[238,259],"handling":[240],"associations":[241,318],"under":[242],"appearance,":[244],"or":[246],"motion.":[248],"At":[249],"same":[251],"time,":[252],"significant":[254],"advantages":[255],"over":[260],"Transformer-based":[261],"learning-based":[264],"suggest":[266],"direction":[269],"application":[272],"MOT.":[279],"generalization":[285],"unmanned":[289],"aerial":[290],"vehicle":[291],"(UAV)":[292],"videos,":[293],"also":[295],"evaluate":[296],"VisDrone2019.":[299],"show":[302],"VisDrone2019,":[309],"which":[310],"proves":[311],"it":[313],"can":[314],"handle":[315],"small-scale":[316],"UAV":[320],"videos":[321],"well.":[322],"code":[324],"available":[326],"at":[327],"https://github.com/Xiaotong-Zhu/STDFormer.":[328]},"counts_by_year":[{"year":2026,"cited_by_count":5},{"year":2025,"cited_by_count":29},{"year":2024,"cited_by_count":14},{"year":2023,"cited_by_count":5}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
