{"id":"https://openalex.org/W4381735302","doi":"https://doi.org/10.1109/tcsvt.2023.3288353","title":"Unified Transformer With Isomorphic Branches for Natural Language Tracking","display_name":"Unified Transformer With Isomorphic Branches for Natural Language Tracking","publication_year":2023,"publication_date":"2023-06-23","ids":{"openalex":"https://openalex.org/W4381735302","doi":"https://doi.org/10.1109/tcsvt.2023.3288353"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2023.3288353","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3288353","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5100324876","display_name":"Rong Wang","orcid":"https://orcid.org/0000-0001-9251-3775"},"institutions":[{"id":"https://openalex.org/I37448385","display_name":"China People's Public Security University","ror":"https://ror.org/05twya590","country_code":"CN","type":"education","lineage":["https://openalex.org/I37448385"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Rong Wang","raw_affiliation_strings":["Police Information Engineering and Network Security College, People&#x2019;s Public Security University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Police Information Engineering and Network Security College, People&#x2019;s Public Security University of China, Beijing, China","institution_ids":["https://openalex.org/I37448385"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075863583","display_name":"Zongheng Tang","orcid":"https://orcid.org/0000-0002-9903-802X"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zongheng Tang","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University, Beijing, China","Hangzhou Innovation Institute, Beihang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]},{"raw_affiliation_string":"Hangzhou Innovation Institute, Beihang University, Hangzhou, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101187943","display_name":"Qianli Zhou","orcid":null},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Qianli Zhou","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University, Beijing, China","Hangzhou Innovation Institute, Beihang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]},{"raw_affiliation_string":"Hangzhou Innovation Institute, Beihang University, Hangzhou, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100683619","display_name":"Xiaoqian Liu","orcid":"https://orcid.org/0009-0006-1919-6519"},"institutions":[{"id":"https://openalex.org/I177955009","display_name":"China University of Political Science and Law","ror":"https://ror.org/00e49gy82","country_code":"CN","type":"education","lineage":["https://openalex.org/I177955009"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoqian Liu","raw_affiliation_strings":["School of Sociology, China University of Political Science and Law, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Sociology, China University of Political Science and Law, Beijing, China","institution_ids":["https://openalex.org/I177955009"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5056811650","display_name":"Tianrui Hui","orcid":"https://orcid.org/0000-0002-1172-1554"},"institutions":[{"id":"https://openalex.org/I19820366","display_name":"Chinese Academy of Sciences","ror":"https://ror.org/034t30j35","country_code":"CN","type":"government","lineage":["https://openalex.org/I19820366"]},{"id":"https://openalex.org/I4210156404","display_name":"Institute of Information Engineering","ror":"https://ror.org/04r53se39","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210156404"]},{"id":"https://openalex.org/I4210165038","display_name":"University of Chinese Academy of Sciences","ror":"https://ror.org/05qbk4x57","country_code":"CN","type":"education","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210165038"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Tianrui Hui","raw_affiliation_strings":["Institute of Information Engineering, Chinese Academy of Sciences, Beijing, China","School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Institute of Information Engineering, Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210156404","https://openalex.org/I19820366"]},{"raw_affiliation_string":"School of Cyber Security, University of Chinese Academy of Sciences, Beijing, China","institution_ids":["https://openalex.org/I4210165038"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050916960","display_name":"Quange Tan","orcid":null},"institutions":[{"id":"https://openalex.org/I37448385","display_name":"China People's Public Security University","ror":"https://ror.org/05twya590","country_code":"CN","type":"education","lineage":["https://openalex.org/I37448385"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Quange Tan","raw_affiliation_strings":["Police Information Engineering and Network Security College, People&#x2019;s Public Security University of China, Beijing, China"],"affiliations":[{"raw_affiliation_string":"Police Information Engineering and Network Security College, People&#x2019;s Public Security University of China, Beijing, China","institution_ids":["https://openalex.org/I37448385"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100330138","display_name":"Si Liu","orcid":"https://orcid.org/0000-0002-9180-2935"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Si Liu","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University, Beijing, China","Hangzhou Innovation Institute, Beihang University, Hangzhou, China"],"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]},{"raw_affiliation_string":"Hangzhou Innovation Institute, Beihang University, Hangzhou, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5100324876"],"corresponding_institution_ids":["https://openalex.org/I37448385"],"apc_list":null,"apc_paid":null,"fwci":1.6851,"has_fulltext":false,"cited_by_count":14,"citation_normalized_percentile":{"value":0.86296945,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":90,"max":99},"biblio":{"volume":"33","issue":"9","first_page":"4529","last_page":"4541"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10812","display_name":"Human Pose and Action Recognition","score":0.9891999959945679,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.9847000241279602,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7973192930221558},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.6274807453155518},{"id":"https://openalex.org/keywords/natural-language","display_name":"Natural language","score":0.6089960932731628},{"id":"https://openalex.org/keywords/video-tracking","display_name":"Video tracking","score":0.5869559645652771},{"id":"https://openalex.org/keywords/minimum-bounding-box","display_name":"Minimum bounding box","score":0.5845350027084351},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.5252465605735779},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.44592535495758057},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.43136709928512573},{"id":"https://openalex.org/keywords/eye-tracking","display_name":"Eye tracking","score":0.42155903577804565},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.4137979745864868},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.36510002613067627},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.3182498514652252},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.1346847414970398},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08772489428520203}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7973192930221558},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6274807453155518},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.6089960932731628},{"id":"https://openalex.org/C202474056","wikidata":"https://www.wikidata.org/wiki/Q1931635","display_name":"Video tracking","level":3,"score":0.5869559645652771},{"id":"https://openalex.org/C147037132","wikidata":"https://www.wikidata.org/wiki/Q6865426","display_name":"Minimum bounding box","level":3,"score":0.5845350027084351},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.5252465605735779},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.44592535495758057},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.43136709928512573},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.42155903577804565},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.4137979745864868},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.36510002613067627},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.3182498514652252},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.1346847414970398},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08772489428520203},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2023.3288353","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2023.3288353","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.7599999904632568}],"awards":[{"id":"https://openalex.org/G1874218645","display_name":null,"funder_award_id":"61976250","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G5696407354","display_name":null,"funder_award_id":"62122010","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8087517129","display_name":null,"funder_award_id":"62076246","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G8986216942","display_name":null,"funder_award_id":"2022ZD0115502","funder_id":"https://openalex.org/F4320335777","funder_display_name":"National Key Research and Development Program of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320335777","display_name":"National Key Research and Development Program of China","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":70,"referenced_works":["https://openalex.org/W1773149199","https://openalex.org/W1825604117","https://openalex.org/W1857884451","https://openalex.org/W2089961441","https://openalex.org/W2194775991","https://openalex.org/W2222512263","https://openalex.org/W2247513039","https://openalex.org/W2251512949","https://openalex.org/W2470394683","https://openalex.org/W2571175805","https://openalex.org/W2747053578","https://openalex.org/W2799058067","https://openalex.org/W2808989867","https://openalex.org/W2886904239","https://openalex.org/W2920748649","https://openalex.org/W2963080533","https://openalex.org/W2963109634","https://openalex.org/W2963534981","https://openalex.org/W2963735856","https://openalex.org/W2964242925","https://openalex.org/W2964423614","https://openalex.org/W2965373594","https://openalex.org/W2966759264","https://openalex.org/W2978370258","https://openalex.org/W2989688045","https://openalex.org/W2993231436","https://openalex.org/W2997896013","https://openalex.org/W3001584168","https://openalex.org/W3010072143","https://openalex.org/W3034772468","https://openalex.org/W3035356601","https://openalex.org/W3035419698","https://openalex.org/W3035571898","https://openalex.org/W3035590142","https://openalex.org/W3096609285","https://openalex.org/W3098232790","https://openalex.org/W3106542916","https://openalex.org/W3108519869","https://openalex.org/W3116359960","https://openalex.org/W3127152723","https://openalex.org/W3131500599","https://openalex.org/W3135450171","https://openalex.org/W3138516171","https://openalex.org/W3162090017","https://openalex.org/W3162457465","https://openalex.org/W3166712493","https://openalex.org/W3167536469","https://openalex.org/W3171547673","https://openalex.org/W3173871266","https://openalex.org/W3175187932","https://openalex.org/W3178075329","https://openalex.org/W3181069167","https://openalex.org/W4214490042","https://openalex.org/W4214759957","https://openalex.org/W4285134409","https://openalex.org/W4285283873","https://openalex.org/W4289126595","https://openalex.org/W4312295550","https://openalex.org/W4312330256","https://openalex.org/W4315473428","https://openalex.org/W4385245566","https://openalex.org/W6620707391","https://openalex.org/W6684191040","https://openalex.org/W6746052068","https://openalex.org/W6757135208","https://openalex.org/W6769243733","https://openalex.org/W6771096273","https://openalex.org/W6795146805","https://openalex.org/W6795704626","https://openalex.org/W6797397777"],"related_works":["https://openalex.org/W4318751391","https://openalex.org/W2940082708","https://openalex.org/W2901505109","https://openalex.org/W4292829955","https://openalex.org/W2287881387","https://openalex.org/W4298299496","https://openalex.org/W2609618931","https://openalex.org/W2988815316","https://openalex.org/W3082619268","https://openalex.org/W4390755799"],"abstract_inverted_index":{"Natural":[0],"language":[1,13,110,130,181,189,209],"tracking":[2,30,70,79,131,142,174,197,210],"aims":[3],"to":[4,10,44,54,81,104,149],"localize":[5],"the":[6,46,52,56,109,113,154,173,177],"target":[7,57,175],"object":[8,29],"referred":[9],"by":[11],"a":[12,16,34,59,124,160,200],"description":[14,111],"using":[15],"sequence":[17],"of":[18,48,172,186],"bounding":[19,35],"boxes":[20],"in":[21,58,90],"video":[22],"frames.":[23],"Compared":[24],"with":[25,32,101,198],"traditional":[26],"visual":[27,178,187],"single":[28,201],"initialized":[31],"only":[33,199],"box":[36],"(BBox),":[37],"this":[38,83],"task":[39],"introduces":[40],"high-level":[41],"semantic":[42],"information":[43,117,171],"reduce":[45],"ambiguity":[47],"BBox":[49],"and":[50,68,78,112,141,180,188],"enhance":[51],"ability":[53],"retrieve":[55],"global":[60,170],"manner.":[61],"Thus,":[62],"it":[63],"can":[64,99,167,192],"yield":[65],"more":[66],"accurate":[67],"robust":[69],"results.":[71],"Previous":[72],"methods":[73],"usually":[74],"adopt":[75],"off-the-shelf":[76],"grounding":[77,140],"branches":[80,98,143],"tackle":[82],"task,":[84],"where":[85,144],"feature":[86],"representations":[87],"are":[88],"learned":[89],"isolation":[91],"without":[92],"benefiting":[93],"each":[94,102],"other.":[95],"The":[96],"two":[97],"associate":[100],"other":[103],"discover":[105],"crucial":[106],"clues":[107],"since":[108],"template":[114,179],"image":[115],"provide":[116],"from":[118,176],"different":[119],"sources.":[120],"Therefore,":[121],"we":[122,158,191],"propose":[123,159],"unified":[125],"transformer":[126],"method":[127],"for":[128,139,153],"natural":[129,208],"named":[132],"TransNLT,":[133],"which":[134,166],"utilizes":[135],"isomorphic":[136],"Transformer":[137],"structures":[138],"collaborative":[145],"learning":[146],"is":[147],"enabled":[148],"construct":[150],"comprehensive":[151],"features":[152],"target.":[155],"In":[156],"addition,":[157],"Selective":[161],"Feature":[162],"Gathering":[163],"(SFG)":[164],"module":[165],"integrate":[168],"cross-modal":[169],"description.":[182],"Through":[183],"effective":[184],"interaction":[185],"information,":[190],"achieve":[193],"better":[194],"results":[195],"than":[196],"modality.":[202],"Extensive":[203],"experiments":[204],"on":[205],"three":[206],"popular":[207],"benchmarks":[211],"show":[212],"our":[213],"proposed":[214],"TransNLT":[215],"outperforms":[216],"previous":[217],"state-of-the-art":[218],"methods.":[219]},"counts_by_year":[{"year":2026,"cited_by_count":2},{"year":2025,"cited_by_count":9},{"year":2024,"cited_by_count":2},{"year":2023,"cited_by_count":1}],"updated_date":"2026-03-27T05:58:40.876381","created_date":"2025-10-10T00:00:00"}
