{"id":"https://openalex.org/W4405755115","doi":"https://doi.org/10.1109/tmm.2024.3521842","title":"Augment One With Others: Generalizing to Unforeseen Variations for Visual Tracking","display_name":"Augment One With Others: Generalizing to Unforeseen Variations for Visual Tracking","publication_year":2024,"publication_date":"2024-12-24","ids":{"openalex":"https://openalex.org/W4405755115","doi":"https://doi.org/10.1109/tmm.2024.3521842"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2024.3521842","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2024.3521842","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101490398","display_name":"Jinpu Zhang","orcid":"https://orcid.org/0000-0002-0617-0452"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jinpu Zhang","raw_affiliation_strings":["School of Artificial Intelligence and Automation, Huazhong University of Science and Technology, Wuhan, China"],"raw_orcid":"https://orcid.org/0000-0002-0617-0452","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence and Automation, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101584518","display_name":"Ziwen Li","orcid":"https://orcid.org/0000-0002-8594-3133"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ziwen Li","raw_affiliation_strings":["School of Artificial Intelligence and Automation, Huazhong University of Science and Technology, Wuhan, China"],"raw_orcid":"https://orcid.org/0000-0002-8594-3133","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence and Automation, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067428532","display_name":"Ruonan Wei","orcid":"https://orcid.org/0000-0002-2562-6021"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ruonan Wei","raw_affiliation_strings":["School of Artificial Intelligence and Automation, Huazhong University of Science and Technology, Wuhan, China"],"raw_orcid":"https://orcid.org/0000-0002-2562-6021","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence and Automation, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5030517812","display_name":"Yuehuan Wang","orcid":"https://orcid.org/0000-0001-7046-7587"},"institutions":[{"id":"https://openalex.org/I47720641","display_name":"Huazhong University of Science and Technology","ror":"https://ror.org/00p991c53","country_code":"CN","type":"education","lineage":["https://openalex.org/I47720641"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yuehuan Wang","raw_affiliation_strings":["School of Artificial Intelligence and Automation, Huazhong University of Science and Technology, Wuhan, China"],"raw_orcid":"https://orcid.org/0000-0001-7046-7587","affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence and Automation, Huazhong University of Science and Technology, Wuhan, China","institution_ids":["https://openalex.org/I47720641"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5101490398"],"corresponding_institution_ids":["https://openalex.org/I47720641"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.23418114,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"27","issue":null,"first_page":"1461","last_page":"1474"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.8964999914169312,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11707","display_name":"Gaze Tracking and Assistive Technology","score":0.8964999914169312,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.8381999731063843,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.7832000255584717,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7927933931350708},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5088315606117249},{"id":"https://openalex.org/keywords/augment","display_name":"Augment","score":0.4518935978412628},{"id":"https://openalex.org/keywords/eye-tracking","display_name":"Eye tracking","score":0.44194936752319336},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4176673889160156},{"id":"https://openalex.org/keywords/visualization","display_name":"Visualization","score":0.416833758354187},{"id":"https://openalex.org/keywords/human\u2013computer-interaction","display_name":"Human\u2013computer interaction","score":0.39120015501976013}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7927933931350708},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5088315606117249},{"id":"https://openalex.org/C2779070825","wikidata":"https://www.wikidata.org/wiki/Q760434","display_name":"Augment","level":2,"score":0.4518935978412628},{"id":"https://openalex.org/C56461940","wikidata":"https://www.wikidata.org/wiki/Q970687","display_name":"Eye tracking","level":2,"score":0.44194936752319336},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4176673889160156},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.416833758354187},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.39120015501976013},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2024.3521842","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2024.3521842","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":71,"referenced_works":["https://openalex.org/W153185079","https://openalex.org/W2158592639","https://openalex.org/W2470394683","https://openalex.org/W2776035257","https://openalex.org/W2794744029","https://openalex.org/W2799058067","https://openalex.org/W2891033863","https://openalex.org/W2898200825","https://openalex.org/W2937749627","https://openalex.org/W2955747520","https://openalex.org/W2962824803","https://openalex.org/W2963227409","https://openalex.org/W2963534981","https://openalex.org/W2963855133","https://openalex.org/W2964242925","https://openalex.org/W2964423614","https://openalex.org/W2966759264","https://openalex.org/W2987460522","https://openalex.org/W2990205821","https://openalex.org/W2992308087","https://openalex.org/W2998027361","https://openalex.org/W2998237070","https://openalex.org/W2998434318","https://openalex.org/W3001584168","https://openalex.org/W3009294634","https://openalex.org/W3017266435","https://openalex.org/W3034297219","https://openalex.org/W3034617042","https://openalex.org/W3035257046","https://openalex.org/W3035453691","https://openalex.org/W3035571898","https://openalex.org/W3035672751","https://openalex.org/W3035682985","https://openalex.org/W3038946636","https://openalex.org/W3047841915","https://openalex.org/W3104158266","https://openalex.org/W3108519869","https://openalex.org/W3126121388","https://openalex.org/W3127756064","https://openalex.org/W3159231306","https://openalex.org/W3167536469","https://openalex.org/W3167762749","https://openalex.org/W3168663926","https://openalex.org/W3172355732","https://openalex.org/W3172670627","https://openalex.org/W3173344965","https://openalex.org/W3185864054","https://openalex.org/W3203857058","https://openalex.org/W3204554907","https://openalex.org/W3214586131","https://openalex.org/W4214759957","https://openalex.org/W4304481542","https://openalex.org/W4312255167","https://openalex.org/W4312323989","https://openalex.org/W4312472480","https://openalex.org/W4312751983","https://openalex.org/W4312805142","https://openalex.org/W4313555658","https://openalex.org/W4386066459","https://openalex.org/W4388505511","https://openalex.org/W6743928203","https://openalex.org/W6746638498","https://openalex.org/W6755837410","https://openalex.org/W6765721730","https://openalex.org/W6766093832","https://openalex.org/W6770979763","https://openalex.org/W6779913302","https://openalex.org/W6788840927","https://openalex.org/W6797888435","https://openalex.org/W6805147364","https://openalex.org/W6852835101"],"related_works":["https://openalex.org/W2943769328","https://openalex.org/W4386921804","https://openalex.org/W2802830363","https://openalex.org/W3187381656","https://openalex.org/W2810824249","https://openalex.org/W2811430115","https://openalex.org/W2994363382","https://openalex.org/W2052481242","https://openalex.org/W2774867697","https://openalex.org/W4302387238"],"abstract_inverted_index":{"Unforeseen":[0],"appearance":[1],"variation":[2],"is":[3],"a":[4,13,89],"challenging":[5,150],"factor":[6],"for":[7,26],"visual":[8],"tracking.":[9],"This":[10],"paper":[11],"provides":[12],"novel":[14],"solution":[15],"from":[16],"semantic":[17,92,118],"data":[18],"augmentation,":[19],"which":[20,102],"facilitates":[21],"offline":[22],"training":[23,77,127],"of":[24,41,80],"trackers":[25],"better":[27],"generalization.":[28],"We":[29],"utilize":[30],"existing":[31],"samples":[32,108],"to":[33,36,68,109],"obtain":[34],"knowledge":[35],"augment":[37],"another":[38],"in":[39,53],"terms":[40],"diversity":[42],"and":[43,72,112,115,124,161,175],"hardness.":[44],"First,":[45],"we":[46,62,95],"propose":[47,96],"that":[48,153],"the":[49,64,84,97,122,126,141,169],"similarity":[50,78],"matching":[51],"space":[52],"Siamese-like":[54],"models":[55],"has":[56],"class-agnostic":[57],"transferability.":[58],"Based":[59],"on":[60,148],"this,":[61],"design":[63],"Latent":[65],"Augmentation":[66],"(LaAug)":[67],"transfer":[69],"relevant":[70],"variations":[71],"suppress":[73],"irrelevant":[74],"ones":[75],"between":[76,105],"embeddings":[79],"different":[81,106],"classes.":[82],"Thus":[83],"model":[85,142],"can":[86,138,163],"generalize":[87],"across":[88],"more":[90],"diverse":[91],"distribution.":[93],"Then,":[94],"Semantic":[98],"Interaction":[99],"Mix":[100],"(SIMix),":[101],"interacts":[103],"moments":[104],"feature":[107],"contaminate":[110],"structure":[111],"texture":[113],"attributes":[114],"retain":[116],"other":[117],"attributes.":[119],"SIMix":[120],"simulates":[121],"occlusion":[123],"complements":[125],"distribution":[128],"with":[129,135],"hard":[130],"cases.":[131],"The":[132],"mixed":[133],"features":[134],"adversarial":[136],"perturbations":[137],"empirically":[139],"enable":[140],"against":[143],"external":[144],"environmental":[145],"disturbances.":[146],"Experiments":[147],"six":[149],"benchmarks":[151],"demonstrate":[152],"three":[154],"representative":[155],"tracking":[156],"models,":[157],"i.e.,":[158],"SiamBAN,":[159],"TransT":[160],"OSTrack,":[162],"be":[164],"consistently":[165],"improved":[166],"by":[167],"incorporating":[168],"proposed":[170],"methods":[171],"without":[172],"extra":[173],"parameters":[174],"inference":[176],"cost.":[177]},"counts_by_year":[],"updated_date":"2025-12-23T23:11:35.936235","created_date":"2025-10-10T00:00:00"}
