{"id":"https://openalex.org/W4403792266","doi":"https://doi.org/10.1145/3664647.3680878","title":"Breaking Modality Gap in RGBT Tracking: Coupled Knowledge Distillation","display_name":"Breaking Modality Gap in RGBT Tracking: Coupled Knowledge Distillation","publication_year":2024,"publication_date":"2024-10-26","ids":{"openalex":"https://openalex.org/W4403792266","doi":"https://doi.org/10.1145/3664647.3680878"},"language":"en","primary_location":{"id":"doi:10.1145/3664647.3680878","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680878","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5007991351","display_name":"Andong Lu","orcid":"https://orcid.org/0000-0002-0902-2260"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Andong Lu","raw_affiliation_strings":["Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Anhui University, HeFei, AnHui, China"],"affiliations":[{"raw_affiliation_string":"Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Anhui University, HeFei, AnHui, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108419236","display_name":"J. Zhao","orcid":"https://orcid.org/0009-0002-8480-3988"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiacong Zhao","raw_affiliation_strings":["Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Anhui University, HeFei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Anhui University, HeFei, Anhui, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100398932","display_name":"Chenglong Li","orcid":"https://orcid.org/0000-0002-7233-2739"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenglong Li","raw_affiliation_strings":["Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Anhui University, HeFei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Anhui University, HeFei, Anhui, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101419454","display_name":"Yun Xiao","orcid":"https://orcid.org/0000-0002-5285-8565"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yun Xiao","raw_affiliation_strings":["Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Anhui University, HeFei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Anhui University, HeFei, Anhui, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100372676","display_name":"Bin Luo","orcid":"https://orcid.org/0000-0001-5948-5055"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Bin Luo","raw_affiliation_strings":["Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Anhui University, HeFei, Anhui, China"],"affiliations":[{"raw_affiliation_string":"Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Anhui University, HeFei, Anhui, China","institution_ids":["https://openalex.org/I143868143"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5007991351"],"corresponding_institution_ids":["https://openalex.org/I143868143"],"apc_list":null,"apc_paid":null,"fwci":1.5495,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.8471148,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":97,"max":99},"biblio":{"volume":null,"issue":null,"first_page":"9291","last_page":"9300"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9993000030517578,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10531","display_name":"Advanced Vision and Imaging","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11099","display_name":"Autonomous Vehicle Technology and Safety","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/2203","display_name":"Automotive Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6693481206893921},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5582261085510254},{"id":"https://openalex.org/keywords/distillation","display_name":"Distillation","score":0.5482689142227173},{"id":"https://openalex.org/keywords/tracking","display_name":"Tracking (education)","score":0.5151006579399109},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.33233642578125},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.3301195502281189},{"id":"https://openalex.org/keywords/chemistry","display_name":"Chemistry","score":0.11772790551185608},{"id":"https://openalex.org/keywords/psychology","display_name":"Psychology","score":0.10586455464363098},{"id":"https://openalex.org/keywords/chromatography","display_name":"Chromatography","score":0.0832798182964325}],"concepts":[{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6693481206893921},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5582261085510254},{"id":"https://openalex.org/C204030448","wikidata":"https://www.wikidata.org/wiki/Q101017","display_name":"Distillation","level":2,"score":0.5482689142227173},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.5151006579399109},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.33233642578125},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.3301195502281189},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.11772790551185608},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.10586455464363098},{"id":"https://openalex.org/C43617362","wikidata":"https://www.wikidata.org/wiki/Q170050","display_name":"Chromatography","level":1,"score":0.0832798182964325},{"id":"https://openalex.org/C19417346","wikidata":"https://www.wikidata.org/wiki/Q7922","display_name":"Pedagogy","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3664647.3680878","is_oa":false,"landing_page_url":"https://doi.org/10.1145/3664647.3680878","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 32nd ACM International Conference on Multimedia","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":56,"referenced_works":["https://openalex.org/W2527415613","https://openalex.org/W2603777577","https://openalex.org/W2765667535","https://openalex.org/W2963188742","https://openalex.org/W2963905288","https://openalex.org/W2996575194","https://openalex.org/W3012425959","https://openalex.org/W3034203264","https://openalex.org/W3035020406","https://openalex.org/W3099671582","https://openalex.org/W3099681648","https://openalex.org/W3101990647","https://openalex.org/W3110562975","https://openalex.org/W3132864630","https://openalex.org/W3158472981","https://openalex.org/W3167917117","https://openalex.org/W3171106688","https://openalex.org/W3174102142","https://openalex.org/W3176765321","https://openalex.org/W3177008256","https://openalex.org/W3183152796","https://openalex.org/W3183904268","https://openalex.org/W3190537575","https://openalex.org/W3212622989","https://openalex.org/W4210368306","https://openalex.org/W4226017279","https://openalex.org/W4226126595","https://openalex.org/W4226385753","https://openalex.org/W4234552385","https://openalex.org/W4283807600","https://openalex.org/W4283808043","https://openalex.org/W4286974493","https://openalex.org/W4287660544","https://openalex.org/W4304098539","https://openalex.org/W4312262772","https://openalex.org/W4312751983","https://openalex.org/W4313156423","https://openalex.org/W4375843773","https://openalex.org/W4376226279","https://openalex.org/W4382240192","https://openalex.org/W4385215686","https://openalex.org/W4386066394","https://openalex.org/W4386075603","https://openalex.org/W4386075647","https://openalex.org/W4386075687","https://openalex.org/W4386075851","https://openalex.org/W4386083029","https://openalex.org/W4386083135","https://openalex.org/W4387969861","https://openalex.org/W4389345002","https://openalex.org/W4390872684","https://openalex.org/W4390873110","https://openalex.org/W4392824656","https://openalex.org/W4393147243","https://openalex.org/W4393148493","https://openalex.org/W4394625688"],"related_works":["https://openalex.org/W2772917594","https://openalex.org/W2036807459","https://openalex.org/W2058170566","https://openalex.org/W2755342338","https://openalex.org/W2166024367","https://openalex.org/W3116076068","https://openalex.org/W2229312674","https://openalex.org/W2951359407","https://openalex.org/W2079911747","https://openalex.org/W1969923398"],"abstract_inverted_index":{"Modality":[0],"gap":[1,27,100],"between":[2],"RGB":[3,130,172],"and":[4,71,131,137,173,187,200],"thermal":[5,174],"infrared":[6],"(TIR)":[7],"images":[8],"is":[9],"a":[10,40,183,188],"crucial":[11],"issue":[12],"but":[13],"often":[14],"overlooked":[15],"in":[16,30,120,161],"existing":[17],"RGBT":[18,62,208],"tracking":[19,198,209,225],"methods.":[20],"It":[21],"can":[22,97],"be":[23],"observed":[24],"that":[25],"modality":[26,57,99,177],"mainly":[28],"lies":[29],"the":[31,73,89,106,114,135,148,156,212,215,223],"image":[32],"style":[33,74,80,90,109],"difference.":[34],"In":[35,64,179],"this":[36,125],"work,":[37],"we":[38,66,96,127,181],"propose":[39],"novel":[41],"Coupled":[42],"Knowledge":[43],"Distillation":[44],"framework":[45,165],"called":[46],"CKD,":[47],"which":[48],"pursues":[49],"common":[50],"styles":[51],"of":[52,92,101,108,117,171,214,227],"different":[53,102],"modalities":[54,103,119,175],"to":[55,77,113,166,196],"break":[56,98],"gap,":[58],"for":[59],"high":[60],"performance":[61],"tracking.":[63],"particular,":[65],"introduce":[67],"two":[68,93,118,143,158],"student":[69,94,121,144],"networks":[70,133,145],"employ":[72],"distillation":[75,107,159],"loss":[76],"make":[78],"their":[79,139],"features":[81,110],"consistent":[82],"as":[83,85,134],"much":[84],"possible.":[86],"Through":[87],"alleviating":[88],"difference":[91],"networks,":[95],"well.":[104],"However,":[105],"might":[111],"harm":[112],"content":[115,140],"representations":[116,170],"networks.":[122],"To":[123],"handle":[124],"issue,":[126],"take":[128],"original":[129],"TIR":[132],"teachers,":[136],"distill":[138],"knowledge":[141],"into":[142,194],"respectively":[146],"by":[147],"style-content":[149],"orthogonal":[150],"feature":[151,169],"decoupling":[152],"scheme.":[153],"We":[154],"couple":[155],"above":[157],"processes":[160],"an":[162],"online":[163],"optimization":[164],"form":[167],"new":[168],"without":[176],"gap.":[178],"addition,":[180],"design":[182],"masked":[184],"modeling":[185],"strategy":[186,193],"multi-modal":[189],"candidate":[190],"token":[191],"elimination":[192],"CKD":[195],"improve":[197],"robustness":[199],"efficiency":[201],"respectively.":[202],"Extensive":[203],"experiments":[204],"on":[205],"five":[206],"standard":[207],"datasets":[210],"validate":[211],"effectiveness":[213],"proposed":[216],"method":[217],"against":[218],"state-of-the-art":[219],"methods":[220],"while":[221],"achieving":[222],"fastest":[224],"speed":[226],"96.4":[228],"FPS.":[229]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":5}],"updated_date":"2026-03-12T08:34:05.389933","created_date":"2025-10-10T00:00:00"}
