{"id":"https://openalex.org/W4395017442","doi":"https://doi.org/10.1109/tcsvt.2024.3391802","title":"RGBT Tracking via Progressive Fusion Transformer With Dynamically Guided Learning","display_name":"RGBT Tracking via Progressive Fusion Transformer With Dynamically Guided Learning","publication_year":2024,"publication_date":"2024-04-22","ids":{"openalex":"https://openalex.org/W4395017442","doi":"https://doi.org/10.1109/tcsvt.2024.3391802"},"language":"en","primary_location":{"id":"doi:10.1109/tcsvt.2024.3391802","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3391802","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5038904514","display_name":"Yabin Zhu","orcid":"https://orcid.org/0000-0002-1000-2750"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yabin Zhu","raw_affiliation_strings":["Key Laboratory of Intelligent Computing and Signal Processing of Ministry of Education, Anhui University, Hefei, China","Key Laboratory of Electromagnetic Environmental Sensing of Anhui Higher Education Institutes, School of Electronic and Information Engineering, Key Laboratory of Intelligent Computing and Signal Processing of Ministry of Education, Anhui University, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Key Laboratory of Intelligent Computing and Signal Processing of Ministry of Education, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"Key Laboratory of Electromagnetic Environmental Sensing of Anhui Higher Education Institutes, School of Electronic and Information Engineering, Key Laboratory of Intelligent Computing and Signal Processing of Ministry of Education, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100398932","display_name":"Chenglong Li","orcid":"https://orcid.org/0000-0002-7233-2739"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chenglong Li","raw_affiliation_strings":["Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Anhui University, Hefei, China","Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui University, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Artificial Intelligence, Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100411426","display_name":"Xiao Wang","orcid":"https://orcid.org/0000-0001-6117-6745"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiao Wang","raw_affiliation_strings":["Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Anhui University, Hefei, China","Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui University, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030720334","display_name":"Jin Tang","orcid":"https://orcid.org/0000-0001-8375-3590"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jin Tang","raw_affiliation_strings":["Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Anhui University, Hefei, China","Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui University, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"Anhui Provincial Key Laboratory of Multimodal Cognitive Computation, School of Computer Science and Technology, Information Materials and Intelligent Sensing Laboratory of Anhui Province, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5049963236","display_name":"Zhixiang Huang","orcid":"https://orcid.org/0000-0002-8023-9075"},"institutions":[{"id":"https://openalex.org/I143868143","display_name":"Anhui University","ror":"https://ror.org/05th6yx34","country_code":"CN","type":"education","lineage":["https://openalex.org/I143868143"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhixiang Huang","raw_affiliation_strings":["Information Materials and Intelligent Sensing Laboratory of Anhui Province, Center for Big Data and Population Health of the Institute of Health and Medcine, Anhui University, Hefei, China","Key Laboratory of Electromagnetic Environmental Sensing of Anhui Higher Education Institutes, School of Electronic and Information Engineering, Key Laboratory of Intelligent Computing and Signal Processing of Ministry of Education, Anhui University, Hefei, China"],"affiliations":[{"raw_affiliation_string":"Information Materials and Intelligent Sensing Laboratory of Anhui Province, Center for Big Data and Population Health of the Institute of Health and Medcine, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]},{"raw_affiliation_string":"Key Laboratory of Electromagnetic Environmental Sensing of Anhui Higher Education Institutes, School of Electronic and Information Engineering, Key Laboratory of Intelligent Computing and Signal Processing of Ministry of Education, Anhui University, Hefei, China","institution_ids":["https://openalex.org/I143868143"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5038904514"],"corresponding_institution_ids":["https://openalex.org/I143868143"],"apc_list":null,"apc_paid":null,"fwci":3.9474,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.94696196,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"34","issue":"9","first_page":"8722","last_page":"8735"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10331","display_name":"Video Surveillance and Tracking Methods","score":0.9998000264167786,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10036","display_name":"Advanced Neural Network Applications","score":0.9950000047683716,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11605","display_name":"Visual Attention and Saliency Detection","score":0.9941999912261963,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.7265461087226868},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.6981908082962036},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.6500009298324585},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.637151837348938},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5288019180297852},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.517665445804596},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.4851861596107483},{"id":"https://openalex.org/keywords/fusion-mechanism","display_name":"Fusion mechanism","score":0.46101298928260803},{"id":"https://openalex.org/keywords/multimodal-learning","display_name":"Multimodal learning","score":0.43014290928840637},{"id":"https://openalex.org/keywords/machine-learning","display_name":"Machine learning","score":0.38640522956848145},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.3417772948741913},{"id":"https://openalex.org/keywords/engineering","display_name":"Engineering","score":0.08735853433609009}],"concepts":[{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.7265461087226868},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6981908082962036},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.6500009298324585},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.637151837348938},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5288019180297852},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.517665445804596},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.4851861596107483},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.46101298928260803},{"id":"https://openalex.org/C2780660688","wikidata":"https://www.wikidata.org/wiki/Q25052564","display_name":"Multimodal learning","level":2,"score":0.43014290928840637},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.38640522956848145},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.3417772948741913},{"id":"https://openalex.org/C127413603","wikidata":"https://www.wikidata.org/wiki/Q11023","display_name":"Engineering","level":0,"score":0.08735853433609009},{"id":"https://openalex.org/C199539241","wikidata":"https://www.wikidata.org/wiki/Q7748","display_name":"Law","level":1,"score":0.0},{"id":"https://openalex.org/C17744445","wikidata":"https://www.wikidata.org/wiki/Q36442","display_name":"Political science","level":0,"score":0.0},{"id":"https://openalex.org/C103038307","wikidata":"https://www.wikidata.org/wiki/Q6556360","display_name":"Lipid bilayer fusion","level":3,"score":0.0},{"id":"https://openalex.org/C36289849","wikidata":"https://www.wikidata.org/wiki/Q34749","display_name":"Social science","level":1,"score":0.0},{"id":"https://openalex.org/C144024400","wikidata":"https://www.wikidata.org/wiki/Q21201","display_name":"Sociology","level":0,"score":0.0},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0},{"id":"https://openalex.org/C94625758","wikidata":"https://www.wikidata.org/wiki/Q7163","display_name":"Politics","level":2,"score":0.0},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.0},{"id":"https://openalex.org/C119599485","wikidata":"https://www.wikidata.org/wiki/Q43035","display_name":"Electrical engineering","level":1,"score":0.0},{"id":"https://openalex.org/C165801399","wikidata":"https://www.wikidata.org/wiki/Q25428","display_name":"Voltage","level":2,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tcsvt.2024.3391802","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tcsvt.2024.3391802","pdf_url":null,"source":{"id":"https://openalex.org/S115173108","display_name":"IEEE Transactions on Circuits and Systems for Video Technology","issn_l":"1051-8215","issn":["1051-8215","1558-2205"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Circuits and Systems for Video Technology","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2366631306","display_name":null,"funder_award_id":"62102205","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G564616603","display_name":null,"funder_award_id":"62202002","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G845944294","display_name":null,"funder_award_id":"62376004","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G849060900","display_name":null,"funder_award_id":"2208085J18","funder_id":"https://openalex.org/F4320334897","funder_display_name":"Natural Science Foundation of Anhui Province"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320334897","display_name":"Natural Science Foundation of Anhui Province","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":77,"referenced_works":["https://openalex.org/W1861492603","https://openalex.org/W2194775991","https://openalex.org/W2765667535","https://openalex.org/W2794744029","https://openalex.org/W2889054948","https://openalex.org/W2891033863","https://openalex.org/W2897436422","https://openalex.org/W2898200825","https://openalex.org/W2908510526","https://openalex.org/W2962766617","https://openalex.org/W2963188742","https://openalex.org/W2963905288","https://openalex.org/W2981851019","https://openalex.org/W2997131652","https://openalex.org/W2998027361","https://openalex.org/W2998756268","https://openalex.org/W3001584168","https://openalex.org/W3002567850","https://openalex.org/W3005080107","https://openalex.org/W3012425959","https://openalex.org/W3035020406","https://openalex.org/W3035652667","https://openalex.org/W3064498204","https://openalex.org/W3096609285","https://openalex.org/W3096831136","https://openalex.org/W3098092829","https://openalex.org/W3099671582","https://openalex.org/W3099681648","https://openalex.org/W3101990647","https://openalex.org/W3110562975","https://openalex.org/W3119686997","https://openalex.org/W3132864630","https://openalex.org/W3153607844","https://openalex.org/W3158472981","https://openalex.org/W3171106688","https://openalex.org/W3171516518","https://openalex.org/W3176724088","https://openalex.org/W3183152796","https://openalex.org/W3183904268","https://openalex.org/W3187284461","https://openalex.org/W3187310259","https://openalex.org/W3188267239","https://openalex.org/W3188427387","https://openalex.org/W3193319282","https://openalex.org/W3193488896","https://openalex.org/W3204221554","https://openalex.org/W3214116948","https://openalex.org/W4213019189","https://openalex.org/W4214624153","https://openalex.org/W4214736485","https://openalex.org/W4226089683","https://openalex.org/W4226126595","https://openalex.org/W4280526073","https://openalex.org/W4283808043","https://openalex.org/W4286974493","https://openalex.org/W4287556358","https://openalex.org/W4293523180","https://openalex.org/W4296425724","https://openalex.org/W4309800376","https://openalex.org/W4312651496","https://openalex.org/W4312668764","https://openalex.org/W4312671791","https://openalex.org/W4321195219","https://openalex.org/W4377971262","https://openalex.org/W4379929801","https://openalex.org/W4380884766","https://openalex.org/W4381894703","https://openalex.org/W4385245566","https://openalex.org/W4385686754","https://openalex.org/W4386057714","https://openalex.org/W4386071994","https://openalex.org/W4386075647","https://openalex.org/W6766904570","https://openalex.org/W6779590353","https://openalex.org/W6799063536","https://openalex.org/W6810827410","https://openalex.org/W6846689209"],"related_works":["https://openalex.org/W73545470","https://openalex.org/W4224266612","https://openalex.org/W2383394264","https://openalex.org/W4320153225","https://openalex.org/W4293261942","https://openalex.org/W3125968744","https://openalex.org/W203959209","https://openalex.org/W2110287964","https://openalex.org/W2167701463","https://openalex.org/W4307407935"],"abstract_inverted_index":{"Existing":[0],"Transformer-based":[1],"RGB-Thermal":[2],"(RGBT)":[3],"tracking":[4],"methods":[5],"either":[6],"use":[7,15],"cross-attention":[8,18,89],"to":[9,19,79,91,124,131],"fuse":[10],"the":[11,27,34,42,64,82,95,98,106,121,126,133],"two":[12,88],"modalities,":[13],"or":[14],"self-attention":[16,77],"and":[17,23,155],"model":[20],"both":[21],"modality-specific":[22,103],"modality-sharing":[24],"information.":[25],"However,":[26],"significant":[28],"appearance":[29],"gap":[30],"between":[31],"modalities":[32,40,100],"limits":[33],"feature":[35],"representation":[36,66,134],"ability":[37,135],"of":[38,97,128,136],"certain":[39],"during":[41],"fusion":[43],"process.":[44],"To":[45],"address":[46],"this":[47],"problem,":[48],"we":[49,111],"propose":[50,112],"a":[51,76,113,147],"novel":[52],"Progressive":[53],"Fusion":[54],"Transformer":[55],"called":[56],"ProFormer,":[57],"which":[58],"progressively":[59],"integrates":[60],"single-modality":[61],"information":[62,104],"into":[63],"multimodal":[65,83,107],"for":[67,101],"robust":[68],"RGBT":[69],"tracking.":[70],"In":[71,109],"particular,":[72],"ProFormer":[73,86,145],"first":[74],"uses":[75],"module":[78],"collaboratively":[80],"extract":[81],"representation.":[84,108],"Then,":[85],"introduces":[87],"modules":[90],"interact":[92],"it":[93],"with":[94],"features":[96],"dual":[99],"enhancing":[102],"in":[105],"addition,":[110],"dynamically":[114],"guided":[115],"learning":[116,127],"algorithm":[117],"that":[118,142],"adaptively":[119],"employs":[120],"well-performing":[122],"branches":[123],"guide":[125],"other":[129],"branches,":[130],"improve":[132],"each":[137],"branch.":[138],"Extensive":[139],"experiments":[140],"demonstrate":[141],"our":[143],"proposed":[144],"achieves":[146],"new":[148],"state-of-the-art":[149],"performance":[150],"on":[151],"RGBT210,":[152],"RGBT234,":[153],"LasHeR,":[154],"VTUAV":[156],"datasets.":[157]},"counts_by_year":[{"year":2026,"cited_by_count":1},{"year":2025,"cited_by_count":11},{"year":2024,"cited_by_count":3}],"updated_date":"2025-11-06T03:46:38.306776","created_date":"2025-10-10T00:00:00"}
