{"id":"https://openalex.org/W4414603268","doi":"https://doi.org/10.1109/lra.2025.3615529","title":"Semantic-Guided Illumination-Aware Deformable Transformer for RGB-T Object Detection","display_name":"Semantic-Guided Illumination-Aware Deformable Transformer for RGB-T Object Detection","publication_year":2025,"publication_date":"2025-09-29","ids":{"openalex":"https://openalex.org/W4414603268","doi":"https://doi.org/10.1109/lra.2025.3615529"},"language":"en","primary_location":{"id":"doi:10.1109/lra.2025.3615529","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2025.3615529","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101664660","display_name":"Yanhao Liu","orcid":"https://orcid.org/0009-0003-8706-5543"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Yanhao Liu","raw_affiliation_strings":["School of Mechanical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0003-8706-5543","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Zhuo Chen","orcid":"https://orcid.org/0009-0003-4351-6349"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Zhuo Chen","raw_affiliation_strings":["School of Mechanical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0009-0003-4351-6349","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100609886","display_name":"Chuan Hu","orcid":"https://orcid.org/0000-0001-5379-1561"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chuan Hu","raw_affiliation_strings":["School of Mechanical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-5379-1561","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100747108","display_name":"Shengbo Eben Li","orcid":"https://orcid.org/0000-0003-4923-3633"},"institutions":[{"id":"https://openalex.org/I99065089","display_name":"Tsinghua University","ror":"https://ror.org/03cve4549","country_code":"CN","type":"education","lineage":["https://openalex.org/I99065089"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shengbo Eben Li","raw_affiliation_strings":["State Key Lab of Automotive Safety and Energy, School of Vehicle and Mobility, Tsinghua University, Beijing, China"],"raw_orcid":"https://orcid.org/0000-0003-4923-3633","affiliations":[{"raw_affiliation_string":"State Key Lab of Automotive Safety and Energy, School of Vehicle and Mobility, Tsinghua University, Beijing, China","institution_ids":["https://openalex.org/I99065089"]}]},{"author_position":"last","author":{"id":null,"display_name":"Xi Zhang","orcid":"https://orcid.org/0000-0001-8909-2201"},"institutions":[{"id":"https://openalex.org/I183067930","display_name":"Shanghai Jiao Tong University","ror":"https://ror.org/0220qvk04","country_code":"CN","type":"education","lineage":["https://openalex.org/I183067930"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xi Zhang","raw_affiliation_strings":["School of Mechanical Engineering, Shanghai Jiao Tong University, Shanghai, China"],"raw_orcid":"https://orcid.org/0000-0001-8909-2201","affiliations":[{"raw_affiliation_string":"School of Mechanical Engineering, Shanghai Jiao Tong University, Shanghai, China","institution_ids":["https://openalex.org/I183067930"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5101664660"],"corresponding_institution_ids":["https://openalex.org/I183067930"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.36163558,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"10","issue":"11","first_page":"11936","last_page":"11943"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9815999865531921,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12111","display_name":"Industrial Vision Systems and Defect Detection","score":0.9815999865531921,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11666","display_name":"Color Science and Applications","score":0.9656999707221985,"subfield":{"id":"https://openalex.org/subfields/3107","display_name":"Atomic and Molecular Physics, and Optics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11992","display_name":"CCD and CMOS Imaging Sensors","score":0.9598000049591064,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.6664999723434448},{"id":"https://openalex.org/keywords/transformer","display_name":"Transformer","score":0.6334999799728394},{"id":"https://openalex.org/keywords/rgb-color-model","display_name":"RGB color model","score":0.6049000024795532},{"id":"https://openalex.org/keywords/object-detection","display_name":"Object detection","score":0.5580000281333923},{"id":"https://openalex.org/keywords/sensor-fusion","display_name":"Sensor fusion","score":0.4408999979496002},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.36809998750686646}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6855000257492065},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.6664999723434448},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.6398000121116638},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.6363000273704529},{"id":"https://openalex.org/C66322947","wikidata":"https://www.wikidata.org/wiki/Q11658","display_name":"Transformer","level":3,"score":0.6334999799728394},{"id":"https://openalex.org/C82990744","wikidata":"https://www.wikidata.org/wiki/Q166194","display_name":"RGB color model","level":2,"score":0.6049000024795532},{"id":"https://openalex.org/C2776151529","wikidata":"https://www.wikidata.org/wiki/Q3045304","display_name":"Object detection","level":3,"score":0.5580000281333923},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.4408999979496002},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.36809998750686646},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.35420000553131104},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.3246000111103058},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.31450000405311584},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.2809999883174896},{"id":"https://openalex.org/C94915269","wikidata":"https://www.wikidata.org/wiki/Q1834857","display_name":"Detector","level":2,"score":0.25220000743865967}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/lra.2025.3615529","is_oa":false,"landing_page_url":"https://doi.org/10.1109/lra.2025.3615529","pdf_url":null,"source":{"id":"https://openalex.org/S4210169774","display_name":"IEEE Robotics and Automation Letters","issn_l":"2377-3766","issn":["2377-3766"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Robotics and Automation Letters","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G8787995571","display_name":null,"funder_award_id":"52177218","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":26,"referenced_works":["https://openalex.org/W1910108985","https://openalex.org/W2119112357","https://openalex.org/W2608096492","https://openalex.org/W2741620214","https://openalex.org/W2791779647","https://openalex.org/W2889480448","https://openalex.org/W2963188557","https://openalex.org/W2963579094","https://openalex.org/W2964027659","https://openalex.org/W2987131085","https://openalex.org/W3039479109","https://openalex.org/W3106149304","https://openalex.org/W3116967329","https://openalex.org/W3138516171","https://openalex.org/W3164576087","https://openalex.org/W3186570689","https://openalex.org/W3209002923","https://openalex.org/W4220724622","https://openalex.org/W4312594135","https://openalex.org/W4312960790","https://openalex.org/W4323022579","https://openalex.org/W4366378409","https://openalex.org/W4377971464","https://openalex.org/W4386189887","https://openalex.org/W4390874817","https://openalex.org/W4402915974"],"related_works":[],"abstract_inverted_index":{"RGB-T":[0,20,72,150],"object":[1,151],"detection":[2,73,152],"in":[3,10,168,174],"autonomous":[4],"driving":[5],"has":[6,146],"been":[7,147],"researched":[8],"increasingly":[9],"recent":[11],"years.":[12],"Nevertheless,":[13],"several":[14],"problems":[15],"limit":[16],"the":[17,35,67,78,103,136,183,194,197,201],"performance":[18,199],"of":[19,37,163,172,193,200],"fusion":[21,33,62,89,96,100,126,137],"perception.":[22],"Initially,":[23],"although":[24],"illumination":[25,80,88],"awareness":[26],"is":[27,75,83,109,132],"a":[28,60,70,140],"mature":[29],"technology":[30],"to":[31,58,85,98,111,123,134,186],"guide":[32,99],"process,":[34],"outputs":[36],"previous":[38],"methods":[39],"lack":[40],"sufficient":[41,87],"semantic":[42,79],"detail.":[43],"What's":[44],"more,":[45],"RGB":[46,113],"and":[47,94,114,155,160,170],"thermal":[48,115],"modalities":[49],"have":[50],"severe":[51],"imbalance":[52],"problems,":[53,69],"which":[54,91],"makes":[55],"it":[56],"difficult":[57],"generate":[59],"well-performed":[61,125],"modality.":[63,142],"Thus,":[64],"concerned":[65],"about":[66],"above":[68],"novel":[71],"network":[74,145],"proposed.":[76],"Firstly,":[77],"extraction":[81],"module":[82,108,118],"proposed":[84,144,202],"produce":[86],"weights,":[90],"contain":[92],"global-level":[93],"semantic-level":[95],"weights":[97],"process.":[101],"Secondly,":[102],"multi-modal":[104,130],"illumination-guided":[105,129],"deformable":[106],"transformer":[107],"designed":[110],"aggregate":[112],"modalities.":[116],"The":[117,143,191],"implements":[119],"fusion-modality":[120],"query":[121],"initiation":[122],"obtain":[124],"queries.":[127],"Then":[128],"aggregation":[131],"utilized":[133],"refine":[135],"queries":[138],"with":[139],"single":[141],"tested":[148],"on":[149],"datasets,":[153],"KAIST":[154,169],"<inline-formula":[156,164,175],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[157,165,176],"xmlns:xlink=\"http://www.w3.org/1999/xlink\"><tex-math":[158,166,177],"notation=\"LaTeX\">$M^{3}FD$</tex-math></inline-formula>,":[159],"achieved":[161],"7.44%":[162],"notation=\"LaTeX\">$MR^{-2}$</tex-math></inline-formula>":[167],"80.0%":[171],"mAP":[173],"notation=\"LaTeX\">$M^{3}FD$</tex-math></inline-formula>":[178],"separately.":[179],"Meanwhile,":[180],"we":[181],"implement":[182],"real-time":[184],"test":[185],"evaluate":[187],"its":[188],"practical":[189],"feasibility.":[190],"results":[192],"experiment":[195],"demonstrate":[196],"superior":[198],"method.":[203]},"counts_by_year":[],"updated_date":"2026-01-30T23:17:42.513302","created_date":"2025-10-10T00:00:00"}
