{"id":"https://openalex.org/W4413465567","doi":"https://doi.org/10.1109/tmm.2025.3599020","title":"Fusion-Mamba for Cross-Modality Object Detection","display_name":"Fusion-Mamba for Cross-Modality Object Detection","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4413465567","doi":"https://doi.org/10.1109/tmm.2025.3599020"},"language":"en","primary_location":{"id":"doi:10.1109/tmm.2025.3599020","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3599020","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Wenhao Dong","orcid":"https://orcid.org/0009-0004-4921-1834"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Wenhao Dong","raw_affiliation_strings":["School of Astronautics, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Astronautics, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Haodong Zhu","orcid":"https://orcid.org/0009-0008-2569-4965"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haodong Zhu","raw_affiliation_strings":["School of Artificial Intelligence, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043643513","display_name":"Shaohui Lin","orcid":"https://orcid.org/0000-0003-0284-9940"},"institutions":[{"id":"https://openalex.org/I66867065","display_name":"East China Normal University","ror":"https://ror.org/02n96ep67","country_code":"CN","type":"education","lineage":["https://openalex.org/I66867065"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shaohui Lin","raw_affiliation_strings":["School of Computer Science and Technology, East China Normal University, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"School of Computer Science and Technology, East China Normal University, Shanghai, China","institution_ids":["https://openalex.org/I66867065"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072050541","display_name":"Xiaoyan Luo","orcid":"https://orcid.org/0000-0002-7256-4329"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xiaoyan Luo","raw_affiliation_strings":["School of Astronautics, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Astronautics, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5039883116","display_name":"Yunhang Shen","orcid":"https://orcid.org/0000-0002-3970-7519"},"institutions":[{"id":"https://openalex.org/I2250653659","display_name":"Tencent (China)","ror":"https://ror.org/00hhjss72","country_code":"CN","type":"company","lineage":["https://openalex.org/I2250653659"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yunhang Shen","raw_affiliation_strings":["Tencent Youtu Lab, Shanghai, China"],"affiliations":[{"raw_affiliation_string":"Tencent Youtu Lab, Shanghai, China","institution_ids":["https://openalex.org/I2250653659"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5085022758","display_name":"Guodong Guo","orcid":"https://orcid.org/0000-0001-9583-0055"},"institutions":[{"id":"https://openalex.org/I4394709157","display_name":"Eastern Institute of Technology, Ningbo","ror":"https://ror.org/036mbz113","country_code":null,"type":"education","lineage":["https://openalex.org/I4394709157"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Guodong Guo","raw_affiliation_strings":["Ningbo Institute of Digital Twin, Eastern Institute of Technology, Ningbo, China"],"affiliations":[{"raw_affiliation_string":"Ningbo Institute of Digital Twin, Eastern Institute of Technology, Ningbo, China","institution_ids":["https://openalex.org/I4394709157"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5015525872","display_name":"Baochang Zhang","orcid":"https://orcid.org/0000-0001-7396-6218"},"institutions":[{"id":"https://openalex.org/I82880672","display_name":"Beihang University","ror":"https://ror.org/00wk2mp56","country_code":"CN","type":"education","lineage":["https://openalex.org/I82880672"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Baochang Zhang","raw_affiliation_strings":["School of Artificial Intelligence, Beihang University, Beijing, China"],"affiliations":[{"raw_affiliation_string":"School of Artificial Intelligence, Beihang University, Beijing, China","institution_ids":["https://openalex.org/I82880672"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I82880672"],"apc_list":null,"apc_paid":null,"fwci":39.1694,"has_fulltext":false,"cited_by_count":33,"citation_normalized_percentile":{"value":0.99854967,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":"27","issue":null,"first_page":"7392","last_page":"7406"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9614999890327454,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.9614999890327454,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11398","display_name":"Hand Gesture Recognition Systems","score":0.9021000266075134,"subfield":{"id":"https://openalex.org/subfields/1709","display_name":"Human-Computer Interaction"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7808727025985718},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6318957805633545},{"id":"https://openalex.org/keywords/object","display_name":"Object (grammar)","score":0.4789624512195587},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.3839852809906006}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7808727025985718},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6318957805633545},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.4789624512195587},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3839852809906006}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tmm.2025.3599020","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tmm.2025.3599020","pdf_url":null,"source":{"id":"https://openalex.org/S137030581","display_name":"IEEE Transactions on Multimedia","issn_l":"1520-9210","issn":["1520-9210","1941-0077"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Multimedia","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2312352739","display_name":null,"funder_award_id":"L223024","funder_id":"https://openalex.org/F4320322919","funder_display_name":"Natural Science Foundation of Beijing Municipality"},{"id":"https://openalex.org/G3010619704","display_name":null,"funder_award_id":"L244043","funder_id":"https://openalex.org/F4320322919","funder_display_name":"Natural Science Foundation of Beijing Municipality"},{"id":"https://openalex.org/G4391473945","display_name":null,"funder_award_id":"KLATASDS2305","funder_id":"https://openalex.org/F4320312071","funder_display_name":"Ministry of Education, Libya"},{"id":"https://openalex.org/G5437778857","display_name":null,"funder_award_id":"62102151","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G6586239910","display_name":null,"funder_award_id":"Z241100001324017","funder_id":"https://openalex.org/F4320322919","funder_display_name":"Natural Science Foundation of Beijing Municipality"}],"funders":[{"id":"https://openalex.org/F4320312071","display_name":"Ministry of Education, Libya","ror":"https://ror.org/02w030k33"},{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320322919","display_name":"Natural Science Foundation of Beijing Municipality","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":78,"referenced_works":["https://openalex.org/W2194775991","https://openalex.org/W2765811365","https://openalex.org/W2798987894","https://openalex.org/W2912147220","https://openalex.org/W2963037989","https://openalex.org/W2963188557","https://openalex.org/W2963351448","https://openalex.org/W2963579094","https://openalex.org/W2964241181","https://openalex.org/W2965912241","https://openalex.org/W2970929725","https://openalex.org/W2987131085","https://openalex.org/W2990546238","https://openalex.org/W2997889428","https://openalex.org/W3035467948","https://openalex.org/W3036931590","https://openalex.org/W3046194589","https://openalex.org/W3094502228","https://openalex.org/W3096609285","https://openalex.org/W3114651545","https://openalex.org/W3118570274","https://openalex.org/W3138516171","https://openalex.org/W3158128549","https://openalex.org/W3171950886","https://openalex.org/W3190808861","https://openalex.org/W3207919963","https://openalex.org/W3209478434","https://openalex.org/W3213472242","https://openalex.org/W4220724622","https://openalex.org/W4220893768","https://openalex.org/W4224315825","https://openalex.org/W4246193833","https://openalex.org/W4304080362","https://openalex.org/W4304080855","https://openalex.org/W4308310215","https://openalex.org/W4312440143","https://openalex.org/W4312594135","https://openalex.org/W4312596062","https://openalex.org/W4312750622","https://openalex.org/W4312950730","https://openalex.org/W4313007055","https://openalex.org/W4313065862","https://openalex.org/W4313267411","https://openalex.org/W4317496152","https://openalex.org/W4319866558","https://openalex.org/W4366352735","https://openalex.org/W4366378409","https://openalex.org/W4367663172","https://openalex.org/W4367721788","https://openalex.org/W4376106313","https://openalex.org/W4379528676","https://openalex.org/W4385245566","https://openalex.org/W4385801610","https://openalex.org/W4386038403","https://openalex.org/W4386076504","https://openalex.org/W4386083115","https://openalex.org/W4386189887","https://openalex.org/W4387968049","https://openalex.org/W4387968493","https://openalex.org/W4390659919","https://openalex.org/W4391461226","https://openalex.org/W4391849436","https://openalex.org/W4391974567","https://openalex.org/W4392523614","https://openalex.org/W4392796741","https://openalex.org/W4392824656","https://openalex.org/W4392939416","https://openalex.org/W4393171245","https://openalex.org/W4398760112","https://openalex.org/W4399375400","https://openalex.org/W4399801051","https://openalex.org/W4399881535","https://openalex.org/W4400391271","https://openalex.org/W4400519485","https://openalex.org/W4400975112","https://openalex.org/W4402775842","https://openalex.org/W4403602501","https://openalex.org/W4414243662"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2385859805","https://openalex.org/W2530972254","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109"],"abstract_inverted_index":{"Cross-modality":[0],"object":[1,46,187],"detection":[2,47],"aims":[3],"to":[4,11,44,86],"fuse":[5],"complementary":[6],"information":[7,144],"from":[8],"different":[9],"modalities":[10],"improve":[12],"model":[13,41],"performance,":[14],"which":[15,39,122,136],"achieves":[16],"a":[17,54,64,74,91,182,190],"wider":[18],"range":[19],"of":[20,36,126,158,176],"applications.":[21],"However,":[22],"traditional":[23],"cross-modality":[24,56,186],"fusion":[25,57,125,139],"methods,":[26],"based":[27,68],"on":[28,69,102,164],"CNN":[29],"or":[30],"Transformer,":[31],"inadequately":[32],"address":[33],"the":[34,80,99,124,146,174],"issue":[35],"pseudo-target":[37,143],"information,":[38],"causes":[40],"attention":[42,76,101],"dispersion":[43],"degrade":[45],"performance.":[48,109],"In":[49],"this":[50,179,197],"paper,":[51],"we":[52],"investigate":[53],"novel":[55],"approach":[58],"by":[59],"associating":[60],"cross-modal":[61,88],"features":[62,89],"in":[63,196],"hidden":[65,92,147],"state":[66,93,148],"space":[67,94],"an":[70],"improved":[71],"Mamba":[72],"with":[73],"gating":[75],"mechanism.":[77],"We":[78],"propose":[79],"<italic":[81],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[82,166],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">Fusion-Mamba":[83],"Block</i>(FMB),":[84],"designed":[85],"map":[87],"into":[90],"for":[95,185,193],"interaction,":[96],"thereby":[97],"refining":[98],"model\u2019s":[100],"true":[103],"target":[104],"areas":[105],"and":[106,129,140,161,170],"enhancing":[107],"overall":[108],"The":[110],"FMB":[111],"comprises":[112],"two":[113],"key":[114],"modules:":[115],"State":[116,131],"Space":[117,132],"Channel":[118],"Swapping":[119],"(SSCS)":[120],"module,":[121,135],"facilitates":[123],"shallow":[127],"features,":[128],"Dual":[130],"Fusion":[133],"(DSSF)":[134],"enables":[137],"deep":[138],"effectively":[141],"suppresses":[142],"within":[145],"space.":[149],"Our":[150],"proposed":[151],"method":[152],"outperforms":[153],"state-of-the-art":[154],"approaches,":[155],"achieving":[156],"improvements":[157],"5.9%,":[159],"3.5%":[160],"2.1%":[162],"mAP":[163],"<inline-formula":[165],"xmlns:xlink=\"http://www.w3.org/1999/xlink\"><tex-math":[167],"notation=\"LaTeX\">$M^{3}$</tex-math></inline-formula>FD,":[168],"DroneVehicle":[169],"FLIR-Aligned,":[171],"respectively.":[172],"To":[173],"best":[175],"our":[177],"knowledge,":[178],"work":[180],"establishes":[181],"new":[183],"baseline":[184],"detection,":[188],"providing":[189],"robust":[191],"foundation":[192],"future":[194],"research":[195],"area.":[198]},"counts_by_year":[{"year":2026,"cited_by_count":19},{"year":2025,"cited_by_count":14}],"updated_date":"2026-04-15T08:11:43.952461","created_date":"2025-10-10T00:00:00"}
