{"id":"https://openalex.org/W4408125035","doi":"https://doi.org/10.1109/tetci.2025.3542146","title":"MSDT: Multiscale Diffusion Transformer for Multimodality Image Fusion","display_name":"MSDT: Multiscale Diffusion Transformer for Multimodality Image Fusion","publication_year":2025,"publication_date":"2025-03-03","ids":{"openalex":"https://openalex.org/W4408125035","doi":"https://doi.org/10.1109/tetci.2025.3542146"},"language":"en","primary_location":{"id":"doi:10.1109/tetci.2025.3542146","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tetci.2025.3542146","pdf_url":null,"source":{"id":"https://openalex.org/S4210210251","display_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","issn_l":"2471-285X","issn":["2471-285X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Caifeng Xia","orcid":"https://orcid.org/0009-0005-4641-7826"},"institutions":[{"id":"https://openalex.org/I116036724","display_name":"Shenyang Ligong University","ror":"https://ror.org/03m20nr07","country_code":"CN","type":"education","lineage":["https://openalex.org/I116036724"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Caifeng Xia","raw_affiliation_strings":["Graduate School, Shenyang Ligong University, Shenyang, China"],"raw_orcid":"https://orcid.org/0009-0005-4641-7826","affiliations":[{"raw_affiliation_string":"Graduate School, Shenyang Ligong University, Shenyang, China","institution_ids":["https://openalex.org/I116036724"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101574121","display_name":"Hongwei Gao","orcid":"https://orcid.org/0000-0002-7666-2970"},"institutions":[{"id":"https://openalex.org/I116036724","display_name":"Shenyang Ligong University","ror":"https://ror.org/03m20nr07","country_code":"CN","type":"education","lineage":["https://openalex.org/I116036724"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongwei Gao","raw_affiliation_strings":["School of Automation and Electrical Engineering, Shenyang Ligong University, Shenyang, China"],"raw_orcid":"https://orcid.org/0000-0002-7666-2970","affiliations":[{"raw_affiliation_string":"School of Automation and Electrical Engineering, Shenyang Ligong University, Shenyang, China","institution_ids":["https://openalex.org/I116036724"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100709268","display_name":"Wei Yang","orcid":"https://orcid.org/0000-0003-0178-7135"},"institutions":[{"id":"https://openalex.org/I116036724","display_name":"Shenyang Ligong University","ror":"https://ror.org/03m20nr07","country_code":"CN","type":"education","lineage":["https://openalex.org/I116036724"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Wei Yang","raw_affiliation_strings":["Graduate School, Shenyang Ligong University, Shenyang, China"],"raw_orcid":"https://orcid.org/0000-0003-0178-7135","affiliations":[{"raw_affiliation_string":"Graduate School, Shenyang Ligong University, Shenyang, China","institution_ids":["https://openalex.org/I116036724"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5001205723","display_name":"Jiahui Yu","orcid":"https://orcid.org/0000-0003-1314-2481"},"institutions":[{"id":"https://openalex.org/I76130692","display_name":"Zhejiang University","ror":"https://ror.org/00a2xv884","country_code":"CN","type":"education","lineage":["https://openalex.org/I76130692"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiahui Yu","raw_affiliation_strings":["Department of Biomedical Engineering, MOE Key Laboratory of Biomedical Engineering, State Key Laboratory of Extreme Photonics and Instrumentation, Zhejiang Provincial Key Laboratory of CardioCerebral Vascular Detection Technology and Medicinal Effectiveness Appraisal, Zhejiang University, Hangzhou, China"],"raw_orcid":"https://orcid.org/0000-0003-1314-2481","affiliations":[{"raw_affiliation_string":"Department of Biomedical Engineering, MOE Key Laboratory of Biomedical Engineering, State Key Laboratory of Extreme Photonics and Instrumentation, Zhejiang Provincial Key Laboratory of CardioCerebral Vascular Detection Technology and Medicinal Effectiveness Appraisal, Zhejiang University, Hangzhou, China","institution_ids":["https://openalex.org/I76130692"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I116036724"],"apc_list":null,"apc_paid":null,"fwci":5.2653,"has_fulltext":false,"cited_by_count":6,"citation_normalized_percentile":{"value":0.95266796,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":99},"biblio":{"volume":"9","issue":"3","first_page":"2269","last_page":"2283"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.9975000023841858,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.9684000015258789,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/multimodality","display_name":"Multimodality","score":0.8334842920303345},{"id":"https://openalex.org/keywords/image-fusion","display_name":"Image fusion","score":0.460932195186615},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.3892560601234436},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.34682148694992065},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.3170582056045532},{"id":"https://openalex.org/keywords/world-wide-web","display_name":"World Wide Web","score":0.06856310367584229}],"concepts":[{"id":"https://openalex.org/C2780910867","wikidata":"https://www.wikidata.org/wiki/Q1952416","display_name":"Multimodality","level":2,"score":0.8334842920303345},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.460932195186615},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3892560601234436},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.34682148694992065},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.3170582056045532},{"id":"https://openalex.org/C136764020","wikidata":"https://www.wikidata.org/wiki/Q466","display_name":"World Wide Web","level":1,"score":0.06856310367584229}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/tetci.2025.3542146","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tetci.2025.3542146","pdf_url":null,"source":{"id":"https://openalex.org/S4210210251","display_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","issn_l":"2471-285X","issn":["2471-285X"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Emerging Topics in Computational Intelligence","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":51,"referenced_works":["https://openalex.org/W2809795042","https://openalex.org/W2912147220","https://openalex.org/W2950648852","https://openalex.org/W2998529071","https://openalex.org/W3011768656","https://openalex.org/W3030921250","https://openalex.org/W3046194589","https://openalex.org/W3102911434","https://openalex.org/W3108042295","https://openalex.org/W3159235206","https://openalex.org/W3207918547","https://openalex.org/W3215723718","https://openalex.org/W4211151538","https://openalex.org/W4220893768","https://openalex.org/W4224256886","https://openalex.org/W4283732315","https://openalex.org/W4285600783","https://openalex.org/W4286361941","https://openalex.org/W4292851041","https://openalex.org/W4308310215","https://openalex.org/W4310461873","https://openalex.org/W4312052673","https://openalex.org/W4312250205","https://openalex.org/W4312594135","https://openalex.org/W4312933868","https://openalex.org/W4313555022","https://openalex.org/W4319069103","https://openalex.org/W4319663704","https://openalex.org/W4362496246","https://openalex.org/W4367147113","https://openalex.org/W4376126900","https://openalex.org/W4376131895","https://openalex.org/W4382119107","https://openalex.org/W4385800876","https://openalex.org/W4386075910","https://openalex.org/W4386076504","https://openalex.org/W4387682254","https://openalex.org/W4390872797","https://openalex.org/W4391128328","https://openalex.org/W4393148430","https://openalex.org/W4393379613","https://openalex.org/W4394595838","https://openalex.org/W4400132802","https://openalex.org/W6679045638","https://openalex.org/W6765775151","https://openalex.org/W6779823529","https://openalex.org/W6784333009","https://openalex.org/W6796588791","https://openalex.org/W6838327568","https://openalex.org/W6838452192","https://openalex.org/W6847038466"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W4205899436","https://openalex.org/W2462138927","https://openalex.org/W3111427900","https://openalex.org/W2373946551","https://openalex.org/W2032636564","https://openalex.org/W2350275110","https://openalex.org/W2381578981"],"abstract_inverted_index":{"Multimodal":[0],"image":[1,196],"fusion":[2,32,66,81,122],"is":[3],"a":[4,15,79,86,91,96,105,119,133,142],"vital":[5],"technique":[6],"that":[7,83,161],"integrates":[8],"images":[9,103],"from":[10],"various":[11],"sensors":[12],"to":[13,44,64,100,136,145],"create":[14],"comprehensive":[16],"and":[17,27,54,127,141,182],"coherent":[18],"representation,":[19,38],"with":[20,35,90,191],"broad":[21],"applications":[22],"in":[23],"surveillance,":[24],"medical":[25],"imaging,":[26],"autonomous":[28],"driving.":[29],"However,":[30],"current":[31],"methods":[33,166],"struggle":[34],"inadequate":[36],"feature":[37,121],"limited":[39],"global":[40],"context":[41],"understanding":[42],"due":[43],"the":[45,55,74,185],"small":[46],"receptive":[47],"fields":[48],"of":[49,57,61,175,187],"convolutional":[50],"neural":[51],"networks":[52],"(CNNs),":[53],"loss":[56],"high-frequency":[58,139],"information,":[59],"all":[60],"which":[62],"lead":[63],"suboptimal":[65],"quality.":[67],"To":[68],"address":[69],"these":[70],"challenges,":[71],"we":[72],"propose":[73],"Multi-Scale":[75],"Diffusion":[76],"Transformer":[77],"(MSDT),":[78],"novel":[80],"framework":[82],"seamlessly":[84],"combines":[85],"latent":[87,107],"diffusion":[88,189],"model":[89],"transformer-based":[92],"architecture.":[93],"MSDT":[94,131,162,178],"uses":[95],"perceptual":[97],"compression":[98],"network":[99],"encode":[101],"source":[102],"into":[104],"low-dimensional":[106],"space,":[108],"reducing":[109],"computational":[110],"complexity":[111],"while":[112],"preserving":[113],"essential":[114],"features.":[115],"It":[116],"also":[117],"incorporates":[118],"multiscale":[120],"mechanism,":[123],"enhancing":[124],"both":[125],"detail":[126],"structural":[128],"understanding.":[129,154],"Additionally,":[130],"features":[132,140,149],"self-attention":[134],"module":[135,144],"extract":[137],"unique":[138],"cross-attention":[143],"identify":[146],"common":[147],"low-frequency":[148],"across":[150,167],"modalities,":[151],"improving":[152],"contextual":[153],"Extensive":[155],"experiments":[156],"on":[157],"three":[158],"datasets":[159],"show":[160],"significantly":[163],"outperforms":[164],"state-of-the-art":[165],"twelve":[168],"evaluation":[169],"metrics,":[170],"achieving":[171],"an":[172],"SSIM":[173],"score":[174],"0.98.":[176],"Moreover,":[177],"demonstrates":[179],"superior":[180],"robustness":[181],"generalizability,":[183],"highlighting":[184],"potential":[186],"integrating":[188],"models":[190],"transformer":[192],"architectures":[193],"for":[194],"multimodal":[195],"fusion.":[197]},"counts_by_year":[{"year":2026,"cited_by_count":3},{"year":2025,"cited_by_count":3}],"updated_date":"2026-06-08T08:47:23.578185","created_date":"2025-10-10T00:00:00"}
