{"id":"https://openalex.org/W4414162864","doi":"https://doi.org/10.1109/tpami.2025.3609323","title":"Mask-DiFuser: A Masked Diffusion Model for Unified Unsupervised Image Fusion","display_name":"Mask-DiFuser: A Masked Diffusion Model for Unified Unsupervised Image Fusion","publication_year":2025,"publication_date":"2025-09-12","ids":{"openalex":"https://openalex.org/W4414162864","doi":"https://doi.org/10.1109/tpami.2025.3609323","pmid":"https://pubmed.ncbi.nlm.nih.gov/40938718"},"language":"en","primary_location":{"id":"doi:10.1109/tpami.2025.3609323","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3609323","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011864594","display_name":"Linfeng Tang","orcid":"https://orcid.org/0000-0002-8566-5743"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Linfeng Tang","raw_affiliation_strings":["Electronic Information School, Wuhan University, Wuhan, China"],"raw_orcid":"https://orcid.org/0000-0002-8566-5743","affiliations":[{"raw_affiliation_string":"Electronic Information School, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Chunyu Li","orcid":"https://orcid.org/0009-0009-0896-2961"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chunyu Li","raw_affiliation_strings":["Electronic Information School, Wuhan University, Wuhan, China"],"raw_orcid":"https://orcid.org/0009-0009-0896-2961","affiliations":[{"raw_affiliation_string":"Electronic Information School, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5040010053","display_name":"Jiayi Ma","orcid":"https://orcid.org/0000-0003-3264-3265"},"institutions":[{"id":"https://openalex.org/I37461747","display_name":"Wuhan University","ror":"https://ror.org/033vjfk17","country_code":"CN","type":"education","lineage":["https://openalex.org/I37461747"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jiayi Ma","raw_affiliation_strings":["Electronic Information School, Wuhan University, Wuhan, China"],"raw_orcid":"https://orcid.org/0000-0003-3264-3265","affiliations":[{"raw_affiliation_string":"Electronic Information School, Wuhan University, Wuhan, China","institution_ids":["https://openalex.org/I37461747"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5011864594"],"corresponding_institution_ids":["https://openalex.org/I37461747"],"apc_list":null,"apc_paid":null,"fwci":10.5136,"has_fulltext":false,"cited_by_count":11,"citation_normalized_percentile":{"value":0.9831684,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":95,"max":100},"biblio":{"volume":"48","issue":"1","first_page":"591","last_page":"608"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.995199978351593,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10688","display_name":"Image and Signal Denoising Methods","score":0.95660001039505,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.5989000201225281},{"id":"https://openalex.org/keywords/image-fusion","display_name":"Image fusion","score":0.5748999714851379},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5145999789237976},{"id":"https://openalex.org/keywords/encoder","display_name":"Encoder","score":0.5113999843597412},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.49230000376701355},{"id":"https://openalex.org/keywords/masking","display_name":"Masking (illustration)","score":0.4803999960422516},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.45820000767707825},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.4487000107765198},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.41290000081062317}],"concepts":[{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7473999857902527},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.746399998664856},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.5989000201225281},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.5748999714851379},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5145999789237976},{"id":"https://openalex.org/C118505674","wikidata":"https://www.wikidata.org/wiki/Q42586063","display_name":"Encoder","level":2,"score":0.5113999843597412},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.49230000376701355},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4837000072002411},{"id":"https://openalex.org/C2777402240","wikidata":"https://www.wikidata.org/wiki/Q6783436","display_name":"Masking (illustration)","level":2,"score":0.4803999960422516},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.45820000767707825},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.4487000107765198},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.41290000081062317},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.3815999925136566},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.3659999966621399},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.3605000078678131},{"id":"https://openalex.org/C146849305","wikidata":"https://www.wikidata.org/wiki/Q370766","display_name":"Ground truth","level":2,"score":0.35040000081062317},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.3368000090122223},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.32600000500679016},{"id":"https://openalex.org/C33954974","wikidata":"https://www.wikidata.org/wiki/Q486494","display_name":"Sensor fusion","level":2,"score":0.3246000111103058},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2930999994277954},{"id":"https://openalex.org/C2779304628","wikidata":"https://www.wikidata.org/wiki/Q3503480","display_name":"Face (sociological concept)","level":2,"score":0.2888999879360199},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.27970001101493835},{"id":"https://openalex.org/C9417928","wikidata":"https://www.wikidata.org/wiki/Q1070689","display_name":"Image processing","level":3,"score":0.27959999442100525},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2754000127315521},{"id":"https://openalex.org/C163716315","wikidata":"https://www.wikidata.org/wiki/Q901177","display_name":"Gaussian","level":2,"score":0.27379998564720154},{"id":"https://openalex.org/C57273362","wikidata":"https://www.wikidata.org/wiki/Q576722","display_name":"Decoding methods","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C189950617","wikidata":"https://www.wikidata.org/wiki/Q937228","display_name":"Property (philosophy)","level":2,"score":0.2615000009536743},{"id":"https://openalex.org/C83248878","wikidata":"https://www.wikidata.org/wiki/Q344000","display_name":"Active appearance model","level":3,"score":0.2605000138282776},{"id":"https://openalex.org/C8038995","wikidata":"https://www.wikidata.org/wiki/Q1152135","display_name":"Unsupervised learning","level":2,"score":0.25429999828338623}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tpami.2025.3609323","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tpami.2025.3609323","pdf_url":null,"source":{"id":"https://openalex.org/S199944782","display_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","issn_l":"0162-8828","issn":["0162-8828","1939-3539","2160-9292"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310320439","host_organization_name":"IEEE Computer Society","host_organization_lineage":["https://openalex.org/P4310320439","https://openalex.org/P4310319808"],"host_organization_lineage_names":["IEEE Computer Society","Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Pattern Analysis and Machine Intelligence","raw_type":"journal-article"},{"id":"pmid:40938718","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/40938718","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on pattern analysis and machine intelligence","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G415731887","display_name":null,"funder_award_id":"62276192","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":68,"referenced_works":["https://openalex.org/W1708141795","https://openalex.org/W1999034606","https://openalex.org/W2012893378","https://openalex.org/W2741137940","https://openalex.org/W2774839435","https://openalex.org/W2783573276","https://openalex.org/W2798987894","https://openalex.org/W2912147220","https://openalex.org/W2963037989","https://openalex.org/W2963530785","https://openalex.org/W2963787388","https://openalex.org/W2964060609","https://openalex.org/W2998012573","https://openalex.org/W3046194589","https://openalex.org/W3083574456","https://openalex.org/W3091503912","https://openalex.org/W3131111098","https://openalex.org/W3171420223","https://openalex.org/W3190808861","https://openalex.org/W3216987090","https://openalex.org/W4206713196","https://openalex.org/W4220893768","https://openalex.org/W4283732315","https://openalex.org/W4285600783","https://openalex.org/W4308310215","https://openalex.org/W4309730479","https://openalex.org/W4312440143","https://openalex.org/W4312594135","https://openalex.org/W4312740349","https://openalex.org/W4312804044","https://openalex.org/W4312827269","https://openalex.org/W4312933868","https://openalex.org/W4313156423","https://openalex.org/W4313267411","https://openalex.org/W4320717244","https://openalex.org/W4366352735","https://openalex.org/W4379741379","https://openalex.org/W4385271156","https://openalex.org/W4385848801","https://openalex.org/W4386065887","https://openalex.org/W4386083029","https://openalex.org/W4386179772","https://openalex.org/W4387682254","https://openalex.org/W4389195380","https://openalex.org/W4389491034","https://openalex.org/W4389722441","https://openalex.org/W4390578924","https://openalex.org/W4390660033","https://openalex.org/W4390727645","https://openalex.org/W4390872095","https://openalex.org/W4390872583","https://openalex.org/W4390872797","https://openalex.org/W4393148388","https://openalex.org/W4396621108","https://openalex.org/W4399717717","https://openalex.org/W4402215582","https://openalex.org/W4402704554","https://openalex.org/W4402715923","https://openalex.org/W4402774288","https://openalex.org/W4403235758","https://openalex.org/W4403791267","https://openalex.org/W4404520532","https://openalex.org/W4406362830","https://openalex.org/W4406891929","https://openalex.org/W4408648851","https://openalex.org/W4413157478","https://openalex.org/W4413158072","https://openalex.org/W4415795416"],"related_works":["https://openalex.org/W2386346147","https://openalex.org/W2016474688","https://openalex.org/W2392191343","https://openalex.org/W4231937131","https://openalex.org/W2357430536","https://openalex.org/W323219885","https://openalex.org/W2373946551","https://openalex.org/W2032636564","https://openalex.org/W2350275110","https://openalex.org/W2381578981"],"abstract_inverted_index":{"The":[0,184],"absence":[1,89],"of":[2,90],"ground":[3],"truth":[4],"(GT)":[5],"in":[6],"most":[7],"fusion":[8,20,30,57,65,196,209,225],"tasks":[9],"poses":[10],"significant":[11],"challenges":[12],"for":[13],"model":[14,108,158],"optimization,":[15],"evaluation,":[16],"and":[17,32,39,104,134,171,215],"generalization.":[18],"Existing":[19],"methods":[21],"achieving":[22],"complementary":[23,102,119,136],"context":[24,151],"aggregation":[25],"predominantly":[26],"rely":[27],"on":[28,176,207],"hand-crafted":[29],"rules":[31],"sophisticated":[33],"loss":[34],"functions,":[35],"which":[36,152],"introduce":[37],"subjectivity":[38],"often":[40],"fail":[41],"to":[42,44,100,109,132,148,179],"adapt":[43],"complex":[45],"real-world":[46],"scenarios.":[47],"To":[48],"address":[49],"this":[50],"challenge,":[51],"we":[52,94],"propose":[53],"Mask-DiFuser,":[54],"a":[55,68,80,96,106,143,160,168],"novel":[56],"paradigm":[58],"that":[59,195,220],"ingeniously":[60],"transforms":[61],"the":[62,88,156],"unsupervised":[63],"image":[64,71,77,217],"task":[66,73],"into":[67,155],"dual":[69,97],"masked":[70,76,115,185],"reconstruction":[72],"by":[74],"incorporating":[75],"modeling":[78],"with":[79,124,167,201],"diffusion":[81,107,157,186],"model,":[82,187],"overcoming":[83],"various":[84],"issues":[85],"arising":[86],"from":[87,113,190],"GT.":[91],"In":[92],"particular,":[93],"devise":[95],"masking":[98],"scheme":[99],"simulate":[101],"information":[103],"employ":[105],"restore":[110],"source":[111],"images":[112,178],"two":[114],"inputs,":[116],"thereby":[117],"aggregating":[118],"contexts.":[120],"A":[121],"content":[122,140],"encoder":[123,145],"an":[125],"attention":[126],"parallel":[127],"feature":[128],"mixer":[129],"is":[130,146,153],"deployed":[131],"extract":[133],"integrate":[135],"features,":[137],"offering":[138],"local":[139],"guidance.":[141],"Moreover,":[142],"semantic":[144],"developed":[147],"supply":[149],"global":[150],"integrated":[154],"via":[159],"cross-attention":[161],"mechanism.":[162],"During":[163],"inference,":[164],"Mask-DiFuser":[165,221],"begins":[166],"Gaussian":[169],"distribution":[170],"iteratively":[172],"denoises":[173],"it":[174],"conditioned":[175],"multi-source":[177],"directly":[180],"generate":[181],"fused":[182],"images.":[183],"learning":[188],"priors":[189],"high-quality":[191],"natural":[192],"images,":[193],"ensures":[194],"results":[197],"align":[198],"more":[199],"closely":[200],"human":[202],"visual":[203],"perception.":[204],"Extensive":[205],"experiments":[206],"several":[208],"tasks,":[210],"including":[211],"infrared-visible,":[212],"medical,":[213],"multi-exposure,":[214],"multi-focus":[216],"fusion,":[218],"demonstrate":[219],"significantly":[222],"outshines":[223],"SOTA":[224],"alternatives.":[226]},"counts_by_year":[{"year":2026,"cited_by_count":9},{"year":2025,"cited_by_count":2}],"updated_date":"2026-05-14T08:36:36.166977","created_date":"2025-10-10T00:00:00"}
