{"id":"https://openalex.org/W4414934240","doi":"https://doi.org/10.1109/tip.2025.3615680","title":"MVFusion: Generative Representation Learning With Masked Variational Autoencoders for Multi-Modality Image Fusion","display_name":"MVFusion: Generative Representation Learning With Masked Variational Autoencoders for Multi-Modality Image Fusion","publication_year":2025,"publication_date":"2025-01-01","ids":{"openalex":"https://openalex.org/W4414934240","doi":"https://doi.org/10.1109/tip.2025.3615680","pmid":"https://pubmed.ncbi.nlm.nih.gov/41052155"},"language":"en","primary_location":{"id":"doi:10.1109/tip.2025.3615680","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2025.3615680","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},"type":"article","indexed_in":["crossref","pubmed"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5004773195","display_name":"Jingwei Xin","orcid":"https://orcid.org/0000-0001-9551-6007"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Jingwei Xin","raw_affiliation_strings":["State Key Laboratory of Integrated Services Networks, School of Telecommunications Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Integrated Services Networks, School of Telecommunications Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103604735","display_name":"Breanna Shi","orcid":null},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Boneng Shi","raw_affiliation_strings":["State Key Laboratory of Integrated Services Networks, School of Telecommunications Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Integrated Services Networks, School of Telecommunications Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Nannan Wang","orcid":"https://orcid.org/0000-0002-4695-6134"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Nannan Wang","raw_affiliation_strings":["State Key Laboratory of Integrated Services Networks, School of Telecommunications Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"State Key Laboratory of Integrated Services Networks, School of Telecommunications Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Jie Li","orcid":"https://orcid.org/0000-0001-7950-4233"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jie Li","raw_affiliation_strings":["School of Electronic Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I149594827"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5101785348","display_name":"Xinbo Gao","orcid":"https://orcid.org/0000-0002-7985-0037"},"institutions":[{"id":"https://openalex.org/I149594827","display_name":"Xidian University","ror":"https://ror.org/05s92vm98","country_code":"CN","type":"education","lineage":["https://openalex.org/I149594827"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xinbo Gao","raw_affiliation_strings":["School of Electronic Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China"],"affiliations":[{"raw_affiliation_string":"School of Electronic Engineering, Xidian University, Xi&#x2019;an, Shaanxi, China","institution_ids":["https://openalex.org/I149594827"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5004773195"],"corresponding_institution_ids":["https://openalex.org/I149594827"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.26761865,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":"34","issue":null,"first_page":"6418","last_page":"6431"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9796000123023987,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10824","display_name":"Image Retrieval and Classification Techniques","score":0.9796000123023987,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11659","display_name":"Advanced Image Fusion Techniques","score":0.9269999861717224,"subfield":{"id":"https://openalex.org/subfields/2214","display_name":"Media Technology"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14339","display_name":"Image Processing and 3D Reconstruction","score":0.909600019454956,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/autoencoder","display_name":"Autoencoder","score":0.8083999752998352},{"id":"https://openalex.org/keywords/feature-learning","display_name":"Feature learning","score":0.635200023651123},{"id":"https://openalex.org/keywords/generative-grammar","display_name":"Generative grammar","score":0.6122999787330627},{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.5902000069618225},{"id":"https://openalex.org/keywords/redundancy","display_name":"Redundancy (engineering)","score":0.5429999828338623},{"id":"https://openalex.org/keywords/pattern-recognition","display_name":"Pattern recognition (psychology)","score":0.5364999771118164},{"id":"https://openalex.org/keywords/generative-model","display_name":"Generative model","score":0.5327000021934509},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.4950000047683716},{"id":"https://openalex.org/keywords/image-fusion","display_name":"Image fusion","score":0.48669999837875366}],"concepts":[{"id":"https://openalex.org/C101738243","wikidata":"https://www.wikidata.org/wiki/Q786435","display_name":"Autoencoder","level":3,"score":0.8083999752998352},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.7612000107765198},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7350000143051147},{"id":"https://openalex.org/C59404180","wikidata":"https://www.wikidata.org/wiki/Q17013334","display_name":"Feature learning","level":2,"score":0.635200023651123},{"id":"https://openalex.org/C39890363","wikidata":"https://www.wikidata.org/wiki/Q36108","display_name":"Generative grammar","level":2,"score":0.6122999787330627},{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.5902000069618225},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.5429999828338623},{"id":"https://openalex.org/C153180895","wikidata":"https://www.wikidata.org/wiki/Q7148389","display_name":"Pattern recognition (psychology)","level":2,"score":0.5364999771118164},{"id":"https://openalex.org/C167966045","wikidata":"https://www.wikidata.org/wiki/Q5532625","display_name":"Generative model","level":3,"score":0.5327000021934509},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.4950000047683716},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.48669999837875366},{"id":"https://openalex.org/C173414695","wikidata":"https://www.wikidata.org/wiki/Q5510276","display_name":"Fusion mechanism","level":4,"score":0.43709999322891235},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.4260999858379364},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.3896999955177307},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.3889999985694885},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.36340001225471497},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.34220001101493835},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.33399999141693115},{"id":"https://openalex.org/C83665646","wikidata":"https://www.wikidata.org/wiki/Q42139305","display_name":"Feature vector","level":2,"score":0.32589998841285706},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.32409998774528503},{"id":"https://openalex.org/C52622490","wikidata":"https://www.wikidata.org/wiki/Q1026626","display_name":"Feature extraction","level":2,"score":0.320499986410141},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.3109000027179718},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.2992999851703644},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.29840001463890076},{"id":"https://openalex.org/C55020928","wikidata":"https://www.wikidata.org/wiki/Q3813865","display_name":"Image quality","level":3,"score":0.2953000068664551},{"id":"https://openalex.org/C75294576","wikidata":"https://www.wikidata.org/wiki/Q5165192","display_name":"Contextual image classification","level":3,"score":0.27970001101493835},{"id":"https://openalex.org/C106430172","wikidata":"https://www.wikidata.org/wiki/Q6002272","display_name":"Image restoration","level":4,"score":0.27469998598098755},{"id":"https://openalex.org/C142575187","wikidata":"https://www.wikidata.org/wiki/Q3358290","display_name":"Pyramid (geometry)","level":2,"score":0.26429998874664307}],"mesh":[],"locations_count":2,"locations":[{"id":"doi:10.1109/tip.2025.3615680","is_oa":false,"landing_page_url":"https://doi.org/10.1109/tip.2025.3615680","pdf_url":null,"source":{"id":"https://openalex.org/S4210173141","display_name":"IEEE Transactions on Image Processing","issn_l":"1057-7149","issn":["1057-7149","1941-0042"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Transactions on Image Processing","raw_type":"journal-article"},{"id":"pmid:41052155","is_oa":false,"landing_page_url":"https://pubmed.ncbi.nlm.nih.gov/41052155","pdf_url":null,"source":{"id":"https://openalex.org/S4306525036","display_name":"PubMed","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I1299303238","host_organization_name":"National Institutes of Health","host_organization_lineage":["https://openalex.org/I1299303238"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE transactions on image processing : a publication of the IEEE Signal Processing Society","raw_type":null}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G2452297484","display_name":null,"funder_award_id":"QTZX23042","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G4297946667","display_name":null,"funder_award_id":"U22A2096","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G4395595032","display_name":null,"funder_award_id":"62441601","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G494101563","display_name":null,"funder_award_id":"KYFZ25001","funder_id":"https://openalex.org/F4320335787","funder_display_name":"Fundamental Research Funds for the Central Universities"},{"id":"https://openalex.org/G7408314144","display_name":null,"funder_award_id":"62206211","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G7985540183","display_name":null,"funder_award_id":"2025RS-CXTD-011","funder_id":"https://openalex.org/F4320329794","funder_display_name":"Social Science Foundation of Shaanxi Province"},{"id":"https://openalex.org/G8946150788","display_name":null,"funder_award_id":"62176195","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"},{"id":"https://openalex.org/G913836228","display_name":null,"funder_award_id":"62036007","funder_id":"https://openalex.org/F4320321001","funder_display_name":"National Natural Science Foundation of China"}],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320329794","display_name":"Social Science Foundation of Shaanxi Province","ror":null},{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":57,"referenced_works":["https://openalex.org/W1967595981","https://openalex.org/W1970758811","https://openalex.org/W2133665775","https://openalex.org/W2152218325","https://openalex.org/W2547774815","https://openalex.org/W2783573276","https://openalex.org/W2787242136","https://openalex.org/W2978157082","https://openalex.org/W2998529071","https://openalex.org/W3014859219","https://openalex.org/W3046194589","https://openalex.org/W3095064240","https://openalex.org/W3135530979","https://openalex.org/W3152132512","https://openalex.org/W3169965317","https://openalex.org/W3199044200","https://openalex.org/W4206713196","https://openalex.org/W4210571497","https://openalex.org/W4220893768","https://openalex.org/W4225672218","https://openalex.org/W4286361941","https://openalex.org/W4301184982","https://openalex.org/W4312440143","https://openalex.org/W4312498215","https://openalex.org/W4313156423","https://openalex.org/W4313555022","https://openalex.org/W4362014679","https://openalex.org/W4366352735","https://openalex.org/W4379741379","https://openalex.org/W4384916907","https://openalex.org/W4385819922","https://openalex.org/W4386071584","https://openalex.org/W4386076504","https://openalex.org/W4386315034","https://openalex.org/W4386902810","https://openalex.org/W4389195380","https://openalex.org/W4390241455","https://openalex.org/W4392207639","https://openalex.org/W4393032603","https://openalex.org/W4393240973","https://openalex.org/W4399167823","https://openalex.org/W4399526541","https://openalex.org/W4399880844","https://openalex.org/W4401024099","https://openalex.org/W4401024612","https://openalex.org/W4402715923","https://openalex.org/W4404037176","https://openalex.org/W4405303798","https://openalex.org/W4406891755","https://openalex.org/W4408667798","https://openalex.org/W4409200564","https://openalex.org/W4409366935","https://openalex.org/W4409367774","https://openalex.org/W4410640240","https://openalex.org/W4413144810","https://openalex.org/W4413157478","https://openalex.org/W4413158072"],"related_works":[],"abstract_inverted_index":{"Creating":[0],"a":[1,13,61,89,102],"comprehensively":[2],"representative":[3],"image":[4,83,172],"while":[5,33,92],"maintaining":[6],"the":[7,56,108,115,121,129,143,148],"merits":[8],"of":[9,16,31,96,110,124],"various":[10],"modalities":[11],"is":[12,77,176],"key":[14],"focus":[15],"current":[17],"Multi-Modality":[18],"Image":[19],"Fusion":[20],"research.":[21],"Existing":[22],"unified":[23,90],"methods":[24],"often":[25],"struggle":[26],"to":[27,43,79,106,140],"handle":[28],"varying":[29,82],"types":[30],"degradation":[32,113],"extracting":[34],"modality-shared":[35],"and":[36,73,85,112,118,170],"modality-specific":[37],"information":[38],"from":[39],"source":[40,116],"images,":[41,117],"leading":[42],"limitations":[44],"in":[45,114,128,147,161],"their":[46],"generative":[47,71,130],"or":[48],"representation":[49,74,149],"capabilities":[50],"under":[51],"different":[52],"conditions.":[53],"To":[54],"address":[55],"challenge,":[57],"we":[58,135],"propose":[59],"MVFusion,":[60],"novel":[62],"self-supervised":[63,103],"masked":[64,104],"variational":[65,137],"autoencoder":[66,105],"framework":[67,91],"that":[68,155],"simultaneously":[69],"enhances":[70],"training":[72,131],"learning.":[75],"It":[76],"designed":[78],"cope":[80],"with":[81,88],"quality":[84],"dataset":[86],"composition":[87],"ensuring":[93],"effective":[94],"fusion":[95,164],"modality":[97,145],"information.":[98],"Specifically,":[99],"MVFusion":[100],"employs":[101],"reduce":[107],"impact":[109],"redundancy":[111],"thus":[119],"learns":[120],"latent":[122],"distribution":[123],"degraded":[125],"input":[126],"images":[127],"stage.":[132,151],"In":[133],"addition,":[134],"incorporate":[136],"feature":[138],"learning":[139,150],"further":[141],"preserve":[142],"distinctive":[144],"features":[146],"Extensive":[152],"experiments":[153],"demonstrate":[154],"our":[156],"model":[157],"achieves":[158],"promising":[159],"results":[160],"several":[162],"classical":[163],"tasks,":[165],"including":[166],"infrared-visible,":[167],"multi-focus,":[168],"multi-exposure,":[169],"medical":[171],"fusion.":[173],"The":[174],"code":[175],"available":[177],"at":[178],"https://github.com/shiboneng/MVFusion.":[179]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
