{"id":"https://openalex.org/W4413144420","doi":"https://doi.org/10.1109/cvpr52734.2025.01666","title":"Every SAM Drop Counts: Embracing Semantic Priors for Multi-Modality Image Fusion and Beyond","display_name":"Every SAM Drop Counts: Embracing Semantic Priors for Multi-Modality Image Fusion and Beyond","publication_year":2025,"publication_date":"2025-06-10","ids":{"openalex":"https://openalex.org/W4413144420","doi":"https://doi.org/10.1109/cvpr52734.2025.01666"},"language":"en","primary_location":{"id":"doi:10.1109/cvpr52734.2025.01666","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52734.2025.01666","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052984338","display_name":"Guanyao Wu","orcid":null},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Guanyao Wu","raw_affiliation_strings":["Dalian University of Technology,School of Software Technology,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Software Technology,China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100444762","display_name":"Haoyu Liu","orcid":"https://orcid.org/0000-0003-3755-5184"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Haoyu Liu","raw_affiliation_strings":["Dalian University of Technology,School of Software Technology,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Software Technology,China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5089009502","display_name":"Hongming Fu","orcid":null},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hongming Fu","raw_affiliation_strings":["Dalian University of Technology,School of Software Technology,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Software Technology,China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5045227272","display_name":"Yichuan Peng","orcid":"https://orcid.org/0000-0002-6234-8083"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Yichuan Peng","raw_affiliation_strings":["Dalian University of Technology,School of Software Technology,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Software Technology,China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100675904","display_name":"Jinyuan Liu","orcid":"https://orcid.org/0000-0003-2085-2676"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jinyuan Liu","raw_affiliation_strings":["Dalian University of Technology,School of Mechanical Engineering,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Mechanical Engineering,China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057776894","display_name":"Xin Fan","orcid":"https://orcid.org/0000-0002-8991-4188"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xin Fan","raw_affiliation_strings":["Dalian University of Technology,School of Software Technology,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Software Technology,China","institution_ids":["https://openalex.org/I27357992"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5042370642","display_name":"Risheng Liu","orcid":"https://orcid.org/0000-0002-9554-0565"},"institutions":[{"id":"https://openalex.org/I27357992","display_name":"Dalian University of Technology","ror":"https://ror.org/023hj5876","country_code":"CN","type":"education","lineage":["https://openalex.org/I27357992"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Risheng Liu","raw_affiliation_strings":["Dalian University of Technology,School of Software Technology,China"],"affiliations":[{"raw_affiliation_string":"Dalian University of Technology,School of Software Technology,China","institution_ids":["https://openalex.org/I27357992"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5052984338"],"corresponding_institution_ids":["https://openalex.org/I27357992"],"apc_list":null,"apc_paid":null,"fwci":31.722,"has_fulltext":false,"cited_by_count":15,"citation_normalized_percentile":{"value":0.9989491,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":99,"max":100},"biblio":{"volume":null,"issue":null,"first_page":"17882","last_page":"17891"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10271","display_name":"Seismic Imaging and Inversion Techniques","score":0.8403000235557556,"subfield":{"id":"https://openalex.org/subfields/1908","display_name":"Geophysics"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10271","display_name":"Seismic Imaging and Inversion Techniques","score":0.8403000235557556,"subfield":{"id":"https://openalex.org/subfields/1908","display_name":"Geophysics"},"field":{"id":"https://openalex.org/fields/19","display_name":"Earth and Planetary Sciences"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10399","display_name":"Hydrocarbon exploration and reservoir analysis","score":0.7961000204086304,"subfield":{"id":"https://openalex.org/subfields/2211","display_name":"Mechanics of Materials"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11801","display_name":"Reservoir Engineering and Simulation Methods","score":0.7573000192642212,"subfield":{"id":"https://openalex.org/subfields/2212","display_name":"Ocean Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.6365649700164795},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.5820593237876892},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5547934174537659},{"id":"https://openalex.org/keywords/fusion","display_name":"Fusion","score":0.5260037183761597},{"id":"https://openalex.org/keywords/prior-probability","display_name":"Prior probability","score":0.5239976644515991},{"id":"https://openalex.org/keywords/image","display_name":"Image (mathematics)","score":0.48394468426704407},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.42340725660324097},{"id":"https://openalex.org/keywords/image-fusion","display_name":"Image fusion","score":0.4195399582386017},{"id":"https://openalex.org/keywords/bayesian-probability","display_name":"Bayesian probability","score":0.08138644695281982},{"id":"https://openalex.org/keywords/linguistics","display_name":"Linguistics","score":0.06665605306625366}],"concepts":[{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.6365649700164795},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5820593237876892},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5547934174537659},{"id":"https://openalex.org/C158525013","wikidata":"https://www.wikidata.org/wiki/Q2593739","display_name":"Fusion","level":2,"score":0.5260037183761597},{"id":"https://openalex.org/C177769412","wikidata":"https://www.wikidata.org/wiki/Q278090","display_name":"Prior probability","level":3,"score":0.5239976644515991},{"id":"https://openalex.org/C115961682","wikidata":"https://www.wikidata.org/wiki/Q860623","display_name":"Image (mathematics)","level":2,"score":0.48394468426704407},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.42340725660324097},{"id":"https://openalex.org/C69744172","wikidata":"https://www.wikidata.org/wiki/Q860822","display_name":"Image fusion","level":3,"score":0.4195399582386017},{"id":"https://openalex.org/C107673813","wikidata":"https://www.wikidata.org/wiki/Q812534","display_name":"Bayesian probability","level":2,"score":0.08138644695281982},{"id":"https://openalex.org/C41895202","wikidata":"https://www.wikidata.org/wiki/Q8162","display_name":"Linguistics","level":1,"score":0.06665605306625366},{"id":"https://openalex.org/C138885662","wikidata":"https://www.wikidata.org/wiki/Q5891","display_name":"Philosophy","level":0,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/cvpr52734.2025.01666","is_oa":false,"landing_page_url":"https://doi.org/10.1109/cvpr52734.2025.01666","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Reduced inequalities","score":0.4099999964237213,"id":"https://metadata.un.org/sdg/10"}],"awards":[],"funders":[{"id":"https://openalex.org/F4320321001","display_name":"National Natural Science Foundation of China","ror":"https://ror.org/01h0zpd94"},{"id":"https://openalex.org/F4320321543","display_name":"China Postdoctoral Science Foundation","ror":"https://ror.org/0426zh255"},{"id":"https://openalex.org/F4320337495","display_name":"Technology Development","ror":null}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W2788731446","https://openalex.org/W2204403038","https://openalex.org/W3152170969","https://openalex.org/W2379054866","https://openalex.org/W2370195708","https://openalex.org/W1490651872","https://openalex.org/W2139242969","https://openalex.org/W2284201331","https://openalex.org/W2095903272","https://openalex.org/W1989561795"],"abstract_inverted_index":{"Multi-modality":[0],"image":[1],"fusion,":[2],"particularly":[3],"infrared":[4],"and":[5,28,80,155],"visible,":[6],"plays":[7],"a":[8,59,90,125,149],"crucial":[9],"role":[10],"in":[11],"integrating":[12],"diverse":[13],"modalities":[14],"to":[15,30,49,73,114,138],"enhance":[16],"scene":[17],"understanding.":[18],"Although":[19],"early":[20],"research":[21],"prioritized":[22],"visual":[23,153],"quality,":[24],"preserving":[25],"fine":[26],"details":[27],"adapting":[29],"downstream":[31,82,156],"tasks":[32],"remains":[33],"challenging.":[34],"Recent":[35],"approaches":[36],"attempt":[37],"task-specific":[38],"design":[39,89],"but":[40],"rarely":[41],"achieve":[42],"\"The":[43],"Best":[44],"of":[45,77],"Both":[46],"Worlds\"":[47],"due":[48],"inconsistent":[50],"optimization":[51],"goals.":[52],"To":[53],"address":[54],"these":[55],"issues,":[56],"we":[57,88,123],"propose":[58],"novel":[60],"method":[61,147],"that":[62,96,145],"leverages":[63],"the":[64,68,75,102,116,135],"semantic":[65,108],"knowledge":[66],"from":[67,110],"Segment":[69],"Anything":[70],"Model":[71],"(SAM)":[72],"Grow":[74],"quality":[76],"fusion":[78],"results":[79,154],"Enable":[81],"task":[83,157],"adaptability,":[84],"namely":[85],"SAGE.":[86],"Specifically,":[87],"Semantic":[91],"Persistent":[92],"Attention":[93],"(SPA)":[94],"Module":[95],"efficiently":[97],"maintains":[98],"source":[99],"information":[100],"via":[101],"persistent":[103],"repository":[104],"while":[105,159],"extracting":[106],"high-level":[107],"priors":[109],"SAM.":[111],"More":[112],"importantly,":[113],"eliminate":[115],"impractical":[117],"dependence":[118],"on":[119],"SAM":[120],"during":[121],"inference,":[122],"introduce":[124],"bi-level":[126],"optimization-driven":[127],"distillation":[128],"mechanism":[129],"with":[130],"triplet":[131],"losses,":[132],"which":[133],"allow":[134],"student":[136],"network":[137],"effectively":[139],"extract":[140],"knowledge.":[141],"Extensive":[142],"experiments":[143],"show":[144],"our":[146],"achieves":[148],"balance":[150],"between":[151],"high-quality":[152],"adaptability":[158],"maintaining":[160],"practical":[161],"deployment":[162],"efficiency.":[163],"The":[164],"code":[165],"is":[166],"available":[167],"at":[168],"https://github.com/RollingPlain/SAGE_IVIF.":[169]},"counts_by_year":[{"year":2026,"cited_by_count":4},{"year":2025,"cited_by_count":11}],"updated_date":"2026-03-09T08:58:05.943551","created_date":"2025-10-10T00:00:00"}
