{"id":"https://openalex.org/W7134245016","doi":"https://doi.org/10.48550/arxiv.2603.06508","title":"When One Modality Rules Them All: Backdoor Modality Collapse in Multimodal Diffusion Models","display_name":"When One Modality Rules Them All: Backdoor Modality Collapse in Multimodal Diffusion Models","publication_year":2026,"publication_date":"2026-03-06","ids":{"openalex":"https://openalex.org/W7134245016","doi":"https://doi.org/10.48550/arxiv.2603.06508"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.06508","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5101488348","display_name":"Qitong Wang","orcid":"https://orcid.org/0000-0001-6360-3800"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Qitong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5108293594","display_name":"Haoran Dai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dai, Haoran","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128622811","display_name":"Haotian Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Haotian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005424498","display_name":"Christopher Rasmussen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rasmussen, Christopher","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128466874","display_name":"Binghui Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Binghui","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.4462999999523163,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.4462999999523163,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11574","display_name":"Artificial Intelligence in Games","score":0.11050000041723251,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.08479999750852585,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/backdoor","display_name":"Backdoor","score":0.9750000238418579},{"id":"https://openalex.org/keywords/modality","display_name":"Modality (human\u2013computer interaction)","score":0.5127999782562256},{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.3598000109195709},{"id":"https://openalex.org/keywords/intuition","display_name":"Intuition","score":0.35569998621940613},{"id":"https://openalex.org/keywords/salience","display_name":"Salience (neuroscience)","score":0.3366999924182892},{"id":"https://openalex.org/keywords/modalities","display_name":"Modalities","score":0.31869998574256897}],"concepts":[{"id":"https://openalex.org/C2781045450","wikidata":"https://www.wikidata.org/wiki/Q254569","display_name":"Backdoor","level":2,"score":0.9750000238418579},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6302000284194946},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.552299976348877},{"id":"https://openalex.org/C2780226545","wikidata":"https://www.wikidata.org/wiki/Q6888030","display_name":"Modality (human\u2013computer interaction)","level":2,"score":0.5127999782562256},{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.3598000109195709},{"id":"https://openalex.org/C132010649","wikidata":"https://www.wikidata.org/wiki/Q189222","display_name":"Intuition","level":2,"score":0.35569998621940613},{"id":"https://openalex.org/C108154423","wikidata":"https://www.wikidata.org/wiki/Q1469792","display_name":"Salience (neuroscience)","level":2,"score":0.3366999924182892},{"id":"https://openalex.org/C2779903281","wikidata":"https://www.wikidata.org/wiki/Q6888026","display_name":"Modalities","level":2,"score":0.31869998574256897},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3151000142097473},{"id":"https://openalex.org/C205711294","wikidata":"https://www.wikidata.org/wiki/Q176953","display_name":"Rendering (computer graphics)","level":2,"score":0.31139999628067017},{"id":"https://openalex.org/C108583219","wikidata":"https://www.wikidata.org/wiki/Q197536","display_name":"Deep learning","level":2,"score":0.29339998960494995},{"id":"https://openalex.org/C135798126","wikidata":"https://www.wikidata.org/wiki/Q2167279","display_name":"Top-down and bottom-up design","level":2,"score":0.26409998536109924}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.06508","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.06508","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.06508","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.06508","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"While":[0],"diffusion":[1,25],"models":[2],"have":[3],"revolutionized":[4],"visual":[5],"content":[6],"generation,":[7],"their":[8],"rapid":[9],"adoption":[10],"has":[11],"underscored":[12],"the":[13,47,59,68,142],"critical":[14,151],"need":[15],"to":[16,20,30,72],"investigate":[17],"vulnerabilities,":[18],"e.g.,":[19],"backdoor":[21,69,119],"attacks.":[22],"In":[23,50],"multimodal":[24,109],"models,":[26],"it":[27],"is":[28,136],"natural":[29],"expect":[31],"that":[32,124,158],"attacking":[33],"multiple":[34],"modalities":[35],"simultaneously":[36],"(e.g.,":[37],"text":[38],"and":[39,45,97,132,181],"image)":[40],"would":[41],"yield":[42],"complementary":[43],"effects":[44],"strengthen":[46],"overall":[48],"backdoor.":[49],"this":[51,55,86],"paper,":[52],"we":[53,88,112],"challenge":[54],"assumption":[56],"by":[57],"investigating":[58],"phenomenon":[60],"of":[61,78,144,171],"Backdoor":[62],"Modality":[63,94],"Collapse,":[64],"a":[65,76,115,150,165,169,175],"scenario":[66],"where":[67],"mechanism":[70],"degenerates":[71],"rely":[73],"predominantly":[74],"on":[75,168],"subset":[77,170],"modalities,":[79],"rendering":[80],"others":[81],"redundant.":[82],"To":[83],"rigorously":[84],"quantify":[85],"behavior,":[87],"introduce":[89],"two":[90],"novel":[91],"metrics:":[92],"Trigger":[93],"Attribution":[95],"(TMA)":[96],"Cross-Trigger":[98],"Interaction":[99],"(CTI).":[100],"Through":[101],"extensive":[102],"experiments":[103],"across":[104],"diverse":[105],"training":[106],"configurations":[107],"in":[108,118,154],"conditional":[110],"diffusion,":[111],"consistently":[113],"observe":[114],"``winner-takes-all''":[116],"dynamic":[117],"behavior.":[120],"Our":[121],"results":[122],"reveal":[123],"(1)":[125],"attacks":[126],"often":[127,163],"collapse":[128],"into":[129],"subset-modality":[130],"dominance,":[131],"(2)":[133],"cross-modal":[134],"interaction":[135],"negligible":[137],"or":[138],"even":[139],"negative,":[140],"contradicting":[141],"intuition":[143],"synergistic":[145],"vulnerability.":[146],"These":[147],"findings":[148],"highlight":[149],"blind":[152],"spot":[153],"current":[155],"assessments,":[156],"suggesting":[157],"high":[159],"attack":[160],"success":[161],"rates":[162],"mask":[164],"fundamental":[166],"reliance":[167],"modalities.":[172],"This":[173],"establishes":[174],"principled":[176],"foundation":[177],"for":[178],"mechanistic":[179],"analysis":[180],"future":[182],"defense":[183],"development.":[184]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-10T00:00:00"}
