{"id":"https://openalex.org/W4411631871","doi":"https://doi.org/10.1145/3731715.3733407","title":"On the Adversarial Robustness of Visual-Language Chat Models","display_name":"On the Adversarial Robustness of Visual-Language Chat Models","publication_year":2025,"publication_date":"2025-06-25","ids":{"openalex":"https://openalex.org/W4411631871","doi":"https://doi.org/10.1145/3731715.3733407"},"language":"en","primary_location":{"id":"doi:10.1145/3731715.3733407","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3731715.3733407","pdf_url":null,"source":null,"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":true,"oa_status":"gold","oa_url":"https://doi.org/10.1145/3731715.3733407","any_repository_has_fulltext":null},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5118625832","display_name":"Tianrui Qin","orcid":"https://orcid.org/0009-0002-8386-2003"},"institutions":[{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Tianrui Qin","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China and OPPO Research Institute, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China and OPPO Research Institute, Shenzhen, China","institution_ids":["https://openalex.org/I4210145761"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002605073","display_name":"Xuan Wang","orcid":"https://orcid.org/0000-0001-9900-9117"},"institutions":[{"id":"https://openalex.org/I170215575","display_name":"National University of Defense Technology","ror":"https://ror.org/05d2yfz11","country_code":"CN","type":"education","lineage":["https://openalex.org/I170215575"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xuan Wang","raw_affiliation_strings":["National University of Defense Technology, Hefei, China"],"affiliations":[{"raw_affiliation_string":"National University of Defense Technology, Hefei, China","institution_ids":["https://openalex.org/I170215575"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100539153","display_name":"Juanjuan Zhao","orcid":"https://orcid.org/0000-0003-1002-9272"},"institutions":[{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Juanjuan Zhao","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China","institution_ids":["https://openalex.org/I4210145761"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012757772","display_name":"Kejiang Ye","orcid":"https://orcid.org/0000-0001-6133-407X"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Kejiang Ye","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China and Shenzhen University of Advanced Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China and Shenzhen University of Advanced Technology, Shenzhen, China","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I180726961"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5012773300","display_name":"Chengzhong Xu","orcid":"https://orcid.org/0000-0001-9480-0356"},"institutions":[{"id":"https://openalex.org/I204512498","display_name":"University of Macau","ror":"https://ror.org/01r4q9n85","country_code":"MO","type":"education","lineage":["https://openalex.org/I204512498"]}],"countries":["MO"],"is_corresponding":false,"raw_author_name":"Cheng-zhong Xu","raw_affiliation_strings":["University of Macau, Macau, China"],"affiliations":[{"raw_affiliation_string":"University of Macau, Macau, China","institution_ids":["https://openalex.org/I204512498"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5026189787","display_name":"Xitong Gao","orcid":"https://orcid.org/0000-0002-2063-2051"},"institutions":[{"id":"https://openalex.org/I180726961","display_name":"Shenzhen University","ror":"https://ror.org/01vy4gh70","country_code":"CN","type":"education","lineage":["https://openalex.org/I180726961"]},{"id":"https://openalex.org/I4210145761","display_name":"Shenzhen Institutes of Advanced Technology","ror":"https://ror.org/04gh4er46","country_code":"CN","type":"facility","lineage":["https://openalex.org/I19820366","https://openalex.org/I4210145761"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xitong Gao","raw_affiliation_strings":["Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China and Shenzhen University of Advanced Technology, Shenzhen, China"],"affiliations":[{"raw_affiliation_string":"Shenzhen Institutes of Advanced Technology, Chinese Academy of Sciences, Shenzhen, China and Shenzhen University of Advanced Technology, Shenzhen, China","institution_ids":["https://openalex.org/I4210145761","https://openalex.org/I180726961"]}]}],"institutions":[],"countries_distinct_count":2,"institutions_distinct_count":6,"corresponding_author_ids":["https://openalex.org/A5118625832"],"corresponding_institution_ids":["https://openalex.org/I4210145761"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.07086709,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1118","last_page":"1127"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":1.0,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11307","display_name":"Domain Adaptation and Few-Shot Learning","score":0.9919000267982483,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11147","display_name":"Misinformation and Its Impacts","score":0.9854999780654907,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/robustness","display_name":"Robustness (evolution)","score":0.8444938063621521},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.7983243465423584},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7366394996643066},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.534291684627533},{"id":"https://openalex.org/keywords/computer-vision","display_name":"Computer vision","score":0.4322527050971985},{"id":"https://openalex.org/keywords/speech-recognition","display_name":"Speech recognition","score":0.4123688340187073},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.36061131954193115}],"concepts":[{"id":"https://openalex.org/C63479239","wikidata":"https://www.wikidata.org/wiki/Q7353546","display_name":"Robustness (evolution)","level":3,"score":0.8444938063621521},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.7983243465423584},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7366394996643066},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.534291684627533},{"id":"https://openalex.org/C31972630","wikidata":"https://www.wikidata.org/wiki/Q844240","display_name":"Computer vision","level":1,"score":0.4322527050971985},{"id":"https://openalex.org/C28490314","wikidata":"https://www.wikidata.org/wiki/Q189436","display_name":"Speech recognition","level":1,"score":0.4123688340187073},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.36061131954193115},{"id":"https://openalex.org/C185592680","wikidata":"https://www.wikidata.org/wiki/Q2329","display_name":"Chemistry","level":0,"score":0.0},{"id":"https://openalex.org/C104317684","wikidata":"https://www.wikidata.org/wiki/Q7187","display_name":"Gene","level":2,"score":0.0},{"id":"https://openalex.org/C55493867","wikidata":"https://www.wikidata.org/wiki/Q7094","display_name":"Biochemistry","level":1,"score":0.0}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1145/3731715.3733407","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3731715.3733407","pdf_url":null,"source":null,"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"}],"best_oa_location":{"id":"doi:10.1145/3731715.3733407","is_oa":true,"landing_page_url":"https://doi.org/10.1145/3731715.3733407","pdf_url":null,"source":null,"license":"cc-by-nc-sa","license_id":"https://openalex.org/licenses/cc-by-nc-sa","version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"Proceedings of the 2025 International Conference on Multimedia Retrieval","raw_type":"proceedings-article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/4","display_name":"Quality Education","score":0.41999998688697815}],"awards":[{"id":"https://openalex.org/G3633650628","display_name":null,"funder_award_id":"2024A1515030209, 2024A1515011970","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"},{"id":"https://openalex.org/G7229203384","display_name":null,"funder_award_id":"62376263, 62372443, 62271496","funder_id":"https://openalex.org/F4320323817","funder_display_name":"Universitas Brawijaya"}],"funders":[{"id":"https://openalex.org/F4320323817","display_name":"Universitas Brawijaya","ror":"https://ror.org/01wk3d929"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":29,"referenced_works":["https://openalex.org/W2108598243","https://openalex.org/W2194775991","https://openalex.org/W2593463961","https://openalex.org/W2963564844","https://openalex.org/W2966491090","https://openalex.org/W3095319910","https://openalex.org/W3171312896","https://openalex.org/W3171774521","https://openalex.org/W3177174258","https://openalex.org/W3179916154","https://openalex.org/W4224308101","https://openalex.org/W4225323055","https://openalex.org/W4226278401","https://openalex.org/W4236965008","https://openalex.org/W4287113019","https://openalex.org/W4313022653","https://openalex.org/W4387623745","https://openalex.org/W4390190425","https://openalex.org/W4390872822","https://openalex.org/W4392903024","https://openalex.org/W4393145119","https://openalex.org/W4403791428","https://openalex.org/W4405718500","https://openalex.org/W4409365868","https://openalex.org/W6600175266","https://openalex.org/W6600424091","https://openalex.org/W6600545252","https://openalex.org/W6796729313","https://openalex.org/W6810081322"],"related_works":["https://openalex.org/W2502115930","https://openalex.org/W2482350142","https://openalex.org/W4246396837","https://openalex.org/W3126451824","https://openalex.org/W1561927205","https://openalex.org/W3191453585","https://openalex.org/W4297672492","https://openalex.org/W4310988119","https://openalex.org/W4285226279","https://openalex.org/W4288019534"],"abstract_inverted_index":{"With":[0],"the":[1,34,50,63,73,85,88,91,99,135,143,153],"rapid":[2],"development":[3,154],"of":[4,36,52,65,76,87,94,101,138,155],"large":[5],"language":[6,105],"models":[7,157],"(LLMs),":[8],"there":[9],"has":[10,41],"been":[11,43],"a":[12,79],"strong":[13],"interest":[14],"in":[15,30,141],"integrating":[16],"other":[17],"modalities":[18],"such":[19],"as":[20],"image":[21,119],"comprehension":[22],"capabilities.":[23],"While":[24],"they":[25],"have":[26],"shown":[27],"impressive":[28],"performance":[29],"various":[31],"multimodal":[32,74,156],"tasks,":[33],"robustness":[35,51],"Visual":[37],"Language":[38],"Models":[39],"(VLMs)":[40],"not":[42],"thoroughly":[44],"investigated.":[45],"We":[46,70,125,146],"mainly":[47],"focus":[48],"on":[49,54,128],"VLMs":[53,77,132],"visual":[55,95],"adversarial":[56,66,102,115,139,161],"examples.":[57],"In":[58],"this":[59],"work,":[60],"we":[61,109],"explore":[62],"capability":[64],"examples":[67,116,140],"targeting":[68,117],"VLMs.":[69],"highlight":[71],"that":[72,148],"nature":[75,93],"presents":[78],"unique":[80],"attack":[81],"surface":[82],"to":[83,160],"manipulate":[84],"outputs":[86],"LLMs,":[89],"and":[90,122,133],"continuous":[92],"inputs":[96],"further":[97],"enhances":[98],"effectiveness":[100],"attacks":[103],"against":[104],"generative":[106],"models.":[107],"Furthermore,":[108],"demonstrate":[110,134],"three":[111],"application":[112,137],"scenarios":[113],"for":[114],"VLMs:":[118],"description,":[120],"jailbreaking,":[121],"information":[123],"hiding.":[124],"conduct":[126],"experiments":[127],"several":[129],"leading":[130],"open-source":[131],"successful":[136],"all":[142],"proposed":[144],"scenarios.":[145],"hope":[147],"our":[149],"findings":[150],"would":[151],"enable":[152],"more":[158],"robust":[159],"attacks.":[162],"Our":[163],"code":[164],"is":[165],"available":[166],"at":[167],"https://github.com/lafeat/m3-break.":[168]},"counts_by_year":[],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2025-10-10T00:00:00"}
