{"id":"https://openalex.org/W4406272103","doi":"https://doi.org/10.1109/iccv51701.2025.00198","title":"Jailbreaking Multimodal Large Language Models via Shuffle Inconsistency","display_name":"Jailbreaking Multimodal Large Language Models via Shuffle Inconsistency","publication_year":2025,"publication_date":"2025-10-19","ids":{"openalex":"https://openalex.org/W4406272103","doi":"https://doi.org/10.1109/iccv51701.2025.00198"},"language":"en","primary_location":{"id":"doi:10.1109/iccv51701.2025.00198","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.00198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},"type":"preprint","indexed_in":["arxiv","crossref","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2501.04931","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Shiji Zhao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":true,"raw_author_name":"Shiji Zhao","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043909623","display_name":"Ranjie Duan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Ranjie Duan","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100639703","display_name":"Fengxiang Wang","orcid":"https://orcid.org/0000-0002-7383-4634"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Fengxiang Wang","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103056709","display_name":"Chi Chen","orcid":"https://orcid.org/0000-0002-8472-641X"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Chi Chen","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048132729","display_name":"Caixin Kang","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Caixin Kang","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Shouwei Ruan","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Shouwei Ruan","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115843913","display_name":"Jialing Tao","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Jialing Tao","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":null,"display_name":"YueFeng Chen","orcid":null},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"YueFeng Chen","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057436798","display_name":"Hui Xue","orcid":"https://orcid.org/0000-0002-5856-4445"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Hui Xue","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China","institution_ids":["https://openalex.org/I4210100255"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5079657274","display_name":"Xingxing Wei","orcid":"https://orcid.org/0000-0002-0778-8377"},"institutions":[{"id":"https://openalex.org/I4210100255","display_name":"Beijing Academy of Artificial Intelligence","ror":"https://ror.org/016a74861","country_code":"CN","type":"other","lineage":["https://openalex.org/I4210100255"]}],"countries":["CN"],"is_corresponding":false,"raw_author_name":"Xingxing Wei","raw_affiliation_strings":["Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China"],"raw_orcid":null,"affiliations":[{"raw_affiliation_string":"Institute of Artificial Intelligence, Beihang University,State Key Laboratory of Virtual Reality Technology and Systems,Beijing,China","institution_ids":["https://openalex.org/I4210100255"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":10,"corresponding_author_ids":[],"corresponding_institution_ids":["https://openalex.org/I4210100255"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":true,"cited_by_count":0,"citation_normalized_percentile":{"value":0.00244215,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"2045","last_page":"2054"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.9923999905586243,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.9864000082015991,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.9648000001907349,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.5882223844528198},{"id":"https://openalex.org/keywords/natural-language-processing","display_name":"Natural language processing","score":0.3372197449207306}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5882223844528198},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3372197449207306}],"mesh":[],"locations_count":3,"locations":[{"id":"doi:10.1109/iccv51701.2025.00198","is_oa":false,"landing_page_url":"https://doi.org/10.1109/iccv51701.2025.00198","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE/CVF International Conference on Computer Vision (ICCV)","raw_type":"proceedings-article"},{"id":"pmh:oai:arXiv.org:2501.04931","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.04931","pdf_url":"https://arxiv.org/pdf/2501.04931","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2501.04931","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2501.04931","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2501.04931","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2501.04931","pdf_url":"https://arxiv.org/pdf/2501.04931","source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320335787","display_name":"Fundamental Research Funds for the Central Universities","ror":null}],"has_content":{"pdf":true,"grobid_xml":false},"content_urls":{"pdf":"https://content.openalex.org/works/W4406272103.pdf"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Multimodal":[0],"Large":[1],"Language":[2],"Models":[3],"(MLLMs)":[4],"have":[5,10,22,70],"achieved":[6],"impressive":[7],"performance":[8,198],"and":[9,39,62,96,159],"been":[11],"put":[12],"into":[13],"practical":[14],"use":[15],"in":[16],"commercial":[17,77,213],"applications,":[18],"but":[19],"they":[20,69,122],"still":[21],"potential":[23,42],"safety":[24,37,52,97,136],"mechanism":[25,53],"vulnerabilities.":[26],"Jailbreak":[27],"attacks":[28],"are":[29],"red":[30],"teaming":[31],"methods":[32,47,57],"that":[33,86,192],"aim":[34],"to":[35,139,153,171],"bypass":[36,49],"mechanisms":[38],"discover":[40],"MLLMs'":[41,45,93],"risks.":[43],"Existing":[44],"jailbreak":[46,148],"often":[48],"the":[50,100,107,115,128,133,156,161,173,180,183,196,208],"model's":[51],"through":[54],"complex":[55],"optimization":[56,169],"or":[58,218],"carefully":[59],"designed":[60],"image":[61],"text":[63],"prompts.":[64],"Despite":[65],"achieving":[66],"some":[67],"progress,":[68],"a":[71,89,146,166],"low":[72],"attack":[73,149,209],"success":[74,210],"rate":[75,211],"on":[76,179,199],"closed-source":[78],"MLLMs.":[79],"Unlike":[80],"previous":[81],"research,":[82],"we":[83,143,164],"empirically":[84],"find":[85],"there":[87],"exists":[88],"Shuffle":[90,157],"Inconsistency":[91,158],"between":[92],"comprehension":[94,110],"ability":[95,98],"for":[99,212],"shuffled":[101,116,129,176],"harmful":[102,117,130,140,175],"instruction.":[103],"That":[104],"is,":[105],"from":[106,132],"perspective":[108,134],"of":[109,135,182,189],"ability,":[111,137],"MLLMs":[112,214],"can":[113,123,194,205],"understand":[114],"text-image":[118,147],"instructions":[119,131],"well.":[120],"However,":[121],"be":[124],"easily":[125],"bypassed":[126],"by":[127],"leading":[138],"responses.":[141],"Then":[142],"innovatively":[144],"propose":[145],"named":[150],"SI-Attack.":[151],"Specifically,":[152],"fully":[154],"utilize":[155],"overcome":[160],"shuffle":[162],"randomness,":[163],"apply":[165],"query-based":[167],"black-box":[168],"method":[170],"select":[172],"most":[174],"inputs":[177],"based":[178],"feedback":[181],"toxic":[184],"judge":[185],"model.":[186],"A":[187],"series":[188],"experiments":[190],"show":[191],"SI-Attack":[193,204],"improve":[195,207],"attack's":[197],"three":[200],"benchmarks.":[201],"In":[202],"particular,":[203],"obviously":[206],"such":[215],"as":[216],"GPT-4o":[217],"Claude-3.5-Sonnet.":[219]},"counts_by_year":[],"updated_date":"2026-05-06T06:03:25.996018","created_date":"2025-10-10T00:00:00"}
