{"id":"https://openalex.org/W7134944025","doi":"https://doi.org/10.48550/arxiv.2603.09246","title":"Reasoning-Oriented Programming: Chaining Semantic Gadgets to Jailbreak Large Vision Language Models","display_name":"Reasoning-Oriented Programming: Chaining Semantic Gadgets to Jailbreak Large Vision Language Models","publication_year":2026,"publication_date":"2026-03-10","ids":{"openalex":"https://openalex.org/W7134944025","doi":"https://doi.org/10.48550/arxiv.2603.09246"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.09246","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09246","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.09246","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128776113","display_name":"Quanchen Zou","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zou, Quanchen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5048192370","display_name":"Minghao Chen","orcid":"https://orcid.org/0000-0003-3437-6578"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Moyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5020945039","display_name":"Zonghao Ying","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ying, Zonghao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5103643521","display_name":"Wenzhuo Xu","orcid":"https://orcid.org/0009-0000-7905-3428"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Wenzhuo","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5076884053","display_name":"Yisong Xiao","orcid":"https://orcid.org/0000-0001-8227-0052"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Yisong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128744690","display_name":"Deyue Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Deyue","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128786633","display_name":"Dongdong Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Dongdong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128800176","display_name":"Zhao Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Zhao","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128783418","display_name":"Xiangzheng Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xiangzheng","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5128776113"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.8853999972343445,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.8853999972343445,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.04740000143647194,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11424","display_name":"Security and Verification in Computing","score":0.02239999920129776,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/chaining","display_name":"Chaining","score":0.8410999774932861},{"id":"https://openalex.org/keywords/analogy","display_name":"Analogy","score":0.7063000202178955},{"id":"https://openalex.org/keywords/exploit","display_name":"Exploit","score":0.600600004196167},{"id":"https://openalex.org/keywords/feature","display_name":"Feature (linguistics)","score":0.54830002784729},{"id":"https://openalex.org/keywords/backward-chaining","display_name":"Backward chaining","score":0.5462999939918518},{"id":"https://openalex.org/keywords/forward-chaining","display_name":"Forward chaining","score":0.46549999713897705},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.46369999647140503},{"id":"https://openalex.org/keywords/visual-reasoning","display_name":"Visual reasoning","score":0.43479999899864197},{"id":"https://openalex.org/keywords/logic-programming","display_name":"Logic programming","score":0.3720000088214874}],"concepts":[{"id":"https://openalex.org/C49020025","wikidata":"https://www.wikidata.org/wiki/Q1059099","display_name":"Chaining","level":2,"score":0.8410999774932861},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8303999900817871},{"id":"https://openalex.org/C521332185","wikidata":"https://www.wikidata.org/wiki/Q185816","display_name":"Analogy","level":2,"score":0.7063000202178955},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.600600004196167},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.551800012588501},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.54830002784729},{"id":"https://openalex.org/C129916263","wikidata":"https://www.wikidata.org/wiki/Q1141183","display_name":"Backward chaining","level":4,"score":0.5462999939918518},{"id":"https://openalex.org/C142614401","wikidata":"https://www.wikidata.org/wiki/Q777433","display_name":"Forward chaining","level":3,"score":0.46549999713897705},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.46369999647140503},{"id":"https://openalex.org/C2777508537","wikidata":"https://www.wikidata.org/wiki/Q7936620","display_name":"Visual reasoning","level":2,"score":0.43479999899864197},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.4142000079154968},{"id":"https://openalex.org/C128838566","wikidata":"https://www.wikidata.org/wiki/Q275603","display_name":"Logic programming","level":2,"score":0.3720000088214874},{"id":"https://openalex.org/C90312973","wikidata":"https://www.wikidata.org/wiki/Q7449052","display_name":"Semantic data model","level":2,"score":0.36629998683929443},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.34369999170303345},{"id":"https://openalex.org/C2780878386","wikidata":"https://www.wikidata.org/wiki/Q1659648","display_name":"Visual language","level":2,"score":0.31349998712539673},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.31040000915527344},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.3034999966621399},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2994999885559082},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2892000079154968},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2797999978065491},{"id":"https://openalex.org/C2781238097","wikidata":"https://www.wikidata.org/wiki/Q175026","display_name":"Object (grammar)","level":2,"score":0.27639999985694885},{"id":"https://openalex.org/C2779662365","wikidata":"https://www.wikidata.org/wiki/Q5416694","display_name":"Event (particle physics)","level":2,"score":0.2676999866962433},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.2644999921321869},{"id":"https://openalex.org/C2781122975","wikidata":"https://www.wikidata.org/wiki/Q16928266","display_name":"Semantic feature","level":2,"score":0.2615000009536743},{"id":"https://openalex.org/C2775955345","wikidata":"https://www.wikidata.org/wiki/Q7449071","display_name":"Semantic mapping","level":2,"score":0.2581999897956848},{"id":"https://openalex.org/C197914299","wikidata":"https://www.wikidata.org/wiki/Q18650","display_name":"Semantic memory","level":3,"score":0.257999986410141},{"id":"https://openalex.org/C2983448237","wikidata":"https://www.wikidata.org/wiki/Q1078276","display_name":"Language understanding","level":2,"score":0.2574999928474426}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.09246","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09246","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.09246","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.09246","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.7223316431045532,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"Vision-Language":[1],"Models":[2],"(LVLMs)":[3],"undergo":[4],"safety":[5,175],"alignment":[6],"to":[7,44,63,87,128,138],"suppress":[8],"harmful":[9,46,123],"content.":[10],"However,":[11],"current":[12],"defenses":[13],"predominantly":[14],"target":[15],"explicit":[16],"malicious":[17,136],"patterns":[18],"in":[19,28,66],"the":[20,25,83,122,135,142,178],"input":[21],"representation,":[22],"often":[23],"overlooking":[24],"vulnerabilities":[26],"inherent":[27],"compositional":[29],"reasoning.":[30],"In":[31],"this":[32,53,98],"paper,":[33],"we":[34],"identify":[35],"a":[36,60,89],"systemic":[37],"flaw":[38],"where":[39],"LVLMs":[40],"can":[41],"be":[42],"induced":[43],"synthesize":[45],"logic":[47,137],"from":[48,121],"benign":[49,77,94],"premises.":[50],"We":[51,96,151],"formalize":[52],"attack":[54],"paradigm":[55,99],"as":[56,70],"\\textit{Reasoning-Oriented":[57],"Programming},":[58],"drawing":[59],"structural":[61],"analogy":[62],"Return-Oriented":[64],"Programming":[65],"systems":[67],"security.":[68],"Just":[69],"ROP":[71],"circumvents":[72,174],"memory":[73],"protections":[74],"by":[75,182],"chaining":[76],"instruction":[78],"sequences,":[79],"our":[80],"approach":[81],"exploits":[82],"model's":[84],"instruction-following":[85],"capability":[86],"orchestrate":[88],"semantic":[90],"collision":[91],"of":[92,185],"orthogonal":[93],"inputs.":[95],"instantiate":[97],"via":[100],"\\tool{},":[101],"an":[102,183],"automated":[103],"framework":[104],"that":[105,117,171],"optimizes":[106],"for":[107],"\\textit{semantic":[108],"orthogonality}":[109],"and":[110,125,156,164,190],"\\textit{spatial":[111],"isolation}.":[112],"By":[113],"generating":[114],"visual":[115],"gadgets":[116],"are":[118],"semantically":[119],"decoupled":[120],"intent":[124],"arranging":[126],"them":[127],"prevent":[129],"premature":[130],"feature":[131],"fusion,":[132],"\\tool{}":[133,153,172],"forces":[134],"emerge":[139],"only":[140],"during":[141],"late-stage":[143],"reasoning":[144],"process.":[145],"This":[146],"effectively":[147],"bypasses":[148],"perception-level":[149],"alignment.":[150],"evaluate":[152],"on":[154,187,192],"SafeBench":[155],"MM-SafetyBench":[157],"across":[158],"7":[159],"state-of-the-art":[160],"0.LVLMs,":[161],"including":[162],"GPT-4o":[163],"Claude":[165],"3.7":[166],"Sonnet.":[167],"Our":[168],"results":[169],"demonstrate":[170],"consistently":[173],"alignment,":[176],"outperforming":[177],"strongest":[179],"existing":[180],"baseline":[181],"average":[184],"4.67\\%":[186],"open-source":[188],"models":[189],"9.50\\%":[191],"commercial":[193],"models.":[194]},"counts_by_year":[],"updated_date":"2026-03-12T06:18:43.230356","created_date":"2026-03-12T00:00:00"}
