{"id":"https://openalex.org/W7161775162","doi":"https://doi.org/10.48550/arxiv.2605.19328","title":"RoboJailBench: Benchmarking Adversarial Attacks and Defenses in Embodied Robotic Agents","display_name":"RoboJailBench: Benchmarking Adversarial Attacks and Defenses in Embodied Robotic Agents","publication_year":2026,"publication_date":"2026-05-19","ids":{"openalex":"https://openalex.org/W7161775162","doi":"https://doi.org/10.48550/arxiv.2605.19328"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.19328","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.19328","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.19328","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136519289","display_name":"Doguhuan Yeke","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yeke, Doguhuan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136599221","display_name":"Yanming Zhou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Yanming","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121552075","display_name":"Leo Y. Lin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lin, Leo Y.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136539129","display_name":"Hongyu Cai","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cai, Hongyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121542937","display_name":"Antonio Bianchi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bianchi, Antonio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135391333","display_name":"Z. Berkay Celik","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Celik, Z. Berkay","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":6,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9549000263214111,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.9549000263214111,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10883","display_name":"Ethics and Social Impacts of AI","score":0.009200000204145908,"subfield":{"id":"https://openalex.org/subfields/3311","display_name":"Safety Research"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.007300000172108412,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/embodied-cognition","display_name":"Embodied cognition","score":0.843500018119812},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.7364000082015991},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.6492999792098999},{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.5712000131607056},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4383000135421753},{"id":"https://openalex.org/keywords/robot","display_name":"Robot","score":0.4052000045776367},{"id":"https://openalex.org/keywords/cognitive-robotics","display_name":"Cognitive robotics","score":0.3970000147819519},{"id":"https://openalex.org/keywords/security-domain","display_name":"Security domain","score":0.38909998536109924}],"concepts":[{"id":"https://openalex.org/C100609095","wikidata":"https://www.wikidata.org/wiki/Q1335050","display_name":"Embodied cognition","level":2,"score":0.843500018119812},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.7364000082015991},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.717199981212616},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.6492999792098999},{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.5712000131607056},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4830999970436096},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4383000135421753},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.4350000023841858},{"id":"https://openalex.org/C90509273","wikidata":"https://www.wikidata.org/wiki/Q11012","display_name":"Robot","level":2,"score":0.4052000045776367},{"id":"https://openalex.org/C192327766","wikidata":"https://www.wikidata.org/wiki/Q1038799","display_name":"Cognitive robotics","level":3,"score":0.3970000147819519},{"id":"https://openalex.org/C2780264999","wikidata":"https://www.wikidata.org/wiki/Q7445032","display_name":"Security domain","level":2,"score":0.38909998536109924},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.3885999917984009},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.3772999942302704},{"id":"https://openalex.org/C58642233","wikidata":"https://www.wikidata.org/wiki/Q8269924","display_name":"Taxonomy (biology)","level":2,"score":0.37380000948905945},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.3718000054359436},{"id":"https://openalex.org/C103683099","wikidata":"https://www.wikidata.org/wiki/Q5370102","display_name":"Embodied agent","level":3,"score":0.36329999566078186},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.3513000011444092},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.33820000290870667},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.2824000120162964},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.27459999918937683},{"id":"https://openalex.org/C36464697","wikidata":"https://www.wikidata.org/wiki/Q451553","display_name":"Visualization","level":2,"score":0.27390000224113464},{"id":"https://openalex.org/C2522767166","wikidata":"https://www.wikidata.org/wiki/Q2374463","display_name":"Data science","level":1,"score":0.27390000224113464}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.19328","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.19328","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.19328","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.19328","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"display_name":"Peace, Justice and strong institutions","score":0.7651071548461914,"id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Recent":[0],"advances":[1],"in":[2,36,109,238],"Vision-Language":[3],"Models":[4],"(VLMs)":[5],"facilitate":[6],"a":[7,130,187,203,254],"new":[8,194,204],"class":[9],"of":[10,124,147],"embodied":[11,48,93,110,152,225,239],"AI":[12,111,240],"systems,":[13],"where":[14],"these":[15],"models":[16,85],"are":[17],"integrated":[18],"into":[19],"physical":[20],"platforms,":[21],"e.g.":[22],"robots":[23],"and":[24,31,45,59,69,78,102,139,168,175,186,192,196,207,216,241,250,252],"autonomous":[25],"vehicles,":[26],"to":[27,72,171,219],"interpret":[28],"visual":[29],"scenes":[30],"execute":[32],"natural":[33],"language":[34],"commands":[35],"diverse":[37],"environments.":[38],"Previous":[39],"research":[40],"has":[41],"introduced":[42],"jailbreak":[43,107,236],"attacks":[44,108,195,215,237],"defenses":[46,218],"for":[47,92,106,151,190,235],"AI.":[49,153],"Their":[50],"evaluations,":[51],"however,":[52],"rely":[53],"on":[54,88,223],"ad-hoc":[55],"datasets,":[56,249],"limited":[57],"metrics,":[58],"emphasize":[60],"attack":[61],"success":[62],"while":[63],"neglecting":[64],"the":[65,70,97,230],"trade-off":[66],"between":[67],"security":[68,131,148,174],"ability":[71],"follow":[73],"benign":[74,169],"commands.":[75],"Existing":[76],"benchmarks":[77],"evaluation":[79,91,103,233],"frameworks":[80],"either":[81],"target":[82],"traditional":[83],"chat-based":[84],"or":[86],"focus":[87],"non-adversarial":[89],"safety":[90],"AI;":[94],"neither":[95],"captures":[96],"adversarial":[98,167],"risks,":[99],"inputs,":[100],"consequences,":[101],"criteria":[104],"necessary":[105],"systems.":[112],"In":[113],"this":[114,118,199],"paper,":[115],"we":[116,178,201],"address":[117],"gap":[119],"with":[120,165,183],"RoboJailBench,":[121],"which":[122],"consists":[123],"three":[125],"core":[126],"components.":[127],"We":[128,154,212,245],"establish":[129],"taxonomy":[132],"derived":[133],"from":[134],"ISO":[135],"standards,":[136],"regulatory":[137],"rules,":[138],"documented":[140],"incidents.":[141],"This":[142,227],"effort":[143],"yields":[144],"18":[145],"categories":[146],"violation":[149],"consequences":[150],"introduce":[155],"an":[156,180],"intent":[157],"contrast":[158],"dataset":[159,206],"pipeline":[160],"that":[161],"augments":[162],"existing":[163,210],"datasets":[164],"paired":[166],"goals":[170],"measure":[172],"both":[173],"utility.":[176],"Lastly,":[177],"provide":[179],"evolving":[181],"repository":[182],"standardized":[184,232],"metrics":[185],"unified":[188],"process":[189],"assessing":[191],"integrating":[193],"defenses.":[197],"With":[198],"benchmark,":[200],"construct":[202],"taxonomy-balanced":[205],"augment":[208],"five":[209],"datasets.":[211],"integrate":[213],"four":[214],"two":[217],"evaluate":[220],"their":[221],"performance":[222],"leading":[224],"VLMs.":[226],"benchmark":[228],"provides":[229],"first":[231],"framework":[234],"supports":[242],"future":[243],"research.":[244],"release":[246],"our":[247],"code,":[248],"artifacts,":[251],"maintain":[253],"leaderboard":[255],"at":[256],"https://purseclab.github.io/benchmark-for-robotics-security.":[257]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-21T00:00:00"}
