{"id":"https://openalex.org/W7147247395","doi":"https://doi.org/10.48550/arxiv.2603.28807","title":"SafeClaw-R: Towards Safe and Secure Multi-Agent Personal Assistants","display_name":"SafeClaw-R: Towards Safe and Secure Multi-Agent Personal Assistants","publication_year":2026,"publication_date":"2026-03-28","ids":{"openalex":"https://openalex.org/W7147247395","doi":"https://doi.org/10.48550/arxiv.2603.28807"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.28807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.28807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.28807","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5132597889","display_name":"Haoyu Albert Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Haoyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132723173","display_name":"Zibo Xiao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xiao, Zibo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5132696881","display_name":"Yedi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yedi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5053470148","display_name":"Christopher M. Poskitt","orcid":"https://orcid.org/0000-0002-9376-2471"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Poskitt, Christopher M.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5132593773","display_name":"Jun Sun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sun, Jun","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.320499986410141,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11689","display_name":"Adversarial Robustness in Machine Learning","score":0.320499986410141,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11241","display_name":"Advanced Malware Detection Techniques","score":0.14630000293254852,"subfield":{"id":"https://openalex.org/subfields/1711","display_name":"Signal Processing"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11424","display_name":"Security and Verification in Computing","score":0.1282999962568283,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.6223999857902527},{"id":"https://openalex.org/keywords/enforcement","display_name":"Enforcement","score":0.6183000206947327},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.4383000135421753},{"id":"https://openalex.org/keywords/compromise","display_name":"Compromise","score":0.4059000015258789},{"id":"https://openalex.org/keywords/static-analysis","display_name":"Static analysis","score":0.38909998536109924},{"id":"https://openalex.org/keywords/autonomy","display_name":"Autonomy","score":0.36579999327659607},{"id":"https://openalex.org/keywords/productivity","display_name":"Productivity","score":0.33629998564720154}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8144000172615051},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.6223999857902527},{"id":"https://openalex.org/C2779777834","wikidata":"https://www.wikidata.org/wiki/Q4202277","display_name":"Enforcement","level":2,"score":0.6183000206947327},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.4830000102519989},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.4383000135421753},{"id":"https://openalex.org/C46355384","wikidata":"https://www.wikidata.org/wiki/Q726686","display_name":"Compromise","level":2,"score":0.4059000015258789},{"id":"https://openalex.org/C97686452","wikidata":"https://www.wikidata.org/wiki/Q7604153","display_name":"Static analysis","level":2,"score":0.38909998536109924},{"id":"https://openalex.org/C65414064","wikidata":"https://www.wikidata.org/wiki/Q484105","display_name":"Autonomy","level":2,"score":0.36579999327659607},{"id":"https://openalex.org/C204983608","wikidata":"https://www.wikidata.org/wiki/Q2111958","display_name":"Productivity","level":2,"score":0.33629998564720154},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.3334999978542328},{"id":"https://openalex.org/C58581272","wikidata":"https://www.wikidata.org/wiki/Q12741163","display_name":"Workspace","level":3,"score":0.29829999804496765},{"id":"https://openalex.org/C43126263","wikidata":"https://www.wikidata.org/wiki/Q128751","display_name":"Source code","level":2,"score":0.29440000653266907},{"id":"https://openalex.org/C2779639559","wikidata":"https://www.wikidata.org/wiki/Q7661178","display_name":"Symbolic execution","level":3,"score":0.2802000045776367},{"id":"https://openalex.org/C105339364","wikidata":"https://www.wikidata.org/wiki/Q2297740","display_name":"Software deployment","level":2,"score":0.26190000772476196},{"id":"https://openalex.org/C137287247","wikidata":"https://www.wikidata.org/wiki/Q1329550","display_name":"Static program analysis","level":4,"score":0.25369998812675476}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.28807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.28807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.28807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.28807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"LLM-based":[0],"multi-agent":[1],"systems":[2],"(MASs)":[3],"are":[4,115],"transforming":[5],"personal":[6,27],"productivity":[7,134],"by":[8,111],"autonomously":[9],"executing":[10],"complex,":[11],"cross-platform":[12],"tasks.":[13],"Frameworks":[14],"such":[15],"as":[16,103],"OpenClaw":[17],"demonstrate":[18,176],"the":[19,59,108],"potential":[20],"of":[21,66,158],"locally":[22],"deployed":[23],"agents":[24],"integrated":[25],"with":[26,124],"data":[28],"and":[29,37,80,86,120,139,163],"services,":[30],"but":[31],"this":[32],"autonomy":[33],"introduces":[34],"significant":[35],"safety":[36,102],"security":[38],"risks.":[39,74],"Unintended":[40],"actions":[41,114],"from":[42],"LLM":[43],"reasoning":[44],"failures":[45],"can":[46],"cause":[47],"irreversible":[48],"harm,":[49],"while":[50],"prompt":[51],"injection":[52],"attacks":[53],"may":[54],"exfiltrate":[55],"credentials":[56],"or":[57,72],"compromise":[58],"system.":[60],"Our":[61],"analysis":[62],"shows":[63],"that":[64,100,113,177],"36.4%":[65],"OpenClaw's":[67],"built-in":[68],"skills":[69,123],"pose":[70],"high":[71],"critical":[73],"Existing":[75],"approaches,":[76],"including":[77],"static":[78],"guardrails":[79],"LLM-as-a-Judge,":[81],"lack":[82],"reliable":[83],"real-time":[84],"enforcement":[85,182],"consistent":[87],"authority":[88],"in":[89,147,168],"MAS":[90],"settings.":[91],"To":[92],"address":[93],"this,":[94],"we":[95],"propose":[96],"SafeClaw-R,":[97],"a":[98,104],"framework":[99],"enforces":[101],"system-level":[105],"invariant":[106],"over":[107],"execution":[109,141,172],"graph":[110],"ensuring":[112],"mediated":[116],"prior":[117],"to":[118],"execution,":[119],"systematically":[121],"augments":[122],"safe":[125],"counterparts.":[126],"We":[127],"evaluate":[128],"SafeClaw-R":[129,143,178],"across":[130],"three":[131],"representative":[132],"domains:":[133],"platforms,":[135],"third-party":[136,160],"skill":[137,161],"ecosystems,":[138],"code":[140,171],"environments.":[142],"achieves":[144,164],"95.2%":[145],"accuracy":[146,167],"Google":[148],"Workspace":[149],"scenarios,":[150],"significantly":[151],"outperforming":[152],"regex":[153],"baselines":[154],"(61.6%),":[155],"detects":[156],"97.8%":[157],"malicious":[159],"patterns,":[162],"100%":[165],"detection":[166],"our":[169],"adversarial":[170],"benchmark.":[173],"These":[174],"results":[175],"enables":[179],"practical":[180],"runtime":[181],"for":[183],"autonomous":[184],"MASs.":[185]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-02T00:00:00"}
