{"id":"https://openalex.org/W7147436548","doi":"https://doi.org/10.48550/arxiv.2603.29665","title":"Near-Miss: Latent Policy Failure Detection in Agentic Workflows","display_name":"Near-Miss: Latent Policy Failure Detection in Agentic Workflows","publication_year":2026,"publication_date":"2026-03-31","ids":{"openalex":"https://openalex.org/W7147436548","doi":"https://doi.org/10.48550/arxiv.2603.29665"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.29665","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.29665","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.29665","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5113719560","display_name":"Ella Rabinovich","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rabinovich, Ella","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5090206761","display_name":"David Boaz","orcid":"https://orcid.org/0009-0003-5515-0479"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Boaz, David","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5043433328","display_name":"Naama Zwerdling","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zwerdling, Naama","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5078882226","display_name":"Ateret Anaby-Tavor","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Anaby-Tavor, Ateret","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10703","display_name":"Business Process Modeling and Analysis","score":0.6014000177383423,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10703","display_name":"Business Process Modeling and Analysis","score":0.6014000177383423,"subfield":{"id":"https://openalex.org/subfields/1404","display_name":"Management Information Systems"},"field":{"id":"https://openalex.org/fields/14","display_name":"Business, Management and Accounting"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.07500000298023224,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13287","display_name":"Robotic Process Automation Applications","score":0.0681999996304512,"subfield":{"id":"https://openalex.org/subfields/2209","display_name":"Industrial and Manufacturing Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/guard","display_name":"Guard (computer science)","score":0.657800018787384},{"id":"https://openalex.org/keywords/workflow","display_name":"Workflow","score":0.5981000065803528},{"id":"https://openalex.org/keywords/outcome","display_name":"Outcome (game theory)","score":0.5221999883651733},{"id":"https://openalex.org/keywords/executable","display_name":"Executable","score":0.49799999594688416},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.489300012588501},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.4880000054836273},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.44179999828338623}],"concepts":[{"id":"https://openalex.org/C141141315","wikidata":"https://www.wikidata.org/wiki/Q2379942","display_name":"Guard (computer science)","level":2,"score":0.657800018787384},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6164000034332275},{"id":"https://openalex.org/C177212765","wikidata":"https://www.wikidata.org/wiki/Q627335","display_name":"Workflow","level":2,"score":0.5981000065803528},{"id":"https://openalex.org/C112930515","wikidata":"https://www.wikidata.org/wiki/Q4389547","display_name":"Risk analysis (engineering)","level":1,"score":0.5486999750137329},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.5221999883651733},{"id":"https://openalex.org/C160145156","wikidata":"https://www.wikidata.org/wiki/Q778586","display_name":"Executable","level":2,"score":0.49799999594688416},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.489300012588501},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.4880000054836273},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.44179999828338623},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.39640000462532043},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.3499999940395355},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.33550000190734863},{"id":"https://openalex.org/C33499554","wikidata":"https://www.wikidata.org/wiki/Q1417134","display_name":"Dashboard","level":2,"score":0.3285999894142151},{"id":"https://openalex.org/C85345410","wikidata":"https://www.wikidata.org/wiki/Q851587","display_name":"Business process","level":3,"score":0.3239000141620636},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.29809999465942383},{"id":"https://openalex.org/C115901376","wikidata":"https://www.wikidata.org/wiki/Q184199","display_name":"Automation","level":2,"score":0.2944999933242798},{"id":"https://openalex.org/C2778994249","wikidata":"https://www.wikidata.org/wiki/Q2842324","display_name":"TRAC","level":2,"score":0.2797999978065491},{"id":"https://openalex.org/C38652104","wikidata":"https://www.wikidata.org/wiki/Q3510521","display_name":"Computer security","level":1,"score":0.27070000767707825},{"id":"https://openalex.org/C174348530","wikidata":"https://www.wikidata.org/wiki/Q188635","display_name":"Bridging (networking)","level":2,"score":0.26100000739097595},{"id":"https://openalex.org/C57501372","wikidata":"https://www.wikidata.org/wiki/Q2021268","display_name":"BitTorrent tracker","level":3,"score":0.2517000138759613}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.29665","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.29665","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.29665","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.29665","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.8283447027206421,"display_name":"Peace, Justice and strong institutions","id":"https://metadata.un.org/sdg/16"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Agentic":[0],"systems":[1],"for":[2,90,184],"business":[3],"process":[4,196],"automation":[5],"often":[6],"require":[7],"compliance":[8],"with":[9],"policies":[10,107],"governing":[11],"conditional":[12],"updates":[13],"to":[14,69,74,117,198],"the":[15,31,101,131,162,166,182,194],"system":[16,33],"state.":[17,169],"Evaluation":[18],"of":[19,54,154],"policy":[20,45,61,93],"adherence":[21],"in":[22,56,95,152,176],"LLM-based":[23],"agentic":[24],"workflows":[25],"is":[26],"typically":[27],"performed":[28],"by":[29],"comparing":[30],"final":[32,163,190],"state":[34],"against":[35],"a":[36,50,65,87,173],"predefined":[37],"ground":[38],"truth.":[39],"While":[40],"this":[41,83],"approach":[42,129],"detects":[43],"explicit":[44],"violations,":[46],"it":[47],"may":[48],"overlook":[49],"more":[51],"subtle":[52],"class":[53],"issues":[55],"which":[57,104],"agents":[58],"bypass":[59],"required":[60],"checks,":[62],"yet":[63],"reach":[64],"correct":[66],"outcome":[67,164],"due":[68],"favorable":[70],"circumstances.":[71],"We":[72,126],"refer":[73],"such":[75],"cases":[76],"as":[77,143],"near-misses":[78],"or":[79],"latent":[80,92,149],"failures.":[81],"In":[82],"work,":[84],"we":[85],"introduce":[86],"novel":[88],"metric":[89],"detecting":[91],"failures":[94,150],"agent":[96,115],"conversations":[97],"traces.":[98],"Building":[99],"on":[100,130],"ToolGuard":[102],"framework,":[103],"converts":[105],"natural-language":[106],"into":[108],"executable":[109],"guard":[110],"code,":[111],"our":[112,128],"method":[113],"analyzes":[114],"trajectories":[116,155],"determine":[118],"whether":[119],"agent's":[120],"tool-calling":[121],"decisions":[122],"where":[123],"sufficiently":[124],"informed.":[125],"evaluate":[127],"$\u03c4^2$-verified":[132],"Airlines":[133],"benchmark":[134],"across":[135],"several":[136],"contemporary":[137],"open":[138],"and":[139,180],"proprietary":[140],"LLMs":[141],"acting":[142],"agents.":[144],"Our":[145],"results":[146],"show":[147],"that":[148,186],"occur":[151],"8-17%":[153],"involving":[156],"mutating":[157],"tool":[158],"calls,":[159],"even":[160],"when":[161],"matches":[165],"expected":[167],"ground-truth":[168],"These":[170],"findings":[171],"reveal":[172],"blind":[174],"spot":[175],"current":[177],"evaluation":[178],"methodologies":[179],"highlight":[181],"need":[183],"metrics":[185],"assess":[187],"not":[188],"only":[189],"outcomes":[191],"but":[192],"also":[193],"decision":[195],"leading":[197],"them.":[199]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-02T00:00:00"}
