{"id":"https://openalex.org/W7162318026","doi":"https://doi.org/10.48550/arxiv.2605.23772","title":"Agentic Proving for Program Verification","display_name":"Agentic Proving for Program Verification","publication_year":2026,"publication_date":"2026-05-22","ids":{"openalex":"https://openalex.org/W7162318026","doi":"https://doi.org/10.48550/arxiv.2605.23772"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.23772","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.23772","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.23772","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5120384013","display_name":"Alessandro Sosso","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sosso, Alessandro","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134930880","display_name":"Akhil; id_orcid 0000-0002-8650-8213 Arora","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Arora, Akhil","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5043123968","display_name":"Bas Spitters","orcid":"https://orcid.org/0000-0002-2802-0973"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Spitters, Bas","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.7465999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.7465999722480774,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10142","display_name":"Formal Methods in Verification","score":0.10339999943971634,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10743","display_name":"Software Testing and Debugging Techniques","score":0.01899999938905239,"subfield":{"id":"https://openalex.org/subfields/1712","display_name":"Software"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/implementation","display_name":"Implementation","score":0.5861999988555908},{"id":"https://openalex.org/keywords/code","display_name":"Code (set theory)","score":0.5507000088691711},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.5162000060081482},{"id":"https://openalex.org/keywords/verifiable-secret-sharing","display_name":"Verifiable secret sharing","score":0.5008000135421753},{"id":"https://openalex.org/keywords/formal-verification","display_name":"Formal verification","score":0.4519999921321869},{"id":"https://openalex.org/keywords/point","display_name":"Point (geometry)","score":0.44909998774528503},{"id":"https://openalex.org/keywords/pipeline","display_name":"Pipeline (software)","score":0.4449999928474426},{"id":"https://openalex.org/keywords/program-analysis","display_name":"Program analysis","score":0.4120999872684479}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7206000089645386},{"id":"https://openalex.org/C26713055","wikidata":"https://www.wikidata.org/wiki/Q245962","display_name":"Implementation","level":2,"score":0.5861999988555908},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.5770000219345093},{"id":"https://openalex.org/C2776760102","wikidata":"https://www.wikidata.org/wiki/Q5139990","display_name":"Code (set theory)","level":3,"score":0.5507000088691711},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.5162000060081482},{"id":"https://openalex.org/C85847156","wikidata":"https://www.wikidata.org/wiki/Q59015987","display_name":"Verifiable secret sharing","level":3,"score":0.5008000135421753},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.45399999618530273},{"id":"https://openalex.org/C111498074","wikidata":"https://www.wikidata.org/wiki/Q173326","display_name":"Formal verification","level":2,"score":0.4519999921321869},{"id":"https://openalex.org/C28719098","wikidata":"https://www.wikidata.org/wiki/Q44946","display_name":"Point (geometry)","level":2,"score":0.44909998774528503},{"id":"https://openalex.org/C43521106","wikidata":"https://www.wikidata.org/wiki/Q2165493","display_name":"Pipeline (software)","level":2,"score":0.4449999928474426},{"id":"https://openalex.org/C98183937","wikidata":"https://www.wikidata.org/wiki/Q2112188","display_name":"Program analysis","level":2,"score":0.4120999872684479},{"id":"https://openalex.org/C110251889","wikidata":"https://www.wikidata.org/wiki/Q1569697","display_name":"Model checking","level":2,"score":0.3711000084877014},{"id":"https://openalex.org/C33054407","wikidata":"https://www.wikidata.org/wiki/Q6504747","display_name":"Software verification","level":5,"score":0.3587999939918518},{"id":"https://openalex.org/C164155591","wikidata":"https://www.wikidata.org/wiki/Q2067766","display_name":"Satisfiability modulo theories","level":2,"score":0.35260000824928284},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3495999872684479},{"id":"https://openalex.org/C75606506","wikidata":"https://www.wikidata.org/wiki/Q1049183","display_name":"Formal methods","level":2,"score":0.3393999934196472},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3393999934196472},{"id":"https://openalex.org/C137287247","wikidata":"https://www.wikidata.org/wiki/Q1329550","display_name":"Static program analysis","level":4,"score":0.3319000005722046},{"id":"https://openalex.org/C2779639559","wikidata":"https://www.wikidata.org/wiki/Q7661178","display_name":"Symbolic execution","level":3,"score":0.32030001282691956},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3156000077724457},{"id":"https://openalex.org/C120936955","wikidata":"https://www.wikidata.org/wiki/Q2155640","display_name":"Empirical research","level":2,"score":0.29339998960494995},{"id":"https://openalex.org/C206880738","wikidata":"https://www.wikidata.org/wiki/Q431667","display_name":"Automated theorem proving","level":2,"score":0.28780001401901245},{"id":"https://openalex.org/C166052673","wikidata":"https://www.wikidata.org/wiki/Q83021","display_name":"Empirical evidence","level":2,"score":0.2703000009059906},{"id":"https://openalex.org/C111065885","wikidata":"https://www.wikidata.org/wiki/Q1189053","display_name":"Fuzz testing","level":3,"score":0.2599000036716461},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.25699999928474426},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.2524999976158142}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.23772","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.23772","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.23772","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.23772","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Agentic":[0],"systems":[1],"have":[2],"recently":[3],"emerged":[4],"as":[5],"state-of-the-art":[6],"approaches":[7],"for":[8,40,53,78,155,164,190],"automated":[9],"theorem":[10],"proving":[11,32],"in":[12,29,126,162],"formal":[13],"mathematics.":[14],"To":[15],"assess":[16],"how":[17],"far":[18],"these":[19],"capabilities":[20,145],"extend":[21],"to":[22,152,166],"program":[23,91,140,192],"verification,":[24],"we":[25],"evaluate":[26],"Claude":[27,48,104],"Code":[28],"an":[30],"agentic":[31,148,182],"framework":[33],"on":[34,65,88,109],"CLEVER,":[35],"a":[36,84,132],"Lean":[37],"4":[38],"benchmark":[39],"verifiable":[41],"code":[42],"generation.":[43],"Our":[44],"results":[45,175],"show":[46],"that":[47,179],"generates":[49],"arguably":[50],"valid":[51],"specifications":[52,77],"98.8%":[54],"of":[55,69,80,121,138,146,169],"problems":[56],"(with":[57],"81.3%":[58],"also":[59],"accepted":[60],"by":[61],"CLEVER's":[62],"isomorphism-based":[63,167],"scoring":[64,168],"the":[66,70,89,127,136,144,153,186],"correct":[67,75],"portion":[68],"benchmark),":[71],"certifies":[72],"implementations":[73],"against":[74],"ground-truth":[76],"87.5%":[79],"problems,":[81],"and":[82,93,123,143,150,161],"reaches":[83],"98.1%":[85],"success":[86],"rate":[87],"end-to-end":[90],"generation":[92],"verification":[94,141],"pipeline":[95],"over":[96],"entries":[97],"with":[98],"self-consistent":[99],"premises.":[100],"Across":[101],"all":[102],"stages,":[103],"further":[105],"provides":[106],"high-quality":[107],"feedback":[108],"its":[110],"own":[111],"attempts":[112],"(as":[113],"confirmed":[114],"under":[115],"manual":[116],"review),":[117],"identifying":[118],"underlying":[119],"causes":[120],"failure":[122],"lingering":[124],"bugs":[125],"dataset.":[128],"These":[129],"findings":[130],"highlight":[131],"growing":[133],"mismatch":[134],"between":[135],"difficulty":[137],"existing":[139],"benchmarks":[142],"modern":[147],"provers,":[149],"point":[151],"need":[154],"more":[156],"rigorous,":[157],"bug-resilient":[158],"evaluation":[159],"methodologies,":[160],"particular":[163],"alternatives":[165],"generated":[170],"specifications.":[171],"More":[172],"broadly,":[173],"our":[174],"provide":[176],"empirical":[177],"evidence":[178],"tight":[180],"compiler-in-the-loop":[181],"paradigms":[183],"are":[184],"currently":[185],"most":[187],"effective":[188],"approach":[189],"foundational":[191],"verification.":[193]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-26T00:00:00"}
