{"id":"https://openalex.org/W7133534856","doi":"https://doi.org/10.48550/arxiv.2603.02668","title":"SorryDB: Can AI Provers Complete Real-World Lean Theorems?","display_name":"SorryDB: Can AI Provers Complete Real-World Lean Theorems?","publication_year":2026,"publication_date":"2026-03-03","ids":{"openalex":"https://openalex.org/W7133534856","doi":"https://doi.org/10.48550/arxiv.2603.02668"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.02668","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02668","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.02668","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5127849194","display_name":"Austin Letson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Letson, Austin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5127819186","display_name":"Leopoldo Sarra","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sarra, Leopoldo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128072039","display_name":"Auguste Poiroux","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Poiroux, Auguste","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128128038","display_name":"Oliver Dressler","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dressler, Oliver","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128056091","display_name":"Paul Lezeau","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lezeau, Paul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128050940","display_name":"Dhyan Aranha","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aranha, Dhyan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081961287","display_name":"Fangling Pu","orcid":"https://orcid.org/0000-0002-1490-0347"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pu, Frederick","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022774766","display_name":"Aaron Hill","orcid":"https://orcid.org/0000-0002-9737-1718"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hill, Aaron","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128107149","display_name":"Miguel Corredera Hidalgo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hidalgo, Miguel Corredera","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128069072","display_name":"Julian Berman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Berman, Julian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114402843","display_name":"George Tsoukalas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tsoukalas, George","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5011292891","display_name":"Lenny Taelman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Taelman, Lenny","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":12,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.19859999418258667,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11986","display_name":"Scientific Computing and Data Management","score":0.19859999418258667,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.14329999685287476,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11704","display_name":"Mobile Crowdsensing and Crowdsourcing","score":0.06930000334978104,"subfield":{"id":"https://openalex.org/subfields/1706","display_name":"Computer Science Applications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/usable","display_name":"USable","score":0.6137999892234802},{"id":"https://openalex.org/keywords/symbolic-execution","display_name":"Symbolic execution","score":0.4747999906539917},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.43470001220703125},{"id":"https://openalex.org/keywords/metric","display_name":"Metric (unit)","score":0.3337000012397766},{"id":"https://openalex.org/keywords/merge","display_name":"Merge (version control)","score":0.32670000195503235},{"id":"https://openalex.org/keywords/liveness","display_name":"Liveness","score":0.31459999084472656},{"id":"https://openalex.org/keywords/snapshot","display_name":"Snapshot (computer storage)","score":0.3073999881744385}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6797000169754028},{"id":"https://openalex.org/C2780615836","wikidata":"https://www.wikidata.org/wiki/Q2471869","display_name":"USable","level":2,"score":0.6137999892234802},{"id":"https://openalex.org/C2779639559","wikidata":"https://www.wikidata.org/wiki/Q7661178","display_name":"Symbolic execution","level":3,"score":0.4747999906539917},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.45339998602867126},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.43470001220703125},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.4077000021934509},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.40610000491142273},{"id":"https://openalex.org/C176217482","wikidata":"https://www.wikidata.org/wiki/Q860554","display_name":"Metric (unit)","level":2,"score":0.3337000012397766},{"id":"https://openalex.org/C197129107","wikidata":"https://www.wikidata.org/wiki/Q1921621","display_name":"Merge (version control)","level":2,"score":0.32670000195503235},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.31769999861717224},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.31529998779296875},{"id":"https://openalex.org/C15569618","wikidata":"https://www.wikidata.org/wiki/Q3561421","display_name":"Liveness","level":2,"score":0.31459999084472656},{"id":"https://openalex.org/C55282118","wikidata":"https://www.wikidata.org/wiki/Q252683","display_name":"Snapshot (computer storage)","level":2,"score":0.3073999881744385},{"id":"https://openalex.org/C2776937632","wikidata":"https://www.wikidata.org/wiki/Q4117718","display_name":"Program synthesis","level":2,"score":0.2944999933242798},{"id":"https://openalex.org/C56666940","wikidata":"https://www.wikidata.org/wiki/Q788790","display_name":"Documentation","level":2,"score":0.28949999809265137},{"id":"https://openalex.org/C136643341","wikidata":"https://www.wikidata.org/wiki/Q1361526","display_name":"Reachability","level":2,"score":0.2816999852657318},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.27880001068115234},{"id":"https://openalex.org/C2776543023","wikidata":"https://www.wikidata.org/wiki/Q2147046","display_name":"Rework","level":2,"score":0.27149999141693115},{"id":"https://openalex.org/C2985583900","wikidata":"https://www.wikidata.org/wiki/Q722617","display_name":"Formal description","level":2,"score":0.2680000066757202},{"id":"https://openalex.org/C183469790","wikidata":"https://www.wikidata.org/wiki/Q333501","display_name":"Crash","level":2,"score":0.2621999979019165},{"id":"https://openalex.org/C152124472","wikidata":"https://www.wikidata.org/wiki/Q1204361","display_name":"Redundancy (engineering)","level":2,"score":0.251800000667572}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.02668","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02668","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.02668","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.02668","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"We":[0,82,108],"present":[1],"SorryDB,":[2],"a":[3,56,68,84,100,142],"dynamically-updating":[4],"benchmark":[5,31],"of":[6,25,49,60,86,103,145],"open":[7],"Lean":[8,146],"tasks":[9,105],"drawn":[10],"from":[11,106],"78":[12],"real":[13],"world":[14],"formalization":[15],"projects":[16],"on":[17,121],"GitHub.":[18],"Unlike":[19],"existing":[20],"static":[21],"benchmarks,":[22],"often":[23],"composed":[24],"competition":[26],"problems,":[27],"hillclimbing":[28],"the":[29,39,125],"SorryDB":[30,62],"will":[32],"yield":[33],"tools":[34],"that":[35,110],"are":[36,113],"aligned":[37],"to":[38,75,77],"community":[40],"needs,":[41],"more":[42,47],"usable":[43],"by":[44,54],"mathematicians,":[45],"and":[46,66,95],"capable":[48],"understanding":[50],"complex":[51],"dependencies.":[52],"Moreover,":[53],"providing":[55],"continuously":[57],"updated":[58],"stream":[59],"tasks,":[61],"mitigates":[63],"test-set":[64],"contamination":[65],"offers":[67],"robust":[69],"metric":[70],"for":[71],"an":[72,117],"agent's":[73],"ability":[74],"contribute":[76],"novel":[78],"formal":[79],"mathematics":[80],"projects.":[81],"evaluate":[83],"collection":[85],"approaches,":[87,94],"including":[88],"generalist":[89],"large":[90],"language":[91],"models,":[92,137],"agentic":[93,118],"specialized":[96,138],"symbolic":[97],"provers,":[98,139],"over":[99],"selected":[101],"snapshot":[102],"1000":[104],"SorryDB.":[107],"show":[109],"current":[111],"approaches":[112],"complementary:":[114],"even":[115,141],"though":[116],"approach":[119],"based":[120],"Gemini":[122],"Flash":[123],"is":[124,129],"most":[126],"performant,":[127],"it":[128],"not":[130],"strictly":[131],"better":[132],"than":[133],"other":[134],"off-the-shelf":[135],"large-language":[136],"or":[140],"curated":[143],"list":[144],"tactics.":[147]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-03-05T00:00:00"}
