{"id":"https://openalex.org/W4417085246","doi":"https://doi.org/10.48550/arxiv.2505.05758","title":"APOLLO: Automated LLM and Lean Collaboration for Advanced Formal Reasoning","display_name":"APOLLO: Automated LLM and Lean Collaboration for Advanced Formal Reasoning","publication_year":2025,"publication_date":"2025-05-09","ids":{"openalex":"https://openalex.org/W4417085246","doi":"https://doi.org/10.48550/arxiv.2505.05758"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2505.05758","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.05758","pdf_url":"https://arxiv.org/pdf/2505.05758","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2505.05758","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5114188122","display_name":"Azim Ospanov","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ospanov, Azim","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5017160178","display_name":"Farzan Farnia","orcid":"https://orcid.org/0000-0002-6049-9232"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Farnia, Farzan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5084130340","display_name":"Roozbeh Yousefzadeh","orcid":"https://orcid.org/0000-0003-4551-5342"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yousefzadeh, Roozbeh","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5114188122"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.5684999823570251,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10126","display_name":"Logic, programming, and type systems","score":0.5684999823570251,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.07800000160932541,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.06539999693632126,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/mathematical-proof","display_name":"Mathematical proof","score":0.8598999977111816},{"id":"https://openalex.org/keywords/proof-assistant","display_name":"Proof assistant","score":0.6018000245094299},{"id":"https://openalex.org/keywords/formal-verification","display_name":"Formal verification","score":0.5745999813079834},{"id":"https://openalex.org/keywords/automated-reasoning","display_name":"Automated reasoning","score":0.5562999844551086},{"id":"https://openalex.org/keywords/formal-methods","display_name":"Formal methods","score":0.5514000058174133},{"id":"https://openalex.org/keywords/compiler","display_name":"Compiler","score":0.5006999969482422},{"id":"https://openalex.org/keywords/automated-theorem-proving","display_name":"Automated theorem proving","score":0.49070000648498535},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.487199991941452},{"id":"https://openalex.org/keywords/syntax","display_name":"Syntax","score":0.45590001344680786}],"concepts":[{"id":"https://openalex.org/C108710211","wikidata":"https://www.wikidata.org/wiki/Q11538","display_name":"Mathematical proof","level":2,"score":0.8598999977111816},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7646999955177307},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.6396999955177307},{"id":"https://openalex.org/C203265346","wikidata":"https://www.wikidata.org/wiki/Q11387554","display_name":"Proof assistant","level":3,"score":0.6018000245094299},{"id":"https://openalex.org/C111498074","wikidata":"https://www.wikidata.org/wiki/Q173326","display_name":"Formal verification","level":2,"score":0.5745999813079834},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.5562999844551086},{"id":"https://openalex.org/C75606506","wikidata":"https://www.wikidata.org/wiki/Q1049183","display_name":"Formal methods","level":2,"score":0.5514000058174133},{"id":"https://openalex.org/C169590947","wikidata":"https://www.wikidata.org/wiki/Q47506","display_name":"Compiler","level":2,"score":0.5006999969482422},{"id":"https://openalex.org/C206880738","wikidata":"https://www.wikidata.org/wiki/Q431667","display_name":"Automated theorem proving","level":2,"score":0.49070000648498535},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.487199991941452},{"id":"https://openalex.org/C60048249","wikidata":"https://www.wikidata.org/wiki/Q37437","display_name":"Syntax","level":2,"score":0.45590001344680786},{"id":"https://openalex.org/C48145219","wikidata":"https://www.wikidata.org/wiki/Q1335365","display_name":"Security token","level":2,"score":0.43950000405311584},{"id":"https://openalex.org/C116253237","wikidata":"https://www.wikidata.org/wiki/Q1437424","display_name":"Formal specification","level":2,"score":0.430400013923645},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.40849998593330383},{"id":"https://openalex.org/C2777904410","wikidata":"https://www.wikidata.org/wiki/Q7397","display_name":"Software","level":2,"score":0.3874000012874603},{"id":"https://openalex.org/C94461902","wikidata":"https://www.wikidata.org/wiki/Q2762418","display_name":"Formal proof","level":3,"score":0.38679999113082886},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.38420000672340393},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3702000081539154},{"id":"https://openalex.org/C13766981","wikidata":"https://www.wikidata.org/wiki/Q11387554","display_name":"Automated proof checking","level":3,"score":0.3562000095844269},{"id":"https://openalex.org/C105605280","wikidata":"https://www.wikidata.org/wiki/Q7249999","display_name":"Proof complexity","level":3,"score":0.34060001373291016},{"id":"https://openalex.org/C114408938","wikidata":"https://www.wikidata.org/wiki/Q333373","display_name":"Abstract syntax","level":3,"score":0.3098999857902527},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.30309998989105225},{"id":"https://openalex.org/C110251889","wikidata":"https://www.wikidata.org/wiki/Q1569697","display_name":"Model checking","level":2,"score":0.28220000863075256},{"id":"https://openalex.org/C2318724","wikidata":"https://www.wikidata.org/wiki/Q852732","display_name":"Proof theory","level":3,"score":0.28119999170303345},{"id":"https://openalex.org/C146072743","wikidata":"https://www.wikidata.org/wiki/Q192161","display_name":"Formal language","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C140779682","wikidata":"https://www.wikidata.org/wiki/Q210868","display_name":"Sampling (signal processing)","level":3,"score":0.2775000035762787},{"id":"https://openalex.org/C33054407","wikidata":"https://www.wikidata.org/wiki/Q6504747","display_name":"Software verification","level":5,"score":0.26510000228881836},{"id":"https://openalex.org/C124978682","wikidata":"https://www.wikidata.org/wiki/Q1201019","display_name":"Proof of concept","level":2,"score":0.2565000057220459},{"id":"https://openalex.org/C198531522","wikidata":"https://www.wikidata.org/wiki/Q485146","display_name":"Sample (material)","level":2,"score":0.2515999972820282},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.2500999867916107}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2505.05758","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.05758","pdf_url":"https://arxiv.org/pdf/2505.05758","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2505.05758","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2505.05758","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2505.05758","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2505.05758","pdf_url":"https://arxiv.org/pdf/2505.05758","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Formal":[0],"reasoning":[1,115],"and":[2,96,126,168,186,272],"automated":[3,133,166,280],"theorem":[4,281],"proving":[5,19],"constitute":[6],"a":[7,34,45,56,99,123,131,143,177,191,203,242,275],"challenging":[8],"subfield":[9],"of":[10,78,108,145,195,207,214,263],"machine":[11],"learning,":[12],"in":[13,62,135,157,269],"which":[14,136],"machines":[15],"are":[16,184],"tasked":[17],"with":[18,50,112,176],"mathematical":[20],"theorems":[21],"using":[22,160],"formal":[23,28,35,48],"languages":[24],"like":[25],"Lean.":[26],"A":[27],"verification":[29,84],"system":[30],"can":[31],"check":[32],"whether":[33],"proof":[36,49],"is":[37,65],"correct":[38,47],"or":[39],"not":[40],"almost":[41],"instantaneously,":[42],"but":[43],"generating":[44],"completely":[46],"large":[51],"language":[52],"models":[53,212,246],"(LLMs)":[54],"remains":[55],"formidable":[57],"task.":[58],"The":[59,181],"usual":[60],"approach":[61],"the":[63,68,79,83,106,109,137,148,151,155,158,198,219,228],"literature":[64],"to":[66,73,117,190,233,241,252],"prompt":[67],"LLM":[69,138,171,264],"many":[70],"times":[71],"(up":[72],"several":[74],"thousands)":[75],"until":[76],"one":[77,223],"generated":[80],"proofs":[81,140,159],"passes":[82],"system.":[85],"In":[86],"this":[87],"work,":[88],"we":[89,201],"present":[90],"APOLLO":[91],"(Automated":[92],"PrOof":[93],"repair":[94,262],"viaLLM":[95],"Lean":[97,110],"cOllaboration),":[98],"modular,":[100],"model-agnostic":[101],"agentic":[102],"framework":[103],"that":[104,259],"combines":[105],"strengths":[107],"compiler":[111],"an":[113,170],"LLM's":[114],"abilities":[116],"achieve":[118],"better":[119],"proof-generation":[120],"results":[121,257],"at":[122],"low":[124,178],"token":[125],"sampling":[127,220],"budgets.":[128],"Apollo":[129,226],"directs":[130],"fully":[132],"process":[134],"generates":[139],"for":[141,231,278],"theorems,":[142],"set":[144],"agents":[146],"analyze":[147],"proofs,":[149],"fix":[150],"syntax":[152],"errors,":[153],"identify":[154],"mistakes":[156],"Lean,":[161],"isolate":[162],"failing":[163],"sub-lemmas,":[164],"utilize":[165],"solvers,":[167],"invoke":[169],"on":[172],"each":[173],"remaining":[174],"goal":[175],"top-K":[179],"budget.":[180],"repaired":[182],"sub-proofs":[183],"recombined":[185],"reverified,":[187],"iterating":[188],"up":[189],"user-controlled":[192],"maximum":[193],"number":[194],"attempts.":[196],"On":[197],"miniF2F":[199],"benchmark,":[200],"establish":[202],"new":[204],"state-of-the-art":[205,229],"accuracy":[206,230],"84.9%":[208],"among":[209],"sub":[210],"8B-parameter":[211],"(as":[213],"August":[215],"2025)":[216],"while":[217,235],"keeping":[218],"budget":[221],"below":[222],"hundred.":[224,244],"Moreover,":[225],"raises":[227],"Goedel-Prover-SFT":[232],"65.6%":[234],"cutting":[236],"sample":[237],"complexity":[238],"from":[239,250],"25,600":[240],"few":[243],"General-purpose":[245],"(o3-mini,":[247],"o4-mini)":[248],"jump":[249],"3-7%":[251],"over":[253],"40%":[254],"accuracy.":[255],"Our":[256],"demonstrate":[258],"targeted,":[260],"compiler-guided":[261],"outputs":[265],"yields":[266],"dramatic":[267],"gains":[268],"both":[270],"efficiency":[271],"correctness,":[273],"suggesting":[274],"general":[276],"paradigm":[277],"scalable":[279],"proving.":[282]},"counts_by_year":[],"updated_date":"2026-03-07T16:01:11.037858","created_date":"2025-10-10T00:00:00"}
