{"id":"https://openalex.org/W7128683060","doi":"https://doi.org/10.48550/arxiv.2602.10538","title":"Why Agentic Theorem Prover Works: A Statistical Provability Theory of Mathematical Reasoning Models","display_name":"Why Agentic Theorem Prover Works: A Statistical Provability Theory of Mathematical Reasoning Models","publication_year":2026,"publication_date":"2026-02-11","ids":{"openalex":"https://openalex.org/W7128683060","doi":"https://doi.org/10.48550/arxiv.2602.10538"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.10538","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125693883","display_name":"Sho Sonoda","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Sonoda, Sho","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5068264832","display_name":"Shunta Akiyama","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Akiyama, Shunta","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5125693171","display_name":"Yuya Uezato","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Uezato, Yuya","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5125693883"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11010","display_name":"Logic, Reasoning, and Knowledge","score":0.32820001244544983,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11010","display_name":"Logic, Reasoning, and Knowledge","score":0.32820001244544983,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11596","display_name":"Constraint Satisfaction and Optimization","score":0.1339000016450882,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12002","display_name":"Computability, Logic, AI Algorithms","score":0.07909999787807465,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/representation","display_name":"Representation (politics)","score":0.567300021648407},{"id":"https://openalex.org/keywords/margin","display_name":"Margin (machine learning)","score":0.5644999742507935},{"id":"https://openalex.org/keywords/automated-theorem-proving","display_name":"Automated theorem proving","score":0.4390000104904175},{"id":"https://openalex.org/keywords/calculus","display_name":"Calculus (dental)","score":0.4156999886035919},{"id":"https://openalex.org/keywords/mathematical-proof","display_name":"Mathematical proof","score":0.4065999984741211},{"id":"https://openalex.org/keywords/adversarial-system","display_name":"Adversarial system","score":0.40459999442100525},{"id":"https://openalex.org/keywords/gas-meter-prover","display_name":"Gas meter prover","score":0.39959999918937683}],"concepts":[{"id":"https://openalex.org/C2776359362","wikidata":"https://www.wikidata.org/wiki/Q2145286","display_name":"Representation (politics)","level":3,"score":0.567300021648407},{"id":"https://openalex.org/C774472","wikidata":"https://www.wikidata.org/wiki/Q6760393","display_name":"Margin (machine learning)","level":2,"score":0.5644999742507935},{"id":"https://openalex.org/C33923547","wikidata":"https://www.wikidata.org/wiki/Q395","display_name":"Mathematics","level":0,"score":0.5307000279426575},{"id":"https://openalex.org/C144237770","wikidata":"https://www.wikidata.org/wiki/Q747534","display_name":"Mathematical economics","level":1,"score":0.43959999084472656},{"id":"https://openalex.org/C206880738","wikidata":"https://www.wikidata.org/wiki/Q431667","display_name":"Automated theorem proving","level":2,"score":0.4390000104904175},{"id":"https://openalex.org/C2777686260","wikidata":"https://www.wikidata.org/wiki/Q144037","display_name":"Calculus (dental)","level":2,"score":0.4156999886035919},{"id":"https://openalex.org/C108710211","wikidata":"https://www.wikidata.org/wiki/Q11538","display_name":"Mathematical proof","level":2,"score":0.4065999984741211},{"id":"https://openalex.org/C37736160","wikidata":"https://www.wikidata.org/wiki/Q1801315","display_name":"Adversarial system","level":2,"score":0.40459999442100525},{"id":"https://openalex.org/C159718280","wikidata":"https://www.wikidata.org/wiki/Q5526353","display_name":"Gas meter prover","level":3,"score":0.39959999918937683},{"id":"https://openalex.org/C136119220","wikidata":"https://www.wikidata.org/wiki/Q1000660","display_name":"Algebra over a field","level":2,"score":0.3873000144958496},{"id":"https://openalex.org/C2776230367","wikidata":"https://www.wikidata.org/wiki/Q7314222","display_name":"Representation theorem","level":2,"score":0.37059998512268066},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.35690000653266907},{"id":"https://openalex.org/C118615104","wikidata":"https://www.wikidata.org/wiki/Q121416","display_name":"Discrete mathematics","level":1,"score":0.35260000824928284},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.3521000146865845},{"id":"https://openalex.org/C122203268","wikidata":"https://www.wikidata.org/wiki/Q5862903","display_name":"Probability theory","level":2,"score":0.3458000123500824},{"id":"https://openalex.org/C94461902","wikidata":"https://www.wikidata.org/wiki/Q2762418","display_name":"Formal proof","level":3,"score":0.32420000433921814},{"id":"https://openalex.org/C2776502983","wikidata":"https://www.wikidata.org/wiki/Q690182","display_name":"Contrast (vision)","level":2,"score":0.31119999289512634},{"id":"https://openalex.org/C2318724","wikidata":"https://www.wikidata.org/wiki/Q852732","display_name":"Proof theory","level":3,"score":0.3003999888896942},{"id":"https://openalex.org/C11413529","wikidata":"https://www.wikidata.org/wiki/Q8366","display_name":"Algorithm","level":1,"score":0.27390000224113464},{"id":"https://openalex.org/C18762648","wikidata":"https://www.wikidata.org/wiki/Q42213","display_name":"Work (physics)","level":2,"score":0.2651999890804291}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.10538","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.10538","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.10538","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.10538","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Agentic":[0],"theorem":[1,139],"provers":[2,140],"--":[3,21],"pipelines":[4,78],"that":[5],"couple":[6],"a":[7,17,51,66,130],"mathematical":[8],"reasoning":[9],"model":[10],"with":[11],"library":[12],"retrieval,":[13],"subgoal-decomposition/search":[14],"planner,":[15],"and":[16,36,54,74,100,122,136],"proof":[18,47],"assistant":[19],"verifier":[20],"have":[22],"recently":[23],"achieved":[24],"striking":[25],"empirical":[26],"success,":[27],"yet":[28],"it":[29],"remains":[30],"unclear":[31],"which":[32],"components":[33],"drive":[34],"performance":[35,103],"why":[37,137],"such":[38],"systems":[39],"work":[40],"at":[41],"all":[42],"despite":[43],"classical":[44],"hardness":[45],"of":[46,64,88,105,111,134],"search.":[48],"We":[49],"propose":[50],"distributional":[52],"viewpoint":[53],"introduce":[55],"\\textbf{statistical":[56],"provability},":[57],"defined":[58],"as":[59,79],"the":[60,102],"finite-horizon":[61],"success":[62],"probability":[63],"reaching":[65],"verified":[67],"proof,":[68],"averaged":[69],"over":[70],"an":[71],"instance":[72],"distribution,":[73],"formalize":[75],"modern":[76],"theorem-proving":[77],"time-bounded":[80],"MDPs.":[81],"Exploiting":[82],"Bellman":[83],"structure,":[84],"we":[85],"prove":[86],"existence":[87],"optimal":[89],"policies":[90],"under":[91],"mild":[92],"regularity,":[93],"derive":[94],"provability":[95],"certificates":[96],"via":[97],"sub-/super-solution":[98],"inequalities,":[99],"bound":[101],"gap":[104],"score-guided":[106],"planning":[107],"(greedy/top-\\(k\\)/beam/rollouts)":[108],"in":[109,150],"terms":[110],"approximation":[112],"error,":[113],"sequential":[114],"statistical":[115],"complexity,":[116],"representation":[117],"geometry":[118],"(metric":[119],"entropy/doubling":[120],"structure),":[121],"action-gap":[123],"margin":[124],"tails.":[125],"Together,":[126],"our":[127],"theory":[128],"provides":[129],"principled,":[131],"component-sensitive":[132],"explanation":[133],"when":[135],"agentic":[138],"succeed":[141],"on":[142],"biased":[143],"real-world":[144],"problem":[145],"distributions,":[146],"while":[147],"clarifying":[148],"limitations":[149],"worst-case":[151],"or":[152],"adversarial":[153],"regimes.":[154]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-13T00:00:00"}
