{"id":"https://openalex.org/W7137926406","doi":"https://doi.org/10.48550/arxiv.2603.15617","title":"HorizonMath: Measuring AI Progress Toward Mathematical Discovery with Automatic Verification","display_name":"HorizonMath: Measuring AI Progress Toward Mathematical Discovery with Automatic Verification","publication_year":2026,"publication_date":"2026-03-16","ids":{"openalex":"https://openalex.org/W7137926406","doi":"https://doi.org/10.48550/arxiv.2603.15617"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.15617","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15617","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.15617","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5125292925","display_name":"Erik Y. Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Erik Y.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5125326051","display_name":"Sumeet Motwani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Motwani, Sumeet","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5119912927","display_name":"James V. Roggeveen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Roggeveen, James V.","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129685387","display_name":"Eliot Hodges","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hodges, Eliot","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5121685887","display_name":"Dulhan Jayalath","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jayalath, Dulhan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129682583","display_name":"Charles London","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"London, Charles","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5064310723","display_name":"Kalyan Ramakrishnan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ramakrishnan, Kalyan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5016219632","display_name":"Flaviu Cipcigan","orcid":"https://orcid.org/0000-0002-5015-1443"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cipcigan, Flaviu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5129721038","display_name":"Philip Torr","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Torr, Philip","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5129686690","display_name":"Alessandro Abate","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Abate, Alessandro","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":10,"corresponding_author_ids":["https://openalex.org/A5125292925"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.2879999876022339,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T13523","display_name":"Mathematics, Computing, and Information Processing","score":0.2879999876022339,"subfield":{"id":"https://openalex.org/subfields/1703","display_name":"Computational Theory and Mathematics"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.19699999690055847,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11206","display_name":"Model Reduction and Neural Networks","score":0.06939999759197235,"subfield":{"id":"https://openalex.org/subfields/3109","display_name":"Statistical and Nonlinear Physics"},"field":{"id":"https://openalex.org/fields/31","display_name":"Physics and Astronomy"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.7265999913215637},{"id":"https://openalex.org/keywords/class","display_name":"Class (philosophy)","score":0.4733999967575073},{"id":"https://openalex.org/keywords/mathematical-model","display_name":"Mathematical model","score":0.4433000087738037},{"id":"https://openalex.org/keywords/expert-system","display_name":"Expert system","score":0.32260000705718994},{"id":"https://openalex.org/keywords/computational-model","display_name":"Computational model","score":0.3151000142097473},{"id":"https://openalex.org/keywords/scientific-discovery","display_name":"Scientific discovery","score":0.30239999294281006}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.788100004196167},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.7265999913215637},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5149999856948853},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.48489999771118164},{"id":"https://openalex.org/C2777212361","wikidata":"https://www.wikidata.org/wiki/Q5127848","display_name":"Class (philosophy)","level":2,"score":0.4733999967575073},{"id":"https://openalex.org/C76969082","wikidata":"https://www.wikidata.org/wiki/Q486902","display_name":"Mathematical model","level":2,"score":0.4433000087738037},{"id":"https://openalex.org/C58328972","wikidata":"https://www.wikidata.org/wiki/Q184609","display_name":"Expert system","level":2,"score":0.32260000705718994},{"id":"https://openalex.org/C66024118","wikidata":"https://www.wikidata.org/wiki/Q1122506","display_name":"Computational model","level":2,"score":0.3151000142097473},{"id":"https://openalex.org/C2984917352","wikidata":"https://www.wikidata.org/wiki/Q12772819","display_name":"Scientific discovery","level":2,"score":0.30239999294281006},{"id":"https://openalex.org/C2779193601","wikidata":"https://www.wikidata.org/wiki/Q20026918","display_name":"Mathematical theory","level":2,"score":0.28790000081062317},{"id":"https://openalex.org/C115903868","wikidata":"https://www.wikidata.org/wiki/Q80993","display_name":"Software engineering","level":1,"score":0.2833000123500824},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.28200000524520874},{"id":"https://openalex.org/C111498074","wikidata":"https://www.wikidata.org/wiki/Q173326","display_name":"Formal verification","level":2,"score":0.2727000117301941},{"id":"https://openalex.org/C75606506","wikidata":"https://www.wikidata.org/wiki/Q1049183","display_name":"Formal methods","level":2,"score":0.2655999958515167},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.26159998774528503}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.15617","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15617","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.15617","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.15617","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"score":0.5583564639091492,"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Can":[0],"AI":[1],"make":[2],"progress":[3],"on":[4,107,137],"important,":[5],"unsolved":[6,43,168],"mathematical":[7,17,75,177],"problems?":[8],"Large":[9],"language":[10],"models":[11,98],"are":[12,87,117],"now":[13],"capable":[14],"of":[15,39,67,115],"sophisticated":[16],"and":[18,32,50,82,95,156],"scientific":[19],"reasoning,":[20],"but":[21,77],"whether":[22],"they":[23],"can":[24],"perform":[25],"novel":[26,144,173],"research":[27],"is":[28,71,79,90],"still":[29],"widely":[30],"debated":[31],"underexplored.":[33],"We":[34,149],"introduce":[35],"HorizonMath,":[36],"a":[37,65,157],"benchmark":[38,63],"over":[40],"100":[41],"predominantly":[42],"problems":[44,68,127,165],"spanning":[45],"8":[46],"domains":[47],"in":[48,166,175],"computational":[49],"applied":[51],"mathematics,":[52],"paired":[53],"with":[54],"an":[55,153],"open-source":[56],"evaluation":[57],"framework":[58],"for":[59,128],"automated":[60],"verification.":[61],"Our":[62],"targets":[64],"class":[66],"where":[69,161],"discovery":[70],"hard,":[72],"requiring":[73],"meaningful":[74],"insight,":[76],"verification":[78,110],"computationally":[80],"efficient":[81],"simple.":[83],"Because":[84],"these":[85],"solutions":[86,134,163],"unknown,":[88],"HorizonMath":[89,151],"immune":[91],"to":[92,119,164],"data":[93],"contamination,":[94],"most":[96],"state-of-the-art":[97],"score":[99],"near":[100],"0%.":[101],"Existing":[102],"research-level":[103],"benchmarks":[104],"instead":[105],"rely":[106],"formal":[108],"proof":[109],"or":[111],"manual":[112],"review,":[113],"both":[114],"which":[116,129],"expensive":[118],"scale.":[120],"Using":[121],"this":[122],"platform,":[123],"we":[124],"find":[125],"two":[126],"GPT":[130],"5.4":[131],"Pro":[132],"proposes":[133],"that":[135],"improve":[136],"the":[138,167,176],"best-known":[139],"published":[140],"results,":[141],"representing":[142],"potential":[143],"contributions":[145],"(pending":[146],"expert":[147],"review).":[148],"release":[150],"as":[152],"open":[154],"challenge":[155],"growing":[158],"community":[159],"resource,":[160],"correct":[162],"problem":[169],"classes":[170],"could":[171],"constitute":[172],"results":[174],"literature.":[178]},"counts_by_year":[],"updated_date":"2026-03-18T06:31:55.123368","created_date":"2026-03-18T00:00:00"}
