{"id":"https://openalex.org/W4415310641","doi":"https://doi.org/10.48550/arxiv.2507.13337","title":"FormulaOne: Measuring the Depth of Algorithmic Reasoning Beyond Competitive Programming","display_name":"FormulaOne: Measuring the Depth of Algorithmic Reasoning Beyond Competitive Programming","publication_year":2025,"publication_date":"2025-07-17","ids":{"openalex":"https://openalex.org/W4415310641","doi":"https://doi.org/10.48550/arxiv.2507.13337"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2507.13337","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.13337","pdf_url":"https://arxiv.org/pdf/2507.13337","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2507.13337","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5011260370","display_name":"Gal Beniamini","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Beniamini, Gal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015931743","display_name":"Yuval Dor","orcid":"https://orcid.org/0000-0003-2456-2289"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dor, Yuval","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5087961910","display_name":"Alon Vinnikov","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Vinnikov, Alon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Peled, Shir Granot","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peled, Shir Granot","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082275399","display_name":"Or Weinstein","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Weinstein, Or","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5061121204","display_name":"Or Sharir","orcid":"https://orcid.org/0000-0003-4957-8957"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sharir, Or","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5081397200","display_name":"Noam Wies","orcid":"https://orcid.org/0000-0002-1337-2298"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wies, Noam","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115012325","display_name":"Tomer Nussbaum","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nussbaum, Tomer","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5114982663","display_name":"Ido Ben Shaul","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shaul, Ido Ben","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120047756","display_name":"Tomer Zekharya","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zekharya, Tomer","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5005177735","display_name":"Yoav Levine","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Levine, Yoav","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078263052","display_name":"Shai Shalev\u2010Shwartz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shalev-Shwartz, Shai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5075004917","display_name":"Amnon Shashua","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shashua, Amnon","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":13,"corresponding_author_ids":["https://openalex.org/A5011260370"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11010","display_name":"Logic, Reasoning, and Knowledge","score":0.9010999798774719,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11010","display_name":"Logic, Reasoning, and Knowledge","score":0.9010999798774719,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/frontier","display_name":"Frontier","score":0.6288999915122986},{"id":"https://openalex.org/keywords/focus","display_name":"Focus (optics)","score":0.5776000022888184},{"id":"https://openalex.org/keywords/intersection","display_name":"Intersection (aeronautics)","score":0.5755000114440918},{"id":"https://openalex.org/keywords/construct","display_name":"Construct (python library)","score":0.524399995803833},{"id":"https://openalex.org/keywords/set","display_name":"Set (abstract data type)","score":0.513700008392334},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4505999982357025},{"id":"https://openalex.org/keywords/ideal","display_name":"Ideal (ethics)","score":0.44929999113082886},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.42500001192092896}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6488000154495239},{"id":"https://openalex.org/C2778571376","wikidata":"https://www.wikidata.org/wiki/Q1355821","display_name":"Frontier","level":2,"score":0.6288999915122986},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.5776000022888184},{"id":"https://openalex.org/C64543145","wikidata":"https://www.wikidata.org/wiki/Q162942","display_name":"Intersection (aeronautics)","level":2,"score":0.5755000114440918},{"id":"https://openalex.org/C2780801425","wikidata":"https://www.wikidata.org/wiki/Q5164392","display_name":"Construct (python library)","level":2,"score":0.524399995803833},{"id":"https://openalex.org/C177264268","wikidata":"https://www.wikidata.org/wiki/Q1514741","display_name":"Set (abstract data type)","level":2,"score":0.513700008392334},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4505999982357025},{"id":"https://openalex.org/C2776639384","wikidata":"https://www.wikidata.org/wiki/Q840396","display_name":"Ideal (ethics)","level":2,"score":0.44929999113082886},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4471000134944916},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4462999999523163},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.42500001192092896},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.41130000352859497},{"id":"https://openalex.org/C2780586882","wikidata":"https://www.wikidata.org/wiki/Q7520643","display_name":"Simple (philosophy)","level":2,"score":0.38830000162124634},{"id":"https://openalex.org/C182620335","wikidata":"https://www.wikidata.org/wiki/Q2852531","display_name":"Answer set programming","level":3,"score":0.323199987411499},{"id":"https://openalex.org/C34165917","wikidata":"https://www.wikidata.org/wiki/Q188267","display_name":"Programming paradigm","level":2,"score":0.3125},{"id":"https://openalex.org/C2780980858","wikidata":"https://www.wikidata.org/wiki/Q110022","display_name":"Dual (grammatical number)","level":2,"score":0.304500013589859},{"id":"https://openalex.org/C41045048","wikidata":"https://www.wikidata.org/wiki/Q202843","display_name":"Linear programming","level":2,"score":0.2782000005245209},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.274399995803833},{"id":"https://openalex.org/C9652623","wikidata":"https://www.wikidata.org/wiki/Q190109","display_name":"Field (mathematics)","level":2,"score":0.27399998903274536},{"id":"https://openalex.org/C20693621","wikidata":"https://www.wikidata.org/wiki/Q6667502","display_name":"Logical framework","level":2,"score":0.26179999113082886}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2507.13337","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.13337","pdf_url":"https://arxiv.org/pdf/2507.13337","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2507.13337","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2507.13337","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2507.13337","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2507.13337","pdf_url":"https://arxiv.org/pdf/2507.13337","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Frontier":[0],"AI":[1],"models":[2,200],"demonstrate":[3],"formidable":[4],"breadth":[5],"of":[6,32,39,68,80,91,103,132,155,164,212,247],"knowledge.":[7],"But":[8],"how":[9,226],"close":[10],"are":[11,85,158],"they":[12,228],"to":[13,108,161,169],"true":[14],"human":[15],"--":[16,19,224],"or":[17],"superhuman":[18],"expertise?":[20],"Genuine":[21],"experts":[22],"can":[23],"tackle":[24],"the":[25,30,37,66,77,128,140,162,175,213,251,256],"hardest":[26],"problems":[27,84,157],"and":[28,51,72,106,120,168,220],"push":[29],"boundaries":[31],"scientific":[33],"understanding.":[34],"To":[35,236],"illuminate":[36],"limits":[38],"frontier":[40,81,163],"model":[41],"capabilities,":[42],"we":[43,240],"turn":[44],"away":[45],"from":[46,127,230,250],"contrived":[47],"competitive":[48],"programming":[49],"puzzles,":[50],"instead":[52],"focus":[53],"on":[54,137,187,206],"real-life":[55],"research":[56],"problems.":[57],"We":[58,254],"construct":[59],"FormulaOne,":[60,207],"a":[61,245,261],"benchmark":[62],"that":[63],"lies":[64],"at":[65,146],"intersection":[67],"graph":[69],"theory,":[70],"logic,":[71],"algorithms,":[73],"all":[74],"well":[75],"within":[76],"training":[78],"distribution":[79],"models.":[82],"Our":[83],"incredibly":[86],"demanding,":[87],"requiring":[88],"an":[89],"array":[90],"reasoning":[92],"steps.":[93],"The":[94],"dataset":[95],"has":[96],"three":[97],"key":[98],"properties.":[99],"First,":[100],"it":[101,124],"is":[102,125],"commercial":[104],"interest":[105],"relates":[107],"practical":[109],"large-scale":[110],"optimisation":[111],"problems,":[112],"such":[113,173],"as":[114,174],"those":[115],"arising":[116],"in":[117,233],"routing,":[118],"scheduling,":[119],"network":[121],"design.":[122],"Second,":[123],"generated":[126],"highly":[129],"expressive":[130],"framework":[131],"Monadic":[133],"Second-Order":[134],"(MSO)":[135],"logic":[136],"graphs,":[138],"paving":[139],"way":[141],"toward":[142],"automatic":[143],"problem":[144],"generation":[145],"scale;":[147],"ideal":[148],"for":[149],"building":[150],"RL":[151],"environments.":[152],"Third,":[153],"many":[154],"our":[156,188],"intimately":[159],"related":[160],"theoretical":[165,196],"computer":[166],"science,":[167],"central":[170],"conjectures":[171],"therein,":[172],"Strong":[176],"Exponential":[177],"Time":[178],"Hypothesis":[179],"(SETH).":[180],"As":[181],"such,":[182],"any":[183],"significant":[184],"algorithmic":[185],"progress":[186],"dataset,":[189],"beyond":[190],"known":[191],"results,":[192],"could":[193],"carry":[194],"profound":[195],"implications.":[197],"Remarkably,":[198],"state-of-the-art":[199],"like":[201],"OpenAI's":[202],"o3":[203],"fail":[204],"entirely":[205],"solving":[208],"less":[209],"than":[210],"1%":[211],"questions,":[214],"even":[215],"when":[216],"given":[217],"10":[218],"attempts":[219],"explanatory":[221],"fewshot":[222],"examples":[223],"highlighting":[225],"far":[227],"remain":[229],"expert-level":[231],"understanding":[232],"some":[234],"domains.":[235],"support":[237],"further":[238],"research,":[239],"additionally":[241],"curate":[242],"FormulaOne-Warmup,":[243],"offering":[244],"set":[246],"simpler":[248],"tasks,":[249],"same":[252],"distribution.":[253],"release":[255],"full":[257],"corpus":[258],"along":[259],"with":[260],"comprehensive":[262],"evaluation":[263],"framework.":[264]},"counts_by_year":[],"updated_date":"2026-05-05T08:41:31.759640","created_date":"2025-10-18T00:00:00"}
