{"id":"https://openalex.org/W4407422861","doi":"https://doi.org/10.48550/arxiv.2502.06807","title":"Competitive Programming with Large Reasoning Models","display_name":"Competitive Programming with Large Reasoning Models","publication_year":2025,"publication_date":"2025-02-03","ids":{"openalex":"https://openalex.org/W4407422861","doi":"https://doi.org/10.48550/arxiv.2502.06807"},"language":"en","primary_location":{"id":"pmh:oai:arXiv.org:2502.06807","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.06807","pdf_url":"https://arxiv.org/pdf/2502.06807","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"type":"preprint","indexed_in":["arxiv","datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://arxiv.org/pdf/2502.06807","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"OpenAI","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"OpenAI","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A9999999999","display_name":":","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":":","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5035119055","display_name":"Ahmed El-Kishky","orcid":"https://orcid.org/0000-0003-0121-7781"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"El-Kishky, Ahmed","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011565557","display_name":"Alexander Wei","orcid":"https://orcid.org/0000-0002-8587-1037"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Alexander","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5082777139","display_name":"Andr\u00e9 Saraiva","orcid":"https://orcid.org/0000-0002-7209-9180"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Saraiva, Andre","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116248258","display_name":"Borys Minaev","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Minaiev, Borys","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5058572832","display_name":"Daniel Selsam","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Selsam, Daniel","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5069446643","display_name":"David Dohan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dohan, David","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031035504","display_name":"Francis Song","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Song, Francis","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5092070318","display_name":"Hunter Lightman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lightman, Hunter","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116248256","display_name":"Ignasi Clavera","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Clavera, Ignasi","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5011053473","display_name":"Jakub Pachocki","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pachocki, Jakub","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5044086066","display_name":"Jerry Tworek","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Tworek, Jerry","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054381323","display_name":"Lorenz Kuhn","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kuhn, Lorenz","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031789995","display_name":"\u0141ukasz Kaiser","orcid":"https://orcid.org/0000-0003-1092-6010"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kaiser, Lukasz","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5030935953","display_name":"Mark Chen","orcid":"https://orcid.org/0000-0001-9369-5830"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Mark","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5015580523","display_name":"Max Schwarzer","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schwarzer, Max","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5115637740","display_name":"Mostafa Rohaninejad","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Rohaninejad, Mostafa","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5003470218","display_name":"Nat McAleese","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McAleese, Nat","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5116248257","display_name":"o contributors","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"contributors, o3","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5070241238","display_name":"Oleg M\u00fcrk","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"M\u00fcrk, Oleg","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5078476582","display_name":"Rhythm Garg","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Garg, Rhythm","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072460888","display_name":"Rui Shu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shu, Rui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5051574174","display_name":"Szymon Sidor","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sidor, Szymon","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5065338363","display_name":"Vineet Kosaraju","orcid":"https://orcid.org/0000-0001-5258-7673"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kosaraju, Vineet","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5046898877","display_name":"Wenda Zhou","orcid":"https://orcid.org/0000-0003-4371-3118"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhou, Wenda","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":26,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":true,"cited_by_count":5,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10050","display_name":"Multi-Criteria Decision Making","score":0.7797999978065491,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T10050","display_name":"Multi-Criteria Decision Making","score":0.7797999978065491,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12137","display_name":"Economic theories and models","score":0.6694999933242798,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.4923332929611206},{"id":"https://openalex.org/keywords/programming-language","display_name":"Programming language","score":0.38292673230171204}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.4923332929611206},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.38292673230171204}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:oai:arXiv.org:2502.06807","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.06807","pdf_url":"https://arxiv.org/pdf/2502.06807","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},{"id":"doi:10.48550/arxiv.2502.06807","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2502.06807","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:oai:arXiv.org:2502.06807","is_oa":true,"landing_page_url":"http://arxiv.org/abs/2502.06807","pdf_url":"https://arxiv.org/pdf/2502.06807","source":{"id":"https://openalex.org/S4393918464","display_name":"ArXiv.org","issn_l":"2331-8422","issn":["2331-8422"],"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"text"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":true,"grobid_xml":true},"content_urls":{"pdf":"https://content.openalex.org/works/W4407422861.pdf","grobid_xml":"https://content.openalex.org/works/W4407422861.grobid-xml"},"referenced_works_count":0,"referenced_works":[],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"We":[0,58],"show":[1,108],"that":[2,95,109,158],"reinforcement":[3,161],"learning":[4],"applied":[5],"to":[6],"large":[7],"language":[8],"models":[9,26,89],"(LLMs)":[10],"significantly":[11],"boosts":[12],"performance":[13],"on":[14,129,148,166],"complex":[15],"coding":[16],"and":[17,30,143],"reasoning":[18,25,177],"tasks.":[19],"Additionally,":[20],"we":[21,93],"compare":[22],"two":[23],"general-purpose":[24,121,160],"-":[27,36],"OpenAI":[28],"o1":[29],"an":[31],"early":[32],"checkpoint":[33],"of":[34],"o3":[35,96,122,134],"with":[37,64,150],"a":[38,82,136,145,170],"domain-specific":[39,101,167],"system,":[40],"o1-ioi,":[41],"which":[42],"uses":[43],"hand-engineered":[44],"inference":[45,131],"strategies":[46,102],"designed":[47],"for":[48],"competing":[49],"in":[50,55,72,176],"the":[51,73,119,140],"2024":[52,63,141],"International":[53],"Olympiad":[54],"Informatics":[56],"(IOI).":[57],"competed":[59],"live":[60],"at":[61,139],"IOI":[62,142],"o1-ioi":[65,80,115],"and,":[66],"using":[67],"hand-crafted":[68,100,130],"test-time":[69],"strategies,":[70],"placed":[71],"49th":[74],"percentile.":[75],"Under":[76],"relaxed":[77,104],"competition":[78],"constraints,":[79],"achieved":[81],"gold":[83,98,137],"medal.":[84],"However,":[85],"when":[86],"evaluating":[87],"later":[88],"such":[90,113,179],"as":[91,114,180],"o3,":[92],"find":[94],"achieves":[97,135],"without":[99,127],"or":[103],"constraints.":[105],"Our":[106],"findings":[107],"although":[110],"specialized":[111],"pipelines":[112],"yield":[116],"solid":[117],"improvements,":[118],"scaled-up,":[120],"model":[123],"surpasses":[124],"those":[125],"results":[126,156],"relying":[128,165],"heuristics.":[132],"Notably,":[133],"medal":[138],"obtains":[144],"Codeforces":[146],"rating":[147],"par":[149],"elite":[151],"human":[152],"competitors.":[153],"Overall,":[154],"these":[155],"indicate":[157],"scaling":[159],"learning,":[162],"rather":[163],"than":[164],"techniques,":[168],"offers":[169],"robust":[171],"path":[172],"toward":[173],"state-of-the-art":[174],"AI":[175],"domains,":[178],"competitive":[181],"programming.":[182]},"counts_by_year":[{"year":2025,"cited_by_count":5}],"updated_date":"2026-04-16T15:07:20.185449","created_date":"2025-10-10T00:00:00"}
