{"id":"https://openalex.org/W7154623269","doi":"https://doi.org/10.48550/arxiv.2604.14140","title":"LongCoT: Benchmarking Long-Horizon Chain-of-Thought Reasoning","display_name":"LongCoT: Benchmarking Long-Horizon Chain-of-Thought Reasoning","publication_year":2026,"publication_date":"2026-04-15","ids":{"openalex":"https://openalex.org/W7154623269","doi":"https://doi.org/10.48550/arxiv.2604.14140"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.14140","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14140","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.14140","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5092964228","display_name":"Sumeet Motwani","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Motwani, Sumeet Ramesh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133763081","display_name":"Daniel Nichols","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Nichols, Daniel","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133764655","display_name":"Charles London","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"London, Charles","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133727946","display_name":"Peggy Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Peggy","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133805140","display_name":"Fabio Pizzati","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pizzati, Fabio","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133783733","display_name":"Acer Blake","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Blake, Acer","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133794311","display_name":"Hasan Hammoud","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hammoud, Hasan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5071135007","display_name":"Tavish McDonald","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"McDonald, Tavish","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133797782","display_name":"Akshat Naik","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Naik, Akshat","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5022459043","display_name":"A. V. Ivanova","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ivanova, Alesia","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133816148","display_name":"Vignesh Baskaran","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Baskaran, Vignesh","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133773080","display_name":"Ivan Laptev","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Laptev, Ivan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5021316298","display_name":"Ruben Glatt","orcid":"https://orcid.org/0000-0002-4401-3810"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Glatt, Ruben","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5002615744","display_name":"Tal Ben\u2010Nun","orcid":"https://orcid.org/0000-0002-3657-6568"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ben-Nun, Tal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133797112","display_name":"Philip Torr","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Torr, Philip","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5046953322","display_name":"Natasha Jaques","orcid":"https://orcid.org/0000-0002-8413-9469"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jaques, Natasha","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133813323","display_name":"Ameya Prabhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Prabhu, Ameya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133816268","display_name":"Brian Bartoldson","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bartoldson, Brian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5133775787","display_name":"Bhavya Kailkhura","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kailkhura, Bhavya","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5133813721","display_name":"Christian Schroeder de Witt","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"de Witt, Christian Schroeder","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":20,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.18770000338554382,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11948","display_name":"Machine Learning in Materials Science","score":0.18770000338554382,"subfield":{"id":"https://openalex.org/subfields/2505","display_name":"Materials Chemistry"},"field":{"id":"https://openalex.org/fields/25","display_name":"Materials Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.1444000005722046,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.12470000237226486,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/benchmarking","display_name":"Benchmarking","score":0.7372999787330627},{"id":"https://openalex.org/keywords/measure","display_name":"Measure (data warehouse)","score":0.541100025177002},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.5378000140190125},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.5291000008583069},{"id":"https://openalex.org/keywords/verifiable-secret-sharing","display_name":"Verifiable secret sharing","score":0.47699999809265137},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4553000032901764},{"id":"https://openalex.org/keywords/interdependence","display_name":"Interdependence","score":0.39160001277923584},{"id":"https://openalex.org/keywords/graph","display_name":"Graph","score":0.3628000020980835}],"concepts":[{"id":"https://openalex.org/C86251818","wikidata":"https://www.wikidata.org/wiki/Q816754","display_name":"Benchmarking","level":2,"score":0.7372999787330627},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6883999705314636},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.541100025177002},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.5378000140190125},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.5291000008583069},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4821000099182129},{"id":"https://openalex.org/C85847156","wikidata":"https://www.wikidata.org/wiki/Q59015987","display_name":"Verifiable secret sharing","level":3,"score":0.47699999809265137},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4553000032901764},{"id":"https://openalex.org/C185874996","wikidata":"https://www.wikidata.org/wiki/Q269699","display_name":"Interdependence","level":2,"score":0.39160001277923584},{"id":"https://openalex.org/C132525143","wikidata":"https://www.wikidata.org/wiki/Q141488","display_name":"Graph","level":2,"score":0.3628000020980835},{"id":"https://openalex.org/C159032336","wikidata":"https://www.wikidata.org/wiki/Q2488768","display_name":"Non-monotonic logic","level":2,"score":0.35760000348091125},{"id":"https://openalex.org/C83725634","wikidata":"https://www.wikidata.org/wiki/Q7268699","display_name":"Qualitative reasoning","level":2,"score":0.3434000015258789},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.33410000801086426},{"id":"https://openalex.org/C195344581","wikidata":"https://www.wikidata.org/wiki/Q2555318","display_name":"Automated reasoning","level":2,"score":0.32850000262260437},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.31520000100135803},{"id":"https://openalex.org/C2778571376","wikidata":"https://www.wikidata.org/wiki/Q1355821","display_name":"Frontier","level":2,"score":0.2994000017642975},{"id":"https://openalex.org/C89288958","wikidata":"https://www.wikidata.org/wiki/Q7301504","display_name":"Reasoning system","level":2,"score":0.29589998722076416},{"id":"https://openalex.org/C2781181686","wikidata":"https://www.wikidata.org/wiki/Q4226068","display_name":"Coherence (philosophical gambling strategy)","level":2,"score":0.28220000863075256},{"id":"https://openalex.org/C37335422","wikidata":"https://www.wikidata.org/wiki/Q6888134","display_name":"Model-based reasoning","level":3,"score":0.27790001034736633},{"id":"https://openalex.org/C114073186","wikidata":"https://www.wikidata.org/wiki/Q2631895","display_name":"Automated planning and scheduling","level":2,"score":0.2556999921798706},{"id":"https://openalex.org/C136643341","wikidata":"https://www.wikidata.org/wiki/Q1361526","display_name":"Reachability","level":2,"score":0.2522999942302704},{"id":"https://openalex.org/C59656382","wikidata":"https://www.wikidata.org/wiki/Q191536","display_name":"Conjunction (astronomy)","level":2,"score":0.25099998712539673}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.14140","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14140","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.14140","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.14140","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"As":[0],"language":[1],"models":[2,114,148],"are":[3],"increasingly":[4],"deployed":[5],"for":[6,101],"complex":[7,32],"autonomous":[8],"tasks,":[9],"their":[10],"ability":[11,25,145],"to":[12,53,88,149],"reason":[13,150],"accurately":[14],"over":[15,152],"longer":[16],"horizons":[17],"becomes":[18],"critical.":[19],"An":[20],"essential":[21],"component":[22],"of":[23,41,63,68,82,90,92,140,146],"this":[24],"is":[26,98],"planning":[27],"and":[28,51,55],"managing":[29],"a":[30,38,69,73,80,128,137],"long,":[31],"chain-of-thought":[33],"(CoT).":[34],"We":[35],"introduce":[36],"LongCoT,":[37,126],"scalable":[39],"benchmark":[40],"2,500":[42],"expert-designed":[43],"problems":[44],"spanning":[45],"chemistry,":[46],"mathematics,":[47],"computer":[48],"science,":[49],"chess,":[50],"logic":[52],"isolate":[54],"directly":[56],"measure":[57,139],"the":[58,112,144],"long-horizon":[59,107,141],"CoT":[60],"reasoning":[61,93,108],"capabilities":[62],"frontier":[64,102,147],"models.":[65],"Problems":[66],"consist":[67],"short":[70],"input":[71],"with":[72],"verifiable":[74],"answer;":[75],"solving":[76],"them":[77],"requires":[78],"navigating":[79],"graph":[81],"interdependent":[83],"steps":[84],"that":[85],"span":[86],"tens":[87],"hundreds":[89],"thousands":[91],"tokens.":[94],"Each":[95],"local":[96],"step":[97],"individually":[99],"tractable":[100],"models,":[103],"so":[104],"failures":[105],"reflect":[106],"limitations.":[109],"At":[110],"release,":[111],"best":[113],"achieve":[115],"&lt;10%":[116],"accuracy":[117],"(GPT":[118],"5.2:":[119],"9.8%;":[120],"Gemini":[121],"3":[122],"Pro:":[123],"6.1%)":[124],"on":[125],"revealing":[127],"substantial":[129],"gap":[130],"in":[131],"current":[132],"capabilities.":[133],"Overall,":[134],"LongCoT":[135],"provides":[136],"rigorous":[138],"reasoning,":[142],"tracking":[143],"reliably":[151],"extended":[153],"periods.":[154]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-04-17T00:00:00"}
