{"id":"https://openalex.org/W7159044814","doi":"https://doi.org/10.48550/arxiv.2604.26106","title":"Evaluating Strategic Reasoning in Forecasting Agents","display_name":"Evaluating Strategic Reasoning in Forecasting Agents","publication_year":2026,"publication_date":"2026-04-28","ids":{"openalex":"https://openalex.org/W7159044814","doi":"https://doi.org/10.48550/arxiv.2604.26106"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.26106","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.26106","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.26106","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5086987119","display_name":"Tom Liptay","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liptay, Tom","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134901355","display_name":"Dan Schwarz","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Schwarz, Dan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5083728763","display_name":"Rafael Poyiadzi","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Poyiadzi, Rafael","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120355157","display_name":"Jack Wildman","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wildman, Jack","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5052203594","display_name":"Nikos I Bosse","orcid":"https://orcid.org/0000-0002-7750-5280"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bosse, Nikos I.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11918","display_name":"Forecasting Techniques and Applications","score":0.5091999769210815,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},"topics":[{"id":"https://openalex.org/T11918","display_name":"Forecasting Techniques and Applications","score":0.5091999769210815,"subfield":{"id":"https://openalex.org/subfields/1803","display_name":"Management Science and Operations Research"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T14350","display_name":"Innovation, Sustainability, Human-Machine Systems","score":0.03709999844431877,"subfield":{"id":"https://openalex.org/subfields/3312","display_name":"Sociology and Political Science"},"field":{"id":"https://openalex.org/fields/33","display_name":"Social Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11674","display_name":"Sports Analytics and Performance","score":0.030300000682473183,"subfield":{"id":"https://openalex.org/subfields/2002","display_name":"Economics and Econometrics"},"field":{"id":"https://openalex.org/fields/20","display_name":"Economics, Econometrics and Finance"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/hindsight-bias","display_name":"Hindsight bias","score":0.8278999924659729},{"id":"https://openalex.org/keywords/strategic-intelligence","display_name":"Strategic intelligence","score":0.38109999895095825},{"id":"https://openalex.org/keywords/scoring-rule","display_name":"Scoring rule","score":0.37229999899864197},{"id":"https://openalex.org/keywords/debiasing","display_name":"Debiasing","score":0.36820000410079956},{"id":"https://openalex.org/keywords/black-box","display_name":"Black box","score":0.35260000824928284},{"id":"https://openalex.org/keywords/brier-score","display_name":"Brier score","score":0.351500004529953},{"id":"https://openalex.org/keywords/strategic-planning","display_name":"Strategic planning","score":0.34380000829696655},{"id":"https://openalex.org/keywords/differential","display_name":"Differential (mechanical device)","score":0.34049999713897705}],"concepts":[{"id":"https://openalex.org/C10347200","wikidata":"https://www.wikidata.org/wiki/Q1960297","display_name":"Hindsight bias","level":2,"score":0.8278999924659729},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6244999766349792},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.49480000138282776},{"id":"https://openalex.org/C2778542649","wikidata":"https://www.wikidata.org/wiki/Q4443415","display_name":"Strategic intelligence","level":2,"score":0.38109999895095825},{"id":"https://openalex.org/C42475967","wikidata":"https://www.wikidata.org/wiki/Q194292","display_name":"Operations research","level":1,"score":0.37229999899864197},{"id":"https://openalex.org/C63002673","wikidata":"https://www.wikidata.org/wiki/Q2260590","display_name":"Scoring rule","level":2,"score":0.37229999899864197},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.36820000410079956},{"id":"https://openalex.org/C2779458634","wikidata":"https://www.wikidata.org/wiki/Q24963715","display_name":"Debiasing","level":2,"score":0.36820000410079956},{"id":"https://openalex.org/C94966114","wikidata":"https://www.wikidata.org/wiki/Q29256","display_name":"Black box","level":2,"score":0.35260000824928284},{"id":"https://openalex.org/C35405484","wikidata":"https://www.wikidata.org/wiki/Q4967066","display_name":"Brier score","level":2,"score":0.351500004529953},{"id":"https://openalex.org/C48243021","wikidata":"https://www.wikidata.org/wiki/Q932522","display_name":"Strategic planning","level":2,"score":0.34380000829696655},{"id":"https://openalex.org/C93226319","wikidata":"https://www.wikidata.org/wiki/Q193137","display_name":"Differential (mechanical device)","level":2,"score":0.34049999713897705},{"id":"https://openalex.org/C49937458","wikidata":"https://www.wikidata.org/wiki/Q2599292","display_name":"Probabilistic logic","level":2,"score":0.3346000015735626},{"id":"https://openalex.org/C63882131","wikidata":"https://www.wikidata.org/wiki/Q17122954","display_name":"Strengths and weaknesses","level":2,"score":0.326200008392334},{"id":"https://openalex.org/C162324750","wikidata":"https://www.wikidata.org/wiki/Q8134","display_name":"Economics","level":0,"score":0.3052000105381012},{"id":"https://openalex.org/C128913409","wikidata":"https://www.wikidata.org/wiki/Q3566063","display_name":"Belief revision","level":2,"score":0.3018999993801117},{"id":"https://openalex.org/C193809577","wikidata":"https://www.wikidata.org/wiki/Q3409300","display_name":"Demand forecasting","level":2,"score":0.29179999232292175},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.27630001306533813},{"id":"https://openalex.org/C149782125","wikidata":"https://www.wikidata.org/wiki/Q160039","display_name":"Econometrics","level":1,"score":0.2754000127315521},{"id":"https://openalex.org/C120954023","wikidata":"https://www.wikidata.org/wiki/Q1127277","display_name":"Consensus forecast","level":2,"score":0.271699994802475},{"id":"https://openalex.org/C539667460","wikidata":"https://www.wikidata.org/wiki/Q2414942","display_name":"Management science","level":1,"score":0.2667999863624573},{"id":"https://openalex.org/C163068380","wikidata":"https://www.wikidata.org/wiki/Q3409313","display_name":"Economic forecasting","level":2,"score":0.26409998536109924},{"id":"https://openalex.org/C2776325391","wikidata":"https://www.wikidata.org/wiki/Q6917865","display_name":"Motivated reasoning","level":3,"score":0.2590000033378601},{"id":"https://openalex.org/C58328972","wikidata":"https://www.wikidata.org/wiki/Q184609","display_name":"Expert system","level":2,"score":0.257099986076355}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.26106","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.26106","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.26106","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.26106","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Forecasting":[0],"benchmarks":[1],"produce":[2],"accuracy":[3,48],"leaderboards":[4],"but":[5],"little":[6],"insight":[7],"into":[8],"why":[9],"some":[10],"forecasters":[11,110],"are":[12,120],"more":[13,70],"accurate":[14,71],"than":[15,72],"others.":[16],"We":[17,64,88],"introduce":[18],"Bench":[19],"to":[20,80,131],"the":[21,90,112],"Future":[22],"2":[23],"(BTF-2),":[24],"1,417":[25],"pastcasting":[26],"questions":[27],"with":[28],"a":[29,66],"frozen":[30],"15M-document":[31],"research":[32,38,61],"corpus":[33],"in":[34,60,95,121],"which":[35],"agents":[36,119],"reproducibly":[37],"and":[39,54,77,103,124,137],"forecast":[40],"offline,":[41],"producing":[42],"full":[43],"reasoning":[44,84,115],"traces.":[45],"BTF-2":[46],"detects":[47],"differences":[49],"of":[50,99,105,117],"0.004":[51],"Brier":[52,69],"score,":[53],"can":[55],"distinguish":[56],"differential":[57],"agent":[58,82],"strengths":[59],"vs.":[62],"judgment.":[63],"build":[65],"forecaster":[67,92],"0.011":[68],"any":[73],"single":[74],"frontier":[75,118],"agent,":[76],"use":[78],"it":[79],"evaluate":[81],"strategic":[83,114],"without":[85],"hindsight":[86],"bias.":[87],"find":[89],"better":[91],"differs":[93],"primarily":[94],"its":[96,100],"pre-mortem":[97],"analysis":[98],"blind":[101],"spots":[102],"consideration":[104],"black":[106],"swans.":[107],"Expert":[108],"human":[109],"found":[111],"dominant":[113],"failures":[116],"assessing":[122],"political":[123],"business":[125],"leaders'":[126],"incentives,":[127],"judging":[128],"their":[129],"likelihood":[130],"follow":[132],"through":[133],"on":[134],"stated":[135],"plans,":[136],"modeling":[138],"institutional":[139],"processes.":[140]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-01T00:00:00"}
