{"id":"https://openalex.org/W7158614130","doi":"https://doi.org/10.48550/arxiv.2604.26733","title":"FutureWorld: A Live Reinforcement Learning Environment for Predictive Agents with Real-World Outcome Rewards","display_name":"FutureWorld: A Live Reinforcement Learning Environment for Predictive Agents with Real-World Outcome Rewards","publication_year":2026,"publication_date":"2026-04-29","ids":{"openalex":"https://openalex.org/W7158614130","doi":"https://doi.org/10.48550/arxiv.2604.26733"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2604.26733","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.26733","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2604.26733","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5134893847","display_name":"Zhixin Han","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Han, Zhixin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134893280","display_name":"Yanzhi Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yanzhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5072238873","display_name":"Chuyang Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Chuyang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134005664","display_name":"Maohang Gao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Gao, Maohang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134897788","display_name":"Xiawei Yue","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yue, Xiawei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5101672513","display_name":"Kefei Chen","orcid":"https://orcid.org/0000-0003-1961-5614"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Kefei","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134089074","display_name":"Yu Zhuang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhuang, Yu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134896060","display_name":"Haoxiang Guan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guan, Haoxiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134878693","display_name":"Jiyan He","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"He, Jiyan","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134910771","display_name":"Jian Li","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Li, Jian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067992353","display_name":"Yitong Duan","orcid":"https://orcid.org/0000-0002-1150-3995"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Duan, Yitong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134884441","display_name":"Yu Shi","orcid":"https://orcid.org/0000-0002-3821-2151"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shi, Yu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5134922470","display_name":"Mengting Hu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hu, Mengting","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5134887476","display_name":"Shuxin Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zheng, Shuxin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":14,"corresponding_author_ids":["https://openalex.org/A5134893847"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.18719999492168427,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.18719999492168427,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.17949999868869781,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12026","display_name":"Explainable Artificial Intelligence (XAI)","score":0.16339999437332153,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/leverage","display_name":"Leverage (statistics)","score":0.679099977016449},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6474000215530396},{"id":"https://openalex.org/keywords/outcome","display_name":"Outcome (game theory)","score":0.6215999722480774},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6007999777793884},{"id":"https://openalex.org/keywords/training","display_name":"Training (meteorology)","score":0.4350000023841858},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.4244999885559082}],"concepts":[{"id":"https://openalex.org/C153083717","wikidata":"https://www.wikidata.org/wiki/Q6535263","display_name":"Leverage (statistics)","level":2,"score":0.679099977016449},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6474000215530396},{"id":"https://openalex.org/C148220186","wikidata":"https://www.wikidata.org/wiki/Q7111912","display_name":"Outcome (game theory)","level":2,"score":0.6215999722480774},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6007999777793884},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5837000012397766},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.47450000047683716},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.46540001034736633},{"id":"https://openalex.org/C2777211547","wikidata":"https://www.wikidata.org/wiki/Q17141490","display_name":"Training (meteorology)","level":2,"score":0.4350000023841858},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.4244999885559082},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.3052000105381012},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.29679998755455017},{"id":"https://openalex.org/C51632099","wikidata":"https://www.wikidata.org/wiki/Q3985153","display_name":"Training set","level":2,"score":0.2906000018119812},{"id":"https://openalex.org/C4554734","wikidata":"https://www.wikidata.org/wiki/Q593744","display_name":"Knowledge base","level":2,"score":0.288100004196167},{"id":"https://openalex.org/C22367795","wikidata":"https://www.wikidata.org/wiki/Q7625208","display_name":"Structured prediction","level":2,"score":0.2563000023365021},{"id":"https://openalex.org/C77967617","wikidata":"https://www.wikidata.org/wiki/Q4677561","display_name":"Active learning (machine learning)","level":2,"score":0.25279998779296875}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2604.26733","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.26733","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2604.26733","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2604.26733","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Live":[0],"future":[1,65],"prediction":[2,49,147],"refers":[3],"to":[4,143],"the":[5,39,62,78,128],"task":[6,17],"of":[7,48,64],"making":[8],"predictions":[9],"about":[10],"real-world":[11,54,121,156],"events":[12],"before":[13],"they":[14],"unfold.":[15],"This":[16],"is":[18,29],"increasingly":[19],"studied":[20],"using":[21],"large":[22,46],"language":[23],"model-based":[24],"agent":[25],"systems,":[26],"and":[27,85,91,125,151],"it":[28],"important":[30],"for":[31,131],"building":[32],"agents":[33],"that":[34,76,99,109,154],"can":[35,43,159],"continually":[36],"learn":[37],"from":[38],"real":[40],"world.":[41],"It":[42],"provide":[44],"a":[45,70,96],"number":[47],"questions":[50],"grounded":[51],"in":[52,95,146],"diverse":[53],"events,":[55],"while":[56],"preventing":[57],"answer":[58],"leakage.":[59],"To":[60],"leverage":[61],"advantages":[63],"prediction,":[66,82],"we":[67,89,100],"present":[68],"FutureWorld,":[69],"live":[71],"agentic":[72],"reinforcement":[73,105,164],"learning":[74,106,165],"environment":[75],"closes":[77],"training":[79,107,140],"loop":[80],"between":[81],"outcome":[83,157],"realization,":[84],"parameter":[86],"updates.":[87],"Specifically,":[88],"modify":[90],"extend":[92],"verl-tool,":[93],"resulting":[94],"new":[97],"framework":[98],"call":[101],"verl-tool-future.":[102],"Unlike":[103],"standard":[104],"frameworks":[108],"rely":[110],"on":[111],"immediate":[112],"rewards,":[113],"verl-tool-future":[114],"stores":[115],"prediction-time":[116],"rollouts,":[117],"backfills":[118],"rewards":[119],"after":[120],"outcomes":[122],"become":[123],"available,":[124],"then":[126],"replays":[127],"completed":[129],"trajectories":[130],"policy":[132],"update.":[133],"Across":[134],"three":[135],"open-source":[136],"agents,":[137],"successive":[138],"FutureWorld":[139],"rounds":[141],"lead":[142],"consistent":[144],"improvements":[145],"accuracy,":[148],"probabilistic":[149],"scoring,":[150],"calibration,":[152],"demonstrating":[153],"delayed":[155],"feedback":[158],"serve":[160],"as":[161],"an":[162],"effective":[163],"signal.":[166]},"counts_by_year":[],"updated_date":"2026-05-12T06:07:45.972803","created_date":"2026-05-01T00:00:00"}
