{"id":"https://openalex.org/W7162401240","doi":"https://doi.org/10.48550/arxiv.2605.23972","title":"Why We Need World Models for AGI: Where LLMs Fail and How World Models May Outperform","display_name":"Why We Need World Models for AGI: Where LLMs Fail and How World Models May Outperform","publication_year":2026,"publication_date":"2026-05-13","ids":{"openalex":"https://openalex.org/W7162401240","doi":"https://doi.org/10.48550/arxiv.2605.23972"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.23972","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.23972","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.23972","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5130369663","display_name":"Feisal Alaswad","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alaswad, Feisal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5130399612","display_name":"Batoul Aljaddouh","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Aljaddouh, Batoul","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5054787684","display_name":"Maher Alrahhal","orcid":"https://orcid.org/0000-0001-9688-3431"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Alrahhal, Maher","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5034914166","display_name":"E. Poovammal","orcid":"https://orcid.org/0000-0002-4996-1377"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"E, Poovammal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5009450763","display_name":"Talal Bonny","orcid":"https://orcid.org/0000-0003-1111-0304"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bonny, Talal","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.3944999873638153,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.3944999873638153,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.15539999306201935,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12031","display_name":"Speech and dialogue systems","score":0.0414000004529953,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6381000280380249},{"id":"https://openalex.org/keywords/transition","display_name":"Transition (genetics)","score":0.5802000164985657},{"id":"https://openalex.org/keywords/sequence","display_name":"Sequence (biology)","score":0.5289999842643738},{"id":"https://openalex.org/keywords/state","display_name":"State (computer science)","score":0.49880000948905945},{"id":"https://openalex.org/keywords/aggregate","display_name":"Aggregate (composite)","score":0.4934000074863434},{"id":"https://openalex.org/keywords/perspective","display_name":"Perspective (graphical)","score":0.4805000126361847},{"id":"https://openalex.org/keywords/causal-reasoning","display_name":"Causal reasoning","score":0.4090999960899353},{"id":"https://openalex.org/keywords/language-model","display_name":"Language model","score":0.3898000121116638}],"concepts":[{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6381000280380249},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.5943999886512756},{"id":"https://openalex.org/C194232998","wikidata":"https://www.wikidata.org/wiki/Q1606712","display_name":"Transition (genetics)","level":3,"score":0.5802000164985657},{"id":"https://openalex.org/C2778112365","wikidata":"https://www.wikidata.org/wiki/Q3511065","display_name":"Sequence (biology)","level":2,"score":0.5289999842643738},{"id":"https://openalex.org/C48103436","wikidata":"https://www.wikidata.org/wiki/Q599031","display_name":"State (computer science)","level":2,"score":0.49880000948905945},{"id":"https://openalex.org/C4679612","wikidata":"https://www.wikidata.org/wiki/Q866298","display_name":"Aggregate (composite)","level":2,"score":0.4934000074863434},{"id":"https://openalex.org/C12713177","wikidata":"https://www.wikidata.org/wiki/Q1900281","display_name":"Perspective (graphical)","level":2,"score":0.4805000126361847},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.42559999227523804},{"id":"https://openalex.org/C115086926","wikidata":"https://www.wikidata.org/wiki/Q17004651","display_name":"Causal reasoning","level":3,"score":0.4090999960899353},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.3898000121116638},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.35670000314712524},{"id":"https://openalex.org/C158600405","wikidata":"https://www.wikidata.org/wiki/Q5054566","display_name":"Causal inference","level":2,"score":0.3377000093460083},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.3337000012397766},{"id":"https://openalex.org/C72434380","wikidata":"https://www.wikidata.org/wiki/Q230930","display_name":"State space","level":2,"score":0.32089999318122864},{"id":"https://openalex.org/C2778572836","wikidata":"https://www.wikidata.org/wiki/Q380933","display_name":"Space (punctuation)","level":2,"score":0.31520000100135803},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.31349998712539673},{"id":"https://openalex.org/C2775936607","wikidata":"https://www.wikidata.org/wiki/Q466845","display_name":"Tracking (education)","level":2,"score":0.3093000054359436},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3086000084877014},{"id":"https://openalex.org/C83725634","wikidata":"https://www.wikidata.org/wiki/Q7268699","display_name":"Qualitative reasoning","level":2,"score":0.2980000078678131},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.296099990606308},{"id":"https://openalex.org/C195324797","wikidata":"https://www.wikidata.org/wiki/Q33742","display_name":"Natural language","level":2,"score":0.28600001335144043},{"id":"https://openalex.org/C51167844","wikidata":"https://www.wikidata.org/wiki/Q4422623","display_name":"Latent variable","level":2,"score":0.2775000035762787},{"id":"https://openalex.org/C145912823","wikidata":"https://www.wikidata.org/wiki/Q113558","display_name":"Dynamics (music)","level":2,"score":0.2750000059604645},{"id":"https://openalex.org/C23224414","wikidata":"https://www.wikidata.org/wiki/Q176769","display_name":"Hidden Markov model","level":2,"score":0.26600000262260437}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.23972","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.23972","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.23972","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.23972","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[{"display_name":"Sustainable cities and communities","score":0.43487346172332764,"id":"https://metadata.un.org/sdg/11"}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1,7,61],"models":[2],"achieve":[3],"strong":[4,218],"performance":[5],"in":[6,15,111,164],"generation":[8],"and":[9,23,40,62,134,196,236],"knowledge-intensive":[10],"tasks,":[11],"yet":[12],"remain":[13],"limited":[14],"settings":[16],"requiring":[17],"causal":[18],"reasoning,":[19],"persistent":[20,188,233],"state":[21,143,157,189,234],"tracking,":[22,190],"long-horizon":[24,165,227],"planning.":[25],"We":[26],"argue":[27],"that":[28,59,105,217],"these":[29,214],"limitations":[30],"may":[31,222],"arise":[32],"from":[33,117],"an":[34,100,168],"objective-level":[35],"mismatch":[36],"between":[37,126],"sequence":[38,219],"prediction":[39,220],"reasoning":[41,82,198,229],"over":[42,131],"latent":[43,107,142,156],"environment":[44,83,206],"dynamics.":[45,71],"To":[46,72],"formalize":[47],"this":[48,75,146],"distinction,":[49],"we":[50,77],"introduce":[51,78],"Latent":[52],"Dynamics":[53],"Inference":[54],"(LDI),":[55],"a":[56,80,90,123],"conceptual":[57],"perspective":[58],"interprets":[60],"multimodal":[63],"observations":[64,133],"as":[65],"partial":[66],"evidence":[67],"of":[68,172,203],"underlying":[69],"transition":[70,108,237],"empirically":[73],"investigate":[74],"perspective,":[76],"Flux,":[79],"sequential":[81],"specified":[84],"entirely":[85],"through":[86],"natural-language":[87],"rules.":[88],"As":[89],"proof-of-concept":[91],"case":[92,147],"study,":[93,148],"the":[94,127,140,155,204,211],"rules":[95],"are":[96],"first":[97],"compiled":[98],"into":[99],"explicit":[101,152],"state-transition":[102],"simulator,":[103],"illustrating":[104],"structured":[106],"dynamics":[109],"can,":[110],"some":[112],"cases,":[113],"be":[114],"operationally":[115],"extracted":[116,141],"textual":[118,132],"rule":[119],"descriptions.":[120],"This":[121],"enables":[122],"controlled":[124],"comparison":[125],"LLMs":[128],"operating":[129,150],"purely":[130],"reinforcement-learning":[135],"agents":[136,149],"trained":[137],"directly":[138],"within":[139],"space.":[144],"Within":[145,210],"with":[151,186],"access":[153],"to":[154,224],"space":[158],"exhibit":[159],"substantially":[160],"more":[161],"stable":[162],"behavior":[163],"gameplay,":[166],"achieving":[167],"aggregate":[169],"win":[170],"rate":[171],"approximately":[173],"79%":[174],"versus":[175],"11%":[176],"for":[177,232],"LLMs.":[178],"Qualitative":[179],"analysis":[180],"further":[181],"reveals":[182],"failure":[183],"modes":[184],"consistent":[185],"unstable":[187],"including":[191],"invalid":[192],"actions,":[193],"state-tracking":[194],"errors,":[195],"short-horizon":[197],"failures.":[199],"The":[200],"complete":[201],"implementation":[202],"Flux":[205],"available":[207],"at":[208],"https://github.com/FeisalAlaswad/FLUX-RL-Agent":[209],"evaluated":[212],"setting,":[213],"results":[215],"suggest":[216],"alone":[221],"struggle":[223],"support":[225],"robust":[226],"dynamic":[228],"without":[230],"mechanisms":[231],"tracking":[235],"modeling":[238]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2026-05-27T00:00:00"}
