{"id":"https://openalex.org/W7162780049","doi":"https://doi.org/10.48550/arxiv.2605.29341","title":"WorldMemArena: Evaluating Multimodal Agent Memory Through Action-World Interaction","display_name":"WorldMemArena: Evaluating Multimodal Agent Memory Through Action-World Interaction","publication_year":2026,"publication_date":"2026-05-28","ids":{"openalex":"https://openalex.org/W7162780049","doi":"https://doi.org/10.48550/arxiv.2605.29341"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.29341","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.29341","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.29341","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5137319669","display_name":"Chengzhi Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Chengzhi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137323714","display_name":"Yuzhe Yang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yang, Yuzhe","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5120308982","display_name":"Sophia Xiao Pu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Pu, Sophia Xiao","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5057313834","display_name":"Yepeng Liu","orcid":"https://orcid.org/0000-0001-6340-7818"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Yepeng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5067197600","display_name":"Lin Long","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Long, Lin","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137353784","display_name":"Yichen Guo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Guo, Yichen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137321651","display_name":"Nuo Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Nuo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137316052","display_name":"Zhaotian Weng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Weng, Zhaotian","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5075871561","display_name":"Elena Kochkina","orcid":"https://orcid.org/0000-0003-0691-3647"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kochkina, Elena","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5031351140","display_name":"Simerjot Kaur","orcid":"https://orcid.org/0000-0002-5863-4749"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kaur, Simerjot","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135237715","display_name":"Charese Smiley","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Smiley, Charese","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137392450","display_name":"Xiaomo Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Xiaomo","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137361835","display_name":"James Zou","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zou, James","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137370378","display_name":"Sheng Liu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Sheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137398277","display_name":"Yuheng Bu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Bu, Yuheng","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5137360376","display_name":"Songyou Peng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Peng, Songyou","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5137345927","display_name":"Xin Eric Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Xin Eric","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":17,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6215999722480774,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.6215999722480774,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10709","display_name":"Social Robot Interaction and HRI","score":0.06480000168085098,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T11431","display_name":"Action Observation and Synchronization","score":0.02759999968111515,"subfield":{"id":"https://openalex.org/subfields/3207","display_name":"Social Psychology"},"field":{"id":"https://openalex.org/fields/32","display_name":"Psychology"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/recall","display_name":"Recall","score":0.6345999836921692},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.5812000036239624},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.447299987077713},{"id":"https://openalex.org/keywords/overlay","display_name":"Overlay","score":0.41370001435279846},{"id":"https://openalex.org/keywords/memory-map","display_name":"Memory map","score":0.41100001335144043},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.40070000290870667},{"id":"https://openalex.org/keywords/episodic-memory","display_name":"Episodic memory","score":0.3935000002384186},{"id":"https://openalex.org/keywords/multimodal-interaction","display_name":"Multimodal interaction","score":0.3822999894618988},{"id":"https://openalex.org/keywords/auxiliary-memory","display_name":"Auxiliary memory","score":0.3725000023841858}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8033000230789185},{"id":"https://openalex.org/C100660578","wikidata":"https://www.wikidata.org/wiki/Q18733","display_name":"Recall","level":2,"score":0.6345999836921692},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.5812000036239624},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.5238999724388123},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.447299987077713},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.4311999976634979},{"id":"https://openalex.org/C136085584","wikidata":"https://www.wikidata.org/wiki/Q910289","display_name":"Overlay","level":2,"score":0.41370001435279846},{"id":"https://openalex.org/C74426580","wikidata":"https://www.wikidata.org/wiki/Q719484","display_name":"Memory map","level":3,"score":0.41100001335144043},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.40070000290870667},{"id":"https://openalex.org/C88576662","wikidata":"https://www.wikidata.org/wiki/Q18646","display_name":"Episodic memory","level":3,"score":0.3935000002384186},{"id":"https://openalex.org/C135641252","wikidata":"https://www.wikidata.org/wiki/Q738567","display_name":"Multimodal interaction","level":2,"score":0.3822999894618988},{"id":"https://openalex.org/C82687282","wikidata":"https://www.wikidata.org/wiki/Q66221","display_name":"Auxiliary memory","level":2,"score":0.3725000023841858},{"id":"https://openalex.org/C178278151","wikidata":"https://www.wikidata.org/wiki/Q7936607","display_name":"Visual memory","level":3,"score":0.35839998722076416},{"id":"https://openalex.org/C63511323","wikidata":"https://www.wikidata.org/wiki/Q908936","display_name":"Interleaved memory","level":4,"score":0.3573000133037567},{"id":"https://openalex.org/C58632812","wikidata":"https://www.wikidata.org/wiki/Q7936625","display_name":"Visual short-term memory","level":4,"score":0.35679998993873596},{"id":"https://openalex.org/C197914299","wikidata":"https://www.wikidata.org/wiki/Q18650","display_name":"Semantic memory","level":3,"score":0.3562000095844269},{"id":"https://openalex.org/C12186640","wikidata":"https://www.wikidata.org/wiki/Q6815743","display_name":"Memory model","level":3,"score":0.34860000014305115},{"id":"https://openalex.org/C2985957978","wikidata":"https://www.wikidata.org/wiki/Q492","display_name":"Human memory","level":3,"score":0.31529998779296875},{"id":"https://openalex.org/C39528615","wikidata":"https://www.wikidata.org/wiki/Q1229610","display_name":"Distributed shared memory","level":5,"score":0.30399999022483826},{"id":"https://openalex.org/C188147891","wikidata":"https://www.wikidata.org/wiki/Q147638","display_name":"Cognitive science","level":1,"score":0.2928999960422516},{"id":"https://openalex.org/C112049663","wikidata":"https://www.wikidata.org/wiki/Q18608","display_name":"Explicit memory","level":4,"score":0.2921000123023987},{"id":"https://openalex.org/C180747234","wikidata":"https://www.wikidata.org/wiki/Q23373","display_name":"Cognitive psychology","level":1,"score":0.2867000102996826},{"id":"https://openalex.org/C165696696","wikidata":"https://www.wikidata.org/wiki/Q11287","display_name":"Exploit","level":2,"score":0.2822999954223633},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.27630001306533813},{"id":"https://openalex.org/C15686315","wikidata":"https://www.wikidata.org/wiki/Q18614","display_name":"Implicit memory","level":3,"score":0.27570000290870667},{"id":"https://openalex.org/C76399640","wikidata":"https://www.wikidata.org/wiki/Q189401","display_name":"Virtual memory","level":4,"score":0.2615000009536743},{"id":"https://openalex.org/C192209626","wikidata":"https://www.wikidata.org/wiki/Q190909","display_name":"Focus (optics)","level":2,"score":0.2599000036716461},{"id":"https://openalex.org/C30390489","wikidata":"https://www.wikidata.org/wiki/Q4680748","display_name":"Adaptive memory","level":3,"score":0.2590000033378601},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.2578999996185303},{"id":"https://openalex.org/C2780009758","wikidata":"https://www.wikidata.org/wiki/Q6804172","display_name":"Measure (data warehouse)","level":2,"score":0.25130000710487366}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.29341","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.29341","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.29341","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.29341","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.5882006883621216,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Multimodal":[0],"large":[1],"language":[2],"models":[3],"are":[4,198],"increasingly":[5],"deployed":[6],"as":[7,103],"long-horizon":[8],"agents,":[9],"where":[10],"memory":[11,44,77,102,143,166,170,177,188,211],"must":[12,18],"do":[13,181],"more":[14,213],"than":[15],"recall:":[16],"it":[17,115],"track":[19],"an":[20,104,109],"evolving":[21],"world,":[22],"revise":[23],"what":[24],"has":[25],"gone":[26],"stale,":[27],"and":[28,50,113,127,130,138,147,164,168,179,202,208,218],"surface":[29],"the":[30,155],"right":[31],"evidence":[32,148],"at":[33],"decision":[34],"time.":[35],"Existing":[36],"benchmarks":[37],"measure":[38],"recall":[39],"over":[40],"static":[41],"dialogue,":[42],"collapse":[43],"into":[45],"a":[46],"single":[47],"end-of-task":[48],"accuracy,":[49],"reduce":[51],"visual":[52,194],"observations":[53],"to":[54,59,62,87,191],"captions,":[55],"leaving":[56],"us":[57],"unable":[58],"localize":[60],"failures":[61],"writing,":[63],"maintenance,":[64],"retrieval,":[65],"or":[66],"use.":[67],"The":[68],"rise":[69],"of":[70,159],"agent":[71,101],"harnesses":[72],"that":[73],"author":[74],"their":[75],"own":[76],"sharpens":[78],"this":[79],"gap,":[80],"since":[81],"we":[82,98],"have":[83],"no":[84],"principled":[85],"way":[86],"compare":[88],"hand-designed":[89],"pipelines":[90],"with":[91,108,141],"self-managing":[92],"alternatives.":[93],"To":[94],"close":[95],"these":[96],"gaps,":[97],"formulate":[99],"multimodal":[100,120,187],"Action-World":[105],"Interaction":[106],"Loop":[107],"observable":[110],"four-stage":[111],"lifecycle,":[112],"instantiate":[114],"in":[116],"WorldMemArena:":[117],"400":[118],"multi-session":[119],"tasks":[121],"spanning":[122],"Lifelong":[123],"Evolution":[124],"(evolving":[125],"personal":[126],"task":[128],"states)":[129],"Agentic":[131],"Execution":[132],"(memory":[133],"from":[134],"real":[135],"observations,":[136],"actions,":[137],"feedback),":[139],"annotated":[140],"gold":[142],"points,":[144],"updates,":[145],"distractors,":[146],"chains":[149],"for":[150],"stage-level":[151],"diagnosis.":[152],"This":[153],"enables":[154],"first":[156],"head-to-head":[157],"comparison":[158],"long-context,":[160],"manually":[161],"designed":[162],"(RAG":[163],"external":[165],"systems),":[167],"harness-based":[169],"agents.":[171],"Results":[172],"show":[173],"that:":[174],"(1)":[175],"better":[176,184],"writing":[178],"storage":[180],"not":[182],"guarantee":[183],"performance;":[185],"(2)":[186],"still":[189],"struggles":[190],"fully":[192],"use":[193],"evidence;":[195],"(3)":[196],"systems":[197],"unstable":[199],"across":[200],"domains":[201],"degrade":[203],"on":[204],"realistic":[205],"agentic":[206],"trajectories;":[207],"(4)":[209],"harness":[210],"is":[212],"flexible":[214],"but":[215],"remains":[216],"costly":[217],"less":[219],"reliable.":[220]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-30T00:00:00"}
