{"id":"https://openalex.org/W7161958096","doi":"https://doi.org/10.48550/arxiv.2605.20833","title":"MemGym: a Long-Horizon Memory Environment for LLM Agents","display_name":"MemGym: a Long-Horizon Memory Environment for LLM Agents","publication_year":2026,"publication_date":"2026-05-20","ids":{"openalex":"https://openalex.org/W7161958096","doi":"https://doi.org/10.48550/arxiv.2605.20833"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.20833","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20833","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.20833","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5136629615","display_name":"Wujiang Xu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Xu, Wujiang","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136675986","display_name":"Wang, Yu, 1964-","orcid":"https://orcid.org/0000-0002-0683-9857"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Yu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136712794","display_name":"Kai Mei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Mei, Kai","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136636333","display_name":"Kaiqu Liang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liang, Kaiqu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136650897","display_name":"Zhenting Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Zhenting","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136708844","display_name":"Mingyu Jin","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Jin, Mingyu","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136711336","display_name":"Zhang, Han, 1960-","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Han","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136662345","display_name":"Shi-Xiong Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Shi-Xiong","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136695459","display_name":"Wenyue Hua","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Hua, Wenyue","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5136692139","display_name":"Sambit Sahu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Sahu, Sambit","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5136682451","display_name":"Dimitris N. Metaxas","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Metaxas, Dimitris N.","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":11,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.19189999997615814,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10456","display_name":"Multi-Agent Systems and Negotiation","score":0.19189999997615814,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.14399999380111694,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.10830000042915344,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/coding","display_name":"Coding (social sciences)","score":0.5692999958992004},{"id":"https://openalex.org/keywords/memory-model","display_name":"Memory model","score":0.4921000003814697},{"id":"https://openalex.org/keywords/memory-map","display_name":"Memory map","score":0.3700000047683716},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.3691999912261963},{"id":"https://openalex.org/keywords/extended-memory","display_name":"Extended memory","score":0.33959999680519104},{"id":"https://openalex.org/keywords/benchmark","display_name":"Benchmark (surveying)","score":0.33649998903274536},{"id":"https://openalex.org/keywords/flat-memory-model","display_name":"Flat memory model","score":0.30959999561309814}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7329000234603882},{"id":"https://openalex.org/C179518139","wikidata":"https://www.wikidata.org/wiki/Q5140297","display_name":"Coding (social sciences)","level":2,"score":0.5692999958992004},{"id":"https://openalex.org/C12186640","wikidata":"https://www.wikidata.org/wiki/Q6815743","display_name":"Memory model","level":3,"score":0.4921000003814697},{"id":"https://openalex.org/C74426580","wikidata":"https://www.wikidata.org/wiki/Q719484","display_name":"Memory map","level":3,"score":0.3700000047683716},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.3691999912261963},{"id":"https://openalex.org/C171675096","wikidata":"https://www.wikidata.org/wiki/Q1143380","display_name":"Extended memory","level":4,"score":0.33959999680519104},{"id":"https://openalex.org/C185798385","wikidata":"https://www.wikidata.org/wiki/Q1161707","display_name":"Benchmark (surveying)","level":2,"score":0.33649998903274536},{"id":"https://openalex.org/C57863822","wikidata":"https://www.wikidata.org/wiki/Q905488","display_name":"Flat memory model","level":4,"score":0.30959999561309814},{"id":"https://openalex.org/C48455012","wikidata":"https://www.wikidata.org/wiki/Q2892593","display_name":"Memory consolidation","level":3,"score":0.26980000734329224},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.26579999923706055},{"id":"https://openalex.org/C63511323","wikidata":"https://www.wikidata.org/wiki/Q908936","display_name":"Interleaved memory","level":4,"score":0.2644999921321869},{"id":"https://openalex.org/C92855701","wikidata":"https://www.wikidata.org/wiki/Q5830907","display_name":"Computer memory","level":3,"score":0.26429998874664307},{"id":"https://openalex.org/C78548338","wikidata":"https://www.wikidata.org/wiki/Q2493","display_name":"Data compression","level":2,"score":0.26089999079704285},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.2574000060558319},{"id":"https://openalex.org/C153247305","wikidata":"https://www.wikidata.org/wiki/Q835713","display_name":"Memory address","level":3,"score":0.2563000023365021},{"id":"https://openalex.org/C39528615","wikidata":"https://www.wikidata.org/wiki/Q1229610","display_name":"Distributed shared memory","level":5,"score":0.25600001215934753}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.20833","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20833","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.20833","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.20833","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Memory":[0],"is":[1],"a":[2,57,153,166],"central":[3],"capability":[4],"for":[5,59,126],"LLM":[6],"agents":[7],"operating":[8],"across":[9],"long-horizon":[10],"tasks.":[11],"Existing":[12],"memory":[13,28,38,61,106,115],"benchmarks":[14],"predominantly":[15],"evaluate":[16],"retention":[17],"of":[18,172],"personalized":[19],"information":[20],"in":[21,170],"multi-turn":[22,88],"chat":[23],"scenarios,":[24],"overlooking":[25],"the":[26,37],"dynamic":[27],"formation":[29],"that":[30,62,104,161],"occurs":[31],"during":[32],"extended":[33],"agent":[34,65],"execution.":[35],"Consequently,":[36],"systems":[39],"they":[40],"produce":[41],"transfer":[42],"poorly":[43],"to":[44],"realistic":[45],"agentic":[46,60,83],"environments,":[47],"such":[48],"as":[49,165],"coding":[50,92,146],"and":[51,67,94,96,111,128,136],"web":[52],"navigation.":[53],"We":[54],"present":[55],"MemGym,":[56],"benchmark":[58],"unifies":[63],"existing":[64],"gyms":[66],"in-house":[68],"memory-grounded":[69],"pipelines":[70,125],"behind":[71],"one":[72],"memory-reasoning":[73],"interface.":[74],"MemGym":[75,100],"spans":[76],"five":[77],"evaluation":[78,144],"tracks":[79],"grouped":[80],"into":[81],"four":[82],"regimes:":[84],"tool-use":[85,112],"dialogue":[86],"(tau2-bench),":[87],"deep-research":[89],"search":[90],"(MEMGYM-DR),":[91],"(SWE-Gym":[93],"MEMGYM-CODEQA),":[95],"computer":[97],"use":[98],"(WebArena-Infinity).":[99],"reports":[101],"memory-isolated":[102],"scores":[103,162],"decouple":[105],"performance":[107],"from":[108],"reasoning,":[109],"retrieval,":[110],"ability,":[113],"so":[114],"strategies":[116],"can":[117],"be":[118],"ranked":[119],"without":[120],"those":[121],"confounders.":[122],"Our":[123],"synthetic":[124],"MEMGYM-CODEQA":[127],"MEMGYM-DR":[129],"are":[130],"length-controllable,":[131],"ablation-verified":[132],"at":[133],"every":[134],"stage,":[135],"tightly":[137],"aligned":[138],"with":[139,159],"downstream":[140],"scenarios.":[141],"To":[142],"make":[143],"on":[145],"environments":[147],"academically":[148],"tractable,":[149],"we":[150],"train":[151],"MemRM,":[152],"lightweight":[154],"reward":[155],"model":[156],"(Qwen3-1.7B":[157],"fine-tuned":[158],"QLoRA)":[160],"compression":[163],"quality":[164],"fast":[167],"scalar":[168],"read":[169],"place":[171],"full":[173],"Docker":[174],"rollouts.":[175]},"counts_by_year":[],"updated_date":"2026-06-11T09:08:48.828518","created_date":"2026-05-22T00:00:00"}
