{"id":"https://openalex.org/W7133702628","doi":"https://doi.org/10.48550/arxiv.2603.04257","title":"Memex(RL): Scaling Long-Horizon LLM Agents via Indexed Experience Memory","display_name":"Memex(RL): Scaling Long-Horizon LLM Agents via Indexed Experience Memory","publication_year":2026,"publication_date":"2026-03-04","ids":{"openalex":"https://openalex.org/W7133702628","doi":"https://doi.org/10.48550/arxiv.2603.04257"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2603.04257","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5128151801","display_name":"Zhenting Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Wang, Zhenting","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128157459","display_name":"Huancheng Chen","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Chen, Huancheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128137487","display_name":"Jiayun Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Jiayun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5128137185","display_name":"Wei Wei","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wei, Wei","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":4,"corresponding_author_ids":["https://openalex.org/A5128151801"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.2694000005722046,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.2694000005722046,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.1542000025510788,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11636","display_name":"Artificial Intelligence in Healthcare and Education","score":0.10119999945163727,"subfield":{"id":"https://openalex.org/subfields/2718","display_name":"Health Informatics"},"field":{"id":"https://openalex.org/fields/27","display_name":"Medicine"},"domain":{"id":"https://openalex.org/domains/4","display_name":"Health Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/context","display_name":"Context (archaeology)","score":0.6765999794006348},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6403999924659729},{"id":"https://openalex.org/keywords/reinforcement-learning","display_name":"Reinforcement learning","score":0.6243000030517578},{"id":"https://openalex.org/keywords/bounded-function","display_name":"Bounded function","score":0.474700003862381},{"id":"https://openalex.org/keywords/computation","display_name":"Computation","score":0.45809999108314514},{"id":"https://openalex.org/keywords/lossy-compression","display_name":"Lossy compression","score":0.4408000111579895},{"id":"https://openalex.org/keywords/index","display_name":"Index (typography)","score":0.361299991607666}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8033999800682068},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.6765999794006348},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6403999924659729},{"id":"https://openalex.org/C97541855","wikidata":"https://www.wikidata.org/wiki/Q830687","display_name":"Reinforcement learning","level":2,"score":0.6243000030517578},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.5231000185012817},{"id":"https://openalex.org/C34388435","wikidata":"https://www.wikidata.org/wiki/Q2267362","display_name":"Bounded function","level":2,"score":0.474700003862381},{"id":"https://openalex.org/C45374587","wikidata":"https://www.wikidata.org/wiki/Q12525525","display_name":"Computation","level":2,"score":0.45809999108314514},{"id":"https://openalex.org/C165021410","wikidata":"https://www.wikidata.org/wiki/Q55564","display_name":"Lossy compression","level":2,"score":0.4408000111579895},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.4153999984264374},{"id":"https://openalex.org/C2777382242","wikidata":"https://www.wikidata.org/wiki/Q6017816","display_name":"Index (typography)","level":2,"score":0.361299991607666},{"id":"https://openalex.org/C183322885","wikidata":"https://www.wikidata.org/wiki/Q17007702","display_name":"Context model","level":3,"score":0.35929998755455017},{"id":"https://openalex.org/C53833338","wikidata":"https://www.wikidata.org/wiki/Q1061424","display_name":"Context switch","level":2,"score":0.3301999866962433},{"id":"https://openalex.org/C99844830","wikidata":"https://www.wikidata.org/wiki/Q102441924","display_name":"Scaling","level":2,"score":0.328000009059906},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3253999948501587},{"id":"https://openalex.org/C82687282","wikidata":"https://www.wikidata.org/wiki/Q66221","display_name":"Auxiliary memory","level":2,"score":0.32010000944137573},{"id":"https://openalex.org/C175154964","wikidata":"https://www.wikidata.org/wiki/Q380077","display_name":"Task analysis","level":3,"score":0.305400013923645},{"id":"https://openalex.org/C107457646","wikidata":"https://www.wikidata.org/wiki/Q207434","display_name":"Human\u2013computer interaction","level":1,"score":0.28110000491142273},{"id":"https://openalex.org/C97399411","wikidata":"https://www.wikidata.org/wiki/Q825367","display_name":"Coin flipping","level":2,"score":0.2703000009059906},{"id":"https://openalex.org/C106195933","wikidata":"https://www.wikidata.org/wiki/Q7847935","display_name":"Truncation (statistics)","level":2,"score":0.2703000009059906},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.26330000162124634}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2603.04257","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2603.04257","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.04257","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2603.04257","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"publisher-specific-oa","license_id":"https://openalex.org/licenses/publisher-specific-oa","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[{"id":"https://metadata.un.org/sdg/16","score":0.5777451992034912,"display_name":"Peace, Justice and strong institutions"}],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"model":[2],"(LLM)":[3],"agents":[4],"are":[5,65],"fundamentally":[6,66],"bottlenecked":[7],"by":[8],"finite":[9],"context":[10,30,37,56,87,96,162],"windows":[11],"on":[12,226],"long-horizon":[13,191,228],"tasks.":[14],"As":[15],"trajectories":[16],"grow,":[17],"retaining":[18],"tool":[19],"outputs":[20],"and":[21,39,102,128,143,178],"intermediate":[22],"reasoning":[23],"in-context":[24,219],"quickly":[25],"becomes":[26,31],"infeasible:":[27],"the":[28,36,130,136,165,203,206],"working":[29,95,243],"prohibitively":[32],"long,":[33],"eventually":[34],"exceeds":[35],"budget,":[38,163],"makes":[40],"distant":[41],"evidence":[42,74,133],"harder":[43],"to":[44,124,156,169,172,175,180,209],"use":[45],"even":[46],"when":[47,123,179],"it":[48],"is":[49],"still":[50],"present.":[51],"Existing":[52],"solutions":[53],"typically":[54],"shorten":[55],"through":[57],"truncation":[58],"or":[59,71],"running":[60],"summaries,":[61],"but":[62],"these":[63],"methods":[64],"lossy":[67,188],"because":[68],"they":[69],"compress":[70],"discard":[72],"past":[73,132],"itself.":[75],"We":[76,139,196],"introduce":[77],"Memex,":[78],"an":[79,111,126],"indexed":[80,157],"experience":[81,113],"memory":[82,158,192],"mechanism":[83],"that":[84],"instead":[85],"compresses":[86],"without":[88],"discarding":[89],"evidence.":[90],"Memex":[91,207,230],"maintains":[92],"a":[93,161,185,199,240],"compact":[94],"consisting":[97],"of":[98,190,205],"concise":[99],"structured":[100],"summaries":[101],"stable":[103],"indices,":[104],"while":[105,216,238],"storing":[106],"full-fidelity":[107],"underlying":[108],"interactions":[109],"in":[110],"external":[112],"database":[114],"under":[115,160],"those":[116],"indices.":[117],"The":[118],"agent":[119,166,231],"can":[120],"then":[121],"decide":[122],"dereference":[125],"index":[127,176],"recover":[129],"exact":[131],"needed":[134],"for":[135],"current":[137],"subgoal.":[138],"optimize":[140],"both":[141],"write":[142],"read":[144],"behaviors":[145],"with":[146,213,233],"our":[147],"reinforcement":[148],"learning":[149],"framework":[150],"MemexRL,":[151],"using":[152,239],"reward":[153],"shaping":[154],"tailored":[155],"usage":[159],"so":[164],"learns":[167],"what":[168,171],"summarize,":[170],"archive,":[173],"how":[174],"it,":[177],"retrieve":[181],"it.":[182],"This":[183],"yields":[184],"substantially":[186],"less":[187],"form":[189],"than":[193],"summary-only":[194],"approaches.":[195],"further":[197],"provide":[198],"theoretical":[200],"analysis":[201],"showing":[202],"potential":[204],"loop":[208],"preserve":[210],"decision":[211],"quality":[212],"bounded":[214,221],"dereferencing":[215],"keeping":[217],"effective":[218],"computation":[220],"as":[222],"history":[223],"grows.":[224],"Empirically,":[225],"challenging":[227],"tasks,":[229],"trained":[232],"MemexRL":[234],"improves":[235],"task":[236],"success":[237],"significantly":[241],"smaller":[242],"context.":[244]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-03-06T00:00:00"}
