{"id":"https://openalex.org/W7160827086","doi":"https://doi.org/10.48550/arxiv.2605.07313","title":"When Stored Evidence Stops Being Usable: Scale-Conditioned Evaluation of Agent Memory","display_name":"When Stored Evidence Stops Being Usable: Scale-Conditioned Evaluation of Agent Memory","publication_year":2026,"publication_date":"2026-05-08","ids":{"openalex":"https://openalex.org/W7160827086","doi":"https://doi.org/10.48550/arxiv.2605.07313"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2605.07313","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.07313","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2605.07313","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5135907250","display_name":"Jiaqi Shao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shao, Jiaqi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042611833","display_name":"Yiyi Lu","orcid":"https://orcid.org/0009-0001-0606-1395"},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Lu, Yiyi","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5135889781","display_name":"Yunzhen Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Yunzhen","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5135858254","display_name":"Bing Luo","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Bing","raw_affiliation_strings":[],"raw_orcid":null,"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":0,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.12960000336170197,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T12808","display_name":"Ferroelectric and Negative Capacitance Devices","score":0.12960000336170197,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12607","display_name":"Personal Information Management and User Behavior","score":0.1088000014424324,"subfield":{"id":"https://openalex.org/subfields/1802","display_name":"Information Systems and Management"},"field":{"id":"https://openalex.org/fields/18","display_name":"Decision Sciences"},"domain":{"id":"https://openalex.org/domains/2","display_name":"Social Sciences"}},{"id":"https://openalex.org/T12127","display_name":"Software System Performance and Reliability","score":0.06689999997615814,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/reliability","display_name":"Reliability (semiconductor)","score":0.7512999773025513},{"id":"https://openalex.org/keywords/protocol","display_name":"Protocol (science)","score":0.7437999844551086},{"id":"https://openalex.org/keywords/task","display_name":"Task (project management)","score":0.6031000018119812},{"id":"https://openalex.org/keywords/usable","display_name":"USable","score":0.4999000132083893},{"id":"https://openalex.org/keywords/scale","display_name":"Scale (ratio)","score":0.4348999857902527}],"concepts":[{"id":"https://openalex.org/C43214815","wikidata":"https://www.wikidata.org/wiki/Q7310987","display_name":"Reliability (semiconductor)","level":3,"score":0.7512999773025513},{"id":"https://openalex.org/C2780385302","wikidata":"https://www.wikidata.org/wiki/Q367158","display_name":"Protocol (science)","level":3,"score":0.7437999844551086},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6643999814987183},{"id":"https://openalex.org/C2780451532","wikidata":"https://www.wikidata.org/wiki/Q759676","display_name":"Task (project management)","level":2,"score":0.6031000018119812},{"id":"https://openalex.org/C2780615836","wikidata":"https://www.wikidata.org/wiki/Q2471869","display_name":"USable","level":2,"score":0.4999000132083893},{"id":"https://openalex.org/C2778755073","wikidata":"https://www.wikidata.org/wiki/Q10858537","display_name":"Scale (ratio)","level":2,"score":0.4348999857902527},{"id":"https://openalex.org/C133112747","wikidata":"https://www.wikidata.org/wiki/Q7251931","display_name":"Protocol analysis","level":2,"score":0.3806999921798706},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3644999861717224},{"id":"https://openalex.org/C15744967","wikidata":"https://www.wikidata.org/wiki/Q9418","display_name":"Psychology","level":0,"score":0.30300000309944153},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.2989000082015991},{"id":"https://openalex.org/C200601418","wikidata":"https://www.wikidata.org/wiki/Q2193887","display_name":"Reliability engineering","level":1,"score":0.2874999940395355},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2840000092983246},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.27230000495910645},{"id":"https://openalex.org/C133462117","wikidata":"https://www.wikidata.org/wiki/Q4929239","display_name":"Data collection","level":2,"score":0.2630999982357025}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2605.07313","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.07313","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"Preprint"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2605.07313","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2605.07313","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":null,"license_id":null,"version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Preprint"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Memory-agent":[0],"evaluations":[1],"report":[2],"fixed-snapshot":[3],"accuracy":[4],"or":[5],"retrieval":[6],"quality,":[7],"but":[8,112],"these":[9],"scores":[10],"do":[11],"not":[12,22,100],"show":[13],"whether":[14],"evidence":[15,26,47],"remains":[16],"usable":[17],"as":[18,24,120],"irrelevant":[19,52,121],"sessions":[20,53,122],"(sessions":[21],"annotated":[23],"task-relevant":[25],"for":[27,37,43,153],"the":[28,73,80,94,109,131,136,145],"query)":[29],"accumulate.":[30],"We":[31],"present":[32],"a":[33,101,151],"scale-conditioned":[34],"evaluation":[35],"protocol":[36,57,95],"agent":[38],"memory":[39,92],"under":[40],"evidence-preserving":[41],"growth:":[42],"each":[44],"query,":[45],"task":[46],"is":[48,99],"held":[49],"fixed":[50],"while":[51,138],"are":[54,123],"added.":[55],"The":[56,148],"logs":[58],"agent--memory":[59],"trajectories":[60],"and":[61,72,85,90,140,163],"reports":[62],"four":[63],"diagnostics:":[64],"budget-compliant":[65,118],"reliability,":[66],"tail":[67],"memory-call":[68],"burden,":[69],"failure-regime":[70],"decomposition,":[71],"usable-scale":[74],"boundary":[75],"where":[76],"reliability":[77,97,119],"falls":[78],"below":[79],"target.":[81],"Applied":[82],"to":[83],"LongMemEval":[84],"LoCoMo":[86],"across":[87],"flat,":[88],"planar,":[89],"hierarchical":[91],"interfaces,":[93],"shows":[96],"loss":[98],"single":[102],"phenomenon.":[103],"On":[104],"LongMemEval,":[105],"HippoRAG":[106],"stays":[107],"within":[108],"two-call":[110],"budget":[111,137],"loses":[113],"16--20":[114],"percentage":[115],"points":[116],"in":[117,144],"added;":[124],"LiCoMemory's":[125],"observed":[126],"failures":[127],"depend":[128],"strongly":[129],"on":[130,158],"agent,":[132,159],"with":[133],"Qwen3-8B":[134],"exceeding":[135],"Qwen3-32B":[139],"Qwen3-235B":[141],"remain":[142],"reliable":[143],"tested":[146],"range.":[147],"result":[149],"supports":[150],"framework":[152],"making":[154],"scalable-memory":[155],"claims":[156],"conditional":[157],"interface,":[160],"scale":[161],"range,":[162],"interaction":[164],"budget.":[165]},"counts_by_year":[],"updated_date":"2026-07-01T08:55:40.977307","created_date":"2026-05-12T00:00:00"}
