{"id":"https://openalex.org/W7129445708","doi":"https://doi.org/10.48550/arxiv.2602.13933","title":"HyMem: Hybrid Memory Architecture with Dynamic Retrieval Scheduling","display_name":"HyMem: Hybrid Memory Architecture with Dynamic Retrieval Scheduling","publication_year":2026,"publication_date":"2026-02-15","ids":{"openalex":"https://openalex.org/W7129445708","doi":"https://doi.org/10.48550/arxiv.2602.13933"},"language":null,"primary_location":{"id":"pmh:doi:10.48550/arxiv.2602.13933","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":null,"any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5070505636","display_name":"Xiaochen Zhao","orcid":"https://orcid.org/0000-0001-8976-7723"},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Zhao, Xiaochen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126265850","display_name":"Kaikai Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Kaikai","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126218622","display_name":"Xiaowen Zhang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhang, Xiaowen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":"https://openalex.org/A5126232867","display_name":"Chen Yao","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yao, Chen","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":"https://openalex.org/A5126199578","display_name":"Aili Wang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wang, Aili","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5070505636"],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4375999867916107,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.4375999867916107,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.09669999778270721,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11714","display_name":"Multimodal Machine Learning Applications","score":0.09019999951124191,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/scheduling","display_name":"Scheduling (production processes)","score":0.5095999836921692},{"id":"https://openalex.org/keywords/flat-memory-model","display_name":"Flat memory model","score":0.4487999975681305},{"id":"https://openalex.org/keywords/overhead","display_name":"Overhead (engineering)","score":0.4221000075340271},{"id":"https://openalex.org/keywords/interleaved-memory","display_name":"Interleaved memory","score":0.41690000891685486},{"id":"https://openalex.org/keywords/memory-architecture","display_name":"Memory architecture","score":0.40849998593330383},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.3880000114440918},{"id":"https://openalex.org/keywords/computing-with-memory","display_name":"Computing with Memory","score":0.35409998893737793},{"id":"https://openalex.org/keywords/architecture","display_name":"Architecture","score":0.35280001163482666},{"id":"https://openalex.org/keywords/dynamic-random-access-memory","display_name":"Dynamic random-access memory","score":0.3521000146865845}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8294000029563904},{"id":"https://openalex.org/C120314980","wikidata":"https://www.wikidata.org/wiki/Q180634","display_name":"Distributed computing","level":1,"score":0.5253000259399414},{"id":"https://openalex.org/C206729178","wikidata":"https://www.wikidata.org/wiki/Q2271896","display_name":"Scheduling (production processes)","level":2,"score":0.5095999836921692},{"id":"https://openalex.org/C57863822","wikidata":"https://www.wikidata.org/wiki/Q905488","display_name":"Flat memory model","level":4,"score":0.4487999975681305},{"id":"https://openalex.org/C2779960059","wikidata":"https://www.wikidata.org/wiki/Q7113681","display_name":"Overhead (engineering)","level":2,"score":0.4221000075340271},{"id":"https://openalex.org/C63511323","wikidata":"https://www.wikidata.org/wiki/Q908936","display_name":"Interleaved memory","level":4,"score":0.41690000891685486},{"id":"https://openalex.org/C2779602883","wikidata":"https://www.wikidata.org/wiki/Q15544750","display_name":"Memory architecture","level":2,"score":0.40849998593330383},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.3880000114440918},{"id":"https://openalex.org/C152890283","wikidata":"https://www.wikidata.org/wiki/Q4129922","display_name":"Computing with Memory","level":5,"score":0.35409998893737793},{"id":"https://openalex.org/C123657996","wikidata":"https://www.wikidata.org/wiki/Q12271","display_name":"Architecture","level":2,"score":0.35280001163482666},{"id":"https://openalex.org/C118702147","wikidata":"https://www.wikidata.org/wiki/Q189396","display_name":"Dynamic random-access memory","level":3,"score":0.3521000146865845},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.3407000005245209},{"id":"https://openalex.org/C107568181","wikidata":"https://www.wikidata.org/wiki/Q5319000","display_name":"Dynamic priority scheduling","level":3,"score":0.33820000290870667},{"id":"https://openalex.org/C51290061","wikidata":"https://www.wikidata.org/wiki/Q1936765","display_name":"Uniform memory access","level":4,"score":0.3271999955177307},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.32120001316070557},{"id":"https://openalex.org/C82687282","wikidata":"https://www.wikidata.org/wiki/Q66221","display_name":"Auxiliary memory","level":2,"score":0.3181999921798706},{"id":"https://openalex.org/C76679254","wikidata":"https://www.wikidata.org/wiki/Q5165163","display_name":"Context-dependent memory","level":4,"score":0.3075999915599823},{"id":"https://openalex.org/C74426580","wikidata":"https://www.wikidata.org/wiki/Q719484","display_name":"Memory map","level":3,"score":0.3043999969959259},{"id":"https://openalex.org/C171675096","wikidata":"https://www.wikidata.org/wiki/Q1143380","display_name":"Extended memory","level":4,"score":0.3041999936103821},{"id":"https://openalex.org/C12186640","wikidata":"https://www.wikidata.org/wiki/Q6815743","display_name":"Memory model","level":3,"score":0.303600013256073},{"id":"https://openalex.org/C2779343474","wikidata":"https://www.wikidata.org/wiki/Q3109175","display_name":"Context (archaeology)","level":2,"score":0.2777000069618225},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.27410000562667847},{"id":"https://openalex.org/C20854674","wikidata":"https://www.wikidata.org/wiki/Q4386060","display_name":"Cognitive architecture","level":3,"score":0.271699994802475},{"id":"https://openalex.org/C30390489","wikidata":"https://www.wikidata.org/wiki/Q4680748","display_name":"Adaptive memory","level":3,"score":0.26989999413490295},{"id":"https://openalex.org/C91481028","wikidata":"https://www.wikidata.org/wiki/Q1054686","display_name":"Distributed memory","level":3,"score":0.26899999380111694},{"id":"https://openalex.org/C113775141","wikidata":"https://www.wikidata.org/wiki/Q428691","display_name":"Computer engineering","level":1,"score":0.2644999921321869},{"id":"https://openalex.org/C119948110","wikidata":"https://www.wikidata.org/wiki/Q7858726","display_name":"Two-level scheduling","level":4,"score":0.2605000138282776},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2540000081062317},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.2529999911785126}],"mesh":[],"locations_count":2,"locations":[{"id":"pmh:doi:10.48550/arxiv.2602.13933","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},{"id":"doi:10.48550/arxiv.2602.13933","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2602.13933","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"pmh:doi:10.48550/arxiv.2602.13933","is_oa":true,"landing_page_url":null,"pdf_url":null,"source":{"id":"https://openalex.org/S4406922384","display_name":"Open MIND","issn_l":null,"issn":null,"is_oa":false,"is_in_doaj":false,"is_core":false,"host_organization":null,"host_organization_name":null,"host_organization_lineage":[],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":"submittedVersion","is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"Article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Large":[0],"language":[1],"model":[2],"(LLM)":[3],"agents":[4],"demonstrate":[5],"strong":[6,161],"performance":[7,162,185],"in":[8,14,56,79,186],"short-text":[9],"contexts":[10],"but":[11],"often":[12],"underperform":[13],"extended":[15],"dialogues":[16],"due":[17],"to":[18,69,83,85],"inefficient":[19],"memory":[20,32,61,75,101,110,188],"management.":[21,189],"Existing":[22],"approaches":[23],"face":[24],"a":[25,99,114,120,125,149,179],"fundamental":[26],"trade-off":[27],"between":[28,182],"efficiency":[29,183],"and":[30,63,73,167,184],"effectiveness:":[31],"compression":[33],"risks":[34],"losing":[35],"critical":[36],"details":[37],"required":[38],"for":[39,50,131,144,152],"complex":[40,145],"reasoning,":[41],"while":[42,135,172],"retaining":[43],"raw":[44],"text":[45],"introduces":[46],"unnecessary":[47],"computational":[48,174],"overhead":[49],"simple":[51],"queries.":[52],"The":[53],"crux":[54],"lies":[55],"the":[57,71,91,165],"limitations":[58],"of":[59,93],"monolithic":[60],"representations":[62],"static":[64],"retrieval":[65,123],"mechanisms,":[66],"which":[67],"fail":[68],"emulate":[70],"flexible":[72],"proactive":[74],"scheduling":[76,107],"capabilities":[77],"observed":[78],"humans,":[80],"thus":[81],"struggling":[82],"adapt":[84],"diverse":[86],"problem":[87],"scenarios.":[88],"Inspired":[89],"by":[90,148,176],"principle":[92],"cognitive":[94],"economy,":[95],"we":[96],"propose":[97],"HyMem,":[98],"hybrid":[100],"architecture":[102],"that":[103,158],"enables":[104],"dynamic":[105,121],"on-demand":[106],"through":[108],"multi-granular":[109],"representations.":[111],"HyMem":[112,159],"adopts":[113],"dual-granular":[115],"storage":[116],"scheme":[117],"paired":[118],"with":[119],"two-tier":[122],"system:":[124],"lightweight":[126],"module":[127,139],"constructs":[128],"summary-level":[129],"context":[130],"efficient":[132],"response":[133],"generation,":[134],"an":[136],"LLM-based":[137],"deep":[138],"is":[140],"selectively":[141],"activated":[142],"only":[143],"queries,":[146],"augmented":[147],"reflection":[150],"mechanism":[151],"iterative":[153],"reasoning":[154],"refinement.":[155],"Experiments":[156],"show":[157],"achieves":[160],"on":[163],"both":[164],"LOCOMO":[166],"LongMemEval":[168],"benchmarks,":[169],"outperforming":[170],"full-context":[171],"reducing":[173],"cost":[175],"92.6\\%,":[177],"establishing":[178],"state-of-the-art":[180],"balance":[181],"long-term":[187]},"counts_by_year":[],"updated_date":"2026-04-04T16:13:02.066488","created_date":"2026-02-18T00:00:00"}
