{"id":"https://openalex.org/W7135045430","doi":"https://doi.org/10.48550/arxiv.2603.10087","title":"Pooling Engram Conditional Memory in Large Language Models using CXL","display_name":"Pooling Engram Conditional Memory in Large Language Models using CXL","publication_year":2026,"publication_date":"2026-03-10","ids":{"openalex":"https://openalex.org/W7135045430","doi":"https://doi.org/10.48550/arxiv.2603.10087"},"language":null,"primary_location":{"id":"doi:10.48550/arxiv.2603.10087","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.10087","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"type":"preprint","indexed_in":["datacite"],"open_access":{"is_oa":true,"oa_status":"green","oa_url":"https://doi.org/10.48550/arxiv.2603.10087","any_repository_has_fulltext":true},"authorships":[{"author_position":"first","author":{"id":null,"display_name":"Ma, Ruiyang","orcid":null},"institutions":[],"countries":[],"is_corresponding":true,"raw_author_name":"Ma, Ruiyang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Ma, Teng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Ma, Teng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Su, Zhiyuan","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Su, Zhiyuan","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zha, Hantian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zha, Hantian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Zhao, Xinpeng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Zhao, Xinpeng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Shang, Xuchun","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Shang, Xuchun","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Yi, Xingrui","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Yi, Xingrui","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Liu, Zheng","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Zheng","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Cao, Zhu","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Cao, Zhu","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Wu, An","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Wu, An","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Dou, Zhichong","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Dou, Zhichong","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Liu, Ziqian","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Liu, Ziqian","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"middle","author":{"id":null,"display_name":"Kuang, Daikang","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Kuang, Daikang","raw_affiliation_strings":[],"affiliations":[]},{"author_position":"last","author":{"id":null,"display_name":"Luo, Guojie","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Luo, Guojie","raw_affiliation_strings":[],"affiliations":[]}],"institutions":[],"countries_distinct_count":0,"institutions_distinct_count":14,"corresponding_author_ids":[],"corresponding_institution_ids":[],"apc_list":null,"apc_paid":null,"fwci":null,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":null,"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":null,"last_page":null},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.31220000982284546,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.31220000982284546,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T12292","display_name":"Graph Theory and Algorithms","score":0.14409999549388885,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10101","display_name":"Cloud Computing and Resource Management","score":0.06239999830722809,"subfield":{"id":"https://openalex.org/subfields/1710","display_name":"Information Systems"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/engram","display_name":"Engram","score":0.8345000147819519},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6244999766349792},{"id":"https://openalex.org/keywords/pooling","display_name":"Pooling","score":0.623199999332428},{"id":"https://openalex.org/keywords/scalability","display_name":"Scalability","score":0.4090999960899353},{"id":"https://openalex.org/keywords/component","display_name":"Component (thermodynamics)","score":0.3684999942779541},{"id":"https://openalex.org/keywords/decoupling","display_name":"Decoupling (probability)","score":0.3443000018596649}],"concepts":[{"id":"https://openalex.org/C28093023","wikidata":"https://www.wikidata.org/wiki/Q175168","display_name":"Engram","level":2,"score":0.8345000147819519},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6244999766349792},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6241999864578247},{"id":"https://openalex.org/C70437156","wikidata":"https://www.wikidata.org/wiki/Q7228652","display_name":"Pooling","level":2,"score":0.623199999332428},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.48980000615119934},{"id":"https://openalex.org/C48044578","wikidata":"https://www.wikidata.org/wiki/Q727490","display_name":"Scalability","level":2,"score":0.4090999960899353},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.3684999942779541},{"id":"https://openalex.org/C119857082","wikidata":"https://www.wikidata.org/wiki/Q2539","display_name":"Machine learning","level":1,"score":0.3578000068664551},{"id":"https://openalex.org/C205606062","wikidata":"https://www.wikidata.org/wiki/Q5249645","display_name":"Decoupling (probability)","level":2,"score":0.3443000018596649},{"id":"https://openalex.org/C41608201","wikidata":"https://www.wikidata.org/wiki/Q980509","display_name":"Embedding","level":2,"score":0.3206999897956848},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3093000054359436},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.28029999136924744},{"id":"https://openalex.org/C45235069","wikidata":"https://www.wikidata.org/wiki/Q278425","display_name":"Table (database)","level":2,"score":0.2750000059604645},{"id":"https://openalex.org/C137293760","wikidata":"https://www.wikidata.org/wiki/Q3621696","display_name":"Language model","level":2,"score":0.2655999958515167}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.48550/arxiv.2603.10087","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.10087","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":null,"raw_source_name":null,"raw_type":"article"}],"best_oa_location":{"id":"doi:10.48550/arxiv.2603.10087","is_oa":true,"landing_page_url":"https://doi.org/10.48550/arxiv.2603.10087","pdf_url":null,"source":{"id":"https://openalex.org/S4306400194","display_name":"arXiv (Cornell University)","issn_l":null,"issn":null,"is_oa":true,"is_in_doaj":false,"is_core":false,"host_organization":"https://openalex.org/I205783295","host_organization_name":"Cornell University","host_organization_lineage":["https://openalex.org/I205783295"],"host_organization_lineage_names":[],"type":"repository"},"license":"cc-by","license_id":"https://openalex.org/licenses/cc-by","version":null,"is_accepted":false,"is_published":false,"raw_source_name":null,"raw_type":"article"},"sustainable_development_goals":[],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":0,"referenced_works":[],"related_works":[],"abstract_inverted_index":{"Engram":[0,20,52,76],"conditional":[1],"memory":[2,49],"has":[3],"emerged":[4],"as":[5],"a":[6,86],"promising":[7],"component":[8],"for":[9,34,51,92],"LLMs":[10,95],"by":[11,64],"decoupling":[12],"static":[13],"knowledge":[14],"lookup":[15],"from":[16],"dynamic":[17],"computation.":[18],"Since":[19],"exhibits":[21],"sparse":[22],"access":[23,62],"patterns":[24,69],"and":[25,60,66,88],"supports":[26],"prefetching,":[27],"its":[28],"massive":[29],"embedding":[30],"tables":[31],"are":[32],"well-suited":[33],"offloading":[35],"to":[36,55],"lower-tier":[37],"memory.":[38],"In":[39],"this":[40],"paper,":[41],"we":[42],"propose":[43],"using":[44],"Compute":[45],"Express":[46],"Link":[47],"(CXL)":[48],"pool":[50,77],"storage.":[53],"Compared":[54],"RDMA,":[56],"CXL":[57],"provides":[58,85],"fine-grained":[59],"low-latency":[61],"required":[63],"minimal":[65],"discrete":[67],"retrieval":[68],"of":[70],"Engram.":[71],"We":[72],"integrate":[73],"the":[74],"CXL-based":[75],"into":[78],"SGLang,":[79],"achieving":[80],"near-DRAM":[81],"end-to-end":[82],"performance.":[83,99],"This":[84],"scalable":[87],"cost-efficient":[89],"storage":[90],"solution":[91],"future":[93],"Engram-integrated":[94],"without":[96],"compromising":[97],"inference":[98]},"counts_by_year":[],"updated_date":"2026-03-13T16:22:10.518609","created_date":"2026-03-10T00:00:00"}
