{"id":"https://openalex.org/W4410986208","doi":"https://doi.org/10.1109/mm.2025.3575280","title":"Compute-Enabled CXL Memory Expansion for Efficient Retrieval Augmented Generation","display_name":"Compute-Enabled CXL Memory Expansion for Efficient Retrieval Augmented Generation","publication_year":2025,"publication_date":"2025-06-03","ids":{"openalex":"https://openalex.org/W4410986208","doi":"https://doi.org/10.1109/mm.2025.3575280"},"language":"en","primary_location":{"id":"doi:10.1109/mm.2025.3575280","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mm.2025.3575280","pdf_url":null,"source":{"id":"https://openalex.org/S59697426","display_name":"IEEE Micro","issn_l":"0272-1732","issn":["0272-1732","1937-4143"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Micro","raw_type":"journal-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5023012463","display_name":"Derrick Quinn","orcid":"https://orcid.org/0009-0000-5862-6565"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Derrick Quinn","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","Cornell University, Ithaca, NY, USA"],"raw_orcid":"https://orcid.org/0009-0000-5862-6565","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]},{"raw_affiliation_string":"Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5042812673","display_name":"Neel Patel","orcid":"https://orcid.org/0000-0002-8055-4243"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Neel Patel","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","Cornell University, Ithaca, NY, USA"],"raw_orcid":"https://orcid.org/0000-0002-8055-4243","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]},{"raw_affiliation_string":"Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5069911395","display_name":"Mohammad Alian","orcid":"https://orcid.org/0000-0002-4622-2181"},"institutions":[{"id":"https://openalex.org/I205783295","display_name":"Cornell University","ror":"https://ror.org/05bnh6r87","country_code":"US","type":"education","lineage":["https://openalex.org/I205783295"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Mohammad Alian","raw_affiliation_strings":["Department of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","Cornell University, Ithaca, NY, USA"],"raw_orcid":"https://orcid.org/0000-0002-4622-2181","affiliations":[{"raw_affiliation_string":"Department of Electrical and Computer Engineering, Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]},{"raw_affiliation_string":"Cornell University, Ithaca, NY, USA","institution_ids":["https://openalex.org/I205783295"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":3,"corresponding_author_ids":["https://openalex.org/A5023012463"],"corresponding_institution_ids":["https://openalex.org/I205783295"],"apc_list":null,"apc_paid":null,"fwci":1.1332,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.78459671,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":91,"max":95},"biblio":{"volume":"45","issue":"6","first_page":"100","last_page":"107"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.944100022315979,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10627","display_name":"Advanced Image and Video Retrieval Techniques","score":0.944100022315979,"subfield":{"id":"https://openalex.org/subfields/1707","display_name":"Computer Vision and Pattern Recognition"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10320","display_name":"Neural Networks and Applications","score":0.9420999884605408,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T11269","display_name":"Algorithms and Data Compression","score":0.9311000108718872,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.8563639521598816},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.41736841201782227},{"id":"https://openalex.org/keywords/parallel-computing","display_name":"Parallel computing","score":0.3850648105144501},{"id":"https://openalex.org/keywords/information-retrieval","display_name":"Information retrieval","score":0.32309162616729736}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.8563639521598816},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.41736841201782227},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.3850648105144501},{"id":"https://openalex.org/C23123220","wikidata":"https://www.wikidata.org/wiki/Q816826","display_name":"Information retrieval","level":1,"score":0.32309162616729736}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/mm.2025.3575280","is_oa":false,"landing_page_url":"https://doi.org/10.1109/mm.2025.3575280","pdf_url":null,"source":{"id":"https://openalex.org/S59697426","display_name":"IEEE Micro","issn_l":"0272-1732","issn":["0272-1732","1937-4143"],"is_oa":false,"is_in_doaj":false,"is_core":true,"host_organization":"https://openalex.org/P4310319808","host_organization_name":"Institute of Electrical and Electronics Engineers","host_organization_lineage":["https://openalex.org/P4310319808"],"host_organization_lineage_names":["Institute of Electrical and Electronics Engineers"],"type":"journal"},"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"IEEE Micro","raw_type":"journal-article"}],"best_oa_location":null,"sustainable_development_goals":[{"score":0.7099999785423279,"id":"https://metadata.un.org/sdg/7","display_name":"Affordable and clean energy"}],"awards":[{"id":"https://openalex.org/G879073502","display_name":null,"funder_award_id":"2239020","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":9,"referenced_works":["https://openalex.org/W2112300321","https://openalex.org/W2982008795","https://openalex.org/W3099700870","https://openalex.org/W3156789018","https://openalex.org/W3189166979","https://openalex.org/W4238135788","https://openalex.org/W4318541517","https://openalex.org/W4399677840","https://openalex.org/W4407197060"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W2390279801","https://openalex.org/W4391913857","https://openalex.org/W2358668433","https://openalex.org/W4396701345","https://openalex.org/W2376932109","https://openalex.org/W2001405890","https://openalex.org/W4396696052"],"abstract_inverted_index":{"Conventional":[0],"near-memory":[1,47,66],"processing":[2,48],"architectures":[3],"often":[4],"strike":[5],"a":[6,40,61,78],"trade-off":[7],"between":[8],"memory":[9,12,26,34,62,72,89,109],"capacity":[10,90],"and":[11,91,95],"bandwidth,":[13],"leading":[14],"to":[15,25,74],"high":[16,21,70],"initial":[17],"data":[18],"movement":[19],"or":[20],"capital":[22],"costs":[23],"due":[24],"stranding.":[27],"In":[28],"this":[29],"work,":[30],"we":[31],"introduce":[32],"compute-enabled":[33],"expansion":[35],"enabled":[36],"by":[37],"CXL":[38],"as":[39],"solution":[41],"for":[42],"the":[43,53],"widespread":[44],"adoption":[45],"of":[46,81],"at":[49],"scale.":[50],"We":[51],"present":[52],"Intelligent":[54],"Knowledge":[55],"Store":[56],"(IKS),":[57],"which":[58],"is":[59],"fundamentally":[60],"expander":[63],"with":[64,107],"lightweight":[65],"accelerators":[67],"that":[68],"leverage":[69],"internal":[71,88],"bandwidth":[73],"accelerate":[75],"dense":[76,102],"retrieval,":[77],"key":[79],"component":[80],"retrieval-augmented":[82],"generation":[83],"(RAG).":[84],"IKS":[85],"disaggregates":[86],"its":[87],"supports":[92],"both":[93],"spatial":[94],"temporal":[96],"multi-tenancy.":[97],"It":[98],"significantly":[99],"accelerates":[100],"high-quality":[101],"retrieval":[103],"while":[104],"enabling":[105],"multi-tenancy":[106],"modest":[108],"access":[110],"interference.":[111]},"counts_by_year":[{"year":2025,"cited_by_count":1}],"updated_date":"2025-12-31T23:11:33.660297","created_date":"2025-10-10T00:00:00"}
