{"id":"https://openalex.org/W7133552343","doi":"https://doi.org/10.1109/hpca68181.2026.11408599","title":"The Memory Processing Unit: A Generalized Interface for End-to-End In-Memory Execution","display_name":"The Memory Processing Unit: A Generalized Interface for End-to-End In-Memory Execution","publication_year":2026,"publication_date":"2026-01-31","ids":{"openalex":"https://openalex.org/W7133552343","doi":"https://doi.org/10.1109/hpca68181.2026.11408599"},"language":null,"primary_location":{"id":"doi:10.1109/hpca68181.2026.11408599","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca68181.2026.11408599","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5013669746","display_name":"Minh S. Q. Truong","orcid":"https://orcid.org/0000-0001-8430-2513"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":true,"raw_author_name":"Minh S. Q. Truong","raw_affiliation_strings":["Carnegie Mellon University,USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128121321","display_name":"Yiqiu Sun","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Yiqiu Sun","raw_affiliation_strings":["University of Illinois Urbana-Champaign,USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign,USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128099786","display_name":"Dawei Xiong","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Dawei Xiong","raw_affiliation_strings":["University of Illinois Urbana-Champaign,USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign,USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109343186","display_name":"AB Shah","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Amol Shah","raw_affiliation_strings":["University of Illinois Urbana-Champaign,USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign,USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5018268672","display_name":"Alexander Glass","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Alexander Glass","raw_affiliation_strings":["Carnegie Mellon University,USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109682061","display_name":"Abraham Farrell","orcid":null},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Abraham Farrell","raw_affiliation_strings":["University of Illinois Urbana-Champaign,USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign,USA","institution_ids":["https://openalex.org/I157725225"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5050099355","display_name":"James A. Bain","orcid":"https://orcid.org/0000-0002-5355-5048"},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"James A. Bain","raw_affiliation_strings":["Carnegie Mellon University,USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128082390","display_name":"L. Richard Carley","orcid":null},"institutions":[{"id":"https://openalex.org/I74973139","display_name":"Carnegie Mellon University","ror":"https://ror.org/05x2bcf33","country_code":"US","type":"education","lineage":["https://openalex.org/I74973139"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"L. Richard Carley","raw_affiliation_strings":["Carnegie Mellon University,USA"],"affiliations":[{"raw_affiliation_string":"Carnegie Mellon University,USA","institution_ids":["https://openalex.org/I74973139"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5036666743","display_name":"Saugata Ghose","orcid":"https://orcid.org/0000-0002-9138-0613"},"institutions":[{"id":"https://openalex.org/I157725225","display_name":"University of Illinois Urbana-Champaign","ror":"https://ror.org/047426m28","country_code":"US","type":"education","lineage":["https://openalex.org/I157725225"]}],"countries":["US"],"is_corresponding":false,"raw_author_name":"Saugata Ghose","raw_affiliation_strings":["University of Illinois Urbana-Champaign,USA"],"affiliations":[{"raw_affiliation_string":"University of Illinois Urbana-Champaign,USA","institution_ids":["https://openalex.org/I157725225"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":9,"corresponding_author_ids":["https://openalex.org/A5013669746"],"corresponding_institution_ids":["https://openalex.org/I74973139"],"apc_list":null,"apc_paid":null,"fwci":88.8974,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.99798038,"is_in_top_1_percent":true,"is_in_top_10_percent":true},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"16"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.34860000014305115,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10054","display_name":"Parallel Computing and Optimization Techniques","score":0.34860000014305115,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10933","display_name":"Real-Time Systems Scheduling","score":0.15029999613761902,"subfield":{"id":"https://openalex.org/subfields/1708","display_name":"Hardware and Architecture"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10772","display_name":"Distributed systems and fault tolerance","score":0.07999999821186066,"subfield":{"id":"https://openalex.org/subfields/1705","display_name":"Computer Networks and Communications"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/interface","display_name":"Interface (matter)","score":0.4846000075340271},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.3221000134944916},{"id":"https://openalex.org/keywords/process","display_name":"Process (computing)","score":0.2793000042438507},{"id":"https://openalex.org/keywords/encoding","display_name":"Encoding (memory)","score":0.27459999918937683},{"id":"https://openalex.org/keywords/signal-processing","display_name":"Signal processing","score":0.2597000002861023}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.6938999891281128},{"id":"https://openalex.org/C113843644","wikidata":"https://www.wikidata.org/wiki/Q901882","display_name":"Interface (matter)","level":4,"score":0.4846000075340271},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.3221000134944916},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.30390000343322754},{"id":"https://openalex.org/C79403827","wikidata":"https://www.wikidata.org/wiki/Q3988","display_name":"Real-time computing","level":1,"score":0.2793999910354614},{"id":"https://openalex.org/C98045186","wikidata":"https://www.wikidata.org/wiki/Q205663","display_name":"Process (computing)","level":2,"score":0.2793000042438507},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.27459999918937683},{"id":"https://openalex.org/C173608175","wikidata":"https://www.wikidata.org/wiki/Q232661","display_name":"Parallel computing","level":1,"score":0.2721000015735626},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.27160000801086426},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.2603999972343445},{"id":"https://openalex.org/C104267543","wikidata":"https://www.wikidata.org/wiki/Q208163","display_name":"Signal processing","level":3,"score":0.2597000002861023},{"id":"https://openalex.org/C138827492","wikidata":"https://www.wikidata.org/wiki/Q6661985","display_name":"Data processing","level":2,"score":0.2558000087738037},{"id":"https://openalex.org/C168167062","wikidata":"https://www.wikidata.org/wiki/Q1117970","display_name":"Component (thermodynamics)","level":2,"score":0.2556000053882599}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca68181.2026.11408599","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca68181.2026.11408599","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[{"id":"https://openalex.org/G6091630843","display_name":null,"funder_award_id":"CCF-2329096","funder_id":"https://openalex.org/F4320306076","funder_display_name":"National Science Foundation"}],"funders":[{"id":"https://openalex.org/F4320306076","display_name":"National Science Foundation","ror":"https://ror.org/021nxhr62"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":78,"referenced_works":["https://openalex.org/W1542981317","https://openalex.org/W1591666071","https://openalex.org/W1993163906","https://openalex.org/W2013259664","https://openalex.org/W2025674646","https://openalex.org/W2057218453","https://openalex.org/W2066280488","https://openalex.org/W2066949876","https://openalex.org/W2073748734","https://openalex.org/W2077791698","https://openalex.org/W2081729575","https://openalex.org/W2120886827","https://openalex.org/W2159159598","https://openalex.org/W2164577583","https://openalex.org/W2169832991","https://openalex.org/W2169875292","https://openalex.org/W2171956063","https://openalex.org/W2216132385","https://openalex.org/W2331783522","https://openalex.org/W2396622873","https://openalex.org/W2518281301","https://openalex.org/W2593172471","https://openalex.org/W2613051255","https://openalex.org/W2613569094","https://openalex.org/W2613989746","https://openalex.org/W2623880136","https://openalex.org/W2765234579","https://openalex.org/W2766489088","https://openalex.org/W2788825665","https://openalex.org/W2798476846","https://openalex.org/W2809295488","https://openalex.org/W2809524490","https://openalex.org/W2900379535","https://openalex.org/W2913104037","https://openalex.org/W2933452742","https://openalex.org/W2944576035","https://openalex.org/W2945951882","https://openalex.org/W2946017187","https://openalex.org/W2949989598","https://openalex.org/W2950138172","https://openalex.org/W2953174564","https://openalex.org/W2960205134","https://openalex.org/W2967324946","https://openalex.org/W2971920536","https://openalex.org/W2979663695","https://openalex.org/W2979874885","https://openalex.org/W2982008795","https://openalex.org/W3002919214","https://openalex.org/W3005997294","https://openalex.org/W3039529370","https://openalex.org/W3100710793","https://openalex.org/W3105003914","https://openalex.org/W3129551008","https://openalex.org/W3134274954","https://openalex.org/W3155004489","https://openalex.org/W3183264033","https://openalex.org/W3191222816","https://openalex.org/W3196818429","https://openalex.org/W3205140122","https://openalex.org/W3207965708","https://openalex.org/W3209151516","https://openalex.org/W3214184609","https://openalex.org/W4235631643","https://openalex.org/W4254901135","https://openalex.org/W4280542458","https://openalex.org/W4281644153","https://openalex.org/W4282551050","https://openalex.org/W4285305074","https://openalex.org/W4308083578","https://openalex.org/W4308083597","https://openalex.org/W4308083751","https://openalex.org/W4321500243","https://openalex.org/W4385896568","https://openalex.org/W4388349073","https://openalex.org/W4393407315","https://openalex.org/W4401568236","https://openalex.org/W4403296896","https://openalex.org/W4409328995"],"related_works":[],"abstract_inverted_index":{"The":[0],"processing-using-memory":[1],"(PUM;":[2],"a.k.a.":[3],"inmemory":[4],"computing)":[5],"paradigm":[6],"aims":[7],"to":[8,21,39,68,71,79,83,93,136,162,201],"eliminate":[9],"data":[10],"movement":[11],"energy":[12,252],"and":[13,88,98,140,160,184,206,251],"performance":[14,250],"costs":[15],"by":[16],"using":[17],"memory":[18,86,111],"cell":[19],"interactions":[20],"directly":[22],"perform":[23],"computation.":[24],"Given":[25],"PUM's":[26],"potential":[27],"for":[28,101,119,225,254],"large":[29],"savings,":[30],"prior":[31,234],"works":[32,235],"have":[33],"proposed":[34],"many":[35,63],"different":[36],"datapath":[37],"microarchitectures":[38],"demonstrate":[40,196],"how":[41,197,207],"general-purpose":[42,120,164],"PUM":[43,121,156,165,204],"benefits":[44],"a":[45,72,115,170,244],"wide":[46],"range":[47],"of":[48,64,155,189,213],"application":[49,138],"kernels.":[50],"Unfortunately,":[51],"these":[52,105,233],"efforts":[53],"largely":[54],"depend":[55],"on":[56],"microarchitecture-specific":[57],"vector-like":[58],"interfaces":[59],"that":[60,150,175],"(1)":[61],"force":[62],"an":[65,84,128,146],"application's":[66],"operations":[67],"be":[69],"offloaded":[70],"CPU,":[73],"(2)":[74],"require":[75],"significant":[76],"programmer":[77],"effort":[78],"scale":[80],"up":[81],"applications":[82,192],"entire":[85],"chip,":[87],"(3)":[89],"make":[90],"it":[91,208],"impractical":[92],"develop":[94,127],"badly-needed":[95],"systems":[96],"software":[97],"programming":[99],"tools":[100],"PUM.":[102,194],"To":[103],"address":[104],"three":[106,123],"issues,":[107],"we":[108,126,144,168],"propose":[109,145],"the":[110,198,255],"processing":[112],"unit":[113],"(MPU),":[114],"microarchitecture-agnostic":[116],"interface":[117],"layer":[118],"with":[122,134,193],"components.":[124],"First,":[125],"MPU":[129,172,178,199],"instruction":[130],"set":[131],"architecture":[132],"(ISA)":[133],"instructions":[135],"facilitate":[137],"scaling":[139],"task":[141],"coordination.":[142],"Second,":[143],"ensemble":[147],"execution":[148,152,188],"model":[149],"coordinates":[151],"across":[153,181],"millions":[154],"vector":[157],"function":[158],"units":[159],"maps":[161,200],"most":[163],"microarchitectures.":[166],"Third,":[167],"design":[169],"comprehensive":[171],"control":[173],"path":[174],"efficiently":[176],"executes":[177],"ISA":[179],"binaries":[180],"multiple":[182,202],"ensembles,":[183],"can":[185],"enable":[186],"CPU-free":[187],"complex":[190,256],"end-to-end":[191,257],"We":[195],"previously-proposed":[203],"datapaths,":[205],"achieves":[209],"average":[210],"performance/energy":[211],"improvements":[212,253],"<tex":[214,226],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[215,227,237],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathbf{1.":[216],"7":[217],"9}":[218],"\\times":[219,239],"\\boldsymbol{/}":[220],"\\mathbf{3.":[221],"2":[222],"3}":[223],"\\times$</tex>":[224,242],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\mathbf{2":[228],"1}$</tex>":[229],"data-intensive":[230],"kernels":[231],"over":[232],"(<tex":[236],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$67":[238],"/":[240],"47":[241],"vs.":[243],"modern":[245],"GPU),":[246],"while":[247],"also":[248],"achieving":[249],"applications.":[258]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-09T08:11:56.329763","created_date":"2026-03-05T00:00:00"}
