{"id":"https://openalex.org/W7133526451","doi":"https://doi.org/10.1109/hpca68181.2026.11408542","title":"RoMe: Row Granularity Access Memory System for Large Language Models","display_name":"RoMe: Row Granularity Access Memory System for Large Language Models","publication_year":2026,"publication_date":"2026-01-31","ids":{"openalex":"https://openalex.org/W7133526451","doi":"https://doi.org/10.1109/hpca68181.2026.11408542"},"language":null,"primary_location":{"id":"doi:10.1109/hpca68181.2026.11408542","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca68181.2026.11408542","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5052317647","display_name":"Hwayong Nam","orcid":"https://orcid.org/0000-0002-2466-9273"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Hwayong Nam","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5128054576","display_name":"Seungmin Baek","orcid":null},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seungmin Baek","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5107886155","display_name":"J. H. Kim","orcid":null},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jumin Kim","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5109756929","display_name":"Michael Jaemin Kim","orcid":null},"institutions":[],"countries":[],"is_corresponding":false,"raw_author_name":"Michael Jaemin Kim","raw_affiliation_strings":["Meta"],"affiliations":[{"raw_affiliation_string":"Meta","institution_ids":[]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5125243766","display_name":"J Ahn","orcid":null},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jung Ho Ahn","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":5,"corresponding_author_ids":["https://openalex.org/A5052317647"],"corresponding_institution_ids":["https://openalex.org/I139264467"],"apc_list":null,"apc_paid":null,"fwci":0.0,"has_fulltext":false,"cited_by_count":0,"citation_normalized_percentile":{"value":0.93056676,"is_in_top_1_percent":false,"is_in_top_10_percent":true},"cited_by_percentile_year":null,"biblio":{"volume":null,"issue":null,"first_page":"1","last_page":"15"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.2606000006198883,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10181","display_name":"Natural Language Processing Techniques","score":0.2606000006198883,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10028","display_name":"Topic Modeling","score":0.2070000022649765,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10201","display_name":"Speech Recognition and Synthesis","score":0.03590000048279762,"subfield":{"id":"https://openalex.org/subfields/1702","display_name":"Artificial Intelligence"},"field":{"id":"https://openalex.org/fields/17","display_name":"Computer Science"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/granularity","display_name":"Granularity","score":0.3747999966144562},{"id":"https://openalex.org/keywords/key","display_name":"Key (lock)","score":0.33079999685287476},{"id":"https://openalex.org/keywords/data-access","display_name":"Data access","score":0.27570000290870667},{"id":"https://openalex.org/keywords/semantics","display_name":"Semantics (computer science)","score":0.2727999985218048},{"id":"https://openalex.org/keywords/memory-management","display_name":"Memory management","score":0.2662000060081482},{"id":"https://openalex.org/keywords/modeling-language","display_name":"Modeling language","score":0.2624000012874603}],"concepts":[{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.744700014591217},{"id":"https://openalex.org/C199360897","wikidata":"https://www.wikidata.org/wiki/Q9143","display_name":"Programming language","level":1,"score":0.38370001316070557},{"id":"https://openalex.org/C177774035","wikidata":"https://www.wikidata.org/wiki/Q1246948","display_name":"Granularity","level":2,"score":0.3747999966144562},{"id":"https://openalex.org/C80444323","wikidata":"https://www.wikidata.org/wiki/Q2878974","display_name":"Theoretical computer science","level":1,"score":0.3562000095844269},{"id":"https://openalex.org/C26517878","wikidata":"https://www.wikidata.org/wiki/Q228039","display_name":"Key (lock)","level":2,"score":0.33079999685287476},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.3264000117778778},{"id":"https://openalex.org/C204321447","wikidata":"https://www.wikidata.org/wiki/Q30642","display_name":"Natural language processing","level":1,"score":0.3179999887943268},{"id":"https://openalex.org/C47487241","wikidata":"https://www.wikidata.org/wiki/Q5227230","display_name":"Data access","level":2,"score":0.27570000290870667},{"id":"https://openalex.org/C184337299","wikidata":"https://www.wikidata.org/wiki/Q1437428","display_name":"Semantics (computer science)","level":2,"score":0.2727999985218048},{"id":"https://openalex.org/C176649486","wikidata":"https://www.wikidata.org/wiki/Q2308807","display_name":"Memory management","level":3,"score":0.2662000060081482},{"id":"https://openalex.org/C124101348","wikidata":"https://www.wikidata.org/wiki/Q172491","display_name":"Data mining","level":1,"score":0.2651999890804291},{"id":"https://openalex.org/C179603123","wikidata":"https://www.wikidata.org/wiki/Q1941921","display_name":"Modeling language","level":3,"score":0.2624000012874603},{"id":"https://openalex.org/C2776401178","wikidata":"https://www.wikidata.org/wiki/Q12050496","display_name":"Feature (linguistics)","level":2,"score":0.2599000036716461},{"id":"https://openalex.org/C77618280","wikidata":"https://www.wikidata.org/wiki/Q1155772","display_name":"Scheme (mathematics)","level":2,"score":0.2547999918460846},{"id":"https://openalex.org/C125411270","wikidata":"https://www.wikidata.org/wiki/Q18653","display_name":"Encoding (memory)","level":2,"score":0.2533000111579895},{"id":"https://openalex.org/C67186912","wikidata":"https://www.wikidata.org/wiki/Q367664","display_name":"Data modeling","level":2,"score":0.2531999945640564}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca68181.2026.11408542","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca68181.2026.11408542","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2026 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[{"display_name":"Quality Education","id":"https://metadata.un.org/sdg/4","score":0.5886108875274658}],"awards":[],"funders":[],"has_content":{"pdf":false,"grobid_xml":false},"content_urls":null,"referenced_works_count":50,"referenced_works":["https://openalex.org/W1964316448","https://openalex.org/W1985431949","https://openalex.org/W1989061323","https://openalex.org/W2026517532","https://openalex.org/W2082375193","https://openalex.org/W2102871765","https://openalex.org/W2119296805","https://openalex.org/W2129513794","https://openalex.org/W2131780201","https://openalex.org/W2132269953","https://openalex.org/W2151917022","https://openalex.org/W2159908132","https://openalex.org/W2165697076","https://openalex.org/W2166263440","https://openalex.org/W2346205343","https://openalex.org/W2607352011","https://openalex.org/W2612695082","https://openalex.org/W2742900615","https://openalex.org/W2761132374","https://openalex.org/W2790546557","https://openalex.org/W2927667751","https://openalex.org/W3005403948","https://openalex.org/W3016166938","https://openalex.org/W3092001024","https://openalex.org/W3136346557","https://openalex.org/W3141915942","https://openalex.org/W4220702013","https://openalex.org/W4220972538","https://openalex.org/W4231734693","https://openalex.org/W4232168013","https://openalex.org/W4236382111","https://openalex.org/W4242747115","https://openalex.org/W4243928162","https://openalex.org/W4245018380","https://openalex.org/W4245941243","https://openalex.org/W4313546932","https://openalex.org/W4380874786","https://openalex.org/W4390098112","https://openalex.org/W4392427708","https://openalex.org/W4392746501","https://openalex.org/W4394998968","https://openalex.org/W4399677071","https://openalex.org/W4401211704","https://openalex.org/W4401211711","https://openalex.org/W4401211861","https://openalex.org/W4404386171","https://openalex.org/W4404954383","https://openalex.org/W4404955001","https://openalex.org/W4407219227","https://openalex.org/W4411471758"],"related_works":[],"abstract_inverted_index":{"Modern":[0],"HBM-based":[1,65,173],"memory":[2,37,66,82,116,121,155,174],"systems":[3,175],"have":[4],"evolved":[5],"over":[6],"generations":[7],"while":[8],"retaining":[9],"cache":[10,76],"line":[11,77],"granularity":[12,17,105],"accesses.":[13],"Preserving":[14],"this":[15,95],"fine":[16],"necessitated":[18],"the":[19,81,115],"introduction":[20],"of":[21,74],"bank":[22,109],"groups":[23],"and":[24,32,106,111,166],"pseudo":[25,112],"channels.":[26],"These":[27],"structures":[28],"expand":[29],"timing":[30],"parameters":[31],"control":[33],"overhead,":[34],"significantly":[35,160],"increasing":[36,138],"controller":[38,83],"scheduling":[39,156],"complexity.":[40],"Large":[41],"language":[42],"models":[43],"(LLMs)":[44],"now":[45],"dominate":[46],"deep":[47],"learning":[48],"workloads,":[49,165],"streaming":[50],"contiguous":[51],"data":[52],"blocks":[53],"ranging":[54],"from":[55,114],"several":[56],"kilobytes":[57],"to":[58,84,90,134],"megabytes":[59],"per":[60,127],"operation.":[61],"In":[62],"a":[63],"conventional":[64],"system,":[67],"these":[68],"transfers":[69],"are":[70,132],"fragmented":[71],"into":[72],"hundreds":[73],"32B":[75],"transactions.":[78],"This":[79,118],"forces":[80],"employ":[85],"unnecessarily":[86],"intricate":[87],"scheduling,":[88,122],"leading":[89],"growing":[91],"inefficiency.":[92],"To":[93],"address":[94],"problem,":[96],"we":[97],"propose":[98],"RoMe.":[99],"RoMe":[100,152],"accesses":[101],"DRAM":[102],"at":[103],"row":[104],"removes":[107],"columns,":[108],"groups,":[110],"channels":[113],"interface.":[117],"design":[119],"simplifies":[120],"thereby":[123],"requiring":[124],"fewer":[125],"pins":[126,131],"channel.":[128],"The":[129],"freed":[130],"aggregated":[133],"form":[135],"additional":[136],"channels,":[137],"overall":[139],"bandwidth":[140,178],"by":[141],"<tex":[142],"xmlns:mml=\"http://www.w3.org/1998/Math/MathML\"":[143],"xmlns:xlink=\"http://www.w3.org/1999/xlink\">$\\text{1":[144],"2.":[145],"5":[146],"\\%}$</tex>":[147],"with":[148,179],"minimal":[149,180],"extra":[150],"pins.":[151],"demonstrates":[153],"how":[154],"logic":[157],"can":[158],"be":[159],"simplified":[161],"for":[162,171],"representative":[163],"LLM":[164],"presents":[167],"an":[168],"alternative":[169],"approach":[170],"next-generation":[172],"achieving":[176],"increased":[177],"hardware":[181],"overhead.":[182]},"counts_by_year":[],"updated_date":"2026-03-06T06:45:51.903784","created_date":"2026-03-05T00:00:00"}
