{"id":"https://openalex.org/W4409248618","doi":"https://doi.org/10.1109/hpca61900.2025.00127","title":"FACIL: Flexible DRAM Address Mapping for SoC-PIM Cooperative On-device LLM Inference","display_name":"FACIL: Flexible DRAM Address Mapping for SoC-PIM Cooperative On-device LLM Inference","publication_year":2025,"publication_date":"2025-03-01","ids":{"openalex":"https://openalex.org/W4409248618","doi":"https://doi.org/10.1109/hpca61900.2025.00127"},"language":"en","primary_location":{"id":"doi:10.1109/hpca61900.2025.00127","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca61900.2025.00127","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"},"type":"article","indexed_in":["crossref"],"open_access":{"is_oa":false,"oa_status":"closed","oa_url":null,"any_repository_has_fulltext":false},"authorships":[{"author_position":"first","author":{"id":"https://openalex.org/A5055536948","display_name":"Seong Hoon Seo","orcid":"https://orcid.org/0000-0002-8283-8960"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":true,"raw_author_name":"Seong Hoon Seo","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5100405459","display_name":"Jung-Hoon Kim","orcid":"https://orcid.org/0000-0002-4369-866X"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Junghoon Kim","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5102833773","display_name":"Donghyun Lee","orcid":"https://orcid.org/0009-0004-6925-8824"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Donghyun Lee","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Seonah Yoo","orcid":null},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seonah Yoo","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"middle","author":{"id":null,"display_name":"Seokwon Moon","orcid":null},"institutions":[{"id":"https://openalex.org/I4575257","display_name":"Hanyang University","ror":"https://ror.org/046865y68","country_code":"KR","type":"education","lineage":["https://openalex.org/I4575257"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Seokwon Moon","raw_affiliation_strings":["Hanyang University"],"affiliations":[{"raw_affiliation_string":"Hanyang University","institution_ids":["https://openalex.org/I4575257"]}]},{"author_position":"middle","author":{"id":"https://openalex.org/A5049560946","display_name":"Yeonhong Park","orcid":"https://orcid.org/0009-0008-1425-0971"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Yeonhong Park","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]},{"author_position":"last","author":{"id":"https://openalex.org/A5100415738","display_name":"Jae Wook Lee","orcid":"https://orcid.org/0000-0002-8756-0195"},"institutions":[{"id":"https://openalex.org/I139264467","display_name":"Seoul National University","ror":"https://ror.org/04h9pn542","country_code":"KR","type":"education","lineage":["https://openalex.org/I139264467"]}],"countries":["KR"],"is_corresponding":false,"raw_author_name":"Jae W. Lee","raw_affiliation_strings":["Seoul National University"],"affiliations":[{"raw_affiliation_string":"Seoul National University","institution_ids":["https://openalex.org/I139264467"]}]}],"institutions":[],"countries_distinct_count":1,"institutions_distinct_count":7,"corresponding_author_ids":["https://openalex.org/A5055536948"],"corresponding_institution_ids":["https://openalex.org/I139264467"],"apc_list":null,"apc_paid":null,"fwci":0.6645,"has_fulltext":false,"cited_by_count":1,"citation_normalized_percentile":{"value":0.68595165,"is_in_top_1_percent":false,"is_in_top_10_percent":false},"cited_by_percentile_year":{"min":96,"max":98},"biblio":{"volume":null,"issue":null,"first_page":"1720","last_page":"1733"},"is_retracted":false,"is_paratext":false,"is_xpac":false,"primary_topic":{"id":"https://openalex.org/T10472","display_name":"Semiconductor materials and devices","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},"topics":[{"id":"https://openalex.org/T10472","display_name":"Semiconductor materials and devices","score":0.9995999932289124,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T10558","display_name":"Advancements in Semiconductor Devices and Circuit Design","score":0.9977999925613403,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}},{"id":"https://openalex.org/T14117","display_name":"Integrated Circuits and Semiconductor Failure Analysis","score":0.9961000084877014,"subfield":{"id":"https://openalex.org/subfields/2208","display_name":"Electrical and Electronic Engineering"},"field":{"id":"https://openalex.org/fields/22","display_name":"Engineering"},"domain":{"id":"https://openalex.org/domains/3","display_name":"Physical Sciences"}}],"keywords":[{"id":"https://openalex.org/keywords/dram","display_name":"Dram","score":0.8293710947036743},{"id":"https://openalex.org/keywords/computer-science","display_name":"Computer science","score":0.7249210476875305},{"id":"https://openalex.org/keywords/inference","display_name":"Inference","score":0.6893975138664246},{"id":"https://openalex.org/keywords/computer-architecture","display_name":"Computer architecture","score":0.4719875156879425},{"id":"https://openalex.org/keywords/embedded-system","display_name":"Embedded system","score":0.3213651776313782},{"id":"https://openalex.org/keywords/artificial-intelligence","display_name":"Artificial intelligence","score":0.23935353755950928},{"id":"https://openalex.org/keywords/computer-hardware","display_name":"Computer hardware","score":0.1592596471309662}],"concepts":[{"id":"https://openalex.org/C7366592","wikidata":"https://www.wikidata.org/wiki/Q1255620","display_name":"Dram","level":2,"score":0.8293710947036743},{"id":"https://openalex.org/C41008148","wikidata":"https://www.wikidata.org/wiki/Q21198","display_name":"Computer science","level":0,"score":0.7249210476875305},{"id":"https://openalex.org/C2776214188","wikidata":"https://www.wikidata.org/wiki/Q408386","display_name":"Inference","level":2,"score":0.6893975138664246},{"id":"https://openalex.org/C118524514","wikidata":"https://www.wikidata.org/wiki/Q173212","display_name":"Computer architecture","level":1,"score":0.4719875156879425},{"id":"https://openalex.org/C149635348","wikidata":"https://www.wikidata.org/wiki/Q193040","display_name":"Embedded system","level":1,"score":0.3213651776313782},{"id":"https://openalex.org/C154945302","wikidata":"https://www.wikidata.org/wiki/Q11660","display_name":"Artificial intelligence","level":1,"score":0.23935353755950928},{"id":"https://openalex.org/C9390403","wikidata":"https://www.wikidata.org/wiki/Q3966","display_name":"Computer hardware","level":1,"score":0.1592596471309662}],"mesh":[],"locations_count":1,"locations":[{"id":"doi:10.1109/hpca61900.2025.00127","is_oa":false,"landing_page_url":"https://doi.org/10.1109/hpca61900.2025.00127","pdf_url":null,"source":null,"license":null,"license_id":null,"version":"publishedVersion","is_accepted":true,"is_published":true,"raw_source_name":"2025 IEEE International Symposium on High Performance Computer Architecture (HPCA)","raw_type":"proceedings-article"}],"best_oa_location":null,"sustainable_development_goals":[],"awards":[],"funders":[{"id":"https://openalex.org/F4320320671","display_name":"National Research Foundation","ror":"https://ror.org/05s0g1g46"}],"has_content":{"grobid_xml":false,"pdf":false},"content_urls":null,"referenced_works_count":48,"referenced_works":["https://openalex.org/W1981943579","https://openalex.org/W2002555321","https://openalex.org/W2013073142","https://openalex.org/W2162634167","https://openalex.org/W2162639668","https://openalex.org/W2268589658","https://openalex.org/W2347068719","https://openalex.org/W2545376626","https://openalex.org/W2766489088","https://openalex.org/W2884108789","https://openalex.org/W2979719709","https://openalex.org/W2979874885","https://openalex.org/W2982008795","https://openalex.org/W3006586535","https://openalex.org/W3016765354","https://openalex.org/W3041919703","https://openalex.org/W3043023836","https://openalex.org/W3043140114","https://openalex.org/W3043571714","https://openalex.org/W3043804473","https://openalex.org/W3100710793","https://openalex.org/W3102510044","https://openalex.org/W3111721177","https://openalex.org/W3134274954","https://openalex.org/W3145545382","https://openalex.org/W3178193590","https://openalex.org/W3189166979","https://openalex.org/W3191222816","https://openalex.org/W3206328251","https://openalex.org/W3207399097","https://openalex.org/W3207730694","https://openalex.org/W4214633646","https://openalex.org/W4221001402","https://openalex.org/W4226126604","https://openalex.org/W4249322926","https://openalex.org/W4285121610","https://openalex.org/W4285548014","https://openalex.org/W4385245566","https://openalex.org/W4385834084","https://openalex.org/W4387064011","https://openalex.org/W4387064057","https://openalex.org/W4392427708","https://openalex.org/W4393407315","https://openalex.org/W4394998968","https://openalex.org/W4395073431","https://openalex.org/W4403635905","https://openalex.org/W4406163959","https://openalex.org/W4406650295"],"related_works":["https://openalex.org/W4391375266","https://openalex.org/W2899084033","https://openalex.org/W2748952813","https://openalex.org/W3120961607","https://openalex.org/W4401568740","https://openalex.org/W3148568549","https://openalex.org/W2098207691","https://openalex.org/W1648516568","https://openalex.org/W361036515","https://openalex.org/W2161286015"],"abstract_inverted_index":{"The":[0],"rise":[1],"of":[2,5,63,161,177,199],"on-device":[3,210],"inference":[4,207],"large":[6],"language":[7],"models":[8],"(LLMs)":[9],"is":[10,25],"rapidly":[11],"escalating":[12],"the":[13,31,59,91,122,152,173,188,220,230],"demand":[14],"for":[15,29,96,109,143],"memory-intensive":[16],"operations":[17,145],"on":[18,208],"edge":[19,34],"devices.":[20],"While":[21],"DRAMbased":[22],"processing-in-memory":[23],"(PIM)":[24],"a":[26,42,46,64,70,131,163,183],"promising":[27],"solution":[28,136],"overcoming":[30],"memory":[32,47,53,57,107,164],"wall,":[33],"devices":[35],"require":[36],"PIM":[37,85,110,144,201],"to":[38,50,80,115,150,172],"function":[39],"both":[40,84,97,200],"as":[41,90],"compute":[43],"unit":[44],"and":[45,61,86,100,111,181,202,216,225],"device":[48],"due":[49],"their":[51],"limited":[52],"capacity.":[54],"Such":[55],"PIM-enabled":[56],"complicates":[58],"partition":[60],"placement":[62],"tensor":[65],"into":[66],"DRAM":[67,133,142,169,190],"banks":[68],"in":[69,141],"PIM-operable":[71],"manner.":[72],"Notably,":[73],"we":[74,128],"highlight":[75],"that":[76,137,166,186,195],"LLM":[77,206,211],"weights":[78,93],"need":[79],"be":[81],"accessible":[82],"by":[83,222],"system-on-chip":[87],"(SoC)":[88],"processors,":[89,113],"same":[92,153],"are":[94],"used":[95],"SoC-favorable":[98],"GEMM":[99],"PIM-favorable":[101],"GEMV":[102],"operations.":[103],"This":[104],"necessitates":[105],"different":[106,168],"mappings":[108],"SoC":[112,148,203],"leading":[114],"potential":[116],"re-layout":[117],"costs":[118],"when":[119],"switching":[120],"between":[121],"two.":[123],"To":[124],"address":[125,134,170,191],"this":[126],"challenge,":[127],"propose":[129],"FACIL,":[130],"flexible":[132],"mapping":[135,171],"efficiently":[138],"places":[139],"tensors":[140],"while":[146],"allowing":[147],"processors":[149],"access":[151,198],"data":[154],"using":[155],"contiguous":[156],"virtual":[157],"addresses.":[158],"FACIL":[159],"consists":[160],"(i)":[162],"controller":[165],"assigns":[167],"page":[174,180],"offset":[175],"bits":[176],"each":[178],"huge":[179],"(ii)":[182],"user-level":[184],"library":[185],"determines":[187],"appropriate":[189],"mapping.":[192],"We":[193],"demonstrate":[194],"enabling":[196],"re-layout-free":[197],"processor":[204],"benefits":[205],"various":[209],"tasks,":[212],"including":[213],"short":[214],"conversation":[215],"code":[217],"autocompletion,":[218],"reducing":[219],"time-to-first-token":[221],"$2.37":[223],"\\times$":[224],"$2.63":[226],"\\times$,":[227],"respectively,":[228],"over":[229],"SoC-PIM":[231],"baseline.":[232]},"counts_by_year":[{"year":2026,"cited_by_count":1}],"updated_date":"2026-04-21T08:09:41.155169","created_date":"2025-10-10T00:00:00"}
